docs/doxygen/MLInlineAdvisor_8cpp_source.html

//===- MLInlineAdvisor.cpp - machine learned InlineAdvisor ----------------===//

//

// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.

// See https://llvm.org/LICENSE.txt for license information.

// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception

//

//===----------------------------------------------------------------------===//

//

// This file implements the interface between the inliner and a learned model.

// It delegates model evaluation to either the AOT compiled model (the

// 'release' mode) or a runtime-loaded model (the 'development' case).

//

//===----------------------------------------------------------------------===//

#include "llvm/Analysis/MLInlineAdvisor.h"

#include "llvm/ADT/SCCIterator.h"

#include "llvm/Analysis/AssumptionCache.h"

#include "llvm/Analysis/BlockFrequencyInfo.h"

#include "llvm/Analysis/CallGraph.h"

#include "llvm/Analysis/FunctionPropertiesAnalysis.h"

#include "llvm/Analysis/InlineCost.h"

#include "llvm/Analysis/InlineModelFeatureMaps.h"

#include "llvm/Analysis/InteractiveModelRunner.h"

#include "llvm/Analysis/LazyCallGraph.h"

#include "llvm/Analysis/LoopInfo.h"

#include "llvm/Analysis/MLModelRunner.h"

#include "llvm/Analysis/OptimizationRemarkEmitter.h"

#include "llvm/Analysis/ProfileSummaryInfo.h"

#include "llvm/Analysis/ReleaseModeModelRunner.h"

#include "llvm/Analysis/TargetTransformInfo.h"

#include "llvm/IR/Dominators.h"

#include "llvm/IR/InstIterator.h"

#include "llvm/IR/Module.h"

#include "llvm/IR/PassManager.h"

#include "llvm/Support/CommandLine.h"


using namespace llvm;


// Base path of the two channel files used in interactive mode. When this is
// non-empty, getReleaseModeAdvisor builds an InteractiveModelRunner on
// "<base>.out" / "<base>.in" instead of using the embedded model.
static cl::opt<std::string> InteractiveChannelBaseName(
    "inliner-interactive-channel-base", cl::Hidden,
    cl::desc(
        "Base file path for the interactive mode. The incoming filename should "
        "have the name <inliner-interactive-channel-base>.in, while the "
        "outgoing name should be <inliner-interactive-channel-base>.out"));
// Help text for the option below; built at startup so that it can embed the
// name of the default-decision tensor.
static const std::string InclDefaultMsg =
    (Twine("In interactive mode, also send the default policy decision: ") +
     DefaultDecisionName + ".")
        .str();
// When set in interactive mode, the default policy's decision is appended to
// the feature list handed to the interactive runner.
static cl::opt<bool>
    InteractiveIncludeDefault("inliner-interactive-include-default", cl::Hidden,
                              cl::desc(InclDefaultMsg));


// Conditions under which getAdviceImpl bypasses the model and answers with the
// default advice callback instead.
enum class SkipMLPolicyCriteria { Never, IfCallerIsNotCold };

// Selects the bypass criterion; defaults to never bypassing the model.
static cl::opt<SkipMLPolicyCriteria> SkipPolicy(
    "ml-inliner-skip-policy", cl::Hidden, cl::init(SkipMLPolicyCriteria::Never),
    cl::values(clEnumValN(SkipMLPolicyCriteria::Never, "never", "never"),
               clEnumValN(SkipMLPolicyCriteria::IfCallerIsNotCold,
                          "if-caller-not-cold", "if the caller is not cold")));

// Forwarded to the embedded model runner through
// EmbeddedModelRunnerOptions::setModelSelector; empty by default.
static cl::opt<std::string> ModelSelector("ml-inliner-model-selector",
                                          cl::Hidden, cl::init(""));


// Pick the model type evaluated by the release-mode runner: the generated
// InlinerSizeModel when the build defines LLVM_HAVE_TF_AOT_INLINERSIZEMODEL,
// NoopSavedModelImpl otherwise.
#if defined(LLVM_HAVE_TF_AOT_INLINERSIZEMODEL)
// codegen-ed file
#include "InlinerSizeModel.h" // NOLINT
using CompiledModelType = llvm::InlinerSizeModel;
#else
using CompiledModelType = NoopSavedModelImpl;
#endif


/// Create the ML-driven inline advisor for \p M.
///
/// The policy is evaluated either by the embedded (AOT-compiled) model or, when
/// an interactive channel base name was given on the command line, by an
/// InteractiveModelRunner talking over "<base>.out" / "<base>.in".
///
/// \param GetDefaultAdvice callback producing the default policy's decision.
/// \returns the advisor, or nullptr when no interactive channel is configured
///          and the embedded model evaluator is not valid.
std::unique_ptr<InlineAdvisor>
llvm::getReleaseModeAdvisor(Module &M, ModuleAnalysisManager &MAM,
                            std::function<bool(CallBase &)> GetDefaultAdvice) {
  const bool UseInteractiveChannel = !InteractiveChannelBaseName.empty();

  // Nothing can evaluate the policy: bail out.
  if (!UseInteractiveChannel &&
      !llvm::isEmbeddedModelEvaluatorValid<CompiledModelType>())
    return nullptr;

  std::unique_ptr<MLModelRunner> Runner;
  if (UseInteractiveChannel) {
    // Start from the regular feature list and optionally tack the default
    // decision onto its end.
    std::vector<TensorSpec> ChannelFeatures = FeatureMap;
    if (InteractiveIncludeDefault)
      ChannelFeatures.push_back(DefaultDecisionSpec);
    Runner = std::make_unique<InteractiveModelRunner>(
        M.getContext(), ChannelFeatures, InlineDecisionSpec,
        InteractiveChannelBaseName + ".out",
        InteractiveChannelBaseName + ".in");
  } else {
    Runner = std::make_unique<ReleaseModeModelRunner<CompiledModelType>>(
        M.getContext(), FeatureMap, DecisionName,
        EmbeddedModelRunnerOptions().setModelSelector(ModelSelector));
  }

  return std::make_unique<MLInlineAdvisor>(M, MAM, std::move(Runner),
                                           GetDefaultAdvice);
}


#define DEBUG_TYPE "inline-ml"


// Bloat factor relative to the initial module IR size. Once the tracked IR
// size exceeds InitialIRSize times this value, onSuccessfulInlining sets
// ForceStop.
static cl::opt<float> SizeIncreaseThreshold(
    "ml-advisor-size-increase-threshold", cl::Hidden,
    cl::desc("Maximum factor by which expected native size may increase before "
             "blocking any further inlining."),
    cl::init(2.0));

// When set, onPassExit does not clear the FunctionPropertiesInfo cache.
static cl::opt<bool> KeepFPICache(
    "ml-advisor-keep-fpi-cache", cl::Hidden,
    cl::desc(
        "For test - keep the ML Inline advisor's FunctionPropertiesInfo cache"),
    cl::init(false));


// clang-format off
// Tensor specs of the model's input features, one per entry produced by the
// two feature iterator macros, with the InlineCost features placed first.
const std::vector<TensorSpec> llvm::FeatureMap{
#define POPULATE_NAMES(DTYPE, SHAPE, NAME, __) TensorSpec::createSpec<DTYPE>(#NAME, SHAPE),
// InlineCost features - these must come first
  INLINE_COST_FEATURE_ITERATOR(POPULATE_NAMES)

// Non-cost features
  INLINE_FEATURE_ITERATOR(POPULATE_NAMES)
#undef POPULATE_NAMES
};
// clang-format on

// Name and spec (a single int64) of the tensor holding the model's decision.
const char *const llvm::DecisionName = "inlining_decision";
const TensorSpec llvm::InlineDecisionSpec =
    TensorSpec::createSpec<int64_t>(DecisionName, {1});
// Name and spec (a single int64) of the tensor holding the default policy's
// decision; only added to the feature list in interactive mode on request.
const char *const llvm::DefaultDecisionName = "inlining_default";
const TensorSpec llvm::DefaultDecisionSpec =
    TensorSpec::createSpec<int64_t>(DefaultDecisionName, {1});
// Name of the reward; not referenced by the code shown in this file.
const char *const llvm::RewardName = "delta_size";


/// Return \p I as a call site if it is a direct call to a function that has a
/// definition in this module; return nullptr for anything else (non-calls,
/// indirect calls, calls to declarations).
CallBase *getInlinableCS(Instruction &I) {
  auto *Call = dyn_cast<CallBase>(&I);
  if (!Call)
    return nullptr;

  const Function *Target = Call->getCalledFunction();
  if (!Target || Target->isDeclaration())
    return nullptr;

  return Call;
}


/// Set up the advisor: take ownership of the model runner, record the initial
/// module IR size, compute the per-function 'call site height' levels, and
/// seed the module-wide node and edge counts.
MLInlineAdvisor::MLInlineAdvisor(
    Module &M, ModuleAnalysisManager &MAM,
    std::unique_ptr<MLModelRunner> Runner,
    std::function<bool(CallBase &)> GetDefaultAdvice)
    : InlineAdvisor(
          M, MAM.getResult<FunctionAnalysisManagerModuleProxy>(M).getManager()),
      ModelRunner(std::move(Runner)), GetDefaultAdvice(GetDefaultAdvice),
      CG(MAM.getResult<LazyCallGraphAnalysis>(M)),
      InitialIRSize(getModuleIRSize()), CurrentIRSize(InitialIRSize),
      PSI(MAM.getResult<ProfileSummaryAnalysis>(M)) {
  assert(ModelRunner);
  ModelRunner->switchContext("");

  // The 'call site height' feature is the position of a call site relative to
  // the farthest statically reachable SCC node. It is computed once here and
  // is not mutated while inlining happens. Empirically, this feature proved
  // critical in behavioral cloning - i.e. training a model to mimic the manual
  // heuristic's decisions - and, thus, equally important for training for
  // improvement.
  CallGraph ModuleCG(M);
  for (auto SCCIt = scc_begin(&ModuleCG); !SCCIt.isAtEnd(); ++SCCIt) {
    const std::vector<CallGraphNode *> &SCCNodes = *SCCIt;

    // First pass over the SCC: its level is one more than the highest level
    // among the already-visited callees of its members.
    unsigned SCCLevel = 0;
    for (CallGraphNode *Member : SCCNodes) {
      Function *Fn = Member->getFunction();
      if (!Fn || Fn->isDeclaration())
        continue;
      for (Instruction &Inst : instructions(Fn)) {
        CallBase *Call = getInlinableCS(Inst);
        if (!Call)
          continue;
        auto LevelIt = FunctionLevels.find(&CG.get(*Call->getCalledFunction()));
        // In bottom up traversal, an inlinable callee is either in the same
        // SCC, or in an SCC visited earlier. A callee without a recorded
        // level has not been visited yet, so it belongs to this SCC and does
        // not contribute.
        if (LevelIt != FunctionLevels.end())
          SCCLevel = std::max(SCCLevel, LevelIt->second + 1);
      }
    }

    // Second pass: every defined member of the SCC gets that level.
    for (CallGraphNode *Member : SCCNodes) {
      Function *Fn = Member->getFunction();
      if (!Fn || Fn->isDeclaration())
        continue;
      FunctionLevels[&CG.get(*Fn)] = SCCLevel;
    }
  }

  // Seed the module-wide counters from the functions that received a level.
  for (const auto &LevelEntry : FunctionLevels) {
    AllNodes.insert(LevelEntry.first);
    EdgeCount += getLocalCalls(LevelEntry.first->getFunction());
  }
  NodeCount = AllNodes.size();
}


unsigned MLInlineAdvisor::getInitialFunctionLevel(const Function &F) const {

  return CG.lookup(F) ? FunctionLevels.at(CG.lookup(F)) : 0;

}


/// Refresh the module-wide node/edge counts before the inliner runs on
/// \p CurSCC, then remember the nodes of \p CurSCC for the next round.
/// Does nothing when there is no SCC or the advisor was forced to stop.
void MLInlineAdvisor::onPassEntry(LazyCallGraph::SCC *CurSCC) {
  if (ForceStop || !CurSCC)
    return;
  FPICache.clear();

  // Function passes executed between InlinerPass runs may have changed the
  // module-wide features.
  // The cgscc pass manager rules are such that:
  // - if a pass leads to merging SCCs, then the pipeline is restarted on the
  //   merged SCC
  // - if a pass leads to splitting the SCC, then we continue with one of the
  //   splits
  // This means that NodesInLastSCC is a superset (not strict) of the nodes
  // that subsequent passes would have processed.
  // - in addition, if new Nodes were created by a pass (e.g. CoroSplit),
  //   they'd be adjacent to Nodes in the last SCC. So it is enough to check
  //   the boundary of Nodes in NodesInLastSCC for Nodes we haven't seen. The
  //   nature of the Edge (call or ref) doesn't matter. `FunctionLevels`-wise,
  //   they are recorded at the same level as the original node (this is a
  //   choice, may need revisiting).
  // - nodes are only deleted at the end of a call graph walk where they are
  //   batch deleted, so we shouldn't see any dead nodes here.
  while (!NodesInLastSCC.empty()) {
    const LazyCallGraph::Node *Current = *NodesInLastSCC.begin();
    assert(!Current->isDead());
    NodesInLastSCC.erase(Current);
    EdgeCount += getLocalCalls(Current->getFunction());

    const auto CurrentLevel = FunctionLevels.at(Current);
    for (const auto &Edge : *(*Current)) {
      const auto *Neighbor = &Edge.getNode();
      assert(!Neighbor->isDead() && !Neighbor->getFunction().isDeclaration());
      // Already-known neighbours need no bookkeeping.
      if (!AllNodes.insert(Neighbor).second)
        continue;
      // A function we had not seen before: count it and queue it so that its
      // own neighbours get examined too.
      ++NodeCount;
      NodesInLastSCC.insert(Neighbor);
      FunctionLevels[Neighbor] = CurrentLevel;
    }
  }

  EdgeCount -= EdgesOfLastSeenNodes;
  EdgesOfLastSeenNodes = 0;

  // (Re)use NodesInLastSCC to remember the nodes in the SCC right now,
  // in case the SCC is split before onPassExit and some nodes are split out.
  assert(NodesInLastSCC.empty());
  for (const LazyCallGraph::Node &Member : *CurSCC)
    NodesInLastSCC.insert(&Member);
}


/// Record, on leaving the inliner for \p CurSCC, which nodes were last seen
/// and how many local call edges they have, so that onPassEntry can update
/// the module-wide counts from whatever survives.
void MLInlineAdvisor::onPassExit(LazyCallGraph::SCC *CurSCC) {
  // The cache is not worth keeping - function passes will invalidate it.
  if (!KeepFPICache)
    FPICache.clear();
  if (ForceStop || !CurSCC)
    return;

  // Start the edge tally afresh for the nodes we are about to remember.
  EdgesOfLastSeenNodes = 0;

  // Nodes that were in the SCC at onPassEntry.
  for (const LazyCallGraph::Node *Seen : NodesInLastSCC) {
    assert(!Seen->isDead());
    EdgesOfLastSeenNodes += getLocalCalls(Seen->getFunction());
  }

  // Nodes that may have been added to the SCC since; only the ones not
  // already remembered contribute additional edges.
  for (const auto &Member : *CurSCC) {
    assert(!Member.isDead());
    if (NodesInLastSCC.insert(&Member).second)
      EdgesOfLastSeenNodes += getLocalCalls(Member.getFunction());
  }

  assert(NodeCount >= NodesInLastSCC.size());
  assert(EdgeCount >= EdgesOfLastSeenNodes);
}


/// Number of direct calls from \p F to functions defined in this module, as
/// reported by the cached FunctionPropertiesInfo of \p F.
int64_t MLInlineAdvisor::getLocalCalls(Function &F) {
  const FunctionPropertiesInfo &FPI = getCachedFPI(F);
  return FPI.DirectCallsToDefinedFunctions;
}


// Update the internal state of the advisor, and force invalidate feature

// analysis. Currently, we maintain minimal (and very simple) global state - the

// number of functions and the number of static calls. We also keep track of the

// total IR size in this module, to stop misbehaving policies at a certain bloat

// factor (SizeIncreaseThreshold)

void MLInlineAdvisor::onSuccessfulInlining(const MLInlineAdvice &Advice,

                                           bool CalleeWasDeleted) {

  assert(!ForceStop);

  Function *Caller = Advice.getCaller();

  Function *Callee = Advice.getCallee();

  // The caller features aren't valid anymore.

  {

    PreservedAnalyses PA = PreservedAnalyses::all();

    PA.abandon<FunctionPropertiesAnalysis>();

    PA.abandon<LoopAnalysis>();

    FAM.invalidate(*Caller, PA);

  }

  Advice.updateCachedCallerFPI(FAM);

  int64_t IRSizeAfter =

      getIRSize(*Caller) + (CalleeWasDeleted ? 0 : Advice.CalleeIRSize);

  CurrentIRSize += IRSizeAfter - (Advice.CallerIRSize + Advice.CalleeIRSize);

  if (CurrentIRSize > SizeIncreaseThreshold * InitialIRSize)

    ForceStop = true;


  // We can delta-update module-wide features. We know the inlining only changed

  // the caller, and maybe the callee (by deleting the latter).

  // Nodes are simple to update.

  // For edges, we 'forget' the edges that the caller and callee used to have

  // before inlining, and add back what they currently have together.

  int64_t NewCallerAndCalleeEdges =

      getCachedFPI(*Caller).DirectCallsToDefinedFunctions;


  // A dead function's node is not actually removed from the call graph until

  // the end of the call graph walk, but the node no longer belongs to any valid

  // SCC.

  if (CalleeWasDeleted) {

    --NodeCount;

    NodesInLastSCC.erase(CG.lookup(*Callee));

    DeadFunctions.insert(Callee);

  } else {

    NewCallerAndCalleeEdges +=

        getCachedFPI(*Callee).DirectCallsToDefinedFunctions;

  }

  EdgeCount += (NewCallerAndCalleeEdges - Advice.CallerAndCalleeEdges);

  assert(CurrentIRSize >= 0 && EdgeCount >= 0 && NodeCount >= 0);

}


/// Sum of getIRSize over every function of the module that has a definition.
int64_t MLInlineAdvisor::getModuleIRSize() const {
  int64_t Total = 0;
  for (auto &Fn : M) {
    // Declarations have no body to measure.
    if (Fn.isDeclaration())
      continue;
    Total += getIRSize(Fn);
  }
  return Total;
}


/// Return the cached FunctionPropertiesInfo for \p F, computing it through the
/// function analysis manager and caching it on first request. The returned
/// reference points into the cache.
FunctionPropertiesInfo &MLInlineAdvisor::getCachedFPI(Function &F) const {
  auto Inserted = FPICache.insert(std::make_pair(&F, FunctionPropertiesInfo()));
  FunctionPropertiesInfo &Entry = Inserted.first->second;
  // A fresh slot only holds a default-constructed placeholder; fill it in.
  if (Inserted.second)
    Entry = FAM.getResult<FunctionPropertiesAnalysis>(F);
  return Entry;
}


/// Produce inlining advice for call site \p CB.
///
/// Several cases are answered without consulting the model, using the base
/// InlineAdvice (which tracks no state): unreachable call sites, the
/// configured skip policy, "never inline" and recursive calls, a forced stop
/// after excessive size growth, and call sites for which no cost estimate or
/// cost features can be computed. Mandatory inlinings go through
/// getMandatoryAdvice. Otherwise the feature tensors of the model runner are
/// populated and the decision is delegated to getAdviceFromModel.
std::unique_ptr<InlineAdvice> MLInlineAdvisor::getAdviceImpl(CallBase &CB) {
  if (auto Skip = getSkipAdviceIfUnreachableCallsite(CB))
    return Skip;

  auto &Caller = *CB.getCaller();
  auto &Callee = *CB.getCalledFunction();

  auto GetAssumptionCache = [&](Function &F) -> AssumptionCache & {
    return FAM.getResult<AssumptionAnalysis>(F);
  };
  auto &TIR = FAM.getResult<TargetIRAnalysis>(Callee);
  auto &ORE = FAM.getResult<OptimizationRemarkEmitterAnalysis>(Caller);

  // Optional bypass: for callers that are not cold, answer with the default
  // policy instead of the model.
  if (SkipPolicy == SkipMLPolicyCriteria::IfCallerIsNotCold) {
    if (!PSI.isFunctionEntryCold(&Caller))
      return std::make_unique<InlineAdvice>(this, CB, ORE,
                                            GetDefaultAdvice(CB));
  }
  auto MandatoryKind = InlineAdvisor::getMandatoryKind(CB, FAM, ORE);
  // If this is a "never inline" case, there won't be any changes to internal
  // state we need to track, so we can just return the base InlineAdvice, which
  // will do nothing interesting.
  // Same thing if this is a recursive case.
  if (MandatoryKind == InlineAdvisor::MandatoryInliningKind::Never ||
      &Caller == &Callee)
    return getMandatoryAdvice(CB, false);

  bool Mandatory =
      MandatoryKind == InlineAdvisor::MandatoryInliningKind::Always;

  // If we need to stop, we won't want to track anymore any state changes, so
  // we just return the base InlineAdvice, which acts as a noop.
  if (ForceStop) {
    ORE.emit([&] {
      return OptimizationRemarkMissed(DEBUG_TYPE, "ForceStop", &CB)
             << "Won't attempt inlining because module size grew too much.";
    });
    return std::make_unique<InlineAdvice>(this, CB, ORE, Mandatory);
  }

  int CostEstimate = 0;
  if (!Mandatory) {
    auto IsCallSiteInlinable =
        llvm::getInliningCostEstimate(CB, TIR, GetAssumptionCache);
    if (!IsCallSiteInlinable) {
      // We can't inline this for correctness reasons, so return the base
      // InlineAdvice, as we don't care about tracking any state changes (which
      // won't happen).
      return std::make_unique<InlineAdvice>(this, CB, ORE, false);
    }
    CostEstimate = *IsCallSiteInlinable;
  }

  const auto CostFeatures =
      llvm::getInliningCostFeatures(CB, TIR, GetAssumptionCache);
  if (!CostFeatures) {
    return std::make_unique<InlineAdvice>(this, CB, ORE, false);
  }

  if (Mandatory)
    return getMandatoryAdvice(CB, true);

  // Count the call arguments that are constants.
  auto NumCtantParams = 0;
  for (auto I = CB.arg_begin(), E = CB.arg_end(); I != E; ++I) {
    NumCtantParams += (isa<Constant>(*I));
  }

  auto &CallerBefore = getCachedFPI(Caller);
  auto &CalleeBefore = getCachedFPI(Callee);

  // Populate the non-cost features.
  *ModelRunner->getTensor<int64_t>(FeatureIndex::callee_basic_block_count) =
      CalleeBefore.BasicBlockCount;
  *ModelRunner->getTensor<int64_t>(FeatureIndex::callsite_height) =
      getInitialFunctionLevel(Caller);
  *ModelRunner->getTensor<int64_t>(FeatureIndex::node_count) = NodeCount;
  *ModelRunner->getTensor<int64_t>(FeatureIndex::nr_ctant_params) =
      NumCtantParams;
  *ModelRunner->getTensor<int64_t>(FeatureIndex::edge_count) = EdgeCount;
  *ModelRunner->getTensor<int64_t>(FeatureIndex::caller_users) =
      CallerBefore.Uses;
  *ModelRunner->getTensor<int64_t>(
      FeatureIndex::caller_conditionally_executed_blocks) =
      CallerBefore.BlocksReachedFromConditionalInstruction;
  *ModelRunner->getTensor<int64_t>(FeatureIndex::caller_basic_block_count) =
      CallerBefore.BasicBlockCount;
  *ModelRunner->getTensor<int64_t>(
      FeatureIndex::callee_conditionally_executed_blocks) =
      CalleeBefore.BlocksReachedFromConditionalInstruction;
  *ModelRunner->getTensor<int64_t>(FeatureIndex::callee_users) =
      CalleeBefore.Uses;
  *ModelRunner->getTensor<int64_t>(FeatureIndex::cost_estimate) = CostEstimate;
  *ModelRunner->getTensor<int64_t>(FeatureIndex::is_callee_avail_external) =
      Callee.hasAvailableExternallyLinkage();
  *ModelRunner->getTensor<int64_t>(FeatureIndex::is_caller_avail_external) =
      Caller.hasAvailableExternallyLinkage();

  // Add the cost features
  for (size_t I = 0;
       I < static_cast<size_t>(InlineCostFeatureIndex::NumberOfFeatures); ++I) {
    *ModelRunner->getTensor<int64_t>(inlineCostFeatureToMlFeature(
        static_cast<InlineCostFeatureIndex>(I))) = CostFeatures->at(I);
  }
  // In interactive mode with the default decision requested, the runner was
  // built with DefaultDecisionSpec appended after all FeatureMap entries (see
  // getReleaseModeAdvisor), so its tensor sits at index FeatureMap.size().
  // Indexing with InlineCostFeatureIndex::NumberOfFeatures instead would hit
  // the first non-cost feature slot, since cost features come first.
  if (!InteractiveChannelBaseName.empty() && InteractiveIncludeDefault)
    *ModelRunner->getTensor<int64_t>(FeatureMap.size()) = GetDefaultAdvice(CB);
  return getAdviceFromModel(CB, ORE);
}


/// Evaluate the model on the currently populated feature tensors and wrap its
/// int64 result, converted to bool, into a state-tracking MLInlineAdvice.
std::unique_ptr<MLInlineAdvice>
MLInlineAdvisor::getAdviceFromModel(CallBase &CB,
                                    OptimizationRemarkEmitter &ORE) {
  const bool ShouldInline =
      static_cast<bool>(ModelRunner->evaluate<int64_t>());
  return std::make_unique<MLInlineAdvice>(this, CB, ORE, ShouldInline);
}


/// If the block containing \p CB is not reachable from the caller's entry
/// block, return a base "do not inline" advice; otherwise return nullptr so
/// that the caller carries on with the regular decision process.
std::unique_ptr<InlineAdvice>
MLInlineAdvisor::getSkipAdviceIfUnreachableCallsite(CallBase &CB) {
  auto &DT = FAM.getResult<DominatorTreeAnalysis>(*CB.getCaller());
  if (DT.isReachableFromEntry(CB.getParent()))
    return nullptr;
  return std::make_unique<InlineAdvice>(this, CB, getCallerORE(CB), false);
}


/// Advice for a call site whose outcome is mandated (\p Advice true: must
/// inline, false: must not). Inlinings are tracked in all cases - mandatory or
/// not - unless the call site is unreachable or the advisor was forced to
/// stop.
std::unique_ptr<InlineAdvice> MLInlineAdvisor::getMandatoryAdvice(CallBase &CB,
                                                                  bool Advice) {
  if (auto Skip = getSkipAdviceIfUnreachableCallsite(CB))
    return Skip;

  // A "never inline" case changes no internal state, so the base
  // InlineAdvice, which does nothing interesting, is enough. The same goes
  // for a forced stop - nothing is tracked anymore.
  if (!Advice || ForceStop)
    return std::make_unique<InlineAdvice>(this, CB, getCallerORE(CB), Advice);

  return getMandatoryAdviceImpl(CB);
}


/// Build a state-tracking advice that recommends inlining \p CB.
std::unique_ptr<MLInlineAdvice>
MLInlineAdvisor::getMandatoryAdviceImpl(CallBase &CB) {
  OptimizationRemarkEmitter &CallerORE = getCallerORE(CB);
  return std::make_unique<MLInlineAdvice>(this, CB, CallerORE, true);
}


/// Dump the advisor's state to \p OS: the node/edge counters, every cached
/// FunctionPropertiesInfo, and the level recorded for each function
/// (functions deleted by inlining are shown as "<deleted>").
void MLInlineAdvisor::print(raw_ostream &OS) const {
  OS << "[MLInlineAdvisor] Nodes: " << NodeCount << " Edges: " << EdgeCount
     << " EdgesOfLastSeenNodes: " << EdgesOfLastSeenNodes << "\n";
  OS << "[MLInlineAdvisor] FPI:\n";
  // Bind by reference: copying each entry would copy a whole
  // FunctionPropertiesInfo per iteration.
  for (const auto &I : FPICache) {
    OS << I.first->getName() << ":\n";
    I.second.print(OS);
    OS << "\n";
  }
  OS << "\n";
  OS << "[MLInlineAdvisor] FuncLevels:\n";
  for (const auto &I : FunctionLevels)
    OS << (DeadFunctions.contains(&I.first->getFunction())
               ? "<deleted>"
               : I.first->getFunction().getName())
       << " : " << I.second << "\n";

  OS << "\n";
}


/// Capture the pre-inlining state needed to delta-update the advisor later:
/// the IR sizes of caller and callee, their combined local call count, and a
/// copy of the caller's cached FunctionPropertiesInfo.
///
/// \param Advisor the advisor issuing this advice.
/// \param CB the call site the advice is about.
/// \param ORE remark emitter, forwarded to the InlineAdvice base.
/// \param Recommendation whether inlining is recommended.
MLInlineAdvice::MLInlineAdvice(MLInlineAdvisor *Advisor, CallBase &CB,
                               OptimizationRemarkEmitter &ORE,
                               bool Recommendation)
    : InlineAdvice(Advisor, CB, ORE, Recommendation),
      // Once the advisor is forced to stop, the size and edge snapshots are
      // not computed and are recorded as 0.
      CallerIRSize(Advisor->isForcedToStop() ? 0 : Advisor->getIRSize(*Caller)),
      CalleeIRSize(Advisor->isForcedToStop() ? 0 : Advisor->getIRSize(*Callee)),
      CallerAndCalleeEdges(Advisor->isForcedToStop()
                               ? 0
                               : (Advisor->getLocalCalls(*Caller) +
                                  Advisor->getLocalCalls(*Callee))),
      // Copy of the caller's properties; recordUnsuccessfulInliningImpl writes
      // it back into the advisor's cache.
      PreInlineCallerFPI(Advisor->getCachedFPI(*Caller)) {
  // The updater is only set up when inlining is recommended;
  // updateCachedCallerFPI later calls finish() on it.
  if (Recommendation)
    FPU.emplace(Advisor->getCachedFPI(*getCaller()), CB);
}


/// Append to remark \p OR the callee name, the current value of every model
/// feature tensor (keyed by feature name), and the inlining recommendation.
void MLInlineAdvice::reportContextForRemark(
    DiagnosticInfoOptimizationBase &OR) {
  using namespace ore;
  OR << NV("Callee", Callee->getName());

  auto &Runner = getAdvisor()->getModelRunner();
  for (size_t FeatureIdx = 0; FeatureIdx < NumberOfFeatures; ++FeatureIdx) {
    const auto FeatureValue = *Runner.getTensor<int64_t>(FeatureIdx);
    OR << NV(FeatureMap[FeatureIdx].name(), FeatureValue);
  }

  OR << NV("ShouldInline", isInliningRecommended());
}


/// Finish the caller's FunctionPropertiesInfo update after inlining, using
/// \p FAM. Requires that the updater was set up, which the constructor only
/// does when inlining was recommended.
void MLInlineAdvice::updateCachedCallerFPI(FunctionAnalysisManager &FAM) const {
  // Dereferencing an unset FPU would be undefined behavior; catch misuse in
  // assert-enabled builds.
  assert(FPU && "updateCachedCallerFPI called without a properties updater");
  FPU->finish(FAM);
}


void MLInlineAdvice::recordInliningImpl() {

  ORE.emit([&]() {

    OptimizationRemark R(DEBUG_TYPE, "InliningSuccess", DLoc, Block);

    reportContextForRemark(R);

    return R;

  });

  getAdvisor()->onSuccessfulInlining(*this, /*CalleeWasDeleted*/ false);

}


void MLInlineAdvice::recordInliningWithCalleeDeletedImpl() {

  ORE.emit([&]() {

    OptimizationRemark R(DEBUG_TYPE, "InliningSuccessWithCalleeDeleted", DLoc,

                         Block);

    reportContextForRemark(R);

    return R;

  });

  getAdvisor()->onSuccessfulInlining(*this, /*CalleeWasDeleted*/ true);

}


void MLInlineAdvice::recordUnsuccessfulInliningImpl(

    const InlineResult &Result) {

  getAdvisor()->getCachedFPI(*Caller) = PreInlineCallerFPI;

  ORE.emit([&]() {

    OptimizationRemarkMissed R(DEBUG_TYPE, "InliningAttemptedAndUnsuccessful",

                               DLoc, Block);

    reportContextForRemark(R);

    return R;

  });

}

void MLInlineAdvice::recordUnattemptedInliningImpl() {

  assert(!FPU);

  ORE.emit([&]() {

    OptimizationRemarkMissed R(DEBUG_TYPE, "IniningNotAttempted", DLoc, Block);

    reportContextForRemark(R);

    return R;

  });

}

AssumptionCache.h

instructions
Expand Atomic instructions
Definition: AtomicExpandPass.cpp:172

BlockFrequencyInfo.h

CallGraph.h
This file provides interfaces used to build and manipulate a call graph, which is a very useful tool ...

CommandLine.h

clEnumValN
#define clEnumValN(ENUMVAL, FLAGNAME, DESC)
Definition: CommandLine.h:686

Dominators.h

FunctionPropertiesAnalysis.h

DEBUG_TYPE
#define DEBUG_TYPE
Definition: GenericCycleImpl.h:31

Module.h
Module.h This file contains the declarations for the Module class.

PassManager.h
This header defines various interfaces for pass management in LLVM.

InlineCost.h

InlineModelFeatureMaps.h

INLINE_COST_FEATURE_ITERATOR
#define INLINE_COST_FEATURE_ITERATOR(M)
Definition: InlineModelFeatureMaps.h:23

INLINE_FEATURE_ITERATOR
#define INLINE_FEATURE_ITERATOR(M)
Definition: InlineModelFeatureMaps.h:101

InstIterator.h

InteractiveModelRunner.h

LazyCallGraph.h
Implements a lazy call graph analysis and related passes for the new pass manager.

LoopInfo.h

F
#define F(x, y, z)
Definition: MD5.cpp:55

I
#define I(x, y, z)
Definition: MD5.cpp:58

KeepFPICache
static cl::opt< bool > KeepFPICache("ml-advisor-keep-fpi-cache", cl::Hidden, cl::desc("For test - keep the ML Inline advisor's FunctionPropertiesInfo cache"), cl::init(false))

ModelSelector
static cl::opt< std::string > ModelSelector("ml-inliner-model-selector", cl::Hidden, cl::init(""))

getInlinableCS
CallBase * getInlinableCS(Instruction &I)
Definition: MLInlineAdvisor.cpp:129

SkipMLPolicyCriteria
SkipMLPolicyCriteria
Definition: MLInlineAdvisor.cpp:52

SkipMLPolicyCriteria::Never
@ Never

SkipMLPolicyCriteria::IfCallerIsNotCold
@ IfCallerIsNotCold

InteractiveChannelBaseName
static cl::opt< std::string > InteractiveChannelBaseName("inliner-interactive-channel-base", cl::Hidden, cl::desc("Base file path for the interactive mode. The incoming filename should " "have the name <inliner-interactive-channel-base>.in, while the " "outgoing name should be <inliner-interactive-channel-base>.out"))

POPULATE_NAMES
#define POPULATE_NAMES(DTYPE, SHAPE, NAME, __)

SizeIncreaseThreshold
static cl::opt< float > SizeIncreaseThreshold("ml-advisor-size-increase-threshold", cl::Hidden, cl::desc("Maximum factor by which expected native size may increase before " "blocking any further inlining."), cl::init(2.0))

InclDefaultMsg
static const std::string InclDefaultMsg
Definition: MLInlineAdvisor.cpp:44

SkipPolicy
static cl::opt< SkipMLPolicyCriteria > SkipPolicy("ml-inliner-skip-policy", cl::Hidden, cl::init(SkipMLPolicyCriteria::Never), cl::values(clEnumValN(SkipMLPolicyCriteria::Never, "never", "never"), clEnumValN(SkipMLPolicyCriteria::IfCallerIsNotCold, "if-caller-not-cold", "if the caller is not cold")))

InteractiveIncludeDefault
static cl::opt< bool > InteractiveIncludeDefault("inliner-interactive-include-default", cl::Hidden, cl::desc(InclDefaultMsg))

MLInlineAdvisor.h

MLModelRunner.h

DecisionName
#define DecisionName

OptimizationRemarkEmitter.h

FAM
FunctionAnalysisManager FAM
Definition: PassBuilderBindings.cpp:61

MAM
ModuleAnalysisManager MAM
Definition: PassBuilderBindings.cpp:63

if
if(PassOpts->AAPipeline)
Definition: PassBuilderBindings.cpp:64

ProfileSummaryInfo.h

ReleaseModeModelRunner.h

SCCIterator.h
This builds on the llvm/ADT/GraphTraits.h file to find the strongly connected components (SCCs) of a ...

assert
assert(ImpDefSCC.getReg()==AMDGPU::SCC &&ImpDefSCC.isDef())

name
static const char * name
Definition: SMEABIPass.cpp:46

OS
raw_pwrite_stream & OS
Definition: SampleProfWriter.cpp:51

TargetTransformInfo.h
This pass exposes codegen information to IR-level passes.

llvm::AnalysisManager
A container for analyses that lazily runs them and caches their results.
Definition: PassManager.h:253

llvm::AnalysisManager::invalidate
void invalidate(IRUnitT &IR, const PreservedAnalyses &PA)
Invalidate cached analyses for an IR unit.
Definition: PassManagerImpl.h:172

llvm::AnalysisManager::getResult
PassT::Result & getResult(IRUnitT &IR, ExtraArgTs... ExtraArgs)
Get the result of an analysis pass for a given IR unit.
Definition: PassManager.h:410

llvm::AssumptionAnalysis
A function analysis which provides an AssumptionCache.
Definition: AssumptionCache.h:173

llvm::AssumptionCache
A cache of @llvm.assume calls within a function.
Definition: AssumptionCache.h:42

llvm::CallBase
Base class for all callable instructions (InvokeInst and CallInst) Holds everything related to callin...
Definition: InstrTypes.h:1112

llvm::CallBase::getCalledFunction
Function * getCalledFunction() const
Returns the function called, or null if this is an indirect function invocation or the function signa...
Definition: InstrTypes.h:1341

llvm::CallBase::arg_begin
User::op_iterator arg_begin()
Return the iterator pointing to the beginning of the argument list.
Definition: InstrTypes.h:1261

llvm::CallBase::arg_end
User::op_iterator arg_end()
Return the iterator pointing to the end of the argument list.
Definition: InstrTypes.h:1267

llvm::CallBase::getCaller
Function * getCaller()
Helper to get the caller (the parent function).
Definition: Instructions.cpp:327

llvm::CallGraph
The basic data container for the call graph of a Module of IR.
Definition: CallGraph.h:71

llvm::DiagnosticInfoOptimizationBase
Common features for diagnostics dealing with optimization remarks that are used by both IR and MIR pa...
Definition: DiagnosticInfo.h:486

llvm::DominatorTreeAnalysis
Analysis pass which computes a DominatorTree.
Definition: Dominators.h:279

llvm::FunctionPropertiesAnalysis
Definition: FunctionPropertiesAnalysis.h:143

llvm::FunctionPropertiesInfo
Definition: FunctionPropertiesAnalysis.h:28

llvm::FunctionPropertiesInfo::DirectCallsToDefinedFunctions
int64_t DirectCallsToDefinedFunctions
Number of direct calls made from this function to other functions defined in this module.
Definition: FunctionPropertiesAnalysis.h:69

llvm::Function
Definition: Function.h:63

llvm::InlineAdvice
Capture state between an inlining decision having had been made, and its impact being observable.
Definition: InlineAdvisor.h:74

llvm::InlineAdvice::Callee
Function *const Callee
Definition: InlineAdvisor.h:123

llvm::InlineAdvice::Caller
Function *const Caller
Caller and Callee are pre-inlining.
Definition: InlineAdvisor.h:122

llvm::InlineAdvice::Block
const BasicBlock *const Block
Definition: InlineAdvisor.h:129

llvm::InlineAdvice::ORE
OptimizationRemarkEmitter & ORE
Definition: InlineAdvisor.h:130

llvm::InlineAdvice::Advisor
InlineAdvisor *const Advisor
Definition: InlineAdvisor.h:120

llvm::InlineAdvice::DLoc
const DebugLoc DLoc
Definition: InlineAdvisor.h:128

llvm::InlineAdvice::isInliningRecommended
bool isInliningRecommended() const
Get the inlining recommendation.
Definition: InlineAdvisor.h:110

llvm::InlineAdvisor
Interface for deciding whether to inline a call site or not.
Definition: InlineAdvisor.h:163

llvm::InlineAdvisor::getCallerORE
OptimizationRemarkEmitter & getCallerORE(CallBase &CB)
Definition: InlineAdvisor.cpp:625

llvm::InlineAdvisor::FAM
FunctionAnalysisManager & FAM
Definition: InlineAdvisor.h:209

llvm::InlineAdvisor::getMandatoryKind
static MandatoryInliningKind getMandatoryKind(CallBase &CB, FunctionAnalysisManager &FAM, OptimizationRemarkEmitter &ORE)
Definition: InlineAdvisor.cpp:593

llvm::InlineAdvisor::MandatoryInliningKind::Always
@ Always

llvm::InlineAdvisor::MandatoryInliningKind::Never
@ Never

llvm::InlineAdvisor::M
Module & M
Definition: InlineAdvisor.h:208

llvm::InlineResult
InlineResult is basically true or false.
Definition: InlineCost.h:179

llvm::InnerAnalysisManagerProxy
An analysis over an "outer" IR unit that provides access to an analysis manager over an "inner" IR un...
Definition: PassManager.h:567

llvm::Instruction
Definition: Instruction.h:68

llvm::LazyCallGraphAnalysis
An analysis pass which computes the call graph for a module.
Definition: LazyCallGraph.h:1259

llvm::LazyCallGraph::Node
A node in the call graph.
Definition: LazyCallGraph.h:312

llvm::LazyCallGraph::SCC
An SCC of the call graph.
Definition: LazyCallGraph.h:416

llvm::LazyCallGraph::get
Node & get(Function &F)
Get a graph node for a given function, scanning it to populate the graph data as necessary.
Definition: LazyCallGraph.h:996

llvm::LazyCallGraph::lookup
Node * lookup(const Function &F) const
Lookup a function in the graph which has already been scanned and added.
Definition: LazyCallGraph.h:975

llvm::LoopAnalysis
Analysis pass that exposes the LoopInfo for a function.
Definition: LoopInfo.h:566

llvm::MLInlineAdvice
InlineAdvice that tracks changes post inlining.
Definition: MLInlineAdvisor.h:98

llvm::MLInlineAdvice::updateCachedCallerFPI
void updateCachedCallerFPI(FunctionAnalysisManager &FAM) const
Definition: MLInlineAdvisor.cpp:530

llvm::MLInlineAdvice::CallerIRSize
const int64_t CallerIRSize
Definition: MLInlineAdvisor.h:112

llvm::MLInlineAdvice::MLInlineAdvice
MLInlineAdvice(MLInlineAdvisor *Advisor, CallBase &CB, OptimizationRemarkEmitter &ORE, bool Recommendation)
Definition: MLInlineAdvisor.cpp:505

llvm::MLInlineAdvice::CalleeIRSize
const int64_t CalleeIRSize
Definition: MLInlineAdvisor.h:113

llvm::MLInlineAdvice::recordInliningImpl
void recordInliningImpl() override
Definition: MLInlineAdvisor.cpp:534

llvm::MLInlineAdvice::getCaller
Function * getCaller() const
Definition: MLInlineAdvisor.h:109

llvm::MLInlineAdvice::CallerAndCalleeEdges
const int64_t CallerAndCalleeEdges
Definition: MLInlineAdvisor.h:114

llvm::MLInlineAdvice::recordUnsuccessfulInliningImpl
void recordUnsuccessfulInliningImpl(const InlineResult &Result) override
Definition: MLInlineAdvisor.cpp:553

llvm::MLInlineAdvice::getCallee
Function * getCallee() const
Definition: MLInlineAdvisor.h:110

llvm::MLInlineAdvice::recordInliningWithCalleeDeletedImpl
void recordInliningWithCalleeDeletedImpl() override
Definition: MLInlineAdvisor.cpp:543

llvm::MLInlineAdvice::recordUnattemptedInliningImpl
void recordUnattemptedInliningImpl() override
Definition: MLInlineAdvisor.cpp:563

llvm::MLInlineAdvisor
Definition: MLInlineAdvisor.h:28

llvm::MLInlineAdvisor::ModelRunner
std::unique_ptr< MLModelRunner > ModelRunner
Definition: MLInlineAdvisor.h:66

llvm::MLInlineAdvisor::getCachedFPI
FunctionPropertiesInfo & getCachedFPI(Function &) const
Definition: MLInlineAdvisor.cpp:332

llvm::MLInlineAdvisor::onPassExit
void onPassExit(LazyCallGraph::SCC *SCC) override
This must be called when the Inliner pass is exited, as function passes may be run subsequently.
Definition: MLInlineAdvisor.cpp:245

llvm::MLInlineAdvisor::MLInlineAdvisor
MLInlineAdvisor(Module &M, ModuleAnalysisManager &MAM, std::unique_ptr< MLModelRunner > ModelRunner, std::function< bool(CallBase &)> GetDefaultAdvice)
Definition: MLInlineAdvisor.cpp:139

llvm::MLInlineAdvisor::onSuccessfulInlining
void onSuccessfulInlining(const MLInlineAdvice &Advice, bool CalleeWasDeleted)
Definition: MLInlineAdvisor.cpp:282

llvm::MLInlineAdvisor::getMandatoryAdviceImpl
virtual std::unique_ptr< MLInlineAdvice > getMandatoryAdviceImpl(CallBase &CB)
Definition: MLInlineAdvisor.cpp:481

llvm::MLInlineAdvisor::onPassEntry
void onPassEntry(LazyCallGraph::SCC *SCC) override
This must be called when the Inliner pass is entered, to allow the InlineAdvisor to update internal state.
Definition: MLInlineAdvisor.cpp:195

llvm::MLInlineAdvisor::getLocalCalls
int64_t getLocalCalls(Function &F)
Definition: MLInlineAdvisor.cpp:273

llvm::MLInlineAdvisor::getAdviceFromModel
virtual std::unique_ptr< MLInlineAdvice > getAdviceFromModel(CallBase &CB, OptimizationRemarkEmitter &ORE)
Definition: MLInlineAdvisor.cpp:451

llvm::MLInlineAdvisor::getIRSize
int64_t getIRSize(Function &F) const
Definition: MLInlineAdvisor.h:39

llvm::MLInlineAdvisor::GetDefaultAdvice
std::function< bool(CallBase &)> GetDefaultAdvice
Definition: MLInlineAdvisor.h:67

llvm::MLInlineAdvisor::getAdviceImpl
std::unique_ptr< InlineAdvice > getAdviceImpl(CallBase &CB) override
Definition: MLInlineAdvisor.cpp:341

llvm::MLInlineAdvisor::getMandatoryAdvice
std::unique_ptr< InlineAdvice > getMandatoryAdvice(CallBase &CB, bool Advice) override
Definition: MLInlineAdvisor.cpp:465

llvm::MLInlineAdvisor::getInitialFunctionLevel
unsigned getInitialFunctionLevel(const Function &F) const
Definition: MLInlineAdvisor.cpp:191

llvm::Module
A Module instance is used to store all the information related to an LLVM module.
Definition: Module.h:65

llvm::NoopSavedModelImpl
A mock class satisfying the interface expected by ReleaseModeModelRunner for its TGen parameter.
Definition: ReleaseModeModelRunner.h:142

llvm::OptimizationRemarkEmitterAnalysis
Definition: OptimizationRemarkEmitter.h:164

llvm::OptimizationRemarkEmitter
The optimization diagnostic interface.
Definition: OptimizationRemarkEmitter.h:32

llvm::OptimizationRemarkEmitter::emit
void emit(DiagnosticInfoOptimizationBase &OptDiag)
Output the remark via the diagnostic handler and to the optimization record file.
Definition: OptimizationRemarkEmitter.cpp:79

llvm::OptimizationRemarkMissed
Diagnostic information for missed-optimization remarks.
Definition: DiagnosticInfo.h:807

llvm::OptimizationRemark
Diagnostic information for applied optimization remarks.
Definition: DiagnosticInfo.h:762

llvm::PreservedAnalyses
A set of analyses that are preserved following a run of a transformation pass.
Definition: Analysis.h:111

llvm::PreservedAnalyses::all
static PreservedAnalyses all()
Construct a special preserved set that preserves all passes.
Definition: Analysis.h:117

llvm::PreservedAnalyses::abandon
void abandon()
Mark an analysis as abandoned.
Definition: Analysis.h:164

llvm::ProfileSummaryAnalysis
An analysis pass based on the new PM to deliver ProfileSummaryInfo.
Definition: ProfileSummaryInfo.h:372

llvm::ProfileSummaryInfo::isFunctionEntryCold
bool isFunctionEntryCold(const Function *F) const
Returns true if F has cold function entry.
Definition: ProfileSummaryInfo.cpp:96

llvm::TargetIRAnalysis
Analysis pass providing the TargetTransformInfo.
Definition: TargetTransformInfo.h:3194

llvm::TensorSpec
Definition: TensorSpec.h:62

llvm::Twine
Twine - A lightweight data structure for efficiently representing the concatenation of temporary values as strings.
Definition: Twine.h:81

llvm::Value::getName
StringRef getName() const
Return a constant reference to the value's name.
Definition: Value.cpp:309

llvm::cl::opt
Definition: CommandLine.h:1423

llvm::detail::DenseSetImpl::insert
std::pair< iterator, bool > insert(const ValueT &V)
Definition: DenseSet.h:213

llvm::detail::DenseSetImpl::contains
bool contains(const_arg_type_t< ValueT > V) const
Check if the set contains the given element.
Definition: DenseSet.h:193

llvm::ilist_detail::node_parent_access::getParent
const ParentTy * getParent() const
Definition: ilist_node.h:32

llvm::raw_ostream
This class implements an extremely fast bulk output stream that can only output to a stream.
Definition: raw_ostream.h:52

llvm::cl::Hidden
@ Hidden
Definition: CommandLine.h:137

llvm::cl::values
ValuesClass values(OptsTy... Options)
Helper to build a ValuesClass by forwarding a variable number of arguments as an initializer list to the ValuesClass constructor.
Definition: CommandLine.h:711

llvm::cl::init
initializer< Ty > init(const Ty &Val)
Definition: CommandLine.h:443

llvm
This is an optimization pass for GlobalISel generic memory operations.
Definition: AddressRanges.h:18

llvm::inlineCostFeatureToMlFeature
constexpr FeatureIndex inlineCostFeatureToMlFeature(InlineCostFeatureIndex Feature)
Definition: InlineModelFeatureMaps.h:149

llvm::DefaultDecisionName
const char *const DefaultDecisionName
Definition: MLInlineAdvisor.cpp:124

llvm::NumberOfFeatures
constexpr size_t NumberOfFeatures
Definition: InlineModelFeatureMaps.h:153

llvm::scc_begin
scc_iterator< T > scc_begin(const T &G)
Construct the begin iterator for a deduced graph type T.
Definition: SCCIterator.h:233

llvm::getReleaseModeAdvisor
std::unique_ptr< InlineAdvisor > getReleaseModeAdvisor(Module &M, ModuleAnalysisManager &MAM, std::function< bool(CallBase &)> GetDefaultAdvice)
Definition: MLInlineAdvisor.cpp:72

llvm::DefaultDecisionSpec
const TensorSpec DefaultDecisionSpec
Definition: MLInlineAdvisor.cpp:125

llvm::DecisionName
const char *const DecisionName
Definition: MLInlineAdvisor.cpp:121

llvm::InlineCostFeatureIndex
InlineCostFeatureIndex
Definition: InlineModelFeatureMaps.h:69

llvm::InlineCostFeatureIndex::NumberOfFeatures
@ NumberOfFeatures

llvm::FeatureMap
const std::vector< TensorSpec > FeatureMap
Definition: MLInlineAdvisor.cpp:110

llvm::getInliningCostFeatures
std::optional< InlineCostFeatures > getInliningCostFeatures(CallBase &Call, TargetTransformInfo &CalleeTTI, function_ref< AssumptionCache &(Function &)> GetAssumptionCache, function_ref< BlockFrequencyInfo &(Function &)> GetBFI=nullptr, function_ref< const TargetLibraryInfo &(Function &)> GetTLI=nullptr, ProfileSummaryInfo *PSI=nullptr, OptimizationRemarkEmitter *ORE=nullptr)
Get the expanded cost features.
Definition: InlineCost.cpp:2999

llvm::InlineDecisionSpec
const TensorSpec InlineDecisionSpec
Definition: MLInlineAdvisor.cpp:122

llvm::RewardName
const char *const RewardName
Definition: MLInlineAdvisor.cpp:127

llvm::move
OutputIt move(R &&Range, OutputIt Out)
Provide wrappers to std::move which take ranges instead of having to pass begin/end explicitly.
Definition: STLExtras.h:1873

llvm::getInliningCostEstimate
std::optional< int > getInliningCostEstimate(CallBase &Call, TargetTransformInfo &CalleeTTI, function_ref< AssumptionCache &(Function &)> GetAssumptionCache, function_ref< BlockFrequencyInfo &(Function &)> GetBFI=nullptr, function_ref< const TargetLibraryInfo &(Function &)> GetTLI=nullptr, ProfileSummaryInfo *PSI=nullptr, OptimizationRemarkEmitter *ORE=nullptr)
Get the cost estimate ignoring thresholds.
Definition: InlineCost.cpp:2973

std
Implement std::hash so that hash_code can be used in STL containers.
Definition: BitVector.h:858

N
#define N

llvm::EmbeddedModelRunnerOptions
ReleaseModeModelRunner - production mode implementation of the MLModelRunner.
Definition: ReleaseModeModelRunner.h:29

llvm::EmbeddedModelRunnerOptions::setModelSelector
EmbeddedModelRunnerOptions & setModelSelector(StringRef Value)
Definition: ReleaseModeModelRunner.h:48

llvm::cl::desc
Definition: CommandLine.h:409