doxygen/PlaceSafepoints_8cpp_source.html

//===- PlaceSafepoints.cpp - Place GC Safepoints --------------------------===//

//

// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.

// See https://llvm.org/LICENSE.txt for license information.

// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception

//

//===----------------------------------------------------------------------===//

//

// Place garbage collection safepoints at appropriate locations in the IR. This

// does not make relocation semantics or variable liveness explicit.  That's

// done by RewriteStatepointsForGC.

//

// Terminology:

// - A call is said to be "parseable" if there is a stack map generated for the

// return PC of the call.  A runtime can determine where values listed in the

// deopt arguments and (after RewriteStatepointsForGC) gc arguments are located

// on the stack when the code is suspended inside such a call.  Every parse

// point is represented by a call wrapped in an gc.statepoint intrinsic.

// - A "poll" is an explicit check in the generated code to determine if the

// runtime needs the generated code to cooperate by calling a helper routine

// and thus suspending its execution at a known state. The call to the helper

// routine will be parseable.  The (gc & runtime specific) logic of a poll is

// assumed to be provided in a function of the name "gc.safepoint_poll".

//

// We aim to insert polls such that running code can quickly be brought to a

// well defined state for inspection by the collector.  In the current

// implementation, this is done via the insertion of poll sites at method entry

// and the backedge of most loops.  We try to avoid inserting more polls than

// are necessary to ensure a finite period between poll sites.  This is not

// because the poll itself is expensive in the generated code; it's not.  Polls

// do tend to impact the optimizer itself in negative ways; we'd like to avoid

// perturbing the optimization of the method as much as we can.

//

// We also need to make most call sites parseable.  The callee might execute a

// poll (or otherwise be inspected by the GC).  If so, the entire stack

// (including the suspended frame of the current method) must be parseable.

//

// This pass will insert:

// - Call parse points ("call safepoints") for any call which may need to

// reach a safepoint during the execution of the callee function.

// - Backedge safepoint polls and entry safepoint polls to ensure that

// executing code reaches a safepoint poll in a finite amount of time.

//

// We do not currently support return statepoints, but adding them would not

// be hard.  They are not required for correctness - entry safepoints are an

// alternative - but some GCs may prefer them.  Patches welcome.

//

//===----------------------------------------------------------------------===//


#include "llvm/Transforms/Scalar/PlaceSafepoints.h"

#include "llvm/InitializePasses.h"

#include "llvm/Pass.h"


#include "llvm/ADT/SetVector.h"

#include "llvm/ADT/Statistic.h"

#include "llvm/Analysis/CFG.h"

#include "llvm/Analysis/LoopInfo.h"

#include "llvm/Analysis/ScalarEvolution.h"

#include "llvm/Analysis/TargetLibraryInfo.h"

#include "llvm/IR/Dominators.h"

#include "llvm/IR/IntrinsicInst.h"

#include "llvm/IR/LegacyPassManager.h"

#include "llvm/IR/Statepoint.h"

#include "llvm/Support/CommandLine.h"

#include "llvm/Support/Debug.h"

#include "llvm/Transforms/Scalar.h"

#include "llvm/Transforms/Utils/BasicBlockUtils.h"

#include "llvm/Transforms/Utils/Cloning.h"

#include "llvm/Transforms/Utils/Local.h"


using namespace llvm;


#define DEBUG_TYPE "place-safepoints"


STATISTIC(NumEntrySafepoints, "Number of entry safepoints inserted");

STATISTIC(NumBackedgeSafepoints, "Number of backedge safepoints inserted");


STATISTIC(CallInLoop,

          "Number of loops without safepoints due to calls in loop");

STATISTIC(FiniteExecution,

          "Number of loops without safepoints finite execution");


// Ignore opportunities to avoid placing safepoints on backedges, useful for

// validation

static cl::opt<bool> AllBackedges("spp-all-backedges", cl::Hidden,

                                  cl::init(false));


/// How narrow does the trip count of a loop have to be to have to be considered

/// "counted"?  Counted loops do not get safepoints at backedges.

static cl::opt<int> CountedLoopTripWidth("spp-counted-loop-trip-width",

                                         cl::Hidden, cl::init(32));


// If true, split the backedge of a loop when placing the safepoint, otherwise

// split the latch block itself.  Both are useful to support for

// experimentation, but in practice, it looks like splitting the backedge

// optimizes better.

static cl::opt<bool> SplitBackedge("spp-split-backedge", cl::Hidden,

                                   cl::init(false));


namespace {

/// An analysis pass whose purpose is to identify each of the backedges in

/// the function which require a safepoint poll to be inserted.

class PlaceBackedgeSafepointsLegacyPass : public FunctionPass {

public:

  static char ID;


  /// The output of the pass - gives a list of each backedge (described by

  /// pointing at the branch) which need a poll inserted.

  std::vector<Instruction *> PollLocations;


  /// True unless we're running spp-no-calls in which case we need to disable

  /// the call-dependent placement opts.

  bool CallSafepointsEnabled;


  PlaceBackedgeSafepointsLegacyPass(bool CallSafepoints = false)

      : FunctionPass(ID), CallSafepointsEnabled(CallSafepoints) {

    initializePlaceBackedgeSafepointsLegacyPassPass(

        *PassRegistry::getPassRegistry());

  }


  bool runOnLoop(Loop *);


  void runOnLoopAndSubLoops(Loop *L) {

    // Visit all the subloops

    for (Loop *I : *L)

      runOnLoopAndSubLoops(I);

    runOnLoop(L);

  }


  bool runOnFunction(Function &F) override {

    SE = &getAnalysis<ScalarEvolutionWrapperPass>().getSE();

    DT = &getAnalysis<DominatorTreeWrapperPass>().getDomTree();

    LI = &getAnalysis<LoopInfoWrapperPass>().getLoopInfo();

    TLI = &getAnalysis<TargetLibraryInfoWrapperPass>().getTLI(F);

    for (Loop *I : *LI) {

      runOnLoopAndSubLoops(I);

    }

    return false;

  }


  void getAnalysisUsage(AnalysisUsage &AU) const override {

    AU.addRequired<DominatorTreeWrapperPass>();

    AU.addRequired<ScalarEvolutionWrapperPass>();

    AU.addRequired<LoopInfoWrapperPass>();

    AU.addRequired<TargetLibraryInfoWrapperPass>();

    // We no longer modify the IR at all in this pass.  Thus all

    // analysis are preserved.

    AU.setPreservesAll();

  }


private:

  ScalarEvolution *SE = nullptr;

  DominatorTree *DT = nullptr;

  LoopInfo *LI = nullptr;

  TargetLibraryInfo *TLI = nullptr;

};

} // namespace


static cl::opt<bool> NoEntry("spp-no-entry", cl::Hidden, cl::init(false));

static cl::opt<bool> NoCall("spp-no-call", cl::Hidden, cl::init(false));

static cl::opt<bool> NoBackedge("spp-no-backedge", cl::Hidden, cl::init(false));


char PlaceBackedgeSafepointsLegacyPass::ID = 0;


INITIALIZE_PASS_BEGIN(PlaceBackedgeSafepointsLegacyPass,

                      "place-backedge-safepoints-impl",

                      "Place Backedge Safepoints", false, false)

INITIALIZE_PASS_DEPENDENCY(ScalarEvolutionWrapperPass)

INITIALIZE_PASS_DEPENDENCY(DominatorTreeWrapperPass)

INITIALIZE_PASS_DEPENDENCY(LoopInfoWrapperPass)

INITIALIZE_PASS_END(PlaceBackedgeSafepointsLegacyPass,

                    "place-backedge-safepoints-impl",

                    "Place Backedge Safepoints", false, false)


static bool containsUnconditionalCallSafepoint(Loop *L, BasicBlock *Header,

                                               BasicBlock *Pred,

                                               DominatorTree &DT,

                                               const TargetLibraryInfo &TLI);


static bool mustBeFiniteCountedLoop(Loop *L, ScalarEvolution *SE,

                                    BasicBlock *Pred);


static Instruction *findLocationForEntrySafepoint(Function &F,

                                                  DominatorTree &DT);


static bool isGCSafepointPoll(Function &F);

static bool shouldRewriteFunction(Function &F);

static bool enableEntrySafepoints(Function &F);

static bool enableBackedgeSafepoints(Function &F);

static bool enableCallSafepoints(Function &F);


static void

InsertSafepointPoll(BasicBlock::iterator InsertBefore,

                    std::vector<CallBase *> &ParsePointsNeeded /*rval*/,

                    const TargetLibraryInfo &TLI);


bool PlaceBackedgeSafepointsLegacyPass::runOnLoop(Loop *L) {

  // Loop through all loop latches (branches controlling backedges).  We need

  // to place a safepoint on every backedge (potentially).

  // Note: In common usage, there will be only one edge due to LoopSimplify

  // having run sometime earlier in the pipeline, but this code must be correct

  // w.r.t. loops with multiple backedges.

  BasicBlock *Header = L->getHeader();

  SmallVector<BasicBlock *, 16> LoopLatches;

  L->getLoopLatches(LoopLatches);

  for (BasicBlock *Pred : LoopLatches) {

    assert(L->contains(Pred));


    // Make a policy decision about whether this loop needs a safepoint or

    // not.  Note that this is about unburdening the optimizer in loops, not

    // avoiding the runtime cost of the actual safepoint.

    if (!AllBackedges) {

      if (mustBeFiniteCountedLoop(L, SE, Pred)) {

        LLVM_DEBUG(dbgs() << "skipping safepoint placement in finite loop\n");

        FiniteExecution++;

        continue;

      }

      if (CallSafepointsEnabled &&

          containsUnconditionalCallSafepoint(L, Header, Pred, *DT, *TLI)) {

        // Note: This is only semantically legal since we won't do any further

        // IPO or inlining before the actual call insertion..  If we hadn't, we

        // might latter loose this call safepoint.

        LLVM_DEBUG(

            dbgs()

            << "skipping safepoint placement due to unconditional call\n");

        CallInLoop++;

        continue;

      }

    }


    // TODO: We can create an inner loop which runs a finite number of

    // iterations with an outer loop which contains a safepoint.  This would

    // not help runtime performance that much, but it might help our ability to

    // optimize the inner loop.


    // Safepoint insertion would involve creating a new basic block (as the

    // target of the current backedge) which does the safepoint (of all live

    // variables) and branches to the true header

    Instruction *Term = Pred->getTerminator();


    LLVM_DEBUG(dbgs() << "[LSP] terminator instruction: " << *Term);


    PollLocations.push_back(Term);

  }


  return false;

}


bool PlaceSafepointsPass::runImpl(Function &F, const TargetLibraryInfo &TLI) {

  if (F.isDeclaration() || F.empty()) {

    // This is a declaration, nothing to do.  Must exit early to avoid crash in

    // dom tree calculation

    return false;

  }


  if (isGCSafepointPoll(F)) {

    // Given we're inlining this inside of safepoint poll insertion, this

    // doesn't make any sense.  Note that we do make any contained calls

    // parseable after we inline a poll.

    return false;

  }


  if (!shouldRewriteFunction(F))

    return false;


  bool Modified = false;


  // In various bits below, we rely on the fact that uses are reachable from

  // defs.  When there are basic blocks unreachable from the entry, dominance

  // and reachablity queries return non-sensical results.  Thus, we preprocess

  // the function to ensure these properties hold.

  Modified |= removeUnreachableBlocks(F);


  // STEP 1 - Insert the safepoint polling locations.  We do not need to

  // actually insert parse points yet.  That will be done for all polls and

  // calls in a single pass.


  DominatorTree DT;

  DT.recalculate(F);


  SmallVector<Instruction *, 16> PollsNeeded;

  std::vector<CallBase *> ParsePointNeeded;


  if (enableBackedgeSafepoints(F)) {

    // Construct a pass manager to run the LoopPass backedge logic.  We

    // need the pass manager to handle scheduling all the loop passes

    // appropriately.  Doing this by hand is painful and just not worth messing

    // with for the moment.

    legacy::FunctionPassManager FPM(F.getParent());

    bool CanAssumeCallSafepoints = enableCallSafepoints(F);

    auto *PBS = new PlaceBackedgeSafepointsLegacyPass(CanAssumeCallSafepoints);

    FPM.add(PBS);

    FPM.run(F);


    // We preserve dominance information when inserting the poll, otherwise

    // we'd have to recalculate this on every insert

    DT.recalculate(F);


    auto &PollLocations = PBS->PollLocations;


    auto OrderByBBName = [](Instruction *a, Instruction *b) {

      return a->getParent()->getName() < b->getParent()->getName();

    };

    // We need the order of list to be stable so that naming ends up stable

    // when we split edges.  This makes test cases much easier to write.

    llvm::sort(PollLocations, OrderByBBName);


    // We can sometimes end up with duplicate poll locations.  This happens if

    // a single loop is visited more than once.   The fact this happens seems

    // wrong, but it does happen for the split-backedge.ll test case.

    PollLocations.erase(std::unique(PollLocations.begin(), PollLocations.end()),

                        PollLocations.end());


    // Insert a poll at each point the analysis pass identified

    // The poll location must be the terminator of a loop latch block.

    for (Instruction *Term : PollLocations) {

      // We are inserting a poll, the function is modified

      Modified = true;


      if (SplitBackedge) {

        // Split the backedge of the loop and insert the poll within that new

        // basic block.  This creates a loop with two latches per original

        // latch (which is non-ideal), but this appears to be easier to

        // optimize in practice than inserting the poll immediately before the

        // latch test.


        // Since this is a latch, at least one of the successors must dominate

        // it. Its possible that we have a) duplicate edges to the same header

        // and b) edges to distinct loop headers.  We need to insert pools on

        // each.

        SetVector<BasicBlock *> Headers;

        for (unsigned i = 0; i < Term->getNumSuccessors(); i++) {

          BasicBlock *Succ = Term->getSuccessor(i);

          if (DT.dominates(Succ, Term->getParent())) {

            Headers.insert(Succ);

          }

        }

        assert(!Headers.empty() && "poll location is not a loop latch?");


        // The split loop structure here is so that we only need to recalculate

        // the dominator tree once.  Alternatively, we could just keep it up to

        // date and use a more natural merged loop.

        SetVector<BasicBlock *> SplitBackedges;

        for (BasicBlock *Header : Headers) {

          BasicBlock *NewBB = SplitEdge(Term->getParent(), Header, &DT);

          PollsNeeded.push_back(NewBB->getTerminator());

          NumBackedgeSafepoints++;

        }

      } else {

        // Split the latch block itself, right before the terminator.

        PollsNeeded.push_back(Term);

        NumBackedgeSafepoints++;

      }

    }

  }


  if (enableEntrySafepoints(F)) {

    if (Instruction *Location = findLocationForEntrySafepoint(F, DT)) {

      PollsNeeded.push_back(Location);

      Modified = true;

      NumEntrySafepoints++;

    }

    // TODO: else we should assert that there was, in fact, a policy choice to

    // not insert a entry safepoint poll.

  }


  // Now that we've identified all the needed safepoint poll locations, insert

  // safepoint polls themselves.

  for (Instruction *PollLocation : PollsNeeded) {

    std::vector<CallBase *> RuntimeCalls;

    InsertSafepointPoll(PollLocation->getIterator(), RuntimeCalls, TLI);

    llvm::append_range(ParsePointNeeded, RuntimeCalls);

  }


  return Modified;

}


PreservedAnalyses PlaceSafepointsPass::run(Function &F,

                                           FunctionAnalysisManager &AM) {

  auto &TLI = AM.getResult<TargetLibraryAnalysis>(F);


  if (!runImpl(F, TLI))

    return PreservedAnalyses::all();


  // TODO: can we preserve more?

  return PreservedAnalyses::none();

}


static bool needsStatepoint(CallBase *Call, const TargetLibraryInfo &TLI) {

  if (callsGCLeafFunction(Call, TLI))

    return false;

  if (auto *CI = dyn_cast<CallInst>(Call)) {

    if (CI->isInlineAsm())

      return false;

  }


  return !(isa<GCStatepointInst>(Call) || isa<GCRelocateInst>(Call) ||

           isa<GCResultInst>(Call));

}


/// Returns true if this loop is known to contain a call safepoint which

/// must unconditionally execute on any iteration of the loop which returns

/// to the loop header via an edge from Pred.  Returns a conservative correct

/// answer; i.e. false is always valid.

static bool containsUnconditionalCallSafepoint(Loop *L, BasicBlock *Header,

                                               BasicBlock *Pred,

                                               DominatorTree &DT,

                                               const TargetLibraryInfo &TLI) {

  // In general, we're looking for any cut of the graph which ensures

  // there's a call safepoint along every edge between Header and Pred.

  // For the moment, we look only for the 'cuts' that consist of a single call

  // instruction in a block which is dominated by the Header and dominates the

  // loop latch (Pred) block.  Somewhat surprisingly, walking the entire chain

  // of such dominating blocks gets substantially more occurrences than just

  // checking the Pred and Header blocks themselves.  This may be due to the

  // density of loop exit conditions caused by range and null checks.

  // TODO: structure this as an analysis pass, cache the result for subloops,

  // avoid dom tree recalculations

  assert(DT.dominates(Header, Pred) && "loop latch not dominated by header?");


  BasicBlock *Current = Pred;

  while (true) {

    for (Instruction &I : *Current) {

      if (auto *Call = dyn_cast<CallBase>(&I))

        // Note: Technically, needing a safepoint isn't quite the right

        // condition here.  We should instead be checking if the target method

        // has an

        // unconditional poll. In practice, this is only a theoretical concern

        // since we don't have any methods with conditional-only safepoint

        // polls.

        if (needsStatepoint(Call, TLI))

          return true;

    }


    if (Current == Header)

      break;

    Current = DT.getNode(Current)->getIDom()->getBlock();

  }


  return false;

}


/// Returns true if this loop is known to terminate in a finite number of

/// iterations.  Note that this function may return false for a loop which

/// does actual terminate in a finite constant number of iterations due to

/// conservatism in the analysis.

static bool mustBeFiniteCountedLoop(Loop *L, ScalarEvolution *SE,

                                    BasicBlock *Pred) {

  // A conservative bound on the loop as a whole.

  const SCEV *MaxTrips = SE->getConstantMaxBackedgeTakenCount(L);

  if (!isa<SCEVCouldNotCompute>(MaxTrips) &&

      SE->getUnsignedRange(MaxTrips).getUnsignedMax().isIntN(

          CountedLoopTripWidth))

    return true;


  // If this is a conditional branch to the header with the alternate path

  // being outside the loop, we can ask questions about the execution frequency

  // of the exit block.

  if (L->isLoopExiting(Pred)) {

    // This returns an exact expression only.  TODO: We really only need an

    // upper bound here, but SE doesn't expose that.

    const SCEV *MaxExec = SE->getExitCount(L, Pred);

    if (!isa<SCEVCouldNotCompute>(MaxExec) &&

        SE->getUnsignedRange(MaxExec).getUnsignedMax().isIntN(

            CountedLoopTripWidth))

        return true;

  }


  return /* not finite */ false;

}


static void scanOneBB(Instruction *Start, Instruction *End,

                      std::vector<CallInst *> &Calls,

                      DenseSet<BasicBlock *> &Seen,

                      std::vector<BasicBlock *> &Worklist) {

  for (BasicBlock::iterator BBI(Start), BBE0 = Start->getParent()->end(),

                                        BBE1 = BasicBlock::iterator(End);

       BBI != BBE0 && BBI != BBE1; BBI++) {

    if (CallInst *CI = dyn_cast<CallInst>(&*BBI))

      Calls.push_back(CI);


    // FIXME: This code does not handle invokes

    assert(!isa<InvokeInst>(&*BBI) &&

           "support for invokes in poll code needed");


    // Only add the successor blocks if we reach the terminator instruction

    // without encountering end first

    if (BBI->isTerminator()) {

      BasicBlock *BB = BBI->getParent();

      for (BasicBlock *Succ : successors(BB)) {

        if (Seen.insert(Succ).second) {

          Worklist.push_back(Succ);

        }

      }

    }

  }

}


static void scanInlinedCode(Instruction *Start, Instruction *End,

                            std::vector<CallInst *> &Calls,

                            DenseSet<BasicBlock *> &Seen) {

  Calls.clear();

  std::vector<BasicBlock *> Worklist;

  Seen.insert(Start->getParent());

  scanOneBB(Start, End, Calls, Seen, Worklist);

  while (!Worklist.empty()) {

    BasicBlock *BB = Worklist.back();

    Worklist.pop_back();

    scanOneBB(&*BB->begin(), End, Calls, Seen, Worklist);

  }

}


/// Returns true if an entry safepoint is not required before this callsite in

/// the caller function.

static bool doesNotRequireEntrySafepointBefore(CallBase *Call) {

  if (IntrinsicInst *II = dyn_cast<IntrinsicInst>(Call)) {

    switch (II->getIntrinsicID()) {

    case Intrinsic::experimental_gc_statepoint:

    case Intrinsic::experimental_patchpoint_void:

    case Intrinsic::experimental_patchpoint:

      // The can wrap an actual call which may grow the stack by an unbounded

      // amount or run forever.

      return false;

    default:

      // Most LLVM intrinsics are things which do not expand to actual calls, or

      // at least if they do, are leaf functions that cause only finite stack

      // growth.  In particular, the optimizer likes to form things like memsets

      // out of stores in the original IR.  Another important example is

      // llvm.localescape which must occur in the entry block.  Inserting a

      // safepoint before it is not legal since it could push the localescape

      // out of the entry block.

      return true;

    }

  }

  return false;

}


static Instruction *findLocationForEntrySafepoint(Function &F,

                                                  DominatorTree &DT) {


  // Conceptually, this poll needs to be on method entry, but in

  // practice, we place it as late in the entry block as possible.  We

  // can place it as late as we want as long as it dominates all calls

  // that can grow the stack.  This, combined with backedge polls,

  // give us all the progress guarantees we need.


  // hasNextInstruction and nextInstruction are used to iterate

  // through a "straight line" execution sequence.


  auto HasNextInstruction = [](Instruction *I) {

    if (!I->isTerminator())

      return true;


    BasicBlock *nextBB = I->getParent()->getUniqueSuccessor();

    return nextBB && (nextBB->getUniquePredecessor() != nullptr);

  };


  auto NextInstruction = [&](Instruction *I) {

    assert(HasNextInstruction(I) &&

           "first check if there is a next instruction!");


    if (I->isTerminator())

      return &I->getParent()->getUniqueSuccessor()->front();

    return &*++I->getIterator();

  };


  Instruction *Cursor = nullptr;

  for (Cursor = &F.getEntryBlock().front(); HasNextInstruction(Cursor);

       Cursor = NextInstruction(Cursor)) {


    // We need to ensure a safepoint poll occurs before any 'real' call.  The

    // easiest way to ensure finite execution between safepoints in the face of

    // recursive and mutually recursive functions is to enforce that each take

    // a safepoint.  Additionally, we need to ensure a poll before any call

    // which can grow the stack by an unbounded amount.  This isn't required

    // for GC semantics per se, but is a common requirement for languages

    // which detect stack overflow via guard pages and then throw exceptions.

    if (auto *Call = dyn_cast<CallBase>(Cursor)) {

      if (doesNotRequireEntrySafepointBefore(Call))

        continue;

      break;

    }

  }


  assert((HasNextInstruction(Cursor) || Cursor->isTerminator()) &&

         "either we stopped because of a call, or because of terminator");


  return Cursor;

}


const char GCSafepointPollName[] = "gc.safepoint_poll";


static bool isGCSafepointPoll(Function &F) {

  return F.getName().equals(GCSafepointPollName);

}


/// Returns true if this function should be rewritten to include safepoint

/// polls and parseable call sites.  The main point of this function is to be

/// an extension point for custom logic.

static bool shouldRewriteFunction(Function &F) {

  // TODO: This should check the GCStrategy

  if (F.hasGC()) {

    const auto &FunctionGCName = F.getGC();

    const StringRef StatepointExampleName("statepoint-example");

    const StringRef CoreCLRName("coreclr");

    return (StatepointExampleName == FunctionGCName) ||

           (CoreCLRName == FunctionGCName);

  } else

    return false;

}


// TODO: These should become properties of the GCStrategy, possibly with

// command line overrides.

static bool enableEntrySafepoints(Function &F) { return !NoEntry; }

static bool enableBackedgeSafepoints(Function &F) { return !NoBackedge; }

static bool enableCallSafepoints(Function &F) { return !NoCall; }


// Insert a safepoint poll immediately before the given instruction.  Does

// not handle the parsability of state at the runtime call, that's the

// callers job.

static void

InsertSafepointPoll(BasicBlock::iterator InsertBefore,

                    std::vector<CallBase *> &ParsePointsNeeded /*rval*/,

                    const TargetLibraryInfo &TLI) {

  BasicBlock *OrigBB = InsertBefore->getParent();

  Module *M = InsertBefore->getModule();

  assert(M && "must be part of a module");


  // Inline the safepoint poll implementation - this will get all the branch,

  // control flow, etc..  Most importantly, it will introduce the actual slow

  // path call - where we need to insert a safepoint (parsepoint).


  auto *F = M->getFunction(GCSafepointPollName);

  assert(F && "gc.safepoint_poll function is missing");

  assert(F->getValueType() ==

         FunctionType::get(Type::getVoidTy(M->getContext()), false) &&

         "gc.safepoint_poll declared with wrong type");

  assert(!F->empty() && "gc.safepoint_poll must be a non-empty function");

  CallInst *PollCall = CallInst::Create(F, "", InsertBefore);


  // Record some information about the call site we're replacing

  BasicBlock::iterator Before(PollCall), After(PollCall);

  bool IsBegin = false;

  if (Before == OrigBB->begin())

    IsBegin = true;

  else

    Before--;


  After++;

  assert(After != OrigBB->end() && "must have successor");


  // Do the actual inlining

  InlineFunctionInfo IFI;

  bool InlineStatus = InlineFunction(*PollCall, IFI).isSuccess();

  assert(InlineStatus && "inline must succeed");

  (void)InlineStatus; // suppress warning in release-asserts


  // Check post-conditions

  assert(IFI.StaticAllocas.empty() && "can't have allocs");


  std::vector<CallInst *> Calls; // new calls

  DenseSet<BasicBlock *> BBs;    // new BBs + insertee


  // Include only the newly inserted instructions, Note: begin may not be valid

  // if we inserted to the beginning of the basic block

  BasicBlock::iterator Start = IsBegin ? OrigBB->begin() : std::next(Before);


  // If your poll function includes an unreachable at the end, that's not

  // valid.  Bugpoint likes to create this, so check for it.

  assert(isPotentiallyReachable(&*Start, &*After) &&

         "malformed poll function");


  scanInlinedCode(&*Start, &*After, Calls, BBs);

  assert(!Calls.empty() && "slow path not found for safepoint poll");


  // Record the fact we need a parsable state at the runtime call contained in

  // the poll function.  This is required so that the runtime knows how to

  // parse the last frame when we actually take  the safepoint (i.e. execute

  // the slow path)

  assert(ParsePointsNeeded.empty());

  for (auto *CI : Calls) {

    // No safepoint needed or wanted

    if (!needsStatepoint(CI, TLI))

      continue;


    // These are likely runtime calls.  Should we assert that via calling

    // convention or something?

    ParsePointsNeeded.push_back(CI);

  }

  assert(ParsePointsNeeded.size() <= Calls.size());

}

const
aarch64 promote const
Definition: AArch64PromoteConstant.cpp:232

vector
AMDGPU promote alloca to vector or false DEBUG_TYPE to vector
Definition: AMDGPUPromoteAlloca.cpp:214

CFG.h

BasicBlockUtils.h

Cloning.h

CommandLine.h

Debug.h

LLVM_DEBUG
#define LLVM_DEBUG(X)
Definition: Debug.h:101

Dominators.h

End
bool End
Definition: ELF_riscv.cpp:480

InitializePasses.h

IntrinsicInst.h

LegacyPassManager.h

LoopDeletionResult::Modified
@ Modified

LoopInfo.h

F
#define F(x, y, z)
Definition: MD5.cpp:55

I
#define I(x, y, z)
Definition: MD5.cpp:58

INITIALIZE_PASS_DEPENDENCY
#define INITIALIZE_PASS_DEPENDENCY(depName)
Definition: PassSupport.h:55

INITIALIZE_PASS_END
#define INITIALIZE_PASS_END(passName, arg, name, cfg, analysis)
Definition: PassSupport.h:59

INITIALIZE_PASS_BEGIN
#define INITIALIZE_PASS_BEGIN(passName, arg, name, cfg, analysis)
Definition: PassSupport.h:52

Pass.h

InsertSafepointPoll
static void InsertSafepointPoll(BasicBlock::iterator InsertBefore, std::vector< CallBase * > &ParsePointsNeeded, const TargetLibraryInfo &TLI)
Definition: PlaceSafepoints.cpp:622

GCSafepointPollName
const char GCSafepointPollName[]
Definition: PlaceSafepoints.cpp:591

AllBackedges
static cl::opt< bool > AllBackedges("spp-all-backedges", cl::Hidden, cl::init(false))

mustBeFiniteCountedLoop
static bool mustBeFiniteCountedLoop(Loop *L, ScalarEvolution *SE, BasicBlock *Pred)
Returns true if this loop is known to terminate in a finite number of iterations.
Definition: PlaceSafepoints.cpp:447

enableCallSafepoints
static bool enableCallSafepoints(Function &F)
Definition: PlaceSafepoints.cpp:616

enableEntrySafepoints
static bool enableEntrySafepoints(Function &F)
Definition: PlaceSafepoints.cpp:614

NoEntry
static cl::opt< bool > NoEntry("spp-no-entry", cl::Hidden, cl::init(false))

isGCSafepointPoll
static bool isGCSafepointPoll(Function &F)
Definition: PlaceSafepoints.cpp:593

shouldRewriteFunction
static bool shouldRewriteFunction(Function &F)
Returns true if this function should be rewritten to include safepoint polls and parseable call sites...
Definition: PlaceSafepoints.cpp:600

needsStatepoint
static bool needsStatepoint(CallBase *Call, const TargetLibraryInfo &TLI)
Definition: PlaceSafepoints.cpp:389

scanInlinedCode
static void scanInlinedCode(Instruction *Start, Instruction *End, std::vector< CallInst * > &Calls, DenseSet< BasicBlock * > &Seen)
Definition: PlaceSafepoints.cpp:499

findLocationForEntrySafepoint
static Instruction * findLocationForEntrySafepoint(Function &F, DominatorTree &DT)
Definition: PlaceSafepoints.cpp:538

SplitBackedge
static cl::opt< bool > SplitBackedge("spp-split-backedge", cl::Hidden, cl::init(false))

containsUnconditionalCallSafepoint
place backedge safepoints Place Backedge static false bool containsUnconditionalCallSafepoint(Loop *L, BasicBlock *Header, BasicBlock *Pred, DominatorTree &DT, const TargetLibraryInfo &TLI)
Returns true if this loop is known to contain a call safepoint which must unconditionally execute on ...
Definition: PlaceSafepoints.cpp:405

doesNotRequireEntrySafepointBefore
static bool doesNotRequireEntrySafepointBefore(CallBase *Call)
Returns true if an entry safepoint is not required before this callsite in the caller function.
Definition: PlaceSafepoints.cpp:515

NoCall
static cl::opt< bool > NoCall("spp-no-call", cl::Hidden, cl::init(false))

impl
place backedge safepoints impl
Definition: PlaceSafepoints.cpp:172

NoBackedge
static cl::opt< bool > NoBackedge("spp-no-backedge", cl::Hidden, cl::init(false))

Safepoints
place backedge safepoints Place Backedge Safepoints
Definition: PlaceSafepoints.cpp:173

enableBackedgeSafepoints
static bool enableBackedgeSafepoints(Function &F)
Definition: PlaceSafepoints.cpp:615

CountedLoopTripWidth
static cl::opt< int > CountedLoopTripWidth("spp-counted-loop-trip-width", cl::Hidden, cl::init(32))
How narrow does the trip count of a loop have to be to have to be considered "counted"?...

scanOneBB
static void scanOneBB(Instruction *Start, Instruction *End, std::vector< CallInst * > &Calls, DenseSet< BasicBlock * > &Seen, std::vector< BasicBlock * > &Worklist)
Definition: PlaceSafepoints.cpp:472

PlaceSafepoints.h

assert
assert(ImpDefSCC.getReg()==AMDGPU::SCC &&ImpDefSCC.isDef())

ScalarEvolution.h

Scalar.h

SetVector.h
This file implements a set that has insertion order iteration characteristics.

IRDumpFileSuffixType::After
@ After

IRDumpFileSuffixType::Before
@ Before

Statepoint.h

Statistic.h
This file defines the 'Statistic' class, which is designed to be an easy way to expose various metric...

STATISTIC
#define STATISTIC(VARNAME, DESC)
Definition: Statistic.h:167

TargetLibraryInfo.h

Local.h

llvm::APInt::isIntN
bool isIntN(unsigned N) const
Check if this APInt has an N-bits unsigned integer value.
Definition: APInt.h:410

llvm::AnalysisManager
A container for analyses that lazily runs them and caches their results.
Definition: PassManager.h:321

llvm::AnalysisManager::getResult
PassT::Result & getResult(IRUnitT &IR, ExtraArgTs... ExtraArgs)
Get the result of an analysis pass for a given IR unit.
Definition: PassManager.h:473

llvm::AnalysisUsage
Represent the analysis usage information of a pass.
Definition: PassAnalysisSupport.h:47

llvm::AnalysisUsage::addRequired
AnalysisUsage & addRequired()
Definition: PassAnalysisSupport.h:75

llvm::AnalysisUsage::setPreservesAll
void setPreservesAll()
Set by analyses that do not transform their input at all.
Definition: PassAnalysisSupport.h:130

llvm::BasicBlock
LLVM Basic Block Representation.
Definition: BasicBlock.h:60

llvm::BasicBlock::end
iterator end()
Definition: BasicBlock.h:443

llvm::BasicBlock::begin
iterator begin()
Instruction iterator methods.
Definition: BasicBlock.h:430

llvm::BasicBlock::getUniquePredecessor
const BasicBlock * getUniquePredecessor() const
Return the predecessor of this block if it has a unique predecessor block.
Definition: BasicBlock.cpp:460

llvm::BasicBlock::getParent
const Function * getParent() const
Return the enclosing method, or null if none.
Definition: BasicBlock.h:206

llvm::BasicBlock::iterator
InstListType::iterator iterator
Instruction iterators...
Definition: BasicBlock.h:165

llvm::BasicBlock::getTerminator
const Instruction * getTerminator() const LLVM_READONLY
Returns the terminator instruction if the block is well formed or null if the block is not well forme...
Definition: BasicBlock.h:221

llvm::BasicBlock::back
const Instruction & back() const
Definition: BasicBlock.h:455

llvm::CallBase
Base class for all callable instructions (InvokeInst and CallInst) Holds everything related to callin...
Definition: InstrTypes.h:1494

llvm::CallInst
This class represents a function call, abstracting a target machine's calling convention.
Definition: Instructions.h:1565

llvm::CallInst::Create
static CallInst * Create(FunctionType *Ty, Value *F, const Twine &NameStr, BasicBlock::iterator InsertBefore)
Definition: Instructions.h:1620

llvm::ConstantRange::getUnsignedMax
APInt getUnsignedMax() const
Return the largest unsigned value contained in the ConstantRange.
Definition: ConstantRange.cpp:426

llvm::DenseSet
Implements a dense probed hash-table based set.
Definition: DenseSet.h:271

llvm::DomTreeNodeBase::getIDom
DomTreeNodeBase * getIDom() const
Definition: GenericDomTree.h:90

llvm::DomTreeNodeBase::getBlock
NodeT * getBlock() const
Definition: GenericDomTree.h:89

llvm::DominatorTreeBase::recalculate
void recalculate(ParentType &Func)
recalculate - compute a dominator tree for the given function
Definition: GenericDomTree.h:795

llvm::DominatorTreeBase::getNode
DomTreeNodeBase< NodeT > * getNode(const NodeT *BB) const
getNode - return the (Post)DominatorTree node for the specified basic block.
Definition: GenericDomTree.h:367

llvm::DominatorTreeWrapperPass
Legacy analysis pass which computes a DominatorTree.
Definition: Dominators.h:317

llvm::DominatorTree
Concrete subclass of DominatorTreeBase that is used to compute a normal dominator tree.
Definition: Dominators.h:162

llvm::DominatorTree::dominates
bool dominates(const BasicBlock *BB, const Use &U) const
Return true if the (end of the) basic block BB dominates the use U.
Definition: Dominators.cpp:122

llvm::FunctionPass
FunctionPass class - This class is used to implement most global optimizations.
Definition: Pass.h:311

llvm::FunctionPass::runOnFunction
virtual bool runOnFunction(Function &F)=0
runOnFunction - Virtual method overriden by subclasses to do the per-function processing of the pass.

llvm::FunctionType::get
static FunctionType * get(Type *Result, ArrayRef< Type * > Params, bool isVarArg)
This static method is the primary way of constructing a FunctionType.

llvm::Function
Definition: Function.h:62

llvm::InlineFunctionInfo
This class captures the data input to the InlineFunction call, and records the auxiliary results prod...
Definition: Cloning.h:202

llvm::InlineFunctionInfo::StaticAllocas
SmallVector< AllocaInst *, 4 > StaticAllocas
InlineFunction fills this in with all static allocas that get copied into the caller.
Definition: Cloning.h:220

llvm::InlineResult::isSuccess
bool isSuccess() const
Definition: InlineCost.h:189

llvm::Instruction
Definition: Instruction.h:49

llvm::Instruction::getParent
const BasicBlock * getParent() const
Definition: Instruction.h:152

llvm::Instruction::isTerminator
bool isTerminator() const
Definition: Instruction.h:255

llvm::IntrinsicInst
A wrapper class for inspecting calls to intrinsic functions.
Definition: IntrinsicInst.h:47

llvm::LoopInfoWrapperPass
The legacy pass manager's analysis pass to compute loop information.
Definition: LoopInfo.h:593

llvm::LoopInfo
Definition: LoopInfo.h:407

llvm::Loop
Represents a single loop in the control flow graph.
Definition: LoopInfo.h:44

llvm::Module
A Module instance is used to store all the information related to an LLVM module.
Definition: Module.h:65

llvm::PassRegistry::getPassRegistry
static PassRegistry * getPassRegistry()
getPassRegistry - Access the global registry object, which is automatically initialized at applicatio...
Definition: PassRegistry.cpp:24

llvm::Pass::getAnalysisUsage
virtual void getAnalysisUsage(AnalysisUsage &) const
getAnalysisUsage - This function should be overriden by passes that need analysis information to do t...
Definition: Pass.cpp:98

llvm::PlaceSafepointsPass::run
PreservedAnalyses run(Function &F, FunctionAnalysisManager &AM)
Definition: PlaceSafepoints.cpp:378

llvm::PlaceSafepointsPass::runImpl
bool runImpl(Function &F, const TargetLibraryInfo &TLI)
Definition: PlaceSafepoints.cpp:249

llvm::PreservedAnalyses
A set of analyses that are preserved following a run of a transformation pass.
Definition: Analysis.h:109

llvm::PreservedAnalyses::none
static PreservedAnalyses none()
Convenience factory function for the empty preserved set.
Definition: Analysis.h:112

llvm::PreservedAnalyses::all
static PreservedAnalyses all()
Construct a special preserved set that preserves all passes.
Definition: Analysis.h:115

llvm::SCEV
This class represents an analyzed expression in the program.
Definition: ScalarEvolution.h:75

llvm::ScalarEvolutionWrapperPass
Definition: ScalarEvolution.h:2273

llvm::ScalarEvolution
The main scalar evolution driver.
Definition: ScalarEvolution.h:452

llvm::ScalarEvolution::getConstantMaxBackedgeTakenCount
const SCEV * getConstantMaxBackedgeTakenCount(const Loop *L)
When successful, this returns a SCEVConstant that is greater than or equal to (i.e.
Definition: ScalarEvolution.h:903

llvm::ScalarEvolution::getUnsignedRange
ConstantRange getUnsignedRange(const SCEV *S)
Determine the unsigned range for a particular SCEV.
Definition: ScalarEvolution.h:979

llvm::ScalarEvolution::getExitCount
const SCEV * getExitCount(const Loop *L, const BasicBlock *ExitingBlock, ExitCountKind Kind=Exact)
Return the number of times the backedge executes before the given exit would be taken; if not exactly...
Definition: ScalarEvolution.cpp:8265

llvm::SetVector
A vector that has set insertion semantics.
Definition: SetVector.h:57

llvm::SetVector::empty
bool empty() const
Determine if the SetVector is empty or not.
Definition: SetVector.h:93

llvm::SetVector::insert
bool insert(const value_type &X)
Insert a new element into the SetVector.
Definition: SetVector.h:162

llvm::SmallVectorTemplateBase::push_back
void push_back(const T &Elt)
Definition: SmallVector.h:426

llvm::SmallVector
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
Definition: SmallVector.h:1209

llvm::StringRef
StringRef - Represent a constant reference to a string, i.e.
Definition: StringRef.h:50

llvm::TargetLibraryAnalysis
Analysis pass providing the TargetLibraryInfo.
Definition: TargetLibraryInfo.h:599

llvm::TargetLibraryInfoWrapperPass
Definition: TargetLibraryInfo.h:624

llvm::TargetLibraryInfo
Provides information about what library functions are available for the current target.
Definition: TargetLibraryInfo.h:281

llvm::Type::getVoidTy
static Type * getVoidTy(LLVMContext &C)

llvm::Value::getName
StringRef getName() const
Return a constant reference to the value's name.
Definition: Value.cpp:309

llvm::cl::opt
Definition: CommandLine.h:1430

llvm::detail::DenseSetImpl::insert
std::pair< iterator, bool > insert(const ValueT &V)
Definition: DenseSet.h:206

llvm::legacy::FunctionPassManager
FunctionPassManager manages FunctionPasses.
Definition: LegacyPassManager.h:71

llvm::legacy::FunctionPassManager::run
bool run(Function &F)
run - Execute all of the passes scheduled for execution.
Definition: LegacyPassManager.cpp:1349

llvm::legacy::FunctionPassManager::add
void add(Pass *P) override
Add a pass to the queue of passes to run.
Definition: LegacyPassManager.cpp:1341

unsigned

false
Definition: StackSlotColoring.cpp:184

llvm::CallingConv::ID
unsigned ID
LLVM IR allows to use arbitrary numbers as calling convention identifiers.
Definition: CallingConv.h:24

llvm::cl::Hidden
@ Hidden
Definition: CommandLine.h:138

llvm::cl::init
initializer< Ty > init(const Ty &Val)
Definition: CommandLine.h:450

llvm
This is an optimization pass for GlobalISel generic memory operations.
Definition: AddressRanges.h:18

llvm::successors
auto successors(const MachineBasicBlock *BB)
Definition: MachineBasicBlock.h:1306

llvm::append_range
void append_range(Container &C, Range &&R)
Wrapper function to append range R to container C.
Definition: STLExtras.h:2073

llvm::initializePlaceBackedgeSafepointsLegacyPassPass
void initializePlaceBackedgeSafepointsLegacyPassPass(PassRegistry &)

llvm::sort
void sort(IteratorTy Start, IteratorTy End)
Definition: STLExtras.h:1647

llvm::dbgs
raw_ostream & dbgs()
dbgs() - This returns a reference to a raw_ostream for debugging messages.
Definition: Debug.cpp:163

llvm::InlineFunction
InlineResult InlineFunction(CallBase &CB, InlineFunctionInfo &IFI, bool MergeAttributes=false, AAResults *CalleeAAR=nullptr, bool InsertLifetime=true, Function *ForwardVarArgsTo=nullptr)
This function inlines the called function into the basic block of the caller.
Definition: InlineFunction.cpp:2032

llvm::SplitEdge
BasicBlock * SplitEdge(BasicBlock *From, BasicBlock *To, DominatorTree *DT=nullptr, LoopInfo *LI=nullptr, MemorySSAUpdater *MSSAU=nullptr, const Twine &BBName="")
Split the edge connecting the specified blocks, and return the newly created basic block between From...
Definition: BasicBlockUtils.cpp:761

llvm::removeUnreachableBlocks
bool removeUnreachableBlocks(Function &F, DomTreeUpdater *DTU=nullptr, MemorySSAUpdater *MSSAU=nullptr)
Remove all blocks that can not be reached from the function's entry.
Definition: Local.cpp:3197

llvm::callsGCLeafFunction
bool callsGCLeafFunction(const CallBase *Call, const TargetLibraryInfo &TLI)
Return true if this call calls a gc leaf function.
Definition: Local.cpp:3484

llvm::isPotentiallyReachable
bool isPotentiallyReachable(const Instruction *From, const Instruction *To, const SmallPtrSetImpl< BasicBlock * > *ExclusionSet=nullptr, const DominatorTree *DT=nullptr, const LoopInfo *LI=nullptr)
Determine whether instruction 'To' is reachable from 'From', without passing through any blocks in Ex...
Definition: CFG.cpp:231

std
Implement std::hash so that hash_code can be used in STL containers.
Definition: BitVector.h:858