doxygen/PostRASchedulerList_8cpp_source.html

//===----- PostRASchedulerList.cpp - list scheduler -----------------------===//

//

// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.

// See https://llvm.org/LICENSE.txt for license information.

// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception

//

//===----------------------------------------------------------------------===//

//

// This implements a top-down list scheduler, using standard algorithms.

// The basic approach uses a priority queue of available nodes to schedule.

// One at a time, nodes are taken from the priority queue (thus in priority

// order), checked for legality to schedule, and emitted if legal.

//

// Nodes may not be legal to schedule either due to structural hazards (e.g.

// pipeline or resource constraints) or because an input to the instruction has

// not completed execution.

//

//===----------------------------------------------------------------------===//


#include "llvm/ADT/Statistic.h"

#include "llvm/Analysis/AliasAnalysis.h"

#include "llvm/CodeGen/AntiDepBreaker.h"

#include "llvm/CodeGen/LatencyPriorityQueue.h"

#include "llvm/CodeGen/MachineDominators.h"

#include "llvm/CodeGen/MachineFunctionPass.h"

#include "llvm/CodeGen/MachineLoopInfo.h"

#include "llvm/CodeGen/MachineRegisterInfo.h"

#include "llvm/CodeGen/RegisterClassInfo.h"

#include "llvm/CodeGen/ScheduleDAGInstrs.h"

#include "llvm/CodeGen/ScheduleDAGMutation.h"

#include "llvm/CodeGen/ScheduleHazardRecognizer.h"

#include "llvm/CodeGen/TargetInstrInfo.h"

#include "llvm/CodeGen/TargetPassConfig.h"

#include "llvm/CodeGen/TargetSubtargetInfo.h"

#include "llvm/Config/llvm-config.h"

#include "llvm/InitializePasses.h"

#include "llvm/Pass.h"

#include "llvm/Support/CommandLine.h"

#include "llvm/Support/Debug.h"

#include "llvm/Support/ErrorHandling.h"

#include "llvm/Support/raw_ostream.h"

using namespace llvm;


#define DEBUG_TYPE "post-RA-sched"


STATISTIC(NumNoops, "Number of noops inserted");

STATISTIC(NumStalls, "Number of pipeline stalls");

STATISTIC(NumFixedAnti, "Number of fixed anti-dependencies");


// Post-RA scheduling is normally enabled per target through
// TargetSubtargetInfo::enablePostRAScheduler(). When this flag appears
// explicitly on the command line, its value overrides the target's choice
// (see enablePostRAScheduler() below, which tests getPosition()).

static cl::opt<bool>

EnablePostRAScheduler("post-RA-scheduler",

                       cl::desc("Enable scheduling after register allocation"),

                       cl::init(false), cl::Hidden);

// Anti-dependency breaking mode override. When given explicitly, the pass maps
// "all" and "critical" to the matching AntiDepBreakMode and every other value
// to ANTIDEP_NONE, replacing the mode reported by the subtarget.

static cl::opt<std::string>

EnableAntiDepBreaking("break-anti-dependencies",

                      cl::desc("Break post-RA scheduling anti-dependencies: "

                               "\"critical\", \"all\", or \"none\""),

                      cl::init("none"), cl::Hidden);


// Debugging aid, only honored in builds without NDEBUG: if DebugDiv > 0 then
// only the basic blocks whose running visit counter satisfies
// (counter % DebugDiv) == DebugMod are scheduled.

static cl::opt<int>

DebugDiv("postra-sched-debugdiv",

                      cl::desc("Debug control MBBs that are scheduled"),

                      cl::init(0), cl::Hidden);

// Remainder selected by the DebugDiv filter described above.

static cl::opt<int>

DebugMod("postra-sched-debugmod",

                      cl::desc("Debug control MBBs that are scheduled"),

                      cl::init(0), cl::Hidden);


// Out-of-line definition of AntiDepBreaker's virtual destructor.
AntiDepBreaker::~AntiDepBreaker() = default;


namespace {

  /// MachineFunctionPass that runs the post-RA list scheduler over each basic
  /// block of a function.
  class PostRAScheduler : public MachineFunctionPass {
    /// Target instruction info, set at the start of runOnMachineFunction.
    const TargetInstrInfo *TII = nullptr;
    /// Register class information handed to the scheduler.
    RegisterClassInfo RegClassInfo;

  public:
    static char ID;
    PostRAScheduler() : MachineFunctionPass(ID) {}

    /// Declare the analyses this pass requires and the ones it preserves.
    void getAnalysisUsage(AnalysisUsage &AU) const override {
      AU.setPreservesCFG();
      AU.addRequired<AAResultsWrapperPass>()
          .addRequired<TargetPassConfig>()
          .addRequired<MachineDominatorTreeWrapperPass>()
          .addPreserved<MachineDominatorTreeWrapperPass>()
          .addRequired<MachineLoopInfoWrapperPass>()
          .addPreserved<MachineLoopInfoWrapperPass>();
      MachineFunctionPass::getAnalysisUsage(AU);
    }

    /// The pass requires the NoVRegs machine-function property.
    MachineFunctionProperties getRequiredProperties() const override {
      MachineFunctionProperties Required;
      Required.set(MachineFunctionProperties::Property::NoVRegs);
      return Required;
    }

    bool runOnMachineFunction(MachineFunction &Fn) override;
  };
  char PostRAScheduler::ID = 0;


  /// Top-down list scheduler over machine instructions, driven region by
  /// region by PostRAScheduler::runOnMachineFunction.
  class SchedulePostRATDList : public ScheduleDAGInstrs {
    /// AvailableQueue - The priority queue to use for the available SUnits.
    ///
    LatencyPriorityQueue AvailableQueue;

    /// PendingQueue - This contains all of the instructions whose operands have
    /// been issued, but their results are not ready yet (due to the latency of
    /// the operation).  Once the operands become available, the instruction is
    /// added to the AvailableQueue.
    std::vector<SUnit*> PendingQueue;

    /// HazardRec - The hazard recognizer to use. Created in the constructor
    /// and deleted in the destructor.
    ScheduleHazardRecognizer *HazardRec = nullptr;

    /// AntiDepBreak - Anti-dependence breaking object, or null if none.
    /// Deleted in the destructor.
    AntiDepBreaker *AntiDepBreak = nullptr;

    /// AA - AliasAnalysis for making memory reference queries.
    AliasAnalysis *AA = nullptr;

    /// The schedule. Null SUnit*'s represent noop instructions.
    std::vector<SUnit*> Sequence;

    /// Ordered list of DAG postprocessing steps.
    std::vector<std::unique_ptr<ScheduleDAGMutation>> Mutations;

    /// The index in BB of RegionEnd.
    ///
    /// This is the instruction number from the top of the current block, not
    /// the SlotIndex. It is only used by the AntiDepBreaker.
    unsigned EndIndex = 0;

  public:
    SchedulePostRATDList(
        MachineFunction &MF, MachineLoopInfo &MLI, AliasAnalysis *AA,
        const RegisterClassInfo &,
        TargetSubtargetInfo::AntiDepBreakMode AntiDepMode,
        SmallVectorImpl<const TargetRegisterClass *> &CriticalPathRCs);

    ~SchedulePostRATDList() override;

    /// startBlock - Initialize register live-range state for scheduling in
    /// this block.
    ///
    void startBlock(MachineBasicBlock *BB) override;

    /// Set the index of RegionEnd within the current BB.
    void setEndIndex(unsigned EndIdx) { EndIndex = EndIdx; }

    /// Initialize the scheduler state for the next scheduling region.
    void enterRegion(MachineBasicBlock *bb,
                     MachineBasicBlock::iterator begin,
                     MachineBasicBlock::iterator end,
                     unsigned regioninstrs) override;

    /// Notify that the scheduler has finished scheduling the current region.
    void exitRegion() override;

    /// Schedule - Schedule the instruction range using list scheduling.
    ///
    void schedule() override;

    /// Emit the machine code of the current region in scheduled order.
    void EmitSchedule();

    /// Observe - Update liveness information to account for the current
    /// instruction, which will not be scheduled.
    ///
    void Observe(MachineInstr &MI, unsigned Count);

    /// finishBlock - Clean up register live-range state.
    ///
    void finishBlock() override;

  private:
    /// Apply each ScheduleDAGMutation step in order.
    void postProcessDAG();

    void ReleaseSucc(SUnit *SU, SDep *SuccEdge);
    void ReleaseSuccessors(SUnit *SU);
    void ScheduleNodeTopDown(SUnit *SU, unsigned CurCycle);
    void ListScheduleTopDown();

    /// Print the scheduled Sequence; only defined in builds with dump support.
    void dumpSchedule() const;
    /// Append a noop to the current instruction sequence.
    void emitNoop(unsigned CurCycle);
  };

}


// Expose the pass identifier under the llvm namespace; it aliases
// PostRAScheduler::ID.
char &llvm::PostRASchedulerID = PostRAScheduler::ID;


// Register the pass under the DEBUG_TYPE argument string. The two trailing
// `false` values are the macro's `cfg` and `analysis` parameters.
INITIALIZE_PASS(PostRAScheduler, DEBUG_TYPE,

                "Post RA top-down list latency scheduler", false, false)


/// Build a scheduler for \p MF: create the target's post-RA hazard recognizer,
/// collect the subtarget's post-RA DAG mutations, and instantiate the
/// anti-dependency breaker selected by \p AntiDepMode (none for any mode other
/// than ANTIDEP_ALL / ANTIDEP_CRITICAL).
SchedulePostRATDList::SchedulePostRATDList(
    MachineFunction &MF, MachineLoopInfo &MLI, AliasAnalysis *AA,
    const RegisterClassInfo &RCI,
    TargetSubtargetInfo::AntiDepBreakMode AntiDepMode,
    SmallVectorImpl<const TargetRegisterClass *> &CriticalPathRCs)
    : ScheduleDAGInstrs(MF, &MLI), AA(AA) {
  const TargetSubtargetInfo &ST = MF.getSubtarget();

  const InstrItineraryData *Itineraries = ST.getInstrItineraryData();
  HazardRec = ST.getInstrInfo()->CreateTargetPostRAHazardRecognizer(
      Itineraries, this);
  ST.getPostRAMutations(Mutations);

  assert((AntiDepMode == TargetSubtargetInfo::ANTIDEP_NONE ||
          MRI.tracksLiveness()) &&
         "Live-ins must be accurate for anti-dependency breaking");

  // Pick the breaker implementation that matches the requested mode.
  if (AntiDepMode == TargetSubtargetInfo::ANTIDEP_ALL)
    AntiDepBreak = createAggressiveAntiDepBreaker(MF, RCI, CriticalPathRCs);
  else if (AntiDepMode == TargetSubtargetInfo::ANTIDEP_CRITICAL)
    AntiDepBreak = createCriticalAntiDepBreaker(MF, RCI);
  else
    AntiDepBreak = nullptr;
}


/// Release the hazard recognizer and the anti-dependency breaker that the
/// constructor created. AntiDepBreak may be null; deleting a null pointer is
/// a no-op.
SchedulePostRATDList::~SchedulePostRATDList() {

  delete HazardRec;

  delete AntiDepBreak;

}


/// Initialize state associated with the next scheduling region: forward the
/// region description to the base class, then drop the schedule left over
/// from the previous region.
void SchedulePostRATDList::enterRegion(MachineBasicBlock *bb,

                 MachineBasicBlock::iterator begin,

                 MachineBasicBlock::iterator end,

                 unsigned regioninstrs) {

  ScheduleDAGInstrs::enterRegion(bb, begin, end, regioninstrs);

  // Start the new region with an empty instruction sequence.
  Sequence.clear();

}


/// Print the schedule before exiting the region.

void SchedulePostRATDList::exitRegion() {

  LLVM_DEBUG({

    dbgs() << "*** Final schedule ***\n";

    dumpSchedule();

    dbgs() << '\n';

  });

  ScheduleDAGInstrs::exitRegion();

}


#if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)
/// dumpSchedule - Print every entry of the scheduled Sequence; a null entry
/// stands for a noop.
LLVM_DUMP_METHOD void SchedulePostRATDList::dumpSchedule() const {
  for (const SUnit *Entry : Sequence) {
    if (!Entry) {
      dbgs() << "**** NOOP ****\n";
      continue;
    }
    dumpNode(*Entry);
  }
}
#endif


/// Decide whether post-RA scheduling should run. An explicit command-line
/// setting of the flag wins; otherwise the subtarget must enable the scheduler
/// and \p OptLevel must reach the subtarget's threshold.
static bool enablePostRAScheduler(const TargetSubtargetInfo &ST,
                                  CodeGenOptLevel OptLevel) {
  // A non-zero position means the option was given explicitly.
  const bool SetOnCommandLine = EnablePostRAScheduler.getPosition() > 0;
  if (SetOnCommandLine)
    return EnablePostRAScheduler;

  if (!ST.enablePostRAScheduler())
    return false;
  return OptLevel >= ST.getOptLevelToEnablePostRAScheduler();
}


/// Schedule every basic block of \p Fn. Each block is walked bottom-up and cut
/// into regions at calls and target scheduling boundaries; every region is
/// list-scheduled and re-emitted. Returns false if the function is skipped or
/// post-RA scheduling is disabled, true otherwise.
bool PostRAScheduler::runOnMachineFunction(MachineFunction &Fn) {
  if (skipFunction(Fn.getFunction()))
    return false;

  const auto &Subtarget = Fn.getSubtarget();
  TargetPassConfig &PassConfig = getAnalysis<TargetPassConfig>();
  // Bail out unless post-RA scheduling is enabled for this target.
  if (!enablePostRAScheduler(Subtarget, PassConfig.getOptLevel()))
    return false;

  TII = Subtarget.getInstrInfo();
  MachineLoopInfo &MLI = getAnalysis<MachineLoopInfoWrapperPass>().getLI();
  AliasAnalysis *AA = &getAnalysis<AAResultsWrapperPass>().getAAResults();

  // Start from the subtarget's mode; an explicit command-line value replaces
  // it.
  TargetSubtargetInfo::AntiDepBreakMode AntiDepMode =
      Subtarget.getAntiDepBreakMode();
  if (EnableAntiDepBreaking.getPosition() > 0) {
    if (EnableAntiDepBreaking == "all")
      AntiDepMode = TargetSubtargetInfo::ANTIDEP_ALL;
    else if (EnableAntiDepBreaking == "critical")
      AntiDepMode = TargetSubtargetInfo::ANTIDEP_CRITICAL;
    else
      AntiDepMode = TargetSubtargetInfo::ANTIDEP_NONE;
  }

  SmallVector<const TargetRegisterClass *, 4> CriticalPathRCs;
  Subtarget.getCriticalPathRCs(CriticalPathRCs);
  RegClassInfo.runOnMachineFunction(Fn);

  LLVM_DEBUG(dbgs() << "PostRAScheduler\n");

  SchedulePostRATDList Scheduler(Fn, MLI, AA, RegClassInfo, AntiDepMode,
                                 CriticalPathRCs);

  // Schedule and emit one region [Begin, End) of Block. EndIdx is the
  // instruction index of End counted from the top of the block.
  auto ScheduleRegion = [&Scheduler](MachineBasicBlock &Block,
                                     MachineBasicBlock::iterator Begin,
                                     MachineBasicBlock::iterator End,
                                     unsigned NumRegionInstrs,
                                     unsigned EndIdx) {
    Scheduler.enterRegion(&Block, Begin, End, NumRegionInstrs);
    Scheduler.setEndIndex(EndIdx);
    Scheduler.schedule();
    Scheduler.exitRegion();
    Scheduler.EmitSchedule();
  };

  // Visit every basic block of the function.
  for (auto &MBB : Fn) {
#ifndef NDEBUG
    // If DebugDiv > 0 then only schedule MBB with (ID % DebugDiv) == DebugMod
    if (DebugDiv > 0) {
      static int bbcnt = 0;
      if (bbcnt++ % DebugDiv != DebugMod)
        continue;
      dbgs() << "*** DEBUG scheduling " << Fn.getName() << ":"
             << printMBBReference(MBB) << " ***\n";
    }
#endif

    // Initialize register live-range state for scheduling in this block.
    Scheduler.startBlock(&MBB);

    // Walk the block from the bottom. Every run of instructions that is not
    // interrupted by a label or anything else that effectively shuts down
    // scheduling forms one region.
    MachineBasicBlock::iterator Current = MBB.end();
    unsigned Count = MBB.size(), CurrentCount = Count;
    for (MachineBasicBlock::iterator I = Current; I != MBB.begin();) {
      MachineInstr &MI = *std::prev(I);
      --Count;
      // Calls are not scheduling boundaries before register allocation, but
      // post-ra we don't gain anything by scheduling across calls since we
      // don't need to worry about register pressure.
      const bool IsBoundary =
          MI.isCall() || TII->isSchedulingBoundary(MI, &MBB, Fn);
      if (IsBoundary) {
        ScheduleRegion(MBB, I, Current, CurrentCount - Count, CurrentCount);
        Current = &MI;
        CurrentCount = Count;
        // The boundary itself is not scheduled; only record its effects.
        Scheduler.Observe(MI, CurrentCount);
      }
      I = MI;
      if (MI.isBundle())
        Count -= MI.getBundleSize();
    }
    assert(Count == 0 && "Instruction count mismatch!");
    assert((MBB.begin() == Current || CurrentCount != 0) &&
           "Instruction count mismatch!");

    // Schedule whatever is left between the top of the block and the last
    // boundary that was found.
    ScheduleRegion(MBB, MBB.begin(), Current, CurrentCount, CurrentCount);

    // Clean up register live-range state.
    Scheduler.finishBlock();

    // Update register kills
    Scheduler.fixupKills(MBB);
  }

  return true;
}


/// startBlock - Prepare for scheduling in \p BB: run the base-class setup,
/// reset the hazard recognizer and, if present, start the anti-dependency
/// breaker on the block.
void SchedulePostRATDList::startBlock(MachineBasicBlock *BB) {
  // Base-class initialization comes first.
  ScheduleDAGInstrs::startBlock(BB);

  HazardRec->Reset();

  // Nothing more to do without an anti-dependency breaker.
  if (!AntiDepBreak)
    return;
  AntiDepBreak->StartBlock(BB);
}


/// Schedule - Schedule the instruction range using list scheduling.

///

void SchedulePostRATDList::schedule() {

  // Build the scheduling graph.

  buildSchedGraph(AA);


  if (AntiDepBreak) {

    unsigned Broken =

      AntiDepBreak->BreakAntiDependencies(SUnits, RegionBegin, RegionEnd,

                                          EndIndex, DbgValues);


    if (Broken != 0) {

      // We made changes. Update the dependency graph.

      // Theoretically we could update the graph in place:

      // When a live range is changed to use a different register, remove

      // the def's anti-dependence *and* output-dependence edges due to

      // that register, and add new anti-dependence and output-dependence

      // edges based on the next live range of the register.

      ScheduleDAG::clearDAG();

      buildSchedGraph(AA);


      NumFixedAnti += Broken;

    }

  }


  postProcessDAG();


  LLVM_DEBUG(dbgs() << "********** List Scheduling **********\n");

  LLVM_DEBUG(dump());


  AvailableQueue.initNodes(SUnits);

  ListScheduleTopDown();

  AvailableQueue.releaseState();

}


/// Observe - Forward an instruction that will not be scheduled to the
/// anti-dependency breaker so that it can account for it. Does nothing when
/// no breaker is in use.
void SchedulePostRATDList::Observe(MachineInstr &MI, unsigned Count) {
  if (!AntiDepBreak)
    return;
  AntiDepBreak->Observe(MI, Count, EndIndex);
}


/// finishBlock - Let the anti-dependency breaker (if any) finish the block,
/// then run the base-class cleanup.
void SchedulePostRATDList::finishBlock() {
  if (AntiDepBreak != nullptr) {
    AntiDepBreak->FinishBlock();
  }

  // Base-class cleanup goes last.
  ScheduleDAGInstrs::finishBlock();
}


/// Apply each ScheduleDAGMutation step in order.

void SchedulePostRATDList::postProcessDAG() {

  for (auto &M : Mutations)

    M->apply(this);

}


//===----------------------------------------------------------------------===//

//  Top-Down Scheduling

//===----------------------------------------------------------------------===//


/// ReleaseSucc - Account for one scheduled predecessor of the successor
/// reached through \p SuccEdge. A weak edge only decrements WeakPredsLeft.
/// Otherwise NumPredsLeft is decremented and, once it reaches zero, the
/// successor is appended to the PendingQueue (the ExitSU node is never
/// queued).
void SchedulePostRATDList::ReleaseSucc(SUnit *SU, SDep *SuccEdge) {
  SUnit *const Succ = SuccEdge->getSUnit();

  // Weak edges are counted separately and never make a node ready.
  if (SuccEdge->isWeak()) {
    --Succ->WeakPredsLeft;
    return;
  }
#ifndef NDEBUG
  if (Succ->NumPredsLeft == 0) {
    dbgs() << "*** Scheduling failed! ***\n";
    dumpNode(*Succ);
    dbgs() << " has been released too many times!\n";
    llvm_unreachable(nullptr);
  }
#endif
  --Succ->NumPredsLeft;

  // Standard scheduler algorithms will recompute the depth of the successor
  // here as such:
  //   SuccSU->setDepthToAtLeast(SU->getDepth() + SuccEdge->getLatency());
  //
  // However, we lazily compute node depth instead. Note that
  // ScheduleNodeTopDown has already updated the depth of this node which causes
  // all descendants to be marked dirty. Setting the successor depth explicitly
  // here would cause depth to be recomputed for all its ancestors. If the
  // successor is not yet ready (because of a transitively redundant edge) then
  // this causes depth computation to be quadratic in the size of the DAG.

  // Only a node with no predecessors left is ready, and the special ExitSU
  // node is never scheduled.
  if (Succ->NumPredsLeft != 0 || Succ == &ExitSU)
    return;
  PendingQueue.push_back(Succ);
}


/// ReleaseSuccessors - Invoke ReleaseSucc for every successor edge of \p SU.
void SchedulePostRATDList::ReleaseSuccessors(SUnit *SU) {
  for (SDep &SuccEdge : SU->Succs)
    ReleaseSucc(SU, &SuccEdge);
}


/// ScheduleNodeTopDown - Append \p SU to the schedule at cycle \p CurCycle and
/// release its successors. A successor whose pending-predecessor count drops
/// to zero is placed on the PendingQueue by ReleaseSucc.
void SchedulePostRATDList::ScheduleNodeTopDown(SUnit *SU, unsigned CurCycle) {
  LLVM_DEBUG({
    dbgs() << "*** Scheduling [" << CurCycle << "]: ";
    dumpNode(*SU);
  });

  Sequence.push_back(SU);
  assert(CurCycle >= SU->getDepth() &&
         "Node scheduled above its depth!");
  // Record the issue cycle as the node's depth.
  SU->setDepthToAtLeast(CurCycle);

  ReleaseSuccessors(SU);
  SU->isScheduled = true;
  AvailableQueue.scheduledNode(SU);
}


/// emitNoop - Add a noop to the current instruction sequence: notify the
/// hazard recognizer, append a null entry to Sequence and bump the NumNoops
/// statistic. \p CurCycle is only used for the debug message.
void SchedulePostRATDList::emitNoop(unsigned CurCycle) {

  LLVM_DEBUG(dbgs() << "*** Emitting noop in cycle " << CurCycle << '\n');

  HazardRec->EmitNoop();

  Sequence.push_back(nullptr);   // A null entry in Sequence means noop

  ++NumNoops;

}


/// ListScheduleTopDown - The main loop of list scheduling for top-down

/// schedulers.

void SchedulePostRATDList::ListScheduleTopDown() {

  unsigned CurCycle = 0;


  // We're scheduling top-down but we're visiting the regions in

  // bottom-up order, so we don't know the hazards at the start of a

  // region. So assume no hazards (this should usually be ok as most

  // blocks are a single region).

  HazardRec->Reset();


  // Release any successors of the special Entry node.

  ReleaseSuccessors(&EntrySU);


  // Add all leaves to Available queue.

  for (SUnit &SUnit : SUnits) {

    // It is available if it has no predecessors.

    if (!SUnit.NumPredsLeft && !SUnit.isAvailable) {

      AvailableQueue.push(&SUnit);

      SUnit.isAvailable = true;

    }

  }


  // In any cycle where we can't schedule any instructions, we must

  // stall or emit a noop, depending on the target.

  bool CycleHasInsts = false;


  // While Available queue is not empty, grab the node with the highest

  // priority. If it is not ready put it back.  Schedule the node.

  std::vector<SUnit*> NotReady;

  Sequence.reserve(SUnits.size());

  while (!AvailableQueue.empty() || !PendingQueue.empty()) {

    // Check to see if any of the pending instructions are ready to issue.  If

    // so, add them to the available queue.

    unsigned MinDepth = ~0u;

    for (unsigned i = 0, e = PendingQueue.size(); i != e; ++i) {

      if (PendingQueue[i]->getDepth() <= CurCycle) {

        AvailableQueue.push(PendingQueue[i]);

        PendingQueue[i]->isAvailable = true;

        PendingQueue[i] = PendingQueue.back();

        PendingQueue.pop_back();

        --i; --e;

      } else if (PendingQueue[i]->getDepth() < MinDepth)

        MinDepth = PendingQueue[i]->getDepth();

    }


    LLVM_DEBUG(dbgs() << "\n*** Examining Available\n";

               AvailableQueue.dump(this));


    SUnit *FoundSUnit = nullptr, *NotPreferredSUnit = nullptr;

    bool HasNoopHazards = false;

    while (!AvailableQueue.empty()) {

      SUnit *CurSUnit = AvailableQueue.pop();


      ScheduleHazardRecognizer::HazardType HT =

        HazardRec->getHazardType(CurSUnit, 0/*no stalls*/);

      if (HT == ScheduleHazardRecognizer::NoHazard) {

        if (HazardRec->ShouldPreferAnother(CurSUnit)) {

          if (!NotPreferredSUnit) {

            // If this is the first non-preferred node for this cycle, then

            // record it and continue searching for a preferred node. If this

            // is not the first non-preferred node, then treat it as though

            // there had been a hazard.

            NotPreferredSUnit = CurSUnit;

            continue;

          }

        } else {

          FoundSUnit = CurSUnit;

          break;

        }

      }


      // Remember if this is a noop hazard.

      HasNoopHazards |= HT == ScheduleHazardRecognizer::NoopHazard;


      NotReady.push_back(CurSUnit);

    }


    // If we have a non-preferred node, push it back onto the available list.

    // If we did not find a preferred node, then schedule this first

    // non-preferred node.

    if (NotPreferredSUnit) {

      if (!FoundSUnit) {

        LLVM_DEBUG(

            dbgs() << "*** Will schedule a non-preferred instruction...\n");

        FoundSUnit = NotPreferredSUnit;

      } else {

        AvailableQueue.push(NotPreferredSUnit);

      }


      NotPreferredSUnit = nullptr;

    }


    // Add the nodes that aren't ready back onto the available list.

    if (!NotReady.empty()) {

      AvailableQueue.push_all(NotReady);

      NotReady.clear();

    }


    // If we found a node to schedule...

    if (FoundSUnit) {

      // If we need to emit noops prior to this instruction, then do so.

      unsigned NumPreNoops = HazardRec->PreEmitNoops(FoundSUnit);

      for (unsigned i = 0; i != NumPreNoops; ++i)

        emitNoop(CurCycle);


      // ... schedule the node...

      ScheduleNodeTopDown(FoundSUnit, CurCycle);

      HazardRec->EmitInstruction(FoundSUnit);

      CycleHasInsts = true;

      if (HazardRec->atIssueLimit()) {

        LLVM_DEBUG(dbgs() << "*** Max instructions per cycle " << CurCycle

                          << '\n');

        HazardRec->AdvanceCycle();

        ++CurCycle;

        CycleHasInsts = false;

      }

    } else {

      if (CycleHasInsts) {

        LLVM_DEBUG(dbgs() << "*** Finished cycle " << CurCycle << '\n');

        HazardRec->AdvanceCycle();

      } else if (!HasNoopHazards) {

        // Otherwise, we have a pipeline stall, but no other problem,

        // just advance the current cycle and try again.

        LLVM_DEBUG(dbgs() << "*** Stall in cycle " << CurCycle << '\n');

        HazardRec->AdvanceCycle();

        ++NumStalls;

      } else {

        // Otherwise, we have no instructions to issue and we have instructions

        // that will fault if we don't do this right.  This is the case for

        // processors without pipeline interlocks and other cases.

        emitNoop(CurCycle);

      }


      ++CurCycle;

      CycleHasInsts = false;

    }

  }


#ifndef NDEBUG

  unsigned ScheduledNodes = VerifyScheduledDAG(/*isBottomUp=*/false);

  unsigned Noops = llvm::count(Sequence, nullptr);

  assert(Sequence.size() - Noops == ScheduledNodes &&

         "The number of nodes scheduled doesn't match the expected number!");

#endif // NDEBUG

}


// EmitSchedule - Emit the machine code in scheduled order.

void SchedulePostRATDList::EmitSchedule() {

  RegionBegin = RegionEnd;


  // If first instruction was a DBG_VALUE then put it back.

  if (FirstDbgValue)

    BB->splice(RegionEnd, BB, FirstDbgValue);


  // Then re-insert them according to the given schedule.

  for (unsigned i = 0, e = Sequence.size(); i != e; i++) {

    if (SUnit *SU = Sequence[i])

      BB->splice(RegionEnd, BB, SU->getInstr());

    else

      // Null SUnit* is a noop.

      TII->insertNoop(*BB, RegionEnd);


    // Update the Begin iterator, as the first instruction in the block

    // may have been scheduled later.

    if (i == 0)

      RegionBegin = std::prev(RegionEnd);

  }


  // Reinsert any remaining debug_values.

  for (std::vector<std::pair<MachineInstr *, MachineInstr *> >::iterator

         DI = DbgValues.end(), DE = DbgValues.begin(); DI != DE; --DI) {

    std::pair<MachineInstr *, MachineInstr *> P = *std::prev(DI);

    MachineInstr *DbgValue = P.first;

    MachineBasicBlock::iterator OrigPrivMI = P.second;

    BB->splice(++OrigPrivMI, BB, DbgValue);

  }

  DbgValues.clear();

  FirstDbgValue = nullptr;

}

MRI
unsigned const MachineRegisterInfo * MRI
Definition: AArch64AdvSIMDScalarPass.cpp:105

const
aarch64 promote const
Definition: AArch64PromoteConstant.cpp:230

MBB
MachineBasicBlock & MBB
Definition: ARMSLSHardening.cpp:71

AliasAnalysis.h

AntiDepBreaker.h

CommandLine.h

LLVM_DUMP_METHOD
#define LLVM_DUMP_METHOD
Mark debug helper function definitions like dump() that should not be stripped from debug builds.
Definition: Compiler.h:622

Debug.h

LLVM_DEBUG
#define LLVM_DEBUG(...)
Definition: Debug.h:106

TII
const HexagonInstrInfo * TII
Definition: HexagonCopyToCombine.cpp:125

MI
IRTranslator LLVM IR MI
Definition: IRTranslator.cpp:112

InitializePasses.h

LatencyPriorityQueue.h

I
#define I(x, y, z)
Definition: MD5.cpp:58

MachineDominators.h

MachineFunctionPass.h

MachineLoopInfo.h

MachineRegisterInfo.h

Scheduler
Machine Instruction Scheduler
Definition: MachineScheduler.cpp:274

P
#define P(N)

INITIALIZE_PASS
#define INITIALIZE_PASS(passName, arg, name, cfg, analysis)
Definition: PassSupport.h:38

Pass.h

DebugDiv
static cl::opt< int > DebugDiv("postra-sched-debugdiv", cl::desc("Debug control MBBs that are scheduled"), cl::init(0), cl::Hidden)

EnablePostRAScheduler
static cl::opt< bool > EnablePostRAScheduler("post-RA-scheduler", cl::desc("Enable scheduling after register allocation"), cl::init(false), cl::Hidden)

EnableAntiDepBreaking
static cl::opt< std::string > EnableAntiDepBreaking("break-anti-dependencies", cl::desc("Break post-RA scheduling anti-dependencies: " "\"critical\", \"all\", or \"none\""), cl::init("none"), cl::Hidden)

enablePostRAScheduler
static bool enablePostRAScheduler(const TargetSubtargetInfo &ST, CodeGenOptLevel OptLevel)
Definition: PostRASchedulerList.cpp:256

DEBUG_TYPE
#define DEBUG_TYPE
Definition: PostRASchedulerList.cpp:44

DebugMod
static cl::opt< int > DebugMod("postra-sched-debugmod", cl::desc("Debug control MBBs that are scheduled"), cl::init(0), cl::Hidden)

RegisterClassInfo.h

assert
assert(ImpDefSCC.getReg()==AMDGPU::SCC &&ImpDefSCC.isDef())

ScheduleDAGInstrs.h

ScheduleDAGMutation.h

ScheduleHazardRecognizer.h

Statistic.h
This file defines the 'Statistic' class, which is designed to be an easy way to expose various metric...

STATISTIC
#define STATISTIC(VARNAME, DESC)
Definition: Statistic.h:166

TargetInstrInfo.h

TargetPassConfig.h
Target-Independent Code Generator Pass Configuration Options pass.

TargetSubtargetInfo.h

LiveDebugValues::DbgValue
Class recording the (high level) value of a variable.
Definition: InstrRefBasedImpl.h:512

llvm::AAResultsWrapperPass
A wrapper pass to provide the legacy pass manager access to a suitably prepared AAResults object.
Definition: AliasAnalysis.h:981

llvm::AAResults
Definition: AliasAnalysis.h:314

llvm::AnalysisUsage
Represent the analysis usage information of a pass.
Definition: PassAnalysisSupport.h:47

llvm::AnalysisUsage::addRequired
AnalysisUsage & addRequired()
Definition: PassAnalysisSupport.h:75

llvm::AnalysisUsage::addPreserved
AnalysisUsage & addPreserved()
Add the specified Pass class to the set of analyses preserved by this pass.
Definition: PassAnalysisSupport.h:98

llvm::AnalysisUsage::setPreservesCFG
void setPreservesCFG()
This function should be called by the pass, iff they do not:
Definition: Pass.cpp:256

llvm::AntiDepBreaker
This class works in conjunction with the post-RA scheduler to rename registers to break register anti...
Definition: AntiDepBreaker.h:31

llvm::AntiDepBreaker::~AntiDepBreaker
virtual ~AntiDepBreaker()

llvm::HexagonInstrInfo::insertNoop
void insertNoop(MachineBasicBlock &MBB, MachineBasicBlock::iterator MI) const override
Insert a noop into the instruction stream at the specified point.
Definition: HexagonInstrInfo.cpp:1652

llvm::HexagonInstrInfo::isSchedulingBoundary
bool isSchedulingBoundary(const MachineInstr &MI, const MachineBasicBlock *MBB, const MachineFunction &MF) const override
Test if the given instruction should be considered a scheduling boundary.
Definition: HexagonInstrInfo.cpp:1796

llvm::InstrItineraryData
Itinerary data supplied by a subtarget to be used by a target.
Definition: MCInstrItineraries.h:110

llvm::LatencyPriorityQueue
Definition: LatencyPriorityQueue.h:32

llvm::MachineBasicBlock
Definition: MachineBasicBlock.h:125

llvm::MachineBasicBlock::begin
iterator begin()
Definition: MachineBasicBlock.h:355

llvm::MachineBasicBlock::end
iterator end()
Definition: MachineBasicBlock.h:357

llvm::MachineBasicBlock::size
unsigned size() const
Definition: MachineBasicBlock.h:325

llvm::MachineBasicBlock::splice
void splice(iterator Where, MachineBasicBlock *Other, iterator From)
Take an instruction from MBB 'Other' at the position From, and insert it into this MBB right before '...
Definition: MachineBasicBlock.h:1109

llvm::MachineDominatorTreeWrapperPass
Analysis pass which computes a MachineDominatorTree.
Definition: MachineDominators.h:131

llvm::MachineFunctionPass
MachineFunctionPass - This class adapts the FunctionPass interface to allow convenient creation of pa...
Definition: MachineFunctionPass.h:30

llvm::MachineFunctionPass::getAnalysisUsage
void getAnalysisUsage(AnalysisUsage &AU) const override
getAnalysisUsage - Subclasses that override getAnalysisUsage must call this.
Definition: MachineFunctionPass.cpp:169

llvm::MachineFunctionPass::runOnMachineFunction
virtual bool runOnMachineFunction(MachineFunction &MF)=0
runOnMachineFunction - This method must be overloaded to perform the desired machine code transformat...

llvm::MachineFunctionPass::getRequiredProperties
virtual MachineFunctionProperties getRequiredProperties() const
Definition: MachineFunctionPass.h:56

llvm::MachineFunctionProperties
Properties which a MachineFunction may have at a given point in time.
Definition: MachineFunction.h:137

llvm::MachineFunctionProperties::set
MachineFunctionProperties & set(Property P)
Definition: MachineFunction.h:207

llvm::MachineFunction
Definition: MachineFunction.h:267

llvm::MachineFunction::getSubtarget
const TargetSubtargetInfo & getSubtarget() const
getSubtarget - Return the subtarget for which this machine code is being compiled.
Definition: MachineFunction.h:733

llvm::MachineFunction::getFunction
Function & getFunction()
Return the LLVM function that this machine code represents.
Definition: MachineFunction.h:704

llvm::MachineInstrBundleIterator< MachineInstr >

llvm::MachineInstr
Representation of each machine instruction.
Definition: MachineInstr.h:71

llvm::MachineLoopInfoWrapperPass
Definition: MachineLoopInfo.h:156

llvm::MachineLoopInfo
Definition: MachineLoopInfo.h:105

llvm::RegisterClassInfo
Definition: RegisterClassInfo.h:29

llvm::RegisterClassInfo::runOnMachineFunction
void runOnMachineFunction(const MachineFunction &MF)
runOnFunction - Prepare to answer questions about MF.
Definition: RegisterClassInfo.cpp:42

llvm::SDep
Scheduling dependency.
Definition: ScheduleDAG.h:49

llvm::SDep::getSUnit
SUnit * getSUnit() const
Definition: ScheduleDAG.h:498

llvm::SDep::isWeak
bool isWeak() const
Tests if this a weak dependence.
Definition: ScheduleDAG.h:194

llvm::SUnit
Scheduling unit. This is a node in the scheduling DAG.
Definition: ScheduleDAG.h:242

llvm::SUnit::getDepth
unsigned getDepth() const
Returns the depth of this node, which is the length of the maximum path up to any node which has no predecessors.
Definition: ScheduleDAG.h:416

llvm::SUnit::isScheduled
bool isScheduled
True once scheduled.
Definition: ScheduleDAG.h:296

llvm::SUnit::isAvailable
bool isAvailable
True once available.
Definition: ScheduleDAG.h:295

llvm::SUnit::NumPredsLeft
unsigned NumPredsLeft
Definition: ScheduleDAG.h:274

llvm::SUnit::Succs
SmallVector< SDep, 4 > Succs
All sunit successors.
Definition: ScheduleDAG.h:263

llvm::SUnit::WeakPredsLeft
unsigned WeakPredsLeft
Definition: ScheduleDAG.h:276

llvm::SUnit::succ_iterator
SmallVectorImpl< SDep >::iterator succ_iterator
Definition: ScheduleDAG.h:266

llvm::SUnit::setDepthToAtLeast
void setDepthToAtLeast(unsigned NewDepth)
If NewDepth is greater than this node's depth value, sets it to be the new depth value.
Definition: ScheduleDAG.cpp:247

llvm::SUnit::getInstr
MachineInstr * getInstr() const
Returns the representative MachineInstr for this SUnit.
Definition: ScheduleDAG.h:390

llvm::ScheduleDAGInstrs
A ScheduleDAG for scheduling lists of MachineInstr.
Definition: ScheduleDAGInstrs.h:115

llvm::ScheduleDAGInstrs::finishBlock
virtual void finishBlock()
Cleans up after scheduling in the given block.
Definition: ScheduleDAGInstrs.cpp:185

llvm::ScheduleDAGInstrs::startBlock
virtual void startBlock(MachineBasicBlock *BB)
Prepares to perform scheduling in the given block.
Definition: ScheduleDAGInstrs.cpp:181

llvm::ScheduleDAGInstrs::exitRegion
virtual void exitRegion()
Called when the scheduler has finished scheduling the current region.
Definition: ScheduleDAGInstrs.cpp:200

llvm::ScheduleDAGInstrs::schedule
virtual void schedule()=0
Orders nodes according to selected style.

llvm::ScheduleDAGInstrs::enterRegion
virtual void enterRegion(MachineBasicBlock *bb, MachineBasicBlock::iterator begin, MachineBasicBlock::iterator end, unsigned regioninstrs)
Initialize the DAG and common scheduler state for a new scheduling region.
Definition: ScheduleDAGInstrs.cpp:190

llvm::ScheduleDAG::clearDAG
void clearDAG()
Clears the DAG state (between regions).
Definition: ScheduleDAG.cpp:63

llvm::ScheduleHazardRecognizer
HazardRecognizer - This determines whether or not an instruction can be issued this cycle,...
Definition: ScheduleHazardRecognizer.h:25

llvm::ScheduleHazardRecognizer::HazardType
HazardType
Definition: ScheduleHazardRecognizer.h:37

llvm::ScheduleHazardRecognizer::NoHazard
@ NoHazard
Definition: ScheduleHazardRecognizer.h:38

llvm::ScheduleHazardRecognizer::NoopHazard
@ NoopHazard
Definition: ScheduleHazardRecognizer.h:40

llvm::SmallVectorImpl
This class consists of common code factored out of the SmallVector class to reduce code duplication b...
Definition: SmallVector.h:573

llvm::SmallVector
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
Definition: SmallVector.h:1196

llvm::TargetInstrInfo
TargetInstrInfo - Interface to description of machine instruction set.
Definition: TargetInstrInfo.h:112

llvm::TargetPassConfig
Target-Independent Code Generator Pass Configuration Options.
Definition: TargetPassConfig.h:85

llvm::TargetPassConfig::getOptLevel
CodeGenOptLevel getOptLevel() const
Definition: TargetPassConfig.cpp:611

llvm::TargetRegisterClass
Definition: TargetRegisterInfo.h:44

llvm::TargetSubtargetInfo
TargetSubtargetInfo - Generic base class for all target subtargets.
Definition: TargetSubtargetInfo.h:63

llvm::TargetSubtargetInfo::AntiDepBreakMode
enum { ANTIDEP_NONE, ANTIDEP_CRITICAL, ANTIDEP_ALL } AntiDepBreakMode
Definition: TargetSubtargetInfo.h:77

llvm::cl::Option::getPosition
unsigned getPosition() const
Definition: CommandLine.h:306

llvm::cl::opt
Definition: CommandLine.h:1423

unsigned

ErrorHandling.h

llvm_unreachable
#define llvm_unreachable(msg)
Marks that the current location is not supposed to be reachable.
Definition: ErrorHandling.h:143

llvm::ARM::ProfileKind::M
@ M

llvm::CallingConv::ID
unsigned ID
LLVM IR allows arbitrary numbers to be used as calling convention identifiers.
Definition: CallingConv.h:24

llvm::M68k::MemAddrModeKind::u
@ u

llvm::cl::Hidden
@ Hidden
Definition: CommandLine.h:137

llvm::cl::init
initializer< Ty > init(const Ty &Val)
Definition: CommandLine.h:443

llvm::numbers::e
constexpr double e
Definition: MathExtras.h:48

llvm::objcarc::Sequence
Sequence
A sequence of states that a pointer may go through in which an objc_retain and objc_release are actua...
Definition: PtrState.h:41

llvm
This is an optimization pass for GlobalISel generic memory operations.
Definition: AddressRanges.h:18

llvm::dump
void dump(const SparseBitVector< ElementSize > &LHS, raw_ostream &out)
Definition: SparseBitVector.h:877

llvm::createAggressiveAntiDepBreaker
AntiDepBreaker * createAggressiveAntiDepBreaker(MachineFunction &MFi, const RegisterClassInfo &RCI, TargetSubtargetInfo::RegClassVector &CriticalPathRCs)
Definition: AggressiveAntiDepBreaker.cpp:962

llvm::PostRASchedulerID
char & PostRASchedulerID
PostRAScheduler - This pass performs post register allocation scheduling.
Definition: PostRASchedulerList.cpp:191

llvm::dbgs
raw_ostream & dbgs()
dbgs() - This returns a reference to a raw_ostream for debugging messages.
Definition: Debug.cpp:163

llvm::CodeGenOptLevel
CodeGenOptLevel
Code generation optimization level.
Definition: CodeGen.h:54

llvm::count
auto count(R &&Range, const E &Element)
Wrapper function around std::count to count the number of times an element Element occurs in the given range.
Definition: STLExtras.h:1938

llvm::createCriticalAntiDepBreaker
AntiDepBreaker * createCriticalAntiDepBreaker(MachineFunction &MFi, const RegisterClassInfo &RCI)
Definition: CriticalAntiDepBreaker.cpp:695

llvm::printMBBReference
Printable printMBBReference(const MachineBasicBlock &MBB)
Prints a machine basic block reference.
Definition: MachineBasicBlock.cpp:122

raw_ostream.h

llvm::cl::desc
Definition: CommandLine.h:409