Bug Summary

File: llvm/lib/CodeGen/MachineScheduler.cpp
Warning: line 3629, column 12
Access to field 'isScheduled' results in a dereference of a null pointer (loaded from variable 'SU')
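
The diagnostic concerns the value returned by the scheduling strategy's pickNode(), which returns nullptr once the ready queues are exhausted, so every dereference of the returned SUnit must be dominated by a null check. The main scheduling loops in this file already follow that shape (see ScheduleDAGMI::schedule, source lines 790-798 below); the report at line 3629 marks a path on which the analyzer cannot prove that an equivalent guard dominates the SU->isScheduled access. A condensed sketch of the guarded pattern, with names taken from the code below (the loop body is illustrative, not the exact code at line 3629):

  bool IsTopNode = false;
  while (true) {
    // pickNode() signals completion by returning nullptr.
    SUnit *SU = SchedImpl->pickNode(IsTopNode);
    if (!SU)
      break; // guard: SU is never dereferenced on the null path
    assert(!SU->isScheduled && "Node already scheduled");
    // ... move SU's instruction and update the ready queues ...
  }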

Annotated Source Code

clang -cc1 -cc1 -triple x86_64-pc-linux-gnu -analyze -disable-free -disable-llvm-verifier -discard-value-names -main-file-name MachineScheduler.cpp -analyzer-store=region -analyzer-opt-analyze-nested-blocks -analyzer-checker=core -analyzer-checker=apiModeling -analyzer-checker=unix -analyzer-checker=deadcode -analyzer-checker=cplusplus -analyzer-checker=security.insecureAPI.UncheckedReturn -analyzer-checker=security.insecureAPI.getpw -analyzer-checker=security.insecureAPI.gets -analyzer-checker=security.insecureAPI.mktemp -analyzer-checker=security.insecureAPI.mkstemp -analyzer-checker=security.insecureAPI.vfork -analyzer-checker=nullability.NullPassedToNonnull -analyzer-checker=nullability.NullReturnedFromNonnull -analyzer-output plist -w -setup-static-analyzer -analyzer-config-compatibility-mode=true -mrelocation-model pic -pic-level 2 -mframe-pointer=none -fmath-errno -fno-rounding-math -mconstructor-aliases -munwind-tables -target-cpu x86-64 -tune-cpu generic -debugger-tuning=gdb -ffunction-sections -fdata-sections -fcoverage-compilation-dir=/build/llvm-toolchain-snapshot-14~++20210903100615+fd66b44ec19e/build-llvm/lib/CodeGen -resource-dir /usr/lib/llvm-14/lib/clang/14.0.0 -D _GNU_SOURCE -D __STDC_CONSTANT_MACROS -D __STDC_FORMAT_MACROS -D __STDC_LIMIT_MACROS -I /build/llvm-toolchain-snapshot-14~++20210903100615+fd66b44ec19e/build-llvm/lib/CodeGen -I /build/llvm-toolchain-snapshot-14~++20210903100615+fd66b44ec19e/llvm/lib/CodeGen -I /build/llvm-toolchain-snapshot-14~++20210903100615+fd66b44ec19e/build-llvm/include -I /build/llvm-toolchain-snapshot-14~++20210903100615+fd66b44ec19e/llvm/include -D NDEBUG -internal-isystem /usr/lib/gcc/x86_64-linux-gnu/10/../../../../include/c++/10 -internal-isystem /usr/lib/gcc/x86_64-linux-gnu/10/../../../../include/x86_64-linux-gnu/c++/10 -internal-isystem /usr/lib/gcc/x86_64-linux-gnu/10/../../../../include/c++/10/backward -internal-isystem /usr/lib/llvm-14/lib/clang/14.0.0/include -internal-isystem /usr/local/include -internal-isystem /usr/lib/gcc/x86_64-linux-gnu/10/../../../../x86_64-linux-gnu/include -internal-externc-isystem /usr/include/x86_64-linux-gnu -internal-externc-isystem /include -internal-externc-isystem /usr/include -O2 -Wno-unused-parameter -Wwrite-strings -Wno-missing-field-initializers -Wno-long-long -Wno-maybe-uninitialized -Wno-class-memaccess -Wno-redundant-move -Wno-pessimizing-move -Wno-noexcept-type -Wno-comment -std=c++14 -fdeprecated-macro -fdebug-compilation-dir=/build/llvm-toolchain-snapshot-14~++20210903100615+fd66b44ec19e/build-llvm/lib/CodeGen -fdebug-prefix-map=/build/llvm-toolchain-snapshot-14~++20210903100615+fd66b44ec19e=. -ferror-limit 19 -fvisibility-inlines-hidden -stack-protector 2 -fgnuc-version=4.2.1 -vectorize-loops -vectorize-slp -analyzer-output=html -analyzer-config stable-report-filename=true -faddrsig -D__GCC_HAVE_DWARF2_CFI_ASM=1 -o /tmp/scan-build-2021-09-04-040900-46481-1 -x c++ /build/llvm-toolchain-snapshot-14~++20210903100615+fd66b44ec19e/llvm/lib/CodeGen/MachineScheduler.cpp

/build/llvm-toolchain-snapshot-14~++20210903100615+fd66b44ec19e/llvm/lib/CodeGen/MachineScheduler.cpp

1//===- MachineScheduler.cpp - Machine Instruction Scheduler ---------------===//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8//
9// MachineScheduler schedules machine instructions after phi elimination. It
10// preserves LiveIntervals so it can be invoked before register allocation.
11//
12//===----------------------------------------------------------------------===//
13
14#include "llvm/CodeGen/MachineScheduler.h"
15#include "llvm/ADT/ArrayRef.h"
16#include "llvm/ADT/BitVector.h"
17#include "llvm/ADT/DenseMap.h"
18#include "llvm/ADT/PriorityQueue.h"
19#include "llvm/ADT/STLExtras.h"
20#include "llvm/ADT/SmallVector.h"
21#include "llvm/ADT/Statistic.h"
22#include "llvm/ADT/iterator_range.h"
23#include "llvm/Analysis/AliasAnalysis.h"
24#include "llvm/CodeGen/LiveInterval.h"
25#include "llvm/CodeGen/LiveIntervals.h"
26#include "llvm/CodeGen/MachineBasicBlock.h"
27#include "llvm/CodeGen/MachineDominators.h"
28#include "llvm/CodeGen/MachineFunction.h"
29#include "llvm/CodeGen/MachineFunctionPass.h"
30#include "llvm/CodeGen/MachineInstr.h"
31#include "llvm/CodeGen/MachineLoopInfo.h"
32#include "llvm/CodeGen/MachineOperand.h"
33#include "llvm/CodeGen/MachinePassRegistry.h"
34#include "llvm/CodeGen/MachineRegisterInfo.h"
35#include "llvm/CodeGen/Passes.h"
36#include "llvm/CodeGen/RegisterClassInfo.h"
37#include "llvm/CodeGen/RegisterPressure.h"
38#include "llvm/CodeGen/ScheduleDAG.h"
39#include "llvm/CodeGen/ScheduleDAGInstrs.h"
40#include "llvm/CodeGen/ScheduleDAGMutation.h"
41#include "llvm/CodeGen/ScheduleDFS.h"
42#include "llvm/CodeGen/ScheduleHazardRecognizer.h"
43#include "llvm/CodeGen/SlotIndexes.h"
44#include "llvm/CodeGen/TargetFrameLowering.h"
45#include "llvm/CodeGen/TargetInstrInfo.h"
46#include "llvm/CodeGen/TargetLowering.h"
47#include "llvm/CodeGen/TargetPassConfig.h"
48#include "llvm/CodeGen/TargetRegisterInfo.h"
49#include "llvm/CodeGen/TargetSchedule.h"
50#include "llvm/CodeGen/TargetSubtargetInfo.h"
51#include "llvm/Config/llvm-config.h"
52#include "llvm/InitializePasses.h"
53#include "llvm/MC/LaneBitmask.h"
54#include "llvm/Pass.h"
55#include "llvm/Support/CommandLine.h"
56#include "llvm/Support/Compiler.h"
57#include "llvm/Support/Debug.h"
58#include "llvm/Support/ErrorHandling.h"
59#include "llvm/Support/GraphWriter.h"
60#include "llvm/Support/MachineValueType.h"
61#include "llvm/Support/raw_ostream.h"
62#include <algorithm>
63#include <cassert>
64#include <cstdint>
65#include <iterator>
66#include <limits>
67#include <memory>
68#include <string>
69#include <tuple>
70#include <utility>
71#include <vector>
72
73using namespace llvm;
74
75#define DEBUG_TYPE "machine-scheduler"
76
77STATISTIC(NumClustered, "Number of load/store pairs clustered");
78
79namespace llvm {
80
81cl::opt<bool> ForceTopDown("misched-topdown", cl::Hidden,
82 cl::desc("Force top-down list scheduling"));
83cl::opt<bool> ForceBottomUp("misched-bottomup", cl::Hidden,
84 cl::desc("Force bottom-up list scheduling"));
85cl::opt<bool>
86DumpCriticalPathLength("misched-dcpl", cl::Hidden,
87 cl::desc("Print critical path length to stdout"));
88
89cl::opt<bool> VerifyScheduling(
90 "verify-misched", cl::Hidden,
91 cl::desc("Verify machine instrs before and after machine scheduling"));
92
93} // end namespace llvm
94
95#ifndef NDEBUG
96static cl::opt<bool> ViewMISchedDAGs("view-misched-dags", cl::Hidden,
97 cl::desc("Pop up a window to show MISched dags after they are processed"));
98
99/// In some situations a few uninteresting nodes depend on nearly all other
100/// nodes in the graph, provide a cutoff to hide them.
101static cl::opt<unsigned> ViewMISchedCutoff("view-misched-cutoff", cl::Hidden,
102 cl::desc("Hide nodes with more predecessors/successors than the cutoff"));
103
104static cl::opt<unsigned> MISchedCutoff("misched-cutoff", cl::Hidden,
105 cl::desc("Stop scheduling after N instructions"), cl::init(~0U));
106
107static cl::opt<std::string> SchedOnlyFunc("misched-only-func", cl::Hidden,
108 cl::desc("Only schedule this function"));
109static cl::opt<unsigned> SchedOnlyBlock("misched-only-block", cl::Hidden,
110 cl::desc("Only schedule this MBB#"));
111static cl::opt<bool> PrintDAGs("misched-print-dags", cl::Hidden,
112 cl::desc("Print schedule DAGs"));
113#else
114static const bool ViewMISchedDAGs = false;
115static const bool PrintDAGs = false;
116#endif // NDEBUG
117
118/// Avoid quadratic complexity in unusually large basic blocks by limiting the
119/// size of the ready lists.
120static cl::opt<unsigned> ReadyListLimit("misched-limit", cl::Hidden,
121 cl::desc("Limit ready list to N instructions"), cl::init(256));
122
123static cl::opt<bool> EnableRegPressure("misched-regpressure", cl::Hidden,
124 cl::desc("Enable register pressure scheduling."), cl::init(true));
125
126static cl::opt<bool> EnableCyclicPath("misched-cyclicpath", cl::Hidden,
127 cl::desc("Enable cyclic critical path analysis."), cl::init(true));
128
129static cl::opt<bool> EnableMemOpCluster("misched-cluster", cl::Hidden,
130 cl::desc("Enable memop clustering."),
131 cl::init(true));
132static cl::opt<bool>
133 ForceFastCluster("force-fast-cluster", cl::Hidden,
134 cl::desc("Switch to fast cluster algorithm with the loss "
135 "of some fusion opportunities"),
136 cl::init(false));
137static cl::opt<unsigned>
138 FastClusterThreshold("fast-cluster-threshold", cl::Hidden,
139 cl::desc("The threshold for fast cluster"),
140 cl::init(1000));
141
142// DAG subtrees must have at least this many nodes.
143static const unsigned MinSubtreeSize = 8;
144
145// Pin the vtables to this file.
146void MachineSchedStrategy::anchor() {}
147
148void ScheduleDAGMutation::anchor() {}
149
150//===----------------------------------------------------------------------===//
151// Machine Instruction Scheduling Pass and Registry
152//===----------------------------------------------------------------------===//
153
154MachineSchedContext::MachineSchedContext() {
155 RegClassInfo = new RegisterClassInfo();
156}
157
158MachineSchedContext::~MachineSchedContext() {
159 delete RegClassInfo;
160}
161
162namespace {
163
164/// Base class for a machine scheduler class that can run at any point.
165class MachineSchedulerBase : public MachineSchedContext,
166 public MachineFunctionPass {
167public:
168 MachineSchedulerBase(char &ID): MachineFunctionPass(ID) {}
169
170 void print(raw_ostream &O, const Module* = nullptr) const override;
171
172protected:
173 void scheduleRegions(ScheduleDAGInstrs &Scheduler, bool FixKillFlags);
174};
175
176/// MachineScheduler runs after coalescing and before register allocation.
177class MachineScheduler : public MachineSchedulerBase {
178public:
179 MachineScheduler();
180
181 void getAnalysisUsage(AnalysisUsage &AU) const override;
182
183 bool runOnMachineFunction(MachineFunction&) override;
184
185 static char ID; // Class identification, replacement for typeinfo
186
187protected:
188 ScheduleDAGInstrs *createMachineScheduler();
189};
190
191/// PostMachineScheduler runs shortly before code emission.
192class PostMachineScheduler : public MachineSchedulerBase {
193public:
194 PostMachineScheduler();
195
196 void getAnalysisUsage(AnalysisUsage &AU) const override;
197
198 bool runOnMachineFunction(MachineFunction&) override;
199
200 static char ID; // Class identification, replacement for typeinfo
201
202protected:
203 ScheduleDAGInstrs *createPostMachineScheduler();
204};
205
206} // end anonymous namespace
207
208char MachineScheduler::ID = 0;
209
210char &llvm::MachineSchedulerID = MachineScheduler::ID;
211
212INITIALIZE_PASS_BEGIN(MachineScheduler, DEBUG_TYPE,
213 "Machine Instruction Scheduler", false, false)
214INITIALIZE_PASS_DEPENDENCY(AAResultsWrapperPass)
215INITIALIZE_PASS_DEPENDENCY(MachineDominatorTree)
216INITIALIZE_PASS_DEPENDENCY(MachineLoopInfo)
217INITIALIZE_PASS_DEPENDENCY(SlotIndexes)
218INITIALIZE_PASS_DEPENDENCY(LiveIntervals)
219INITIALIZE_PASS_END(MachineScheduler, DEBUG_TYPE,
220 "Machine Instruction Scheduler", false, false)
221
222MachineScheduler::MachineScheduler() : MachineSchedulerBase(ID) {
223 initializeMachineSchedulerPass(*PassRegistry::getPassRegistry());
224}
225
226void MachineScheduler::getAnalysisUsage(AnalysisUsage &AU) const {
227 AU.setPreservesCFG();
228 AU.addRequired<MachineDominatorTree>();
229 AU.addRequired<MachineLoopInfo>();
230 AU.addRequired<AAResultsWrapperPass>();
231 AU.addRequired<TargetPassConfig>();
232 AU.addRequired<SlotIndexes>();
233 AU.addPreserved<SlotIndexes>();
234 AU.addRequired<LiveIntervals>();
235 AU.addPreserved<LiveIntervals>();
236 MachineFunctionPass::getAnalysisUsage(AU);
237}
238
239char PostMachineScheduler::ID = 0;
240
241char &llvm::PostMachineSchedulerID = PostMachineScheduler::ID;
242
243INITIALIZE_PASS_BEGIN(PostMachineScheduler, "postmisched",
244 "PostRA Machine Instruction Scheduler", false, false)
245INITIALIZE_PASS_DEPENDENCY(MachineDominatorTree)
246INITIALIZE_PASS_DEPENDENCY(MachineLoopInfo)
247INITIALIZE_PASS_DEPENDENCY(AAResultsWrapperPass)
248INITIALIZE_PASS_END(PostMachineScheduler, "postmisched",
249 "PostRA Machine Instruction Scheduler", false, false)
250
251PostMachineScheduler::PostMachineScheduler() : MachineSchedulerBase(ID) {
252 initializePostMachineSchedulerPass(*PassRegistry::getPassRegistry());
253}
254
255void PostMachineScheduler::getAnalysisUsage(AnalysisUsage &AU) const {
256 AU.setPreservesCFG();
257 AU.addRequired<MachineDominatorTree>();
258 AU.addRequired<MachineLoopInfo>();
259 AU.addRequired<AAResultsWrapperPass>();
260 AU.addRequired<TargetPassConfig>();
261 MachineFunctionPass::getAnalysisUsage(AU);
262}
263
264MachinePassRegistry<MachineSchedRegistry::ScheduleDAGCtor>
265 MachineSchedRegistry::Registry;
266
267/// A dummy default scheduler factory indicates whether the scheduler
268/// is overridden on the command line.
269static ScheduleDAGInstrs *useDefaultMachineSched(MachineSchedContext *C) {
270 return nullptr;
271}
272
273/// MachineSchedOpt allows command line selection of the scheduler.
274static cl::opt<MachineSchedRegistry::ScheduleDAGCtor, false,
275 RegisterPassParser<MachineSchedRegistry>>
276MachineSchedOpt("misched",
277 cl::init(&useDefaultMachineSched), cl::Hidden,
278 cl::desc("Machine instruction scheduler to use"));
279
280static MachineSchedRegistry
281DefaultSchedRegistry("default", "Use the target's default scheduler choice.",
282 useDefaultMachineSched);
283
284static cl::opt<bool> EnableMachineSched(
285 "enable-misched",
286 cl::desc("Enable the machine instruction scheduling pass."), cl::init(true),
287 cl::Hidden);
288
289static cl::opt<bool> EnablePostRAMachineSched(
290 "enable-post-misched",
291 cl::desc("Enable the post-ra machine instruction scheduling pass."),
292 cl::init(true), cl::Hidden);
293
294/// Decrement this iterator until reaching the top or a non-debug instr.
295static MachineBasicBlock::const_iterator
296priorNonDebug(MachineBasicBlock::const_iterator I,
297 MachineBasicBlock::const_iterator Beg) {
298 assert(I != Beg && "reached the top of the region, cannot decrement");
299 while (--I != Beg) {
300 if (!I->isDebugOrPseudoInstr())
301 break;
302 }
303 return I;
304}
305
306/// Non-const version.
307static MachineBasicBlock::iterator
308priorNonDebug(MachineBasicBlock::iterator I,
309 MachineBasicBlock::const_iterator Beg) {
310 return priorNonDebug(MachineBasicBlock::const_iterator(I), Beg)
311 .getNonConstIterator();
312}
313
314/// If this iterator is a debug value, increment until reaching the End or a
315/// non-debug instruction.
316static MachineBasicBlock::const_iterator
317nextIfDebug(MachineBasicBlock::const_iterator I,
318 MachineBasicBlock::const_iterator End) {
319 for(; I != End; ++I) {
320 if (!I->isDebugOrPseudoInstr())
321 break;
322 }
323 return I;
324}
325
326/// Non-const version.
327static MachineBasicBlock::iterator
328nextIfDebug(MachineBasicBlock::iterator I,
329 MachineBasicBlock::const_iterator End) {
330 return nextIfDebug(MachineBasicBlock::const_iterator(I), End)
331 .getNonConstIterator();
332}
333
334/// Instantiate a ScheduleDAGInstrs that will be owned by the caller.
335ScheduleDAGInstrs *MachineScheduler::createMachineScheduler() {
336 // Select the scheduler, or set the default.
337 MachineSchedRegistry::ScheduleDAGCtor Ctor = MachineSchedOpt;
338 if (Ctor != useDefaultMachineSched)
339 return Ctor(this);
340
341 // Get the default scheduler set by the target for this function.
342 ScheduleDAGInstrs *Scheduler = PassConfig->createMachineScheduler(this);
343 if (Scheduler)
344 return Scheduler;
345
346 // Default to GenericScheduler.
347 return createGenericSchedLive(this);
348}
349
350/// Instantiate a ScheduleDAGInstrs for PostRA scheduling that will be owned by
351/// the caller. We don't have a command line option to override the postRA
352/// scheduler. The Target must configure it.
353ScheduleDAGInstrs *PostMachineScheduler::createPostMachineScheduler() {
354 // Get the postRA scheduler set by the target for this function.
355 ScheduleDAGInstrs *Scheduler = PassConfig->createPostMachineScheduler(this);
356 if (Scheduler)
357 return Scheduler;
358
359 // Default to GenericScheduler.
360 return createGenericSchedPostRA(this);
361}
362
363/// Top-level MachineScheduler pass driver.
364///
365/// Visit blocks in function order. Divide each block into scheduling regions
366/// and visit them bottom-up. Visiting regions bottom-up is not required, but is
367/// consistent with the DAG builder, which traverses the interior of the
368/// scheduling regions bottom-up.
369///
370/// This design avoids exposing scheduling boundaries to the DAG builder,
371/// simplifying the DAG builder's support for "special" target instructions.
372/// At the same time the design allows target schedulers to operate across
373/// scheduling boundaries, for example to bundle the boundary instructions
374/// without reordering them. This creates complexity, because the target
375/// scheduler must update the RegionBegin and RegionEnd positions cached by
376/// ScheduleDAGInstrs whenever adding or removing instructions. A much simpler
377/// design would be to split blocks at scheduling boundaries, but LLVM has a
378/// general bias against block splitting purely for implementation simplicity.
379bool MachineScheduler::runOnMachineFunction(MachineFunction &mf) {
380 if (skipFunction(mf.getFunction()))
381 return false;
382
383 if (EnableMachineSched.getNumOccurrences()) {
384 if (!EnableMachineSched)
385 return false;
386 } else if (!mf.getSubtarget().enableMachineScheduler())
387 return false;
388
389 LLVM_DEBUG(dbgs() << "Before MISched:\n"; mf.print(dbgs()));
390
391 // Initialize the context of the pass.
392 MF = &mf;
393 MLI = &getAnalysis<MachineLoopInfo>();
394 MDT = &getAnalysis<MachineDominatorTree>();
395 PassConfig = &getAnalysis<TargetPassConfig>();
396 AA = &getAnalysis<AAResultsWrapperPass>().getAAResults();
397
398 LIS = &getAnalysis<LiveIntervals>();
399
400 if (VerifyScheduling) {
401 LLVM_DEBUG(LIS->dump());
402 MF->verify(this, "Before machine scheduling.");
403 }
404 RegClassInfo->runOnMachineFunction(*MF);
405
406 // Instantiate the selected scheduler for this target, function, and
407 // optimization level.
408 std::unique_ptr<ScheduleDAGInstrs> Scheduler(createMachineScheduler());
409 scheduleRegions(*Scheduler, false);
410
411 LLVM_DEBUG(LIS->dump());
412 if (VerifyScheduling)
413 MF->verify(this, "After machine scheduling.");
414 return true;
415}
416
417bool PostMachineScheduler::runOnMachineFunction(MachineFunction &mf) {
418 if (skipFunction(mf.getFunction()))
419 return false;
420
421 if (EnablePostRAMachineSched.getNumOccurrences()) {
422 if (!EnablePostRAMachineSched)
423 return false;
424 } else if (!mf.getSubtarget().enablePostRAMachineScheduler()) {
425 LLVM_DEBUG(dbgs() << "Subtarget disables post-MI-sched.\n");
426 return false;
427 }
428 LLVM_DEBUG(dbgs() << "Before post-MI-sched:\n"; mf.print(dbgs()));
429
430 // Initialize the context of the pass.
431 MF = &mf;
432 MLI = &getAnalysis<MachineLoopInfo>();
433 PassConfig = &getAnalysis<TargetPassConfig>();
434 AA = &getAnalysis<AAResultsWrapperPass>().getAAResults();
435
436 if (VerifyScheduling)
437 MF->verify(this, "Before post machine scheduling.");
438
439 // Instantiate the selected scheduler for this target, function, and
440 // optimization level.
441 std::unique_ptr<ScheduleDAGInstrs> Scheduler(createPostMachineScheduler());
442 scheduleRegions(*Scheduler, true);
443
444 if (VerifyScheduling)
445 MF->verify(this, "After post machine scheduling.");
446 return true;
447}
448
449/// Return true if the given instruction should not be included in a scheduling
450/// region.
451///
452/// MachineScheduler does not currently support scheduling across calls. To
453/// handle calls, the DAG builder needs to be modified to create register
454/// anti/output dependencies on the registers clobbered by the call's regmask
455/// operand. In PreRA scheduling, the stack pointer adjustment already prevents
456/// scheduling across calls. In PostRA scheduling, we need the isCall check to enforce
457/// the boundary, but there would be no benefit to postRA scheduling across
458/// calls this late anyway.
459static bool isSchedBoundary(MachineBasicBlock::iterator MI,
460 MachineBasicBlock *MBB,
461 MachineFunction *MF,
462 const TargetInstrInfo *TII) {
463 return MI->isCall() || TII->isSchedulingBoundary(*MI, MBB, *MF);
464}
465
466/// A region of an MBB for scheduling.
467namespace {
468struct SchedRegion {
469 /// RegionBegin is the first instruction in the scheduling region, and
470 /// RegionEnd is either MBB->end() or the scheduling boundary after the
471 /// last instruction in the scheduling region. These iterators cannot refer
472 /// to instructions outside of the identified scheduling region because
473 /// those may be reordered before scheduling this region.
474 MachineBasicBlock::iterator RegionBegin;
475 MachineBasicBlock::iterator RegionEnd;
476 unsigned NumRegionInstrs;
477
478 SchedRegion(MachineBasicBlock::iterator B, MachineBasicBlock::iterator E,
479 unsigned N) :
480 RegionBegin(B), RegionEnd(E), NumRegionInstrs(N) {}
481};
482} // end anonymous namespace
483
484using MBBRegionsVector = SmallVector<SchedRegion, 16>;
485
486static void
487getSchedRegions(MachineBasicBlock *MBB,
488 MBBRegionsVector &Regions,
489 bool RegionsTopDown) {
490 MachineFunction *MF = MBB->getParent();
491 const TargetInstrInfo *TII = MF->getSubtarget().getInstrInfo();
492
493 MachineBasicBlock::iterator I = nullptr;
494 for(MachineBasicBlock::iterator RegionEnd = MBB->end();
495 RegionEnd != MBB->begin(); RegionEnd = I) {
496
497 // Avoid decrementing RegionEnd for blocks with no terminator.
498 if (RegionEnd != MBB->end() ||
499 isSchedBoundary(&*std::prev(RegionEnd), &*MBB, MF, TII)) {
500 --RegionEnd;
501 }
502
503 // The next region starts above the previous region. Look backward in the
504 // instruction stream until we find the nearest boundary.
505 unsigned NumRegionInstrs = 0;
506 I = RegionEnd;
507 for (;I != MBB->begin(); --I) {
508 MachineInstr &MI = *std::prev(I);
509 if (isSchedBoundary(&MI, &*MBB, MF, TII))
510 break;
511 if (!MI.isDebugOrPseudoInstr()) {
512 // MBB::size() uses instr_iterator to count. Here we need a bundle to
513 // count as a single instruction.
514 ++NumRegionInstrs;
515 }
516 }
517
518 // It's possible we found a scheduling region that only has debug
519 // instructions. Don't bother scheduling these.
520 if (NumRegionInstrs != 0)
521 Regions.push_back(SchedRegion(I, RegionEnd, NumRegionInstrs));
522 }
523
524 if (RegionsTopDown)
525 std::reverse(Regions.begin(), Regions.end());
526}
527
528/// Main driver for both MachineScheduler and PostMachineScheduler.
529void MachineSchedulerBase::scheduleRegions(ScheduleDAGInstrs &Scheduler,
530 bool FixKillFlags) {
531 // Visit all machine basic blocks.
532 //
533 // TODO: Visit blocks in global postorder or postorder within the bottom-up
534 // loop tree. Then we can optionally compute global RegPressure.
535 for (MachineFunction::iterator MBB = MF->begin(), MBBEnd = MF->end();
536 MBB != MBBEnd; ++MBB) {
537
538 Scheduler.startBlock(&*MBB);
539
540#ifndef NDEBUG
541 if (SchedOnlyFunc.getNumOccurrences() && SchedOnlyFunc != MF->getName())
542 continue;
543 if (SchedOnlyBlock.getNumOccurrences()
544 && (int)SchedOnlyBlock != MBB->getNumber())
545 continue;
546#endif
547
548 // Break the block into scheduling regions [I, RegionEnd). RegionEnd
549 // points to the scheduling boundary at the bottom of the region. The DAG
550 // does not include RegionEnd, but the region does (i.e. the next
551 // RegionEnd is above the previous RegionBegin). If the current block has
552 // no terminator then RegionEnd == MBB->end() for the bottom region.
553 //
554 // All the regions of MBB are first found and stored in MBBRegions, which
555 // are then processed top-down when RegionsTopDown is true.
556 //
557 // The Scheduler may insert instructions during either schedule() or
558 // exitRegion(), even for empty regions. So the local iterators 'I' and
559 // 'RegionEnd' are invalid across these calls. Instructions must not be
560 // added to other regions than the current one without updating MBBRegions.
561
562 MBBRegionsVector MBBRegions;
563 getSchedRegions(&*MBB, MBBRegions, Scheduler.doMBBSchedRegionsTopDown());
564 for (MBBRegionsVector::iterator R = MBBRegions.begin();
565 R != MBBRegions.end(); ++R) {
566 MachineBasicBlock::iterator I = R->RegionBegin;
567 MachineBasicBlock::iterator RegionEnd = R->RegionEnd;
568 unsigned NumRegionInstrs = R->NumRegionInstrs;
569
570 // Notify the scheduler of the region, even if we may skip scheduling
571 // it. Perhaps it still needs to be bundled.
572 Scheduler.enterRegion(&*MBB, I, RegionEnd, NumRegionInstrs);
573
574 // Skip empty scheduling regions (0 or 1 schedulable instructions).
575 if (I == RegionEnd || I == std::prev(RegionEnd)) {
576 // Close the current region. Bundle the terminator if needed.
577 // This invalidates 'RegionEnd' and 'I'.
578 Scheduler.exitRegion();
579 continue;
580 }
581 LLVM_DEBUG(dbgs() << "********** MI Scheduling **********\n");
582 LLVM_DEBUG(dbgs() << MF->getName() << ":" << printMBBReference(*MBB)
583 << " " << MBB->getName() << "\n From: " << *I
584 << " To: ";
585 if (RegionEnd != MBB->end()) dbgs() << *RegionEnd;
586 else dbgs() << "End\n";
587 dbgs() << " RegionInstrs: " << NumRegionInstrs << '\n');
588 if (DumpCriticalPathLength) {
589 errs() << MF->getName();
590 errs() << ":%bb. " << MBB->getNumber();
591 errs() << " " << MBB->getName() << " \n";
592 }
593
594 // Schedule a region: possibly reorder instructions.
595 // This invalidates the original region iterators.
596 Scheduler.schedule();
597
598 // Close the current region.
599 Scheduler.exitRegion();
600 }
601 Scheduler.finishBlock();
602 // FIXME: Ideally, no further passes should rely on kill flags. However,
603 // thumb2 size reduction is currently an exception, so the PostMIScheduler
604 // needs to do this.
605 if (FixKillFlags)
606 Scheduler.fixupKills(*MBB);
607 }
608 Scheduler.finalizeSchedule();
609}
610
611void MachineSchedulerBase::print(raw_ostream &O, const Module* m) const {
612 // unimplemented
613}
614
615#if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)
616LLVM_DUMP_METHOD void ReadyQueue::dump() const {
617 dbgs() << "Queue " << Name << ": ";
618 for (const SUnit *SU : Queue)
619 dbgs() << SU->NodeNum << " ";
620 dbgs() << "\n";
621}
622#endif
623
624//===----------------------------------------------------------------------===//
625// ScheduleDAGMI - Basic machine instruction scheduling. This is
626// independent of PreRA/PostRA scheduling and involves no extra book-keeping for
627// virtual registers.
628//===----------------------------------------------------------------------===//
629
630// Provide a vtable anchor.
631ScheduleDAGMI::~ScheduleDAGMI() = default;
632
633/// ReleaseSucc - Decrement the NumPredsLeft count of a successor. When
634/// NumPredsLeft reaches zero, release the successor node.
635///
636/// FIXME: Adjust SuccSU height based on MinLatency.
637void ScheduleDAGMI::releaseSucc(SUnit *SU, SDep *SuccEdge) {
638 SUnit *SuccSU = SuccEdge->getSUnit();
639
640 if (SuccEdge->isWeak()) {
641 --SuccSU->WeakPredsLeft;
642 if (SuccEdge->isCluster())
643 NextClusterSucc = SuccSU;
644 return;
645 }
646#ifndef NDEBUG
647 if (SuccSU->NumPredsLeft == 0) {
648 dbgs() << "*** Scheduling failed! ***\n";
649 dumpNode(*SuccSU);
650 dbgs() << " has been released too many times!\n";
651 llvm_unreachable(nullptr);
652 }
653#endif
654 // SU->TopReadyCycle was set to CurrCycle when it was scheduled. However,
655 // CurrCycle may have advanced since then.
656 if (SuccSU->TopReadyCycle < SU->TopReadyCycle + SuccEdge->getLatency())
657 SuccSU->TopReadyCycle = SU->TopReadyCycle + SuccEdge->getLatency();
658
659 --SuccSU->NumPredsLeft;
660 if (SuccSU->NumPredsLeft == 0 && SuccSU != &ExitSU)
661 SchedImpl->releaseTopNode(SuccSU);
662}
663
664/// releaseSuccessors - Call releaseSucc on each of SU's successors.
665void ScheduleDAGMI::releaseSuccessors(SUnit *SU) {
666 for (SDep &Succ : SU->Succs)
667 releaseSucc(SU, &Succ);
668}
669
670/// ReleasePred - Decrement the NumSuccsLeft count of a predecessor. When
671/// NumSuccsLeft reaches zero, release the predecessor node.
672///
673/// FIXME: Adjust PredSU height based on MinLatency.
674void ScheduleDAGMI::releasePred(SUnit *SU, SDep *PredEdge) {
675 SUnit *PredSU = PredEdge->getSUnit();
676
677 if (PredEdge->isWeak()) {
678 --PredSU->WeakSuccsLeft;
679 if (PredEdge->isCluster())
680 NextClusterPred = PredSU;
681 return;
682 }
683#ifndef NDEBUG
684 if (PredSU->NumSuccsLeft == 0) {
685 dbgs() << "*** Scheduling failed! ***\n";
686 dumpNode(*PredSU);
687 dbgs() << " has been released too many times!\n";
688 llvm_unreachable(nullptr);
689 }
690#endif
691 // SU->BotReadyCycle was set to CurrCycle when it was scheduled. However,
692 // CurrCycle may have advanced since then.
693 if (PredSU->BotReadyCycle < SU->BotReadyCycle + PredEdge->getLatency())
694 PredSU->BotReadyCycle = SU->BotReadyCycle + PredEdge->getLatency();
695
696 --PredSU->NumSuccsLeft;
697 if (PredSU->NumSuccsLeft == 0 && PredSU != &EntrySU)
698 SchedImpl->releaseBottomNode(PredSU);
699}
700
701/// releasePredecessors - Call releasePred on each of SU's predecessors.
702void ScheduleDAGMI::releasePredecessors(SUnit *SU) {
703 for (SDep &Pred : SU->Preds)
704 releasePred(SU, &Pred);
705}
706
707void ScheduleDAGMI::startBlock(MachineBasicBlock *bb) {
708 ScheduleDAGInstrs::startBlock(bb);
709 SchedImpl->enterMBB(bb);
710}
711
712void ScheduleDAGMI::finishBlock() {
713 SchedImpl->leaveMBB();
714 ScheduleDAGInstrs::finishBlock();
715}
716
717/// enterRegion - Called back from MachineScheduler::runOnMachineFunction after
718/// crossing a scheduling boundary. [begin, end) includes all instructions in
719/// the region, including the boundary itself and single-instruction regions
720/// that don't get scheduled.
721void ScheduleDAGMI::enterRegion(MachineBasicBlock *bb,
722 MachineBasicBlock::iterator begin,
723 MachineBasicBlock::iterator end,
724 unsigned regioninstrs)
725{
726 ScheduleDAGInstrs::enterRegion(bb, begin, end, regioninstrs);
727
728 SchedImpl->initPolicy(begin, end, regioninstrs);
729}
730
731/// This is normally called from the main scheduler loop but may also be invoked
732/// by the scheduling strategy to perform additional code motion.
733void ScheduleDAGMI::moveInstruction(
734 MachineInstr *MI, MachineBasicBlock::iterator InsertPos) {
735 // Advance RegionBegin if the first instruction moves down.
736 if (&*RegionBegin == MI)
737 ++RegionBegin;
738
739 // Update the instruction stream.
740 BB->splice(InsertPos, BB, MI);
741
742 // Update LiveIntervals
743 if (LIS)
744 LIS->handleMove(*MI, /*UpdateFlags=*/true);
745
746 // Recede RegionBegin if an instruction moves above the first.
747 if (RegionBegin == InsertPos)
748 RegionBegin = MI;
749}
750
751bool ScheduleDAGMI::checkSchedLimit() {
752#ifndef NDEBUG
753 if (NumInstrsScheduled == MISchedCutoff && MISchedCutoff != ~0U) {
754 CurrentTop = CurrentBottom;
755 return false;
756 }
757 ++NumInstrsScheduled;
758#endif
759 return true;
760}
761
762/// Per-region scheduling driver, called back from
763/// MachineScheduler::runOnMachineFunction. This is a simplified driver that
764/// does not consider liveness or register pressure. It is useful for PostRA
765/// scheduling and potentially other custom schedulers.
766void ScheduleDAGMI::schedule() {
767 LLVM_DEBUG(dbgs() << "ScheduleDAGMI::schedule starting\n");
768 LLVM_DEBUG(SchedImpl->dumpPolicy());
769
770 // Build the DAG.
771 buildSchedGraph(AA);
772
773 postprocessDAG();
774
775 SmallVector<SUnit*, 8> TopRoots, BotRoots;
776 findRootsAndBiasEdges(TopRoots, BotRoots);
777
778 LLVM_DEBUG(dump());
779 if (PrintDAGs) dump();
780 if (ViewMISchedDAGs) viewGraph();
781
782 // Initialize the strategy before modifying the DAG.
783 // This may initialize a DFSResult to be used for queue priority.
784 SchedImpl->initialize(this);
785
786 // Initialize ready queues now that the DAG and priority data are finalized.
787 initQueues(TopRoots, BotRoots);
788
789 bool IsTopNode = false;
790 while (true) {
791 LLVM_DEBUG(dbgs() << "** ScheduleDAGMI::schedule picking next node\n");
792 SUnit *SU = SchedImpl->pickNode(IsTopNode);
793 if (!SU) break;
794
795 assert(!SU->isScheduled && "Node already scheduled");
796 if (!checkSchedLimit())
797 break;
798
799 MachineInstr *MI = SU->getInstr();
800 if (IsTopNode) {
801 assert(SU->isTopReady() && "node still has unscheduled dependencies");
802 if (&*CurrentTop == MI)
803 CurrentTop = nextIfDebug(++CurrentTop, CurrentBottom);
804 else
805 moveInstruction(MI, CurrentTop);
806 } else {
807 assert(SU->isBottomReady() && "node still has unscheduled dependencies");
808 MachineBasicBlock::iterator priorII =
809 priorNonDebug(CurrentBottom, CurrentTop);
810 if (&*priorII == MI)
811 CurrentBottom = priorII;
812 else {
813 if (&*CurrentTop == MI)
814 CurrentTop = nextIfDebug(++CurrentTop, priorII);
815 moveInstruction(MI, CurrentBottom);
816 CurrentBottom = MI;
817 }
818 }
819 // Notify the scheduling strategy before updating the DAG.
820 // This sets the scheduled node's ReadyCycle to CurrCycle. When updateQueues
821 // runs, it can then use the accurate ReadyCycle time to determine whether
822 // newly released nodes can move to the readyQ.
823 SchedImpl->schedNode(SU, IsTopNode);
824
825 updateQueues(SU, IsTopNode);
826 }
827 assert(CurrentTop == CurrentBottom && "Nonempty unscheduled zone.");
828
829 placeDebugValues();
830
831 LLVM_DEBUG({
832 dbgs() << "*** Final schedule for "
833 << printMBBReference(*begin()->getParent()) << " ***\n";
834 dumpSchedule();
835 dbgs() << '\n';
836 });
837}
838
839/// Apply each ScheduleDAGMutation step in order.
840void ScheduleDAGMI::postprocessDAG() {
841 for (auto &m : Mutations)
842 m->apply(this);
843}
844
845void ScheduleDAGMI::
846findRootsAndBiasEdges(SmallVectorImpl<SUnit*> &TopRoots,
847 SmallVectorImpl<SUnit*> &BotRoots) {
848 for (SUnit &SU : SUnits) {
849 assert(!SU.isBoundaryNode() && "Boundary node should not be in SUnits");
850
851 // Order predecessors so DFSResult follows the critical path.
852 SU.biasCriticalPath();
853
854 // A SUnit is ready to top schedule if it has no predecessors.
855 if (!SU.NumPredsLeft)
856 TopRoots.push_back(&SU);
857 // A SUnit is ready to bottom schedule if it has no successors.
858 if (!SU.NumSuccsLeft)
859 BotRoots.push_back(&SU);
860 }
861 ExitSU.biasCriticalPath();
862}
863
864/// Identify DAG roots and set up scheduler queues.
865void ScheduleDAGMI::initQueues(ArrayRef<SUnit*> TopRoots,
866 ArrayRef<SUnit*> BotRoots) {
867 NextClusterSucc = nullptr;
868 NextClusterPred = nullptr;
869
870 // Release all DAG roots for scheduling, not including EntrySU/ExitSU.
871 //
872 // Nodes with unreleased weak edges can still be roots.
873 // Release top roots in forward order.
874 for (SUnit *SU : TopRoots)
875 SchedImpl->releaseTopNode(SU);
876
877 // Release bottom roots in reverse order so the higher priority nodes appear
878 // first. This is more natural and slightly more efficient.
879 for (SmallVectorImpl<SUnit*>::const_reverse_iterator
880 I = BotRoots.rbegin(), E = BotRoots.rend(); I != E; ++I) {
881 SchedImpl->releaseBottomNode(*I);
882 }
883
884 releaseSuccessors(&EntrySU);
885 releasePredecessors(&ExitSU);
886
887 SchedImpl->registerRoots();
888
889 // Advance past initial DebugValues.
890 CurrentTop = nextIfDebug(RegionBegin, RegionEnd);
891 CurrentBottom = RegionEnd;
892}
893
894/// Update scheduler queues after scheduling an instruction.
895void ScheduleDAGMI::updateQueues(SUnit *SU, bool IsTopNode) {
896 // Release dependent instructions for scheduling.
897 if (IsTopNode)
898 releaseSuccessors(SU);
899 else
900 releasePredecessors(SU);
901
902 SU->isScheduled = true;
903}
904
905/// Reinsert any remaining debug_values, just like the PostRA scheduler.
906void ScheduleDAGMI::placeDebugValues() {
907 // If first instruction was a DBG_VALUE then put it back.
908 if (FirstDbgValue) {
909 BB->splice(RegionBegin, BB, FirstDbgValue);
910 RegionBegin = FirstDbgValue;
911 }
912
913 for (std::vector<std::pair<MachineInstr *, MachineInstr *>>::iterator
914 DI = DbgValues.end(), DE = DbgValues.begin(); DI != DE; --DI) {
915 std::pair<MachineInstr *, MachineInstr *> P = *std::prev(DI);
916 MachineInstr *DbgValue = P.first;
917 MachineBasicBlock::iterator OrigPrevMI = P.second;
918 if (&*RegionBegin == DbgValue)
919 ++RegionBegin;
920 BB->splice(++OrigPrevMI, BB, DbgValue);
921 if (OrigPrevMI == std::prev(RegionEnd))
922 RegionEnd = DbgValue;
923 }
924 DbgValues.clear();
925 FirstDbgValue = nullptr;
926}
927
928#if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)
929LLVM_DUMP_METHOD void ScheduleDAGMI::dumpSchedule() const {
930 for (MachineInstr &MI : *this) {
931 if (SUnit *SU = getSUnit(&MI))
932 dumpNode(*SU);
933 else
934 dbgs() << "Missing SUnit\n";
935 }
936}
937#endif
938
939//===----------------------------------------------------------------------===//
940// ScheduleDAGMILive - Base class for MachineInstr scheduling with LiveIntervals
941// preservation.
942//===----------------------------------------------------------------------===//
943
944ScheduleDAGMILive::~ScheduleDAGMILive() {
945 delete DFSResult;
946}
947
948void ScheduleDAGMILive::collectVRegUses(SUnit &SU) {
949 const MachineInstr &MI = *SU.getInstr();
950 for (const MachineOperand &MO : MI.operands()) {
951 if (!MO.isReg())
952 continue;
953 if (!MO.readsReg())
954 continue;
955 if (TrackLaneMasks && !MO.isUse())
956 continue;
957
958 Register Reg = MO.getReg();
959 if (!Register::isVirtualRegister(Reg))
960 continue;
961
962 // Ignore re-defs.
963 if (TrackLaneMasks) {
964 bool FoundDef = false;
965 for (const MachineOperand &MO2 : MI.operands()) {
966 if (MO2.isReg() && MO2.isDef() && MO2.getReg() == Reg && !MO2.isDead()) {
967 FoundDef = true;
968 break;
969 }
970 }
971 if (FoundDef)
972 continue;
973 }
974
975 // Record this local VReg use.
976 VReg2SUnitMultiMap::iterator UI = VRegUses.find(Reg);
977 for (; UI != VRegUses.end(); ++UI) {
978 if (UI->SU == &SU)
979 break;
980 }
981 if (UI == VRegUses.end())
982 VRegUses.insert(VReg2SUnit(Reg, LaneBitmask::getNone(), &SU));
983 }
984}
985
986/// enterRegion - Called back from MachineScheduler::runOnMachineFunction after
987/// crossing a scheduling boundary. [begin, end) includes all instructions in
988/// the region, including the boundary itself and single-instruction regions
989/// that don't get scheduled.
990void ScheduleDAGMILive::enterRegion(MachineBasicBlock *bb,
991 MachineBasicBlock::iterator begin,
992 MachineBasicBlock::iterator end,
993 unsigned regioninstrs)
994{
995 // ScheduleDAGMI initializes SchedImpl's per-region policy.
996 ScheduleDAGMI::enterRegion(bb, begin, end, regioninstrs);
997
998 // For convenience remember the end of the liveness region.
999 LiveRegionEnd = (RegionEnd == bb->end()) ? RegionEnd : std::next(RegionEnd);
1000
1001 SUPressureDiffs.clear();
1002
1003 ShouldTrackPressure = SchedImpl->shouldTrackPressure();
1004 ShouldTrackLaneMasks = SchedImpl->shouldTrackLaneMasks();
1005
1006 assert((!ShouldTrackLaneMasks || ShouldTrackPressure) &&
1007 "ShouldTrackLaneMasks requires ShouldTrackPressure");
1008}
1009
1010// Setup the register pressure trackers for the top scheduled and bottom
1011// scheduled regions.
1012void ScheduleDAGMILive::initRegPressure() {
1013 VRegUses.clear();
1014 VRegUses.setUniverse(MRI.getNumVirtRegs());
1015 for (SUnit &SU : SUnits)
1016 collectVRegUses(SU);
1017
1018 TopRPTracker.init(&MF, RegClassInfo, LIS, BB, RegionBegin,
1019 ShouldTrackLaneMasks, false);
1020 BotRPTracker.init(&MF, RegClassInfo, LIS, BB, LiveRegionEnd,
1021 ShouldTrackLaneMasks, false);
1022
1023 // Close the RPTracker to finalize live ins.
1024 RPTracker.closeRegion();
1025
1026 LLVM_DEBUG(RPTracker.dump());
1027
1028 // Initialize the live ins and live outs.
1029 TopRPTracker.addLiveRegs(RPTracker.getPressure().LiveInRegs);
1030 BotRPTracker.addLiveRegs(RPTracker.getPressure().LiveOutRegs);
1031
1032 // Close one end of the tracker so we can call
1033 // getMaxUpward/DownwardPressureDelta before advancing across any
1034 // instructions. This converts currently live regs into live ins/outs.
1035 TopRPTracker.closeTop();
1036 BotRPTracker.closeBottom();
1037
1038 BotRPTracker.initLiveThru(RPTracker);
1039 if (!BotRPTracker.getLiveThru().empty()) {
1040 TopRPTracker.initLiveThru(BotRPTracker.getLiveThru());
1041 LLVM_DEBUG(dbgs() << "Live Thru: ";
1042 dumpRegSetPressure(BotRPTracker.getLiveThru(), TRI));
1043 };
1044
1045 // For each live out vreg reduce the pressure change associated with other
1046 // uses of the same vreg below the live-out reaching def.
1047 updatePressureDiffs(RPTracker.getPressure().LiveOutRegs);
1048
1049 // Account for liveness generated by the region boundary.
1050 if (LiveRegionEnd != RegionEnd) {
1051 SmallVector<RegisterMaskPair, 8> LiveUses;
1052 BotRPTracker.recede(&LiveUses);
1053 updatePressureDiffs(LiveUses);
1054 }
1055
1056 LLVM_DEBUG(dbgs() << "Top Pressure:\n";
1057 dumpRegSetPressure(TopRPTracker.getRegSetPressureAtPos(), TRI);
1058 dbgs() << "Bottom Pressure:\n";
1059 dumpRegSetPressure(BotRPTracker.getRegSetPressureAtPos(), TRI););
1060
1061 assert((BotRPTracker.getPos() == RegionEnd ||
1062 (RegionEnd->isDebugInstr() &&
1063 BotRPTracker.getPos() == priorNonDebug(RegionEnd, RegionBegin))) &&
1064 "Can't find the region bottom");
1065
1066 // Cache the list of excess pressure sets in this region. This will also track
1067 // the max pressure in the scheduled code for these sets.
1068 RegionCriticalPSets.clear();
1069 const std::vector<unsigned> &RegionPressure =
1070 RPTracker.getPressure().MaxSetPressure;
1071 for (unsigned i = 0, e = RegionPressure.size(); i < e; ++i) {
1072 unsigned Limit = RegClassInfo->getRegPressureSetLimit(i);
1073 if (RegionPressure[i] > Limit) {
1074 LLVM_DEBUG(dbgs() << TRI->getRegPressureSetName(i) << " Limit " << Limit
1075 << " Actual " << RegionPressure[i] << "\n");
1076 RegionCriticalPSets.push_back(PressureChange(i));
1077 }
1078 }
1079 LLVM_DEBUG(dbgs() << "Excess PSets: ";
1080 for (const PressureChange &RCPS
1081 : RegionCriticalPSets) dbgs()
1082 << TRI->getRegPressureSetName(RCPS.getPSet()) << " ";
1083 dbgs() << "\n");
1084}
1085
1086void ScheduleDAGMILive::
1087updateScheduledPressure(const SUnit *SU,
1088 const std::vector<unsigned> &NewMaxPressure) {
1089 const PressureDiff &PDiff = getPressureDiff(SU);
1090 unsigned CritIdx = 0, CritEnd = RegionCriticalPSets.size();
1091 for (const PressureChange &PC : PDiff) {
1092 if (!PC.isValid())
1093 break;
1094 unsigned ID = PC.getPSet();
1095 while (CritIdx != CritEnd && RegionCriticalPSets[CritIdx].getPSet() < ID)
1096 ++CritIdx;
1097 if (CritIdx != CritEnd && RegionCriticalPSets[CritIdx].getPSet() == ID) {
1098 if ((int)NewMaxPressure[ID] > RegionCriticalPSets[CritIdx].getUnitInc()
1099 && NewMaxPressure[ID] <= (unsigned)std::numeric_limits<int16_t>::max())
1100 RegionCriticalPSets[CritIdx].setUnitInc(NewMaxPressure[ID]);
1101 }
1102 unsigned Limit = RegClassInfo->getRegPressureSetLimit(ID);
1103 if (NewMaxPressure[ID] >= Limit - 2) {
1104 LLVM_DEBUG(dbgs() << " " << TRI->getRegPressureSetName(ID) << ": "
1105 << NewMaxPressure[ID]
1106 << ((NewMaxPressure[ID] > Limit) ? " > " : " <= ")
1107 << Limit << "(+ " << BotRPTracker.getLiveThru()[ID]
1108 << " livethru)\n");
1109 }
1110 }
1111}
1112
1113/// Update the PressureDiff array for liveness after scheduling this
1114/// instruction.
1115void ScheduleDAGMILive::updatePressureDiffs(
1116 ArrayRef<RegisterMaskPair> LiveUses) {
1117 for (const RegisterMaskPair &P : LiveUses) {
1118 Register Reg = P.RegUnit;
1119 /// FIXME: Currently assuming single-use physregs.
1120 if (!Register::isVirtualRegister(Reg))
1121 continue;
1122
1123 if (ShouldTrackLaneMasks) {
1124 // If the register has just become live then other uses won't change
1125 // this fact anymore => decrement pressure.
1126 // If the register has just become dead then other uses make it come
1127 // back to life => increment pressure.
1128 bool Decrement = P.LaneMask.any();
1129
1130 for (const VReg2SUnit &V2SU
1131 : make_range(VRegUses.find(Reg), VRegUses.end())) {
1132 SUnit &SU = *V2SU.SU;
1133 if (SU.isScheduled || &SU == &ExitSU)
1134 continue;
1135
1136 PressureDiff &PDiff = getPressureDiff(&SU);
1137 PDiff.addPressureChange(Reg, Decrement, &MRI);
1138 LLVM_DEBUG(dbgs() << " UpdateRegP: SU(" << SU.NodeNum << ") "
1139 << printReg(Reg, TRI) << ':'
1140 << PrintLaneMask(P.LaneMask) << ' ' << *SU.getInstr();
1141 dbgs() << " to "; PDiff.dump(*TRI););
1142 }
1143 } else {
1144 assert(P.LaneMask.any());
1145 LLVM_DEBUG(dbgs() << " LiveReg: " << printVRegOrUnit(Reg, TRI) << "\n");
1146 // This may be called before CurrentBottom has been initialized. However,
1147 // BotRPTracker must have a valid position. We want the value live into the
1148 // instruction or live out of the block, so ask for the previous
1149 // instruction's live-out.
1150 const LiveInterval &LI = LIS->getInterval(Reg);
1151 VNInfo *VNI;
1152 MachineBasicBlock::const_iterator I =
1153 nextIfDebug(BotRPTracker.getPos(), BB->end());
1154 if (I == BB->end())
1155 VNI = LI.getVNInfoBefore(LIS->getMBBEndIdx(BB));
1156 else {
1157 LiveQueryResult LRQ = LI.Query(LIS->getInstructionIndex(*I));
1158 VNI = LRQ.valueIn();
1159 }
1160 // RegisterPressureTracker guarantees that readsReg is true for LiveUses.
1161 assert(VNI && "No live value at use.");
1162 for (const VReg2SUnit &V2SU
1163 : make_range(VRegUses.find(Reg), VRegUses.end())) {
1164 SUnit *SU = V2SU.SU;
1165 // If this use comes before the reaching def, it cannot be a last use,
1166 // so decrease its pressure change.
1167 if (!SU->isScheduled && SU != &ExitSU) {
1168 LiveQueryResult LRQ =
1169 LI.Query(LIS->getInstructionIndex(*SU->getInstr()));
1170 if (LRQ.valueIn() == VNI) {
1171 PressureDiff &PDiff = getPressureDiff(SU);
1172 PDiff.addPressureChange(Reg, true, &MRI);
1173 LLVM_DEBUG(dbgs() << " UpdateRegP: SU(" << SU->NodeNum << ") "
1174 << *SU->getInstr();
1175 dbgs() << " to "; PDiff.dump(*TRI););
1176 }
1177 }
1178 }
1179 }
1180 }
1181}
1182
1183void ScheduleDAGMILive::dump() const {
1184#if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)
1185 if (EntrySU.getInstr() != nullptr)
1186 dumpNodeAll(EntrySU);
1187 for (const SUnit &SU : SUnits) {
1188 dumpNodeAll(SU);
1189 if (ShouldTrackPressure) {
1190 dbgs() << " Pressure Diff : ";
1191 getPressureDiff(&SU).dump(*TRI);
1192 }
1193 dbgs() << " Single Issue : ";
1194 if (SchedModel.mustBeginGroup(SU.getInstr()) &&
1195 SchedModel.mustEndGroup(SU.getInstr()))
1196 dbgs() << "true;";
1197 else
1198 dbgs() << "false;";
1199 dbgs() << '\n';
1200 }
1201 if (ExitSU.getInstr() != nullptr)
1202 dumpNodeAll(ExitSU);
1203#endif
1204}
1205
1206/// schedule - Called back from MachineScheduler::runOnMachineFunction
1207/// after setting up the current scheduling region. [RegionBegin, RegionEnd)
1208/// only includes instructions that have DAG nodes, not scheduling boundaries.
1209///
1210/// This is a skeletal driver, with all the functionality pushed into helpers,
1211/// so that it can be easily extended by experimental schedulers. Generally,
1212/// implementing MachineSchedStrategy should be sufficient to implement a new
1213/// scheduling algorithm. However, if a scheduler further subclasses
1214/// ScheduleDAGMILive then it will want to override this virtual method in order
1215/// to update any specialized state.
1216void ScheduleDAGMILive::schedule() {
1217 LLVM_DEBUG(dbgs() << "ScheduleDAGMILive::schedule starting\n");
1218 LLVM_DEBUG(SchedImpl->dumpPolicy());
1219 buildDAGWithRegPressure();
1220
1221 postprocessDAG();
1222
1223 SmallVector<SUnit*, 8> TopRoots, BotRoots;
1224 findRootsAndBiasEdges(TopRoots, BotRoots);
1225
1226 // Initialize the strategy before modifying the DAG.
1227 // This may initialize a DFSResult to be used for queue priority.
1228 SchedImpl->initialize(this);
1229
1230 LLVM_DEBUG(dump());
1231 if (PrintDAGs) dump();
1232 if (ViewMISchedDAGs) viewGraph();
1233
1234 // Initialize ready queues now that the DAG and priority data are finalized.
1235 initQueues(TopRoots, BotRoots);
1236
1237 bool IsTopNode = false;
1238 while (true) {
1239 LLVM_DEBUG(dbgs() << "** ScheduleDAGMILive::schedule picking next node\n");
1240 SUnit *SU = SchedImpl->pickNode(IsTopNode);
1241 if (!SU) break;
1242
1243 assert(!SU->isScheduled && "Node already scheduled");
1244 if (!checkSchedLimit())
1245 break;
1246
1247 scheduleMI(SU, IsTopNode);
1248
1249 if (DFSResult) {
1250 unsigned SubtreeID = DFSResult->getSubtreeID(SU);
1251 if (!ScheduledTrees.test(SubtreeID)) {
1252 ScheduledTrees.set(SubtreeID);
1253 DFSResult->scheduleTree(SubtreeID);
1254 SchedImpl->scheduleTree(SubtreeID);
1255 }
1256 }
1257
1258 // Notify the scheduling strategy after updating the DAG.
1259 SchedImpl->schedNode(SU, IsTopNode);
1260
1261 updateQueues(SU, IsTopNode);
1262 }
1263 assert(CurrentTop == CurrentBottom && "Nonempty unscheduled zone.");
1264
1265 placeDebugValues();
1266
1267 LLVM_DEBUG({
1268 dbgs() << "*** Final schedule for "
1269 << printMBBReference(*begin()->getParent()) << " ***\n";
1270 dumpSchedule();
1271 dbgs() << '\n';
1272 });
1273}
1274
1275/// Build the DAG and set up three register pressure trackers.
1276void ScheduleDAGMILive::buildDAGWithRegPressure() {
1277 if (!ShouldTrackPressure) {
1278 RPTracker.reset();
1279 RegionCriticalPSets.clear();
1280 buildSchedGraph(AA);
1281 return;
1282 }
1283
1284 // Initialize the register pressure tracker used by buildSchedGraph.
1285 RPTracker.init(&MF, RegClassInfo, LIS, BB, LiveRegionEnd,
1286 ShouldTrackLaneMasks, /*TrackUntiedDefs=*/true);
1287
1288 // Account for liveness generated by the region boundary.
1289 if (LiveRegionEnd != RegionEnd)
1290 RPTracker.recede();
1291
1292 // Build the DAG, and compute current register pressure.
1293 buildSchedGraph(AA, &RPTracker, &SUPressureDiffs, LIS, ShouldTrackLaneMasks);
1294
1295 // Initialize top/bottom trackers after computing region pressure.
1296 initRegPressure();
1297}
1298
1299void ScheduleDAGMILive::computeDFSResult() {
1300 if (!DFSResult)
1301 DFSResult = new SchedDFSResult(/*BottomU*/true, MinSubtreeSize);
1302 DFSResult->clear();
1303 ScheduledTrees.clear();
1304 DFSResult->resize(SUnits.size());
1305 DFSResult->compute(SUnits);
1306 ScheduledTrees.resize(DFSResult->getNumSubtrees());
1307}
1308
1309/// Compute the max cyclic critical path through the DAG. The scheduling DAG
1310/// only provides the critical path for single block loops. To handle loops that
1311/// span blocks, we could use the vreg path latencies provided by
1312/// MachineTraceMetrics instead. However, MachineTraceMetrics is not currently
1313/// available for use in the scheduler.
1314///
1315/// The cyclic path estimation identifies a def-use pair that crosses the back
1316/// edge and considers the depth and height of the nodes. For example, consider
1317/// the following instruction sequence where each instruction has unit latency
1318/// and defines an eponymous virtual register:
1319///
1320/// a->b(a,c)->c(b)->d(c)->exit
1321///
1322/// The cyclic critical path is two cycles: b->c->b
1323/// The acyclic critical path is four cycles: a->b->c->d->exit
1324/// LiveOutHeight = height(c) = len(c->d->exit) = 2
1325/// LiveOutDepth = depth(c) + 1 = len(a->b->c) + 1 = 3
1326/// LiveInHeight = height(b) + 1 = len(b->c->d->exit) + 1 = 4
1327/// LiveInDepth = depth(b) = len(a->b) = 1
1328///
1329/// LiveOutDepth - LiveInDepth = 3 - 1 = 2
1330/// LiveInHeight - LiveOutHeight = 4 - 2 = 2
1331/// CyclicCriticalPath = min(2, 2) = 2
1332///
1333/// This could be relevant to PostRA scheduling, but is currently implemented
1334/// assuming LiveIntervals.
1335unsigned ScheduleDAGMILive::computeCyclicCriticalPath() {
1336 // This only applies to single block loops.
1337 if (!BB->isSuccessor(BB))
1338 return 0;
1339
1340 unsigned MaxCyclicLatency = 0;
1341 // Visit each live out vreg def to find def/use pairs that cross iterations.
1342 for (const RegisterMaskPair &P : RPTracker.getPressure().LiveOutRegs) {
1343 Register Reg = P.RegUnit;
1344 if (!Register::isVirtualRegister(Reg))
1345 continue;
1346 const LiveInterval &LI = LIS->getInterval(Reg);
1347 const VNInfo *DefVNI = LI.getVNInfoBefore(LIS->getMBBEndIdx(BB));
1348 if (!DefVNI)
1349 continue;
1350
1351 MachineInstr *DefMI = LIS->getInstructionFromIndex(DefVNI->def);
1352 const SUnit *DefSU = getSUnit(DefMI);
1353 if (!DefSU)
1354 continue;
1355
1356 unsigned LiveOutHeight = DefSU->getHeight();
1357 unsigned LiveOutDepth = DefSU->getDepth() + DefSU->Latency;
1358 // Visit all local users of the vreg def.
1359 for (const VReg2SUnit &V2SU
1360 : make_range(VRegUses.find(Reg), VRegUses.end())) {
1361 SUnit *SU = V2SU.SU;
1362 if (SU == &ExitSU)
1363 continue;
1364
1365 // Only consider uses of the phi.
1366 LiveQueryResult LRQ = LI.Query(LIS->getInstructionIndex(*SU->getInstr()));
1367 if (!LRQ.valueIn()->isPHIDef())
1368 continue;
1369
1370 // Assume that a path spanning two iterations is a cycle, which could
1371 // overestimate in strange cases. This allows cyclic latency to be
1372 // estimated as the minimum slack of the vreg's depth or height.
1373 unsigned CyclicLatency = 0;
1374 if (LiveOutDepth > SU->getDepth())
1375 CyclicLatency = LiveOutDepth - SU->getDepth();
1376
1377 unsigned LiveInHeight = SU->getHeight() + DefSU->Latency;
1378 if (LiveInHeight > LiveOutHeight) {
1379 if (LiveInHeight - LiveOutHeight < CyclicLatency)
1380 CyclicLatency = LiveInHeight - LiveOutHeight;
1381 } else
1382 CyclicLatency = 0;
1383
1384 LLVM_DEBUG(dbgs() << "Cyclic Path: SU(" << DefSU->NodeNum << ") -> SU("do { } while (false)
1385 << SU->NodeNum << ") = " << CyclicLatency << "c\n")do { } while (false);
1386 if (CyclicLatency > MaxCyclicLatency)
1387 MaxCyclicLatency = CyclicLatency;
1388 }
1389 }
1390 LLVM_DEBUG(dbgs() << "Cyclic Critical Path: " << MaxCyclicLatency << "c\n")do { } while (false);
1391 return MaxCyclicLatency;
1392}
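// [Editorial sketch, not part of MachineScheduler.cpp] The per-use cyclic
// latency computed above reduces to the minimum of a depth slack and a
// height slack, both with saturating subtraction. A self-contained
// restatement with hypothetical parameter names (LiveOutDepth already
// includes the def's latency, mirroring the code above); the values match
// the a->b(a,c)->c(b)->d(c)->exit example in the doc comment:
//
// #include <algorithm> // std::min
//
// unsigned cyclicLatency(unsigned LiveOutDepth, unsigned LiveOutHeight,
//                        unsigned UseDepth, unsigned UseHeight,
//                        unsigned DefLatency) {
//   // Slack between the live-out def's depth+latency and the use's depth.
//   unsigned DepthSlack = LiveOutDepth > UseDepth ? LiveOutDepth - UseDepth : 0;
//   // Slack between the use's height+latency and the live-out def's height.
//   unsigned LiveInHeight = UseHeight + DefLatency;
//   unsigned HeightSlack =
//       LiveInHeight > LiveOutHeight ? LiveInHeight - LiveOutHeight : 0;
//   return std::min(DepthSlack, HeightSlack);
// }
//
// cyclicLatency(/*LiveOutDepth=*/3, /*LiveOutHeight=*/2, /*UseDepth=*/1,
//               /*UseHeight=*/3, /*DefLatency=*/1) == 2, matching the
// CyclicCriticalPath of 2 derived in the doc comment.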
1393
1394/// Release ExitSU predecessors and set up scheduler queues. Re-position
1395/// the Top RP tracker in case the region beginning has changed.
1396void ScheduleDAGMILive::initQueues(ArrayRef<SUnit*> TopRoots,
1397 ArrayRef<SUnit*> BotRoots) {
1398 ScheduleDAGMI::initQueues(TopRoots, BotRoots);
1399 if (ShouldTrackPressure) {
1400 assert(TopRPTracker.getPos() == RegionBegin && "bad initial Top tracker");
1401 TopRPTracker.setPos(CurrentTop);
1402 }
1403}
1404
1405/// Move an instruction and update register pressure.
1406void ScheduleDAGMILive::scheduleMI(SUnit *SU, bool IsTopNode) {
1407 // Move the instruction to its new location in the instruction stream.
1408 MachineInstr *MI = SU->getInstr();
1409
1410 if (IsTopNode) {
1411 assert(SU->isTopReady() && "node still has unscheduled dependencies");
1412 if (&*CurrentTop == MI)
1413 CurrentTop = nextIfDebug(++CurrentTop, CurrentBottom);
1414 else {
1415 moveInstruction(MI, CurrentTop);
1416 TopRPTracker.setPos(MI);
1417 }
1418
1419 if (ShouldTrackPressure) {
1420 // Update top scheduled pressure.
1421 RegisterOperands RegOpers;
1422 RegOpers.collect(*MI, *TRI, MRI, ShouldTrackLaneMasks, false);
1423 if (ShouldTrackLaneMasks) {
1424 // Adjust liveness and add missing dead+read-undef flags.
1425 SlotIndex SlotIdx = LIS->getInstructionIndex(*MI).getRegSlot();
1426 RegOpers.adjustLaneLiveness(*LIS, MRI, SlotIdx, MI);
1427 } else {
1428 // Adjust for missing dead-def flags.
1429 RegOpers.detectDeadDefs(*MI, *LIS);
1430 }
1431
1432 TopRPTracker.advance(RegOpers);
1433 assert(TopRPTracker.getPos() == CurrentTop && "out of sync");
1434 LLVM_DEBUG(dbgs() << "Top Pressure:\n"; dumpRegSetPressure(
1435 TopRPTracker.getRegSetPressureAtPos(), TRI););
1436
1437 updateScheduledPressure(SU, TopRPTracker.getPressure().MaxSetPressure);
1438 }
1439 } else {
1440 assert(SU->isBottomReady() && "node still has unscheduled dependencies");
1441 MachineBasicBlock::iterator priorII =
1442 priorNonDebug(CurrentBottom, CurrentTop);
1443 if (&*priorII == MI)
1444 CurrentBottom = priorII;
1445 else {
1446 if (&*CurrentTop == MI) {
1447 CurrentTop = nextIfDebug(++CurrentTop, priorII);
1448 TopRPTracker.setPos(CurrentTop);
1449 }
1450 moveInstruction(MI, CurrentBottom);
1451 CurrentBottom = MI;
1452 BotRPTracker.setPos(CurrentBottom);
1453 }
1454 if (ShouldTrackPressure) {
1455 RegisterOperands RegOpers;
1456 RegOpers.collect(*MI, *TRI, MRI, ShouldTrackLaneMasks, false);
1457 if (ShouldTrackLaneMasks) {
1458 // Adjust liveness and add missing dead+read-undef flags.
1459 SlotIndex SlotIdx = LIS->getInstructionIndex(*MI).getRegSlot();
1460 RegOpers.adjustLaneLiveness(*LIS, MRI, SlotIdx, MI);
1461 } else {
1462 // Adjust for missing dead-def flags.
1463 RegOpers.detectDeadDefs(*MI, *LIS);
1464 }
1465
1466 if (BotRPTracker.getPos() != CurrentBottom)
1467 BotRPTracker.recedeSkipDebugValues();
1468 SmallVector<RegisterMaskPair, 8> LiveUses;
1469 BotRPTracker.recede(RegOpers, &LiveUses);
1470 assert(BotRPTracker.getPos() == CurrentBottom && "out of sync");
1471 LLVM_DEBUG(dbgs() << "Bottom Pressure:\n"; dumpRegSetPressure(
1472 BotRPTracker.getRegSetPressureAtPos(), TRI););
1473
1474 updateScheduledPressure(SU, BotRPTracker.getPressure().MaxSetPressure);
1475 updatePressureDiffs(LiveUses);
1476 }
1477 }
1478}
1479
1480//===----------------------------------------------------------------------===//
1481// BaseMemOpClusterMutation - DAG post-processing to cluster loads or stores.
1482//===----------------------------------------------------------------------===//
1483
1484namespace {
1485
1486/// Post-process the DAG to create cluster edges between neighboring
1487/// loads or between neighboring stores.
1488class BaseMemOpClusterMutation : public ScheduleDAGMutation {
1489 struct MemOpInfo {
1490 SUnit *SU;
1491 SmallVector<const MachineOperand *, 4> BaseOps;
1492 int64_t Offset;
1493 unsigned Width;
1494
1495 MemOpInfo(SUnit *SU, ArrayRef<const MachineOperand *> BaseOps,
1496 int64_t Offset, unsigned Width)
1497 : SU(SU), BaseOps(BaseOps.begin(), BaseOps.end()), Offset(Offset),
1498 Width(Width) {}
1499
1500 static bool Compare(const MachineOperand *const &A,
1501 const MachineOperand *const &B) {
1502 if (A->getType() != B->getType())
1503 return A->getType() < B->getType();
1504 if (A->isReg())
1505 return A->getReg() < B->getReg();
1506 if (A->isFI()) {
1507 const MachineFunction &MF = *A->getParent()->getParent()->getParent();
1508 const TargetFrameLowering &TFI = *MF.getSubtarget().getFrameLowering();
1509 bool StackGrowsDown = TFI.getStackGrowthDirection() ==
1510 TargetFrameLowering::StackGrowsDown;
1511 return StackGrowsDown ? A->getIndex() > B->getIndex()
1512 : A->getIndex() < B->getIndex();
1513 }
1514
1515 llvm_unreachable("MemOpClusterMutation only supports register or frame "
1516 "index bases.");
1517 }
1518
1519 bool operator<(const MemOpInfo &RHS) const {
1520 // FIXME: Don't compare everything twice. Maybe use C++20 three way
1521 // comparison instead when it's available.
1522 if (std::lexicographical_compare(BaseOps.begin(), BaseOps.end(),
1523 RHS.BaseOps.begin(), RHS.BaseOps.end(),
1524 Compare))
1525 return true;
1526 if (std::lexicographical_compare(RHS.BaseOps.begin(), RHS.BaseOps.end(),
1527 BaseOps.begin(), BaseOps.end(), Compare))
1528 return false;
1529 if (Offset != RHS.Offset)
1530 return Offset < RHS.Offset;
1531 return SU->NodeNum < RHS.SU->NodeNum;
1532 }
1533 };
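// [Editorial sketch, not part of MachineScheduler.cpp] Addressing the FIXME
// above: once this file can use C++20 (it currently builds as C++14), the
// two lexicographical_compare calls could collapse into a single pass with
// std::lexicographical_compare_three_way (from <compare>/<algorithm>):
//
// bool operator<(const MemOpInfo &RHS) const {
//   auto Cmp = std::lexicographical_compare_three_way(
//       BaseOps.begin(), BaseOps.end(), RHS.BaseOps.begin(),
//       RHS.BaseOps.end(),
//       [](const MachineOperand *A, const MachineOperand *B) {
//         return Compare(A, B)   ? std::strong_ordering::less
//                : Compare(B, A) ? std::strong_ordering::greater
//                                : std::strong_ordering::equal;
//       });
//   if (Cmp != 0)
//     return Cmp < 0;
//   if (Offset != RHS.Offset)
//     return Offset < RHS.Offset;
//   return SU->NodeNum < RHS.SU->NodeNum;
// }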
1534
1535 const TargetInstrInfo *TII;
1536 const TargetRegisterInfo *TRI;
1537 bool IsLoad;
1538
1539public:
1540 BaseMemOpClusterMutation(const TargetInstrInfo *tii,
1541 const TargetRegisterInfo *tri, bool IsLoad)
1542 : TII(tii), TRI(tri), IsLoad(IsLoad) {}
1543
1544 void apply(ScheduleDAGInstrs *DAGInstrs) override;
1545
1546protected:
1547 void clusterNeighboringMemOps(ArrayRef<MemOpInfo> MemOps, bool FastCluster,
1548 ScheduleDAGInstrs *DAG);
1549 void collectMemOpRecords(std::vector<SUnit> &SUnits,
1550 SmallVectorImpl<MemOpInfo> &MemOpRecords);
1551 bool groupMemOps(ArrayRef<MemOpInfo> MemOps, ScheduleDAGInstrs *DAG,
1552 DenseMap<unsigned, SmallVector<MemOpInfo, 32>> &Groups);
1553};
1554
1555class StoreClusterMutation : public BaseMemOpClusterMutation {
1556public:
1557 StoreClusterMutation(const TargetInstrInfo *tii,
1558 const TargetRegisterInfo *tri)
1559 : BaseMemOpClusterMutation(tii, tri, false) {}
1560};
1561
1562class LoadClusterMutation : public BaseMemOpClusterMutation {
1563public:
1564 LoadClusterMutation(const TargetInstrInfo *tii, const TargetRegisterInfo *tri)
1565 : BaseMemOpClusterMutation(tii, tri, true) {}
1566};
1567
1568} // end anonymous namespace
1569
1570namespace llvm {
1571
1572std::unique_ptr<ScheduleDAGMutation>
1573createLoadClusterDAGMutation(const TargetInstrInfo *TII,
1574 const TargetRegisterInfo *TRI) {
1575 return EnableMemOpCluster ? std::make_unique<LoadClusterMutation>(TII, TRI)
1576 : nullptr;
1577}
1578
1579std::unique_ptr<ScheduleDAGMutation>
1580createStoreClusterDAGMutation(const TargetInstrInfo *TII,
1581 const TargetRegisterInfo *TRI) {
1582 return EnableMemOpCluster ? std::make_unique<StoreClusterMutation>(TII, TRI)
1583 : nullptr;
1584}
1585
1586} // end namespace llvm
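// [Editorial note] A typical way targets consume these factories is to
// attach the mutations while constructing their scheduler instance. A sketch
// modeled on how in-tree targets (e.g. AArch64) do it, with a hypothetical
// target name:
//
// ScheduleDAGInstrs *createMyTargetSchedLive(MachineSchedContext *C) {
//   ScheduleDAGMILive *DAG = createGenericSchedLive(C);
//   // The factories return nullptr when EnableMemOpCluster is off.
//   DAG->addMutation(createLoadClusterDAGMutation(DAG->TII, DAG->TRI));
//   DAG->addMutation(createStoreClusterDAGMutation(DAG->TII, DAG->TRI));
//   return DAG;
// }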
1587
1588// Sort all the loads/stores first. Then, for each load/store, check the
1589// following loads/stores one by one until reaching the first non-dependent
1590// one, and call the target hook to see if they can be clustered.
1591// If FastCluster is enabled, we assume that all the loads/stores have been
1592// preprocessed and no longer have dependencies on each other.
1593void BaseMemOpClusterMutation::clusterNeighboringMemOps(
1594 ArrayRef<MemOpInfo> MemOpRecords, bool FastCluster,
1595 ScheduleDAGInstrs *DAG) {
1596 // Keep track of the current cluster length and bytes for each SUnit.
1597 DenseMap<unsigned, std::pair<unsigned, unsigned>> SUnit2ClusterInfo;
1598
1599 // At this point, `MemOpRecords` array must hold at least two mem ops. Try to
1600 // cluster mem ops collected within `MemOpRecords` array.
1601 for (unsigned Idx = 0, End = MemOpRecords.size(); Idx < (End - 1); ++Idx) {
1602 // The decision to cluster mem ops is made based on target-dependent logic.
1603 auto MemOpa = MemOpRecords[Idx];
1604
1605 // Look for the next load/store to cluster with.
1606 unsigned NextIdx = Idx + 1;
1607 for (; NextIdx < End; ++NextIdx)
1608 // Skip if MemOpb has been clustered already or has a dependency with
1609 // MemOpa.
1610 if (!SUnit2ClusterInfo.count(MemOpRecords[NextIdx].SU->NodeNum) &&
1611 (FastCluster ||
1612 (!DAG->IsReachable(MemOpRecords[NextIdx].SU, MemOpa.SU) &&
1613 !DAG->IsReachable(MemOpa.SU, MemOpRecords[NextIdx].SU))))
1614 break;
1615 if (NextIdx == End)
1616 continue;
1617
1618 auto MemOpb = MemOpRecords[NextIdx];
1619 unsigned ClusterLength = 2;
1620 unsigned CurrentClusterBytes = MemOpa.Width + MemOpb.Width;
1621 if (SUnit2ClusterInfo.count(MemOpa.SU->NodeNum)) {
1622 ClusterLength = SUnit2ClusterInfo[MemOpa.SU->NodeNum].first + 1;
1623 CurrentClusterBytes =
1624 SUnit2ClusterInfo[MemOpa.SU->NodeNum].second + MemOpb.Width;
1625 }
1626
1627 if (!TII->shouldClusterMemOps(MemOpa.BaseOps, MemOpb.BaseOps, ClusterLength,
1628 CurrentClusterBytes))
1629 continue;
1630
1631 SUnit *SUa = MemOpa.SU;
1632 SUnit *SUb = MemOpb.SU;
1633 if (SUa->NodeNum > SUb->NodeNum)
1634 std::swap(SUa, SUb);
1635
1636 // FIXME: Is this check really required?
1637 if (!DAG->addEdge(SUb, SDep(SUa, SDep::Cluster)))
1638 continue;
1639
1640 LLVM_DEBUG(dbgs() << "Cluster ld/st SU(" << SUa->NodeNum << ") - SU("do { } while (false)
1641 << SUb->NodeNum << ")\n")do { } while (false);
1642 ++NumClustered;
1643
1644 if (IsLoad) {
1645 // Copy successor edges from SUa to SUb. Interleaving computation
1646 // dependent on SUa can prevent load combining due to register reuse.
1647 // Predecessor edges do not need to be copied from SUb to SUa since
1648 // nearby loads should have effectively the same inputs.
1649 for (const SDep &Succ : SUa->Succs) {
1650 if (Succ.getSUnit() == SUb)
1651 continue;
1652 LLVM_DEBUG(dbgs() << " Copy Succ SU(" << Succ.getSUnit()->NodeNumdo { } while (false)
1653 << ")\n")do { } while (false);
1654 DAG->addEdge(Succ.getSUnit(), SDep(SUb, SDep::Artificial));
1655 }
1656 } else {
1657 // Copy predecessor edges from SUb to SUa to avoid the SUnits that
1658 // SUb depends on being scheduled in between SUb and SUa. Successor
1659 // edges do not need to be copied from SUa to SUb since nothing will
1660 // depend on stores.
1661 // Note that we don't need to worry about memory dependencies here:
1662 // we won't try to cluster mem ops that have any memory dependency.
1663 for (const SDep &Pred : SUb->Preds) {
1664 if (Pred.getSUnit() == SUa)
1665 continue;
1666 LLVM_DEBUG(dbgs() << " Copy Pred SU(" << Pred.getSUnit()->NodeNumdo { } while (false)
1667 << ")\n")do { } while (false);
1668 DAG->addEdge(SUa, SDep(Pred.getSUnit(), SDep::Artificial));
1669 }
1670 }
1671
1672 SUnit2ClusterInfo[MemOpb.SU->NodeNum] = {ClusterLength,
1673 CurrentClusterBytes};
1674
1675 LLVM_DEBUG(dbgs() << " Curr cluster length: " << ClusterLengthdo { } while (false)
1676 << ", Curr cluster bytes: " << CurrentClusterBytesdo { } while (false)
1677 << "\n")do { } while (false);
1678 }
1679}
1680
1681void BaseMemOpClusterMutation::collectMemOpRecords(
1682 std::vector<SUnit> &SUnits, SmallVectorImpl<MemOpInfo> &MemOpRecords) {
1683 for (auto &SU : SUnits) {
1684 if ((IsLoad && !SU.getInstr()->mayLoad()) ||
1685 (!IsLoad && !SU.getInstr()->mayStore()))
1686 continue;
1687
1688 const MachineInstr &MI = *SU.getInstr();
1689 SmallVector<const MachineOperand *, 4> BaseOps;
1690 int64_t Offset;
1691 bool OffsetIsScalable;
1692 unsigned Width;
1693 if (TII->getMemOperandsWithOffsetWidth(MI, BaseOps, Offset,
1694 OffsetIsScalable, Width, TRI)) {
1695 MemOpRecords.push_back(MemOpInfo(&SU, BaseOps, Offset, Width));
1696
1697 LLVM_DEBUG(dbgs() << "Num BaseOps: " << BaseOps.size() << ", Offset: "do { } while (false)
1698 << Offset << ", OffsetIsScalable: " << OffsetIsScalabledo { } while (false)
1699 << ", Width: " << Width << "\n")do { } while (false);
1700 }
1701#ifndef NDEBUG
1702 for (auto *Op : BaseOps)
1703 assert(Op);
1704#endif
1705 }
1706}
1707
1708bool BaseMemOpClusterMutation::groupMemOps(
1709 ArrayRef<MemOpInfo> MemOps, ScheduleDAGInstrs *DAG,
1710 DenseMap<unsigned, SmallVector<MemOpInfo, 32>> &Groups) {
1711 bool FastCluster =
1712 ForceFastCluster ||
1713 MemOps.size() * DAG->SUnits.size() / 1000 > FastClusterThreshold;
1714
1715 for (const auto &MemOp : MemOps) {
1716 unsigned ChainPredID = DAG->SUnits.size();
1717 if (FastCluster) {
1718 for (const SDep &Pred : MemOp.SU->Preds) {
1719 // We only want to cluster mem ops that have the same ctrl (non-data)
1720 // pred, so that they have no ctrl dependency on each other. But for
1721 // store instrs, we can still cluster them if the pred is a load instr.
1722 if ((Pred.isCtrl() &&
1723 (IsLoad ||
1724 (Pred.getSUnit() && Pred.getSUnit()->getInstr()->mayStore()))) &&
1725 !Pred.isArtificial()) {
1726 ChainPredID = Pred.getSUnit()->NodeNum;
1727 break;
1728 }
1729 }
1730 } else
1731 ChainPredID = 0;
1732
1733 Groups[ChainPredID].push_back(MemOp);
1734 }
1735 return FastCluster;
1736}
1737
1738/// Callback from DAG postProcessing to create cluster edges for loads/stores.
1739void BaseMemOpClusterMutation::apply(ScheduleDAGInstrs *DAG) {
1740 // Collect all the clusterable loads/stores
1741 SmallVector<MemOpInfo, 32> MemOpRecords;
1742 collectMemOpRecords(DAG->SUnits, MemOpRecords);
1743
1744 if (MemOpRecords.size() < 2)
1745 return;
1746
1747 // If the DAG is too complex, put the loads/stores without dependencies
1748 // into the same group with some heuristic to avoid compile-time blow up.
1749 // Note that some fusion pairs could be lost with this.
1750 DenseMap<unsigned, SmallVector<MemOpInfo, 32>> Groups;
1751 bool FastCluster = groupMemOps(MemOpRecords, DAG, Groups);
1752
1753 for (auto &Group : Groups) {
1754 // Sort the loads/stores so that we can stop clustering as early as
1755 // possible.
1756 llvm::sort(Group.second);
1757
1758 // Try to cluster all the neighboring loads/stores.
1759 clusterNeighboringMemOps(Group.second, FastCluster, DAG);
1760 }
1761}
1762
1763//===----------------------------------------------------------------------===//
1764// CopyConstrain - DAG post-processing to encourage copy elimination.
1765//===----------------------------------------------------------------------===//
1766
1767namespace {
1768
1769/// Post-process the DAG to create weak edges from all uses of a copy to
1770/// the one use that defines the copy's source vreg, most likely an induction
1771/// variable increment.
1772class CopyConstrain : public ScheduleDAGMutation {
1773 // Transient state.
1774 SlotIndex RegionBeginIdx;
1775
1776 // RegionEndIdx is the slot index of the last non-debug instruction in the
1777 // scheduling region. So we may have RegionBeginIdx == RegionEndIdx.
1778 SlotIndex RegionEndIdx;
1779
1780public:
1781 CopyConstrain(const TargetInstrInfo *, const TargetRegisterInfo *) {}
1782
1783 void apply(ScheduleDAGInstrs *DAGInstrs) override;
1784
1785protected:
1786 void constrainLocalCopy(SUnit *CopySU, ScheduleDAGMILive *DAG);
1787};
1788
1789} // end anonymous namespace
1790
1791namespace llvm {
1792
1793std::unique_ptr<ScheduleDAGMutation>
1794createCopyConstrainDAGMutation(const TargetInstrInfo *TII,
1795 const TargetRegisterInfo *TRI) {
1796 return std::make_unique<CopyConstrain>(TII, TRI);
1797}
1798
1799} // end namespace llvm
1800
1801/// constrainLocalCopy handles two possibilities:
1802/// 1) Local src:
1803/// I0: = dst
1804/// I1: src = ...
1805/// I2: = dst
1806/// I3: dst = src (copy)
1807/// (create pred->succ edges I0->I1, I2->I1)
1808///
1809/// 2) Local copy:
1810/// I0: dst = src (copy)
1811/// I1: = dst
1812/// I2: src = ...
1813/// I3: = dst
1814/// (create pred->succ edges I1->I2, I3->I2)
1815///
1816/// Although the MachineScheduler is currently constrained to single blocks,
1817/// this algorithm should handle extended blocks. An EBB is a set of
1818/// contiguously numbered blocks such that the previous block in the EBB is
1819/// always the single predecessor.
1820void CopyConstrain::constrainLocalCopy(SUnit *CopySU, ScheduleDAGMILive *DAG) {
1821 LiveIntervals *LIS = DAG->getLIS();
1822 MachineInstr *Copy = CopySU->getInstr();
1823
1824 // Check for pure vreg copies.
1825 const MachineOperand &SrcOp = Copy->getOperand(1);
1826 Register SrcReg = SrcOp.getReg();
1827 if (!Register::isVirtualRegister(SrcReg) || !SrcOp.readsReg())
1828 return;
1829
1830 const MachineOperand &DstOp = Copy->getOperand(0);
1831 Register DstReg = DstOp.getReg();
1832 if (!Register::isVirtualRegister(DstReg) || DstOp.isDead())
1833 return;
1834
1835 // Check if either the dest or source is local. If it's live across a back
1836 // edge, it's not local. Note that if both vregs are live across the back
1837 // edge, we cannot successfully constrain the copy without cyclic scheduling.
1838 // If both the copy's source and dest are local live intervals, then we
1839 // should treat the dest as the global for the purpose of adding
1840 // constraints. This adds edges from source's other uses to the copy.
1841 unsigned LocalReg = SrcReg;
1842 unsigned GlobalReg = DstReg;
1843 LiveInterval *LocalLI = &LIS->getInterval(LocalReg);
1844 if (!LocalLI->isLocal(RegionBeginIdx, RegionEndIdx)) {
1845 LocalReg = DstReg;
1846 GlobalReg = SrcReg;
1847 LocalLI = &LIS->getInterval(LocalReg);
1848 if (!LocalLI->isLocal(RegionBeginIdx, RegionEndIdx))
1849 return;
1850 }
1851 LiveInterval *GlobalLI = &LIS->getInterval(GlobalReg);
1852
1853 // Find the global segment after the start of the local LI.
1854 LiveInterval::iterator GlobalSegment = GlobalLI->find(LocalLI->beginIndex());
1855 // If GlobalLI does not overlap LocalLI->start, then a copy directly feeds a
1856 // local live range. We could create edges from other global uses to the local
1857 // start, but the coalescer should have already eliminated these cases, so
1858 // don't bother dealing with it.
1859 if (GlobalSegment == GlobalLI->end())
1860 return;
1861
1862 // If GlobalSegment is killed at the LocalLI->start, the call to find()
1863 // returned the next global segment. But if GlobalSegment overlaps with
1864 // LocalLI->start, then advance to the next segment. If a hole in GlobalLI
1865 // exists in LocalLI's vicinity, GlobalSegment will be the end of the hole.
1866 if (GlobalSegment->contains(LocalLI->beginIndex()))
1867 ++GlobalSegment;
1868
1869 if (GlobalSegment == GlobalLI->end())
1870 return;
1871
1872 // Check if GlobalLI contains a hole in the vicinity of LocalLI.
1873 if (GlobalSegment != GlobalLI->begin()) {
1874 // Two address defs have no hole.
1875 if (SlotIndex::isSameInstr(std::prev(GlobalSegment)->end,
1876 GlobalSegment->start)) {
1877 return;
1878 }
1879 // If the prior global segment may be defined by the same two-address
1880 // instruction that also defines LocalLI, then can't make a hole here.
1881 if (SlotIndex::isSameInstr(std::prev(GlobalSegment)->start,
1882 LocalLI->beginIndex())) {
1883 return;
1884 }
1885 // If GlobalLI has a prior segment, it must be live into the EBB. Otherwise
1886 // it would be a disconnected component in the live range.
1887 assert(std::prev(GlobalSegment)->start < LocalLI->beginIndex() &&
1888 "Disconnected LRG within the scheduling region.");
1889 }
1890 MachineInstr *GlobalDef = LIS->getInstructionFromIndex(GlobalSegment->start);
1891 if (!GlobalDef)
1892 return;
1893
1894 SUnit *GlobalSU = DAG->getSUnit(GlobalDef);
1895 if (!GlobalSU)
1896 return;
1897
1898 // GlobalDef is the bottom of the GlobalLI hole. Open the hole by
1899 // constraining the uses of the last local def to precede GlobalDef.
1900 SmallVector<SUnit*,8> LocalUses;
1901 const VNInfo *LastLocalVN = LocalLI->getVNInfoBefore(LocalLI->endIndex());
1902 MachineInstr *LastLocalDef = LIS->getInstructionFromIndex(LastLocalVN->def);
1903 SUnit *LastLocalSU = DAG->getSUnit(LastLocalDef);
1904 for (const SDep &Succ : LastLocalSU->Succs) {
1905 if (Succ.getKind() != SDep::Data || Succ.getReg() != LocalReg)
1906 continue;
1907 if (Succ.getSUnit() == GlobalSU)
1908 continue;
1909 if (!DAG->canAddEdge(GlobalSU, Succ.getSUnit()))
1910 return;
1911 LocalUses.push_back(Succ.getSUnit());
1912 }
1913 // Open the top of the GlobalLI hole by constraining any earlier global uses
1914 // to precede the start of LocalLI.
1915 SmallVector<SUnit*,8> GlobalUses;
1916 MachineInstr *FirstLocalDef =
1917 LIS->getInstructionFromIndex(LocalLI->beginIndex());
1918 SUnit *FirstLocalSU = DAG->getSUnit(FirstLocalDef);
1919 for (const SDep &Pred : GlobalSU->Preds) {
1920 if (Pred.getKind() != SDep::Anti || Pred.getReg() != GlobalReg)
1921 continue;
1922 if (Pred.getSUnit() == FirstLocalSU)
1923 continue;
1924 if (!DAG->canAddEdge(FirstLocalSU, Pred.getSUnit()))
1925 return;
1926 GlobalUses.push_back(Pred.getSUnit());
1927 }
1928 LLVM_DEBUG(dbgs() << "Constraining copy SU(" << CopySU->NodeNum << ")\n")do { } while (false);
1929 // Add the weak edges.
1930 for (SUnit *LU : LocalUses) {
1931 LLVM_DEBUG(dbgs() << " Local use SU(" << LU->NodeNum << ") -> SU("do { } while (false)
1932 << GlobalSU->NodeNum << ")\n")do { } while (false);
1933 DAG->addEdge(GlobalSU, SDep(LU, SDep::Weak));
1934 }
1935 for (SUnit *GU : GlobalUses) {
1936 LLVM_DEBUG(dbgs() << " Global use SU(" << GU->NodeNum << ") -> SU("do { } while (false)
1937 << FirstLocalSU->NodeNum << ")\n")do { } while (false);
1938 DAG->addEdge(FirstLocalSU, SDep(GU, SDep::Weak));
1939 }
1940}
1941
1942/// Callback from DAG postProcessing to create weak edges to encourage
1943/// copy elimination.
1944void CopyConstrain::apply(ScheduleDAGInstrs *DAGInstrs) {
1945 ScheduleDAGMI *DAG = static_cast<ScheduleDAGMI*>(DAGInstrs);
1946 assert(DAG->hasVRegLiveness() && "Expect VRegs with LiveIntervals");
1947
1948 MachineBasicBlock::iterator FirstPos = nextIfDebug(DAG->begin(), DAG->end());
1949 if (FirstPos == DAG->end())
1950 return;
1951 RegionBeginIdx = DAG->getLIS()->getInstructionIndex(*FirstPos);
1952 RegionEndIdx = DAG->getLIS()->getInstructionIndex(
1953 *priorNonDebug(DAG->end(), DAG->begin()));
1954
1955 for (SUnit &SU : DAG->SUnits) {
1956 if (!SU.getInstr()->isCopy())
1957 continue;
1958
1959 constrainLocalCopy(&SU, static_cast<ScheduleDAGMILive*>(DAG));
1960 }
1961}
1962
1963//===----------------------------------------------------------------------===//
1964// MachineSchedStrategy helpers used by GenericScheduler, GenericPostScheduler
1965// and possibly other custom schedulers.
1966//===----------------------------------------------------------------------===//
1967
1968static const unsigned InvalidCycle = ~0U;
1969
1970SchedBoundary::~SchedBoundary() { delete HazardRec; }
1971
1972/// Given a Count of resource usage and a Latency value, return true if a
1973/// SchedBoundary becomes resource limited.
1974/// If we are checking after scheduling a node, we should return true when
1975/// we just reach the resource limit.
1976static bool checkResourceLimit(unsigned LFactor, unsigned Count,
1977 unsigned Latency, bool AfterSchedNode) {
1978 int ResCntFactor = (int)(Count - (Latency * LFactor));
1979 if (AfterSchedNode)
1980 return ResCntFactor >= (int)LFactor;
1981 else
1982 return ResCntFactor > (int)LFactor;
1983}
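// [Editorial example, hypothetical numbers] With LFactor = 2 and
// Latency = 10, the zone becomes resource limited once Count pulls a full
// cycle ahead of Latency * LFactor = 20:
//   Count = 24: ResCntFactor = 4 >= 2, limited in both modes.
//   Count = 22: ResCntFactor = 2 == LFactor, limited only when
//               AfterSchedNode is true (>= vs. >).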
1984
1985void SchedBoundary::reset() {
1986 // A new HazardRec is created for each DAG and owned by SchedBoundary.
1987 // Destroying and reconstructing it is very expensive though. So keep
1988 // invalid, placeholder HazardRecs.
1989 if (HazardRec && HazardRec->isEnabled()) {
1990 delete HazardRec;
1991 HazardRec = nullptr;
1992 }
1993 Available.clear();
1994 Pending.clear();
1995 CheckPending = false;
1996 CurrCycle = 0;
1997 CurrMOps = 0;
1998 MinReadyCycle = std::numeric_limits<unsigned>::max();
1999 ExpectedLatency = 0;
2000 DependentLatency = 0;
2001 RetiredMOps = 0;
2002 MaxExecutedResCount = 0;
2003 ZoneCritResIdx = 0;
2004 IsResourceLimited = false;
2005 ReservedCycles.clear();
2006 ReservedCyclesIndex.clear();
2007 ResourceGroupSubUnitMasks.clear();
2008#ifndef NDEBUG
2009 // Track the maximum number of stall cycles that could arise either from the
2010 // latency of a DAG edge or the number of cycles that a processor resource is
2011 // reserved (SchedBoundary::ReservedCycles).
2012 MaxObservedStall = 0;
2013#endif
2014 // Reserve a zero-count for invalid CritResIdx.
2015 ExecutedResCounts.resize(1);
2016 assert(!ExecutedResCounts[0] && "nonzero count for bad resource");
2017}
2018
2019void SchedRemainder::
2020init(ScheduleDAGMI *DAG, const TargetSchedModel *SchedModel) {
2021 reset();
2022 if (!SchedModel->hasInstrSchedModel())
2023 return;
2024 RemainingCounts.resize(SchedModel->getNumProcResourceKinds());
2025 for (SUnit &SU : DAG->SUnits) {
2026 const MCSchedClassDesc *SC = DAG->getSchedClass(&SU);
2027 RemIssueCount += SchedModel->getNumMicroOps(SU.getInstr(), SC)
2028 * SchedModel->getMicroOpFactor();
2029 for (TargetSchedModel::ProcResIter
2030 PI = SchedModel->getWriteProcResBegin(SC),
2031 PE = SchedModel->getWriteProcResEnd(SC); PI != PE; ++PI) {
2032 unsigned PIdx = PI->ProcResourceIdx;
2033 unsigned Factor = SchedModel->getResourceFactor(PIdx);
2034 RemainingCounts[PIdx] += (Factor * PI->Cycles);
2035 }
2036 }
2037}
2038
2039void SchedBoundary::
2040init(ScheduleDAGMI *dag, const TargetSchedModel *smodel, SchedRemainder *rem) {
2041 reset();
2042 DAG = dag;
2043 SchedModel = smodel;
2044 Rem = rem;
2045 if (SchedModel->hasInstrSchedModel()) {
2046 unsigned ResourceCount = SchedModel->getNumProcResourceKinds();
2047 ReservedCyclesIndex.resize(ResourceCount);
2048 ExecutedResCounts.resize(ResourceCount);
2049 ResourceGroupSubUnitMasks.resize(ResourceCount, APInt(ResourceCount, 0));
2050 unsigned NumUnits = 0;
2051
2052 for (unsigned i = 0; i < ResourceCount; ++i) {
2053 ReservedCyclesIndex[i] = NumUnits;
2054 NumUnits += SchedModel->getProcResource(i)->NumUnits;
2055 if (isUnbufferedGroup(i)) {
2056 auto SubUnits = SchedModel->getProcResource(i)->SubUnitsIdxBegin;
2057 for (unsigned U = 0, UE = SchedModel->getProcResource(i)->NumUnits;
2058 U != UE; ++U)
2059 ResourceGroupSubUnitMasks[i].setBit(SubUnits[U]);
2060 }
2061 }
2062
2063 ReservedCycles.resize(NumUnits, InvalidCycle);
2064 }
2065}
2066
2067/// Compute the stall cycles based on this SUnit's ready time. Heuristics treat
2068/// these "soft stalls" differently than the hard stall cycles based on CPU
2069/// resources and computed by checkHazard(). A fully in-order model
2070/// (MicroOpBufferSize==0) will not make use of this since instructions are not
2071/// available for scheduling until they are ready. However, a weaker in-order
2072/// model may use this for heuristics. For example, if a processor has in-order
2073/// behavior when reading certain resources, this may come into play.
2074unsigned SchedBoundary::getLatencyStallCycles(SUnit *SU) {
2075 if (!SU->isUnbuffered)
2076 return 0;
2077
2078 unsigned ReadyCycle = (isTop() ? SU->TopReadyCycle : SU->BotReadyCycle);
2079 if (ReadyCycle > CurrCycle)
2080 return ReadyCycle - CurrCycle;
2081 return 0;
2082}
2083
2084/// Compute the next cycle at which the given processor resource unit
2085/// can be scheduled.
2086unsigned SchedBoundary::getNextResourceCycleByInstance(unsigned InstanceIdx,
2087 unsigned Cycles) {
2088 unsigned NextUnreserved = ReservedCycles[InstanceIdx];
2089 // If this resource has never been used, always return cycle zero.
2090 if (NextUnreserved == InvalidCycle)
2091 return 0;
2092 // For bottom-up scheduling add the cycles needed for the current operation.
2093 if (!isTop())
2094 NextUnreserved += Cycles;
2095 return NextUnreserved;
2096}
2097
2098/// Compute the next cycle at which the given processor resource can be
2099/// scheduled. Returns the next cycle and the index of the processor resource
2100/// instance in the reserved cycles vector.
2101std::pair<unsigned, unsigned>
2102SchedBoundary::getNextResourceCycle(const MCSchedClassDesc *SC, unsigned PIdx,
2103 unsigned Cycles) {
2104
2105 unsigned MinNextUnreserved = InvalidCycle;
2106 unsigned InstanceIdx = 0;
2107 unsigned StartIndex = ReservedCyclesIndex[PIdx];
2108 unsigned NumberOfInstances = SchedModel->getProcResource(PIdx)->NumUnits;
2109 assert(NumberOfInstances > 0 &&
2110 "Cannot have zero instances of a ProcResource");
2111
2112 if (isUnbufferedGroup(PIdx)) {
2113 // If any subunits are used by the instruction, report that the resource
2114 // group is available at 0, effectively removing the group record from
2115 // hazarding and basing the hazarding decisions on the subunit records.
2116 // Otherwise, choose the first available instance from among the subunits.
2117 // Specifications which assign cycles to both the subunits and the group or
2118 // which use an unbuffered group with buffered subunits will appear to
2119 // schedule strangely. In the first case, the additional cycles for the
2120 // group will be ignored. In the second, the group will be ignored
2121 // entirely.
2122 for (const MCWriteProcResEntry &PE :
2123 make_range(SchedModel->getWriteProcResBegin(SC),
2124 SchedModel->getWriteProcResEnd(SC)))
2125 if (ResourceGroupSubUnitMasks[PIdx][PE.ProcResourceIdx])
2126 return std::make_pair(0u, StartIndex);
2127
2128 auto SubUnits = SchedModel->getProcResource(PIdx)->SubUnitsIdxBegin;
2129 for (unsigned I = 0, End = NumberOfInstances; I < End; ++I) {
2130 unsigned NextUnreserved, NextInstanceIdx;
2131 std::tie(NextUnreserved, NextInstanceIdx) =
2132 getNextResourceCycle(SC, SubUnits[I], Cycles);
2133 if (MinNextUnreserved > NextUnreserved) {
2134 InstanceIdx = NextInstanceIdx;
2135 MinNextUnreserved = NextUnreserved;
2136 }
2137 }
2138 return std::make_pair(MinNextUnreserved, InstanceIdx);
2139 }
2140
2141 for (unsigned I = StartIndex, End = StartIndex + NumberOfInstances; I < End;
2142 ++I) {
2143 unsigned NextUnreserved = getNextResourceCycleByInstance(I, Cycles);
2144 if (MinNextUnreserved > NextUnreserved) {
2145 InstanceIdx = I;
2146 MinNextUnreserved = NextUnreserved;
2147 }
2148 }
2149 return std::make_pair(MinNextUnreserved, InstanceIdx);
2150}
2151
2152/// Does this SU have a hazard within the current instruction group.
2153///
2154/// The scheduler supports two modes of hazard recognition. The first is the
2155/// ScheduleHazardRecognizer API. It is a fully general hazard recognizer that
2156/// supports highly complicated in-order reservation tables
2157/// (ScoreboardHazardRecognizer) and arbitrary target-specific logic.
2158///
2159/// The second is a streamlined mechanism that checks for hazards based on
2160/// simple counters that the scheduler itself maintains. It explicitly checks
2161/// for instruction dispatch limitations, including the number of micro-ops that
2162/// can dispatch per cycle.
2163///
2164/// TODO: Also check whether the SU must start a new group.
2165bool SchedBoundary::checkHazard(SUnit *SU) {
2166 if (HazardRec->isEnabled()
2167 && HazardRec->getHazardType(SU) != ScheduleHazardRecognizer::NoHazard) {
2168 return true;
2169 }
2170
2171 unsigned uops = SchedModel->getNumMicroOps(SU->getInstr());
2172 if ((CurrMOps > 0) && (CurrMOps + uops > SchedModel->getIssueWidth())) {
2173 LLVM_DEBUG(dbgs() << " SU(" << SU->NodeNum << ") uops="do { } while (false)
2174 << SchedModel->getNumMicroOps(SU->getInstr()) << '\n')do { } while (false);
2175 return true;
2176 }
2177
2178 if (CurrMOps > 0 &&
2179 ((isTop() && SchedModel->mustBeginGroup(SU->getInstr())) ||
2180 (!isTop() && SchedModel->mustEndGroup(SU->getInstr())))) {
2181 LLVM_DEBUG(dbgs() << " hazard: SU(" << SU->NodeNum << ") must "do { } while (false)
2182 << (isTop() ? "begin" : "end") << " group\n")do { } while (false);
2183 return true;
2184 }
2185
2186 if (SchedModel->hasInstrSchedModel() && SU->hasReservedResource) {
2187 const MCSchedClassDesc *SC = DAG->getSchedClass(SU);
2188 for (const MCWriteProcResEntry &PE :
2189 make_range(SchedModel->getWriteProcResBegin(SC),
2190 SchedModel->getWriteProcResEnd(SC))) {
2191 unsigned ResIdx = PE.ProcResourceIdx;
2192 unsigned Cycles = PE.Cycles;
2193 unsigned NRCycle, InstanceIdx;
2194 std::tie(NRCycle, InstanceIdx) = getNextResourceCycle(SC, ResIdx, Cycles);
2195 if (NRCycle > CurrCycle) {
2196#ifndef NDEBUG
2197 MaxObservedStall = std::max(Cycles, MaxObservedStall);
2198#endif
2199 LLVM_DEBUG(dbgs() << " SU(" << SU->NodeNum << ") "do { } while (false)
2200 << SchedModel->getResourceName(ResIdx)do { } while (false)
2201 << '[' << InstanceIdx - ReservedCyclesIndex[ResIdx] << ']'do { } while (false)
2202 << "=" << NRCycle << "c\n")do { } while (false);
2203 return true;
2204 }
2205 }
2206 }
2207 return false;
2208}
2209
2210// Find the unscheduled node in ReadySUs with the highest latency.
2211unsigned SchedBoundary::
2212findMaxLatency(ArrayRef<SUnit*> ReadySUs) {
2213 SUnit *LateSU = nullptr;
2214 unsigned RemLatency = 0;
2215 for (SUnit *SU : ReadySUs) {
2216 unsigned L = getUnscheduledLatency(SU);
2217 if (L > RemLatency) {
2218 RemLatency = L;
2219 LateSU = SU;
2220 }
2221 }
2222 if (LateSU) {
2223 LLVM_DEBUG(dbgs() << Available.getName() << " RemLatency SU("
2224 << LateSU->NodeNum << ") " << RemLatency << "c\n");
2225 }
2226 return RemLatency;
2227}
2228
2229// Count resources in this zone and the remaining unscheduled
2230// instruction. Return the max count, scaled. Set OtherCritIdx to the critical
2231// resource index, or zero if the zone is issue limited.
2232unsigned SchedBoundary::
2233getOtherResourceCount(unsigned &OtherCritIdx) {
2234 OtherCritIdx = 0;
2235 if (!SchedModel->hasInstrSchedModel())
2236 return 0;
2237
2238 unsigned OtherCritCount = Rem->RemIssueCount
2239 + (RetiredMOps * SchedModel->getMicroOpFactor());
2240 LLVM_DEBUG(dbgs() << " " << Available.getName() << " + Remain MOps: "do { } while (false)
2241 << OtherCritCount / SchedModel->getMicroOpFactor() << '\n')do { } while (false);
2242 for (unsigned PIdx = 1, PEnd = SchedModel->getNumProcResourceKinds();
2243 PIdx != PEnd; ++PIdx) {
2244 unsigned OtherCount = getResourceCount(PIdx) + Rem->RemainingCounts[PIdx];
2245 if (OtherCount > OtherCritCount) {
2246 OtherCritCount = OtherCount;
2247 OtherCritIdx = PIdx;
2248 }
2249 }
2250 if (OtherCritIdx) {
2251 LLVM_DEBUG(
2252 dbgs() << " " << Available.getName() << " + Remain CritRes: "
2253 << OtherCritCount / SchedModel->getResourceFactor(OtherCritIdx)
2254 << " " << SchedModel->getResourceName(OtherCritIdx) << "\n");
2255 }
2256 return OtherCritCount;
2257}
2258
2259void SchedBoundary::releaseNode(SUnit *SU, unsigned ReadyCycle, bool InPQueue,
2260 unsigned Idx) {
2261 assert(SU->getInstr() && "Scheduled SUnit must have instr");
2262
2263#ifndef NDEBUG
2264 // ReadyCycle has been bumped up to the CurrCycle when this node was
2265 // scheduled, but CurrCycle may have been eagerly advanced immediately after
2266 // scheduling, so may now be greater than ReadyCycle.
2267 if (ReadyCycle > CurrCycle)
2268 MaxObservedStall = std::max(ReadyCycle - CurrCycle, MaxObservedStall);
2269#endif
2270
2271 if (ReadyCycle < MinReadyCycle)
2272 MinReadyCycle = ReadyCycle;
2273
2274 // Check for interlocks first. For the purpose of other heuristics, an
2275 // instruction that cannot issue appears as if it's not in the ReadyQueue.
2276 bool IsBuffered = SchedModel->getMicroOpBufferSize() != 0;
2277 bool HazardDetected = (!IsBuffered && ReadyCycle > CurrCycle) ||
2278 checkHazard(SU) || (Available.size() >= ReadyListLimit);
2279
2280 if (!HazardDetected) {
2281 Available.push(SU);
2282
2283 if (InPQueue)
2284 Pending.remove(Pending.begin() + Idx);
2285 return;
2286 }
2287
2288 if (!InPQueue)
2289 Pending.push(SU);
2290}
2291
2292/// Move the boundary of scheduled code by one cycle.
2293void SchedBoundary::bumpCycle(unsigned NextCycle) {
2294 if (SchedModel->getMicroOpBufferSize() == 0) {
2295 assert(MinReadyCycle < std::numeric_limits<unsigned>::max() &&
2296 "MinReadyCycle uninitialized");
2297 if (MinReadyCycle > NextCycle)
2298 NextCycle = MinReadyCycle;
2299 }
2300 // Update the current micro-ops, which will issue in the next cycle.
2301 unsigned DecMOps = SchedModel->getIssueWidth() * (NextCycle - CurrCycle);
2302 CurrMOps = (CurrMOps <= DecMOps) ? 0 : CurrMOps - DecMOps;
2303
2304 // Decrement DependentLatency based on the next cycle.
2305 if ((NextCycle - CurrCycle) > DependentLatency)
2306 DependentLatency = 0;
2307 else
2308 DependentLatency -= (NextCycle - CurrCycle);
2309
2310 if (!HazardRec->isEnabled()) {
2311 // Bypass HazardRec virtual calls.
2312 CurrCycle = NextCycle;
2313 } else {
2314 // Bypass getHazardType calls in case of long latency.
2315 for (; CurrCycle != NextCycle; ++CurrCycle) {
2316 if (isTop())
2317 HazardRec->AdvanceCycle();
2318 else
2319 HazardRec->RecedeCycle();
2320 }
2321 }
2322 CheckPending = true;
2323 IsResourceLimited =
2324 checkResourceLimit(SchedModel->getLatencyFactor(), getCriticalCount(),
2325 getScheduledLatency(), true);
2326
2327 LLVM_DEBUG(dbgs() << "Cycle: " << CurrCycle << ' ' << Available.getName()do { } while (false)
2328 << '\n')do { } while (false);
2329}
2330
2331void SchedBoundary::incExecutedResources(unsigned PIdx, unsigned Count) {
2332 ExecutedResCounts[PIdx] += Count;
2333 if (ExecutedResCounts[PIdx] > MaxExecutedResCount)
2334 MaxExecutedResCount = ExecutedResCounts[PIdx];
2335}
2336
2337/// Add the given processor resource to this scheduled zone.
2338///
2339/// \param Cycles indicates the number of consecutive (non-pipelined) cycles
2340/// during which this resource is consumed.
2341///
2342/// \return the next cycle at which the instruction may execute without
2343/// oversubscribing resources.
2344unsigned SchedBoundary::countResource(const MCSchedClassDesc *SC, unsigned PIdx,
2345 unsigned Cycles, unsigned NextCycle) {
2346 unsigned Factor = SchedModel->getResourceFactor(PIdx);
2347 unsigned Count = Factor * Cycles;
2348 LLVM_DEBUG(dbgs() << " " << SchedModel->getResourceName(PIdx) << " +"do { } while (false)
2349 << Cycles << "x" << Factor << "u\n")do { } while (false);
2350
2351 // Update Executed resources counts.
2352 incExecutedResources(PIdx, Count);
2353 assert(Rem->RemainingCounts[PIdx] >= Count && "resource double counted");
2354 Rem->RemainingCounts[PIdx] -= Count;
2355
2356 // Check if this resource exceeds the current critical resource. If so, it
2357 // becomes the critical resource.
2358 if (ZoneCritResIdx != PIdx && (getResourceCount(PIdx) > getCriticalCount())) {
2359 ZoneCritResIdx = PIdx;
2360 LLVM_DEBUG(dbgs() << " *** Critical resource "do { } while (false)
2361 << SchedModel->getResourceName(PIdx) << ": "do { } while (false)
2362 << getResourceCount(PIdx) / SchedModel->getLatencyFactor()do { } while (false)
2363 << "c\n")do { } while (false);
2364 }
2365 // For reserved resources, record the highest cycle using the resource.
2366 unsigned NextAvailable, InstanceIdx;
2367 std::tie(NextAvailable, InstanceIdx) = getNextResourceCycle(SC, PIdx, Cycles);
2368 if (NextAvailable > CurrCycle) {
2369 LLVM_DEBUG(dbgs() << " Resource conflict: "do { } while (false)
2370 << SchedModel->getResourceName(PIdx)do { } while (false)
2371 << '[' << InstanceIdx - ReservedCyclesIndex[PIdx] << ']'do { } while (false)
2372 << " reserved until @" << NextAvailable << "\n")do { } while (false);
2373 }
2374 return NextAvailable;
2375}
2376
2377/// Move the boundary of scheduled code by one SUnit.
2378void SchedBoundary::bumpNode(SUnit *SU) {
2379 // Update the reservation table.
2380 if (HazardRec->isEnabled()) {
2381 if (!isTop() && SU->isCall) {
2382 // Calls are scheduled with their preceding instructions. For bottom-up
2383 // scheduling, clear the pipeline state before emitting.
2384 HazardRec->Reset();
2385 }
2386 HazardRec->EmitInstruction(SU);
2387 // Scheduling an instruction may have made pending instructions available.
2388 CheckPending = true;
2389 }
2390 // checkHazard should prevent scheduling multiple instructions per cycle that
2391 // exceed the issue width.
2392 const MCSchedClassDesc *SC = DAG->getSchedClass(SU);
2393 unsigned IncMOps = SchedModel->getNumMicroOps(SU->getInstr());
2394 assert(
2395 (CurrMOps == 0 || (CurrMOps + IncMOps) <= SchedModel->getIssueWidth()) &&
2396 "Cannot schedule this instruction's MicroOps in the current cycle.");
2397
2398 unsigned ReadyCycle = (isTop() ? SU->TopReadyCycle : SU->BotReadyCycle);
2399 LLVM_DEBUG(dbgs() << " Ready @" << ReadyCycle << "c\n")do { } while (false);
2400
2401 unsigned NextCycle = CurrCycle;
2402 switch (SchedModel->getMicroOpBufferSize()) {
2403 case 0:
2404 assert(ReadyCycle <= CurrCycle && "Broken PendingQueue");
2405 break;
2406 case 1:
2407 if (ReadyCycle > NextCycle) {
2408 NextCycle = ReadyCycle;
2409 LLVM_DEBUG(dbgs() << " *** Stall until: " << ReadyCycle << "\n")do { } while (false);
2410 }
2411 break;
2412 default:
2413 // We don't currently model the OOO reorder buffer, so consider all
2414 // scheduled MOps to be "retired". We do loosely model in-order resource
2415 // latency. If this instruction uses an in-order resource, account for any
2416 // likely stall cycles.
2417 if (SU->isUnbuffered && ReadyCycle > NextCycle)
2418 NextCycle = ReadyCycle;
2419 break;
2420 }
2421 RetiredMOps += IncMOps;
2422
2423 // Update resource counts and critical resource.
2424 if (SchedModel->hasInstrSchedModel()) {
2425 unsigned DecRemIssue = IncMOps * SchedModel->getMicroOpFactor();
2426 assert(Rem->RemIssueCount >= DecRemIssue && "MOps double counted");
2427 Rem->RemIssueCount -= DecRemIssue;
2428 if (ZoneCritResIdx) {
2429 // Scale scheduled micro-ops for comparing with the critical resource.
2430 unsigned ScaledMOps =
2431 RetiredMOps * SchedModel->getMicroOpFactor();
2432
2433 // If scaled micro-ops are now more than the previous critical resource by
2434 // a full cycle, then micro-ops issue becomes critical.
2435 if ((int)(ScaledMOps - getResourceCount(ZoneCritResIdx))
2436 >= (int)SchedModel->getLatencyFactor()) {
2437 ZoneCritResIdx = 0;
2438 LLVM_DEBUG(dbgs() << " *** Critical resource NumMicroOps: "do { } while (false)
2439 << ScaledMOps / SchedModel->getLatencyFactor()do { } while (false)
2440 << "c\n")do { } while (false);
2441 }
2442 }
2443 for (TargetSchedModel::ProcResIter
2444 PI = SchedModel->getWriteProcResBegin(SC),
2445 PE = SchedModel->getWriteProcResEnd(SC); PI != PE; ++PI) {
2446 unsigned RCycle =
2447 countResource(SC, PI->ProcResourceIdx, PI->Cycles, NextCycle);
2448 if (RCycle > NextCycle)
2449 NextCycle = RCycle;
2450 }
2451 if (SU->hasReservedResource) {
2452 // For reserved resources, record the highest cycle using the resource.
2453 // For top-down scheduling, this is the cycle in which we schedule this
2454 // instruction plus the number of cycles the operation reserves the
2455 // resource. For bottom-up, it is simply the instruction's cycle.
2456 for (TargetSchedModel::ProcResIter
2457 PI = SchedModel->getWriteProcResBegin(SC),
2458 PE = SchedModel->getWriteProcResEnd(SC); PI != PE; ++PI) {
2459 unsigned PIdx = PI->ProcResourceIdx;
2460 if (SchedModel->getProcResource(PIdx)->BufferSize == 0) {
2461 unsigned ReservedUntil, InstanceIdx;
2462 std::tie(ReservedUntil, InstanceIdx) =
2463 getNextResourceCycle(SC, PIdx, 0);
2464 if (isTop()) {
2465 ReservedCycles[InstanceIdx] =
2466 std::max(ReservedUntil, NextCycle + PI->Cycles);
2467 } else
2468 ReservedCycles[InstanceIdx] = NextCycle;
2469 }
2470 }
2471 }
2472 }
2473 // Update ExpectedLatency and DependentLatency.
2474 unsigned &TopLatency = isTop() ? ExpectedLatency : DependentLatency;
2475 unsigned &BotLatency = isTop() ? DependentLatency : ExpectedLatency;
2476 if (SU->getDepth() > TopLatency) {
2477 TopLatency = SU->getDepth();
2478 LLVM_DEBUG(dbgs() << " " << Available.getName() << " TopLatency SU("do { } while (false)
2479 << SU->NodeNum << ") " << TopLatency << "c\n")do { } while (false);
2480 }
2481 if (SU->getHeight() > BotLatency) {
2482 BotLatency = SU->getHeight();
2483 LLVM_DEBUG(dbgs() << " " << Available.getName() << " BotLatency SU("do { } while (false)
2484 << SU->NodeNum << ") " << BotLatency << "c\n")do { } while (false);
2485 }
2486 // If we stall for any reason, bump the cycle.
2487 if (NextCycle > CurrCycle)
2488 bumpCycle(NextCycle);
2489 else
2490 // After updating ZoneCritResIdx and ExpectedLatency, check if we're
2491 // resource limited. If a stall occurred, bumpCycle does this.
2492 IsResourceLimited =
2493 checkResourceLimit(SchedModel->getLatencyFactor(), getCriticalCount(),
2494 getScheduledLatency(), true);
2495
2496 // Update CurrMOps after calling bumpCycle to handle stalls, since bumpCycle
2497 // resets CurrMOps. Loop to handle instructions with more MOps than can issue
2498 // in one cycle. Since we commonly reach the max MOps here, opportunistically
2499 // bump the cycle to avoid uselessly checking everything in the readyQ.
2500 CurrMOps += IncMOps;
2501
2502 // Bump the cycle count for issue group constraints.
2503 // This must be done after NextCycle has been adjusted for all other stalls.
2504 // Calling bumpCycle(X) will reduce CurrMOps by one issue group and set
2505 // currCycle to X.
2506 if ((isTop() && SchedModel->mustEndGroup(SU->getInstr())) ||
2507 (!isTop() && SchedModel->mustBeginGroup(SU->getInstr()))) {
2508 LLVM_DEBUG(dbgs() << " Bump cycle to " << (isTop() ? "end" : "begin")do { } while (false)
2509 << " group\n")do { } while (false);
2510 bumpCycle(++NextCycle);
2511 }
2512
2513 while (CurrMOps >= SchedModel->getIssueWidth()) {
2514 LLVM_DEBUG(dbgs() << " *** Max MOps " << CurrMOps << " at cycle "do { } while (false)
2515 << CurrCycle << '\n')do { } while (false);
2516 bumpCycle(++NextCycle);
2517 }
2518 LLVM_DEBUG(dumpScheduledState());
2519}
2520
2521/// Release pending ready nodes into the available queue. This makes them
2522/// visible to heuristics.
2523void SchedBoundary::releasePending() {
2524 // If the available queue is empty, it is safe to reset MinReadyCycle.
2525 if (Available.empty())
2526 MinReadyCycle = std::numeric_limits<unsigned>::max();
2527
2528 // Check to see if any of the pending instructions are ready to issue. If
2529 // so, add them to the available queue.
2530 for (unsigned I = 0, E = Pending.size(); I < E; ++I) {
2531 SUnit *SU = *(Pending.begin() + I);
2532 unsigned ReadyCycle = isTop() ? SU->TopReadyCycle : SU->BotReadyCycle;
2533
2534 if (ReadyCycle < MinReadyCycle)
2535 MinReadyCycle = ReadyCycle;
2536
2537 if (Available.size() >= ReadyListLimit)
2538 break;
2539
2540 releaseNode(SU, ReadyCycle, true, I);
2541 if (E != Pending.size()) {
2542 --I;
2543 --E;
2544 }
2545 }
2546 CheckPending = false;
2547}
2548
2549/// Remove SU from the ready set for this boundary.
2550void SchedBoundary::removeReady(SUnit *SU) {
2551 if (Available.isInQueue(SU))
2552 Available.remove(Available.find(SU));
2553 else {
2554 assert(Pending.isInQueue(SU) && "bad ready count");
2555 Pending.remove(Pending.find(SU));
2556 }
2557}
2558
2559/// If this queue only has one ready candidate, return it. As a side effect,
2560/// defer any nodes that now hit a hazard, and advance the cycle until at least
2561/// one node is ready. If multiple instructions are ready, return NULL.
2562SUnit *SchedBoundary::pickOnlyChoice() {
2563 if (CheckPending)
[10] Assuming field 'CheckPending' is false
[11] Taking false branch
2564 releasePending();
2565
2566 // Defer any ready instrs that now have a hazard.
2567 for (ReadyQueue::iterator I = Available.begin(); I != Available.end();) {
[12] Loop condition is false. Execution continues on line 2575
2568 if (checkHazard(*I)) {
2569 Pending.push(*I);
2570 I = Available.remove(I);
2571 continue;
2572 }
2573 ++I;
2574 }
2575 for (unsigned i = 0; Available.empty(); ++i) {
[13] Loop condition is false. Execution continues on line 2584
2576// FIXME: Re-enable assert once PR20057 is resolved.
2577// assert(i <= (HazardRec->getMaxLookAhead() + MaxObservedStall) &&
2578// "permanent hazard");
2579 (void)i;
2580 bumpCycle(CurrCycle + 1);
2581 releasePending();
2582 }
2583
2584 LLVM_DEBUG(Pending.dump());
[14] Loop condition is false. Exiting loop
2585 LLVM_DEBUG(Available.dump());
[15] Loop condition is false. Exiting loop
2586
2587 if (Available.size() == 1)
[16] Assuming the condition is false
[17] Taking false branch
2588 return *Available.begin();
2589 return nullptr;
[18] Returning null pointer, which participates in a condition later
2590}
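// [Editorial note] As the analyzer path above records, pickOnlyChoice() can
// legitimately return nullptr (zero or several candidates ready), so every
// caller must guard the result before dereferencing. A minimal sketch of the
// expected calling pattern:
//
// if (SUnit *SU = Top.pickOnlyChoice()) {
//   // Exactly one candidate: schedule SU directly.
// } else {
//   // Fall back to heuristic candidate selection over the ready queue.
// }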
2591
2592#if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)
2593// This is useful information to dump after bumpNode.
2594// Note that the Queue contents are more useful before pickNodeFromQueue.
2595LLVM_DUMP_METHOD void SchedBoundary::dumpScheduledState() const {
2596 unsigned ResFactor;
2597 unsigned ResCount;
2598 if (ZoneCritResIdx) {
2599 ResFactor = SchedModel->getResourceFactor(ZoneCritResIdx);
2600 ResCount = getResourceCount(ZoneCritResIdx);
2601 } else {
2602 ResFactor = SchedModel->getMicroOpFactor();
2603 ResCount = RetiredMOps * ResFactor;
2604 }
2605 unsigned LFactor = SchedModel->getLatencyFactor();
2606 dbgs() << Available.getName() << " @" << CurrCycle << "c\n"
2607 << " Retired: " << RetiredMOps;
2608 dbgs() << "\n Executed: " << getExecutedCount() / LFactor << "c";
2609 dbgs() << "\n Critical: " << ResCount / LFactor << "c, "
2610 << ResCount / ResFactor << " "
2611 << SchedModel->getResourceName(ZoneCritResIdx)
2612 << "\n ExpectedLatency: " << ExpectedLatency << "c\n"
2613 << (IsResourceLimited ? " - Resource" : " - Latency")
2614 << " limited.\n";
2615}
2616#endif
2617
2618//===----------------------------------------------------------------------===//
2619// GenericScheduler - Generic implementation of MachineSchedStrategy.
2620//===----------------------------------------------------------------------===//
2621
2622void GenericSchedulerBase::SchedCandidate::
2623initResourceDelta(const ScheduleDAGMI *DAG,
2624 const TargetSchedModel *SchedModel) {
2625 if (!Policy.ReduceResIdx && !Policy.DemandResIdx)
2626 return;
2627
2628 const MCSchedClassDesc *SC = DAG->getSchedClass(SU);
2629 for (TargetSchedModel::ProcResIter
2630 PI = SchedModel->getWriteProcResBegin(SC),
2631 PE = SchedModel->getWriteProcResEnd(SC); PI != PE; ++PI) {
2632 if (PI->ProcResourceIdx == Policy.ReduceResIdx)
2633 ResDelta.CritResources += PI->Cycles;
2634 if (PI->ProcResourceIdx == Policy.DemandResIdx)
2635 ResDelta.DemandedResources += PI->Cycles;
2636 }
2637}
2638
2639/// Compute remaining latency. We need this both to determine whether the
2640/// overall schedule has become latency-limited and whether the instructions
2641/// outside this zone are resource or latency limited.
2642///
2643/// The "dependent" latency is updated incrementally during scheduling as the
2644/// max height/depth of scheduled nodes minus the cycles since it was
2645/// scheduled:
2646/// DLat = max(N.depth - (CurrCycle - N.ReadyCycle)) for N in Zone
2647///
2648/// The "independent" latency is the max ready queue depth:
2649/// ILat = max N.depth for N in Available|Pending
2650///
2651/// RemainingLatency is the greater of independent and dependent latency.
2652///
2653/// These computations are expensive, especially in DAGs with many edges, so
2654/// only do them if necessary.
2655static unsigned computeRemLatency(SchedBoundary &CurrZone) {
2656 unsigned RemLatency = CurrZone.getDependentLatency();
2657 RemLatency = std::max(RemLatency,
2658 CurrZone.findMaxLatency(CurrZone.Available.elements()));
2659 RemLatency = std::max(RemLatency,
2660 CurrZone.findMaxLatency(CurrZone.Pending.elements()));
2661 return RemLatency;
2662}
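// [Editorial example, hypothetical numbers] If the zone's incrementally
// maintained DependentLatency is 5 and the deepest node still sitting in
// Available or Pending has an unscheduled latency of 7, computeRemLatency
// returns max(5, 7) = 7; shouldReduceLatency below then treats the zone as
// latency limited when 7 + CurrCycle exceeds Rem.CriticalPath.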
2663
2664/// Returns true if the current cycle plus remaining latency is greater than
2665/// the critical path in the scheduling region.
2666bool GenericSchedulerBase::shouldReduceLatency(const CandPolicy &Policy,
2667 SchedBoundary &CurrZone,
2668 bool ComputeRemLatency,
2669 unsigned &RemLatency) const {
2670 // The current cycle is already greater than the critical path, so we are
2671 // already latency limited and don't need to compute the remaining latency.
2672 if (CurrZone.getCurrCycle() > Rem.CriticalPath)
2673 return true;
2674
2675 // If we haven't scheduled anything yet, then we aren't latency limited.
2676 if (CurrZone.getCurrCycle() == 0)
2677 return false;
2678
2679 if (ComputeRemLatency)
2680 RemLatency = computeRemLatency(CurrZone);
2681
2682 return RemLatency + CurrZone.getCurrCycle() > Rem.CriticalPath;
2683}
2684
2685/// Set the CandPolicy for a scheduling zone given the current resources and
2686/// latencies inside and outside the zone.
2687void GenericSchedulerBase::setPolicy(CandPolicy &Policy, bool IsPostRA,
2688 SchedBoundary &CurrZone,
2689 SchedBoundary *OtherZone) {
2690 // Apply preemptive heuristics based on the total latency and resources
2691 // inside and outside this zone. Potential stalls should be considered before
2692 // following this policy.
2693
2694 // Compute the critical resource outside the zone.
2695 unsigned OtherCritIdx = 0;
2696 unsigned OtherCount =
2697 OtherZone ? OtherZone->getOtherResourceCount(OtherCritIdx) : 0;
2698
2699 bool OtherResLimited = false;
2700 unsigned RemLatency = 0;
2701 bool RemLatencyComputed = false;
2702 if (SchedModel->hasInstrSchedModel() && OtherCount != 0) {
2703 RemLatency = computeRemLatency(CurrZone);
2704 RemLatencyComputed = true;
2705 OtherResLimited = checkResourceLimit(SchedModel->getLatencyFactor(),
2706 OtherCount, RemLatency, false);
2707 }
2708
2709 // Schedule aggressively for latency in PostRA mode. We don't check for
2710 // acyclic latency during PostRA, and highly out-of-order processors will
2711 // skip PostRA scheduling.
2712 if (!OtherResLimited &&
2713 (IsPostRA || shouldReduceLatency(Policy, CurrZone, !RemLatencyComputed,
2714 RemLatency))) {
2715 Policy.ReduceLatency |= true;
2716 LLVM_DEBUG(dbgs() << " " << CurrZone.Available.getName()do { } while (false)
2717 << " RemainingLatency " << RemLatency << " + "do { } while (false)
2718 << CurrZone.getCurrCycle() << "c > CritPath "do { } while (false)
2719 << Rem.CriticalPath << "\n")do { } while (false);
2720 }
2721 // If the same resource is limiting inside and outside the zone, do nothing.
2722 if (CurrZone.getZoneCritResIdx() == OtherCritIdx)
2723 return;
2724
2725 LLVM_DEBUG(if (CurrZone.isResourceLimited()) {
2726 dbgs() << " " << CurrZone.Available.getName() << " ResourceLimited: "
2727 << SchedModel->getResourceName(CurrZone.getZoneCritResIdx()) << "\n";
2728 } if (OtherResLimited) dbgs()
2729 << " RemainingLimit: "
2730 << SchedModel->getResourceName(OtherCritIdx) << "\n";
2731 if (!CurrZone.isResourceLimited() && !OtherResLimited) dbgs()
2732 << " Latency limited both directions.\n");
2733
2734 if (CurrZone.isResourceLimited() && !Policy.ReduceResIdx)
2735 Policy.ReduceResIdx = CurrZone.getZoneCritResIdx();
2736
2737 if (OtherResLimited)
2738 Policy.DemandResIdx = OtherCritIdx;
2739}
2740
2741#ifndef NDEBUG
2742const char *GenericSchedulerBase::getReasonStr(
2743 GenericSchedulerBase::CandReason Reason) {
2744 switch (Reason) {
2745 case NoCand: return "NOCAND ";
2746 case Only1: return "ONLY1 ";
2747 case PhysReg: return "PHYS-REG ";
2748 case RegExcess: return "REG-EXCESS";
2749 case RegCritical: return "REG-CRIT ";
2750 case Stall: return "STALL ";
2751 case Cluster: return "CLUSTER ";
2752 case Weak: return "WEAK ";
2753 case RegMax: return "REG-MAX ";
2754 case ResourceReduce: return "RES-REDUCE";
2755 case ResourceDemand: return "RES-DEMAND";
2756 case TopDepthReduce: return "TOP-DEPTH ";
2757 case TopPathReduce: return "TOP-PATH ";
2758 case BotHeightReduce:return "BOT-HEIGHT";
2759 case BotPathReduce: return "BOT-PATH ";
2760 case NextDefUse: return "DEF-USE ";
2761 case NodeOrder: return "ORDER ";
2762 };
2763 llvm_unreachable("Unknown reason!");
2764}
2765
2766void GenericSchedulerBase::traceCandidate(const SchedCandidate &Cand) {
2767 PressureChange P;
2768 unsigned ResIdx = 0;
2769 unsigned Latency = 0;
2770 switch (Cand.Reason) {
2771 default:
2772 break;
2773 case RegExcess:
2774 P = Cand.RPDelta.Excess;
2775 break;
2776 case RegCritical:
2777 P = Cand.RPDelta.CriticalMax;
2778 break;
2779 case RegMax:
2780 P = Cand.RPDelta.CurrentMax;
2781 break;
2782 case ResourceReduce:
2783 ResIdx = Cand.Policy.ReduceResIdx;
2784 break;
2785 case ResourceDemand:
2786 ResIdx = Cand.Policy.DemandResIdx;
2787 break;
2788 case TopDepthReduce:
2789 Latency = Cand.SU->getDepth();
2790 break;
2791 case TopPathReduce:
2792 Latency = Cand.SU->getHeight();
2793 break;
2794 case BotHeightReduce:
2795 Latency = Cand.SU->getHeight();
2796 break;
2797 case BotPathReduce:
2798 Latency = Cand.SU->getDepth();
2799 break;
2800 }
2801 dbgs() << " Cand SU(" << Cand.SU->NodeNum << ") " << getReasonStr(Cand.Reason);
2802 if (P.isValid())
2803 dbgs() << " " << TRI->getRegPressureSetName(P.getPSet())
2804 << ":" << P.getUnitInc() << " ";
2805 else
2806 dbgs() << " ";
2807 if (ResIdx)
2808 dbgs() << " " << SchedModel->getProcResource(ResIdx)->Name << " ";
2809 else
2810 dbgs() << " ";
2811 if (Latency)
2812 dbgs() << " " << Latency << " cycles ";
2813 else
2814 dbgs() << " ";
2815 dbgs() << '\n';
2816}
2817#endif
2818
2819namespace llvm {
2820/// Return true if this heuristic determines order.
2821/// TODO: Consider refactoring the return type of these functions to an integer
2822/// or enum, as we may need to differentiate whether TryCand is better than Cand.
2823bool tryLess(int TryVal, int CandVal,
2824 GenericSchedulerBase::SchedCandidate &TryCand,
2825 GenericSchedulerBase::SchedCandidate &Cand,
2826 GenericSchedulerBase::CandReason Reason) {
2827 if (TryVal < CandVal) {
2828 TryCand.Reason = Reason;
2829 return true;
2830 }
2831 if (TryVal > CandVal) {
2832 if (Cand.Reason > Reason)
2833 Cand.Reason = Reason;
2834 return true;
2835 }
2836 return false;
2837}
2838
2839bool tryGreater(int TryVal, int CandVal,
2840 GenericSchedulerBase::SchedCandidate &TryCand,
2841 GenericSchedulerBase::SchedCandidate &Cand,
2842 GenericSchedulerBase::CandReason Reason) {
2843 if (TryVal > CandVal) {
2844 TryCand.Reason = Reason;
2845 return true;
2846 }
2847 if (TryVal < CandVal) {
2848 if (Cand.Reason > Reason)
2849 Cand.Reason = Reason;
2850 return true;
2851 }
2852 return false;
2853}
2854
2855bool tryLatency(GenericSchedulerBase::SchedCandidate &TryCand,
2856 GenericSchedulerBase::SchedCandidate &Cand,
2857 SchedBoundary &Zone) {
2858 if (Zone.isTop()) {
2859 // Prefer the candidate with the lesser depth, but only if one of them has
2860 // depth greater than the total latency scheduled so far, otherwise either
2861 // of them could be scheduled now with no stall.
2862 if (std::max(TryCand.SU->getDepth(), Cand.SU->getDepth()) >
2863 Zone.getScheduledLatency()) {
2864 if (tryLess(TryCand.SU->getDepth(), Cand.SU->getDepth(),
2865 TryCand, Cand, GenericSchedulerBase::TopDepthReduce))
2866 return true;
2867 }
2868 if (tryGreater(TryCand.SU->getHeight(), Cand.SU->getHeight(),
2869 TryCand, Cand, GenericSchedulerBase::TopPathReduce))
2870 return true;
2871 } else {
2872 // Prefer the candidate with the lesser height, but only if one of them has
2873 // height greater than the total latency scheduled so far, otherwise either
2874 // of them could be scheduled now with no stall.
2875 if (std::max(TryCand.SU->getHeight(), Cand.SU->getHeight()) >
2876 Zone.getScheduledLatency()) {
2877 if (tryLess(TryCand.SU->getHeight(), Cand.SU->getHeight(),
2878 TryCand, Cand, GenericSchedulerBase::BotHeightReduce))
2879 return true;
2880 }
2881 if (tryGreater(TryCand.SU->getDepth(), Cand.SU->getDepth(),
2882 TryCand, Cand, GenericSchedulerBase::BotPathReduce))
2883 return true;
2884 }
2885 return false;
2886}
2887} // end namespace llvm
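These helpers implement a fall-through protocol: a strict inequality decides the comparison and records the winning reason, while a tie returns false so the caller moves on to the next heuristic. A toy reimplementation of the cascade (simplified stand-in types, not the LLVM ones):

  #include <cstdio>

  // Smaller Reason values are higher priority, as in CandReason.
  enum Reason { NoCand, Stall, Order };

  struct Cand {
    int Stalls = 0;
    int NodeNum = 0;
    Reason Why = NoCand;
  };

  // Mirrors tryLess(): decide on a strict inequality, fall through on a tie.
  static bool tryLess(int TryVal, int CandVal, Cand &Try, Cand &C, Reason R) {
    if (TryVal < CandVal) { Try.Why = R; return true; }
    if (TryVal > CandVal) { if (C.Why > R) C.Why = R; return true; }
    return false;
  }

  // Mirrors the tryCandidate() shape: a decided comparison returns whether
  // Try actually won (its reason was written); ties fall back to node order.
  static bool betterCandidate(Cand &Try, Cand &C) {
    if (tryLess(Try.Stalls, C.Stalls, Try, C, Stall))
      return Try.Why != NoCand;
    Try.Why = Order;
    return Try.NodeNum < C.NodeNum;
  }

  int main() {
    Cand A{2, 0, NoCand}, B{1, 1, NoCand};
    std::printf("%d\n", betterCandidate(B, A)); // B stalls less: prints 1
  }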
2888
2889static void tracePick(GenericSchedulerBase::CandReason Reason, bool IsTop) {
2890 LLVM_DEBUG(dbgs() << "Pick " << (IsTop ? "Top " : "Bot ")
2891 << GenericSchedulerBase::getReasonStr(Reason) << '\n');
2892}
2893
2894static void tracePick(const GenericSchedulerBase::SchedCandidate &Cand) {
2895 tracePick(Cand.Reason, Cand.AtTop);
2896}
2897
2898void GenericScheduler::initialize(ScheduleDAGMI *dag) {
2899 assert(dag->hasVRegLiveness() &&
2900 "(PreRA)GenericScheduler needs vreg liveness");
2901 DAG = static_cast<ScheduleDAGMILive*>(dag);
2902 SchedModel = DAG->getSchedModel();
2903 TRI = DAG->TRI;
2904
2905 if (RegionPolicy.ComputeDFSResult)
2906 DAG->computeDFSResult();
2907
2908 Rem.init(DAG, SchedModel);
2909 Top.init(DAG, SchedModel, &Rem);
2910 Bot.init(DAG, SchedModel, &Rem);
2911
2912 // Initialize resource counts.
2913
2914 // Initialize the HazardRecognizers. If itineraries don't exist, are empty, or
2915 // are disabled, then these HazardRecs will be disabled.
2916 const InstrItineraryData *Itin = SchedModel->getInstrItineraries();
2917 if (!Top.HazardRec) {
2918 Top.HazardRec =
2919 DAG->MF.getSubtarget().getInstrInfo()->CreateTargetMIHazardRecognizer(
2920 Itin, DAG);
2921 }
2922 if (!Bot.HazardRec) {
2923 Bot.HazardRec =
2924 DAG->MF.getSubtarget().getInstrInfo()->CreateTargetMIHazardRecognizer(
2925 Itin, DAG);
2926 }
2927 TopCand.SU = nullptr;
2928 BotCand.SU = nullptr;
2929}
2930
2931/// Initialize the per-region scheduling policy.
2932void GenericScheduler::initPolicy(MachineBasicBlock::iterator Begin,
2933 MachineBasicBlock::iterator End,
2934 unsigned NumRegionInstrs) {
2935 const MachineFunction &MF = *Begin->getMF();
2936 const TargetLowering *TLI = MF.getSubtarget().getTargetLowering();
2937
2938 // Avoid setting up the register pressure tracker for small regions to save
2939 // compile time. As a rough heuristic, only track pressure when the number of
2940 // schedulable instructions exceeds half the integer register file.
2941 RegionPolicy.ShouldTrackPressure = true;
2942 for (unsigned VT = MVT::i32; VT > (unsigned)MVT::i1; --VT) {
2943 MVT::SimpleValueType LegalIntVT = (MVT::SimpleValueType)VT;
2944 if (TLI->isTypeLegal(LegalIntVT)) {
2945 unsigned NIntRegs = Context->RegClassInfo->getNumAllocatableRegs(
2946 TLI->getRegClassFor(LegalIntVT));
2947 RegionPolicy.ShouldTrackPressure = NumRegionInstrs > (NIntRegs / 2);
2948 }
2949 }
2950
2951 // For generic targets, we default to bottom-up, because it's simpler and more
2952 // compile-time optimizations have been implemented in that direction.
2953 RegionPolicy.OnlyBottomUp = true;
2954
2955 // Allow the subtarget to override default policy.
2956 MF.getSubtarget().overrideSchedPolicy(RegionPolicy, NumRegionInstrs);
2957
2958 // After subtarget overrides, apply command line options.
2959 if (!EnableRegPressure) {
2960 RegionPolicy.ShouldTrackPressure = false;
2961 RegionPolicy.ShouldTrackLaneMasks = false;
2962 }
2963
2964 // The -misched-topdown/bottomup flags can force or unforce the scheduling
2965 // direction; e.g. -misched-bottomup=false allows scheduling in both directions.
2966 assert((!ForceTopDown || !ForceBottomUp) &&
2967 "-misched-topdown incompatible with -misched-bottomup");
2968 if (ForceBottomUp.getNumOccurrences() > 0) {
2969 RegionPolicy.OnlyBottomUp = ForceBottomUp;
2970 if (RegionPolicy.OnlyBottomUp)
2971 RegionPolicy.OnlyTopDown = false;
2972 }
2973 if (ForceTopDown.getNumOccurrences() > 0) {
2974 RegionPolicy.OnlyTopDown = ForceTopDown;
2975 if (RegionPolicy.OnlyTopDown)
2976 RegionPolicy.OnlyBottomUp = false;
2977 }
2978}
2979
2980void GenericScheduler::dumpPolicy() const {
2981 // Cannot completely remove virtual function even in release mode.
2982#if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)
2983 dbgs() << "GenericScheduler RegionPolicy: "
2984 << " ShouldTrackPressure=" << RegionPolicy.ShouldTrackPressure
2985 << " OnlyTopDown=" << RegionPolicy.OnlyTopDown
2986 << " OnlyBottomUp=" << RegionPolicy.OnlyBottomUp
2987 << "\n";
2988#endif
2989}
2990
2991/// Set IsAcyclicLatencyLimited if the acyclic path is longer than the cyclic
2992/// critical path by more cycles than it takes to drain the instruction buffer.
2993/// We estimate an upper bound on in-flight instructions as:
2994///
2995/// CyclesPerIteration = max( CyclicPath, Loop-Resource-Height )
2996/// InFlightIterations = AcyclicPath / CyclesPerIteration
2997/// InFlightResources = InFlightIterations * LoopResources
2998///
2999/// TODO: Check execution resources in addition to IssueCount.
3000void GenericScheduler::checkAcyclicLatency() {
3001 if (Rem.CyclicCritPath == 0 || Rem.CyclicCritPath >= Rem.CriticalPath)
3002 return;
3003
3004 // Scaled number of cycles per loop iteration.
3005 unsigned IterCount =
3006 std::max(Rem.CyclicCritPath * SchedModel->getLatencyFactor(),
3007 Rem.RemIssueCount);
3008 // Scaled acyclic critical path.
3009 unsigned AcyclicCount = Rem.CriticalPath * SchedModel->getLatencyFactor();
3010 // InFlightCount = (AcyclicPath / IterCycles) * InstrPerLoop
3011 unsigned InFlightCount =
3012 (AcyclicCount * Rem.RemIssueCount + IterCount-1) / IterCount;
3013 unsigned BufferLimit =
3014 SchedModel->getMicroOpBufferSize() * SchedModel->getMicroOpFactor();
3015
3016 Rem.IsAcyclicLatencyLimited = InFlightCount > BufferLimit;
3017
3018 LLVM_DEBUG(
3019 dbgs() << "IssueCycles="
3020 << Rem.RemIssueCount / SchedModel->getLatencyFactor() << "c "
3021 << "IterCycles=" << IterCount / SchedModel->getLatencyFactor()
3022 << "c NumIters=" << (AcyclicCount + IterCount - 1) / IterCount
3023 << " InFlight=" << InFlightCount / SchedModel->getMicroOpFactor()
3024 << "m BufferLim=" << SchedModel->getMicroOpBufferSize() << "m\n";
3025 if (Rem.IsAcyclicLatencyLimited) dbgs() << " ACYCLIC LATENCY LIMIT\n");
3026}
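A small standalone computation makes the buffer check concrete (all values hypothetical; latency and micro-op factors taken as 1, so nothing is scaled):

  #include <algorithm>
  #include <cstdio>

  int main() {
    unsigned CyclicCritPath = 10, CriticalPath = 40; // cycles
    unsigned RemIssueCount = 20;                     // remaining micro-ops
    unsigned MicroOpBufferSize = 32;

    unsigned IterCount = std::max(CyclicCritPath, RemIssueCount); // 20
    unsigned AcyclicCount = CriticalPath;                         // 40
    unsigned InFlightCount =
        (AcyclicCount * RemIssueCount + IterCount - 1) / IterCount; // 40
    // 40 in-flight micro-ops exceed the 32-entry buffer, so this loop
    // would be flagged as acyclic latency limited.
    std::printf("%u > %u -> %d\n", InFlightCount, MicroOpBufferSize,
                InFlightCount > MicroOpBufferSize); // 40 > 32 -> 1
  }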
3027
3028void GenericScheduler::registerRoots() {
3029 Rem.CriticalPath = DAG->ExitSU.getDepth();
3030
3031 // Some roots may not feed into ExitSU. Check all of them in case.
3032 for (const SUnit *SU : Bot.Available) {
3033 if (SU->getDepth() > Rem.CriticalPath)
3034 Rem.CriticalPath = SU->getDepth();
3035 }
3036 LLVM_DEBUG(dbgs() << "Critical Path(GS-RR ): " << Rem.CriticalPath << '\n');
3037 if (DumpCriticalPathLength) {
3038 errs() << "Critical Path(GS-RR ): " << Rem.CriticalPath << " \n";
3039 }
3040
3041 if (EnableCyclicPath && SchedModel->getMicroOpBufferSize() > 0) {
3042 Rem.CyclicCritPath = DAG->computeCyclicCriticalPath();
3043 checkAcyclicLatency();
3044 }
3045}
3046
3047namespace llvm {
3048bool tryPressure(const PressureChange &TryP,
3049 const PressureChange &CandP,
3050 GenericSchedulerBase::SchedCandidate &TryCand,
3051 GenericSchedulerBase::SchedCandidate &Cand,
3052 GenericSchedulerBase::CandReason Reason,
3053 const TargetRegisterInfo *TRI,
3054 const MachineFunction &MF) {
3055 // If one candidate decreases and the other increases, go with it.
3056 // Invalid candidates have UnitInc==0.
3057 if (tryGreater(TryP.getUnitInc() < 0, CandP.getUnitInc() < 0, TryCand, Cand,
3058 Reason)) {
3059 return true;
3060 }
3061 // Do not compare the magnitude of pressure changes between top and bottom
3062 // boundary.
3063 if (Cand.AtTop != TryCand.AtTop)
3064 return false;
3065
3066 // If both candidates affect the same set in the same boundary, go with the
3067 // smallest increase.
3068 unsigned TryPSet = TryP.getPSetOrMax();
3069 unsigned CandPSet = CandP.getPSetOrMax();
3070 if (TryPSet == CandPSet) {
3071 return tryLess(TryP.getUnitInc(), CandP.getUnitInc(), TryCand, Cand,
3072 Reason);
3073 }
3074
3075 int TryRank = TryP.isValid() ? TRI->getRegPressureSetScore(MF, TryPSet) :
3076 std::numeric_limits<int>::max();
3077
3078 int CandRank = CandP.isValid() ? TRI->getRegPressureSetScore(MF, CandPSet) :
3079 std::numeric_limits<int>::max();
3080
3081 // If the candidates are decreasing pressure, reverse priority.
3082 if (TryP.getUnitInc() < 0)
3083 std::swap(TryRank, CandRank);
3084 return tryGreater(TryRank, CandRank, TryCand, Cand, Reason);
3085}
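Condensed, the decision order above is: sign of the pressure change, then magnitude within the same set, then the target's ranking of different sets (reversed when both candidates decrease pressure). A compressed sketch with plain values that collapses the real helper's tie/fall-through handling into booleans (hypothetical numbers, no LLVM types):

  #include <cstdio>
  #include <utility>

  // Toy version only: returns true if Try should win on pressure alone.
  static bool tryBetterPressure(int TryInc, unsigned TryPSet, int TryRank,
                                int CandInc, unsigned CandPSet, int CandRank) {
    if ((TryInc < 0) != (CandInc < 0))
      return TryInc < 0;            // a decrease always beats an increase
    if (TryPSet == CandPSet)
      return TryInc < CandInc;      // same set: smaller increase wins
    if (TryInc < 0)
      std::swap(TryRank, CandRank); // both decrease: reverse priority
    return TryRank > CandRank;      // otherwise compare set importance
  }

  int main() {
    // A decrease (-1) beats an increase (+2) regardless of the set.
    std::printf("%d\n", tryBetterPressure(-1, 0, 5, 2, 1, 9)); // prints 1
  }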
3086
3087unsigned getWeakLeft(const SUnit *SU, bool isTop) {
3088 return (isTop) ? SU->WeakPredsLeft : SU->WeakSuccsLeft;
3089}
3090
3091/// Minimize physical register live ranges. Regalloc wants them adjacent to
3092/// their physreg def/use.
3093///
3094/// FIXME: This is an unnecessary check on the critical path. Most are root/leaf
3095/// copies which can be prescheduled. The rest (e.g. x86 MUL) could be bundled
3096/// with the operation that produces or consumes the physreg. We'll do this when
3097/// regalloc has support for parallel copies.
3098int biasPhysReg(const SUnit *SU, bool isTop) {
3099 const MachineInstr *MI = SU->getInstr();
3100
3101 if (MI->isCopy()) {
3102 unsigned ScheduledOper = isTop ? 1 : 0;
3103 unsigned UnscheduledOper = isTop ? 0 : 1;
3104 // If we have already scheduled the physreg producer/consumer, immediately
3105 // schedule the copy.
3106 if (Register::isPhysicalRegister(MI->getOperand(ScheduledOper).getReg()))
3107 return 1;
3108 // If the physreg is at the boundary, defer it. Otherwise schedule it
3109 // immediately to free the dependent. We can hoist the copy later.
3110 bool AtBoundary = isTop ? !SU->NumSuccsLeft : !SU->NumPredsLeft;
3111 if (Register::isPhysicalRegister(MI->getOperand(UnscheduledOper).getReg()))
3112 return AtBoundary ? -1 : 1;
3113 }
3114
3115 if (MI->isMoveImmediate()) {
3116 // If we have a move immediate and all successors have been assigned, bias
3117 // towards scheduling this later. Make sure all register defs are to
3118 // physical registers.
3119 bool DoBias = true;
3120 for (const MachineOperand &Op : MI->defs()) {
3121 if (Op.isReg() && !Register::isPhysicalRegister(Op.getReg())) {
3122 DoBias = false;
3123 break;
3124 }
3125 }
3126
3127 if (DoBias)
3128 return isTop ? -1 : 1;
3129 }
3130
3131 return 0;
3132}
3133} // end namespace llvm
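The return value feeds tryGreater() in tryCandidate() below: +1 means schedule the node now, -1 means defer it, 0 expresses no opinion. A toy model of the COPY case, with hypothetical boolean flags standing in for the operand and boundary checks:

  #include <cstdio>

  // Toy model (hypothetical flags, not MachineInstr) of the three outcomes.
  static int biasCopy(bool ScheduledOperIsPhys, bool UnscheduledOperIsPhys,
                      bool AtBoundary) {
    if (ScheduledOperIsPhys)
      return 1;  // physreg side already scheduled: place the copy next to it
    if (UnscheduledOperIsPhys)
      return AtBoundary ? -1 : 1; // defer at the boundary, else free the user
    return 0;    // pure virtual-register copy: no bias
  }

  int main() {
    std::printf("%d %d %d\n", biasCopy(true, false, false),
                biasCopy(false, true, true), biasCopy(false, false, false));
    // prints: 1 -1 0
  }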
3134
3135void GenericScheduler::initCandidate(SchedCandidate &Cand, SUnit *SU,
3136 bool AtTop,
3137 const RegPressureTracker &RPTracker,
3138 RegPressureTracker &TempTracker) {
3139 Cand.SU = SU;
3140 Cand.AtTop = AtTop;
3141 if (DAG->isTrackingPressure()) {
3142 if (AtTop) {
3143 TempTracker.getMaxDownwardPressureDelta(
3144 Cand.SU->getInstr(),
3145 Cand.RPDelta,
3146 DAG->getRegionCriticalPSets(),
3147 DAG->getRegPressure().MaxSetPressure);
3148 } else {
3149 if (VerifyScheduling) {
3150 TempTracker.getMaxUpwardPressureDelta(
3151 Cand.SU->getInstr(),
3152 &DAG->getPressureDiff(Cand.SU),
3153 Cand.RPDelta,
3154 DAG->getRegionCriticalPSets(),
3155 DAG->getRegPressure().MaxSetPressure);
3156 } else {
3157 RPTracker.getUpwardPressureDelta(
3158 Cand.SU->getInstr(),
3159 DAG->getPressureDiff(Cand.SU),
3160 Cand.RPDelta,
3161 DAG->getRegionCriticalPSets(),
3162 DAG->getRegPressure().MaxSetPressure);
3163 }
3164 }
3165 }
3166 LLVM_DEBUG(if (Cand.RPDelta.Excess.isValid()) dbgs()
3167 << " Try SU(" << Cand.SU->NodeNum << ") "
3168 << TRI->getRegPressureSetName(Cand.RPDelta.Excess.getPSet()) << ":"
3169 << Cand.RPDelta.Excess.getUnitInc() << "\n");
3170}
3171
3172/// Apply a set of heuristics to a new candidate. Heuristics are currently
3173/// hierarchical. This may be more efficient than a graduated cost model because
3174/// we don't need to evaluate all aspects of the model for each node in the
3175/// queue. But it's really done to make the heuristics easier to debug and
3176/// statistically analyze.
3177///
3178/// \param Cand provides the policy and current best candidate.
3179/// \param TryCand refers to the next SUnit candidate, otherwise uninitialized.
3180/// \param Zone describes the scheduled zone that we are extending, or nullptr
3181/// if Cand is from a different zone than TryCand.
3182/// \return \c true if TryCand is better than Cand (Reason is NOT NoCand)
3183bool GenericScheduler::tryCandidate(SchedCandidate &Cand,
3184 SchedCandidate &TryCand,
3185 SchedBoundary *Zone) const {
3186 // Initialize the candidate if needed.
3187 if (!Cand.isValid()) {
3188 TryCand.Reason = NodeOrder;
3189 return true;
3190 }
3191
3192 // Bias physreg defs and copies towards their uses and definitions, respectively.
3193 if (tryGreater(biasPhysReg(TryCand.SU, TryCand.AtTop),
3194 biasPhysReg(Cand.SU, Cand.AtTop), TryCand, Cand, PhysReg))
3195 return TryCand.Reason != NoCand;
3196
3197 // Avoid exceeding the target's limit.
3198 if (DAG->isTrackingPressure() && tryPressure(TryCand.RPDelta.Excess,
3199 Cand.RPDelta.Excess,
3200 TryCand, Cand, RegExcess, TRI,
3201 DAG->MF))
3202 return TryCand.Reason != NoCand;
3203
3204 // Avoid increasing the max critical pressure in the scheduled region.
3205 if (DAG->isTrackingPressure() && tryPressure(TryCand.RPDelta.CriticalMax,
3206 Cand.RPDelta.CriticalMax,
3207 TryCand, Cand, RegCritical, TRI,
3208 DAG->MF))
3209 return TryCand.Reason != NoCand;
3210
3211 // We only compare a subset of features when comparing nodes between
3212 // Top and Bottom boundary. Some properties are simply incomparable; in many
3213 // other instances we should only override the other boundary if something
3214 // is a clear good pick on one boundary. Skip heuristics that are more
3215 // "tie-breaking" in nature.
3216 bool SameBoundary = Zone != nullptr;
3217 if (SameBoundary) {
3218 // For loops that are acyclic path limited, aggressively schedule for
3219 // latency. Within a single cycle, whenever CurrMOps > 0, allow normal
3220 // heuristics to take precedence.
3221 if (Rem.IsAcyclicLatencyLimited && !Zone->getCurrMOps() &&
3222 tryLatency(TryCand, Cand, *Zone))
3223 return TryCand.Reason != NoCand;
3224
3225 // Prioritize instructions that read unbuffered resources by stall cycles.
3226 if (tryLess(Zone->getLatencyStallCycles(TryCand.SU),
3227 Zone->getLatencyStallCycles(Cand.SU), TryCand, Cand, Stall))
3228 return TryCand.Reason != NoCand;
3229 }
3230
3231 // Keep clustered nodes together to encourage downstream peephole
3232 // optimizations which may reduce resource requirements.
3233 //
3234 // This is a best effort to set things up for a post-RA pass. Optimizations
3235 // like generating loads of multiple registers should ideally be done within
3236 // the scheduler pass by combining the loads during DAG postprocessing.
3237 const SUnit *CandNextClusterSU =
3238 Cand.AtTop ? DAG->getNextClusterSucc() : DAG->getNextClusterPred();
3239 const SUnit *TryCandNextClusterSU =
3240 TryCand.AtTop ? DAG->getNextClusterSucc() : DAG->getNextClusterPred();
3241 if (tryGreater(TryCand.SU == TryCandNextClusterSU,
3242 Cand.SU == CandNextClusterSU,
3243 TryCand, Cand, Cluster))
3244 return TryCand.Reason != NoCand;
3245
3246 if (SameBoundary) {
3247 // Weak edges are for clustering and other constraints.
3248 if (tryLess(getWeakLeft(TryCand.SU, TryCand.AtTop),
3249 getWeakLeft(Cand.SU, Cand.AtTop),
3250 TryCand, Cand, Weak))
3251 return TryCand.Reason != NoCand;
3252 }
3253
3254 // Avoid increasing the max pressure of the entire region.
3255 if (DAG->isTrackingPressure() && tryPressure(TryCand.RPDelta.CurrentMax,
3256 Cand.RPDelta.CurrentMax,
3257 TryCand, Cand, RegMax, TRI,
3258 DAG->MF))
3259 return TryCand.Reason != NoCand;
3260
3261 if (SameBoundary) {
3262 // Avoid critical resource consumption and balance the schedule.
3263 TryCand.initResourceDelta(DAG, SchedModel);
3264 if (tryLess(TryCand.ResDelta.CritResources, Cand.ResDelta.CritResources,
3265 TryCand, Cand, ResourceReduce))
3266 return TryCand.Reason != NoCand;
3267 if (tryGreater(TryCand.ResDelta.DemandedResources,
3268 Cand.ResDelta.DemandedResources,
3269 TryCand, Cand, ResourceDemand))
3270 return TryCand.Reason != NoCand;
3271
3272 // Avoid serializing long latency dependence chains.
3273 // For acyclic path limited loops, latency was already checked above.
3274 if (!RegionPolicy.DisableLatencyHeuristic && TryCand.Policy.ReduceLatency &&
3275 !Rem.IsAcyclicLatencyLimited && tryLatency(TryCand, Cand, *Zone))
3276 return TryCand.Reason != NoCand;
3277
3278 // Fall through to original instruction order.
3279 if ((Zone->isTop() && TryCand.SU->NodeNum < Cand.SU->NodeNum)
3280 || (!Zone->isTop() && TryCand.SU->NodeNum > Cand.SU->NodeNum)) {
3281 TryCand.Reason = NodeOrder;
3282 return true;
3283 }
3284 }
3285
3286 return false;
3287}
3288
3289/// Pick the best candidate from the queue.
3290///
3291/// TODO: getMaxPressureDelta results can be mostly cached for each SUnit during
3292/// DAG building. To adjust for the current scheduling location we need to
3293/// maintain the number of vreg uses remaining to be top-scheduled.
3294void GenericScheduler::pickNodeFromQueue(SchedBoundary &Zone,
3295 const CandPolicy &ZonePolicy,
3296 const RegPressureTracker &RPTracker,
3297 SchedCandidate &Cand) {
3298 // getMaxPressureDelta temporarily modifies the tracker.
3299 RegPressureTracker &TempTracker = const_cast<RegPressureTracker&>(RPTracker);
3300
3301 ReadyQueue &Q = Zone.Available;
3302 for (SUnit *SU : Q) {
3303
3304 SchedCandidate TryCand(ZonePolicy);
3305 initCandidate(TryCand, SU, Zone.isTop(), RPTracker, TempTracker);
3306 // Pass SchedBoundary only when comparing nodes from the same boundary.
3307 SchedBoundary *ZoneArg = Cand.AtTop == TryCand.AtTop ? &Zone : nullptr;
3308 if (tryCandidate(Cand, TryCand, ZoneArg)) {
3309 // Initialize resource delta if needed in case future heuristics query it.
3310 if (TryCand.ResDelta == SchedResourceDelta())
3311 TryCand.initResourceDelta(DAG, SchedModel);
3312 Cand.setBest(TryCand);
3313 LLVM_DEBUG(traceCandidate(Cand));
3314 }
3315 }
3316}
3317
3318/// Pick the best candidate node from either the top or bottom queue.
3319SUnit *GenericScheduler::pickNodeBidirectional(bool &IsTopNode) {
3320 // Schedule as far as possible in the direction of no choice. This is most
3321 // efficient, but also provides the best heuristics for CriticalPSets.
3322 if (SUnit *SU = Bot.pickOnlyChoice()) {
3323 IsTopNode = false;
3324 tracePick(Only1, false);
3325 return SU;
3326 }
3327 if (SUnit *SU = Top.pickOnlyChoice()) {
3328 IsTopNode = true;
3329 tracePick(Only1, true);
3330 return SU;
3331 }
3332 // Set the bottom-up policy based on the state of the current bottom zone and
3333 // the instructions outside the zone, including the top zone.
3334 CandPolicy BotPolicy;
3335 setPolicy(BotPolicy, /*IsPostRA=*/false, Bot, &Top);
3336 // Set the top-down policy based on the state of the current top zone and
3337 // the instructions outside the zone, including the bottom zone.
3338 CandPolicy TopPolicy;
3339 setPolicy(TopPolicy, /*IsPostRA=*/false, Top, &Bot);
3340
3341 // See if BotCand is still valid (because we previously scheduled from Top).
3342 LLVM_DEBUG(dbgs() << "Picking from Bot:\n");
3343 if (!BotCand.isValid() || BotCand.SU->isScheduled ||
3344 BotCand.Policy != BotPolicy) {
3345 BotCand.reset(CandPolicy());
3346 pickNodeFromQueue(Bot, BotPolicy, DAG->getBotRPTracker(), BotCand);
3347 assert(BotCand.Reason != NoCand && "failed to find the first candidate");
3348 } else {
3349 LLVM_DEBUG(traceCandidate(BotCand));
3350#ifndef NDEBUG
3351 if (VerifyScheduling) {
3352 SchedCandidate TCand;
3353 TCand.reset(CandPolicy());
3354 pickNodeFromQueue(Bot, BotPolicy, DAG->getBotRPTracker(), TCand);
3355 assert(TCand.SU == BotCand.SU &&
3356 "Last pick result should correspond to re-picking right now");
3357 }
3358#endif
3359 }
3360
3361 // Check if the top Q has a better candidate.
3362 LLVM_DEBUG(dbgs() << "Picking from Top:\n");
3363 if (!TopCand.isValid() || TopCand.SU->isScheduled ||
3364 TopCand.Policy != TopPolicy) {
3365 TopCand.reset(CandPolicy());
3366 pickNodeFromQueue(Top, TopPolicy, DAG->getTopRPTracker(), TopCand);
3367 assert(TopCand.Reason != NoCand && "failed to find the first candidate");
3368 } else {
3369 LLVM_DEBUG(traceCandidate(TopCand));
3370#ifndef NDEBUG
3371 if (VerifyScheduling) {
3372 SchedCandidate TCand;
3373 TCand.reset(CandPolicy());
3374 pickNodeFromQueue(Top, TopPolicy, DAG->getTopRPTracker(), TCand);
3375 assert(TCand.SU == TopCand.SU &&
3376 "Last pick result should correspond to re-picking right now");
3377 }
3378#endif
3379 }
3380
3381 // Pick best from BotCand and TopCand.
3382 assert(BotCand.isValid());
3383 assert(TopCand.isValid());
3384 SchedCandidate Cand = BotCand;
3385 TopCand.Reason = NoCand;
3386 if (tryCandidate(Cand, TopCand, nullptr)) {
3387 Cand.setBest(TopCand);
3388 LLVM_DEBUG(traceCandidate(Cand));
3389 }
3390
3391 IsTopNode = Cand.AtTop;
3392 tracePick(Cand);
3393 return Cand.SU;
3394}
3395
3396/// Pick the best node to balance the schedule. Implements MachineSchedStrategy.
3397SUnit *GenericScheduler::pickNode(bool &IsTopNode) {
3398 if (DAG->top() == DAG->bottom()) {
3399 assert(Top.Available.empty() && Top.Pending.empty() &&
3400 Bot.Available.empty() && Bot.Pending.empty() && "ReadyQ garbage");
3401 return nullptr;
3402 }
3403 SUnit *SU;
3404 do {
3405 if (RegionPolicy.OnlyTopDown) {
3406 SU = Top.pickOnlyChoice();
3407 if (!SU) {
3408 CandPolicy NoPolicy;
3409 TopCand.reset(NoPolicy);
3410 pickNodeFromQueue(Top, NoPolicy, DAG->getTopRPTracker(), TopCand);
3411 assert(TopCand.Reason != NoCand && "failed to find a candidate");
3412 tracePick(TopCand);
3413 SU = TopCand.SU;
3414 }
3415 IsTopNode = true;
3416 } else if (RegionPolicy.OnlyBottomUp) {
3417 SU = Bot.pickOnlyChoice();
3418 if (!SU) {
3419 CandPolicy NoPolicy;
3420 BotCand.reset(NoPolicy);
3421 pickNodeFromQueue(Bot, NoPolicy, DAG->getBotRPTracker(), BotCand);
3422 assert(BotCand.Reason != NoCand && "failed to find a candidate");
3423 tracePick(BotCand);
3424 SU = BotCand.SU;
3425 }
3426 IsTopNode = false;
3427 } else {
3428 SU = pickNodeBidirectional(IsTopNode);
3429 }
3430 } while (SU->isScheduled);
3431
3432 if (SU->isTopReady())
3433 Top.removeReady(SU);
3434 if (SU->isBottomReady())
3435 Bot.removeReady(SU);
3436
3437 LLVM_DEBUG(dbgs() << "Scheduling SU(" << SU->NodeNum << ") "
3438 << *SU->getInstr());
3439 return SU;
3440}
3441
3442void GenericScheduler::reschedulePhysReg(SUnit *SU, bool isTop) {
3443 MachineBasicBlock::iterator InsertPos = SU->getInstr();
3444 if (!isTop)
3445 ++InsertPos;
3446 SmallVectorImpl<SDep> &Deps = isTop ? SU->Preds : SU->Succs;
3447
3448 // Find already scheduled copies with a single physreg dependence and move
3449 // them just above the scheduled instruction.
3450 for (SDep &Dep : Deps) {
3451 if (Dep.getKind() != SDep::Data ||
3452 !Register::isPhysicalRegister(Dep.getReg()))
3453 continue;
3454 SUnit *DepSU = Dep.getSUnit();
3455 if (isTop ? DepSU->Succs.size() > 1 : DepSU->Preds.size() > 1)
3456 continue;
3457 MachineInstr *Copy = DepSU->getInstr();
3458 if (!Copy->isCopy() && !Copy->isMoveImmediate())
3459 continue;
3460 LLVM_DEBUG(dbgs() << " Rescheduling physreg copy ";
3461 DAG->dumpNode(*Dep.getSUnit()));
3462 DAG->moveInstruction(Copy, InsertPos);
3463 }
3464}
3465
3466/// Update the scheduler's state after scheduling a node. This is the same node
3467/// that was just returned by pickNode(). However, ScheduleDAGMILive needs to
3468/// update its state based on the current cycle before MachineSchedStrategy
3469/// does.
3470///
3471/// FIXME: Eventually, we may bundle physreg copies rather than rescheduling
3472/// them here. See comments in biasPhysReg.
3473void GenericScheduler::schedNode(SUnit *SU, bool IsTopNode) {
3474 if (IsTopNode) {
3475 SU->TopReadyCycle = std::max(SU->TopReadyCycle, Top.getCurrCycle());
3476 Top.bumpNode(SU);
3477 if (SU->hasPhysRegUses)
3478 reschedulePhysReg(SU, true);
3479 } else {
3480 SU->BotReadyCycle = std::max(SU->BotReadyCycle, Bot.getCurrCycle());
3481 Bot.bumpNode(SU);
3482 if (SU->hasPhysRegDefs)
3483 reschedulePhysReg(SU, false);
3484 }
3485}
3486
3487/// Create the standard converging machine scheduler. This will be used as the
3488/// default scheduler if the target does not set a default.
3489ScheduleDAGMILive *llvm::createGenericSchedLive(MachineSchedContext *C) {
3490 ScheduleDAGMILive *DAG =
3491 new ScheduleDAGMILive(C, std::make_unique<GenericScheduler>(C));
3492 // Register DAG post-processors.
3493 //
3494 // FIXME: extend the mutation API to allow earlier mutations to instantiate
3495 // data and pass it to later mutations. Have a single mutation that gathers
3496 // the interesting nodes in one pass.
3497 DAG->addMutation(createCopyConstrainDAGMutation(DAG->TII, DAG->TRI));
3498 return DAG;
3499}
3500
3501static ScheduleDAGInstrs *createConvergingSched(MachineSchedContext *C) {
3502 return createGenericSchedLive(C);
3503}
3504
3505static MachineSchedRegistry
3506GenericSchedRegistry("converge", "Standard converging scheduler.",
3507 createConvergingSched);
3508
3509//===----------------------------------------------------------------------===//
3510// PostGenericScheduler - Generic PostRA implementation of MachineSchedStrategy.
3511//===----------------------------------------------------------------------===//
3512
3513void PostGenericScheduler::initialize(ScheduleDAGMI *Dag) {
3514 DAG = Dag;
3515 SchedModel = DAG->getSchedModel();
3516 TRI = DAG->TRI;
3517
3518 Rem.init(DAG, SchedModel);
3519 Top.init(DAG, SchedModel, &Rem);
3520 BotRoots.clear();
3521
3522 // Initialize the HazardRecognizers. If itineraries don't exist, are empty,
3523 // or are disabled, then these HazardRecs will be disabled.
3524 const InstrItineraryData *Itin = SchedModel->getInstrItineraries();
3525 if (!Top.HazardRec) {
3526 Top.HazardRec =
3527 DAG->MF.getSubtarget().getInstrInfo()->CreateTargetMIHazardRecognizer(
3528 Itin, DAG);
3529 }
3530}
3531
3532void PostGenericScheduler::registerRoots() {
3533 Rem.CriticalPath = DAG->ExitSU.getDepth();
3534
3535 // Some roots may not feed into ExitSU. Check all of them in case.
3536 for (const SUnit *SU : BotRoots) {
3537 if (SU->getDepth() > Rem.CriticalPath)
3538 Rem.CriticalPath = SU->getDepth();
3539 }
3540 LLVM_DEBUG(dbgs() << "Critical Path: (PGS-RR) " << Rem.CriticalPath << '\n');
3541 if (DumpCriticalPathLength) {
3542 errs() << "Critical Path(PGS-RR ): " << Rem.CriticalPath << " \n";
3543 }
3544}
3545
3546/// Apply a set of heuristics to a new candidate for PostRA scheduling.
3547///
3548/// \param Cand provides the policy and current best candidate.
3549/// \param TryCand refers to the next SUnit candidate, otherwise uninitialized.
3550/// \return \c true if TryCand is better than Cand (Reason is NOT NoCand)
3551bool PostGenericScheduler::tryCandidate(SchedCandidate &Cand,
3552 SchedCandidate &TryCand) {
3553 // Initialize the candidate if needed.
3554 if (!Cand.isValid()) {
3555 TryCand.Reason = NodeOrder;
3556 return true;
3557 }
3558
3559 // Prioritize instructions that read unbuffered resources by stall cycles.
3560 if (tryLess(Top.getLatencyStallCycles(TryCand.SU),
3561 Top.getLatencyStallCycles(Cand.SU), TryCand, Cand, Stall))
3562 return TryCand.Reason != NoCand;
3563
3564 // Keep clustered nodes together.
3565 if (tryGreater(TryCand.SU == DAG->getNextClusterSucc(),
3566 Cand.SU == DAG->getNextClusterSucc(),
3567 TryCand, Cand, Cluster))
3568 return TryCand.Reason != NoCand;
3569
3570 // Avoid critical resource consumption and balance the schedule.
3571 if (tryLess(TryCand.ResDelta.CritResources, Cand.ResDelta.CritResources,
3572 TryCand, Cand, ResourceReduce))
3573 return TryCand.Reason != NoCand;
3574 if (tryGreater(TryCand.ResDelta.DemandedResources,
3575 Cand.ResDelta.DemandedResources,
3576 TryCand, Cand, ResourceDemand))
3577 return TryCand.Reason != NoCand;
3578
3579 // Avoid serializing long latency dependence chains.
3580 if (Cand.Policy.ReduceLatency && tryLatency(TryCand, Cand, Top)) {
3581 return TryCand.Reason != NoCand;
3582 }
3583
3584 // Fall through to original instruction order.
3585 if (TryCand.SU->NodeNum < Cand.SU->NodeNum) {
3586 TryCand.Reason = NodeOrder;
3587 return true;
3588 }
3589
3590 return false;
3591}
3592
3593void PostGenericScheduler::pickNodeFromQueue(SchedCandidate &Cand) {
3594 ReadyQueue &Q = Top.Available;
3595 for (SUnit *SU : Q) {
3596 SchedCandidate TryCand(Cand.Policy);
3597 TryCand.SU = SU;
3598 TryCand.AtTop = true;
3599 TryCand.initResourceDelta(DAG, SchedModel);
3600 if (tryCandidate(Cand, TryCand)) {
3601 Cand.setBest(TryCand);
3602 LLVM_DEBUG(traceCandidate(Cand))do { } while (false);
3603 }
3604 }
3605}
27
Returning without writing to 'Cand.SU'
3606
3607/// Pick the next node to schedule.
3608SUnit *PostGenericScheduler::pickNode(bool &IsTopNode) {
3609 if (DAG->top() == DAG->bottom()) {
1
Calling 'operator=='
7
Returning from 'operator=='
8
Taking false branch
3610 assert(Top.Available.empty() && Top.Pending.empty() && "ReadyQ garbage");
3611 return nullptr;
3612 }
3613 SUnit *SU;
3614 do {
3615 SU = Top.pickOnlyChoice();
9
Calling 'SchedBoundary::pickOnlyChoice'
19
Returning from 'SchedBoundary::pickOnlyChoice'
3616 if (SU) {
19.1
'SU' is null
20
Taking false branch
3617 tracePick(Only1, true);
3618 } else {
3619 CandPolicy NoPolicy;
3620 SchedCandidate TopCand(NoPolicy);
21
Calling constructor for 'SchedCandidate'
25
Returning from constructor for 'SchedCandidate'
3621 // Set the top-down policy based on the state of the current top zone and
3622 // the instructions outside the zone, including the bottom zone.
3623 setPolicy(TopCand.Policy, /*IsPostRA=*/true, Top, nullptr);
3624 pickNodeFromQueue(TopCand);
26
Calling 'PostGenericScheduler::pickNodeFromQueue'
28
Returning from 'PostGenericScheduler::pickNodeFromQueue'
3625 assert(TopCand.Reason != NoCand && "failed to find a candidate");
3626 tracePick(TopCand);
3627 SU = TopCand.SU;
29
Null pointer value stored to 'SU'
3628 }
3629 } while (SU->isScheduled);
30
Access to field 'isScheduled' results in a dereference of a null pointer (loaded from variable 'SU')
3630
3631 IsTopNode = true;
3632 Top.removeReady(SU);
3633
3634 LLVM_DEBUG(dbgs() << "Scheduling SU(" << SU->NodeNum << ") "
3635 << *SU->getInstr());
3636 return SU;
3637}
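This loop is the subject of the report: when pickOnlyChoice() returns null (step 19.1) and pickNodeFromQueue() returns without writing Cand.SU (step 27), the assert is compiled away under NDEBUG and the loop condition dereferences the null SU (step 30). A minimal hardening sketch, assuming an empty Available queue really can reach this point; the in-tree code instead relies on the invariant that a candidate always exists here, which the analyzer cannot prove:

  SUnit *SU;
  do {
    SU = Top.pickOnlyChoice();
    if (SU) {
      tracePick(Only1, true);
    } else {
      CandPolicy NoPolicy;
      SchedCandidate TopCand(NoPolicy);
      setPolicy(TopCand.Policy, /*IsPostRA=*/true, Top, nullptr);
      pickNodeFromQueue(TopCand);
      assert(TopCand.Reason != NoCand && "failed to find a candidate");
      // Guard the dereference explicitly: the assert above is a no-op in
      // release builds, so a null candidate must not reach SU->isScheduled.
      if (!TopCand.SU)
        return nullptr; // hypothetical bail-out for an empty ready queue
      tracePick(TopCand);
      SU = TopCand.SU;
    }
  } while (SU->isScheduled);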
3638
3639/// Called after ScheduleDAGMI has scheduled an instruction and updated
3640/// scheduled/remaining flags in the DAG nodes.
3641void PostGenericScheduler::schedNode(SUnit *SU, bool IsTopNode) {
3642 SU->TopReadyCycle = std::max(SU->TopReadyCycle, Top.getCurrCycle());
3643 Top.bumpNode(SU);
3644}
3645
3646ScheduleDAGMI *llvm::createGenericSchedPostRA(MachineSchedContext *C) {
3647 return new ScheduleDAGMI(C, std::make_unique<PostGenericScheduler>(C),
3648 /*RemoveKillFlags=*/true);
3649}
3650
3651//===----------------------------------------------------------------------===//
3652// ILP Scheduler. Currently for experimental analysis of heuristics.
3653//===----------------------------------------------------------------------===//
3654
3655namespace {
3656
3657/// Order nodes by the ILP metric.
3658struct ILPOrder {
3659 const SchedDFSResult *DFSResult = nullptr;
3660 const BitVector *ScheduledTrees = nullptr;
3661 bool MaximizeILP;
3662
3663 ILPOrder(bool MaxILP) : MaximizeILP(MaxILP) {}
3664
3665 /// Apply a less-than relation on node priority.
3666 ///
3667 /// (Return true if A comes after B in the Q.)
3668 bool operator()(const SUnit *A, const SUnit *B) const {
3669 unsigned SchedTreeA = DFSResult->getSubtreeID(A);
3670 unsigned SchedTreeB = DFSResult->getSubtreeID(B);
3671 if (SchedTreeA != SchedTreeB) {
3672 // Unscheduled trees have lower priority.
3673 if (ScheduledTrees->test(SchedTreeA) != ScheduledTrees->test(SchedTreeB))
3674 return ScheduledTrees->test(SchedTreeB);
3675
3676 // Trees with shallower connections have lower priority.
3677 if (DFSResult->getSubtreeLevel(SchedTreeA)
3678 != DFSResult->getSubtreeLevel(SchedTreeB)) {
3679 return DFSResult->getSubtreeLevel(SchedTreeA)
3680 < DFSResult->getSubtreeLevel(SchedTreeB);
3681 }
3682 }
3683 if (MaximizeILP)
3684 return DFSResult->getILP(A) < DFSResult->getILP(B);
3685 else
3686 return DFSResult->getILP(A) > DFSResult->getILP(B);
3687 }
3688};
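Because ILPOrder is a less-than relation, the ILPScheduler below can keep ReadyQ as a std::make_heap/std::pop_heap max-heap and take the highest-priority node from the back. A toy illustration with plain ints in place of SUnit pointers:

  #include <algorithm>
  #include <cstdio>
  #include <vector>

  int main() {
    std::vector<int> ReadyQ = {3, 9, 4, 7};
    auto Cmp = [](int A, int B) { return A < B; }; // "maximize ILP"
    std::make_heap(ReadyQ.begin(), ReadyQ.end(), Cmp);
    std::pop_heap(ReadyQ.begin(), ReadyQ.end(), Cmp); // max moves to back
    std::printf("picked %d\n", ReadyQ.back());        // picked 9
    ReadyQ.pop_back(); // same pop_heap/back/pop_back shape as pickNode()
  }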
3689
3690/// Schedule based on the ILP metric.
3691class ILPScheduler : public MachineSchedStrategy {
3692 ScheduleDAGMILive *DAG = nullptr;
3693 ILPOrder Cmp;
3694
3695 std::vector<SUnit*> ReadyQ;
3696
3697public:
3698 ILPScheduler(bool MaximizeILP) : Cmp(MaximizeILP) {}
3699
3700 void initialize(ScheduleDAGMI *dag) override {
3701 assert(dag->hasVRegLiveness() && "ILPScheduler needs vreg liveness");
3702 DAG = static_cast<ScheduleDAGMILive*>(dag);
3703 DAG->computeDFSResult();
3704 Cmp.DFSResult = DAG->getDFSResult();
3705 Cmp.ScheduledTrees = &DAG->getScheduledTrees();
3706 ReadyQ.clear();
3707 }
3708
3709 void registerRoots() override {
3710 // Restore the heap in ReadyQ with the updated DFS results.
3711 std::make_heap(ReadyQ.begin(), ReadyQ.end(), Cmp);
3712 }
3713
3714 /// Implement MachineSchedStrategy interface.
3715 /// -----------------------------------------
3716
3717 /// Callback to select the highest priority node from the ready Q.
3718 SUnit *pickNode(bool &IsTopNode) override {
3719 if (ReadyQ.empty()) return nullptr;
3720 std::pop_heap(ReadyQ.begin(), ReadyQ.end(), Cmp);
3721 SUnit *SU = ReadyQ.back();
3722 ReadyQ.pop_back();
3723 IsTopNode = false;
3724 LLVM_DEBUG(dbgs() << "Pick node "
3725 << "SU(" << SU->NodeNum << ") "
3726 << " ILP: " << DAG->getDFSResult()->getILP(SU)
3727 << " Tree: " << DAG->getDFSResult()->getSubtreeID(SU)
3728 << " @"
3729 << DAG->getDFSResult()->getSubtreeLevel(
3730 DAG->getDFSResult()->getSubtreeID(SU))
3731 << '\n'
3732 << "Scheduling " << *SU->getInstr());
3733 return SU;
3734 }
3735
3736 /// Scheduler callback to notify that a new subtree is scheduled.
3737 void scheduleTree(unsigned SubtreeID) override {
3738 std::make_heap(ReadyQ.begin(), ReadyQ.end(), Cmp);
3739 }
3740
3741 /// Callback after a node is scheduled. Mark a newly scheduled tree, notify
3742 /// DFSResults, and resort the priority Q.
3743 void schedNode(SUnit *SU, bool IsTopNode) override {
3744 assert(!IsTopNode && "SchedDFSResult needs bottom-up");
3745 }
3746
3747 void releaseTopNode(SUnit *) override { /*only called for top roots*/ }
3748
3749 void releaseBottomNode(SUnit *SU) override {
3750 ReadyQ.push_back(SU);
3751 std::push_heap(ReadyQ.begin(), ReadyQ.end(), Cmp);
3752 }
3753};
3754
3755} // end anonymous namespace
3756
3757static ScheduleDAGInstrs *createILPMaxScheduler(MachineSchedContext *C) {
3758 return new ScheduleDAGMILive(C, std::make_unique<ILPScheduler>(true));
3759}
3760static ScheduleDAGInstrs *createILPMinScheduler(MachineSchedContext *C) {
3761 return new ScheduleDAGMILive(C, std::make_unique<ILPScheduler>(false));
3762}
3763
3764static MachineSchedRegistry ILPMaxRegistry(
3765 "ilpmax", "Schedule bottom-up for max ILP", createILPMaxScheduler);
3766static MachineSchedRegistry ILPMinRegistry(
3767 "ilpmin", "Schedule bottom-up for min ILP", createILPMinScheduler);
3768
3769//===----------------------------------------------------------------------===//
3770// Machine Instruction Shuffler for Correctness Testing
3771//===----------------------------------------------------------------------===//
3772
3773#ifndef NDEBUG
3774namespace {
3775
3776/// Apply a less-than relation on the node order, which corresponds to the
3777/// instruction order prior to scheduling. IsReverse implements greater-than.
3778template<bool IsReverse>
3779struct SUnitOrder {
3780 bool operator()(SUnit *A, SUnit *B) const {
3781 if (IsReverse)
3782 return A->NodeNum > B->NodeNum;
3783 else
3784 return A->NodeNum < B->NodeNum;
3785 }
3786};
3787
3788/// Reorder instructions as much as possible.
3789class InstructionShuffler : public MachineSchedStrategy {
3790 bool IsAlternating;
3791 bool IsTopDown;
3792
3793 // Using a less-than relation (SUnitOrder<false>) for the TopQ priority
3794 // gives nodes with a higher number higher priority, causing the latest
3795 // instructions to be scheduled first.
3796 PriorityQueue<SUnit*, std::vector<SUnit*>, SUnitOrder<false>>
3797 TopQ;
3798
3799 // When scheduling bottom-up, use greater-than as the queue priority.
3800 PriorityQueue<SUnit*, std::vector<SUnit*>, SUnitOrder<true>>
3801 BottomQ;
3802
3803public:
3804 InstructionShuffler(bool alternate, bool topdown)
3805 : IsAlternating(alternate), IsTopDown(topdown) {}
3806
3807 void initialize(ScheduleDAGMI*) override {
3808 TopQ.clear();
3809 BottomQ.clear();
3810 }
3811
3812 /// Implement MachineSchedStrategy interface.
3813 /// -----------------------------------------
3814
3815 SUnit *pickNode(bool &IsTopNode) override {
3816 SUnit *SU;
3817 if (IsTopDown) {
3818 do {
3819 if (TopQ.empty()) return nullptr;
3820 SU = TopQ.top();
3821 TopQ.pop();
3822 } while (SU->isScheduled);
3823 IsTopNode = true;
3824 } else {
3825 do {
3826 if (BottomQ.empty()) return nullptr;
3827 SU = BottomQ.top();
3828 BottomQ.pop();
3829 } while (SU->isScheduled);
3830 IsTopNode = false;
3831 }
3832 if (IsAlternating)
3833 IsTopDown = !IsTopDown;
3834 return SU;
3835 }
3836
3837 void schedNode(SUnit *SU, bool IsTopNode) override {}
3838
3839 void releaseTopNode(SUnit *SU) override {
3840 TopQ.push(SU);
3841 }
3842 void releaseBottomNode(SUnit *SU) override {
3843 BottomQ.push(SU);
3844 }
3845};
3846
3847} // end anonymous namespace
3848
3849static ScheduleDAGInstrs *createInstructionShuffler(MachineSchedContext *C) {
3850 bool Alternate = !ForceTopDown && !ForceBottomUp;
3851 bool TopDown = !ForceBottomUp;
3852 assert((TopDown || !ForceTopDown) &&
3853 "-misched-topdown incompatible with -misched-bottomup");
3854 return new ScheduleDAGMILive(
3855 C, std::make_unique<InstructionShuffler>(Alternate, TopDown));
3856}
3857
3858static MachineSchedRegistry ShufflerRegistry(
3859 "shuffle", "Shuffle machine instructions alternating directions",
3860 createInstructionShuffler);
3861#endif // !NDEBUG
3862
3863//===----------------------------------------------------------------------===//
3864// GraphWriter support for ScheduleDAGMILive.
3865//===----------------------------------------------------------------------===//
3866
3867#ifndef NDEBUG
3868namespace llvm {
3869
3870template<> struct GraphTraits<
3871 ScheduleDAGMI*> : public GraphTraits<ScheduleDAG*> {};
3872
3873template<>
3874struct DOTGraphTraits<ScheduleDAGMI*> : public DefaultDOTGraphTraits {
3875 DOTGraphTraits(bool isSimple = false) : DefaultDOTGraphTraits(isSimple) {}
3876
3877 static std::string getGraphName(const ScheduleDAG *G) {
3878 return std::string(G->MF.getName());
3879 }
3880
3881 static bool renderGraphFromBottomUp() {
3882 return true;
3883 }
3884
3885 static bool isNodeHidden(const SUnit *Node, const ScheduleDAG *G) {
3886 if (ViewMISchedCutoff == 0)
3887 return false;
3888 return (Node->Preds.size() > ViewMISchedCutoff
3889 || Node->Succs.size() > ViewMISchedCutoff);
3890 }
3891
3892 /// If you want to override the dot attributes printed for a particular
3893 /// edge, override this method.
3894 static std::string getEdgeAttributes(const SUnit *Node,
3895 SUnitIterator EI,
3896 const ScheduleDAG *Graph) {
3897 if (EI.isArtificialDep())
3898 return "color=cyan,style=dashed";
3899 if (EI.isCtrlDep())
3900 return "color=blue,style=dashed";
3901 return "";
3902 }
3903
3904 static std::string getNodeLabel(const SUnit *SU, const ScheduleDAG *G) {
3905 std::string Str;
3906 raw_string_ostream SS(Str);
3907 const ScheduleDAGMI *DAG = static_cast<const ScheduleDAGMI*>(G);
3908 const SchedDFSResult *DFS = DAG->hasVRegLiveness() ?
3909 static_cast<const ScheduleDAGMILive*>(G)->getDFSResult() : nullptr;
3910 SS << "SU:" << SU->NodeNum;
3911 if (DFS)
3912 SS << " I:" << DFS->getNumInstrs(SU);
3913 return SS.str();
3914 }
3915
3916 static std::string getNodeDescription(const SUnit *SU, const ScheduleDAG *G) {
3917 return G->getGraphNodeLabel(SU);
3918 }
3919
3920 static std::string getNodeAttributes(const SUnit *N, const ScheduleDAG *G) {
3921 std::string Str("shape=Mrecord");
3922 const ScheduleDAGMI *DAG = static_cast<const ScheduleDAGMI*>(G);
3923 const SchedDFSResult *DFS = DAG->hasVRegLiveness() ?
3924 static_cast<const ScheduleDAGMILive*>(G)->getDFSResult() : nullptr;
3925 if (DFS) {
3926 Str += ",style=filled,fillcolor=\"#";
3927 Str += DOT::getColorString(DFS->getSubtreeID(N));
3928 Str += '"';
3929 }
3930 return Str;
3931 }
3932};
3933
3934} // end namespace llvm
3935#endif // NDEBUG
3936
3937/// viewGraph - Pop up a ghostview window with the reachable parts of the DAG
3938/// rendered using 'dot'.
3939void ScheduleDAGMI::viewGraph(const Twine &Name, const Twine &Title) {
3940#ifndef NDEBUG
3941 ViewGraph(this, Name, false, Title);
3942#else
3943 errs() << "ScheduleDAGMI::viewGraph is only available in debug builds on "
3944 << "systems with Graphviz or gv!\n";
3945#endif // NDEBUG
3946}
3947
3948/// Out-of-line implementation with no arguments is handy for gdb.
3949void ScheduleDAGMI::viewGraph() {
3950 viewGraph(getDAGName(), "Scheduling-Units Graph for " + getDAGName());
3951}

/build/llvm-toolchain-snapshot-14~++20210903100615+fd66b44ec19e/llvm/include/llvm/CodeGen/MachineInstrBundleIterator.h

1//===- llvm/CodeGen/MachineInstrBundleIterator.h ----------------*- C++ -*-===//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8//
9// Defines an iterator class that bundles MachineInstr.
10//
11//===----------------------------------------------------------------------===//
12
13#ifndef LLVM_CODEGEN_MACHINEINSTRBUNDLEITERATOR_H
14#define LLVM_CODEGEN_MACHINEINSTRBUNDLEITERATOR_H
15
16#include "llvm/ADT/ilist.h"
17#include "llvm/ADT/simple_ilist.h"
18#include <cassert>
19#include <iterator>
20#include <type_traits>
21
22namespace llvm {
23
24template <class T, bool IsReverse> struct MachineInstrBundleIteratorTraits;
25template <class T> struct MachineInstrBundleIteratorTraits<T, false> {
26 using list_type = simple_ilist<T, ilist_sentinel_tracking<true>>;
27 using instr_iterator = typename list_type::iterator;
28 using nonconst_instr_iterator = typename list_type::iterator;
29 using const_instr_iterator = typename list_type::const_iterator;
30};
31template <class T> struct MachineInstrBundleIteratorTraits<T, true> {
32 using list_type = simple_ilist<T, ilist_sentinel_tracking<true>>;
33 using instr_iterator = typename list_type::reverse_iterator;
34 using nonconst_instr_iterator = typename list_type::reverse_iterator;
35 using const_instr_iterator = typename list_type::const_reverse_iterator;
36};
37template <class T> struct MachineInstrBundleIteratorTraits<const T, false> {
38 using list_type = simple_ilist<T, ilist_sentinel_tracking<true>>;
39 using instr_iterator = typename list_type::const_iterator;
40 using nonconst_instr_iterator = typename list_type::iterator;
41 using const_instr_iterator = typename list_type::const_iterator;
42};
43template <class T> struct MachineInstrBundleIteratorTraits<const T, true> {
44 using list_type = simple_ilist<T, ilist_sentinel_tracking<true>>;
45 using instr_iterator = typename list_type::const_reverse_iterator;
46 using nonconst_instr_iterator = typename list_type::reverse_iterator;
47 using const_instr_iterator = typename list_type::const_reverse_iterator;
48};
49
50template <bool IsReverse> struct MachineInstrBundleIteratorHelper;
51template <> struct MachineInstrBundleIteratorHelper<false> {
52 /// Get the beginning of the current bundle.
53 template <class Iterator> static Iterator getBundleBegin(Iterator I) {
54 if (!I.isEnd())
55 while (I->isBundledWithPred())
56 --I;
57 return I;
58 }
59
60 /// Get the final node of the current bundle.
61 template <class Iterator> static Iterator getBundleFinal(Iterator I) {
62 if (!I.isEnd())
63 while (I->isBundledWithSucc())
64 ++I;
65 return I;
66 }
67
68 /// Increment forward ilist iterator.
69 template <class Iterator> static void increment(Iterator &I) {
70 I = std::next(getBundleFinal(I));
71 }
72
73 /// Decrement forward ilist iterator.
74 template <class Iterator> static void decrement(Iterator &I) {
75 I = getBundleBegin(std::prev(I));
76 }
77};
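The forward helper's increment is the essential trick: advance to the final instruction of the current bundle, then step once more. A toy model using indices and a hypothetical Instr struct instead of ilist iterators:

  #include <cstdio>
  #include <vector>

  // An instruction is "bundled" with its successor when BundledWithSucc
  // is true; a top-level increment skips past the whole bundle.
  struct Instr { bool BundledWithSucc; };

  static size_t bundleFinal(const std::vector<Instr> &L, size_t I) {
    while (I < L.size() && L[I].BundledWithSucc)
      ++I;
    return I;
  }

  static size_t increment(const std::vector<Instr> &L, size_t I) {
    return bundleFinal(L, I) + 1; // std::next(getBundleFinal(I))
  }

  int main() {
    // A three-instruction bundle followed by a standalone instruction.
    std::vector<Instr> MBB = {{true}, {true}, {false}, {false}};
    size_t I = 0;
    I = increment(MBB, I);   // skips the whole bundle
    std::printf("%zu\n", I); // prints 3
  }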
78
79template <> struct MachineInstrBundleIteratorHelper<true> {
80 /// Get the beginning of the current bundle.
81 template <class Iterator> static Iterator getBundleBegin(Iterator I) {
82 return MachineInstrBundleIteratorHelper<false>::getBundleBegin(
83 I.getReverse())
84 .getReverse();
85 }
86
87 /// Get the final node of the current bundle.
88 template <class Iterator> static Iterator getBundleFinal(Iterator I) {
89 return MachineInstrBundleIteratorHelper<false>::getBundleFinal(
90 I.getReverse())
91 .getReverse();
92 }
93
94 /// Increment reverse ilist iterator.
95 template <class Iterator> static void increment(Iterator &I) {
96 I = getBundleBegin(std::next(I));
97 }
98
99 /// Decrement reverse ilist iterator.
100 template <class Iterator> static void decrement(Iterator &I) {
101 I = std::prev(getBundleFinal(I));
102 }
103};
104
105/// MachineBasicBlock iterator that automatically skips over MIs that are
106/// inside bundles (i.e. walk top level MIs only).
107template <typename Ty, bool IsReverse = false>
108class MachineInstrBundleIterator : MachineInstrBundleIteratorHelper<IsReverse> {
109 using Traits = MachineInstrBundleIteratorTraits<Ty, IsReverse>;
110 using instr_iterator = typename Traits::instr_iterator;
111
112 instr_iterator MII;
113
114public:
115 using value_type = typename instr_iterator::value_type;
116 using difference_type = typename instr_iterator::difference_type;
117 using pointer = typename instr_iterator::pointer;
118 using reference = typename instr_iterator::reference;
119 using const_pointer = typename instr_iterator::const_pointer;
120 using const_reference = typename instr_iterator::const_reference;
121 using iterator_category = std::bidirectional_iterator_tag;
122
123private:
124 using nonconst_instr_iterator = typename Traits::nonconst_instr_iterator;
125 using const_instr_iterator = typename Traits::const_instr_iterator;
126 using nonconst_iterator =
127 MachineInstrBundleIterator<typename nonconst_instr_iterator::value_type,
128 IsReverse>;
129 using reverse_iterator = MachineInstrBundleIterator<Ty, !IsReverse>;
130
131public:
132 MachineInstrBundleIterator(instr_iterator MI) : MII(MI) {
133 assert((!MI.getNodePtr() || MI.isEnd() || !MI->isBundledWithPred()) &&
134 "It's not legal to initialize MachineInstrBundleIterator with a "
135 "bundled MI");
136 }
137
138 MachineInstrBundleIterator(reference MI) : MII(MI) {
139 assert(!MI.isBundledWithPred() && "It's not legal to initialize "
140 "MachineInstrBundleIterator with a "
141 "bundled MI");
142 }
143
144 MachineInstrBundleIterator(pointer MI) : MII(MI) {
145 // FIXME: This conversion should be explicit.
146 assert((!MI || !MI->isBundledWithPred()) && "It's not legal to initialize "
147 "MachineInstrBundleIterator "
148 "with a bundled MI");
149 }
150
151 // Template allows conversion from const to nonconst.
152 template <class OtherTy>
153 MachineInstrBundleIterator(
154 const MachineInstrBundleIterator<OtherTy, IsReverse> &I,
155 std::enable_if_t<std::is_convertible<OtherTy *, Ty *>::value, void *> =
156 nullptr)
157 : MII(I.getInstrIterator()) {}
158
159 MachineInstrBundleIterator() : MII(nullptr) {}
160
161 /// Explicit conversion between forward/reverse iterators.
162 ///
163 /// Translate between forward and reverse iterators without changing range
164 /// boundaries. The resulting iterator will dereference (and have a handle)
165 /// to the previous node, which is somewhat unexpected; but converting the
166 /// two endpoints in a range will give the same range in reverse.
167 ///
168 /// This matches std::reverse_iterator conversions.
169 explicit MachineInstrBundleIterator(
170 const MachineInstrBundleIterator<Ty, !IsReverse> &I)
171 : MachineInstrBundleIterator(++I.getReverse()) {}
172
173 /// Get the bundle iterator for the given instruction's bundle.
174 static MachineInstrBundleIterator getAtBundleBegin(instr_iterator MI) {
175 return MachineInstrBundleIteratorHelper<IsReverse>::getBundleBegin(MI);
176 }
177
178 reference operator*() const { return *MII; }
179 pointer operator->() const { return &operator*(); }
180
181 /// Check for null.
182 bool isValid() const { return MII.getNodePtr(); }
183
184 friend bool operator==(const MachineInstrBundleIterator &L,
185 const MachineInstrBundleIterator &R) {
186 return L.MII == R.MII;
2
Calling 'operator=='
5
Returning from 'operator=='
6
Returning zero, which participates in a condition later
187 }
188 friend bool operator==(const MachineInstrBundleIterator &L,
189 const const_instr_iterator &R) {
190 return L.MII == R; // Avoid assertion about validity of R.
191 }
192 friend bool operator==(const const_instr_iterator &L,
193 const MachineInstrBundleIterator &R) {
194 return L == R.MII; // Avoid assertion about validity of L.
195 }
196 friend bool operator==(const MachineInstrBundleIterator &L,
197 const nonconst_instr_iterator &R) {
198 return L.MII == R; // Avoid assertion about validity of R.
199 }
200 friend bool operator==(const nonconst_instr_iterator &L,
201 const MachineInstrBundleIterator &R) {
202 return L == R.MII; // Avoid assertion about validity of L.
203 }
204 friend bool operator==(const MachineInstrBundleIterator &L, const_pointer R) {
205 return L == const_instr_iterator(R); // Avoid assertion about validity of R.
206 }
207 friend bool operator==(const_pointer L, const MachineInstrBundleIterator &R) {
208 return const_instr_iterator(L) == R; // Avoid assertion about validity of L.
209 }
210 friend bool operator==(const MachineInstrBundleIterator &L,
211 const_reference R) {
212 return L == &R; // Avoid assertion about validity of R.
213 }
214 friend bool operator==(const_reference L,
215 const MachineInstrBundleIterator &R) {
216 return &L == R; // Avoid assertion about validity of L.
217 }
218
219 friend bool operator!=(const MachineInstrBundleIterator &L,
220 const MachineInstrBundleIterator &R) {
221 return !(L == R);
222 }
223 friend bool operator!=(const MachineInstrBundleIterator &L,
224 const const_instr_iterator &R) {
225 return !(L == R);
226 }
227 friend bool operator!=(const const_instr_iterator &L,
228 const MachineInstrBundleIterator &R) {
229 return !(L == R);
230 }
231 friend bool operator!=(const MachineInstrBundleIterator &L,
232 const nonconst_instr_iterator &R) {
233 return !(L == R);
234 }
235 friend bool operator!=(const nonconst_instr_iterator &L,
236 const MachineInstrBundleIterator &R) {
237 return !(L == R);
238 }
239 friend bool operator!=(const MachineInstrBundleIterator &L, const_pointer R) {
240 return !(L == R);
241 }
242 friend bool operator!=(const_pointer L, const MachineInstrBundleIterator &R) {
243 return !(L == R);
244 }
245 friend bool operator!=(const MachineInstrBundleIterator &L,
246 const_reference R) {
247 return !(L == R);
248 }
249 friend bool operator!=(const_reference L,
250 const MachineInstrBundleIterator &R) {
251 return !(L == R);
252 }
253
254 // Increment and decrement operators...
255 MachineInstrBundleIterator &operator--() {
256 this->decrement(MII);
257 return *this;
258 }
259 MachineInstrBundleIterator &operator++() {
260 this->increment(MII);
261 return *this;
262 }
263 MachineInstrBundleIterator operator--(int) {
264 MachineInstrBundleIterator Temp = *this;
265 --*this;
266 return Temp;
267 }
268 MachineInstrBundleIterator operator++(int) {
269 MachineInstrBundleIterator Temp = *this;
270 ++*this;
271 return Temp;
272 }
273
274 instr_iterator getInstrIterator() const { return MII; }
275
276 nonconst_iterator getNonConstIterator() const { return MII.getNonConst(); }
277
278 /// Get a reverse iterator to the same node.
279 ///
280 /// Gives a reverse iterator that will dereference (and have a handle) to the
281 /// same node. Converting the endpoint iterators in a range will give a
282 /// different range; for range operations, use the explicit conversions.
283 reverse_iterator getReverse() const { return MII.getReverse(); }
284};
285
286} // end namespace llvm
287
288#endif // LLVM_CODEGEN_MACHINEINSTRBUNDLEITERATOR_H
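
The forward/reverse conversion rule documented above (and again in ilist_iterator below) can be demonstrated with nothing but the standard library. In the following sketch, std::list stands in for the intrusive list; it shows the two properties the comments describe: an explicitly converted iterator dereferences to the previous element, yet converting both endpoints of a range yields the same range traversed in reverse.

// Minimal standalone sketch of the std::reverse_iterator convention
// that MachineInstrBundleIterator's explicit conversion matches.
#include <cassert>
#include <iterator>
#include <list>

int main() {
  std::list<int> L = {1, 2, 3, 4};

  // reverse(end()) dereferences to the *previous* node, i.e. the last element.
  std::list<int>::reverse_iterator RB(L.end());
  assert(*RB == 4);

  // Converting both endpoints gives the same range, in reverse.
  std::list<int>::reverse_iterator RE(L.begin());
  int Expected = 4;
  for (auto I = RB; I != RE; ++I)
    assert(*I == Expected--);
  return 0;
}
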

/build/llvm-toolchain-snapshot-14~++20210903100615+fd66b44ec19e/llvm/include/llvm/ADT/ilist_iterator.h

1//===- llvm/ADT/ilist_iterator.h - Intrusive List Iterator ------*- C++ -*-===//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8
9#ifndef LLVM_ADT_ILIST_ITERATOR_H
10#define LLVM_ADT_ILIST_ITERATOR_H
11
12#include "llvm/ADT/ilist_node.h"
13#include <cassert>
14#include <cstddef>
15#include <iterator>
16#include <type_traits>
17
18namespace llvm {
19
20namespace ilist_detail {
21
22/// Find const-correct node types.
23template <class OptionsT, bool IsConst> struct IteratorTraits;
24template <class OptionsT> struct IteratorTraits<OptionsT, false> {
25 using value_type = typename OptionsT::value_type;
26 using pointer = typename OptionsT::pointer;
27 using reference = typename OptionsT::reference;
28 using node_pointer = ilist_node_impl<OptionsT> *;
29 using node_reference = ilist_node_impl<OptionsT> &;
30};
31template <class OptionsT> struct IteratorTraits<OptionsT, true> {
32 using value_type = const typename OptionsT::value_type;
33 using pointer = typename OptionsT::const_pointer;
34 using reference = typename OptionsT::const_reference;
35 using node_pointer = const ilist_node_impl<OptionsT> *;
36 using node_reference = const ilist_node_impl<OptionsT> &;
37};
38
39template <bool IsReverse> struct IteratorHelper;
40template <> struct IteratorHelper<false> : ilist_detail::NodeAccess {
41 using Access = ilist_detail::NodeAccess;
42
43 template <class T> static void increment(T *&I) { I = Access::getNext(*I); }
44 template <class T> static void decrement(T *&I) { I = Access::getPrev(*I); }
45};
46template <> struct IteratorHelper<true> : ilist_detail::NodeAccess {
47 using Access = ilist_detail::NodeAccess;
48
49 template <class T> static void increment(T *&I) { I = Access::getPrev(*I); }
50 template <class T> static void decrement(T *&I) { I = Access::getNext(*I); }
51};
52
53} // end namespace ilist_detail
54
55/// Iterator for intrusive lists based on ilist_node.
56template <class OptionsT, bool IsReverse, bool IsConst>
57class ilist_iterator : ilist_detail::SpecificNodeAccess<OptionsT> {
58 friend ilist_iterator<OptionsT, IsReverse, !IsConst>;
59 friend ilist_iterator<OptionsT, !IsReverse, IsConst>;
60 friend ilist_iterator<OptionsT, !IsReverse, !IsConst>;
61
62 using Traits = ilist_detail::IteratorTraits<OptionsT, IsConst>;
63 using Access = ilist_detail::SpecificNodeAccess<OptionsT>;
64
65public:
66 using value_type = typename Traits::value_type;
67 using pointer = typename Traits::pointer;
68 using reference = typename Traits::reference;
69 using difference_type = ptrdiff_t;
70 using iterator_category = std::bidirectional_iterator_tag;
71 using const_pointer = typename OptionsT::const_pointer;
72 using const_reference = typename OptionsT::const_reference;
73
74private:
75 using node_pointer = typename Traits::node_pointer;
76 using node_reference = typename Traits::node_reference;
77
78 node_pointer NodePtr = nullptr;
79
80public:
81 /// Create from an ilist_node.
82 explicit ilist_iterator(node_reference N) : NodePtr(&N) {}
83
84 explicit ilist_iterator(pointer NP) : NodePtr(Access::getNodePtr(NP)) {}
85 explicit ilist_iterator(reference NR) : NodePtr(Access::getNodePtr(&NR)) {}
86 ilist_iterator() = default;
87
88 // This is templated so that we can allow constructing a const iterator from
89 // a nonconst iterator...
90 template <bool RHSIsConst>
91 ilist_iterator(const ilist_iterator<OptionsT, IsReverse, RHSIsConst> &RHS,
92 std::enable_if_t<IsConst || !RHSIsConst, void *> = nullptr)
93 : NodePtr(RHS.NodePtr) {}
94
95 // This is templated so that we can allow assigning to a const iterator from
96 // a nonconst iterator...
97 template <bool RHSIsConst>
98 std::enable_if_t<IsConst || !RHSIsConst, ilist_iterator &>
99 operator=(const ilist_iterator<OptionsT, IsReverse, RHSIsConst> &RHS) {
100 NodePtr = RHS.NodePtr;
101 return *this;
102 }
103
104 /// Explicit conversion between forward/reverse iterators.
105 ///
106 /// Translate between forward and reverse iterators without changing range
107 /// boundaries. The resulting iterator will dereference (and have a handle)
108 /// to the previous node, which is somewhat unexpected; but converting the
109 /// two endpoints in a range will give the same range in reverse.
110 ///
111 /// This matches std::reverse_iterator conversions.
112 explicit ilist_iterator(
113 const ilist_iterator<OptionsT, !IsReverse, IsConst> &RHS)
114 : ilist_iterator(++RHS.getReverse()) {}
115
116 /// Get a reverse iterator to the same node.
117 ///
118 /// Gives a reverse iterator that will dereference (and have a handle) to the
119 /// same node. Converting the endpoint iterators in a range will give a
120 /// different range; for range operations, use the explicit conversions.
121 ilist_iterator<OptionsT, !IsReverse, IsConst> getReverse() const {
122 if (NodePtr)
123 return ilist_iterator<OptionsT, !IsReverse, IsConst>(*NodePtr);
124 return ilist_iterator<OptionsT, !IsReverse, IsConst>();
125 }
126
127 /// Const-cast.
128 ilist_iterator<OptionsT, IsReverse, false> getNonConst() const {
129 if (NodePtr)
130 return ilist_iterator<OptionsT, IsReverse, false>(
131 const_cast<typename ilist_iterator<OptionsT, IsReverse,
132 false>::node_reference>(*NodePtr));
133 return ilist_iterator<OptionsT, IsReverse, false>();
134 }
135
136 // Accessors...
137 reference operator*() const {
138 assert(!NodePtr->isKnownSentinel());
139 return *Access::getValuePtr(NodePtr);
140 }
141 pointer operator->() const { return &operator*(); }
142
143 // Comparison operators
144 friend bool operator==(const ilist_iterator &LHS, const ilist_iterator &RHS) {
145 return LHS.NodePtr == RHS.NodePtr;
3. Assuming 'LHS.NodePtr' is not equal to 'RHS.NodePtr'
4. Returning zero, which participates in a condition later
146 }
147 friend bool operator!=(const ilist_iterator &LHS, const ilist_iterator &RHS) {
148 return LHS.NodePtr != RHS.NodePtr;
149 }
150
151 // Increment and decrement operators...
152 ilist_iterator &operator--() {
153 NodePtr = IsReverse ? NodePtr->getNext() : NodePtr->getPrev();
154 return *this;
155 }
156 ilist_iterator &operator++() {
157 NodePtr = IsReverse ? NodePtr->getPrev() : NodePtr->getNext();
158 return *this;
159 }
160 ilist_iterator operator--(int) {
161 ilist_iterator tmp = *this;
162 --*this;
163 return tmp;
164 }
165 ilist_iterator operator++(int) {
166 ilist_iterator tmp = *this;
167 ++*this;
168 return tmp;
169 }
170
171 /// Get the underlying ilist_node.
172 node_pointer getNodePtr() const { return static_cast<node_pointer>(NodePtr); }
173
174 /// Check for end. Only valid if ilist_sentinel_tracking<true>.
175 bool isEnd() const { return NodePtr ? NodePtr->isSentinel() : false; }
176};
177
178template <typename From> struct simplify_type;
179
180/// Allow ilist_iterators to convert into pointers to a node automatically when
181/// used by the dyn_cast, cast, isa mechanisms...
182///
183/// FIXME: remove this, since there is no implicit conversion to NodeTy.
184template <class OptionsT, bool IsConst>
185struct simplify_type<ilist_iterator<OptionsT, false, IsConst>> {
186 using iterator = ilist_iterator<OptionsT, false, IsConst>;
187 using SimpleType = typename iterator::pointer;
188
189 static SimpleType getSimplifiedValue(const iterator &Node) { return &*Node; }
190};
191template <class OptionsT, bool IsConst>
192struct simplify_type<const ilist_iterator<OptionsT, false, IsConst>>
193 : simplify_type<ilist_iterator<OptionsT, false, IsConst>> {};
194
195} // end namespace llvm
196
197#endif // LLVM_ADT_ILIST_ITERATOR_H
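
For readers unfamiliar with intrusive iterators, the following standalone sketch distills the pattern ilist_iterator implements; Node and Iterator are invented stand-ins, not LLVM types. Because the iterator holds only a node pointer, operator== is raw pointer identity. That is exactly the comparison the analyzer steps above reason about: iterators over different nodes compare unequal, and the zero result feeds a condition later in the bug path.

#include <cassert>

struct Node {
  Node *Prev = nullptr;
  Node *Next = nullptr;
  int Value = 0;
};

struct Iterator {
  Node *NodePtr = nullptr;

  int &operator*() const { return NodePtr->Value; }
  Iterator &operator++() { NodePtr = NodePtr->Next; return *this; }
  Iterator &operator--() { NodePtr = NodePtr->Prev; return *this; }

  // Pointer identity, as in ilist_iterator::operator== above.
  friend bool operator==(Iterator L, Iterator R) {
    return L.NodePtr == R.NodePtr;
  }
  friend bool operator!=(Iterator L, Iterator R) { return !(L == R); }
};

int main() {
  Node A, B;
  A.Value = 1;
  B.Value = 2;
  A.Next = &B;
  B.Prev = &A;

  Iterator I;
  I.NodePtr = &A;
  assert(*I == 1);
  ++I;
  assert(*I == 2);
  assert(Iterator() != I); // a null (default) iterator never equals a valid one
  return 0;
}
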

/build/llvm-toolchain-snapshot-14~++20210903100615+fd66b44ec19e/llvm/include/llvm/CodeGen/MachineScheduler.h

1//===- MachineScheduler.h - MachineInstr Scheduling Pass --------*- C++ -*-===//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8//
9// This file provides an interface for customizing the standard MachineScheduler
10// pass. Note that the entire pass may be replaced as follows:
11//
12// <Target>TargetMachine::createPassConfig(PassManagerBase &PM) {
13// PM.substitutePass(&MachineSchedulerID, &CustomSchedulerPassID);
14// ...}
15//
16// The MachineScheduler pass is only responsible for choosing the regions to be
17// scheduled. Targets can override the DAG builder and scheduler without
18// replacing the pass as follows:
19//
20// ScheduleDAGInstrs *<Target>PassConfig::
21// createMachineScheduler(MachineSchedContext *C) {
22// return new CustomMachineScheduler(C);
23// }
24//
25// The default scheduler, ScheduleDAGMILive, builds the DAG and drives list
26// scheduling while updating the instruction stream, register pressure, and live
27// intervals. Most targets don't need to override the DAG builder and list
28// scheduler, but subtargets that require custom scheduling heuristics may
29// plugin an alternate MachineSchedStrategy. The strategy is responsible for
30// selecting the highest priority node from the list:
31//
32// ScheduleDAGInstrs *<Target>PassConfig::
33// createMachineScheduler(MachineSchedContext *C) {
34// return new ScheduleDAGMILive(C, CustomStrategy(C));
35// }
36//
37// The DAG builder can also be customized in a sense by adding DAG mutations
38// that will run after DAG building and before list scheduling. DAG mutations
39// can adjust dependencies based on target-specific knowledge or add weak edges
40// to aid heuristics:
41//
42// ScheduleDAGInstrs *<Target>PassConfig::
43// createMachineScheduler(MachineSchedContext *C) {
44// ScheduleDAGMI *DAG = createGenericSchedLive(C);
45// DAG->addMutation(new CustomDAGMutation(...));
46// return DAG;
47// }
48//
49// A target that supports alternative schedulers can use the
50// MachineSchedRegistry to allow command line selection. This can be done by
51// implementing the following boilerplate:
52//
53// static ScheduleDAGInstrs *createCustomMachineSched(MachineSchedContext *C) {
54// return new CustomMachineScheduler(C);
55// }
56// static MachineSchedRegistry
57// SchedCustomRegistry("custom", "Run my target's custom scheduler",
58// createCustomMachineSched);
59//
60//
61// Finally, subtargets that don't need to implement custom heuristics but would
62// like to configure the GenericScheduler's policy for a given scheduler region,
63// including scheduling direction and register pressure tracking policy, can do
64// this:
65//
66// void <SubTarget>Subtarget::
67// overrideSchedPolicy(MachineSchedPolicy &Policy,
68// unsigned NumRegionInstrs) const {
69// Policy.<Flag> = true;
70// }
71//
72//===----------------------------------------------------------------------===//
73
74#ifndef LLVM_CODEGEN_MACHINESCHEDULER_H
75#define LLVM_CODEGEN_MACHINESCHEDULER_H
76
77#include "llvm/ADT/APInt.h"
78#include "llvm/ADT/ArrayRef.h"
79#include "llvm/ADT/BitVector.h"
80#include "llvm/ADT/STLExtras.h"
81#include "llvm/ADT/SmallVector.h"
82#include "llvm/ADT/StringRef.h"
83#include "llvm/ADT/Twine.h"
84#include "llvm/CodeGen/MachineBasicBlock.h"
85#include "llvm/CodeGen/MachinePassRegistry.h"
86#include "llvm/CodeGen/RegisterPressure.h"
87#include "llvm/CodeGen/ScheduleDAG.h"
88#include "llvm/CodeGen/ScheduleDAGInstrs.h"
89#include "llvm/CodeGen/ScheduleDAGMutation.h"
90#include "llvm/CodeGen/TargetSchedule.h"
91#include "llvm/Support/CommandLine.h"
92#include "llvm/Support/ErrorHandling.h"
93#include <algorithm>
94#include <cassert>
95#include <memory>
96#include <string>
97#include <vector>
98
99namespace llvm {
100
101extern cl::opt<bool> ForceTopDown;
102extern cl::opt<bool> ForceBottomUp;
103extern cl::opt<bool> VerifyScheduling;
104
105class AAResults;
106class LiveIntervals;
107class MachineDominatorTree;
108class MachineFunction;
109class MachineInstr;
110class MachineLoopInfo;
111class RegisterClassInfo;
112class SchedDFSResult;
113class ScheduleHazardRecognizer;
114class TargetInstrInfo;
115class TargetPassConfig;
116class TargetRegisterInfo;
117
118/// MachineSchedContext provides enough context from the MachineScheduler pass
119/// for the target to instantiate a scheduler.
120struct MachineSchedContext {
121 MachineFunction *MF = nullptr;
122 const MachineLoopInfo *MLI = nullptr;
123 const MachineDominatorTree *MDT = nullptr;
124 const TargetPassConfig *PassConfig = nullptr;
125 AAResults *AA = nullptr;
126 LiveIntervals *LIS = nullptr;
127
128 RegisterClassInfo *RegClassInfo;
129
130 MachineSchedContext();
131 virtual ~MachineSchedContext();
132};
133
134/// MachineSchedRegistry provides a selection of available machine instruction
135/// schedulers.
136class MachineSchedRegistry
137 : public MachinePassRegistryNode<
138 ScheduleDAGInstrs *(*)(MachineSchedContext *)> {
139public:
140 using ScheduleDAGCtor = ScheduleDAGInstrs *(*)(MachineSchedContext *);
141
142 // RegisterPassParser requires a (misnamed) FunctionPassCtor type.
143 using FunctionPassCtor = ScheduleDAGCtor;
144
145 static MachinePassRegistry<ScheduleDAGCtor> Registry;
146
147 MachineSchedRegistry(const char *N, const char *D, ScheduleDAGCtor C)
148 : MachinePassRegistryNode(N, D, C) {
149 Registry.Add(this);
150 }
151
152 ~MachineSchedRegistry() { Registry.Remove(this); }
153
154 // Accessors.
155 //
156 MachineSchedRegistry *getNext() const {
157 return (MachineSchedRegistry *)MachinePassRegistryNode::getNext();
158 }
159
160 static MachineSchedRegistry *getList() {
161 return (MachineSchedRegistry *)Registry.getList();
162 }
163
164 static void setListener(MachinePassRegistryListener<FunctionPassCtor> *L) {
165 Registry.setListener(L);
166 }
167};
168
169class ScheduleDAGMI;
170
171/// Define a generic scheduling policy for targets that don't provide their own
172/// MachineSchedStrategy. This can be overridden for each scheduling region
173/// before building the DAG.
174struct MachineSchedPolicy {
175 // Allow the scheduler to disable register pressure tracking.
176 bool ShouldTrackPressure = false;
177 /// Track LaneMasks to allow reordering of independent subregister writes
178 /// of the same vreg. \sa MachineSchedStrategy::shouldTrackLaneMasks()
179 bool ShouldTrackLaneMasks = false;
180
181 // Allow the scheduler to force top-down or bottom-up scheduling. If neither
182 // is true, the scheduler runs in both directions and converges.
183 bool OnlyTopDown = false;
184 bool OnlyBottomUp = false;
185
186 // Disable heuristic that tries to fetch nodes from long dependency chains
187 // first.
188 bool DisableLatencyHeuristic = false;
189
190 // Compute DFSResult for use in scheduling heuristics.
191 bool ComputeDFSResult = false;
192
193 MachineSchedPolicy() = default;
194};
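
The file header sketches how a subtarget hook can rewrite this struct per region. The following runnable sketch makes that concrete; MyPolicy and overrideForRegion are hypothetical stand-ins for MachineSchedPolicy and a subtarget's overrideSchedPolicy hook, and the thresholds are invented.

#include <cassert>

struct MyPolicy {
  bool ShouldTrackPressure = false;
  bool OnlyTopDown = false;
  bool OnlyBottomUp = false;
};

// Stand-in for <SubTarget>Subtarget::overrideSchedPolicy.
void overrideForRegion(MyPolicy &Policy, unsigned NumRegionInstrs) {
  if (NumRegionInstrs > 16)
    Policy.ShouldTrackPressure = true; // large region: pressure matters
  else
    Policy.OnlyBottomUp = true;        // small region: one cheap pass suffices
}

int main() {
  MyPolicy Small, Large;
  overrideForRegion(Small, 4);
  overrideForRegion(Large, 64);
  assert(Small.OnlyBottomUp && !Small.ShouldTrackPressure);
  assert(Large.ShouldTrackPressure && !Large.OnlyBottomUp);
  return 0;
}
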
195
196/// MachineSchedStrategy - Interface to the scheduling algorithm used by
197/// ScheduleDAGMI.
198///
199/// Initialization sequence:
200/// initPolicy -> shouldTrackPressure -> initialize(DAG) -> registerRoots
201class MachineSchedStrategy {
202 virtual void anchor();
203
204public:
205 virtual ~MachineSchedStrategy() = default;
206
207 /// Optionally override the per-region scheduling policy.
208 virtual void initPolicy(MachineBasicBlock::iterator Begin,
209 MachineBasicBlock::iterator End,
210 unsigned NumRegionInstrs) {}
211
212 virtual void dumpPolicy() const {}
213
214 /// Check if pressure tracking is needed before building the DAG and
215 /// initializing this strategy. Called after initPolicy.
216 virtual bool shouldTrackPressure() const { return true; }
217
218 /// Returns true if lanemasks should be tracked. LaneMask tracking is
219 /// necessary to reorder independent subregister defs for the same vreg.
220 /// This has to be enabled in combination with shouldTrackPressure().
221 virtual bool shouldTrackLaneMasks() const { return false; }
222
223 // If this method returns true, handling of the scheduling regions
224 // themselves (in case of a scheduling boundary in MBB) will be done
225 // beginning with the topmost region of MBB.
226 virtual bool doMBBSchedRegionsTopDown() const { return false; }
227
228 /// Initialize the strategy after building the DAG for a new region.
229 virtual void initialize(ScheduleDAGMI *DAG) = 0;
230
231 /// Tell the strategy that MBB is about to be processed.
232 virtual void enterMBB(MachineBasicBlock *MBB) {};
233
234 /// Tell the strategy that current MBB is done.
235 virtual void leaveMBB() {};
236
237 /// Notify this strategy that all roots have been released (including those
238 /// that depend on EntrySU or ExitSU).
239 virtual void registerRoots() {}
240
241 /// Pick the next node to schedule, or return NULL. Set IsTopNode to true to
242 /// schedule the node at the top of the unscheduled region. Otherwise it will
243 /// be scheduled at the bottom.
244 virtual SUnit *pickNode(bool &IsTopNode) = 0;
245
246 /// Scheduler callback to notify that a new subtree is scheduled.
247 virtual void scheduleTree(unsigned SubtreeID) {}
248
249 /// Notify MachineSchedStrategy that ScheduleDAGMI has scheduled an
250 /// instruction and updated scheduled/remaining flags in the DAG nodes.
251 virtual void schedNode(SUnit *SU, bool IsTopNode) = 0;
252
253 /// When all predecessor dependencies have been resolved, free this node for
254 /// top-down scheduling.
255 virtual void releaseTopNode(SUnit *SU) = 0;
256
257 /// When all successor dependencies have been resolved, free this node for
258 /// bottom-up scheduling.
259 virtual void releaseBottomNode(SUnit *SU) = 0;
260};
261
262/// ScheduleDAGMI is an implementation of ScheduleDAGInstrs that simply
263/// schedules machine instructions according to the given MachineSchedStrategy
264/// without much extra book-keeping. This is the common functionality between
265/// PreRA and PostRA MachineScheduler.
266class ScheduleDAGMI : public ScheduleDAGInstrs {
267protected:
268 AAResults *AA;
269 LiveIntervals *LIS;
270 std::unique_ptr<MachineSchedStrategy> SchedImpl;
271
272 /// Ordered list of DAG postprocessing steps.
273 std::vector<std::unique_ptr<ScheduleDAGMutation>> Mutations;
274
275 /// The top of the unscheduled zone.
276 MachineBasicBlock::iterator CurrentTop;
277
278 /// The bottom of the unscheduled zone.
279 MachineBasicBlock::iterator CurrentBottom;
280
281 /// Record the next node in a scheduled cluster.
282 const SUnit *NextClusterPred = nullptr;
283 const SUnit *NextClusterSucc = nullptr;
284
285#ifndef NDEBUG
286 /// The number of instructions scheduled so far. Used to cut off the
287 /// scheduler at the point determined by misched-cutoff.
288 unsigned NumInstrsScheduled = 0;
289#endif
290
291public:
292 ScheduleDAGMI(MachineSchedContext *C, std::unique_ptr<MachineSchedStrategy> S,
293 bool RemoveKillFlags)
294 : ScheduleDAGInstrs(*C->MF, C->MLI, RemoveKillFlags), AA(C->AA),
295 LIS(C->LIS), SchedImpl(std::move(S)) {}
296
297 // Provide a vtable anchor
298 ~ScheduleDAGMI() override;
299
300 /// If this method returns true, handling of the scheduling regions
301 /// themselves (in case of a scheduling boundary in MBB) will be done
302 /// beginning with the topmost region of MBB.
303 bool doMBBSchedRegionsTopDown() const override {
304 return SchedImpl->doMBBSchedRegionsTopDown();
305 }
306
307 // Returns LiveIntervals instance for use in DAG mutators and such.
308 LiveIntervals *getLIS() const { return LIS; }
309
310 /// Return true if this DAG supports VReg liveness and RegPressure.
311 virtual bool hasVRegLiveness() const { return false; }
312
313 /// Add a postprocessing step to the DAG builder.
314 /// Mutations are applied in the order that they are added after normal DAG
315 /// building and before MachineSchedStrategy initialization.
316 ///
317 /// ScheduleDAGMI takes ownership of the Mutation object.
318 void addMutation(std::unique_ptr<ScheduleDAGMutation> Mutation) {
319 if (Mutation)
320 Mutations.push_back(std::move(Mutation));
321 }
322
323 MachineBasicBlock::iterator top() const { return CurrentTop; }
324 MachineBasicBlock::iterator bottom() const { return CurrentBottom; }
325
326 /// Implement the ScheduleDAGInstrs interface for handling the next scheduling
327 /// region. This covers all instructions in a block, while schedule() may only
328 /// cover a subset.
329 void enterRegion(MachineBasicBlock *bb,
330 MachineBasicBlock::iterator begin,
331 MachineBasicBlock::iterator end,
332 unsigned regioninstrs) override;
333
334 /// Implement ScheduleDAGInstrs interface for scheduling a sequence of
335 /// reorderable instructions.
336 void schedule() override;
337
338 void startBlock(MachineBasicBlock *bb) override;
339 void finishBlock() override;
340
341 /// Change the position of an instruction within the basic block and update
342 /// live ranges and region boundary iterators.
343 void moveInstruction(MachineInstr *MI, MachineBasicBlock::iterator InsertPos);
344
345 const SUnit *getNextClusterPred() const { return NextClusterPred; }
346
347 const SUnit *getNextClusterSucc() const { return NextClusterSucc; }
348
349 void viewGraph(const Twine &Name, const Twine &Title) override;
350 void viewGraph() override;
351
352protected:
353 // Top-Level entry points for the schedule() driver...
354
355 /// Apply each ScheduleDAGMutation step in order. This allows different
356 /// instances of ScheduleDAGMI to perform custom DAG postprocessing.
357 void postprocessDAG();
358
359 /// Release ExitSU predecessors and setup scheduler queues.
360 void initQueues(ArrayRef<SUnit*> TopRoots, ArrayRef<SUnit*> BotRoots);
361
362 /// Update scheduler DAG and queues after scheduling an instruction.
363 void updateQueues(SUnit *SU, bool IsTopNode);
364
365 /// Reinsert debug_values recorded in ScheduleDAGInstrs::DbgValues.
366 void placeDebugValues();
367
368 /// dump the scheduled Sequence.
369 void dumpSchedule() const;
370
371 // Lesser helpers...
372 bool checkSchedLimit();
373
374 void findRootsAndBiasEdges(SmallVectorImpl<SUnit*> &TopRoots,
375 SmallVectorImpl<SUnit*> &BotRoots);
376
377 void releaseSucc(SUnit *SU, SDep *SuccEdge);
378 void releaseSuccessors(SUnit *SU);
379 void releasePred(SUnit *SU, SDep *PredEdge);
380 void releasePredecessors(SUnit *SU);
381};
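
The mutation plumbing above is easiest to see in isolation. This standalone sketch (Graph, Mutation, and ToyDAG are invented stand-ins, not LLVM types) mirrors the documented contract: the DAG takes ownership of each mutation, silently drops null ones, and applies the rest strictly in insertion order during postprocessing.

#include <memory>
#include <string>
#include <vector>

struct Graph {
  std::string Log;
};

struct Mutation {
  virtual ~Mutation() = default;
  virtual void apply(Graph &G) = 0;
};

struct AddWeakEdges : Mutation {
  void apply(Graph &G) override { G.Log += "weak-edges;"; }
};

struct ClusterLoads : Mutation {
  void apply(Graph &G) override { G.Log += "cluster-loads;"; }
};

struct ToyDAG {
  std::vector<std::unique_ptr<Mutation>> Mutations;

  void addMutation(std::unique_ptr<Mutation> M) {
    if (M) // null mutations are dropped, as in ScheduleDAGMI::addMutation
      Mutations.push_back(std::move(M));
  }

  void postprocess(Graph &G) {
    for (auto &M : Mutations) // strictly in insertion order
      M->apply(G);
  }
};

int main() {
  ToyDAG D;
  D.addMutation(std::make_unique<AddWeakEdges>());
  D.addMutation(nullptr); // ignored
  D.addMutation(std::make_unique<ClusterLoads>());

  Graph G;
  D.postprocess(G);
  return G.Log == "weak-edges;cluster-loads;" ? 0 : 1;
}
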
382
383/// ScheduleDAGMILive is an implementation of ScheduleDAGInstrs that schedules
384/// machine instructions while updating LiveIntervals and tracking regpressure.
385class ScheduleDAGMILive : public ScheduleDAGMI {
386protected:
387 RegisterClassInfo *RegClassInfo;
388
389 /// Information about DAG subtrees. If DFSResult is NULL, then SchedulerTrees
390 /// will be empty.
391 SchedDFSResult *DFSResult = nullptr;
392 BitVector ScheduledTrees;
393
394 MachineBasicBlock::iterator LiveRegionEnd;
395
396 /// Maps vregs to the SUnits of their uses in the current scheduling region.
397 VReg2SUnitMultiMap VRegUses;
398
399 // Map each SU to its summary of pressure changes. This array is updated for
400 // liveness during bottom-up scheduling. Top-down scheduling may proceed but
401 // has no effect on the pressure diffs.
402 PressureDiffs SUPressureDiffs;
403
404 /// Register pressure in this region computed by initRegPressure.
405 bool ShouldTrackPressure = false;
406 bool ShouldTrackLaneMasks = false;
407 IntervalPressure RegPressure;
408 RegPressureTracker RPTracker;
409
410 /// List of pressure sets that exceed the target's pressure limit before
411 /// scheduling, listed in increasing set ID order. Each pressure set is paired
412 /// with its max pressure in the currently scheduled regions.
413 std::vector<PressureChange> RegionCriticalPSets;
414
415 /// The top of the unscheduled zone.
416 IntervalPressure TopPressure;
417 RegPressureTracker TopRPTracker;
418
419 /// The bottom of the unscheduled zone.
420 IntervalPressure BotPressure;
421 RegPressureTracker BotRPTracker;
422
423 /// True if disconnected subregister components are already renamed.
424 /// The renaming is only done on demand if lane masks are tracked.
425 bool DisconnectedComponentsRenamed = false;
426
427public:
428 ScheduleDAGMILive(MachineSchedContext *C,
429 std::unique_ptr<MachineSchedStrategy> S)
430 : ScheduleDAGMI(C, std::move(S), /*RemoveKillFlags=*/false),
431 RegClassInfo(C->RegClassInfo), RPTracker(RegPressure),
432 TopRPTracker(TopPressure), BotRPTracker(BotPressure) {}
433
434 ~ScheduleDAGMILive() override;
435
436 /// Return true if this DAG supports VReg liveness and RegPressure.
437 bool hasVRegLiveness() const override { return true; }
438
439 /// Return true if register pressure tracking is enabled.
440 bool isTrackingPressure() const { return ShouldTrackPressure; }
441
442 /// Get current register pressure for the top scheduled instructions.
443 const IntervalPressure &getTopPressure() const { return TopPressure; }
444 const RegPressureTracker &getTopRPTracker() const { return TopRPTracker; }
445
446 /// Get current register pressure for the bottom scheduled instructions.
447 const IntervalPressure &getBotPressure() const { return BotPressure; }
448 const RegPressureTracker &getBotRPTracker() const { return BotRPTracker; }
449
450 /// Get register pressure for the entire scheduling region before scheduling.
451 const IntervalPressure &getRegPressure() const { return RegPressure; }
452
453 const std::vector<PressureChange> &getRegionCriticalPSets() const {
454 return RegionCriticalPSets;
455 }
456
457 PressureDiff &getPressureDiff(const SUnit *SU) {
458 return SUPressureDiffs[SU->NodeNum];
459 }
460 const PressureDiff &getPressureDiff(const SUnit *SU) const {
461 return SUPressureDiffs[SU->NodeNum];
462 }
463
464 /// Compute a DFSResult after DAG building is complete, and before any
465 /// queue comparisons.
466 void computeDFSResult();
467
468 /// Return a non-null DFS result if the scheduling strategy initialized it.
469 const SchedDFSResult *getDFSResult() const { return DFSResult; }
470
471 BitVector &getScheduledTrees() { return ScheduledTrees; }
472
473 /// Implement the ScheduleDAGInstrs interface for handling the next scheduling
474 /// region. This covers all instructions in a block, while schedule() may only
475 /// cover a subset.
476 void enterRegion(MachineBasicBlock *bb,
477 MachineBasicBlock::iterator begin,
478 MachineBasicBlock::iterator end,
479 unsigned regioninstrs) override;
480
481 /// Implement ScheduleDAGInstrs interface for scheduling a sequence of
482 /// reorderable instructions.
483 void schedule() override;
484
485 /// Compute the cyclic critical path through the DAG.
486 unsigned computeCyclicCriticalPath();
487
488 void dump() const override;
489
490protected:
491 // Top-Level entry points for the schedule() driver...
492
493 /// Call ScheduleDAGInstrs::buildSchedGraph with register pressure tracking
494 /// enabled. This sets up three trackers. RPTracker will cover the entire DAG
495 /// region, TopTracker and BottomTracker will be initialized to the top and
496/// bottom of the DAG region without covering any unscheduled instruction.
497 void buildDAGWithRegPressure();
498
499 /// Release ExitSU predecessors and setup scheduler queues. Re-position
500 /// the Top RP tracker in case the region beginning has changed.
501 void initQueues(ArrayRef<SUnit*> TopRoots, ArrayRef<SUnit*> BotRoots);
502
503 /// Move an instruction and update register pressure.
504 void scheduleMI(SUnit *SU, bool IsTopNode);
505
506 // Lesser helpers...
507
508 void initRegPressure();
509
510 void updatePressureDiffs(ArrayRef<RegisterMaskPair> LiveUses);
511
512 void updateScheduledPressure(const SUnit *SU,
513 const std::vector<unsigned> &NewMaxPressure);
514
515 void collectVRegUses(SUnit &SU);
516};
517
518//===----------------------------------------------------------------------===//
519///
520/// Helpers for implementing custom MachineSchedStrategy classes. These take
521/// care of the book-keeping associated with list scheduling heuristics.
522///
523//===----------------------------------------------------------------------===//
524
525/// ReadyQueue encapsulates vector of "ready" SUnits with basic convenience
526/// methods for pushing and removing nodes. ReadyQueues are uniquely identified
527/// by an ID. SUnit::NodeQueueId is a mask of the ReadyQueues the SUnit is in.
528///
529/// This is a convenience class that may be used by implementations of
530/// MachineSchedStrategy.
531class ReadyQueue {
532 unsigned ID;
533 std::string Name;
534 std::vector<SUnit*> Queue;
535
536public:
537 ReadyQueue(unsigned id, const Twine &name): ID(id), Name(name.str()) {}
538
539 unsigned getID() const { return ID; }
540
541 StringRef getName() const { return Name; }
542
543 // SU is in this queue if its NodeQueueId is a superset of this ID.
544 bool isInQueue(SUnit *SU) const { return (SU->NodeQueueId & ID); }
545
546 bool empty() const { return Queue.empty(); }
547
548 void clear() { Queue.clear(); }
549
550 unsigned size() const { return Queue.size(); }
551
552 using iterator = std::vector<SUnit*>::iterator;
553
554 iterator begin() { return Queue.begin(); }
555
556 iterator end() { return Queue.end(); }
557
558 ArrayRef<SUnit*> elements() { return Queue; }
559
560 iterator find(SUnit *SU) { return llvm::find(Queue, SU); }
561
562 void push(SUnit *SU) {
563 Queue.push_back(SU);
564 SU->NodeQueueId |= ID;
565 }
566
567 iterator remove(iterator I) {
568 (*I)->NodeQueueId &= ~ID;
569 *I = Queue.back();
570 unsigned idx = I - Queue.begin();
571 Queue.pop_back();
572 return Queue.begin() + idx;
573 }
574
575 void dump() const;
576};
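
Two details of ReadyQueue are worth seeing concretely: membership is a bit in the unit's NodeQueueId mask, and remove() erases in O(1) by swapping the back element into the vacated slot, so iteration order is not stable. A standalone sketch with invented Unit and ToyQueue types, assuming nothing beyond the code above:

#include <cassert>
#include <vector>

struct Unit {
  unsigned NodeQueueId = 0;
};

struct ToyQueue {
  unsigned ID;
  std::vector<Unit *> Q;

  bool isInQueue(Unit *U) const { return (U->NodeQueueId & ID) != 0; }

  void push(Unit *U) {
    Q.push_back(U);
    U->NodeQueueId |= ID;
  }

  // O(1) removal: swap the back element into the vacated slot and return
  // an iterator to it (mirrors ReadyQueue::remove above).
  std::vector<Unit *>::iterator remove(std::vector<Unit *>::iterator I) {
    (*I)->NodeQueueId &= ~ID;
    *I = Q.back();
    unsigned Idx = I - Q.begin();
    Q.pop_back();
    return Q.begin() + Idx;
  }
};

int main() {
  Unit A, B, C;
  ToyQueue Top{/*ID=*/1, {}};
  Top.push(&A);
  Top.push(&B);
  Top.push(&C);
  assert(Top.isInQueue(&B));

  auto I = Top.remove(Top.Q.begin()); // removes A; C moves into slot 0
  assert(*I == &C && !Top.isInQueue(&A) && Top.Q.size() == 2);
  return 0;
}
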
577
578/// Summarize the unscheduled region.
579struct SchedRemainder {
580 // Critical path through the DAG in expected latency.
581 unsigned CriticalPath;
582 unsigned CyclicCritPath;
583
584 // Scaled count of micro-ops left to schedule.
585 unsigned RemIssueCount;
586
587 bool IsAcyclicLatencyLimited;
588
589 // Unscheduled resources
590 SmallVector<unsigned, 16> RemainingCounts;
591
592 SchedRemainder() { reset(); }
593
594 void reset() {
595 CriticalPath = 0;
596 CyclicCritPath = 0;
597 RemIssueCount = 0;
598 IsAcyclicLatencyLimited = false;
599 RemainingCounts.clear();
600 }
601
602 void init(ScheduleDAGMI *DAG, const TargetSchedModel *SchedModel);
603};
604
605/// Each Scheduling boundary is associated with ready queues. It tracks the
606/// current cycle in the direction of movement, and maintains the state
607/// of "hazards" and other interlocks at the current cycle.
608class SchedBoundary {
609public:
610 /// SUnit::NodeQueueId: 0 (none), 1 (top), 2 (bot), 3 (both)
611 enum {
612 TopQID = 1,
613 BotQID = 2,
614 LogMaxQID = 2
615 };
616
617 ScheduleDAGMI *DAG = nullptr;
618 const TargetSchedModel *SchedModel = nullptr;
619 SchedRemainder *Rem = nullptr;
620
621 ReadyQueue Available;
622 ReadyQueue Pending;
623
624 ScheduleHazardRecognizer *HazardRec = nullptr;
625
626private:
627 /// True if the pending Q should be checked/updated before scheduling another
628 /// instruction.
629 bool CheckPending;
630
631 /// Number of cycles it takes to issue the instructions scheduled in this
632 /// zone. It is defined as: scheduled-micro-ops / issue-width + stalls.
633 /// See getStalls().
634 unsigned CurrCycle;
635
636 /// Micro-ops issued in the current cycle
637 unsigned CurrMOps;
638
639 /// MinReadyCycle - Cycle of the soonest available instruction.
640 unsigned MinReadyCycle;
641
642 // The expected latency of the critical path in this scheduled zone.
643 unsigned ExpectedLatency;
644
645 // The latency of dependence chains leading into this zone.
646 // For each node scheduled bottom-up: DLat = max DLat, N.Depth.
647 // For each cycle scheduled: DLat -= 1.
648 unsigned DependentLatency;
649
650 /// Count the scheduled (issued) micro-ops that can be retired by
651 /// time=CurrCycle assuming the first scheduled instr is retired at time=0.
652 unsigned RetiredMOps;
653
654 // Count scheduled resources that have been executed. Resources are
655 // considered executed if they become ready in the time that it takes to
656 // saturate any resource including the one in question. Counts are scaled
657 // for direct comparison with other resources. Counts can be compared with
658 // MOps * getMicroOpFactor and Latency * getLatencyFactor.
659 SmallVector<unsigned, 16> ExecutedResCounts;
660
661 /// Cache the max count for a single resource.
662 unsigned MaxExecutedResCount;
663
664 // Cache the critical resources ID in this scheduled zone.
665 unsigned ZoneCritResIdx;
666
667 // Is the scheduled region resource limited vs. latency limited.
668 bool IsResourceLimited;
669
670 // Record the highest cycle at which each resource has been reserved by a
671 // scheduled instruction.
672 SmallVector<unsigned, 16> ReservedCycles;
673
674 // For each PIdx, stores first index into ReservedCycles that corresponds to
675 // it.
676 SmallVector<unsigned, 16> ReservedCyclesIndex;
677
678 // For each PIdx, stores the resource group IDs of its subunits
679 SmallVector<APInt, 16> ResourceGroupSubUnitMasks;
680
681#ifndef NDEBUG
682 // Remember the greatest possible stall as an upper bound on the number of
683 // times we should retry the pending queue because of a hazard.
684 unsigned MaxObservedStall;
685#endif
686
687public:
688 /// Pending queues extend the ready queues with the same ID and the
689 /// PendingFlag set.
690 SchedBoundary(unsigned ID, const Twine &Name):
691 Available(ID, Name+".A"), Pending(ID << LogMaxQID, Name+".P") {
692 reset();
693 }
694
695 ~SchedBoundary();
696
697 void reset();
698
699 void init(ScheduleDAGMI *dag, const TargetSchedModel *smodel,
700 SchedRemainder *rem);
701
702 bool isTop() const {
703 return Available.getID() == TopQID;
704 }
705
706 /// Number of cycles to issue the instructions scheduled in this zone.
707 unsigned getCurrCycle() const { return CurrCycle; }
708
709 /// Micro-ops issued in the current cycle
710 unsigned getCurrMOps() const { return CurrMOps; }
711
712 // The latency of dependence chains leading into this zone.
713 unsigned getDependentLatency() const { return DependentLatency; }
714
715 /// Get the number of latency cycles "covered" by the scheduled
716 /// instructions. This is the larger of the critical path within the zone
717 /// and the number of cycles required to issue the instructions.
718 unsigned getScheduledLatency() const {
719 return std::max(ExpectedLatency, CurrCycle);
720 }
721
722 unsigned getUnscheduledLatency(SUnit *SU) const {
723 return isTop() ? SU->getHeight() : SU->getDepth();
724 }
725
726 unsigned getResourceCount(unsigned ResIdx) const {
727 return ExecutedResCounts[ResIdx];
728 }
729
730 /// Get the scaled count of scheduled micro-ops and resources, including
731 /// executed resources.
732 unsigned getCriticalCount() const {
733 if (!ZoneCritResIdx)
734 return RetiredMOps * SchedModel->getMicroOpFactor();
735 return getResourceCount(ZoneCritResIdx);
736 }
737
738 /// Get a scaled count for the minimum execution time of the scheduled
739 /// micro-ops that are ready to execute by getExecutedCount. Notice the
740 /// feedback loop.
741 unsigned getExecutedCount() const {
742 return std::max(CurrCycle * SchedModel->getLatencyFactor(),
743 MaxExecutedResCount);
744 }
745
746 unsigned getZoneCritResIdx() const { return ZoneCritResIdx; }
747
748 // Is the scheduled region resource limited vs. latency limited.
749 bool isResourceLimited() const { return IsResourceLimited; }
750
751 /// Get the difference between the given SUnit's ready time and the current
752 /// cycle.
753 unsigned getLatencyStallCycles(SUnit *SU);
754
755 unsigned getNextResourceCycleByInstance(unsigned InstanceIndex,
756 unsigned Cycles);
757
758 std::pair<unsigned, unsigned> getNextResourceCycle(const MCSchedClassDesc *SC,
759 unsigned PIdx,
760 unsigned Cycles);
761
762 bool isUnbufferedGroup(unsigned PIdx) const {
763 return SchedModel->getProcResource(PIdx)->SubUnitsIdxBegin &&
764 !SchedModel->getProcResource(PIdx)->BufferSize;
765 }
766
767 bool checkHazard(SUnit *SU);
768
769 unsigned findMaxLatency(ArrayRef<SUnit*> ReadySUs);
770
771 unsigned getOtherResourceCount(unsigned &OtherCritIdx);
772
773 /// Release SU to make it ready. If it's not in hazard, remove it from
774 /// pending queue (if already in) and push into available queue.
775 /// Otherwise, push the SU into pending queue.
776 ///
777 /// @param SU The unit to be released.
778 /// @param ReadyCycle Until which cycle the unit is ready.
779 /// @param InPQueue Whether SU is already in pending queue.
780 /// @param Idx Position offset in pending queue (if in it).
781 void releaseNode(SUnit *SU, unsigned ReadyCycle, bool InPQueue,
782 unsigned Idx = 0);
783
784 void bumpCycle(unsigned NextCycle);
785
786 void incExecutedResources(unsigned PIdx, unsigned Count);
787
788 unsigned countResource(const MCSchedClassDesc *SC, unsigned PIdx,
789 unsigned Cycles, unsigned ReadyCycle);
790
791 void bumpNode(SUnit *SU);
792
793 void releasePending();
794
795 void removeReady(SUnit *SU);
796
797 /// Call this before applying any other heuristics to the Available queue.
798 /// Updates the Available/Pending Q's if necessary and returns the single
799 /// available instruction, or NULL if there are multiple candidates.
800 SUnit *pickOnlyChoice();
801
802 void dumpScheduledState() const;
803};
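
The "scaled count" comments above are the subtlest part of this class: micro-op, cycle, and resource counts only become directly comparable after multiplication by the model's common factors. A tiny arithmetic sketch with invented factor values (a real TargetSchedModel derives them from the machine description) mirrors the formulas in getCriticalCount and getExecutedCount:

#include <algorithm>
#include <cassert>

int main() {
  const unsigned MicroOpFactor = 2; // invented scale per micro-op
  const unsigned LatencyFactor = 8; // invented scale per cycle

  unsigned RetiredMOps = 10;
  unsigned CurrCycle = 3;
  unsigned MaxExecutedResCount = 30;

  // getCriticalCount() when no resource is critical: scale retired MOps.
  unsigned CriticalCount = RetiredMOps * MicroOpFactor; // 20

  // getExecutedCount(): at least what CurrCycle could retire, in scaled units.
  unsigned ExecutedCount =
      std::max(CurrCycle * LatencyFactor, MaxExecutedResCount); // max(24, 30)

  assert(CriticalCount == 20 && ExecutedCount == 30);
  return 0;
}
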
804
805/// Base class for GenericScheduler. This class maintains information about
806/// scheduling candidates based on TargetSchedModel making it easy to implement
807/// heuristics for either preRA or postRA scheduling.
808class GenericSchedulerBase : public MachineSchedStrategy {
809public:
810 /// Represent the type of SchedCandidate found within a single queue.
811 /// pickNodeBidirectional depends on these listed by decreasing priority.
812 enum CandReason : uint8_t {
813 NoCand, Only1, PhysReg, RegExcess, RegCritical, Stall, Cluster, Weak,
814 RegMax, ResourceReduce, ResourceDemand, BotHeightReduce, BotPathReduce,
815 TopDepthReduce, TopPathReduce, NextDefUse, NodeOrder};
816
817#ifndef NDEBUG
818 static const char *getReasonStr(GenericSchedulerBase::CandReason Reason);
819#endif
820
821 /// Policy for scheduling the next instruction in the candidate's zone.
822 struct CandPolicy {
823 bool ReduceLatency = false;
824 unsigned ReduceResIdx = 0;
825 unsigned DemandResIdx = 0;
826
827 CandPolicy() = default;
828
829 bool operator==(const CandPolicy &RHS) const {
830 return ReduceLatency == RHS.ReduceLatency &&
831 ReduceResIdx == RHS.ReduceResIdx &&
832 DemandResIdx == RHS.DemandResIdx;
833 }
834 bool operator!=(const CandPolicy &RHS) const {
835 return !(*this == RHS);
836 }
837 };
838
839 /// Status of an instruction's critical resource consumption.
840 struct SchedResourceDelta {
841 // Count critical resources in the scheduled region required by SU.
842 unsigned CritResources = 0;
843
844 // Count critical resources from another region consumed by SU.
845 unsigned DemandedResources = 0;
846
847 SchedResourceDelta() = default;
848
849 bool operator==(const SchedResourceDelta &RHS) const {
850 return CritResources == RHS.CritResources
851 && DemandedResources == RHS.DemandedResources;
852 }
853 bool operator!=(const SchedResourceDelta &RHS) const {
854 return !operator==(RHS);
855 }
856 };
857
858 /// Store the state used by GenericScheduler heuristics, required for the
859 /// lifetime of one invocation of pickNode().
860 struct SchedCandidate {
861 CandPolicy Policy;
862
863 // The best SUnit candidate.
864 SUnit *SU;
865
866 // The reason for this candidate.
867 CandReason Reason;
868
869 // Whether this candidate should be scheduled at top/bottom.
870 bool AtTop;
871
872 // Register pressure values for the best candidate.
873 RegPressureDelta RPDelta;
874
875 // Critical resource consumption of the best candidate.
876 SchedResourceDelta ResDelta;
877
878 SchedCandidate() { reset(CandPolicy()); }
879 SchedCandidate(const CandPolicy &Policy) { reset(Policy); }
22. Calling 'SchedCandidate::reset'
24. Returning from 'SchedCandidate::reset'
880
881 void reset(const CandPolicy &NewPolicy) {
882 Policy = NewPolicy;
883 SU = nullptr;
23. Null pointer value stored to 'TopCand.SU'
884 Reason = NoCand;
885 AtTop = false;
886 RPDelta = RegPressureDelta();
887 ResDelta = SchedResourceDelta();
888 }
889
890 bool isValid() const { return SU; }
891
892 // Copy the status of another candidate without changing policy.
893 void setBest(SchedCandidate &Best) {
894 assert(Best.Reason != NoCand && "uninitialized Sched candidate");
895 SU = Best.SU;
896 Reason = Best.Reason;
897 AtTop = Best.AtTop;
898 RPDelta = Best.RPDelta;
899 ResDelta = Best.ResDelta;
900 }
901
902 void initResourceDelta(const ScheduleDAGMI *DAG,
903 const TargetSchedModel *SchedModel);
904 };
905
906protected:
907 const MachineSchedContext *Context;
908 const TargetSchedModel *SchedModel = nullptr;
909 const TargetRegisterInfo *TRI = nullptr;
910
911 SchedRemainder Rem;
912
913 GenericSchedulerBase(const MachineSchedContext *C) : Context(C) {}
914
915 void setPolicy(CandPolicy &Policy, bool IsPostRA, SchedBoundary &CurrZone,
916 SchedBoundary *OtherZone);
917
918#ifndef NDEBUG
919 void traceCandidate(const SchedCandidate &Cand);
920#endif
921
922private:
923 bool shouldReduceLatency(const CandPolicy &Policy, SchedBoundary &CurrZone,
924 bool ComputeRemLatency, unsigned &RemLatency) const;
925};
926
927// Utility functions used by heuristics in tryCandidate().
928bool tryLess(int TryVal, int CandVal,
929 GenericSchedulerBase::SchedCandidate &TryCand,
930 GenericSchedulerBase::SchedCandidate &Cand,
931 GenericSchedulerBase::CandReason Reason);
932bool tryGreater(int TryVal, int CandVal,
933 GenericSchedulerBase::SchedCandidate &TryCand,
934 GenericSchedulerBase::SchedCandidate &Cand,
935 GenericSchedulerBase::CandReason Reason);
936bool tryLatency(GenericSchedulerBase::SchedCandidate &TryCand,
937 GenericSchedulerBase::SchedCandidate &Cand,
938 SchedBoundary &Zone);
939bool tryPressure(const PressureChange &TryP,
940 const PressureChange &CandP,
941 GenericSchedulerBase::SchedCandidate &TryCand,
942 GenericSchedulerBase::SchedCandidate &Cand,
943 GenericSchedulerBase::CandReason Reason,
944 const TargetRegisterInfo *TRI,
945 const MachineFunction &MF);
946unsigned getWeakLeft(const SUnit *SU, bool isTop);
947int biasPhysReg(const SUnit *SU, bool isTop);
948
949/// GenericScheduler shrinks the unscheduled zone using heuristics to balance
950/// the schedule.
951class GenericScheduler : public GenericSchedulerBase {
952public:
953 GenericScheduler(const MachineSchedContext *C):
954 GenericSchedulerBase(C), Top(SchedBoundary::TopQID, "TopQ"),
955 Bot(SchedBoundary::BotQID, "BotQ") {}
956
957 void initPolicy(MachineBasicBlock::iterator Begin,
958 MachineBasicBlock::iterator End,
959 unsigned NumRegionInstrs) override;
960
961 void dumpPolicy() const override;
962
963 bool shouldTrackPressure() const override {
964 return RegionPolicy.ShouldTrackPressure;
965 }
966
967 bool shouldTrackLaneMasks() const override {
968 return RegionPolicy.ShouldTrackLaneMasks;
969 }
970
971 void initialize(ScheduleDAGMI *dag) override;
972
973 SUnit *pickNode(bool &IsTopNode) override;
974
975 void schedNode(SUnit *SU, bool IsTopNode) override;
976
977 void releaseTopNode(SUnit *SU) override {
978 if (SU->isScheduled)
979 return;
980
981 Top.releaseNode(SU, SU->TopReadyCycle, false);
982 TopCand.SU = nullptr;
983 }
984
985 void releaseBottomNode(SUnit *SU) override {
986 if (SU->isScheduled)
987 return;
988
989 Bot.releaseNode(SU, SU->BotReadyCycle, false);
990 BotCand.SU = nullptr;
991 }
992
993 void registerRoots() override;
994
995protected:
996 ScheduleDAGMILive *DAG = nullptr;
997
998 MachineSchedPolicy RegionPolicy;
999
1000 // State of the top and bottom scheduled instruction boundaries.
1001 SchedBoundary Top;
1002 SchedBoundary Bot;
1003
1004 /// Candidate last picked from Top boundary.
1005 SchedCandidate TopCand;
1006 /// Candidate last picked from Bot boundary.
1007 SchedCandidate BotCand;
1008
1009 void checkAcyclicLatency();
1010
1011 void initCandidate(SchedCandidate &Cand, SUnit *SU, bool AtTop,
1012 const RegPressureTracker &RPTracker,
1013 RegPressureTracker &TempTracker);
1014
1015 virtual bool tryCandidate(SchedCandidate &Cand, SchedCandidate &TryCand,
1016 SchedBoundary *Zone) const;
1017
1018 SUnit *pickNodeBidirectional(bool &IsTopNode);
1019
1020 void pickNodeFromQueue(SchedBoundary &Zone,
1021 const CandPolicy &ZonePolicy,
1022 const RegPressureTracker &RPTracker,
1023 SchedCandidate &Candidate);
1024
1025 void reschedulePhysReg(SUnit *SU, bool isTop);
1026};
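
The strategy callbacks implemented above are driven by a loop in the scheduler. This toy standalone rendering of that contract (Unit and ToyStrategy are invented stand-ins, not LLVM types) makes the NULL-return convention of pickNode explicit; a driver that skipped the null check before touching the unit would have exactly the shape of defect tracked through 'TopCand.SU' in the analyzer steps above.

#include <cstdio>
#include <vector>

struct Unit {
  int Id;
  bool Scheduled;
};

struct ToyStrategy {
  std::vector<Unit *> Ready;

  // Contract from MachineSchedStrategy::pickNode: return NULL when done.
  Unit *pickNode(bool &IsTopNode) {
    if (Ready.empty())
      return nullptr;
    IsTopNode = true; // toy policy: always schedule at the top
    Unit *U = Ready.back();
    Ready.pop_back();
    return U;
  }

  void schedNode(Unit *U, bool /*IsTopNode*/) { U->Scheduled = true; }
};

int main() {
  Unit A = {0, false}, B = {1, false}, C = {2, false};
  ToyStrategy S;
  S.Ready = {&A, &B, &C};

  bool IsTopNode = false;
  // The driver must guard the NULL return before dereferencing the unit.
  while (Unit *U = S.pickNode(IsTopNode)) {
    S.schedNode(U, IsTopNode);
    std::printf("scheduled SU(%d) at %s\n", U->Id, IsTopNode ? "top" : "bottom");
  }
  return 0;
}
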
1027
1028/// PostGenericScheduler - Interface to the scheduling algorithm used by
1029/// ScheduleDAGMI.
1030///
1031/// Callbacks from ScheduleDAGMI:
1032/// initPolicy -> initialize(DAG) -> registerRoots -> pickNode ...
1033class PostGenericScheduler : public GenericSchedulerBase {
1034protected:
1035 ScheduleDAGMI *DAG = nullptr;
1036 SchedBoundary Top;
1037 SmallVector<SUnit*, 8> BotRoots;
1038
1039public:
1040 PostGenericScheduler(const MachineSchedContext *C):
1041 GenericSchedulerBase(C), Top(SchedBoundary::TopQID, "TopQ") {}
1042
1043 ~PostGenericScheduler() override = default;
1044
1045 void initPolicy(MachineBasicBlock::iterator Begin,
1046 MachineBasicBlock::iterator End,
1047 unsigned NumRegionInstrs) override {
1048 /* no configurable policy */
1049 }
1050
1051 /// PostRA scheduling does not track pressure.
1052 bool shouldTrackPressure() const override { return false; }
1053
1054 void initialize(ScheduleDAGMI *Dag) override;
1055
1056 void registerRoots() override;
1057
1058 SUnit *pickNode(bool &IsTopNode) override;
1059
1060 void scheduleTree(unsigned SubtreeID) override {
1061 llvm_unreachable("PostRA scheduler does not support subtree analysis.");
1062 }
1063
1064 void schedNode(SUnit *SU, bool IsTopNode) override;
1065
1066 void releaseTopNode(SUnit *SU) override {
1067 if (SU->isScheduled)
1068 return;
1069 Top.releaseNode(SU, SU->TopReadyCycle, false);
1070 }
1071
1072 // Only called for roots.
1073 void releaseBottomNode(SUnit *SU) override {
1074 BotRoots.push_back(SU);
1075 }
1076
1077protected:
1078 virtual bool tryCandidate(SchedCandidate &Cand, SchedCandidate &TryCand);
1079
1080 void pickNodeFromQueue(SchedCandidate &Cand);
1081};
1082
1083/// Create the standard converging machine scheduler. This will be used as the
1084/// default scheduler if the target does not set a default.
1085/// Adds default DAG mutations.
1086ScheduleDAGMILive *createGenericSchedLive(MachineSchedContext *C);
1087
1088/// Create a generic scheduler with no vreg liveness or DAG mutation passes.
1089ScheduleDAGMI *createGenericSchedPostRA(MachineSchedContext *C);
1090
1091std::unique_ptr<ScheduleDAGMutation>
1092createLoadClusterDAGMutation(const TargetInstrInfo *TII,
1093 const TargetRegisterInfo *TRI);
1094
1095std::unique_ptr<ScheduleDAGMutation>
1096createStoreClusterDAGMutation(const TargetInstrInfo *TII,
1097 const TargetRegisterInfo *TRI);
1098
1099std::unique_ptr<ScheduleDAGMutation>
1100createCopyConstrainDAGMutation(const TargetInstrInfo *TII,
1101 const TargetRegisterInfo *TRI);
1102
1103} // end namespace llvm
1104
1105#endif // LLVM_CODEGEN_MACHINESCHEDULER_H