LatencyPriorityQueue.cpp
//===---- LatencyPriorityQueue.cpp - A latency-oriented priority queue ----===//
//
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//
//===----------------------------------------------------------------------===//
//
// This file implements the LatencyPriorityQueue class, which is a
// SchedulingPriorityQueue that schedules using latency information to
// reduce the length of the critical path through the basic block.
//
//===----------------------------------------------------------------------===//

#include "llvm/CodeGen/LatencyPriorityQueue.h"
#include "llvm/Config/llvm-config.h"
#include "llvm/Support/Debug.h"
#include "llvm/Support/raw_ostream.h"
using namespace llvm;

#define DEBUG_TYPE "scheduler"

bool latency_sort::operator()(const SUnit *LHS, const SUnit *RHS) const {
  // The isScheduleHigh flag allows nodes with wraparound dependencies that
  // cannot easily be modeled as edges with latencies to be scheduled as
  // soon as possible in a top-down schedule.
  if (LHS->isScheduleHigh && !RHS->isScheduleHigh)
    return false;
  if (!LHS->isScheduleHigh && RHS->isScheduleHigh)
    return true;

  unsigned LHSNum = LHS->NodeNum;
  unsigned RHSNum = RHS->NodeNum;

  // The most important heuristic is scheduling the critical path.
  unsigned LHSLatency = PQ->getLatency(LHSNum);
  unsigned RHSLatency = PQ->getLatency(RHSNum);
  if (LHSLatency < RHSLatency) return true;
  if (LHSLatency > RHSLatency) return false;

  // After that, if two nodes have identical latencies, look to see if one will
  // unblock more other nodes than the other.
  unsigned LHSBlocked = PQ->getNumSolelyBlockNodes(LHSNum);
  unsigned RHSBlocked = PQ->getNumSolelyBlockNodes(RHSNum);
  if (LHSBlocked < RHSBlocked) return true;
  if (LHSBlocked > RHSBlocked) return false;

  // Finally, just to provide a stable ordering, use the node number as a
  // deciding factor.
  return RHSNum < LHSNum;
}
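// Illustration (hypothetical latencies): pop() below drives this comparator
// through Picker, and Picker(*Best, *I) == true makes *I the new Best, so
// returning true means RHS is the preferred candidate. If, say,
// PQ->getLatency(LHS->NodeNum) == 3 and PQ->getLatency(RHS->NodeNum) == 7,
// the call returns true and the node with the deeper critical path is
// scheduled first; ties fall through to the solely-blocked count and finally
// to the lower NodeNum.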


/// getSingleUnscheduledPred - If there is exactly one unscheduled predecessor
/// of SU, return it, otherwise return null.
SUnit *LatencyPriorityQueue::getSingleUnscheduledPred(SUnit *SU) {
  SUnit *OnlyAvailablePred = nullptr;
  for (const SDep &P : SU->Preds) {
    SUnit &Pred = *P.getSUnit();
    if (!Pred.isScheduled) {
      // We found an available, but not scheduled, predecessor. If it's the
      // only one we have found, keep track of it... otherwise give up.
      if (OnlyAvailablePred && OnlyAvailablePred != &Pred)
        return nullptr;
      OnlyAvailablePred = &Pred;
    }
  }

  return OnlyAvailablePred;
}
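// Note: the null return covers two different situations, namely "every
// predecessor is already scheduled" and "two or more predecessors are still
// unscheduled". The callers below only act on the exactly-one case (push()
// compares the result against SU, AdjustPriorityOfUnscheduledPreds() bails
// out on null), so the ambiguity is harmless.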

void LatencyPriorityQueue::push(SUnit *SU) {
  // Look at all of the successors of this node. Count the number of nodes that
  // this node is the sole unscheduled node for.
  unsigned NumNodesBlocking = 0;
  for (const SDep &Succ : SU->Succs)
    if (getSingleUnscheduledPred(Succ.getSUnit()) == SU)
      ++NumNodesBlocking;
  NumNodesSolelyBlocking[SU->NodeNum] = NumNodesBlocking;

  Queue.push_back(SU);
}
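// Note: NumNodesSolelyBlocking is recomputed from scratch on every push rather
// than maintained incrementally; that is what lets
// AdjustPriorityOfUnscheduledPreds() below refresh a node's priority with a
// simple remove()/push() pair. For a hypothetical SU with three successors,
// two of which have SU as their only unscheduled predecessor, the stored count
// is 2, and latency_sort reads it back through getNumSolelyBlockNodes().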


// scheduledNode - As nodes are scheduled, we look to see if there are any
// successor nodes that have a single unscheduled predecessor. If so, that
// single predecessor has a higher priority, since scheduling it will make
// the node available.
void LatencyPriorityQueue::scheduledNode(SUnit *SU) {
  for (const SDep &Succ : SU->Succs)
    AdjustPriorityOfUnscheduledPreds(Succ.getSUnit());
}

/// AdjustPriorityOfUnscheduledPreds - One of the predecessors of SU was just
/// scheduled. If SU is not itself available, then there is at least one
/// predecessor node that has not been scheduled yet. If SU has exactly ONE
/// unscheduled predecessor, we want to increase its priority: it getting
/// scheduled will make this node available, so it is better than some other
/// node of the same priority that will not make a node available.
void LatencyPriorityQueue::AdjustPriorityOfUnscheduledPreds(SUnit *SU) {
  if (SU->isAvailable) return; // All preds scheduled.

  SUnit *OnlyAvailablePred = getSingleUnscheduledPred(SU);
  if (!OnlyAvailablePred || !OnlyAvailablePred->isAvailable) return;

  // Okay, we found a single predecessor that is available, but not scheduled.
  // Since it is available, it must be in the priority queue. First remove it.
  remove(OnlyAvailablePred);

  // Reinsert the node into the priority queue, which recomputes its
  // NumNodesSolelyBlocking value.
  push(OnlyAvailablePred);
}
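// Illustration (hypothetical nodes): suppose B has predecessors A1 and A2 and
// A1 was just scheduled. scheduledNode(A1) calls this function on B; if B is
// not yet available and A2 is sitting in the queue, A2 is now B's single
// unscheduled predecessor, so the remove()/push() pair above reinserts A2 with
// a NumNodesSolelyBlocking count that now includes B, raising A2's priority in
// latency_sort's second comparison.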

SUnit *LatencyPriorityQueue::pop() {
  if (empty()) return nullptr;
  std::vector<SUnit *>::iterator Best = Queue.begin();
  for (std::vector<SUnit *>::iterator I = std::next(Queue.begin()),
       E = Queue.end(); I != E; ++I)
    if (Picker(*Best, *I))
      Best = I;
  SUnit *V = *Best;
  if (Best != std::prev(Queue.end()))
    std::swap(*Best, Queue.back());
  Queue.pop_back();
  return V;
}
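// Note: despite the class name, the underlying container is a plain
// std::vector<SUnit *> that pop() scans linearly, swapping the chosen element
// to the back so it can be removed in constant time. Selection is therefore
// O(n) per pop, which keeps remove() and the remove()/push() reprioritization
// cheap and is a reasonable trade-off for the basic-block-sized regions this
// scheduler targets (see the file header).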

void LatencyPriorityQueue::remove(SUnit *SU) {
  assert(!Queue.empty() && "Queue is empty!");
  std::vector<SUnit *>::iterator I = find(Queue, SU);
  assert(I != Queue.end() && "Queue doesn't contain the SU being removed!");
  if (I != std::prev(Queue.end()))
    std::swap(*I, Queue.back());
  Queue.pop_back();
}

#if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)
LLVM_DUMP_METHOD void LatencyPriorityQueue::dump(ScheduleDAG *DAG) const {
  dbgs() << "Latency Priority Queue\n";
  dbgs() << "  Number of Queue Entries: " << Queue.size() << "\n";
  for (const SUnit *SU : Queue) {
    dbgs() << "    ";
    DAG->dumpNode(*SU);
  }
}
#endif
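
For context, here is a minimal sketch of how a top-down list scheduler might drive this queue. It assumes only the interface visible in this file and in LatencyPriorityQueue.h (initNodes, push, pop, empty, scheduledNode); the function name scheduleTopDown and the seeding policy are illustrative, not taken from LLVM.

#include "llvm/CodeGen/LatencyPriorityQueue.h"
#include <vector>
using namespace llvm;

// Hypothetical driver: schedule every SUnit in a basic block top-down.
static void scheduleTopDown(std::vector<SUnit> &SUnits) {
  LatencyPriorityQueue AvailableQueue;
  AvailableQueue.initNodes(SUnits); // sizes NumNodesSolelyBlocking

  // Seed the queue with nodes that have no predecessors at all.
  for (SUnit &SU : SUnits)
    if (SU.Preds.empty()) {
      SU.isAvailable = true;
      AvailableQueue.push(&SU);
    }

  while (!AvailableQueue.empty()) {
    SUnit *SU = AvailableQueue.pop(); // best candidate under latency_sort
    SU->isScheduled = true;
    AvailableQueue.scheduledNode(SU); // may boost a sole unscheduled pred
    // ...emit SU, then mark successors whose predecessors are all scheduled
    // as available and push() them...
  }
}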