LLVM 20.0.0git
LatencyPriorityQueue.cpp
Go to the documentation of this file.
1//===---- LatencyPriorityQueue.cpp - A latency-oriented priority queue ----===//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8//
9// This file implements the LatencyPriorityQueue class, which is a
10// SchedulingPriorityQueue that schedules using latency information to
11// reduce the length of the critical path through the basic block.
12//
13//===----------------------------------------------------------------------===//
14
16#include "llvm/Config/llvm-config.h"
17#include "llvm/Support/Debug.h"
19using namespace llvm;
20
21#define DEBUG_TYPE "scheduler"
22
23bool latency_sort::operator()(const SUnit *LHS, const SUnit *RHS) const {
24 // The isScheduleHigh flag allows nodes with wraparound dependencies that
25 // cannot easily be modeled as edges with latencies to be scheduled as
26 // soon as possible in a top-down schedule.
27 if (LHS->isScheduleHigh && !RHS->isScheduleHigh)
28 return false;
29 if (!LHS->isScheduleHigh && RHS->isScheduleHigh)
30 return true;
31
32 unsigned LHSNum = LHS->NodeNum;
33 unsigned RHSNum = RHS->NodeNum;
34
35 // The most important heuristic is scheduling the critical path.
36 unsigned LHSLatency = PQ->getLatency(LHSNum);
37 unsigned RHSLatency = PQ->getLatency(RHSNum);
38 if (LHSLatency < RHSLatency) return true;
39 if (LHSLatency > RHSLatency) return false;
40
41 // After that, if two nodes have identical latencies, look to see if one will
42 // unblock more other nodes than the other.
43 unsigned LHSBlocked = PQ->getNumSolelyBlockNodes(LHSNum);
44 unsigned RHSBlocked = PQ->getNumSolelyBlockNodes(RHSNum);
45 if (LHSBlocked < RHSBlocked) return true;
46 if (LHSBlocked > RHSBlocked) return false;
47
48 // Finally, just to provide a stable ordering, use the node number as a
49 // deciding factor.
50 return RHSNum < LHSNum;
51}
52
53
54/// getSingleUnscheduledPred - If there is exactly one unscheduled predecessor
55/// of SU, return it, otherwise return null.
56SUnit *LatencyPriorityQueue::getSingleUnscheduledPred(SUnit *SU) {
57 SUnit *OnlyAvailablePred = nullptr;
58 for (const SDep &P : SU->Preds) {
59 SUnit &Pred = *P.getSUnit();
60 if (!Pred.isScheduled) {
61 // We found an available, but not scheduled, predecessor. If it's the
62 // only one we have found, keep track of it... otherwise give up.
63 if (OnlyAvailablePred && OnlyAvailablePred != &Pred)
64 return nullptr;
65 OnlyAvailablePred = &Pred;
66 }
67 }
68
69 return OnlyAvailablePred;
70}
71
73 // Look at all of the successors of this node. Count the number of nodes that
74 // this node is the sole unscheduled node for.
75 unsigned NumNodesBlocking = 0;
76 for (const SDep &Succ : SU->Succs)
77 if (getSingleUnscheduledPred(Succ.getSUnit()) == SU)
78 ++NumNodesBlocking;
79 NumNodesSolelyBlocking[SU->NodeNum] = NumNodesBlocking;
80
81 Queue.push_back(SU);
82}
83
84
85// scheduledNode - As nodes are scheduled, we look to see if there are any
86// successor nodes that have a single unscheduled predecessor. If so, that
87// single predecessor has a higher priority, since scheduling it will make
88// the node available.
90 for (const SDep &Succ : SU->Succs)
91 AdjustPriorityOfUnscheduledPreds(Succ.getSUnit());
92}
93
94/// AdjustPriorityOfUnscheduledPreds - One of the predecessors of SU was just
95/// scheduled. If SU is not itself available, then there is at least one
96/// predecessor node that has not been scheduled yet. If SU has exactly ONE
97/// unscheduled predecessor, we want to increase its priority: it getting
98/// scheduled will make this node available, so it is better than some other
99/// node of the same priority that will not make a node available.
100void LatencyPriorityQueue::AdjustPriorityOfUnscheduledPreds(SUnit *SU) {
101 if (SU->isAvailable) return; // All preds scheduled.
102
103 SUnit *OnlyAvailablePred = getSingleUnscheduledPred(SU);
104 if (!OnlyAvailablePred || !OnlyAvailablePred->isAvailable) return;
105
106 // Okay, we found a single predecessor that is available, but not scheduled.
107 // Since it is available, it must be in the priority queue. First remove it.
108 remove(OnlyAvailablePred);
109
110 // Reinsert the node into the priority queue, which recomputes its
111 // NumNodesSolelyBlocking value.
112 push(OnlyAvailablePred);
113}
114
116 if (empty()) return nullptr;
117 std::vector<SUnit *>::iterator Best = Queue.begin();
118 for (std::vector<SUnit *>::iterator I = std::next(Queue.begin()),
119 E = Queue.end(); I != E; ++I)
120 if (Picker(*Best, *I))
121 Best = I;
122 SUnit *V = *Best;
123 if (Best != std::prev(Queue.end()))
124 std::swap(*Best, Queue.back());
125 Queue.pop_back();
126 return V;
127}
128
130 assert(!Queue.empty() && "Queue is empty!");
131 std::vector<SUnit *>::iterator I = find(Queue, SU);
132 assert(I != Queue.end() && "Queue doesn't contain the SU being removed!");
133 if (I != std::prev(Queue.end()))
134 std::swap(*I, Queue.back());
135 Queue.pop_back();
136}
137
138#if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)
140 dbgs() << "Latency Priority Queue\n";
141 dbgs() << " Number of Queue Entries: " << Queue.size() << "\n";
142 for (const SUnit *SU : Queue) {
143 dbgs() << " ";
144 DAG->dumpNode(*SU);
145 }
146}
147#endif
#define LLVM_DUMP_METHOD
Mark debug helper function definitions like dump() that should not be stripped from debug builds.
Definition: Compiler.h:533
#define I(x, y, z)
Definition: MD5.cpp:58
#define P(N)
const MachineOperand & RHS
assert(ImpDefSCC.getReg()==AMDGPU::SCC &&ImpDefSCC.isDef())
Value * LHS
unsigned getNumSolelyBlockNodes(unsigned NodeNum) const
void push(SUnit *U) override
LLVM_DUMP_METHOD void dump(ScheduleDAG *DAG) const override
void remove(SUnit *SU) override
void scheduledNode(SUnit *SU) override
As each node is scheduled, this method is invoked.
unsigned getLatency(unsigned NodeNum) const
bool empty() const override
Scheduling dependency.
Definition: ScheduleDAG.h:49
SUnit * getSUnit() const
Definition: ScheduleDAG.h:498
Scheduling unit. This is a node in the scheduling DAG.
Definition: ScheduleDAG.h:242
unsigned NodeNum
Entry # of node in the node vector.
Definition: ScheduleDAG.h:270
bool isScheduled
True once scheduled.
Definition: ScheduleDAG.h:296
bool isAvailable
True once available.
Definition: ScheduleDAG.h:295
SmallVector< SDep, 4 > Succs
All sunit successors.
Definition: ScheduleDAG.h:263
SmallVector< SDep, 4 > Preds
All sunit predecessors.
Definition: ScheduleDAG.h:262
virtual void dumpNode(const SUnit &SU) const =0
This is an optimization pass for GlobalISel generic memory operations.
Definition: AddressRanges.h:18
auto find(R &&Range, const T &Val)
Provide wrappers to std::find which take ranges instead of having to pass begin/end explicitly.
Definition: STLExtras.h:1742
raw_ostream & dbgs()
dbgs() - This returns a reference to a raw_ostream for debugging messages.
Definition: Debug.cpp:163
void swap(llvm::BitVector &LHS, llvm::BitVector &RHS)
Implement std::swap in terms of BitVector swap.
Definition: BitVector.h:860
LatencyPriorityQueue * PQ
bool operator()(const SUnit *LHS, const SUnit *RHS) const