24#include <unordered_set>
26#define DEBUG_TYPE "spirv-convergence-region-analysis"
33 "SPIRV convergence regions analysis",
true,
true)
38 "convergence-region",
"SPIRV convergence regions analysis",
43template <
typename BasicBlockType,
typename IntrinsicInstType>
44std::optional<IntrinsicInstType *>
46 static_assert(std::is_const_v<IntrinsicInstType> ==
47 std::is_const_v<BasicBlockType>,
48 "Constness must match between input and output.");
49 static_assert(std::is_same_v<BasicBlock, std::remove_const_t<BasicBlockType>>,
50 "Input must be a basic block.");
52 std::is_same_v<IntrinsicInst, std::remove_const_t<IntrinsicInstType>>,
53 "Output type must be an intrinsic instruction.");
84 while (Candidate != NextCandidate && NextCandidate !=
nullptr) {
85 Candidate = NextCandidate;
86 NextCandidate =
nullptr;
92 for (
auto *Child : Candidate->
Children) {
93 if (Child->Blocks.count(Entry) != 0) {
94 NextCandidate = Child;
103std::optional<IntrinsicInst *>
105 return getConvergenceTokenInternal<BasicBlock, IntrinsicInst>(BB);
108std::optional<const IntrinsicInst *>
110 return getConvergenceTokenInternal<const BasicBlock, const IntrinsicInst>(BB);
115 : DT(DT), LI(LI),
Parent(nullptr) {
116 Entry = &
F.getEntryBlock();
131 for ([[maybe_unused]]
auto *BB : this->
Exits)
140 Child->releaseMemory();
147 const std::string Indent(IndentSize,
'\t');
148 dbgs() << Indent <<
this <<
": {\n";
149 dbgs() << Indent <<
" Parent: " <<
Parent <<
"\n";
157 if (
Entry->getName() !=
"")
158 dbgs() << Indent <<
" Entry: " <<
Entry->getName() <<
"\n";
160 dbgs() << Indent <<
" Entry: " <<
Entry <<
"\n";
162 dbgs() << Indent <<
" Exits: { ";
163 for (
const auto &Exit :
Exits) {
164 if (Exit->getName() !=
"")
165 dbgs() << Exit->getName() <<
", ";
167 dbgs() << Exit <<
", ";
171 dbgs() << Indent <<
" Blocks: { ";
173 if (
Block->getName() !=
"")
180 dbgs() << Indent <<
" Children: {\n";
182 Child->dump(IndentSize + 2);
183 dbgs() << Indent <<
" }\n";
185 dbgs() << Indent <<
"}\n";
189class ConvergenceRegionAnalyzer {
192 : DT(DT), LI(LI),
F(
F) {}
203 if (!LI.isLoopHeader(To))
206 auto *L = LI.getLoopFor(To);
207 if (L->contains(From) && L->isLoopLatch(From))
213 std::unordered_set<BasicBlock *>
215 std::function<
bool(
const BasicBlock *)> isMatch)
const {
216 std::unordered_set<BasicBlock *> Output;
222 for (
unsigned i = 0; i < Terminator->getNumSuccessors(); ++i) {
223 auto *To = Terminator->getSuccessor(i);
225 if (isBackEdge(From, To))
228 auto ChildSet = findPathsToMatch(LI, To, isMatch);
229 if (ChildSet.size() == 0)
232 Output.insert(ChildSet.begin(), ChildSet.end());
236 for (
auto *BB : L->getBlocks()) {
245 SmallPtrSet<BasicBlock *, 2>
246 findExitNodes(
const SmallPtrSetImpl<BasicBlock *> &RegionBlocks) {
247 SmallPtrSet<BasicBlock *, 2> Exits;
249 for (
auto *
B : RegionBlocks) {
251 for (
unsigned i = 0; i <
Terminator->getNumSuccessors(); ++i) {
253 if (RegionBlocks.count(Child) == 0)
262 ConvergenceRegionInfo analyze() {
263 ConvergenceRegion *TopLevelRegion =
new ConvergenceRegion(DT, LI,
F);
264 std::queue<Loop *> ToProcess;
268 while (ToProcess.size() != 0) {
269 auto *
L = ToProcess.front();
275 L->getExitingBlocks(LoopExits);
276 if (CT.has_value()) {
277 for (
auto *Exit : LoopExits) {
278 auto N = findPathsToMatch(LI, Exit, [&CT](
const BasicBlock *
block) {
280 if (Token == std::nullopt)
282 return Token.value() == CT.value();
284 RegionBlocks.insert_range(
N);
288 auto RegionExits = findExitNodes(RegionBlocks);
289 ConvergenceRegion *
Region =
new ConvergenceRegion(
290 DT, LI, CT,
L->getHeader(), std::move(RegionBlocks),
291 std::move(RegionExits));
293 assert(
Region->Parent !=
nullptr &&
"This is impossible.");
294 Region->Parent->Children.push_back(Region);
297 return ConvergenceRegionInfo(TopLevelRegion);
310 ConvergenceRegionAnalyzer Analyzer(
F, DT, LI);
311 return Analyzer.analyze();
assert(UImm &&(UImm !=~static_cast< T >(0)) &&"Invalid immediate!")
static GCRegistry::Add< OcamlGC > B("ocaml", "ocaml 3.10-compatible GC")
#define INITIALIZE_PASS_DEPENDENCY(depName)
#define INITIALIZE_PASS_END(passName, arg, name, cfg, analysis)
#define INITIALIZE_PASS_BEGIN(passName, arg, name, cfg, analysis)
static ConvergenceRegion * findParentRegion(ConvergenceRegion *Start, BasicBlock *Entry)
unify loop Fixup each natural loop to have a single exit block
PassT::Result & getResult(IRUnitT &IR, ExtraArgTs... ExtraArgs)
Get the result of an analysis pass for a given IR unit.
LLVM Basic Block Representation.
const Instruction * getTerminator() const LLVM_READONLY
Returns the terminator instruction if the block is well formed or null if the block is not well formed.
Analysis pass which computes a DominatorTree.
Legacy analysis pass which computes a DominatorTree.
Concrete subclass of DominatorTreeBase that is used to compute a normal dominator tree.
Analysis pass that exposes the LoopInfo for a function.
bool isLoopHeader(const BlockT *BB) const
SmallVector< LoopT *, 4 > getLoopsInPreorder() const
Return all of the loops in the function in preorder across the loop nests, with siblings in forward program order.
LoopT * getLoopFor(const BlockT *BB) const
Return the inner most loop that BB lives in.
The legacy pass manager's analysis pass to compute loop information.
AnalysisType & getAnalysis() const
getAnalysis<AnalysisType>() - This function is used by subclasses to get to the analysis information ...
bool runOnFunction(Function &F) override
runOnFunction - Virtual method overridden by subclasses to do the per-function processing of the pass.
SPIRVConvergenceRegionAnalysisWrapperPass()
Result run(Function &F, FunctionAnalysisManager &AM)
SPIRV::ConvergenceRegionInfo Result
SmallVector< ConvergenceRegion * > Children
ConvergenceRegion(DominatorTree &DT, LoopInfo &LI, Function &F)
void dump(const unsigned IndentSize=0) const
SmallPtrSet< BasicBlock *, 2 > Exits
std::optional< IntrinsicInst * > ConvergenceToken
ConvergenceRegion * Parent
SmallPtrSet< BasicBlock *, 8 > Blocks
std::pair< iterator, bool > insert(PtrType Ptr)
Inserts Ptr if and only if there is no element in the container equal to Ptr.
SmallPtrSet - This class implements a set which is optimized for holding SmallSize or less elements.
ConvergenceRegionInfo getConvergenceRegions(Function &F, DominatorTree &DT, LoopInfo &LI)
std::optional< IntrinsicInst * > getConvergenceToken(BasicBlock *BB)
This is an optimization pass for GlobalISel generic memory operations.
decltype(auto) dyn_cast(const From &Val)
dyn_cast<X> - Return the argument parameter cast to the specified type.
constexpr from_range_t from_range
LLVM_ABI raw_ostream & dbgs()
dbgs() - This returns a reference to a raw_ostream for debugging messages.
class LLVM_GSL_OWNER SmallVector
Forward declaration of SmallVector so that calculateSmallVectorDefaultInlinedElements can reference s...
bool isa(const From &Val)
isa<X> - Return true if the parameter to the template is an instance of one of the template type arguments.
OutputIt move(R &&Range, OutputIt Out)
Provide wrappers to std::move which take ranges instead of having to pass begin/end explicitly.
AnalysisManager< Function > FunctionAnalysisManager
Convenience typedef for the Function analysis manager.
Implement std::hash so that hash_code can be used in STL containers.
std::optional< IntrinsicInstType * > getConvergenceTokenInternal(BasicBlockType *BB)
A special type used by analysis passes to provide an address that identifies that particular analysis...