109 using ElemToSuperNodeMap =
118 auto H = getHash(Deps);
119 if (
auto *ExistingSN = findCanonicalSuperNode(
H, Deps)) {
120 for (
auto &[Container, Elems] : Defs) {
121 auto &DstCElems = ExistingSN->Defs[Container];
122 [[maybe_unused]]
size_t ExpectedSize =
123 DstCElems.size() + Elems.size();
124 DstCElems.insert(Elems.begin(), Elems.end());
125 assert(DstCElems.size() == ExpectedSize);
131 std::make_unique<SuperNode>(std::move(Defs), std::move(Deps));
132 CanonicalSNs[
H].push_back(NewSN.get());
136 void coalesce(std::vector<std::unique_ptr<SuperNode>> &SNs,
137 ElemToSuperNodeMap &ElemToSN) {
138 for (
size_t I = 0;
I != SNs.size();) {
140 auto H = getHash(SN->Deps);
141 if (
auto *CanonicalSN = findCanonicalSuperNode(
H, SN->Deps)) {
142 for (
auto &[Container, Elems] : SN->Defs) {
143 CanonicalSN->Defs[Container].insert(Elems.begin(), Elems.end());
144 auto &ContainerElemToSN = ElemToSN[Container];
145 for (
auto &Elem : Elems)
146 ContainerElemToSN[Elem] = CanonicalSN;
151 CanonicalSNs[
H].push_back(SN.get());
157 template <
typename Pred>
void remove(Pred &&Remove) {
158 for (
auto &[Hash, SNs] : CanonicalSNs) {
160 for (
size_t I = 0;
I != SNs.size(); ++
I) {
161 if (Remove(SNs[
I])) {
170 CanonicalSNs.erase(Hash);
179 SortedContainers.reserve(
M.size());
180 for (
auto &[Container, Elems] : M)
181 SortedContainers.push_back(Container);
184 for (
auto &Container : SortedContainers) {
185 auto &ContainerElems =
M.at(Container);
187 ContainerElems.end());
196 SuperNode *findCanonicalSuperNode(hash_code
H,
198 for (
auto *SN : CanonicalSNs[
H])
204 DenseMap<hash_code, SmallVector<SuperNode *>> CanonicalSNs;
218 for (
auto &[Container, Elems] : Defs) {
219 assert(!Elems.empty() &&
"Defs for container must not be empty");
220 auto I = Deps.
find(Container);
223 auto &DepsForContainer =
I->second;
224 for (
auto &Elem : Elems)
225 DepsForContainer.erase(Elem);
226 if (DepsForContainer.empty())
230 Deps.
erase(Container);
231 if (
auto SN = C.addOrCreateSuperNode(std::move(Defs), std::move(Deps)))
232 SNs.push_back(std::move(SN));
235 return std::move(SNs);
240 std::vector<std::unique_ptr<SuperNode>> SNs;
243 class SimplifyResult {
248 const std::vector<std::unique_ptr<SuperNode>> &
superNodes()
const {
254 ElemToSuperNodeMap ElemToSN)
256 std::vector<std::unique_ptr<SuperNode>> SNs;
257 ElemToSuperNodeMap ElemToSN;
261 static SimplifyResult
simplify(std::vector<std::unique_ptr<SuperNode>> SNs) {
263 ElemToSuperNodeMap ElemToSN;
264 for (
auto &SN : SNs) {
265 for (
auto &[Container, Elements] : SN->Defs) {
266 auto &ContainerElemToSN = ElemToSN[Container];
267 for (
auto &
E : Elements)
268 ContainerElemToSN[
E] = SN.get();
272 SuperNodeDepsMap SuperNodeDeps;
273 hoistDeps(SuperNodeDeps, SNs, ElemToSN);
274 propagateSuperNodeDeps(SuperNodeDeps);
275 sinkDeps(SNs, SuperNodeDeps);
280 return {std::move(SNs), std::move(ElemToSN)};
284 std::vector<std::unique_ptr<SuperNode>>
Ready;
285 std::vector<std::unique_ptr<SuperNode>>
Failed;
295 template <
typename GetExternalStateFn>
296 EmitResult
emit(SimplifyResult SR, GetExternalStateFn &&GetExternalState) {
297 auto NewSNs = std::move(SR.SNs);
298 auto ElemToNewSN = std::move(SR.ElemToSN);
301 auto FailedSNs = processExternalDeps(NewSNs, GetExternalState);
304 std::vector<std::unique_ptr<SuperNode>> ModifiedPendingSNs;
305 for (
size_t I = 0;
I != PendingSNs.size();) {
306 auto &SN = PendingSNs[
I];
308 for (
auto &[Container, Elems] : SN->Deps) {
309 auto I = ElemToNewSN.find(Container);
310 if (
I == ElemToNewSN.end())
312 for (
auto Elem : Elems) {
313 if (
I->second.contains(Elem)) {
322 ModifiedPendingSNs.push_back(std::move(SN));
324 PendingSNs.pop_back();
330 SuperNodeDepsMap SuperNodeDeps;
331 hoistDeps(SuperNodeDeps, ModifiedPendingSNs, ElemToNewSN);
333 CoalesceToPendingSNs.remove(
334 [&](SuperNode *SN) {
return SuperNodeDeps.count(SN); });
336 hoistDeps(SuperNodeDeps, NewSNs, ElemToPendingSN);
337 propagateSuperNodeDeps(SuperNodeDeps);
338 sinkDeps(NewSNs, SuperNodeDeps);
339 sinkDeps(ModifiedPendingSNs, SuperNodeDeps);
343 std::vector<std::unique_ptr<SuperNode>> ReadyNodes, FailedNodes;
344 processReadyOrFailed(ModifiedPendingSNs, ReadyNodes, FailedNodes,
345 SuperNodeDeps, ElemToPendingSN, FailedSNs);
346 processReadyOrFailed(NewSNs, ReadyNodes, FailedNodes, SuperNodeDeps,
347 ElemToNewSN, FailedSNs);
349 CoalesceToPendingSNs.coalesce(ModifiedPendingSNs, ElemToPendingSN);
350 CoalesceToPendingSNs.coalesce(NewSNs, ElemToPendingSN);
353 for (
auto &SN : ModifiedPendingSNs)
354 PendingSNs.push_back(std::move(SN));
357 for (
auto &SN : NewSNs) {
358 for (
auto &[Container, Elems] : SN->Defs) {
359 auto &Row = ElemToPendingSN[Container];
360 for (
auto &Elem : Elems)
361 Row[Elem] = SN.get();
363 PendingSNs.push_back(std::move(SN));
366 return {std::move(ReadyNodes), std::move(FailedNodes)};
373 std::vector<std::unique_ptr<SuperNode>>
375 std::vector<std::unique_ptr<SuperNode>> FailedSNs;
377 for (
size_t I = 0;
I != PendingSNs.size();) {
378 auto &PendingSN = PendingSNs[
I];
379 bool FailPendingSN =
false;
380 for (
auto &[Container, Elems] : PendingSN->Deps) {
383 auto I =
Failed.find(Container);
386 for (
auto &Elem : Elems) {
387 if (
I->second.count(Elem)) {
388 FailPendingSN =
true;
394 FailedSNs.push_back(std::move(PendingSN));
395 PendingSN = std::move(PendingSNs.back());
396 PendingSNs.pop_back();
401 for (
auto &SN : FailedSNs) {
402 CoalesceToPendingSNs.remove(
403 [&](SuperNode *SNC) {
return SNC == SN.get(); });
404 for (
auto &[Container, Elems] : SN->Defs) {
405 assert(ElemToPendingSN.count(Container));
406 auto &CElems = ElemToPendingSN[Container];
407 for (
auto &Elem : Elems)
410 ElemToPendingSN.erase(Container);
425 for (
auto &PendingSN : PendingSNs) {
426 if (PendingSN->Deps.empty())
427 ErrLog() <<
"Pending SN " << PendingSN.get() <<
" has empty dep set.\n";
429 bool BadElem =
false;
430 for (
auto &[Container, Elems] : PendingSN->Deps) {
431 auto I = ElemToPendingSN.find(Container);
432 if (
I == ElemToPendingSN.end())
435 ErrLog() <<
"Pending SN " << PendingSN.get()
436 <<
" has dependence map entry for " << Container
437 <<
" with empty element set.\n";
438 for (
auto &Elem : Elems) {
439 if (
I->second.count(Elem)) {
440 ErrLog() <<
"Pending SN " << PendingSN.get()
441 <<
" has dependence on emitted element ( " << Container
442 <<
", " << Elem <<
")\n";
452 for (
auto &[Container, Elems] : PendingSN->Defs) {
454 ErrLog() <<
"Pending SN " << PendingSN.get()
455 <<
" has def map entry for " << Container
456 <<
" with empty element set.\n";
457 DefCount += Elems.size();
458 auto I = ElemToPendingSN.find(Container);
459 if (
I == ElemToPendingSN.end())
460 ErrLog() <<
"Pending SN " << PendingSN.get() <<
" has "
461 << Elems.size() <<
" defs in container " << Container
462 <<
" not covered by ElemsToPendingSN.\n";
464 for (
auto &Elem : Elems) {
465 auto J =
I->second.find(Elem);
466 if (J ==
I->second.end())
467 ErrLog() <<
"Pending SN " << PendingSN.get() <<
" has element ("
468 << Container <<
", " << Elem
469 <<
") not covered by ElemsToPendingSN.\n";
470 else if (J->second != PendingSN.get())
471 ErrLog() <<
"ElemToPendingSN value invalid for (" << Container
472 <<
", " << Elem <<
")\n";
478 size_t DefCount2 = 0;
479 for (
auto &[Container, Elems] : ElemToPendingSN)
480 DefCount2 += Elems.size();
482 assert(DefCount2 >= DefCount);
483 if (DefCount2 != DefCount)
484 ErrLog() <<
"ElemToPendingSN contains extra elements.\n";
495 static void hoistDeps(SuperNodeDepsMap &SuperNodeDeps,
496 std::vector<std::unique_ptr<SuperNode>> &SNs,
497 ElemToSuperNodeMap &ElemToSN) {
498 for (
auto &SN : SNs) {
499 auto &SNDeps = SuperNodeDeps[SN.get()];
500 for (
auto &[DefContainer, DefElems] : ElemToSN) {
501 auto I = SN->Deps.find(DefContainer);
502 if (
I == SN->Deps.end())
504 for (
auto &[DefElem, DefSN] : DefElems)
505 if (
I->second.erase(DefElem))
506 SNDeps.insert(DefSN);
507 if (
I->second.empty())
514 static void propagateSuperNodeDeps(SuperNodeDepsMap &SuperNodeDeps) {
515 for (
auto &[SN, Deps] : SuperNodeDeps) {
516 DenseSet<SuperNode *> Reachable({SN});
519 while (!Worklist.empty()) {
520 auto *DepSN = Worklist.pop_back_val();
521 if (!Reachable.insert(DepSN).second)
523 auto I = SuperNodeDeps.find(DepSN);
524 if (
I == SuperNodeDeps.end())
526 for (
auto *DepSNDep :
I->second)
527 Worklist.push_back(DepSNDep);
530 Deps = std::move(Reachable);
535 static void sinkDeps(std::vector<std::unique_ptr<SuperNode>> &SNs,
536 SuperNodeDepsMap &SuperNodeDeps) {
537 for (
auto &SN : SNs) {
538 auto I = SuperNodeDeps.find(SN.get());
539 if (
I == SuperNodeDeps.end())
542 for (
auto *DepSN :
I->second)
543 for (
auto &[Container, Elems] : DepSN->Deps)
544 SN->Deps[Container].insert(Elems.begin(), Elems.end());
548 template <
typename GetExternalStateFn>
549 static std::vector<SuperNode *>
550 processExternalDeps(std::vector<std::unique_ptr<SuperNode>> &SNs,
551 GetExternalStateFn &GetExternalState) {
552 std::vector<SuperNode *> FailedSNs;
553 for (
auto &SN : SNs) {
554 bool SNHasError =
false;
556 for (
auto &[Container, Elems] : SN->Deps) {
558 for (
auto &Elem : Elems) {
559 switch (GetExternalState(Container, Elem)) {
563 ElemToRemove.push_back(Elem);
566 ElemToRemove.push_back(Elem);
571 for (
auto &Elem : ElemToRemove)
574 ContainersToRemove.push_back(Container);
576 for (
auto &Container : ContainersToRemove)
577 SN->Deps.erase(Container);
579 FailedSNs.push_back(SN.get());
585 void processReadyOrFailed(std::vector<std::unique_ptr<SuperNode>> &SNs,
586 std::vector<std::unique_ptr<SuperNode>> &
Ready,
587 std::vector<std::unique_ptr<SuperNode>> &
Failed,
588 SuperNodeDepsMap &SuperNodeDeps,
589 ElemToSuperNodeMap &ElemToSNs,
590 std::vector<SuperNode *> FailedSNs) {
591 for (
size_t I = 0;
I != SNs.size();) {
594 bool SNFailed =
false;
595 assert(SuperNodeDeps.count(SN.get()));
596 auto &SNSuperNodeDeps = SuperNodeDeps[SN.get()];
597 for (
auto *FailedSN : FailedSNs) {
598 if (FailedSN == SN.get() || SNSuperNodeDeps.count(FailedSN)) {
604 bool SNReady = SN->Deps.empty();
606 if (SNReady || SNFailed) {
616 std::vector<std::unique_ptr<SuperNode>> PendingSNs;
617 ElemToSuperNodeMap ElemToPendingSN;
618 Coalescer CoalesceToPendingSNs;