doxygen/UnifyLoopExits_8cpp_source.html

//===- UnifyLoopExits.cpp - Redirect exiting edges to one block -*- C++ -*-===//

//

// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.

// See https://llvm.org/LICENSE.txt for license information.

// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception

//

//===----------------------------------------------------------------------===//

//

// For each natural loop with multiple exit blocks, this pass creates a new

// block N such that all exiting blocks now branch to N, and then control flow

// is redistributed to all the original exit blocks.

//

// Limitation: This assumes that all terminators in the CFG are direct branches

//             (the "br" instruction). The presence of any other control flow

//             such as indirectbr, switch or callbr will cause an assert.

//

//===----------------------------------------------------------------------===//


#include "llvm/Transforms/Utils/UnifyLoopExits.h"

#include "llvm/ADT/MapVector.h"

#include "llvm/Analysis/DomTreeUpdater.h"

#include "llvm/Analysis/LoopInfo.h"

#include "llvm/IR/Constants.h"

#include "llvm/IR/Dominators.h"

#include "llvm/InitializePasses.h"

#include "llvm/Support/CommandLine.h"

#include "llvm/Transforms/Utils.h"

#include "llvm/Transforms/Utils/BasicBlockUtils.h"

#include "llvm/Transforms/Utils/ControlFlowUtils.h"


#define DEBUG_TYPE "unify-loop-exits"


using namespace llvm;


// Hidden command-line knob (default 32). Its value is handed to
// ControlFlowHub::finalize() when the exits of a loop are unified.
static cl::opt<unsigned> MaxBooleansInControlFlowHub(
    "max-booleans-in-control-flow-hub",
    cl::desc("Set the maximum number of outgoing blocks for using a boolean "
             "value to record the exiting block in the ControlFlowHub."),
    cl::Hidden, cl::init(32));


namespace {

struct UnifyLoopExitsLegacyPass : public FunctionPass {

  static char ID;

  UnifyLoopExitsLegacyPass() : FunctionPass(ID) {

    initializeUnifyLoopExitsLegacyPassPass(*PassRegistry::getPassRegistry());

  }


  void getAnalysisUsage(AnalysisUsage &AU) const override {

    AU.addRequired<LoopInfoWrapperPass>();

    AU.addRequired<DominatorTreeWrapperPass>();

    AU.addPreserved<LoopInfoWrapperPass>();

    AU.addPreserved<DominatorTreeWrapperPass>();

  }


  bool runOnFunction(Function &F) override;

};

} // namespace


// Definition of the static pass identifier that the legacy pass constructor
// hands to FunctionPass.
char UnifyLoopExitsLegacyPass::ID = 0;

// Allocates a new UnifyLoopExitsLegacyPass and returns it through its
// FunctionPass base pointer.
FunctionPass *llvm::createUnifyLoopExitsPass() {
  FunctionPass *LegacyPass = new UnifyLoopExitsLegacyPass();
  return LegacyPass;
}


// Pass-registration boilerplate for UnifyLoopExitsLegacyPass. The BEGIN/END
// macros take (passName, arg, name, cfg, analysis): here the argument string
// is "unify-loop-exits" and both the cfg and analysis flags are false. The
// DEPENDENCY lines in between name the dominator tree and loop info wrapper
// passes, matching the analyses requested in getAnalysisUsage().
INITIALIZE_PASS_BEGIN(UnifyLoopExitsLegacyPass, "unify-loop-exits",

                      "Fixup each natural loop to have a single exit block",

                      false /* Only looks at CFG */, false /* Analysis Pass */)

INITIALIZE_PASS_DEPENDENCY(DominatorTreeWrapperPass)

INITIALIZE_PASS_DEPENDENCY(LoopInfoWrapperPass)

INITIALIZE_PASS_END(UnifyLoopExitsLegacyPass, "unify-loop-exits",

                    "Fixup each natural loop to have a single exit block",

                    false /* Only looks at CFG */, false /* Analysis Pass */)


// The current transform introduces new control flow paths which may break the

// SSA requirement that every def must dominate all its uses. For example,

// consider a value D defined inside the loop that is used by some instruction

// U outside the loop. It follows that D dominates U, since the original

// program has valid SSA form. After merging the exits, all paths from D to U

// now flow through the unified exit block. In addition, there may be other

// paths that do not pass through D, but now reach the unified exit

// block. Thus, D no longer dominates U.

//

// Restore the dominance by creating a phi for each such D at the new unified

// loop exit. But when doing this, ignore any uses U that are in the new unified

// loop exit, since those were introduced specially when the block was created.

//

// The use of SSAUpdater seems like overkill for this operation. The location

// for creating the new PHI is well-known, and also the set of incoming blocks

// to the new PHI.

static void restoreSSA(const DominatorTree &DT, const Loop *L,

                       SmallVectorImpl<BasicBlock *> &Incoming,

                       BasicBlock *LoopExitBlock) {

  using InstVector = SmallVector<Instruction *, 8>;

  using IIMap = MapVector<Instruction *, InstVector>;

  IIMap ExternalUsers;

  for (auto *BB : L->blocks()) {

    for (auto &I : *BB) {

      for (auto &U : I.uses()) {

        auto UserInst = cast<Instruction>(U.getUser());

        auto UserBlock = UserInst->getParent();

        if (UserBlock == LoopExitBlock)

          continue;

        if (L->contains(UserBlock))

          continue;

        LLVM_DEBUG(dbgs() << "added ext use for " << I.getName() << "("

                          << BB->getName() << ")"

                          << ": " << UserInst->getName() << "("

                          << UserBlock->getName() << ")"

                          << "\n");

        ExternalUsers[&I].push_back(UserInst);

      }

    }

  }


  for (const auto &II : ExternalUsers) {

    // For each Def used outside the loop, create NewPhi in

    // LoopExitBlock. NewPhi receives Def only along exiting blocks that

    // dominate it, while the remaining values are undefined since those paths

    // didn't exist in the original CFG.

    auto Def = II.first;

    LLVM_DEBUG(dbgs() << "externally used: " << Def->getName() << "\n");

    auto NewPhi =

        PHINode::Create(Def->getType(), Incoming.size(),

                        Def->getName() + ".moved", LoopExitBlock->begin());

    for (auto *In : Incoming) {

      LLVM_DEBUG(dbgs() << "predecessor " << In->getName() << ": ");

      if (Def->getParent() == In || DT.dominates(Def, In)) {

        LLVM_DEBUG(dbgs() << "dominated\n");

        NewPhi->addIncoming(Def, In);

      } else {

        LLVM_DEBUG(dbgs() << "not dominated\n");

        NewPhi->addIncoming(PoisonValue::get(Def->getType()), In);

      }

    }


    LLVM_DEBUG(dbgs() << "external users:");

    for (auto *U : II.second) {

      LLVM_DEBUG(dbgs() << " " << U->getName());

      U->replaceUsesOfWith(Def, NewPhi);

    }

    LLVM_DEBUG(dbgs() << "\n");

  }

}


// Routes every exiting edge of loop L through a ControlFlowHub that is
// finalized with the block-name prefix "loop.exit", then calls restoreSSA()
// for values that are defined in the loop and used outside of it. Guard
// blocks reported by the hub are added to the parent loop of L, if any.
//
// Every exiting block must end in a BranchInst; this is enforced by cast<>.
//
// Returns true if the loop was transformed. Returns false, without touching
// the IR, when the exiting edges of L reach fewer than two distinct blocks:
// the transform is only meant for loops with multiple exit blocks, and
// reporting a change for an untouched loop would needlessly invalidate
// analyses in the callers.
static bool unifyLoopExits(DominatorTree &DT, LoopInfo &LI, Loop *L) {
  // To unify the loop exits, we need a list of the exiting blocks as
  // well as exit blocks. The functions for locating these lists both
  // traverse the entire loop body. It is more efficient to first
  // locate the exiting blocks and then examine their successors to
  // locate the exit blocks.
  SmallVector<BasicBlock *, 8> ExitingBlocks;
  L->getExitingBlocks(ExitingBlocks);

  // Yields successor number Idx of Branch if that successor lies outside the
  // loop; yields nullptr if it is inside the loop or does not exist (the
  // second successor of an unconditional branch).
  auto GetExitSuccessor = [L](const BranchInst *Branch,
                              unsigned Idx) -> BasicBlock * {
    if (Idx >= Branch->getNumSuccessors())
      return nullptr;
    BasicBlock *Succ = Branch->getSuccessor(Idx);
    return L->contains(Succ) ? nullptr : Succ;
  };

  // Bail out before building the hub unless the exiting edges lead to at
  // least two different blocks. Remembering the first exit seen is enough to
  // detect a second, different one.
  BasicBlock *FirstExit = nullptr;
  bool HasMultipleExits = false;
  for (auto *BB : ExitingBlocks) {
    auto *Branch = cast<BranchInst>(BB->getTerminator());
    for (unsigned Idx = 0; Idx < 2; ++Idx) {
      BasicBlock *Exit = GetExitSuccessor(Branch, Idx);
      if (!Exit)
        continue;
      if (!FirstExit)
        FirstExit = Exit;
      else if (Exit != FirstExit)
        HasMultipleExits = true;
    }
  }
  if (!HasMultipleExits) {
    LLVM_DEBUG(dbgs() << "loop does not have multiple exits; nothing to do\n");
    return false;
  }

  // Redirect exiting edges through a control flow hub.
  ControlFlowHub CHub;
  for (auto *BB : ExitingBlocks) {
    auto *Branch = cast<BranchInst>(BB->getTerminator());
    BasicBlock *Succ0 = GetExitSuccessor(Branch, 0);
    BasicBlock *Succ1 = GetExitSuccessor(Branch, 1);
    CHub.addBranch(BB, Succ0, Succ1);

    LLVM_DEBUG(dbgs() << "Added exiting branch: " << BB->getName() << " -> {"
                      << (Succ0 ? Succ0->getName() : "<none>") << ", "
                      << (Succ1 ? Succ1->getName() : "<none>") << "}\n");
  }

  SmallVector<BasicBlock *, 8> GuardBlocks;
  DomTreeUpdater DTU(DT, DomTreeUpdater::UpdateStrategy::Eager);
  BasicBlock *LoopExitBlock = CHub.finalize(
      &DTU, GuardBlocks, "loop.exit", MaxBooleansInControlFlowHub.getValue());

  // The exiting blocks are the incoming blocks of the phis created here.
  restoreSSA(DT, L, ExitingBlocks, LoopExitBlock);

#if defined(EXPENSIVE_CHECKS)
  assert(DT.verify(DominatorTree::VerificationLevel::Full));
#else
  assert(DT.verify(DominatorTree::VerificationLevel::Fast));
#endif // EXPENSIVE_CHECKS
  L->verifyLoop();

  // The guard blocks were created outside the loop, so they need to become
  // members of the parent loop.
  if (auto ParentLoop = L->getParentLoop()) {
    for (auto *G : GuardBlocks) {
      ParentLoop->addBasicBlockToLoop(G, LI);
    }
    ParentLoop->verifyLoop();
  }

#if defined(EXPENSIVE_CHECKS)
  LI.verify(DT);
#endif // EXPENSIVE_CHECKS

  return true;
}


// Shared driver for both pass-manager front ends: applies unifyLoopExits() to
// every loop known to LI, visiting them in preorder, and reports whether any
// of those calls returned true.
static bool runImpl(LoopInfo &LI, DominatorTree &DT) {
  bool AnyLoopChanged = false;

  // The preorder list is taken once, before the first loop is processed.
  const auto PreorderLoops = LI.getLoopsInPreorder();
  for (Loop *Current : PreorderLoops) {
    LLVM_DEBUG(dbgs() << "Processing loop:\n"; Current->print(dbgs()));
    if (unifyLoopExits(DT, LI, Current))
      AnyLoopChanged = true;
  }

  return AnyLoopChanged;
}


// Legacy pass-manager entry point: fetches loop info and the dominator tree
// from the wrapper passes and forwards them to runImpl(). In assert-enabled
// builds the function is first checked with hasOnlySimpleTerminator().
bool UnifyLoopExitsLegacyPass::runOnFunction(Function &F) {
  LLVM_DEBUG(dbgs() << "===== Unifying loop exits in function " << F.getName()
                    << "\n");

  LoopInfo &LoopData = getAnalysis<LoopInfoWrapperPass>().getLoopInfo();
  DominatorTree &DomTree =
      getAnalysis<DominatorTreeWrapperPass>().getDomTree();

  assert(hasOnlySimpleTerminator(F) && "Unsupported block terminator.");

  const bool Modified = runImpl(LoopData, DomTree);
  return Modified;
}


namespace llvm {

// New pass-manager entry point. Obtains loop info and the dominator tree from
// the analysis manager and runs the shared implementation. If nothing was
// changed, all analyses are reported as preserved; otherwise only LoopAnalysis
// and DominatorTreeAnalysis are.
PreservedAnalyses UnifyLoopExitsPass::run(Function &F,
                                          FunctionAnalysisManager &AM) {
  LLVM_DEBUG(dbgs() << "===== Unifying loop exits in function " << F.getName()
                    << "\n");

  LoopInfo &LoopData = AM.getResult<LoopAnalysis>(F);
  DominatorTree &DomTree = AM.getResult<DominatorTreeAnalysis>(F);

  const bool Modified = runImpl(LoopData, DomTree);
  if (Modified) {
    PreservedAnalyses Kept;
    Kept.preserve<LoopAnalysis>();
    Kept.preserve<DominatorTreeAnalysis>();
    return Kept;
  }
  return PreservedAnalyses::all();
}

} // namespace llvm

const
aarch64 promote const
Definition: AArch64PromoteConstant.cpp:230

BasicBlockUtils.h

CommandLine.h

Constants.h
This file contains the declarations for the subclasses of Constant, which represent the different fla...

ControlFlowUtils.h

LLVM_DEBUG
#define LLVM_DEBUG(...)
Definition: Debug.h:106

DomTreeUpdater.h

Dominators.h

runImpl
static bool runImpl(Function &F, const TargetLowering &TLI)
Definition: ExpandLargeDivRem.cpp:79

Loops
Hexagon Hardware Loops
Definition: HexagonHardwareLoops.cpp:373

InitializePasses.h

LoopInfo.h

F
#define F(x, y, z)
Definition: MD5.cpp:55

I
#define I(x, y, z)
Definition: MD5.cpp:58

G
#define G(x, y, z)
Definition: MD5.cpp:56

MapVector.h
This file implements a map that provides insertion order iteration.

II
uint64_t IntrinsicInst * II
Definition: NVVMIntrRange.cpp:51

Fixup
PowerPC TLS Dynamic Call Fixup
Definition: PPCTLSDynamicCall.cpp:339

INITIALIZE_PASS_DEPENDENCY
#define INITIALIZE_PASS_DEPENDENCY(depName)
Definition: PassSupport.h:55

INITIALIZE_PASS_END
#define INITIALIZE_PASS_END(passName, arg, name, cfg, analysis)
Definition: PassSupport.h:57

INITIALIZE_PASS_BEGIN
#define INITIALIZE_PASS_BEGIN(passName, arg, name, cfg, analysis)
Definition: PassSupport.h:52

assert
assert(ImpDefSCC.getReg()==AMDGPU::SCC &&ImpDefSCC.isDef())

Utils.h

exits
unify loop exits
Definition: UnifyLoopExits.cpp:69

block
unify loop Fixup each natural loop to have a single exit block
Definition: UnifyLoopExits.cpp:70

unifyLoopExits
static bool unifyLoopExits(DominatorTree &DT, LoopInfo &LI, Loop *L)
Definition: UnifyLoopExits.cpp:144

restoreSSA
unify loop Fixup each natural loop to have a single exit static false void restoreSSA(const DominatorTree &DT, const Loop *L, SmallVectorImpl< BasicBlock * > &Incoming, BasicBlock *LoopExitBlock)
Definition: UnifyLoopExits.cpp:89

MaxBooleansInControlFlowHub
static cl::opt< unsigned > MaxBooleansInControlFlowHub("max-booleans-in-control-flow-hub", cl::init(32), cl::Hidden, cl::desc("Set the maximum number of outgoing blocks for using a boolean " "value to record the exiting block in the ControlFlowHub."))

runImpl
static bool runImpl(LoopInfo &LI, DominatorTree &DT)
Definition: UnifyLoopExits.cpp:200

UnifyLoopExits.h

llvm::AnalysisManager
A container for analyses that lazily runs them and caches their results.
Definition: PassManager.h:253

llvm::AnalysisManager::getResult
PassT::Result & getResult(IRUnitT &IR, ExtraArgTs... ExtraArgs)
Get the result of an analysis pass for a given IR unit.
Definition: PassManager.h:410

llvm::AnalysisUsage
Represent the analysis usage information of a pass.
Definition: PassAnalysisSupport.h:47

llvm::AnalysisUsage::addRequired
AnalysisUsage & addRequired()
Definition: PassAnalysisSupport.h:75

llvm::AnalysisUsage::addPreserved
AnalysisUsage & addPreserved()
Add the specified Pass class to the set of analyses preserved by this pass.
Definition: PassAnalysisSupport.h:98

llvm::BasicBlock
LLVM Basic Block Representation.
Definition: BasicBlock.h:61

llvm::DomTreeUpdater
Definition: DomTreeUpdater.h:30

llvm::DominatorTreeAnalysis
Analysis pass which computes a DominatorTree.
Definition: Dominators.h:279

llvm::DominatorTreeBase::verify
bool verify(VerificationLevel VL=VerificationLevel::Full) const
verify - checks if the tree is correct.
Definition: GenericDomTree.h:905

llvm::DominatorTreeWrapperPass
Legacy analysis pass which computes a DominatorTree.
Definition: Dominators.h:317

llvm::DominatorTree
Concrete subclass of DominatorTreeBase that is used to compute a normal dominator tree.
Definition: Dominators.h:162

llvm::DominatorTree::dominates
bool dominates(const BasicBlock *BB, const Use &U) const
Return true if the (end of the) basic block BB dominates the use U.
Definition: Dominators.cpp:122

llvm::FunctionPass
FunctionPass class - This class is used to implement most global optimizations.
Definition: Pass.h:310

llvm::FunctionPass::runOnFunction
virtual bool runOnFunction(Function &F)=0
runOnFunction - Virtual method overridden by subclasses to do the per-function processing of the pass.

llvm::Function
Definition: Function.h:63

llvm::LoopAnalysis
Analysis pass that exposes the LoopInfo for a function.
Definition: LoopInfo.h:566

llvm::LoopInfoBase::verify
void verify(const DominatorTreeBase< BlockT, false > &DomTree) const
Definition: GenericLoopInfoImpl.h:718

llvm::LoopInfoBase::getLoopsInPreorder
SmallVector< LoopT *, 4 > getLoopsInPreorder() const
Return all of the loops in the function in preorder across the loop nests, with siblings in forward p...
Definition: GenericLoopInfoImpl.h:606

llvm::LoopInfoWrapperPass
The legacy pass manager's analysis pass to compute loop information.
Definition: LoopInfo.h:593

llvm::LoopInfo
Definition: LoopInfo.h:407

llvm::Loop
Represents a single loop in the control flow graph.
Definition: LoopInfo.h:39

llvm::MapVector
This class implements a map that also provides access to all stored values in a deterministic order.
Definition: MapVector.h:36

llvm::PHINode::Create
static PHINode * Create(Type *Ty, unsigned NumReservedValues, const Twine &NameStr="", InsertPosition InsertBefore=nullptr)
Constructors - NumReservedValues is a hint for the number of incoming edges that this phi node will h...
Definition: Instructions.h:2635

llvm::PassRegistry::getPassRegistry
static PassRegistry * getPassRegistry()
getPassRegistry - Access the global registry object, which is automatically initialized at applicatio...
Definition: PassRegistry.cpp:24

llvm::Pass::getAnalysisUsage
virtual void getAnalysisUsage(AnalysisUsage &) const
getAnalysisUsage - This function should be overridden by passes that need analysis information to do t...
Definition: Pass.cpp:98

llvm::PoisonValue::get
static PoisonValue * get(Type *T)
Static factory methods - Return a 'poison' object of the specified type.
Definition: Constants.cpp:1878

llvm::PreservedAnalyses
A set of analyses that are preserved following a run of a transformation pass.
Definition: Analysis.h:111

llvm::PreservedAnalyses::all
static PreservedAnalyses all()
Construct a special preserved set that preserves all passes.
Definition: Analysis.h:117

llvm::PreservedAnalyses::preserve
void preserve()
Mark an analysis as preserved.
Definition: Analysis.h:131

llvm::SmallVectorImpl
This class consists of common code factored out of the SmallVector class to reduce code duplication b...
Definition: SmallVector.h:573

llvm::SmallVector
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
Definition: SmallVector.h:1196

llvm::UnifyLoopExitsPass::run
PreservedAnalyses run(Function &F, FunctionAnalysisManager &AM)
Definition: UnifyLoopExits.cpp:224

llvm::Value::getName
StringRef getName() const
Return a constant reference to the value's name.
Definition: Value.cpp:309

llvm::cl::opt
Definition: CommandLine.h:1423

unsigned

false
Definition: StackSlotColoring.cpp:193

llvm::CallingConv::ID
unsigned ID
LLVM IR allows to use arbitrary numbers as calling convention identifiers.
Definition: CallingConv.h:24

llvm::cl::Hidden
@ Hidden
Definition: CommandLine.h:137

llvm::cl::init
initializer< Ty > init(const Ty &Val)
Definition: CommandLine.h:443

llvm
This is an optimization pass for GlobalISel generic memory operations.
Definition: AddressRanges.h:18

llvm::hasOnlySimpleTerminator
bool hasOnlySimpleTerminator(const Function &F)
Definition: BasicBlockUtils.cpp:1909

llvm::initializeUnifyLoopExitsLegacyPassPass
void initializeUnifyLoopExitsLegacyPassPass(PassRegistry &)

llvm::dbgs
raw_ostream & dbgs()
dbgs() - This returns a reference to a raw_ostream for debugging messages.
Definition: Debug.cpp:163

llvm::createUnifyLoopExitsPass
FunctionPass * createUnifyLoopExitsPass()
Definition: UnifyLoopExits.cpp:60

llvm::ControlFlowHub
Given a set of branch descriptors [BB, Succ0, Succ1], create a "hub" such that the control flow from ...
Definition: ControlFlowUtils.h:97

llvm::ControlFlowHub::finalize
BasicBlock * finalize(DomTreeUpdater *DTU, SmallVectorImpl< BasicBlock * > &GuardBlocks, const StringRef Prefix, std::optional< unsigned > MaxControlFlowBooleans=std::nullopt)
Definition: ControlFlowUtils.cpp:273

llvm::ControlFlowHub::addBranch
void addBranch(BasicBlock *BB, BasicBlock *Succ0, BasicBlock *Succ1)
Definition: ControlFlowUtils.h:107

llvm::Incoming
Incoming for lane mask phi as machine instruction, incoming register Reg and incoming block Block are...
Definition: SILowerI1Copies.h:25

llvm::cl::desc
Definition: CommandLine.h:409