doxygen/html/ScheduleDAGInstrs_8cpp_source.html

//===---- ScheduleDAGInstrs.cpp - MachineInstr Rescheduling ---------------===//

//

// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.

// See https://llvm.org/LICENSE.txt for license information.

// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception

//

//===----------------------------------------------------------------------===//

//

/// \file This implements the ScheduleDAGInstrs class, which implements

/// re-scheduling of MachineInstrs.

//

//===----------------------------------------------------------------------===//


#include "llvm/CodeGen/ScheduleDAGInstrs.h"


#include "llvm/ADT/IntEqClasses.h"

#include "llvm/ADT/MapVector.h"

#include "llvm/ADT/SmallVector.h"

#include "llvm/ADT/SparseSet.h"

#include "llvm/ADT/iterator_range.h"

#include "llvm/Analysis/AliasAnalysis.h"

#include "llvm/Analysis/ValueTracking.h"

#include "llvm/CodeGen/LiveIntervals.h"

#include "llvm/CodeGen/LivePhysRegs.h"

#include "llvm/CodeGen/MachineBasicBlock.h"

#include "llvm/CodeGen/MachineFrameInfo.h"

#include "llvm/CodeGen/MachineFunction.h"

#include "llvm/CodeGen/MachineInstr.h"

#include "llvm/CodeGen/MachineInstrBundle.h"

#include "llvm/CodeGen/MachineMemOperand.h"

#include "llvm/CodeGen/MachineOperand.h"

#include "llvm/CodeGen/MachineRegisterInfo.h"

#include "llvm/CodeGen/PseudoSourceValue.h"

#include "llvm/CodeGen/RegisterPressure.h"

#include "llvm/CodeGen/ScheduleDAG.h"

#include "llvm/CodeGen/ScheduleDFS.h"

#include "llvm/CodeGen/SlotIndexes.h"

#include "llvm/CodeGen/TargetInstrInfo.h"

#include "llvm/CodeGen/TargetRegisterInfo.h"

#include "llvm/CodeGen/TargetSubtargetInfo.h"

#include "llvm/Config/llvm-config.h"

#include "llvm/IR/Constants.h"

#include "llvm/IR/Function.h"

#include "llvm/IR/Type.h"

#include "llvm/IR/Value.h"

#include "llvm/MC/LaneBitmask.h"

#include "llvm/MC/MCRegisterInfo.h"

#include "llvm/Support/Casting.h"

#include "llvm/Support/CommandLine.h"

#include "llvm/Support/Compiler.h"

#include "llvm/Support/Debug.h"

#include "llvm/Support/ErrorHandling.h"

#include "llvm/Support/Format.h"

#include "llvm/Support/raw_ostream.h"

#include <algorithm>

#include <cassert>

#include <iterator>

#include <utility>

#include <vector>


using namespace llvm;


#define DEBUG_TYPE "machine-scheduler"


// Command-line override for using alias analysis while building the DAG.
// When the flag is given explicitly, buildSchedGraph() uses its value instead
// of the subtarget's useAA() setting.
static cl::opt<bool>
    EnableAASchedMI("enable-aa-sched-mi", cl::Hidden,
                    cl::desc("Enable use of AA during MI DAG construction"));

// Forwarded to MachineInstr::mayAlias() when memory chain dependencies are
// added (see addChainDependency). Enabled by default.
static cl::opt<bool> UseTBAA("use-tbaa-in-sched-mi", cl::Hidden,
    cl::init(true), cl::desc("Enable use of TBAA during MI DAG construction"));

// Passed to SchedModel.init() by the constructor. Enabled by default.
static cl::opt<bool>
    EnableSchedModel("schedmodel", cl::Hidden, cl::init(true),
                     cl::desc("Use TargetSchedModel for latency lookup"));

// Passed to SchedModel.init() by the constructor. Enabled by default.
static cl::opt<bool>
    EnableSchedItins("scheditins", cl::Hidden, cl::init(true),
                     cl::desc("Use InstrItineraryData for latency lookup"));

// Note: the two options below can be used to trade compile time against
// output quality. Setting HugeRegion so large that it is never reached
// means best-effort dependence tracking, which may be slow.

// When the Stores and Loads maps (or the NonAliasStores and NonAliasLoads
// maps) together hold this many SUs, the maps are reduced. Defaults to 1000.
static cl::opt<unsigned> HugeRegion("dag-maps-huge-region", cl::Hidden,
    cl::init(1000), cl::desc("The limit to use while constructing the DAG "
                             "prior to scheduling, at which point a trade-off "
                             "is made to avoid excessive compile time."));

// Number of nodes removed per reduction. No cl::init is given on purpose:
// getReductionSize() falls back to HugeRegion / 2 unless the user passed the
// flag explicitly.
static cl::opt<unsigned> ReductionSize(
    "dag-maps-reduction-size", cl::Hidden,
    cl::desc("A huge scheduling region will have maps reduced by this many "
             "nodes at a time. Defaults to HugeRegion / 2."));

// Only declared in builds that have dump support (assertions enabled or
// LLVM_ENABLE_DUMP defined). Disabled by default.
#if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)
static cl::opt<bool> SchedPrintCycles(
    "sched-print-cycles", cl::Hidden, cl::init(false),
    cl::desc("Report top/bottom cycles when dumping SUnit instances"));
#endif


/// Returns the number of nodes by which the maps of a huge region are reduced
/// at a time: the value of -dag-maps-reduction-size if the user passed that
/// flag, otherwise half of HugeRegion.
static unsigned getReductionSize() {
  // An explicit user setting always wins over the derived default.
  if (ReductionSize.getNumOccurrences() != 0)
    return ReductionSize;

  return HugeRegion / 2;
}


/// Prints the node numbers of the SUnits in \p L to dbgs() in the form
/// "{ SU(a), SU(b)}" followed by a newline.
///
/// The body is compiled out unless assertions are enabled or LLVM_ENABLE_DUMP
/// is defined, in which case the function does nothing.
static void dumpSUList(const ScheduleDAGInstrs::SUList &L) {
#if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)
  dbgs() << "{ ";
  // Emit the separator by position instead of comparing each element against
  // L.back(): nothing prevents the same SUnit pointer from being listed more
  // than once, and a pointer comparison would then drop the ", " after an
  // earlier occurrence of the last element.
  bool IsFirst = true;
  for (const SUnit *SU : L) {
    if (!IsFirst)
      dbgs() << ", ";
    IsFirst = false;
    dbgs() << "SU(" << SU->NodeNum << ")";
  }
  dbgs() << "}\n";
#endif
}


/// Constructs the DAG builder for the function \p mf.
///
/// Stores the loop info \p mli and the \p RemoveKillFlags policy, caches the
/// function's frame info, creates the void-typed undef value used as the
/// "unknown" memory object, and initializes the scheduling model from the
/// function's subtarget according to -schedmodel / -scheditins.
ScheduleDAGInstrs::ScheduleDAGInstrs(MachineFunction &mf,
                                     const MachineLoopInfo *mli,
                                     bool RemoveKillFlags)
    : ScheduleDAG(mf), MLI(mli), MFI(mf.getFrameInfo()),
      RemoveKillFlags(RemoveKillFlags),
      UnknownValue(
          UndefValue::get(Type::getVoidTy(mf.getFunction().getContext()))),
      Topo(SUnits, &ExitSU) {
  DbgValues.clear();

  SchedModel.init(&mf.getSubtarget(), EnableSchedModel, EnableSchedItins);
}


/// Collects into \p Objects the underlying objects referenced by the memory
/// operands of \p MI.
///
/// \returns true if every memory operand could be traced to a known object.
/// If any operand is volatile or atomic, is a pseudo source value that cannot
/// be tracked safely, or has no identifiable underlying object, the memory
/// location is treated as unknown (it may alias anything): \p Objects is
/// cleared and false is returned.
static bool getUnderlyingObjectsForInstr(const MachineInstr *MI,
                                         const MachineFrameInfo &MFI,
                                         UnderlyingObjectsVector &Objects,
                                         const DataLayout &DL) {
  // Every failure path discards whatever has been collected so far.
  auto GiveUp = [&Objects]() {
    Objects.clear();
    return false;
  };

  for (const MachineMemOperand *MemOp : MI->memoperands()) {
    // TODO: Figure out whether isAtomic is really necessary (see D57601).
    if (MemOp->isVolatile() || MemOp->isAtomic())
      return GiveUp();

    if (const PseudoSourceValue *Pseudo = MemOp->getPseudoValue()) {
      // Functions that contain tail calls don't have unique PseudoSourceValue
      // objects: two of them might refer to the same or overlapping
      // locations, which the callers of this function do not expect. Likewise,
      // PseudoSourceValues that may alias LLVM IR values are ignored for now
      // because the callers have no way to cope with such aliases. Answer
      // conservatively with "no known object" in both cases.
      if (MFI.hasTailCall() || Pseudo->isAliased(&MFI))
        return GiveUp();

      const bool PseudoMayAlias = Pseudo->mayAlias(&MFI);
      Objects.emplace_back(Pseudo, PseudoMayAlias);
      continue;
    }

    // Neither a pseudo value nor an IR value: nothing to track.
    const Value *IRVal = MemOp->getValue();
    if (!IRVal)
      return GiveUp();

    SmallVector<Value *, 4> Underlying;
    if (!getUnderlyingObjectsForCodeGen(IRVal, Underlying))
      return GiveUp();

    for (Value *Obj : Underlying) {
      assert(isIdentifiedObject(Obj));
      Objects.emplace_back(Obj, true);
    }
  }

  return true;
}


/// Records \p bb as the basic block that is about to be scheduled.
void ScheduleDAGInstrs::startBlock(MachineBasicBlock *bb) { BB = bb; }


/// Forgets the current basic block so that subclasses can no longer refer to
/// the block that was just finished.
void ScheduleDAGInstrs::finishBlock() { BB = nullptr; }


/// Records the boundaries of the scheduling region [\p begin, \p end) and its
/// instruction count \p regioninstrs. \p bb must be the block previously passed
/// to startBlock(); this is only checked by an assertion.
void ScheduleDAGInstrs::enterRegion(MachineBasicBlock *bb,
                                    MachineBasicBlock::iterator begin,
                                    MachineBasicBlock::iterator end,
                                    unsigned regioninstrs) {
  assert(bb == BB && "startBlock should set BB");

  NumRegionInstrs = regioninstrs;
  RegionEnd = end;
  RegionBegin = begin;
}


/// Called when a scheduling region is left. This implementation has nothing to
/// clean up.
void ScheduleDAGInstrs::exitRegion() {}


/// Sets up ExitSU to model whatever follows the scheduling region and records
/// the registers it reads.
///
/// If the region ends before the end of the block, ExitSU is bound to the
/// instruction found by skipping debug instructions backward from RegionEnd,
/// and that instruction's register uses are recorded. Unless that instruction
/// is a call or a barrier, the live-in registers of all successor blocks are
/// additionally recorded as uses of ExitSU.
void ScheduleDAGInstrs::addSchedBarrierDeps() {
  MachineInstr *ExitMI = nullptr;
  if (RegionEnd != BB->end())
    ExitMI = &*skipDebugInstructionsBackward(RegionEnd, RegionBegin);
  ExitSU.setInstr(ExitMI);

  // Add dependencies on the defs and uses of the instruction.
  if (ExitMI) {
    const MCInstrDesc &ExitDesc = ExitMI->getDesc();
    for (const MachineOperand &UseMO : ExitMI->all_uses()) {
      unsigned OpNo = UseMO.getOperandNo();
      Register Reg = UseMO.getReg();

      if (Reg.isPhysical()) {
        // addPhysRegDataDeps looks up the operand use cycle in the scheduling
        // model via the operand index stored here. A "fake" operand (e.g. an
        // operand of a call instruction used to pass an argument to the
        // callee) may have no entry in the model; in that case -1 is stored,
        // which makes addPhysRegDataDeps add an artificial dependency.
        // FIXME: Using hasImplicitUseOfPhysReg here is inaccurate as it misses
        //  aliases. When fixing, make sure to update addPhysRegDataDeps, too.
        bool IsRealUse = OpNo < ExitDesc.getNumOperands() ||
                         ExitDesc.hasImplicitUseOfPhysReg(Reg);
        for (MCRegUnit Unit : TRI->regunits(Reg))
          Uses.insert(PhysRegSUOper(&ExitSU, IsRealUse ? OpNo : -1, Unit));
        continue;
      }

      if (Reg.isVirtual() && UseMO.readsReg())
        addVRegUseDeps(&ExitSU, OpNo);
    }
  }

  // Calls and barriers need no successor live-in handling.
  if (ExitMI && (ExitMI->isCall() || ExitMI->isBarrier()))
    return;

  // For everything else (e.g. fallthrough, conditional branch) assume the exit
  // uses all the registers that are live-in to the successor blocks.
  for (const MachineBasicBlock *Succ : BB->successors()) {
    for (const auto &LiveIn : Succ->liveins()) {
      for (MCRegUnitMaskIterator UnitIt(LiveIn.PhysReg, TRI); UnitIt.isValid();
           ++UnitIt) {
        auto [Unit, Mask] = *UnitIt;
        // Skip units outside the live-in lanes and units already recorded.
        if ((Mask & LiveIn.LaneMask).any() && !Uses.contains(Unit))
          Uses.insert(PhysRegSUOper(&ExitSU, -1, Unit));
      }
    }
  }
}


/// Adds data dependencies from \p SU to every recorded use of the physical
/// register defined by operand \p OperIdx of SU's instruction.
///
/// Uses recorded with a negative operand index get an artificial dependency
/// instead of a data dependency. The latency comes from the scheduling model
/// when both the def and the use are real operands, and is zero otherwise;
/// the subtarget may then adjust the dependency.
void ScheduleDAGInstrs::addPhysRegDataDeps(SUnit *SU, unsigned OperIdx) {
  MachineInstr *DefInstr = SU->getInstr();
  const MachineOperand &MO = DefInstr->getOperand(OperIdx);
  assert(MO.isDef() && "expect physreg def");
  Register Reg = MO.getReg();

  // The subtarget gets a chance to adjust every dependency created below.
  const TargetSubtargetInfo &ST = MF.getSubtarget();

  // Only use any non-zero latency for real defs/uses, in contrast to
  // "fake" operands added by regalloc.
  const MCInstrDesc &DefMIDesc = DefInstr->getDesc();
  bool ImplicitPseudoDef = OperIdx >= DefMIDesc.getNumOperands() &&
                           !DefMIDesc.hasImplicitDefOfPhysReg(Reg);

  for (MCRegUnit Unit : TRI->regunits(Reg)) {
    for (RegUnit2SUnitsMap::iterator UseIt = Uses.find(Unit);
         UseIt != Uses.end(); ++UseIt) {
      SUnit *UseSU = UseIt->SU;
      if (UseSU == SU)
        continue;

      // Build the dependence from operand def/use information first, then let
      // the target perform its own adjustments.
      int UseOpIdx = UseIt->OpIdx;
      MachineInstr *UseInstr = nullptr;
      bool ImplicitPseudoUse = false;
      SDep Dep;
      if (UseOpIdx >= 0) {
        // Set hasPhysRegDefs only for physreg defs that have a use within the
        // scheduling region.
        SU->hasPhysRegDefs = true;

        UseInstr = UseSU->getInstr();
        Register UseReg = UseInstr->getOperand(UseOpIdx).getReg();
        const MCInstrDesc &UseMIDesc = UseInstr->getDesc();
        ImplicitPseudoUse = UseOpIdx >= ((int)UseMIDesc.getNumOperands()) &&
                            !UseMIDesc.hasImplicitUseOfPhysReg(UseReg);

        Dep = SDep(SU, SDep::Data, UseReg);
      } else {
        // No operand index was recorded for this use.
        Dep = SDep(SU, SDep::Artificial);
      }

      if (ImplicitPseudoDef || ImplicitPseudoUse)
        Dep.setLatency(0);
      else
        Dep.setLatency(SchedModel.computeOperandLatency(DefInstr, OperIdx,
                                                        UseInstr, UseOpIdx));

      ST.adjustSchedDependency(SU, OperIdx, UseSU, UseOpIdx, Dep, &SchedModel);
      UseSU->addPred(Dep);
    }
  }
}


/// Adds register dependencies (data, anti, and output) from this SUnit
/// to following instructions in the same scheduling region that depend on the
/// physical register referenced at OperIdx.
///
/// \param SU      The scheduling unit whose operand is being processed.
/// \param OperIdx Index of the physical-register operand in SU's instruction.
///
/// Besides adding edges, this updates the per-register-unit Uses and Defs
/// maps so that instructions visited afterwards see this operand.
void ScheduleDAGInstrs::addPhysRegDeps(SUnit *SU, unsigned OperIdx) {
  MachineInstr *MI = SU->getInstr();
  MachineOperand &MO = MI->getOperand(OperIdx);
  Register Reg = MO.getReg();
  // We do not need to track any dependencies for constant registers.
  if (MRI.isConstantPhysReg(Reg))
    return;

  const TargetSubtargetInfo &ST = MF.getSubtarget();

  // Optionally add output and anti dependencies. For anti
  // dependencies we use a latency of 0 because for a multi-issue
  // target we want to allow the defining instruction to issue
  // in the same cycle as the using instruction.
  // TODO: Using a latency of 1 here for output dependencies assumes
  //       there's no cost for reusing registers.
  // A use of the register conflicts with recorded defs as an anti dependence;
  // a def conflicts with them as an output dependence.
  SDep::Kind Kind = MO.isUse() ? SDep::Anti : SDep::Output;
  for (MCRegUnit Unit : TRI->regunits(Reg)) {
    for (RegUnit2SUnitsMap::iterator I = Defs.find(Unit); I != Defs.end();
         ++I) {
      SUnit *DefSU = I->SU;
      // No edge is added towards the exit node.
      if (DefSU == &ExitSU)
        continue;
      MachineInstr *DefInstr = DefSU->getInstr();
      MachineOperand &DefMO = DefInstr->getOperand(I->OpIdx);
      // Skip self-dependencies, and skip output dependencies between two
      // defs that are both dead.
      if (DefSU != SU &&
          (Kind != SDep::Output || !MO.isDead() || !DefMO.isDead())) {
        SDep Dep(SU, Kind, DefMO.getReg());
        // Only output dependencies get a model-provided latency; anti
        // dependencies keep the latency the SDep was constructed with.
        if (Kind != SDep::Anti) {
          Dep.setLatency(
              SchedModel.computeOutputLatency(MI, OperIdx, DefInstr));
        }
        ST.adjustSchedDependency(SU, OperIdx, DefSU, I->OpIdx, Dep,
                                 &SchedModel);
        DefSU->addPred(Dep);
      }
    }
  }

  if (MO.isUse()) {
    SU->hasPhysRegUses = true;
    // Record this SUnit/operand as a use of every register unit of Reg. Data
    // dependencies are added when the matching def is processed
    // (see addPhysRegDataDeps).
    for (MCRegUnit Unit : TRI->regunits(Reg))
      Uses.insert(PhysRegSUOper(SU, OperIdx, Unit));
    // Kill flags are cleared here when the DAG was constructed with
    // RemoveKillFlags set.
    if (RemoveKillFlags)
      MO.setIsKill(false);
  } else {
    addPhysRegDataDeps(SU, OperIdx);

    // Clear previous uses and defs of this register and its subregisters.
    // Recorded defs are kept when this def is dead.
    for (MCRegUnit Unit : TRI->regunits(Reg)) {
      Uses.eraseAll(Unit);
      if (!MO.isDead())
        Defs.eraseAll(Unit);
    }

    if (MO.isDead() && SU->isCall) {
      // Calls will not be reordered because of chain dependencies (see
      // below). Since call operands are dead, calls may continue to be added
      // to the DefList making dependence checking quadratic in the size of
      // the block. Instead, we leave only one call at the back of the
      // DefList.
      for (MCRegUnit Unit : TRI->regunits(Reg)) {
        RegUnit2SUnitsMap::RangePair P = Defs.equal_range(Unit);
        RegUnit2SUnitsMap::iterator B = P.first;
        RegUnit2SUnitsMap::iterator I = P.second;
        // Walk the unit's entries from the back towards the front, erasing
        // trailing call entries and stopping at the first non-call entry.
        // isBegin is computed before the erase so that the loop terminates
        // once the first entry of the range has been handled.
        for (bool isBegin = I == B; !isBegin; /* empty */) {
          isBegin = (--I) == B;
          if (!I->SU->isCall)
            break;
          I = Defs.erase(I);
        }
      }
    }

    // Defs are pushed in the order they are visited and never reordered.
    for (MCRegUnit Unit : TRI->regunits(Reg))
      Defs.insert(PhysRegSUOper(SU, OperIdx, Unit));
  }
}


/// Returns the lanes of the virtual register accessed by \p MO.
///
/// If the register class has no disjunct subregisters, all lanes are reported.
/// Otherwise the result is the lane mask of the operand's subregister index,
/// or the register class's lane mask when the operand has no subregister
/// index.
LaneBitmask
ScheduleDAGInstrs::getLaneMaskForMO(const MachineOperand &MO) const {
  const TargetRegisterClass &RC = *MRI.getRegClass(MO.getReg());

  // No point in tracking lanemasks if we don't have interesting subregisters.
  if (!RC.HasDisjunctSubRegs)
    return LaneBitmask::getAll();

  if (unsigned SubIdx = MO.getSubReg())
    return TRI->getSubRegIndexLaneMask(SubIdx);
  return RC.getLaneMask();
}


/// Returns true if no tracked use conflicts with the (dead) def \p MO: either
/// CurrentVRegUses has no entry for the register, or the entry returned by
/// find() shares no lanes with the lanes of \p MO.
bool ScheduleDAGInstrs::deadDefHasNoUse(const MachineOperand &MO) {
  auto UseIt = CurrentVRegUses.find(MO.getReg());
  const bool HasTrackedUse = UseIt != CurrentVRegUses.end();
  return !HasTrackedUse ||
         (UseIt->LaneMask & getLaneMaskForMO(MO)).none();
}


/// Adds register output and data dependencies from this SUnit to instructions
/// that occur later in the same scheduling region if they read from or write to
/// the virtual register defined at OperIdx.
///
/// \param SU      The scheduling unit whose def operand is being processed.
/// \param OperIdx Index of the virtual-register def operand in SU's
///                instruction.
///
/// As a side effect this updates CurrentVRegUses (uses fully covered by this
/// def are removed) and CurrentVRegDefs (this def becomes the current def of
/// its lanes). When lane masks are tracked, the operand's undef flag is
/// cleared.
///
/// TODO: Hoist loop induction variable increments. This has to be
/// reevaluated. Generally, IV scheduling should be done before coalescing.
void ScheduleDAGInstrs::addVRegDefDeps(SUnit *SU, unsigned OperIdx) {
  MachineInstr *MI = SU->getInstr();
  MachineOperand &MO = MI->getOperand(OperIdx);
  Register Reg = MO.getReg();

  // DefLaneMask: lanes written by this operand.
  // KillLaneMask: lanes whose previously recorded uses are satisfied by this
  // operand and can therefore be dropped from CurrentVRegUses.
  LaneBitmask DefLaneMask;
  LaneBitmask KillLaneMask;
  if (TrackLaneMasks) {
    bool IsKill = MO.getSubReg() == 0 || MO.isUndef();
    DefLaneMask = getLaneMaskForMO(MO);
    // If we have a <read-undef> flag, none of the lane values comes from an
    // earlier instruction.
    KillLaneMask = IsKill ? LaneBitmask::getAll() : DefLaneMask;

    if (MO.getSubReg() != 0 && MO.isUndef()) {
      // There may be other subregister defs on the same instruction of the same
      // register in later operands. The lanes of other defs will now be live
      // after this instruction, so these should not be treated as killed by the
      // instruction even though they appear to be killed in this one operand.
      for (const MachineOperand &OtherMO :
           llvm::drop_begin(MI->operands(), OperIdx + 1))
        if (OtherMO.isReg() && OtherMO.isDef() && OtherMO.getReg() == Reg)
          KillLaneMask &= ~getLaneMaskForMO(OtherMO);
    }

    // Clear undef flag, we'll re-add it later once we know which subregister
    // Def is first.
    MO.setIsUndef(false);
  } else {
    // Without lane tracking every def covers and kills the whole register.
    DefLaneMask = LaneBitmask::getAll();
    KillLaneMask = LaneBitmask::getAll();
  }

  if (MO.isDead()) {
    assert(deadDefHasNoUse(MO) && "Dead defs should have no uses");
  } else {
    // Add data dependence to all uses we found so far.
    const TargetSubtargetInfo &ST = MF.getSubtarget();
    // The iterator is advanced inside the body because entries may be erased.
    for (VReg2SUnitOperIdxMultiMap::iterator I = CurrentVRegUses.find(Reg),
         E = CurrentVRegUses.end(); I != E; /*empty*/) {
      LaneBitmask LaneMask = I->LaneMask;
      // Ignore uses of other lanes.
      if ((LaneMask & KillLaneMask).none()) {
        ++I;
        continue;
      }

      // Only uses that read lanes actually written here get a data edge.
      if ((LaneMask & DefLaneMask).any()) {
        SUnit *UseSU = I->SU;
        MachineInstr *Use = UseSU->getInstr();
        SDep Dep(SU, SDep::Data, Reg);
        Dep.setLatency(SchedModel.computeOperandLatency(MI, OperIdx, Use,
                                                        I->OperandIndex));
        ST.adjustSchedDependency(SU, OperIdx, UseSU, I->OperandIndex, Dep,
                                 &SchedModel);
        UseSU->addPred(Dep);
      }

      LaneMask &= ~KillLaneMask;
      // If we found a Def for all lanes of this use, remove it from the list.
      // Otherwise keep the entry, narrowed to the lanes still waiting for a
      // def.
      if (LaneMask.any()) {
        I->LaneMask = LaneMask;
        ++I;
      } else
        I = CurrentVRegUses.erase(I);
    }
  }

  // Shortcut: Singly defined vregs do not have output/anti dependencies.
  if (MRI.hasOneDef(Reg))
    return;

  // Add output dependence to the next nearest defs of this vreg.
  //
  // Unless this definition is dead, the output dependence should be
  // transitively redundant with antidependencies from this definition's
  // uses. We're conservative for now until we have a way to guarantee the uses
  // are not eliminated sometime during scheduling. The output dependence edge
  // is also useful if output latency exceeds def-use latency.
  LaneBitmask LaneMask = DefLaneMask;
  for (VReg2SUnit &V2SU : make_range(CurrentVRegDefs.find(Reg),
                                     CurrentVRegDefs.end())) {
    // Ignore defs for other lanes.
    if ((V2SU.LaneMask & LaneMask).none())
      continue;
    // Add an output dependence.
    SUnit *DefSU = V2SU.SU;
    // Ignore additional defs of the same lanes in one instruction. This can
    // happen because lanemasks are shared for targets with too many
    // subregisters. We also use some representation tricks/hacks where we
    // add super-register defs/uses, to imply that although we only access parts
    // of the reg we care about the full one.
    if (DefSU == SU)
      continue;
    SDep Dep(SU, SDep::Output, Reg);
    Dep.setLatency(
      SchedModel.computeOutputLatency(MI, OperIdx, DefSU->getInstr()));
    DefSU->addPred(Dep);

    // Update current definition. This can get tricky if the def was about a
    // bigger lanemask before. We then have to shrink it and create a new
    // VReg2SUnit for the non-overlapping part.
    LaneBitmask OverlapMask = V2SU.LaneMask & LaneMask;
    LaneBitmask NonOverlapMask = V2SU.LaneMask & ~LaneMask;
    V2SU.SU = SU;
    V2SU.LaneMask = OverlapMask;
    if (NonOverlapMask.any())
      CurrentVRegDefs.insert(VReg2SUnit(Reg, NonOverlapMask, DefSU));
  }
  // If there was no CurrentVRegDefs entry for some lanes yet, create one.
  // NOTE(review): LaneMask is never narrowed in the loop above, so for any
  // non-empty DefLaneMask this inserts an entry covering all defined lanes -
  // confirm this is intended.
  if (LaneMask.any())
    CurrentVRegDefs.insert(VReg2SUnit(Reg, LaneMask, SU));
}


/// Records the virtual register use at operand \p OperIdx of \p SU and adds
/// antidependencies from \p SU to the instructions later in the scheduling
/// region that write overlapping lanes of that register.
///
/// The matching data dependency is not added here; it is created once the
/// defining instruction is visited and finds this use in CurrentVRegUses.
///
/// TODO: Handle ExitSU "uses" properly.
void ScheduleDAGInstrs::addVRegUseDeps(SUnit *SU, unsigned OperIdx) {
  const MachineInstr *MI = SU->getInstr();
  assert(!MI->isDebugOrPseudoInstr());

  const MachineOperand &MO = MI->getOperand(OperIdx);
  Register Reg = MO.getReg();

  // Remember the use. Without lane tracking a use covers the whole register.
  LaneBitmask UseLanes = LaneBitmask::getAll();
  if (TrackLaneMasks)
    UseLanes = getLaneMaskForMO(MO);
  CurrentVRegUses.insert(VReg2SUnitOperIdx(Reg, UseLanes, OperIdx, SU));

  // Add antidependences to the following defs of the vreg, skipping defs of
  // unrelated lanes and defs made by this very instruction.
  for (VReg2SUnit &Def : make_range(CurrentVRegDefs.find(Reg),
                                    CurrentVRegDefs.end())) {
    LaneBitmask DefLanes = Def.LaneMask;
    const bool SharesLanes = (DefLanes & UseLanes).any();
    if (SharesLanes && Def.SU != SU)
      Def.SU->addPred(SDep(SU, SDep::Anti, Reg));
  }
}


/// Adds a may-alias memory dependency with the given \p Latency that makes
/// \p SUa a predecessor of \p SUb, but only if the two instructions may alias
/// according to MachineInstr::mayAlias().
void ScheduleDAGInstrs::addChainDependency(SUnit *SUa, SUnit *SUb,
                                           unsigned Latency) {
  const MachineInstr &OtherMI = *SUb->getInstr();
  if (!SUa->getInstr()->mayAlias(getAAForDep(), OtherMI, UseTBAA))
    return;

  SDep MemDep(SUa, SDep::MayAliasMem);
  MemDep.setLatency(Latency);
  SUb->addPred(MemDep);
}


/// Creates one SUnit per real instruction of the region and maps each such
/// instruction to its SUnit. Debug and pseudo instructions get no SUnit.
///
/// SUnits are numbered in top-down topological order: for instructions A < B
/// in the original order, no edge exists from B to A. MachineScheduler relies
/// on the nodes being numbered by their order in the original instruction
/// list.
///
/// After initSUnits, the SUnits vector cannot be resized and the scheduler may
/// hang onto SUnit pointers. This may be relaxed in the future by using SUnit
/// IDs instead of pointers.
void ScheduleDAGInstrs::initSUnits() {
  // One SUnit is allocated for each real instruction in the region, which is
  // contained within a basic block.
  SUnits.reserve(NumRegionInstrs);

  for (MachineInstr &MI : make_range(RegionBegin, RegionEnd)) {
    if (MI.isDebugOrPseudoInstr())
      continue;

    SUnit *Unit = newSUnit(&MI);
    MISUnitMap[&MI] = Unit;

    Unit->isCall = MI.isCall();
    Unit->isCommutable = MI.isCommutable();

    // Assign the Latency field using target-provided information.
    Unit->Latency = SchedModel.computeInstrLatency(Unit->getInstr());

    // The resource flags below need a per-instruction scheduling model.
    if (!SchedModel.hasInstrSchedModel())
      continue;

    // Mark the SUnit if it uses a reserved or unbuffered resource.
    //
    // Reserved resources (BufferSize=0) block an instruction from issuing and
    // stall the entire pipeline.
    //
    // Unbuffered resources (BufferSize=1) prevent execution of subsequent
    // instructions that require the same resources. This is used for in-order
    // execution pipelines within an out-of-order core.
    const MCSchedClassDesc *SC = getSchedClass(Unit);
    for (const MCWriteProcResEntry &PRE :
         make_range(SchedModel.getWriteProcResBegin(SC),
                    SchedModel.getWriteProcResEnd(SC))) {
      const auto BufferSize =
          SchedModel.getProcResource(PRE.ProcResourceIdx)->BufferSize;
      if (BufferSize == 0)
        Unit->hasReservedResource = true;
      else if (BufferSize == 1)
        Unit->isUnbuffered = true;
    }
  }
}


/// Maps a memory object (ValueType) to the list of SUnits that access it,
/// while keeping a running total of all SUnits stored across the lists.
class ScheduleDAGInstrs::Value2SUsMap
    : public SmallMapVector<ValueType, SUList, 4> {
  /// Total number of SUs currently held in all lists of this map.
  unsigned NumNodes = 0;

  /// Latency used for chain dependencies created from this map: 1 for loads,
  /// 0 for stores. (see comment in SUList)
  unsigned TrueMemOrderLatency;

public:
  Value2SUsMap(unsigned lat = 0) : TrueMemOrderLatency(lat) {}

  /// Deliberately unusable: going through operator[] and push_back() would
  /// bypass the NumNodes bookkeeping. Use insert() instead.
  ValueType &operator[](const SUList &Key) {
    llvm_unreachable("Don't use. Use insert() instead.");
  }

  /// Appends \p SU to the list mapped from \p V (creating the list if needed)
  /// and updates the node count.
  void insert(SUnit *SU, ValueType V) {
    SUList &List = MapVector::operator[](V);
    List.push_back(SU);
    ++NumNodes;
  }

  /// Empties the list mapped from \p V, if there is one. The map entry itself
  /// is kept.
  void clearList(ValueType V) {
    iterator Entry = find(V);
    if (Entry == end())
      return;

    SUList &List = Entry->second;
    assert(NumNodes >= List.size());
    NumNodes -= List.size();
    List.clear();
  }

  /// Removes all entries and resets the node count.
  void clear() {
    SmallMapVector<ValueType, SUList, 4>::clear();
    NumNodes = 0;
  }

  /// Returns the total number of SUs in the map (not the number of keys).
  unsigned size() const { return NumNodes; }

  /// Recounts the SUs held in the map; needed after the lists were modified
  /// directly, e.g. by a reduction.
  void reComputeSize() {
    NumNodes = 0;
    for (auto &Entry : *this)
      NumNodes += Entry.second.size();
  }

  unsigned getTrueMemOrderLatency() const { return TrueMemOrderLatency; }

  void dump();
};


/// Adds chain dependencies between \p SU and the SUs of every list in
/// \p Val2SUsMap, using the map's memory-order latency.
void ScheduleDAGInstrs::addChainDependencies(SUnit *SU,
                                             Value2SUsMap &Val2SUsMap) {
  const unsigned Latency = Val2SUsMap.getTrueMemOrderLatency();
  for (auto &Entry : Val2SUsMap)
    addChainDependencies(SU, Entry.second, Latency);
}


/// Adds chain dependencies between \p SU and the SUs mapped from \p V in
/// \p Val2SUsMap, using the map's memory-order latency. Does nothing if \p V
/// has no entry.
void ScheduleDAGInstrs::addChainDependencies(SUnit *SU,
                                             Value2SUsMap &Val2SUsMap,
                                             ValueType V) {
  Value2SUsMap::iterator Found = Val2SUsMap.find(V);
  if (Found == Val2SUsMap.end())
    return;

  addChainDependencies(SU, Found->second,
                       Val2SUsMap.getTrueMemOrderLatency());
}


/// Makes BarrierChain a barrier predecessor of every SU stored in \p map and
/// then empties the map. BarrierChain must be set.
void ScheduleDAGInstrs::addBarrierChain(Value2SUsMap &map) {
  assert(BarrierChain != nullptr);

  for (auto &Entry : map)
    for (SUnit *Dependent : Entry.second)
      Dependent->addPredBarrier(BarrierChain);

  map.clear();
}


/// Inserts BarrierChain into \p map: in every list, the leading SUs whose node
/// number is greater than BarrierChain's get BarrierChain as a barrier
/// predecessor and are removed from the list, as is BarrierChain itself if it
/// follows them. Lists that become empty are dropped from the map and the
/// map's node count is recomputed. BarrierChain must be set.
void ScheduleDAGInstrs::insertBarrierChain(Value2SUsMap &map) {
  assert(BarrierChain != nullptr);

  // Go through all lists of SUs.
  for (auto &Entry : map) {
    SUList &List = Entry.second;
    SUList::iterator Cut = List.begin();
    const SUList::iterator ListEnd = List.end();

    // Stop on BarrierChain or any instruction above it.
    while (Cut != ListEnd && (*Cut)->NodeNum > BarrierChain->NodeNum) {
      (*Cut)->addPredBarrier(BarrierChain);
      ++Cut;
    }

    // Remove also the BarrierChain from list if present.
    if (Cut != ListEnd && *Cut == BarrierChain)
      ++Cut;

    // Remove all SUs that are now successors of BarrierChain.
    if (Cut != List.begin())
      List.erase(List.begin(), Cut);
  }

  // Remove all entries with empty su lists.
  map.remove_if([&](std::pair<ValueType, SUList> &Candidate) {
    return Candidate.second.empty();
  });

  // Recompute the size of the map (NumNodes).
  map.reComputeSize();
}


/// Builds the dependence graph for the current scheduling region by visiting

/// its instructions from RegionEnd up to RegionBegin.

///

/// For every non-debug instruction this adds register dependencies (physical

/// and virtual), an artificial live-out latency edge to ExitSU where needed,

/// and memory / barrier chain dependencies.

///

/// \param AA  Alias analysis; recorded in AAForDep only when it is non-null

///            and AA use is enabled (EnableAASchedMI if it was given on the

///            command line, otherwise the subtarget's useAA()).

/// \param RPTracker  If non-null, receded over each visited instruction.

/// \param PDiffs  If non-null, initialized with the number of SUnits; its

///                per-instruction entries are only added when RPTracker is

///                also non-null.

/// \param LIS  Dereferenced only when both RPTracker and TrackLaneMasks are

///             set.

/// \param TrackLaneMasks  Stored in the member of the same name and forwarded

///                        to the register operand collection.

void ScheduleDAGInstrs::buildSchedGraph(AAResults *AA,

                                        RegPressureTracker *RPTracker,

                                        PressureDiffs *PDiffs,

                                        LiveIntervals *LIS,

                                        bool TrackLaneMasks) {

  const TargetSubtargetInfo &ST = MF.getSubtarget();

  bool UseAA = EnableAASchedMI.getNumOccurrences() > 0 ? EnableAASchedMI

                                                       : ST.useAA();

  if (UseAA && AA)

    AAForDep.emplace(*AA);


  BarrierChain = nullptr;


  this->TrackLaneMasks = TrackLaneMasks;

  MISUnitMap.clear();

  ScheduleDAG::clearDAG();


  // Create an SUnit for each real instruction.

  initSUnits();


  if (PDiffs)

    PDiffs->init(SUnits.size());


  // We build scheduling units by walking a block's instruction list

  // from bottom to top.


  // Each MIs' memory operand(s) is analyzed to a list of underlying

  // objects. The SU is then inserted in the SUList(s) mapped from the

  // Value(s). Each Value thus gets mapped to lists of SUs depending

  // on it, stores and loads kept separately. Two SUs are trivially

  // non-aliasing if they both depend on only identified Values and do

  // not share any common Value.

  Value2SUsMap Stores, Loads(1 /*TrueMemOrderLatency*/);


  // Certain memory accesses are known to not alias any SU in Stores

  // or Loads, and have therefore their own 'NonAlias'

  // domain. E.g. spill / reload instructions never alias LLVM I/R

  // Values. It would be nice to assume that this type of memory

  // accesses always have a proper memory operand modelling, and are

  // therefore never unanalyzable, but this is conservatively not

  // done.

  Value2SUsMap NonAliasStores, NonAliasLoads(1 /*TrueMemOrderLatency*/);


  // Track all instructions that may raise floating-point exceptions.

  // These do not depend on one another (or normal loads or stores), but

  // must not be rescheduled across global barriers.  Note that we don't

  // really need a "map" here since we don't track those MIs by value;

  // using the same Value2SUsMap data type here is simply a matter of

  // convenience.

  Value2SUsMap FPExceptions;


  // Remove any stale debug info; sometimes buildSchedGraph is called again

  // without emitting the info from the previous call.

  DbgValues.clear();

  FirstDbgValue = nullptr;


  assert(Defs.empty() && Uses.empty() &&

         "Only BuildGraph should update Defs/Uses");

  Defs.setUniverse(TRI->getNumRegs());

  Uses.setUniverse(TRI->getNumRegs());


  assert(CurrentVRegDefs.empty() && "nobody else should use CurrentVRegDefs");

  assert(CurrentVRegUses.empty() && "nobody else should use CurrentVRegUses");

  unsigned NumVirtRegs = MRI.getNumVirtRegs();

  CurrentVRegDefs.setUniverse(NumVirtRegs);

  CurrentVRegUses.setUniverse(NumVirtRegs);


  // Model data dependencies between instructions being scheduled and the

  // ExitSU.

  addSchedBarrierDeps();


  // Walk the list of instructions, from bottom moving up.

  // MII always points one past the instruction being visited, which is why

  // the instruction itself is obtained through std::prev(MII).

  MachineInstr *DbgMI = nullptr;

  for (MachineBasicBlock::iterator MII = RegionEnd, MIE = RegionBegin;

       MII != MIE; --MII) {

    MachineInstr &MI = *std::prev(MII);

    // A debug instruction seen on the previous iteration is paired with the

    // instruction visited now, i.e. the one directly above it.

    if (DbgMI) {

      DbgValues.emplace_back(DbgMI, &MI);

      DbgMI = nullptr;

    }


    if (MI.isDebugValue() || MI.isDebugPHI()) {

      DbgMI = &MI;

      continue;

    }


    if (MI.isDebugLabel() || MI.isDebugRef() || MI.isPseudoProbe())

      continue;


    SUnit *SU = MISUnitMap[&MI];

    assert(SU && "No SUnit mapped to this MI");


    if (RPTracker) {

      RegisterOperands RegOpers;

      RegOpers.collect(MI, *TRI, MRI, TrackLaneMasks, false);

      if (TrackLaneMasks) {

        SlotIndex SlotIdx = LIS->getInstructionIndex(MI);

        RegOpers.adjustLaneLiveness(*LIS, MRI, SlotIdx);

      }

      if (PDiffs != nullptr)

        PDiffs->addInstruction(SU->NodeNum, RegOpers, MRI);


      // Bring the tracker to MI (skipping debug values) before receding over

      // it with the operands collected above.

      if (RPTracker->getPos() == RegionEnd || &*RPTracker->getPos() != &MI)

        RPTracker->recedeSkipDebugValues();

      assert(&*RPTracker->getPos() == &MI && "RPTracker in sync");

      RPTracker->recede(RegOpers);

    }


    assert(

        (CanHandleTerminators || (!MI.isTerminator() && !MI.isPosition())) &&

        "Cannot schedule terminators or labels!");


    // Add register-based dependencies (data, anti, and output).

    // For some instructions (calls, returns, inline-asm, etc.) there can

    // be explicit uses and implicit defs, in which case the use will appear

    // on the operand list before the def. Do two passes over the operand

    // list to make sure that defs are processed before any uses.

    bool HasVRegDef = false;

    for (unsigned j = 0, n = MI.getNumOperands(); j != n; ++j) {

      const MachineOperand &MO = MI.getOperand(j);

      if (!MO.isReg() || !MO.isDef())

        continue;

      Register Reg = MO.getReg();

      if (Reg.isPhysical()) {

        addPhysRegDeps(SU, j);

      } else if (Reg.isVirtual()) {

        HasVRegDef = true;

        addVRegDefDeps(SU, j);

      }

    }

    // Now process all uses.

    for (unsigned j = 0, n = MI.getNumOperands(); j != n; ++j) {

      const MachineOperand &MO = MI.getOperand(j);

      // Only look at use operands.

      // We do not need to check for MO.readsReg() here because subsequent

      // subregister defs will get output dependence edges and need no

      // additional use dependencies.

      if (!MO.isReg() || !MO.isUse())

        continue;

      Register Reg = MO.getReg();

      if (Reg.isPhysical()) {

        addPhysRegDeps(SU, j);

      } else if (Reg.isVirtual() && MO.readsReg()) {

        addVRegUseDeps(SU, j);

      }

    }


    // If we haven't seen any uses in this scheduling region, create a

    // dependence edge to ExitSU to model the live-out latency. This is required

    // for vreg defs with no in-region use, and prefetches with no vreg def.

    //

    // FIXME: NumDataSuccs would be more precise than NumSuccs here. This

    // check currently relies on being called before adding chain deps.

    if (SU->NumSuccs == 0 && SU->Latency > 1 && (HasVRegDef || MI.mayLoad())) {

      SDep Dep(SU, SDep::Artificial);

      Dep.setLatency(SU->Latency - 1);

      ExitSU.addPred(Dep);

    }


    // Add memory dependencies (Note: isStoreToStackSlot and

    // isLoadFromStackSlot are not usable after stack slots are lowered to

    // actual addresses).


    const TargetInstrInfo *TII = ST.getInstrInfo();

    // This is a barrier event that acts as a pivotal node in the DAG.

    if (TII->isGlobalMemoryObject(&MI)) {


      // Become the barrier chain.

      if (BarrierChain)

        BarrierChain->addPredBarrier(SU);

      BarrierChain = SU;


      LLVM_DEBUG(dbgs() << "Global memory object and new barrier chain: SU("

                        << BarrierChain->NodeNum << ").\n");


      // Add dependencies against everything below it and clear maps.

      addBarrierChain(Stores);

      addBarrierChain(Loads);

      addBarrierChain(NonAliasStores);

      addBarrierChain(NonAliasLoads);

      addBarrierChain(FPExceptions);


      // The barrier is not entered into any of the memory maps itself.

      continue;

    }


    // Instructions that may raise FP exceptions may not be moved

    // across any global barriers.

    if (MI.mayRaiseFPException()) {

      if (BarrierChain)

        BarrierChain->addPredBarrier(SU);


      FPExceptions.insert(SU, UnknownValue);


      if (FPExceptions.size() >= HugeRegion) {

        LLVM_DEBUG(dbgs() << "Reducing FPExceptions map.\n");

        Value2SUsMap empty;

        reduceHugeMemNodeMaps(FPExceptions, empty, getReductionSize());

      }

    }


    // If it's not a store or a variant load, we're done.

    if (!MI.mayStore() &&

        !(MI.mayLoad() && !MI.isDereferenceableInvariantLoad()))

      continue;


    // Always add dependency edge to BarrierChain if present.

    if (BarrierChain)

      BarrierChain->addPredBarrier(SU);


    // Find the underlying objects for MI. The Objs vector is either

    // empty, or filled with the Values of memory locations which this

    // SU depends on.

    UnderlyingObjectsVector Objs;

    bool ObjsFound = getUnderlyingObjectsForInstr(&MI, MFI, Objs,

                                                  MF.getDataLayout());


    if (MI.mayStore()) {

      if (!ObjsFound) {

        // An unknown store depends on all stores and loads.

        addChainDependencies(SU, Stores);

        addChainDependencies(SU, NonAliasStores);

        addChainDependencies(SU, Loads);

        addChainDependencies(SU, NonAliasLoads);


        // Map this store to 'UnknownValue'.

        Stores.insert(SU, UnknownValue);

      } else {

        // Add precise dependencies against all previously seen memory

        // accesses mapped to the same Value(s).

        for (const UnderlyingObject &UnderlObj : Objs) {

          ValueType V = UnderlObj.getValue();

          bool ThisMayAlias = UnderlObj.mayAlias();


          // Add dependencies to previous stores and loads mapped to V.

          addChainDependencies(SU, (ThisMayAlias ? Stores : NonAliasStores), V);

          addChainDependencies(SU, (ThisMayAlias ? Loads : NonAliasLoads), V);

        }

        // Update the store map after all chains have been added to avoid adding

        // self-loop edge if multiple underlying objects are present.

        for (const UnderlyingObject &UnderlObj : Objs) {

          ValueType V = UnderlObj.getValue();

          bool ThisMayAlias = UnderlObj.mayAlias();


          // Map this store to V.

          (ThisMayAlias ? Stores : NonAliasStores).insert(SU, V);

        }

        // The store may have dependencies to unanalyzable loads and

        // stores.

        addChainDependencies(SU, Loads, UnknownValue);

        addChainDependencies(SU, Stores, UnknownValue);

      }

    } else { // SU is a load.

      if (!ObjsFound) {

        // An unknown load depends on all stores.

        addChainDependencies(SU, Stores);

        addChainDependencies(SU, NonAliasStores);


        Loads.insert(SU, UnknownValue);

      } else {

        for (const UnderlyingObject &UnderlObj : Objs) {

          ValueType V = UnderlObj.getValue();

          bool ThisMayAlias = UnderlObj.mayAlias();


          // Add precise dependencies against all previously seen stores

          // mapping to the same Value(s).

          addChainDependencies(SU, (ThisMayAlias ? Stores : NonAliasStores), V);


          // Map this load to V.

          (ThisMayAlias ? Loads : NonAliasLoads).insert(SU, V);

        }

        // The load may have dependencies to unanalyzable stores.

        addChainDependencies(SU, Stores, UnknownValue);

      }

    }


    // Reduce maps if they grow huge.

    if (Stores.size() + Loads.size() >= HugeRegion) {

      LLVM_DEBUG(dbgs() << "Reducing Stores and Loads maps.\n");

      reduceHugeMemNodeMaps(Stores, Loads, getReductionSize());

    }

    if (NonAliasStores.size() + NonAliasLoads.size() >= HugeRegion) {

      LLVM_DEBUG(dbgs() << "Reducing NonAliasStores and NonAliasLoads maps.\n");

      reduceHugeMemNodeMaps(NonAliasStores, NonAliasLoads, getReductionSize());

    }

  }


  // A debug instruction still pending here had no instruction above it in

  // the region.

  if (DbgMI)

    FirstDbgValue = DbgMI;


  Defs.clear();

  Uses.clear();

  CurrentVRegDefs.clear();

  CurrentVRegUses.clear();


  Topo.MarkDirty();

}


/// Streams \p PSV to \p OS through its printCustom() hook and returns \p OS
/// so that insertions can be chained.
raw_ostream &llvm::operator<<(raw_ostream &OS, const PseudoSourceValue *PSV) {
  PSV->printCustom(OS);
  return OS;
}


void ScheduleDAGInstrs::Value2SUsMap::dump() {

  for (const auto &[ValType, SUs] : *this) {

    if (isa<const Value *>(ValType)) {

      const Value *V = cast<const Value *>(ValType);

      if (isa<UndefValue>(V))

        dbgs() << "Unknown";

      else

        V->printAsOperand(dbgs());

    } else if (isa<const PseudoSourceValue *>(ValType))

      dbgs() << cast<const PseudoSourceValue *>(ValType);

    else

      llvm_unreachable("Unknown Value type.");


    dbgs() << " : ";

    dumpSUList(SUs);

  }

}


/// Shrinks \p stores and \p loads by \p N SUs: the N SUs with the highest
/// NodeNums are removed from the maps, and the one among them with the lowest
/// NodeNum is proposed as the new BarrierChain.
void ScheduleDAGInstrs::reduceHugeMemNodeMaps(Value2SUsMap &stores,
                                              Value2SUsMap &loads, unsigned N) {
  LLVM_DEBUG(dbgs() << "Before reduction:\nStoring SUnits:\n"; stores.dump();
             dbgs() << "Loading SUnits:\n"; loads.dump());

  // Gather the NodeNum of every SU in both maps, then sort ascending.
  std::vector<unsigned> SortedNums;
  SortedNums.reserve(stores.size() + loads.size());
  auto CollectNodeNums = [&SortedNums](const Value2SUsMap &Map) {
    for (const auto &Entry : Map)
      for (const SUnit *Node : Entry.second)
        SortedNums.push_back(Node->NodeNum);
  };
  CollectNodeNums(stores);
  CollectNodeNums(loads);
  llvm::sort(SortedNums);

  // The last N elements are the ones to remove; the first of them (lowest
  // NodeNum) becomes the barrier candidate so that SUs not yet seen get a
  // dependency on the removed SUs.
  assert(N <= NodeNums.size());
  SUnit *Candidate = &SUnits[SortedNums[SortedNums.size() - N]];

  if (!BarrierChain) {
    BarrierChain = Candidate;
  } else if (Candidate->NodeNum < BarrierChain->NodeNum) {
    // The aliasing and non-aliasing maps are reduced independently but share
    // one BarrierChain, so the candidate only takes over when it is above the
    // existing barrier; otherwise using it could introduce a loop.
    BarrierChain->addPredBarrier(Candidate);
    BarrierChain = Candidate;
    LLVM_DEBUG(dbgs() << "Inserting new barrier chain: SU("
                      << BarrierChain->NodeNum << ").\n");
  } else {
    LLVM_DEBUG(dbgs() << "Keeping old barrier chain: SU("
                      << BarrierChain->NodeNum << ").\n");
  }

  insertBarrierChain(stores);
  insertBarrierChain(loads);

  LLVM_DEBUG(dbgs() << "After reduction:\nStoring SUnits:\n"; stores.dump();
             dbgs() << "Loading SUnits:\n"; loads.dump());
}


static void toggleKills(const MachineRegisterInfo &MRI, LiveRegUnits &LiveRegs,

                        MachineInstr &MI, bool addToLiveRegs) {

  for (MachineOperand &MO : MI.operands()) {

    if (!MO.isReg() || !MO.readsReg())

      continue;

    Register Reg = MO.getReg();

    if (!Reg)

      continue;


    // Things that are available after the instruction are killed by it.

    bool IsKill = LiveRegs.available(Reg);


    // Exception: Do not kill reserved registers

    MO.setIsKill(IsKill && !MRI.isReserved(Reg));

    if (addToLiveRegs)

      LiveRegs.addReg(Reg);

  }

}


/// Recomputes the kill flags of \p MBB by walking it bottom-up while tracking
/// live registers, starting from the block's live-outs.
void ScheduleDAGInstrs::fixupKills(MachineBasicBlock &MBB) {
  LLVM_DEBUG(dbgs() << "Fixup kills for " << printMBBReference(MBB) << '\n');

  LiveRegs.init(*TRI);
  LiveRegs.addLiveOuts(MBB);

  // Visit the block from its last instruction to its first.
  for (MachineInstr &MI : llvm::reverse(MBB)) {
    if (MI.isDebugOrPseudoInstr())
      continue;

    // Update liveness: registers defined by this instruction (or clobbered
    // by one of its register masks) are dead above it.
    for (ConstMIBundleOperands O(MI); O.isValid(); ++O) {
      const MachineOperand &MO = *O;
      if (MO.isRegMask()) {
        LiveRegs.removeRegsNotPreserved(MO.getRegMask());
        continue;
      }
      if (!MO.isReg() || !MO.isDef())
        continue;
      Register Reg = MO.getReg();
      if (!Reg)
        continue;
      LiveRegs.removeReg(Reg);
    }

    // Plain instruction: fix it up and move on.
    if (!MI.isBundled()) {
      toggleKills(MRI, LiveRegs, MI, true);
      continue;
    }

    // Bundled instruction: if there is a bundle header, fix it up first,
    // without adding its registers to the live set.
    MachineBasicBlock::instr_iterator Bundle = MI.getIterator();
    if (MI.isBundle())
      toggleKills(MRI, LiveRegs, MI, false);

    // Some targets make the (questionable) assumption that the instructions
    // inside the bundle are ordered and consequently only the last use of
    // a register inside the bundle can kill it. Hence: advance to the last
    // bundled instruction, then walk back towards the header.
    MachineBasicBlock::instr_iterator I = std::next(Bundle);
    while (I->isBundledWithSucc())
      ++I;
    for (; I != Bundle; --I) {
      if (!I->isDebugOrPseudoInstr())
        toggleKills(MRI, LiveRegs, *I, true);
    }
  }
}


/// Prints the name of \p SU, optionally its top/bottom ready cycles (when
/// SchedPrintCycles is set), and its instruction. Compiled to a no-op unless
/// assertions or LLVM_ENABLE_DUMP are enabled.
void ScheduleDAGInstrs::dumpNode(const SUnit &SU) const {
#if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)
  dumpNodeName(SU);
  if (SchedPrintCycles) {
    dbgs() << " [TopReadyCycle = " << SU.TopReadyCycle;
    dbgs() << ", BottomReadyCycle = " << SU.BotReadyCycle << "]";
  }
  dbgs() << ": ";
  SU.getInstr()->dump();
#endif
}


/// Dumps every node of the DAG: EntrySU first (if it has an instruction),
/// then all SUnits, then ExitSU (if it has an instruction). Compiled to a
/// no-op unless assertions or LLVM_ENABLE_DUMP are enabled.
void ScheduleDAGInstrs::dump() const {
#if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)
  if (EntrySU.getInstr())
    dumpNodeAll(EntrySU);

  for (const SUnit &Node : SUnits)
    dumpNodeAll(Node);

  if (ExitSU.getInstr())
    dumpNodeAll(ExitSU);
#endif
}


std::string ScheduleDAGInstrs::getGraphNodeLabel(const SUnit *SU) const {

  std::string s;

  raw_string_ostream oss(s);

  if (SU == &EntrySU)

    oss << "<entry>";

  else if (SU == &ExitSU)

    oss << "<exit>";

  else

    SU->getInstr()->print(oss, /*IsStandalone=*/true);

  return s;

}


/// Returns "dag." followed by the full name of the basic block. The result is
/// not necessarily unique, since one block can contain several scheduling
/// regions, but that is good enough for visualization.
std::string ScheduleDAGInstrs::getDAGName() const {
  std::string Name = "dag.";
  Name += BB->getFullName();
  return Name;
}


/// Returns true if an edge making \p PredSU a predecessor of \p SuccSU may be
/// added: always for ExitSU, otherwise only when the topological reachability
/// query Topo.IsReachable(PredSU, SuccSU) is false.
bool ScheduleDAGInstrs::canAddEdge(SUnit *SuccSU, SUnit *PredSU) {
  if (SuccSU == &ExitSU)
    return true;
  return !Topo.IsReachable(PredSU, SuccSU);
}


/// Adds \p PredDep as a predecessor edge of \p SuccSU unless doing so would
/// create a cycle. Edges into ExitSU skip the cycle check.
///
/// \returns false if the edge was rejected because it would create a cycle,
/// true otherwise (whether or not a new edge actually had to be inserted).
bool ScheduleDAGInstrs::addEdge(SUnit *SuccSU, const SDep &PredDep) {
  SUnit *PredSU = PredDep.getSUnit();

  if (SuccSU != &ExitSU) {
    // Do not use WillCreateCycle, it assumes SD scheduling.
    // If Pred is reachable from Succ, then the edge creates a cycle.
    const bool CreatesCycle = Topo.IsReachable(PredSU, SuccSU);
    if (CreatesCycle)
      return false;
    Topo.AddPredQueued(SuccSU, PredSU);
  }

  const bool Required = !PredDep.isArtificial();
  SuccSU->addPred(PredDep, Required);
  return true;
}


//===----------------------------------------------------------------------===//

// SchedDFSResult Implementation

//===----------------------------------------------------------------------===//


namespace llvm {


/// Internal state used to compute SchedDFSResult.


class SchedDFSImpl {

  SchedDFSResult &R;


  /// Join DAG nodes into equivalence classes by their subtree.

  IntEqClasses SubtreeClasses;

  /// List PredSU, SuccSU pairs that represent data edges between subtrees.

  std::vector<std::pair<const SUnit *, const SUnit*>> ConnectionPairs;


  struct RootData {

    unsigned NodeID;

    unsigned ParentNodeID;  ///< Parent node (member of the parent subtree).

    unsigned SubInstrCount = 0; ///< Instr count in this tree only, not

                                /// children.


    RootData(unsigned id): NodeID(id),

                           ParentNodeID(SchedDFSResult::InvalidSubtreeID) {}


    unsigned getSparseSetIndex() const { return NodeID; }

  };


  SparseSet<RootData> RootSet;


public:


  SchedDFSImpl(SchedDFSResult &r): R(r), SubtreeClasses(R.DFSNodeData.size()) {

    RootSet.setUniverse(R.DFSNodeData.size());

  }


  /// Returns true if this node been visited by the DFS traversal.

  ///

  /// During visitPostorderNode the Node's SubtreeID is assigned to the Node

  /// ID. Later, SubtreeID is updated but remains valid.


  bool isVisited(const SUnit *SU) const {

    return R.DFSNodeData[SU->NodeNum].SubtreeID

      != SchedDFSResult::InvalidSubtreeID;

  }


  /// Initializes this node's instruction count. We don't need to flag the node

  /// visited until visitPostorder because the DAG cannot have cycles.


  void visitPreorder(const SUnit *SU) {

    R.DFSNodeData[SU->NodeNum].InstrCount =

      SU->getInstr()->isTransient() ? 0 : 1;

  }


  /// Called once for each node after all predecessors are visited. Revisit this

  /// node's predecessors and potentially join them now that we know the ILP of

  /// the other predecessors.


  void visitPostorderNode(const SUnit *SU) {

    // Mark this node as the root of a subtree. It may be joined with its

    // successors later.

    R.DFSNodeData[SU->NodeNum].SubtreeID = SU->NodeNum;

    RootData RData(SU->NodeNum);

    RData.SubInstrCount = SU->getInstr()->isTransient() ? 0 : 1;


    // If any predecessors are still in their own subtree, they either cannot be

    // joined or are large enough to remain separate. If this parent node's

    // total instruction count is not greater than a child subtree by at least

    // the subtree limit, then try to join it now since splitting subtrees is

    // only useful if multiple high-pressure paths are possible.

    unsigned InstrCount = R.DFSNodeData[SU->NodeNum].InstrCount;

    for (const SDep &PredDep : SU->Preds) {

      if (PredDep.getKind() != SDep::Data)

        continue;

      unsigned PredNum = PredDep.getSUnit()->NodeNum;

      if ((InstrCount - R.DFSNodeData[PredNum].InstrCount) < R.SubtreeLimit)

        joinPredSubtree(PredDep, SU, /*CheckLimit=*/false);


      // Either link or merge the TreeData entry from the child to the parent.

      if (R.DFSNodeData[PredNum].SubtreeID == PredNum) {

        // If the predecessor's parent is invalid, this is a tree edge and the

        // current node is the parent.

        if (RootSet[PredNum].ParentNodeID == SchedDFSResult::InvalidSubtreeID)

          RootSet[PredNum].ParentNodeID = SU->NodeNum;

      }

      else if (RootSet.count(PredNum)) {

        // The predecessor is not a root, but is still in the root set. This

        // must be the new parent that it was just joined to. Note that

        // RootSet[PredNum].ParentNodeID may either be invalid or may still be

        // set to the original parent.

        RData.SubInstrCount += RootSet[PredNum].SubInstrCount;

        RootSet.erase(PredNum);

      }

    }

    RootSet[SU->NodeNum] = RData;

  }


  /// Called once for each tree edge after calling visitPostOrderNode on

  /// the predecessor. Increment the parent node's instruction count and

  /// preemptively join this subtree to its parent's if it is small enough.


  void visitPostorderEdge(const SDep &PredDep, const SUnit *Succ) {

    R.DFSNodeData[Succ->NodeNum].InstrCount

      += R.DFSNodeData[PredDep.getSUnit()->NodeNum].InstrCount;

    joinPredSubtree(PredDep, Succ);

  }


  /// Adds a connection for cross edges.


  void visitCrossEdge(const SDep &PredDep, const SUnit *Succ) {

    ConnectionPairs.emplace_back(PredDep.getSUnit(), Succ);

  }


  /// Sets each node's subtree ID to the representative ID and record

  /// connections between trees.


  void finalize() {

    SubtreeClasses.compress();

    R.DFSTreeData.resize(SubtreeClasses.getNumClasses());

    assert(SubtreeClasses.getNumClasses() == RootSet.size()

           && "number of roots should match trees");

    for (const RootData &Root : RootSet) {

      unsigned TreeID = SubtreeClasses[Root.NodeID];

      if (Root.ParentNodeID != SchedDFSResult::InvalidSubtreeID)

        R.DFSTreeData[TreeID].ParentTreeID = SubtreeClasses[Root.ParentNodeID];

      R.DFSTreeData[TreeID].SubInstrCount = Root.SubInstrCount;

      // Note that SubInstrCount may be greater than InstrCount if we joined

      // subtrees across a cross edge. InstrCount will be attributed to the

      // original parent, while SubInstrCount will be attributed to the joined

      // parent.

    }

    R.SubtreeConnections.resize(SubtreeClasses.getNumClasses());

    R.SubtreeConnectLevels.resize(SubtreeClasses.getNumClasses());

    LLVM_DEBUG(dbgs() << R.getNumSubtrees() << " subtrees:\n");

    for (unsigned Idx = 0, End = R.DFSNodeData.size(); Idx != End; ++Idx) {

      R.DFSNodeData[Idx].SubtreeID = SubtreeClasses[Idx];

      LLVM_DEBUG(dbgs() << "  SU(" << Idx << ") in tree "

                        << R.DFSNodeData[Idx].SubtreeID << '\n');

    }

    for (const auto &[Pred, Succ] : ConnectionPairs) {

      unsigned PredTree = SubtreeClasses[Pred->NodeNum];

      unsigned SuccTree = SubtreeClasses[Succ->NodeNum];

      if (PredTree == SuccTree)

        continue;

      unsigned Depth = Pred->getDepth();

      addConnection(PredTree, SuccTree, Depth);

      addConnection(SuccTree, PredTree, Depth);

    }

  }


protected:

  /// Joins the predecessor subtree with the successor that is its DFS parent.

  /// Applies some heuristics before joining.


  bool joinPredSubtree(const SDep &PredDep, const SUnit *Succ,

                       bool CheckLimit = true) {

    assert(PredDep.getKind() == SDep::Data && "Subtrees are for data edges");


    // Check if the predecessor is already joined.

    const SUnit *PredSU = PredDep.getSUnit();

    unsigned PredNum = PredSU->NodeNum;

    if (R.DFSNodeData[PredNum].SubtreeID != PredNum)

      return false;


    // Four is the magic number of successors before a node is considered a

    // pinch point.

    unsigned NumDataSucs = 0;

    for (const SDep &SuccDep : PredSU->Succs) {

      if (SuccDep.getKind() == SDep::Data) {

        if (++NumDataSucs >= 4)

          return false;

      }

    }

    if (CheckLimit && R.DFSNodeData[PredNum].InstrCount > R.SubtreeLimit)

      return false;

    R.DFSNodeData[PredNum].SubtreeID = Succ->NodeNum;

    SubtreeClasses.join(Succ->NodeNum, PredNum);

    return true;

  }


  /// Called by finalize() to record a connection between trees.


  void addConnection(unsigned FromTree, unsigned ToTree, unsigned Depth) {

    if (!Depth)

      return;


    do {

      SmallVectorImpl<SchedDFSResult::Connection> &Connections =

        R.SubtreeConnections[FromTree];

      for (SchedDFSResult::Connection &C : Connections) {

        if (C.TreeID == ToTree) {

          C.Level = std::max(C.Level, Depth);

          return;

        }

      }

      Connections.push_back(SchedDFSResult::Connection(ToTree, Depth));

      FromTree = R.DFSTreeData[FromTree].ParentTreeID;

    } while (FromTree != SchedDFSResult::InvalidSubtreeID);

  }


};


} // end namespace llvm


namespace {


/// Manage the stack used by a reverse depth-first search over the DAG.

class SchedDAGReverseDFS {

  std::vector<std::pair<const SUnit *, SUnit::const_pred_iterator>> DFSStack;


public:

  bool isComplete() const { return DFSStack.empty(); }


  void follow(const SUnit *SU) {

    DFSStack.emplace_back(SU, SU->Preds.begin());

  }

  void advance() { ++DFSStack.back().second; }


  const SDep *backtrack() {

    DFSStack.pop_back();

    return DFSStack.empty() ? nullptr : std::prev(DFSStack.back().second);

  }


  const SUnit *getCurr() const { return DFSStack.back().first; }


  SUnit::const_pred_iterator getPred() const { return DFSStack.back().second; }


  SUnit::const_pred_iterator getPredEnd() const {

    return getCurr()->Preds.end();

  }

};


} // end anonymous namespace


static bool hasDataSucc(const SUnit *SU) {

  for (const SDep &SuccDep : SU->Succs) {

    if (SuccDep.getKind() == SDep::Data &&

        !SuccDep.getSUnit()->isBoundaryNode())

      return true;

  }

  return false;

}


/// Computes an ILP metric for all nodes in the subDAG reachable via depth-first
/// search from each root, where a root is an unvisited node without a
/// non-boundary data successor. Only the bottom-up direction is implemented.
void SchedDFSResult::compute(ArrayRef<SUnit> SUnits) {
  if (!IsBottomUp)
    llvm_unreachable("Top-down ILP metric is unimplemented");

  SchedDFSImpl Impl(*this);
  for (const SUnit &Root : SUnits) {
    if (Impl.isVisited(&Root) || hasDataSucc(&Root))
      continue;

    SchedDAGReverseDFS DFS;
    Impl.visitPreorder(&Root);
    DFS.follow(&Root);
    do {
      // Descend along the leftmost unexplored path as far as possible.
      while (DFS.getPred() != DFS.getPredEnd()) {
        const SDep &Edge = *DFS.getPred();
        DFS.advance();

        // Only data edges to non-boundary nodes take part in the search.
        const SUnit *PredSU = Edge.getSUnit();
        if (Edge.getKind() != SDep::Data || PredSU->isBoundaryNode())
          continue;

        if (Impl.isVisited(PredSU)) {
          // An already visited edge is a cross edge, assuming an acyclic DAG.
          Impl.visitCrossEdge(Edge, DFS.getCurr());
        } else {
          Impl.visitPreorder(PredSU);
          DFS.follow(PredSU);
        }
      }

      // The top of the stack is finished: visit it in postorder, then the
      // tree edge that led to it (if any).
      const SUnit *Finished = DFS.getCurr();
      const SDep *TreeEdge = DFS.backtrack();
      Impl.visitPostorderNode(Finished);
      if (TreeEdge)
        Impl.visitPostorderEdge(*TreeEdge, DFS.getCurr());
    } while (!DFS.isComplete());
  }
  Impl.finalize();
}


/// The root of the given SubtreeID was just scheduled. For every subtree
/// connected to it, raise that subtree's recorded connection level to the
/// level of this connection if it is higher, so that the nearest connected
/// subtrees can be prioritized.
void SchedDFSResult::scheduleTree(unsigned SubtreeID) {
  for (const Connection &Link : SubtreeConnections[SubtreeID]) {
    unsigned &Level = SubtreeConnectLevels[Link.TreeID];
    Level = std::max(Level, Link.Level);
    LLVM_DEBUG(dbgs() << "  Tree: " << Link.TreeID << " @"
                      << SubtreeConnectLevels[Link.TreeID] << '\n');
  }
}


#if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)


/// Prints the value as "InstrCount / Length = <ratio>"; when Length is zero
/// the ratio is replaced by "BADILP".
LLVM_DUMP_METHOD void ILPValue::print(raw_ostream &OS) const {
  OS << InstrCount << " / " << Length << " = ";
  if (Length == 0) {
    OS << "BADILP";
    return;
  }
  OS << format("%g", static_cast<double>(InstrCount) / Length);
}


/// Prints this value followed by a newline to dbgs().
LLVM_DUMP_METHOD void ILPValue::dump() const {
  print(dbgs());
  dbgs() << '\n';
}


/// Streams \p Val to \p OS using ILPValue::print and returns \p OS so that
/// insertions can be chained.
LLVM_ATTRIBUTE_UNUSED
raw_ostream &llvm::operator<<(raw_ostream &OS, const ILPValue &Val) {
  Val.print(OS);
  return OS;
}


#endif

SubReg
unsigned SubReg
Definition AArch64AdvSIMDScalarPass.cpp:102

MRI
unsigned const MachineRegisterInfo * MRI
Definition AArch64AdvSIMDScalarPass.cpp:103

assert
assert(UImm &&(UImm !=~static_cast< T >(0)) &&"Invalid immediate!")

none
@ none
Definition AArch64StackTagging.cpp:81

UseAA
static cl::opt< bool > UseAA("aarch64-use-aa", cl::init(true), cl::desc("Enable the use of AA during codegen."))

MBB
MachineBasicBlock & MBB
Definition ARMSLSHardening.cpp:71

DL
MachineBasicBlock MachineBasicBlock::iterator DebugLoc DL
Definition ARMSLSHardening.cpp:73

AliasAnalysis.h

B
static GCRegistry::Add< OcamlGC > B("ocaml", "ocaml 3.10-compatible GC")

Casting.h

CommandLine.h

Compiler.h

LLVM_DUMP_METHOD
#define LLVM_DUMP_METHOD
Mark debug helper function definitions like dump() that should not be stripped from debug builds.
Definition Compiler.h:638

LLVM_ATTRIBUTE_UNUSED
#define LLVM_ATTRIBUTE_UNUSED
Definition Compiler.h:298

Constants.h
This file contains the declarations for the subclasses of Constant, which represent the different fla...

InstrCount
static unsigned InstrCount
Definition DFAPacketizer.cpp:51

Format.h

UseReg
static Register UseReg(const MachineOperand &MO)
Definition HexagonCopyToCombine.cpp:245

loads
hexagon widen Hexagon Store false hexagon widen loads
Definition HexagonLoadStoreWidening.cpp:193

stores
hexagon widen stores
Definition HexagonLoadStoreWidening.cpp:187

MI
IRTranslator LLVM IR MI
Definition IRTranslator.cpp:110

Function.h

Type.h

Value.h

IntEqClasses.h
Equivalence classes for small integers.

LaneBitmask.h
A common definition of LaneBitmask for use in TableGen and CodeGen.

LiveIntervals.h

LivePhysRegs.h
This file implements the LivePhysRegs utility for tracking liveness of physical registers.

MCRegisterInfo.h

I
#define I(x, y, z)
Definition MD5.cpp:58

MachineBasicBlock.h

MachineFrameInfo.h

MachineFunction.h

MachineInstrBundle.h

MachineInstr.h

MachineMemOperand.h

MachineOperand.h

MachineRegisterInfo.h

Reg
Register Reg
Definition MachineSink.cpp:2117

MapVector.h
This file implements a map that provides insertion order iteration.

OpIdx
MachineInstr unsigned OpIdx
Definition NVPTXPrologEpilogPass.cpp:56

P
#define P(N)

PseudoSourceValue.h

RegisterPressure.h

toggleKills
static void toggleKills(const MachineRegisterInfo &MRI, LiveRegUnits &LiveRegs, MachineInstr &MI, bool addToLiveRegs)
Definition ScheduleDAGInstrs.cpp:1125

ReductionSize
static cl::opt< unsigned > ReductionSize("dag-maps-reduction-size", cl::Hidden, cl::desc("A huge scheduling region will have maps reduced by this many " "nodes at a time. Defaults to HugeRegion / 2."))

getUnderlyingObjectsForInstr
static bool getUnderlyingObjectsForInstr(const MachineInstr *MI, const MachineFrameInfo &MFI, UnderlyingObjectsVector &Objects, const DataLayout &DL)
If this machine instr has memory reference information and it can be tracked to a normal reference to...
Definition ScheduleDAGInstrs.cpp:139

hasDataSucc
static bool hasDataSucc(const SUnit *SU)
Definition ScheduleDAGInstrs.cpp:1475

EnableSchedModel
static cl::opt< bool > EnableSchedModel("schedmodel", cl::Hidden, cl::init(true), cl::desc("Use TargetSchedModel for latency lookup"))

EnableAASchedMI
static cl::opt< bool > EnableAASchedMI("enable-aa-sched-mi", cl::Hidden, cl::desc("Enable use of AA during MI DAG construction"))

HugeRegion
static cl::opt< unsigned > HugeRegion("dag-maps-huge-region", cl::Hidden, cl::init(1000), cl::desc("The limit to use while constructing the DAG " "prior to scheduling, at which point a trade-off " "is made to avoid excessive compile time."))

getReductionSize
static unsigned getReductionSize()
Definition ScheduleDAGInstrs.cpp:102

dumpSUList
static void dumpSUList(const ScheduleDAGInstrs::SUList &L)
Definition ScheduleDAGInstrs.cpp:110

UseTBAA
static cl::opt< bool > UseTBAA("use-tbaa-in-sched-mi", cl::Hidden, cl::init(true), cl::desc("Enable use of TBAA during MI DAG construction"))

EnableSchedItins
static cl::opt< bool > EnableSchedItins("scheditins", cl::Hidden, cl::init(true), cl::desc("Use InstrItineraryData for latency lookup"))

SchedPrintCycles
static cl::opt< bool > SchedPrintCycles("sched-print-cycles", cl::Hidden, cl::init(false), cl::desc("Report top/bottom cycles when dumping SUnit instances"))

ScheduleDAGInstrs.h

ScheduleDAG.h

ScheduleDFS.h

SlotIndexes.h

SmallVector.h
This file defines the SmallVector class.

SparseSet.h
This file defines the SparseSet class derived from the version described in Briggs,...

Debug.h

LLVM_DEBUG
#define LLVM_DEBUG(...)
Definition Debug.h:114

TargetInstrInfo.h

TargetRegisterInfo.h

TargetSubtargetInfo.h

ValueTracking.h

getFunction
static Function * getFunction(FunctionType *Ty, const Twine &Name, Module *M)
Definition WebAssemblyLowerEmscriptenEHSjLj.cpp:442

LiveRegs

llvm::ScheduleDAGInstrs::Value2SUsMap
Definition ScheduleDAGInstrs.cpp:640

llvm::ScheduleDAGInstrs::Value2SUsMap::reComputeSize
void reComputeSize()
Counts the number of SUs in this map after a reduction.
Definition ScheduleDAGInstrs.cpp:682

llvm::ScheduleDAGInstrs::Value2SUsMap::insert
void insert(SUnit *SU, ValueType V)
Adds SU to the SUList of V.
Definition ScheduleDAGInstrs.cpp:657

llvm::ScheduleDAGInstrs::Value2SUsMap::dump
void dump()
Definition ScheduleDAGInstrs.cpp:1057

llvm::ScheduleDAGInstrs::Value2SUsMap::clear
void clear()
Clears map from all contents.
Definition ScheduleDAGInstrs.cpp:674

llvm::ScheduleDAGInstrs::Value2SUsMap::Value2SUsMap
Value2SUsMap(unsigned lat=0)
Definition ScheduleDAGInstrs.cpp:648

llvm::ScheduleDAGInstrs::Value2SUsMap::clearList
void clearList(ValueType V)
Clears the list of SUs mapped to V.
Definition ScheduleDAGInstrs.cpp:663

llvm::ScheduleDAGInstrs::Value2SUsMap::size
unsigned size() const
Definition ScheduleDAGInstrs.cpp:679

llvm::ScheduleDAGInstrs::Value2SUsMap::operator[]
ValueType & operator[](const SUList &Key)
To keep NumNodes up to date, insert() is used instead of this operator with push_back().
Definition ScheduleDAGInstrs.cpp:652

llvm::ScheduleDAGInstrs::Value2SUsMap::getTrueMemOrderLatency
unsigned getTrueMemOrderLatency() const
Definition ScheduleDAGInstrs.cpp:688

llvm::AAResults
Definition AliasAnalysis.h:318

llvm::ArrayRef
ArrayRef - Represent a constant reference to an array (0 or more elements consecutively in memory),...
Definition ArrayRef.h:41

llvm::ConstMIBundleOperands
ConstMIBundleOperands - Iterate over all operands in a const bundle of machine instructions.
Definition MachineInstrBundle.h:189

llvm::DataLayout
A parsed version of the target data layout string, and methods for querying it.
Definition DataLayout.h:63

llvm::IntEqClasses
Definition IntEqClasses.h:29

llvm::LiveIntervals
Definition LiveIntervals.h:55

llvm::LiveIntervals::getInstructionIndex
SlotIndex getInstructionIndex(const MachineInstr &Instr) const
Returns the base index of the given instruction.
Definition LiveIntervals.h:247

llvm::LiveRegUnits
A set of register units used to track register liveness.
Definition LiveRegUnits.h:31

llvm::MCInstrDesc
Describe properties that are true of each instruction in the target description file.
Definition MCInstrDesc.h:210

llvm::MCInstrDesc::getNumOperands
unsigned getNumOperands() const
Return the number of declared MachineOperands for this MachineInstruction.
Definition MCInstrDesc.h:249

llvm::MCInstrDesc::hasImplicitUseOfPhysReg
bool hasImplicitUseOfPhysReg(MCRegister Reg) const
Return true if this instruction implicitly uses the specified physical register.
Definition MCInstrDesc.h:600

llvm::MCInstrDesc::hasImplicitDefOfPhysReg
LLVM_ABI bool hasImplicitDefOfPhysReg(MCRegister Reg, const MCRegisterInfo *MRI=nullptr) const
Return true if this instruction implicitly defines the specified physical register.
Definition MCInstrDesc.cpp:32

llvm::MCRegUnitMaskIterator
MCRegUnitMaskIterator enumerates a list of register units and their associated lane masks for Reg.
Definition MCRegisterInfo.h:674

llvm::MCRegUnitMaskIterator::isValid
bool isValid() const
Returns true if this iterator is not yet at the end.
Definition MCRegisterInfo.h:695

llvm::MachineBasicBlock
Definition MachineBasicBlock.h:122

llvm::MachineBasicBlock::instr_iterator
Instructions::iterator instr_iterator
Definition MachineBasicBlock.h:336

llvm::MachineBasicBlock::iterator
MachineInstrBundleIterator< MachineInstr > iterator
Definition MachineBasicBlock.h:341

llvm::MachineFrameInfo
The MachineFrameInfo class represents an abstract stack frame until prolog/epilog code is inserted.
Definition MachineFrameInfo.h:111

llvm::MachineFrameInfo::hasTailCall
bool hasTailCall() const
Returns true if the function contains a tail call.
Definition MachineFrameInfo.h:662

llvm::MachineFunction
Definition MachineFunction.h:286

llvm::MachineFunction::getSubtarget
const TargetSubtargetInfo & getSubtarget() const
getSubtarget - Return the subtarget for which this machine code is being compiled.
Definition MachineFunction.h:762

llvm::MachineInstr
Representation of each machine instruction.
Definition MachineInstr.h:72

llvm::MachineInstr::isBarrier
bool isBarrier(QueryType Type=AnyInBundle) const
Returns true if the specified instruction stops control flow from executing the instruction immediate...
Definition MachineInstr.h:965

llvm::MachineInstr::isCall
bool isCall(QueryType Type=AnyInBundle) const
Definition MachineInstr.h:948

llvm::MachineInstr::mayAlias
LLVM_ABI bool mayAlias(BatchAAResults *AA, const MachineInstr &Other, bool UseTBAA) const
Returns true if this instruction's memory access aliases the memory access of Other.
Definition MachineInstr.cpp:1514

llvm::MachineInstr::getDesc
const MCInstrDesc & getDesc() const
Returns the target instruction descriptor of this MachineInstr.
Definition MachineInstr.h:584

llvm::MachineInstr::print
LLVM_ABI void print(raw_ostream &OS, bool IsStandalone=true, bool SkipOpers=false, bool SkipDebugLoc=false, bool AddNewLine=true, const TargetInstrInfo *TII=nullptr) const
Print this MI to OS.
Definition MachineInstr.cpp:1770

llvm::MachineInstr::all_uses
filtered_mop_range all_uses()
Returns an iterator range over all operands that are (explicit or implicit) register uses.
Definition MachineInstr.h:764

llvm::MachineInstr::isTransient
bool isTransient() const
Return true if this is a transient instruction that is either very likely to be eliminated during reg...
Definition MachineInstr.h:1460

llvm::MachineInstr::dump
LLVM_ABI void dump() const
Definition MachineInstr.cpp:1733

llvm::MachineInstr::getOperand
const MachineOperand & getOperand(unsigned i) const
Definition MachineInstr.h:595

llvm::MachineLoopInfo
Definition MachineLoopInfo.h:109

llvm::MachineMemOperand
A description of a memory reference used in the backend.
Definition MachineMemOperand.h:130

llvm::MachineOperand
MachineOperand class - Representation of each machine instruction operand.
Definition MachineOperand.h:48

llvm::MachineOperand::getSubReg
unsigned getSubReg() const
Definition MachineOperand.h:373

llvm::MachineOperand::isUndef
bool isUndef() const
Definition MachineOperand.h:403

llvm::MachineOperand::readsReg
bool readsReg() const
readsReg - Returns true if this operand reads the previous value of its register.
Definition MachineOperand.h:466

llvm::MachineOperand::isReg
bool isReg() const
isReg - Tests if this is a MO_Register operand.
Definition MachineOperand.h:328

llvm::MachineOperand::isRegMask
bool isRegMask() const
isRegMask - Tests if this is a MO_RegisterMask operand.
Definition MachineOperand.h:352

llvm::MachineOperand::isUse
bool isUse() const
Definition MachineOperand.h:378

llvm::MachineOperand::isDef
bool isDef() const
Definition MachineOperand.h:383

llvm::MachineOperand::setIsKill
void setIsKill(bool Val=true)
Definition MachineOperand.h:519

llvm::MachineOperand::isDead
bool isDead() const
Definition MachineOperand.h:393

llvm::MachineOperand::setIsUndef
void setIsUndef(bool Val=true)
Definition MachineOperand.h:530

llvm::MachineOperand::getReg
Register getReg() const
getReg - Returns the register number.
Definition MachineOperand.h:368

llvm::MachineOperand::getRegMask
const uint32_t * getRegMask() const
getRegMask - Returns a bit mask of registers preserved by this RegMask operand.
Definition MachineOperand.h:660

llvm::MachineRegisterInfo
MachineRegisterInfo - Keep track of information for virtual and physical registers,...
Definition MachineRegisterInfo.h:53

llvm::MapVector< ValueType, SUList, SmallDenseMap< ValueType, unsigned, N >, SmallVector< std::pair< ValueType, SUList >, N > >::iterator
typename SmallVector< std::pair< ValueType, SUList >, N >::iterator iterator
Definition MapVector.h:42

llvm::MapVector::end
iterator end()
Definition MapVector.h:67

llvm::MapVector::operator[]
ValueT & operator[](const KeyT &Key)
Definition MapVector.h:98

llvm::MapVector< ValueType, SUList, SmallDenseMap< ValueType, unsigned, N >, SmallVector< std::pair< ValueType, SUList >, N > >::find
iterator find(const ValueType &Key)
Definition MapVector.h:149

llvm::MapVector::begin
iterator begin()
Definition MapVector.h:65

llvm::MapVector::remove_if
void remove_if(Function Pred)
Definition MapVector.h:232

llvm::MapVector< KeyT, ValueT, SmallDenseMap< KeyT, unsigned, N >, SmallVector< std::pair< KeyT, ValueT >, N > >::clear
void clear()
Definition MapVector.h:88

llvm::PressureDiffs
Array of PressureDiffs.
Definition RegisterPressure.h:200

llvm::PressureDiffs::addInstruction
LLVM_ABI void addInstruction(unsigned Idx, const RegisterOperands &RegOpers, const MachineRegisterInfo &MRI)
Record pressure difference induced by the given operand list to node with index Idx.
Definition RegisterPressure.cpp:645

llvm::PressureDiffs::init
LLVM_ABI void init(unsigned N)
Initialize an array of N PressureDiffs.
Definition RegisterPressure.cpp:634

llvm::PseudoSourceValue
Special value supplied for machine level alias analysis.
Definition PseudoSourceValue.h:33

llvm::RegPressureTracker
Track the current register pressure at some position in the instruction stream, and remember the high...
Definition RegisterPressure.h:361

llvm::RegPressureTracker::recede
LLVM_ABI void recede(SmallVectorImpl< VRegMaskOrUnit > *LiveUses=nullptr)
Recede across the previous instruction.
Definition RegisterPressure.cpp:859

llvm::RegPressureTracker::recedeSkipDebugValues
LLVM_ABI void recedeSkipDebugValues()
Recede until we find an instruction which is not a DebugValue.
Definition RegisterPressure.cpp:838

llvm::RegPressureTracker::getPos
MachineBasicBlock::const_iterator getPos() const
Get the MI position corresponding to this register pressure.
Definition RegisterPressure.h:417

llvm::RegisterOperands
List of registers defined and used by a machine instruction.
Definition RegisterPressure.h:167

llvm::RegisterOperands::collect
LLVM_ABI void collect(const MachineInstr &MI, const TargetRegisterInfo &TRI, const MachineRegisterInfo &MRI, bool TrackLaneMasks, bool IgnoreDead)
Analyze the given instruction MI and fill in the Uses, Defs and DeadDefs list based on the MachineOpe...
Definition RegisterPressure.cpp:562

llvm::RegisterOperands::adjustLaneLiveness
LLVM_ABI void adjustLaneLiveness(const LiveIntervals &LIS, const MachineRegisterInfo &MRI, SlotIndex Pos, MachineInstr *AddFlagsMI=nullptr)
Use liveness information to find out which uses/defs are partially undefined/dead and adjust the VReg...
Definition RegisterPressure.cpp:593

llvm::Register
Wrapper class representing virtual and physical registers.
Definition Register.h:19

llvm::SDep
Scheduling dependency.
Definition ScheduleDAG.h:51

llvm::SDep::getSUnit
SUnit * getSUnit() const
Definition ScheduleDAG.h:507

llvm::SDep::getKind
Kind getKind() const
Returns an enum value representing the kind of the dependence.
Definition ScheduleDAG.h:513

llvm::SDep::Kind
Kind
These are the different kinds of scheduling dependencies.
Definition ScheduleDAG.h:54

llvm::SDep::Output
@ Output
A register output-dependence (aka WAW).
Definition ScheduleDAG.h:57

llvm::SDep::Anti
@ Anti
A register anti-dependence (aka WAR).
Definition ScheduleDAG.h:56

llvm::SDep::Data
@ Data
Regular data dependence (aka true-dependence).
Definition ScheduleDAG.h:55

llvm::SDep::setLatency
void setLatency(unsigned Lat)
Sets the latency for this edge.
Definition ScheduleDAG.h:147

llvm::SDep::Artificial
@ Artificial
Arbitrary strong DAG edge (no real dependence).
Definition ScheduleDAG.h:74

llvm::SDep::MayAliasMem
@ MayAliasMem
Nonvolatile load/store instructions that may alias.
Definition ScheduleDAG.h:72

llvm::SDep::isArtificial
bool isArtificial() const
Tests if this is an Order dependence that is marked as "artificial", meaning it isn't necessary for c...
Definition ScheduleDAG.h:200

llvm::SUnit
Scheduling unit. This is a node in the scheduling DAG.
Definition ScheduleDAG.h:249

llvm::SUnit::isCall
bool isCall
Is a function call.
Definition ScheduleDAG.h:296

llvm::SUnit::NumSuccs
unsigned NumSuccs
Definition ScheduleDAG.h:280

llvm::SUnit::TopReadyCycle
unsigned TopReadyCycle
Cycle relative to start when node is ready.
Definition ScheduleDAG.h:285

llvm::SUnit::NodeNum
unsigned NodeNum
Entry # of node in the node vector.
Definition ScheduleDAG.h:277

llvm::SUnit::isUnbuffered
bool isUnbuffered
Uses an unbuffered resource.
Definition ScheduleDAG.h:309

llvm::SUnit::const_pred_iterator
SmallVectorImpl< SDep >::const_iterator const_pred_iterator
Definition ScheduleDAG.h:274

llvm::SUnit::Latency
unsigned short Latency
Node latency.
Definition ScheduleDAG.h:312

llvm::SUnit::isBoundaryNode
bool isBoundaryNode() const
Boundary nodes are placeholders for the boundary of the scheduling region.
Definition ScheduleDAG.h:367

llvm::SUnit::hasPhysRegDefs
bool hasPhysRegDefs
Has physreg defs that are being used.
Definition ScheduleDAG.h:301

llvm::SUnit::BotReadyCycle
unsigned BotReadyCycle
Cycle relative to end when node is ready.
Definition ScheduleDAG.h:286

llvm::SUnit::Succs
SmallVector< SDep, 4 > Succs
All sunit successors.
Definition ScheduleDAG.h:270

llvm::SUnit::hasReservedResource
bool hasReservedResource
Uses a reserved resource.
Definition ScheduleDAG.h:310

llvm::SUnit::isCommutable
bool isCommutable
Is a commutable instruction.
Definition ScheduleDAG.h:299

llvm::SUnit::hasPhysRegUses
bool hasPhysRegUses
Has physreg uses.
Definition ScheduleDAG.h:300

llvm::SUnit::Preds
SmallVector< SDep, 4 > Preds
All sunit predecessors.
Definition ScheduleDAG.h:269

llvm::SUnit::addPred
LLVM_ABI bool addPred(const SDep &D, bool Required=true)
Adds the specified edge as a pred of the current node if not already.
Definition ScheduleDAG.cpp:106

llvm::SUnit::getInstr
MachineInstr * getInstr() const
Returns the representative MachineInstr for this SUnit.
Definition ScheduleDAG.h:399

llvm::SchedDFSImpl::visitPostorderNode
void visitPostorderNode(const SUnit *SU)
Called once for each node after all predecessors are visited.
Definition ScheduleDAGInstrs.cpp:1305

llvm::SchedDFSImpl::joinPredSubtree
bool joinPredSubtree(const SDep &PredDep, const SUnit *Succ, bool CheckLimit=true)
Joins the predecessor subtree with the successor that is its DFS parent.
Definition ScheduleDAGInstrs.cpp:1397

llvm::SchedDFSImpl::addConnection
void addConnection(unsigned FromTree, unsigned ToTree, unsigned Depth)
Called by finalize() to record a connection between trees.
Definition ScheduleDAGInstrs.cpp:1424

llvm::SchedDFSImpl::finalize
void finalize()
Sets each node's subtree ID to the representative ID and records connections between trees.
Definition ScheduleDAGInstrs.cpp:1360

llvm::SchedDFSImpl::visitCrossEdge
void visitCrossEdge(const SDep &PredDep, const SUnit *Succ)
Adds a connection for cross edges.
Definition ScheduleDAGInstrs.cpp:1354

llvm::SchedDFSImpl::visitPostorderEdge
void visitPostorderEdge(const SDep &PredDep, const SUnit *Succ)
Called once for each tree edge after calling visitPostorderNode on the predecessor.
Definition ScheduleDAGInstrs.cpp:1347

llvm::SchedDFSImpl::visitPreorder
void visitPreorder(const SUnit *SU)
Initializes this node's instruction count.
Definition ScheduleDAGInstrs.cpp:1297

llvm::SchedDFSImpl::isVisited
bool isVisited(const SUnit *SU) const
Returns true if this node has been visited by the DFS traversal.
Definition ScheduleDAGInstrs.cpp:1290

llvm::SchedDFSImpl::SchedDFSImpl
SchedDFSImpl(SchedDFSResult &r)
Definition ScheduleDAGInstrs.cpp:1282

llvm::SchedDFSResult
Compute the values of each DAG node for various metrics during DFS.
Definition ScheduleDFS.h:65

llvm::SchedDFSResult::SchedDFSImpl
friend class SchedDFSImpl
Definition ScheduleDFS.h:66

llvm::SchedDFSResult::compute
void compute(ArrayRef< SUnit > SUnits)
Compute various metrics for the DAG with given roots.
Definition ScheduleDAGInstrs.cpp:1486

llvm::SchedDFSResult::scheduleTree
void scheduleTree(unsigned SubtreeID)
Scheduler callback to update SubtreeConnectLevels when a tree is initially scheduled.
Definition ScheduleDAGInstrs.cpp:1532

llvm::ScheduleDAGInstrs::LiveRegs
LiveRegUnits LiveRegs
Set of live physical registers for updating kill flags.
Definition ScheduleDAGInstrs.h:273

llvm::ScheduleDAGInstrs::MISUnitMap
DenseMap< MachineInstr *, SUnit * > MISUnitMap
After calling buildSchedGraph, each machine instruction in the current scheduling region is mapped to...
Definition ScheduleDAGInstrs.h:158

llvm::ScheduleDAGInstrs::addVRegUseDeps
void addVRegUseDeps(SUnit *SU, unsigned OperIdx)
Adds a register data dependency if the instruction that defines the virtual register used at OperIdx ...
Definition ScheduleDAGInstrs.cpp:545

llvm::ScheduleDAGInstrs::addVRegDefDeps
void addVRegDefDeps(SUnit *SU, unsigned OperIdx)
Adds register output and data dependencies from this SUnit to instructions that occur later in the sa...
Definition ScheduleDAGInstrs.cpp:425

llvm::ScheduleDAGInstrs::finishBlock
virtual void finishBlock()
Cleans up after scheduling in the given block.
Definition ScheduleDAGInstrs.cpp:193

llvm::ScheduleDAGInstrs::end
MachineBasicBlock::iterator end() const
Returns an iterator to the bottom of the current scheduling region.
Definition ScheduleDAGInstrs.h:306

llvm::ScheduleDAGInstrs::getDAGName
std::string getDAGName() const override
Returns a label for the region of code covered by the DAG.
Definition ScheduleDAGInstrs.cpp:1231

llvm::ScheduleDAGInstrs::BB
MachineBasicBlock * BB
The block in which to insert instructions.
Definition ScheduleDAGInstrs.h:145

llvm::ScheduleDAGInstrs::FirstDbgValue
MachineInstr * FirstDbgValue
Definition ScheduleDAGInstrs.h:270

llvm::ScheduleDAGInstrs::startBlock
virtual void startBlock(MachineBasicBlock *BB)
Prepares to perform scheduling in the given block.
Definition ScheduleDAGInstrs.cpp:189

llvm::ScheduleDAGInstrs::CanHandleTerminators
bool CanHandleTerminators
The standard DAG builder does not normally include terminators as DAG nodes because it does not creat...
Definition ScheduleDAGInstrs.h:136

llvm::ScheduleDAGInstrs::addBarrierChain
void addBarrierChain(Value2SUsMap &map)
Adds barrier chain edges from all SUs in map, and then clears the map.
Definition ScheduleDAGInstrs.cpp:711

llvm::ScheduleDAGInstrs::reduceHugeMemNodeMaps
void reduceHugeMemNodeMaps(Value2SUsMap &stores, Value2SUsMap &loads, unsigned N)
Reduces maps in FIFO order, by N SUs.
Definition ScheduleDAGInstrs.cpp:1075

llvm::ScheduleDAGInstrs::addPhysRegDeps
void addPhysRegDeps(SUnit *SU, unsigned OperIdx)
Adds register dependencies (data, anti, and output) from this SUnit to following instructions in the ...
Definition ScheduleDAGInstrs.cpp:315

llvm::ScheduleDAGInstrs::RegionEnd
MachineBasicBlock::iterator RegionEnd
The end of the range to be scheduled.
Definition ScheduleDAGInstrs.h:151

llvm::ScheduleDAGInstrs::CurrentVRegUses
VReg2SUnitOperIdxMultiMap CurrentVRegUses
Tracks the last instructions in this region using each virtual register.
Definition ScheduleDAGInstrs.h:175

llvm::ScheduleDAGInstrs::addChainDependencies
void addChainDependencies(SUnit *SU, SUList &SUs, unsigned Latency)
Adds dependencies as needed from all SUs in list to SU.
Definition ScheduleDAGInstrs.h:231

llvm::ScheduleDAGInstrs::getSchedClass
const MCSchedClassDesc * getSchedClass(SUnit *SU) const
Resolves and caches the scheduling class for an SUnit.
Definition ScheduleDAGInstrs.h:286

llvm::ScheduleDAGInstrs::fixupKills
void fixupKills(MachineBasicBlock &MBB)
Fixes register kill flags that scheduling has made invalid.
Definition ScheduleDAGInstrs.cpp:1144

llvm::ScheduleDAGInstrs::addPhysRegDataDeps
void addPhysRegDataDeps(SUnit *SU, unsigned OperIdx)
MO is an operand of SU's instruction that defines a physical register.
Definition ScheduleDAGInstrs.cpp:259

llvm::ScheduleDAGInstrs::ScheduleDAGInstrs
ScheduleDAGInstrs(MachineFunction &mf, const MachineLoopInfo *mli, bool RemoveKillFlags=false)
Definition ScheduleDAGInstrs.cpp:122

llvm::ScheduleDAGInstrs::getLaneMaskForMO
LaneBitmask getLaneMaskForMO(const MachineOperand &MO) const
Returns a mask for which lanes get read/written by the given (register) machine operand.
Definition ScheduleDAGInstrs.cpp:398

llvm::ScheduleDAGInstrs::DbgValues
DbgValueVector DbgValues
Remember instruction that precedes DBG_VALUE.
Definition ScheduleDAGInstrs.h:269

llvm::ScheduleDAGInstrs::newSUnit
SUnit * newSUnit(MachineInstr *MI)
Creates a new SUnit and returns a pointer to it.
Definition ScheduleDAGInstrs.h:413

llvm::ScheduleDAGInstrs::initSUnits
void initSUnits()
Creates an SUnit for each real instruction, numbered in top-down topological order.
Definition ScheduleDAGInstrs.cpp:593

llvm::ScheduleDAGInstrs::addEdge
bool addEdge(SUnit *SuccSU, const SDep &PredDep)
Add a DAG edge to the given SU with the given predecessor dependence data.
Definition ScheduleDAGInstrs.cpp:1239

llvm::ScheduleDAGInstrs::Topo
ScheduleDAGTopologicalSort Topo
Topo - A topological ordering for SUnits which permits fast IsReachable and similar queries.
Definition ScheduleDAGInstrs.h:262

llvm::ScheduleDAGInstrs::SUList
std::list< SUnit * > SUList
A list of SUnits, used in Value2SUsMap, during DAG construction.
Definition ScheduleDAGInstrs.h:192

llvm::ScheduleDAGInstrs::BarrierChain
SUnit * BarrierChain
Remember a generic side-effecting instruction as we proceed.
Definition ScheduleDAGInstrs.h:182

llvm::ScheduleDAGInstrs::getAAForDep
BatchAAResults * getAAForDep() const
Returns a (possibly null) pointer to the current BatchAAResults.
Definition ScheduleDAGInstrs.h:212

llvm::ScheduleDAGInstrs::TrackLaneMasks
bool TrackLaneMasks
Whether lane masks should get tracked.
Definition ScheduleDAGInstrs.h:139

llvm::ScheduleDAGInstrs::dumpNode
void dumpNode(const SUnit &SU) const override
Definition ScheduleDAGInstrs.cpp:1195

llvm::ScheduleDAGInstrs::Defs
RegUnit2SUnitsMap Defs
Defs, Uses - Remember where defs and uses of each register are as we iterate upward through the instr...
Definition ScheduleDAGInstrs.h:167

llvm::ScheduleDAGInstrs::UnknownValue
UndefValue * UnknownValue
For an unanalyzable memory access, this Value is used in maps.
Definition ScheduleDAGInstrs.h:257

llvm::ScheduleDAGInstrs::CurrentVRegDefs
VReg2SUnitMultiMap CurrentVRegDefs
Tracks the last instruction(s) in this region defining each virtual register.
Definition ScheduleDAGInstrs.h:173

llvm::ScheduleDAGInstrs::begin
MachineBasicBlock::iterator begin() const
Returns an iterator to the top of the current scheduling region.
Definition ScheduleDAGInstrs.h:303

llvm::ScheduleDAGInstrs::buildSchedGraph
void buildSchedGraph(AAResults *AA, RegPressureTracker *RPTracker=nullptr, PressureDiffs *PDiffs=nullptr, LiveIntervals *LIS=nullptr, bool TrackLaneMasks=false)
Builds SUnits for the current region.
Definition ScheduleDAGInstrs.cpp:755

llvm::ScheduleDAGInstrs::SchedModel
TargetSchedModel SchedModel
TargetSchedModel provides an interface to the machine model.
Definition ScheduleDAGInstrs.h:122

llvm::ScheduleDAGInstrs::exitRegion
virtual void exitRegion()
Called when the scheduler has finished scheduling the current region.
Definition ScheduleDAGInstrs.cpp:208

llvm::ScheduleDAGInstrs::Uses
RegUnit2SUnitsMap Uses
Definition ScheduleDAGInstrs.h:168

llvm::ScheduleDAGInstrs::canAddEdge
bool canAddEdge(SUnit *SuccSU, SUnit *PredSU)
True if an edge can be added from PredSU to SuccSU without creating a cycle.
Definition ScheduleDAGInstrs.cpp:1235

llvm::ScheduleDAGInstrs::insertBarrierChain
void insertBarrierChain(Value2SUsMap &map)
Inserts a barrier chain in a huge region, far below current SU.
Definition ScheduleDAGInstrs.cpp:722

llvm::ScheduleDAGInstrs::MLI
const MachineLoopInfo * MLI
Definition ScheduleDAGInstrs.h:118

llvm::ScheduleDAGInstrs::RemoveKillFlags
bool RemoveKillFlags
True if the DAG builder should remove kill flags (in preparation for rescheduling).
Definition ScheduleDAGInstrs.h:126

llvm::ScheduleDAGInstrs::AAForDep
std::optional< BatchAAResults > AAForDep
Definition ScheduleDAGInstrs.h:177

llvm::ScheduleDAGInstrs::RegionBegin
MachineBasicBlock::iterator RegionBegin
The beginning of the range to be scheduled.
Definition ScheduleDAGInstrs.h:148

llvm::ScheduleDAGInstrs::addSchedBarrierDeps
void addSchedBarrierDeps()
Adds dependencies from instructions in the current list of instructions being scheduled to scheduling...
Definition ScheduleDAGInstrs.cpp:212

llvm::ScheduleDAGInstrs::enterRegion
virtual void enterRegion(MachineBasicBlock *bb, MachineBasicBlock::iterator begin, MachineBasicBlock::iterator end, unsigned regioninstrs)
Initialize the DAG and common scheduler state for a new scheduling region.
Definition ScheduleDAGInstrs.cpp:198

llvm::ScheduleDAGInstrs::dump
void dump() const override
Definition ScheduleDAGInstrs.cpp:1206

llvm::ScheduleDAGInstrs::addChainDependency
void addChainDependency(SUnit *SUa, SUnit *SUb, unsigned Latency=0)
Adds a chain edge between SUa and SUb, but only if both AAResults and Target fail to deny the depende...
Definition ScheduleDAGInstrs.cpp:572

llvm::ScheduleDAGInstrs::NumRegionInstrs
unsigned NumRegionInstrs
Instructions in this region (distance(RegionBegin, RegionEnd)).
Definition ScheduleDAGInstrs.h:154

llvm::ScheduleDAGInstrs::MFI
const MachineFrameInfo & MFI
Definition ScheduleDAGInstrs.h:119

llvm::ScheduleDAGInstrs::deadDefHasNoUse
bool deadDefHasNoUse(const MachineOperand &MO)
Returns true if the def register in MO has no uses.
Definition ScheduleDAGInstrs.cpp:412

llvm::ScheduleDAGInstrs::getGraphNodeLabel
std::string getGraphNodeLabel(const SUnit *SU) const override
Returns a label for a DAG node that points to an instruction.
Definition ScheduleDAGInstrs.cpp:1217

llvm::ScheduleDAG::MRI
MachineRegisterInfo & MRI
Virtual/real register map.
Definition ScheduleDAG.h:587

llvm::ScheduleDAG::clearDAG
void clearDAG()
Clears the DAG state (between regions).
Definition ScheduleDAG.cpp:63

llvm::ScheduleDAG::TII
const TargetInstrInfo * TII
Target instruction information.
Definition ScheduleDAG.h:584

llvm::ScheduleDAG::SUnits
std::vector< SUnit > SUnits
The scheduling units.
Definition ScheduleDAG.h:588

llvm::ScheduleDAG::TRI
const TargetRegisterInfo * TRI
Target processor register info.
Definition ScheduleDAG.h:585

llvm::ScheduleDAG::EntrySU
SUnit EntrySU
Special node for the region entry.
Definition ScheduleDAG.h:589

llvm::ScheduleDAG::MF
MachineFunction & MF
Machine function.
Definition ScheduleDAG.h:586

llvm::ScheduleDAG::ScheduleDAG
ScheduleDAG(const ScheduleDAG &)=delete

llvm::ScheduleDAG::dumpNodeAll
void dumpNodeAll(const SUnit &SU) const
Definition ScheduleDAG.cpp:365

llvm::ScheduleDAG::dumpNodeName
void dumpNodeName(const SUnit &SU) const
Definition ScheduleDAG.cpp:356

llvm::ScheduleDAG::ExitSU
SUnit ExitSU
Special node for the region exit.
Definition ScheduleDAG.h:590

llvm::SlotIndex
SlotIndex - An opaque wrapper around machine indexes.
Definition SlotIndexes.h:66

llvm::SmallVectorImpl
This class consists of common code factored out of the SmallVector class to reduce code duplication b...
Definition SmallVector.h:573

llvm::SmallVectorImpl::emplace_back
reference emplace_back(ArgTypes &&... Args)
Definition SmallVector.h:937

llvm::SmallVectorImpl::clear
void clear()
Definition SmallVector.h:610

llvm::SmallVectorTemplateBase::push_back
void push_back(const T &Elt)
Definition SmallVector.h:416

llvm::SmallVectorTemplateCommon::end
iterator end()
Definition SmallVector.h:272

llvm::SmallVector
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
Definition SmallVector.h:1196

llvm::SparseMultiSet< PhysRegSUOper, identity< unsigned >, uint16_t >::iterator
iterator_base< SparseMultiSet * > iterator
Definition SparseMultiSet.h:304

llvm::SparseMultiSet< PhysRegSUOper, identity< unsigned >, uint16_t >::RangePair
std::pair< iterator, iterator > RangePair
Definition SparseMultiSet.h:308

llvm::SparseSet
SparseSet - Fast set implementation for objects that can be identified by small unsigned keys.
Definition SparseSet.h:120

llvm::TargetInstrInfo
TargetInstrInfo - Interface to description of machine instruction set.
Definition TargetInstrInfo.h:114

llvm::TargetRegisterClass
Definition TargetRegisterInfo.h:45

llvm::TargetRegisterClass::HasDisjunctSubRegs
const bool HasDisjunctSubRegs
Whether the class supports two (or more) disjunct subregister indices.
Definition TargetRegisterInfo.h:65

llvm::TargetRegisterClass::getLaneMask
LaneBitmask getLaneMask() const
Returns the combination of all lane masks of registers in this class.
Definition TargetRegisterInfo.h:215

llvm::TargetSubtargetInfo
TargetSubtargetInfo - Generic base class for all target subtargets.
Definition TargetSubtargetInfo.h:65

llvm::Type
The instances of the Type class are immutable: once they are created, they are never changed.
Definition Type.h:45

llvm::UndefValue
'undef' values are things that do not have specified contents.
Definition Constants.h:1420

llvm::Use
A Use represents the edge between a Value definition and its users.
Definition Use.h:35

llvm::Value
LLVM Value Representation.
Definition Value.h:75

llvm::cl::opt
Definition CommandLine.h:1455

llvm::raw_ostream
This class implements an extremely fast bulk output stream that can only output to a stream.
Definition raw_ostream.h:53

llvm::raw_string_ostream
A raw_ostream that writes to an std::string.
Definition raw_ostream.h:662

iterator_range.h
This provides a very simple, boring adaptor for a begin and end iterator into a range type.

ErrorHandling.h

llvm_unreachable
#define llvm_unreachable(msg)
Marks that the current location is not supposed to be reachable.
Definition ErrorHandling.h:164

llvm::AA
Abstract Attribute helper functions.
Definition Attributor.h:165

llvm::CallingConv::C
@ C
The default llvm calling convention, compatible with C.
Definition CallingConv.h:34

llvm::cl::Hidden
@ Hidden
Definition CommandLine.h:139

llvm::cl::init
initializer< Ty > init(const Ty &Val)
Definition CommandLine.h:445

llvm
The top-level namespace that contains all LLVM classes, functions, and utilities.
Definition AddressRanges.h:18

llvm::drop_begin
auto drop_begin(T &&RangeOrContainer, size_t N=1)
Return a range covering RangeOrContainer with the first N elements excluded.
Definition STLExtras.h:316

llvm::size
auto size(R &&Range, std::enable_if_t< std::is_base_of< std::random_access_iterator_tag, typename std::iterator_traits< decltype(Range.begin())>::iterator_category >::value, void > *=nullptr)
Get the size of a range.
Definition STLExtras.h:1655

llvm::Latency
@ Latency
Definition SIMachineScheduler.h:34

llvm::Depth
@ Depth
Definition SIMachineScheduler.h:36

llvm::getUnderlyingObjectsForCodeGen
LLVM_ABI bool getUnderlyingObjectsForCodeGen(const Value *V, SmallVectorImpl< Value * > &Objects)
This is a wrapper around getUnderlyingObjects and adds support for basic ptrtoint+arithmetic+inttoptr sequences.
Definition ValueTracking.cpp:6845

llvm::make_range
iterator_range< T > make_range(T x, T y)
Convenience function for iterating over sub-ranges.
Definition iterator_range.h:70

llvm::reverse
auto reverse(ContainerTy &&C)
Definition STLExtras.h:406

llvm::get
decltype(auto) get(const PointerIntPair< PointerTy, IntBits, IntType, PtrTraits, Info > &Pair)
Definition PointerIntPair.h:268

llvm::sort
void sort(IteratorTy Start, IteratorTy End)
Definition STLExtras.h:1622

llvm::dbgs
LLVM_ABI raw_ostream & dbgs()
dbgs() - This returns a reference to a raw_ostream for debugging messages.
Definition Debug.cpp:207

llvm::MCRegUnit
unsigned MCRegUnit
Register units are used to compute register aliasing.
Definition MCRegister.h:30

llvm::skipDebugInstructionsBackward
IterT skipDebugInstructionsBackward(IterT It, IterT Begin, bool SkipPseudoOp=true)
Decrement It until it points to a non-debug instruction or to Begin and return the resulting iterator.
Definition MachineBasicBlock.h:1490

llvm::isa
bool isa(const From &Val)
isa<X> - Return true if the parameter to the template is an instance of one of the template type arguments.
Definition Casting.h:548

llvm::format
format_object< Ts... > format(const char *Fmt, const Ts &... Vals)
These are helper functions used to produce formatted output.
Definition Format.h:129

llvm::Key
LLVM_ATTRIBUTE_VISIBILITY_DEFAULT AnalysisKey InnerAnalysisManagerProxy< AnalysisManagerT, IRUnitT, ExtraArgTs... >::Key
Definition PassManager.h:668

llvm::UnderlyingObjectsVector
SmallVector< UnderlyingObject, 4 > UnderlyingObjectsVector
Definition ScheduleDAGInstrs.h:113

llvm::operator<<
raw_ostream & operator<<(raw_ostream &OS, const APFixedPoint &FX)
Definition APFixedPoint.h:312

llvm::cast
decltype(auto) cast(const From &Val)
cast<X> - Return the argument parameter cast to the specified type.
Definition Casting.h:560

llvm::ValueType
PointerUnion< const Value *, const PseudoSourceValue * > ValueType
Definition ScheduleDAGInstrs.h:103

llvm::isIdentifiedObject
LLVM_ABI bool isIdentifiedObject(const Value *V)
Return true if this pointer refers to a distinct and identifiable object.
Definition AliasAnalysis.cpp:837

llvm::printMBBReference
LLVM_ABI Printable printMBBReference(const MachineBasicBlock &MBB)
Prints a machine basic block reference.
Definition MachineBasicBlock.cpp:120

raw_ostream.h

N
#define N

llvm::ILPValue
Represent the ILP of the subDAG rooted at a DAG node.
Definition ScheduleDFS.h:34

llvm::ILPValue::Length
unsigned Length
Length may either correspond to depth or height, depending on direction, and cycles or nodes depending on context.
Definition ScheduleDFS.h:38

llvm::ILPValue::dump
void dump() const
Definition ScheduleDAGInstrs.cpp:1550

llvm::ILPValue::print
void print(raw_ostream &OS) const
Definition ScheduleDAGInstrs.cpp:1542

llvm::ILPValue::InstrCount
unsigned InstrCount
Definition ScheduleDFS.h:35

llvm::LaneBitmask
Definition LaneBitmask.h:40

llvm::LaneBitmask::getAll
static constexpr LaneBitmask getAll()
Definition LaneBitmask.h:82

llvm::LaneBitmask::any
constexpr bool any() const
Definition LaneBitmask.h:53

llvm::MCSchedClassDesc
Summarize the scheduling resources required for an instruction of a particular scheduling class.
Definition MCSchedule.h:123

llvm::MCWriteProcResEntry
Identify one of the processor resource kinds consumed by a particular scheduling class for the specified number of cycles.
Definition MCSchedule.h:68

llvm::PhysRegSUOper
Record a physical register access.
Definition ScheduleDAGInstrs.h:78

llvm::SmallMapVector
A MapVector that performs no allocations if smaller than a certain size.
Definition MapVector.h:257

llvm::UnderlyingObject
Definition ScheduleDAGInstrs.h:105

llvm::VReg2SUnitOperIdx
Mapping from virtual register to SUnit including an operand index.
Definition ScheduleDAGInstrs.h:68

llvm::VReg2SUnit
An individual mapping from virtual register number to SUnit.
Definition ScheduleDAGInstrs.h:54

llvm::cl::desc
Definition CommandLine.h:411