//===- HexagonSubtarget.cpp - Hexagon Subtarget Information ---------------===//
//
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//
//===----------------------------------------------------------------------===//
//
// This file implements the Hexagon specific subclass of TargetSubtarget.
//
//===----------------------------------------------------------------------===//

#include "HexagonSubtarget.h"
#include "Hexagon.h"
#include "HexagonInstrInfo.h"
#include "HexagonRegisterInfo.h"
#include "MCTargetDesc/HexagonMCTargetDesc.h"
#include "llvm/ADT/STLExtras.h"
#include "llvm/ADT/SmallSet.h"
#include "llvm/ADT/SmallVector.h"
#include "llvm/ADT/StringRef.h"
#include "llvm/CodeGen/MachineInstr.h"
#include "llvm/CodeGen/MachineOperand.h"
#include "llvm/CodeGen/MachineScheduler.h"
#include "llvm/CodeGen/ScheduleDAG.h"
#include "llvm/CodeGen/ScheduleDAGInstrs.h"
#include "llvm/IR/IntrinsicsHexagon.h"
#include "llvm/Support/CommandLine.h"
#include "llvm/Support/Debug.h"
#include "llvm/Target/TargetMachine.h"
#include <algorithm>
#include <cassert>
#include <map>
#include <optional>

using namespace llvm;

#define DEBUG_TYPE "hexagon-subtarget"

#define GET_SUBTARGETINFO_CTOR
#define GET_SUBTARGETINFO_TARGET_DESC
#include "HexagonGenSubtargetInfo.inc"

static cl::opt<bool> EnableBSBSched("enable-bsb-sched", cl::Hidden,
                                    cl::init(true));

static cl::opt<bool> EnableTCLatencySched("enable-tc-latency-sched", cl::Hidden,
                                          cl::init(false));

static cl::opt<bool>
    EnableDotCurSched("enable-cur-sched", cl::Hidden, cl::init(true),
                      cl::desc("Enable the scheduler to generate .cur"));

static cl::opt<bool>
    DisableHexagonMISched("disable-hexagon-misched", cl::Hidden,
                          cl::desc("Disable Hexagon MI Scheduling"));

static cl::opt<bool> OverrideLongCalls(
    "hexagon-long-calls", cl::Hidden,
    cl::desc("If present, forces/disables the use of long calls"));

static cl::opt<bool>
    EnablePredicatedCalls("hexagon-pred-calls", cl::Hidden,
                          cl::desc("Consider calls to be predicable"));

static cl::opt<bool> SchedPredsCloser("sched-preds-closer", cl::Hidden,
                                      cl::init(true));

static cl::opt<bool> SchedRetvalOptimization("sched-retval-optimization",
                                             cl::Hidden, cl::init(true));

static cl::opt<bool> EnableCheckBankConflict(
    "hexagon-check-bank-conflict", cl::Hidden, cl::init(true),
    cl::desc("Enable checking for cache bank conflicts"));

HexagonSubtarget::HexagonSubtarget(const Triple &TT, StringRef CPU,
                                   StringRef FS, const TargetMachine &TM)
    : HexagonGenSubtargetInfo(TT, CPU, /*TuneCPU*/ CPU, FS),
      OptLevel(TM.getOptLevel()),
      CPUString(std::string(Hexagon_MC::selectHexagonCPU(CPU))),
      TargetTriple(TT), InstrInfo(initializeSubtargetDependencies(CPU, FS)),
      RegInfo(getHwMode()), TLInfo(TM, *this),
      InstrItins(getInstrItineraryForCPU(CPUString)) {
  Hexagon_MC::addArchSubtarget(this, FS);
  // Beware of the default constructor of InstrItineraryData: it will
  // reset all members to 0.
  assert(InstrItins.Itineraries != nullptr && "InstrItins not initialized");
}

HexagonSubtarget &
HexagonSubtarget::initializeSubtargetDependencies(StringRef CPU, StringRef FS) {
  std::optional<Hexagon::ArchEnum> ArchVer = Hexagon::getCpu(CPUString);
  if (ArchVer)
    HexagonArchVersion = *ArchVer;
  else
    llvm_unreachable("Unrecognized Hexagon processor version");

  UseHVX128BOps = false;
  UseHVX64BOps = false;
  UseAudioOps = false;
  UseLongCalls = false;

  SubtargetFeatures Features(FS);

  // Turn on QFloat if the HVX version is v68+.
  // The function ParseSubtargetFeatures will set feature bits and initialize
  // subtarget's variables all in one, so there isn't a good way to preprocess
  // the feature string, other than by tinkering with it directly.
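  //
  // For example (hypothetical feature string): given FS = "+hvxv68",
  // no explicit "+hvx-qfloat" or "-hvx-qfloat" is present, so the code
  // below detects HVX version 68 and appends "+hvx-qfloat" before the
  // string is parsed.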
  auto IsQFloatFS = [](StringRef F) {
    return F == "+hvx-qfloat" || F == "-hvx-qfloat";
  };
  if (!llvm::count_if(Features.getFeatures(), IsQFloatFS)) {
    auto getHvxVersion = [&Features](StringRef FS) -> StringRef {
      for (StringRef F : llvm::reverse(Features.getFeatures())) {
        if (F.starts_with("+hvxv"))
          return F;
      }
      for (StringRef F : llvm::reverse(Features.getFeatures())) {
        if (F == "-hvx")
          return StringRef();
        if (F.starts_with("+hvx") || F == "-hvx")
          return F.take_front(4); // Return "+hvx" or "-hvx".
      }
      return StringRef();
    };

    bool AddQFloat = false;
    StringRef HvxVer = getHvxVersion(FS);
    if (HvxVer.starts_with("+hvxv")) {
      int Ver = 0;
      if (!HvxVer.drop_front(5).consumeInteger(10, Ver) && Ver >= 68)
        AddQFloat = true;
    } else if (HvxVer == "+hvx") {
      if (hasV68Ops())
        AddQFloat = true;
    }

    if (AddQFloat)
      Features.AddFeature("+hvx-qfloat");
  }

  std::string FeatureString = Features.getString();
  ParseSubtargetFeatures(CPUString, /*TuneCPU*/ CPUString, FeatureString);

  if (useHVXV68Ops())
    UseHVXFloatingPoint = UseHVXIEEEFPOps || UseHVXQFloatOps;

  if (UseHVXQFloatOps && UseHVXIEEEFPOps && UseHVXFloatingPoint)
    LLVM_DEBUG(
        dbgs() << "Behavior is undefined for simultaneous qfloat and ieee hvx codegen...");

  if (OverrideLongCalls.getPosition())
    UseLongCalls = OverrideLongCalls;

  UseBSBScheduling = hasV60Ops() && EnableBSBSched;

  if (isTinyCore()) {
    // Tiny core has a single thread, so back-to-back scheduling is enabled by
    // default.
    if (!EnableBSBSched.getPosition())
      UseBSBScheduling = false;
  }

  FeatureBitset FeatureBits = getFeatureBits();
  if (HexagonDisableDuplex)
    setFeatureBits(FeatureBits.reset(Hexagon::FeatureDuplex));
  setFeatureBits(Hexagon_MC::completeHVXFeatures(FeatureBits));

  return *this;
}

bool HexagonSubtarget::isHVXElementType(MVT Ty, bool IncludeBool) const {
  if (!useHVXOps())
    return false;
  if (Ty.isVector())
    Ty = Ty.getVectorElementType();
  if (IncludeBool && Ty == MVT::i1)
    return true;
  ArrayRef<MVT> ElemTypes = getHVXElementTypes();
  return llvm::is_contained(ElemTypes, Ty);
}

bool HexagonSubtarget::isHVXVectorType(EVT VecTy, bool IncludeBool) const {
  if (!VecTy.isSimple())
    return false;
  if (!VecTy.isVector() || !useHVXOps() || VecTy.isScalableVector())
    return false;
  MVT ElemTy = VecTy.getSimpleVT().getVectorElementType();
  if (!IncludeBool && ElemTy == MVT::i1)
    return false;

  unsigned HwLen = getVectorLength();
  unsigned NumElems = VecTy.getVectorNumElements();
  ArrayRef<MVT> ElemTypes = getHVXElementTypes();

  if (IncludeBool && ElemTy == MVT::i1) {
    // Boolean HVX vector types are formed from regular HVX vector types
    // by replacing the element type with i1.
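    // For example, with a 128-byte HVX vector length, v32i1 qualifies
    // because the corresponding regular type v32i32 spans 32 * 32 == 1024
    // bits, which equals 8 * HwLen.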
    for (MVT T : ElemTypes)
      if (NumElems * T.getSizeInBits() == 8 * HwLen)
        return true;
    return false;
  }

  unsigned VecWidth = VecTy.getSizeInBits();
  if (VecWidth != 8 * HwLen && VecWidth != 16 * HwLen)
    return false;
  return llvm::is_contained(ElemTypes, ElemTy);
}

bool HexagonSubtarget::isTypeForHVX(Type *VecTy, bool IncludeBool) const {
  if (!VecTy->isVectorTy() || isa<ScalableVectorType>(VecTy))
    return false;
  // Avoid types like <2 x i32*>.
  Type *ScalTy = VecTy->getScalarType();
  if (!ScalTy->isIntegerTy() &&
      !(ScalTy->isFloatingPointTy() && useHVXFloatingPoint()))
    return false;
  // The given type may be something like <17 x i32>, which is not MVT,
  // but can be represented as (non-simple) EVT.
  EVT Ty = EVT::getEVT(VecTy, /*HandleUnknown*/false);
  if (!Ty.getVectorElementType().isSimple())
    return false;

  auto isHvxTy = [this, IncludeBool](MVT SimpleTy) {
    if (isHVXVectorType(SimpleTy, IncludeBool))
      return true;
    auto Action = getTargetLowering()->getPreferredVectorAction(SimpleTy);
    return Action == TargetLoweringBase::TypeWidenVector;
  };

  // Round up EVT to have power-of-2 elements, and keep checking if it
  // qualifies for HVX, dividing it in half after each step.
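  // For example, <17 x i32> is first rounded up to <32 x i32>; if that is
  // not accepted, <16 x i32>, <8 x i32>, and so on are tried in turn.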
  MVT ElemTy = Ty.getVectorElementType().getSimpleVT();
  unsigned VecLen = PowerOf2Ceil(Ty.getVectorNumElements());
  while (VecLen > 1) {
    MVT SimpleTy = MVT::getVectorVT(ElemTy, VecLen);
    if (SimpleTy.isValid() && isHvxTy(SimpleTy))
      return true;
    VecLen /= 2;
  }

  return false;
}

void HexagonSubtarget::UsrOverflowMutation::apply(ScheduleDAGInstrs *DAG) {
  for (SUnit &SU : DAG->SUnits) {
    if (!SU.isInstr())
      continue;
    SmallVector<SDep, 4> Erase;
    for (auto &D : SU.Preds)
      if (D.getKind() == SDep::Output && D.getReg() == Hexagon::USR_OVF)
        Erase.push_back(D);
    for (auto &E : Erase)
      SU.removePred(E);
  }
}

void HexagonSubtarget::HVXMemLatencyMutation::apply(ScheduleDAGInstrs *DAG) {
  for (SUnit &SU : DAG->SUnits) {
    // Update the latency of chain edges between v60 vector load or store
    // instructions to be 1. These instructions cannot be scheduled in the
    // same packet.
    MachineInstr &MI1 = *SU.getInstr();
    auto *QII = static_cast<const HexagonInstrInfo*>(DAG->TII);
    bool IsStoreMI1 = MI1.mayStore();
    bool IsLoadMI1 = MI1.mayLoad();
    if (!QII->isHVXVec(MI1) || !(IsStoreMI1 || IsLoadMI1))
      continue;
    for (SDep &SI : SU.Succs) {
      if (SI.getKind() != SDep::Order || SI.getLatency() != 0)
        continue;
      MachineInstr &MI2 = *SI.getSUnit()->getInstr();
      if (!QII->isHVXVec(MI2))
        continue;
      if ((IsStoreMI1 && MI2.mayStore()) || (IsLoadMI1 && MI2.mayLoad())) {
        SI.setLatency(1);
        SU.setHeightDirty();
        // Change the dependence in the opposite direction too.
        for (SDep &PI : SI.getSUnit()->Preds) {
          if (PI.getSUnit() != &SU || PI.getKind() != SDep::Order)
            continue;
          PI.setLatency(1);
          SI.getSUnit()->setDepthDirty();
        }
      }
    }
  }
}

// Check if a call and subsequent A2_tfrpi instructions should maintain
// scheduling affinity. We are looking for the TFRI to be consumed in
// the next instruction. This should help reduce the instances of
// double register pairs being allocated and scheduled before a call
// when not used until after the call. This situation is exacerbated
// by the fact that we allocate the pair from the callee saves list,
// leading to excess spills and restores.
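//
// Schematically (hypothetical sequence), without the affinity edge the
// scheduler may produce
//   %d1 = A2_tfrpi 0     ; pair is live across the call
//   call foo
//   ... use of %d1
// whereas keeping the TFRI next to its consumer avoids tying up a
// callee-saved pair across the call.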
bool HexagonSubtarget::CallMutation::shouldTFRICallBind(
      const HexagonInstrInfo &HII, const SUnit &Inst1,
      const SUnit &Inst2) const {
  if (Inst1.getInstr()->getOpcode() != Hexagon::A2_tfrpi)
    return false;

  // TypeXTYPE are 64 bit operations.
  unsigned Type = HII.getType(*Inst2.getInstr());
  return Type == HexagonII::TypeS_2op || Type == HexagonII::TypeS_3op ||
         Type == HexagonII::TypeALU64 || Type == HexagonII::TypeM;
}

void HexagonSubtarget::CallMutation::apply(ScheduleDAGInstrs *DAGInstrs) {
  ScheduleDAGMI *DAG = static_cast<ScheduleDAGMI*>(DAGInstrs);
  SUnit* LastSequentialCall = nullptr;
  // Map from virtual register to physical register from the copy.
  DenseMap<unsigned, unsigned> VRegHoldingReg;
  // Map from the physical register to the instruction that uses virtual
  // register. This is used to create the barrier edge.
  DenseMap<unsigned, SUnit *> LastVRegUse;
  auto &TRI = *DAG->MF.getSubtarget().getRegisterInfo();
  auto &HII = *DAG->MF.getSubtarget<HexagonSubtarget>().getInstrInfo();

  // Currently we only catch the situation when a compare gets scheduled
  // before the preceding call.
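  // For instance (schematic): after
  //   call foo
  //   p0 = cmp.eq(r0, #0)
  // the Barrier edge added below pins the compare after the call, so the
  // scheduler cannot hoist it above the call.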
  for (unsigned su = 0, e = DAG->SUnits.size(); su != e; ++su) {
    // Remember the call.
    if (DAG->SUnits[su].getInstr()->isCall())
      LastSequentialCall = &DAG->SUnits[su];
    // Look for a compare that defines a predicate.
    else if (DAG->SUnits[su].getInstr()->isCompare() && LastSequentialCall)
      DAG->addEdge(&DAG->SUnits[su], SDep(LastSequentialCall, SDep::Barrier));
    // Look for call and tfri* instructions.
    else if (SchedPredsCloser && LastSequentialCall && su > 1 && su < e-1 &&
             shouldTFRICallBind(HII, DAG->SUnits[su], DAG->SUnits[su+1]))
      DAG->addEdge(&DAG->SUnits[su], SDep(&DAG->SUnits[su-1], SDep::Barrier));
    // Prevent redundant register copies due to reads and writes of physical
    // registers. The original motivation for this was the code generated
    // between two calls, which is caused by both the return value and the
    // argument for the next call being in %r0.
    // Example:
    //   1: <call1>
    //   2: %vreg = COPY %r0
    //   3: <use of %vreg>
    //   4: %r0 = ...
    //   5: <call2>
    // The scheduler would often swap 3 and 4, so an additional register is
    // needed. This code inserts a Barrier dependence between 3 and 4 to
    // prevent this.
    // The code below checks for all the physical registers, not just R0/D0/V0.
    else if (SchedRetvalOptimization) {
      const MachineInstr *MI = DAG->SUnits[su].getInstr();
      if (MI->isCopy() && MI->getOperand(1).getReg().isPhysical()) {
        // %vregX = COPY %r0
        VRegHoldingReg[MI->getOperand(0).getReg()] = MI->getOperand(1).getReg();
        LastVRegUse.erase(MI->getOperand(1).getReg());
      } else {
        for (const MachineOperand &MO : MI->operands()) {
          if (!MO.isReg())
            continue;
          if (MO.isUse() && !MI->isCopy() &&
              VRegHoldingReg.count(MO.getReg())) {
            // <use of %vregX>
            LastVRegUse[VRegHoldingReg[MO.getReg()]] = &DAG->SUnits[su];
          } else if (MO.isDef() && MO.getReg().isPhysical()) {
            for (MCRegAliasIterator AI(MO.getReg(), &TRI, true); AI.isValid();
                 ++AI) {
              if (LastVRegUse.count(*AI) &&
                  LastVRegUse[*AI] != &DAG->SUnits[su])
                // %r0 = ...
                DAG->addEdge(&DAG->SUnits[su], SDep(LastVRegUse[*AI], SDep::Barrier));
              LastVRegUse.erase(*AI);
            }
          }
        }
      }
    }
  }
}

void HexagonSubtarget::BankConflictMutation::apply(ScheduleDAGInstrs *DAG) {
  if (!EnableCheckBankConflict)
    return;

  const auto &HII = static_cast<const HexagonInstrInfo&>(*DAG->TII);

  // Create artificial edges between loads that could likely cause a bank
  // conflict. Since such loads would normally not have any dependency
  // between them, we cannot rely on existing edges.
  for (unsigned i = 0, e = DAG->SUnits.size(); i != e; ++i) {
    SUnit &S0 = DAG->SUnits[i];
    MachineInstr &L0 = *S0.getInstr();
    if (!L0.mayLoad() || L0.mayStore() ||
        HII.getAddrMode(L0) != HexagonII::BaseImmOffset)
      continue;
    int64_t Offset0;
    LocationSize Size0 = 0;
    MachineOperand *BaseOp0 = HII.getBaseAndOffset(L0, Offset0, Size0);
    // If the access size is longer than the L1 cache line, skip the check.
    if (BaseOp0 == nullptr || !BaseOp0->isReg() || !Size0.hasValue() ||
        Size0.getValue() >= 32)
      continue;
    // Scan only up to 32 instructions ahead (to avoid n^2 complexity).
    for (unsigned j = i+1, m = std::min(i+32, e); j != m; ++j) {
      SUnit &S1 = DAG->SUnits[j];
      MachineInstr &L1 = *S1.getInstr();
      if (!L1.mayLoad() || L1.mayStore() ||
          HII.getAddrMode(L1) != HexagonII::BaseImmOffset)
        continue;
      int64_t Offset1;
      LocationSize Size1 = 0;
      MachineOperand *BaseOp1 = HII.getBaseAndOffset(L1, Offset1, Size1);
      if (BaseOp1 == nullptr || !BaseOp1->isReg() || !Size1.hasValue() ||
          Size1.getValue() >= 32 || BaseOp0->getReg() != BaseOp1->getReg())
        continue;
      // Check bits 3 and 4 of the offset: if they differ, a bank conflict
      // is unlikely.
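      // Worked example: Offset0 = 0, Offset1 = 8 gives (0 ^ 8) & 0x18 = 0x08,
      // so the bank bits differ and the pair is skipped; Offset0 = 0,
      // Offset1 = 32 gives (0 ^ 32) & 0x18 = 0, so the loads fall into the
      // same bank and an artificial edge is added below.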
      if (((Offset0 ^ Offset1) & 0x18) != 0)
        continue;
      // Bits 3 and 4 are the same, add an artificial edge and set extra
      // latency.
      SDep A(&S0, SDep::Artificial);
      A.setLatency(1);
      S1.addPred(A, true);
    }
  }
}

/// Enable use of alias analysis during code generation (during MI
/// scheduling, DAGCombine, etc.).
bool HexagonSubtarget::useAA() const {
  if (OptLevel != CodeGenOptLevel::None)
    return true;
  return false;
}

/// Perform target specific adjustments to the latency of a schedule
/// dependency.
void HexagonSubtarget::adjustSchedDependency(
    SUnit *Src, int SrcOpIdx, SUnit *Dst, int DstOpIdx, SDep &Dep,
    const TargetSchedModel *SchedModel) const {
  if (!Src->isInstr() || !Dst->isInstr())
    return;

  MachineInstr *SrcInst = Src->getInstr();
  MachineInstr *DstInst = Dst->getInstr();
  const HexagonInstrInfo *QII = getInstrInfo();

  // Instructions with .new operands have zero latency.
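  // Schematically (illustrative assembly), a packet such as
  //   { r0 = add(r1, r2); memw(r3) = r0.new }
  // forwards the freshly produced r0 to the store in the same cycle.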
  SmallSet<SUnit *, 4> ExclSrc;
  SmallSet<SUnit *, 4> ExclDst;
  if (QII->canExecuteInBundle(*SrcInst, *DstInst) &&
      isBestZeroLatency(Src, Dst, QII, ExclSrc, ExclDst)) {
    Dep.setLatency(0);
    return;
  }

  // Set the latency for a copy to zero since we hope that it will get
  // removed.
  if (DstInst->isCopy())
    Dep.setLatency(0);

  // If it's a REG_SEQUENCE/COPY, use its destination instruction to determine
  // the correct latency.
  // If there are multiple uses of the def of COPY/REG_SEQUENCE, set the
  // latency only if the latencies on all the uses are equal, otherwise set it
  // to default.
  if ((DstInst->isRegSequence() || DstInst->isCopy())) {
    Register DReg = DstInst->getOperand(0).getReg();
    std::optional<unsigned> DLatency;
    for (const auto &DDep : Dst->Succs) {
      MachineInstr *DDst = DDep.getSUnit()->getInstr();
      int UseIdx = -1;
      for (unsigned OpNum = 0; OpNum < DDst->getNumOperands(); OpNum++) {
        const MachineOperand &MO = DDst->getOperand(OpNum);
        if (MO.isReg() && MO.getReg() && MO.isUse() && MO.getReg() == DReg) {
          UseIdx = OpNum;
          break;
        }
      }

      if (UseIdx == -1)
        continue;

      std::optional<unsigned> Latency =
          InstrInfo.getOperandLatency(&InstrItins, *SrcInst, 0, *DDst, UseIdx);

      // Set DLatency for the first time.
      if (!DLatency)
        DLatency = Latency;

      // For multiple uses, if the Latency is different across uses, reset
      // DLatency.
      if (DLatency != Latency) {
        DLatency = std::nullopt;
        break;
      }
    }
    Dep.setLatency(DLatency ? *DLatency : 0);
  }

  // Try to schedule uses near definitions to generate .cur.
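  // A .cur use reads an HVX load's result in the same packet, e.g.
  // (schematic)
  //   { v0.cur = vmem(r0 + #0); v1 = vand(v0, v2) }
  // so giving the edge zero latency encourages the scheduler to place the
  // load next to its first use.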
  ExclSrc.clear();
  ExclDst.clear();
  if (EnableDotCurSched && QII->isToBeScheduledASAP(*SrcInst, *DstInst) &&
      isBestZeroLatency(Src, Dst, QII, ExclSrc, ExclDst)) {
    Dep.setLatency(0);
    return;
  }
  int Latency = Dep.getLatency();
  bool IsArtificial = Dep.isArtificial();
  Latency = updateLatency(*SrcInst, *DstInst, IsArtificial, Latency);
  Dep.setLatency(Latency);
}

void HexagonSubtarget::getPostRAMutations(
    std::vector<std::unique_ptr<ScheduleDAGMutation>> &Mutations) const {
  Mutations.push_back(std::make_unique<UsrOverflowMutation>());
  Mutations.push_back(std::make_unique<HVXMemLatencyMutation>());
  Mutations.push_back(std::make_unique<BankConflictMutation>());
}

void HexagonSubtarget::getSMSMutations(
    std::vector<std::unique_ptr<ScheduleDAGMutation>> &Mutations) const {
  Mutations.push_back(std::make_unique<UsrOverflowMutation>());
  Mutations.push_back(std::make_unique<HVXMemLatencyMutation>());
}

// Pin the vtable to this file.
void HexagonSubtarget::anchor() {}

bool HexagonSubtarget::enableMachineScheduler() const {
  if (DisableHexagonMISched.getNumOccurrences())
    return !DisableHexagonMISched;
  return true;
}

bool HexagonSubtarget::usePredicatedCalls() const {
  return EnablePredicatedCalls;
}

int HexagonSubtarget::updateLatency(MachineInstr &SrcInst,
                                    MachineInstr &DstInst, bool IsArtificial,
                                    int Latency) const {
  if (IsArtificial)
    return 1;
  if (!hasV60Ops())
    return Latency;

  auto &QII = static_cast<const HexagonInstrInfo &>(*getInstrInfo());
  // BSB scheduling.
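  // Under Back-Skip-Back scheduling the effective latency is halved,
  // rounding up: e.g. 3 cycles become 2, and 2 cycles become 1.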
  if (QII.isHVXVec(SrcInst) || useBSBScheduling())
    Latency = (Latency + 1) >> 1;
  return Latency;
}

void HexagonSubtarget::restoreLatency(SUnit *Src, SUnit *Dst) const {
  MachineInstr *SrcI = Src->getInstr();
  for (auto &I : Src->Succs) {
    if (!I.isAssignedRegDep() || I.getSUnit() != Dst)
      continue;
    Register DepR = I.getReg();
    int DefIdx = -1;
    for (unsigned OpNum = 0; OpNum < SrcI->getNumOperands(); OpNum++) {
      const MachineOperand &MO = SrcI->getOperand(OpNum);
      bool IsSameOrSubReg = false;
      if (MO.isReg()) {
        Register MOReg = MO.getReg();
        if (DepR.isVirtual()) {
          IsSameOrSubReg = (MOReg == DepR);
        } else {
          IsSameOrSubReg = getRegisterInfo()->isSubRegisterEq(DepR, MOReg);
        }
        if (MO.isDef() && IsSameOrSubReg)
          DefIdx = OpNum;
      }
    }
    assert(DefIdx >= 0 && "Def Reg not found in Src MI");
    MachineInstr *DstI = Dst->getInstr();
    SDep T = I;
    for (unsigned OpNum = 0; OpNum < DstI->getNumOperands(); OpNum++) {
      const MachineOperand &MO = DstI->getOperand(OpNum);
      if (MO.isReg() && MO.isUse() && MO.getReg() == DepR) {
        std::optional<unsigned> Latency = InstrInfo.getOperandLatency(
            &InstrItins, *SrcI, DefIdx, *DstI, OpNum);

        // For some instructions (e.g. COPY), there may be no latency at all
        // as they don't have any itinerary class associated with them.
        if (!Latency)
          Latency = 0;
        bool IsArtificial = I.isArtificial();
        Latency = updateLatency(*SrcI, *DstI, IsArtificial, *Latency);
        I.setLatency(*Latency);
      }
    }

    // Update the latency of opposite edge too.
    T.setSUnit(Src);
    auto F = find(Dst->Preds, T);
    assert(F != Dst->Preds.end());
    F->setLatency(I.getLatency());
  }
}

/// Change the latency between the two SUnits.
void HexagonSubtarget::changeLatency(SUnit *Src, SUnit *Dst, unsigned Lat)
      const {
  for (auto &I : Src->Succs) {
    if (!I.isAssignedRegDep() || I.getSUnit() != Dst)
      continue;
    SDep T = I;
    I.setLatency(Lat);

    // Update the latency of opposite edge too.
    T.setSUnit(Src);
    auto F = find(Dst->Preds, T);
    assert(F != Dst->Preds.end());
    F->setLatency(Lat);
  }
}

/// If the SUnit has a zero latency edge, return the other SUnit.
static SUnit *getZeroLatency(SUnit *N, SmallVector<SDep, 4> &Deps) {
  for (auto &I : Deps)
    if (I.isAssignedRegDep() && I.getLatency() == 0 &&
        !I.getSUnit()->getInstr()->isPseudo())
      return I.getSUnit();
  return nullptr;
}

// Return true if these are the best two instructions to schedule
// together with a zero latency. Only one dependence should have a zero
// latency. If there are multiple choices, choose the best, and change
// the others, if needed.
bool HexagonSubtarget::isBestZeroLatency(SUnit *Src, SUnit *Dst,
      const HexagonInstrInfo *TII, SmallSet<SUnit*, 4> &ExclSrc,
      SmallSet<SUnit*, 4> &ExclDst) const {
  MachineInstr &SrcInst = *Src->getInstr();
  MachineInstr &DstInst = *Dst->getInstr();

  // Ignore Boundary SU nodes as these have null instructions.
  if (Dst->isBoundaryNode())
    return false;

  if (SrcInst.isPHI() || DstInst.isPHI())
    return false;

  if (!TII->isToBeScheduledASAP(SrcInst, DstInst) &&
      !TII->canExecuteInBundle(SrcInst, DstInst))
    return false;

  // The architecture doesn't allow three dependent instructions in the same
  // packet. So, if the destination has a zero latency successor, then it's
  // not a candidate for a zero latency predecessor.
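  // In other words, if an edge Dst -> Y with zero latency already exists,
  // do not also give Src -> Dst zero latency.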
  if (getZeroLatency(Dst, Dst->Succs) != nullptr)
    return false;

  // Check if the Dst instruction is the best candidate first.
  SUnit *Best = nullptr;
  SUnit *DstBest = nullptr;
  SUnit *SrcBest = getZeroLatency(Dst, Dst->Preds);
  if (SrcBest == nullptr || Src->NodeNum >= SrcBest->NodeNum) {
    // Check that Src doesn't have a better candidate.
    DstBest = getZeroLatency(Src, Src->Succs);
    if (DstBest == nullptr || Dst->NodeNum <= DstBest->NodeNum)
      Best = Dst;
  }
  if (Best != Dst)
    return false;

  // The caller frequently adds the same dependence twice. If so, then
  // return true for this case too.
  if ((Src == SrcBest && Dst == DstBest) ||
      (SrcBest == nullptr && Dst == DstBest) ||
      (Src == SrcBest && DstBest == nullptr))
    return true;

  // Reassign the latency for the previous bests, which requires setting
  // the dependence edge in both directions.
  if (SrcBest != nullptr) {
    if (!hasV60Ops())
      changeLatency(SrcBest, Dst, 1);
    else
      restoreLatency(SrcBest, Dst);
  }
  if (DstBest != nullptr) {
    if (!hasV60Ops())
      changeLatency(Src, DstBest, 1);
    else
      restoreLatency(Src, DstBest);
  }

  // Attempt to find another opportunity for zero latency in a different
  // dependence.
  if (SrcBest && DstBest)
    // If there is an edge from SrcBest to DstBest, then try to change that
    // to 0 now.
    changeLatency(SrcBest, DstBest, 0);
  else if (DstBest) {
    // Check if the previous best destination instruction has a new zero
    // latency dependence opportunity.
    ExclSrc.insert(Src);
    for (auto &I : DstBest->Preds)
      if (ExclSrc.count(I.getSUnit()) == 0 &&
          isBestZeroLatency(I.getSUnit(), DstBest, TII, ExclSrc, ExclDst))
        changeLatency(I.getSUnit(), DstBest, 0);
  } else if (SrcBest) {
    // Check if previous best source instruction has a new zero latency
    // dependence opportunity.
    ExclDst.insert(Dst);
    for (auto &I : SrcBest->Succs)
      if (ExclDst.count(I.getSUnit()) == 0 &&
          isBestZeroLatency(SrcBest, I.getSUnit(), TII, ExclSrc, ExclDst))
        changeLatency(SrcBest, I.getSUnit(), 0);
  }

  return true;
}

unsigned HexagonSubtarget::getL1CacheLineSize() const {
  return 32;
}

unsigned HexagonSubtarget::getL1PrefetchDistance() const {
  return 32;
}

bool HexagonSubtarget::enableSubRegLiveness() const { return true; }

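// Map a machine opcode to its corresponding Hexagon intrinsic ID, using the
// TableGen-erated opcode-to-intrinsic tables below; for HVX opcodes the
// result depends on the configured vector length (64 or 128 bytes).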
Intrinsic::ID HexagonSubtarget::getIntrinsicId(unsigned Opc) const {
  struct Scalar {
    unsigned Opcode;
    Intrinsic::ID IntId;
  };
  struct Hvx {
    unsigned Opcode;
    Intrinsic::ID Int64Id, Int128Id;
  };

  static Scalar ScalarInts[] = {
#define GET_SCALAR_INTRINSICS
#include "HexagonDepMapAsm2Intrin.inc"
#undef GET_SCALAR_INTRINSICS
  };

  static Hvx HvxInts[] = {
#define GET_HVX_INTRINSICS
#include "HexagonDepMapAsm2Intrin.inc"
#undef GET_HVX_INTRINSICS
  };

  const auto CmpOpcode = [](auto A, auto B) { return A.Opcode < B.Opcode; };
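  // The comma expressions sort the tables exactly once, on the first call,
  // as a side effect of initializing function-local statics; the sorted
  // order is what makes the std::lower_bound searches below valid.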
  [[maybe_unused]] static bool SortedScalar =
      (llvm::sort(ScalarInts, CmpOpcode), true);
  [[maybe_unused]] static bool SortedHvx =
      (llvm::sort(HvxInts, CmpOpcode), true);

  auto [BS, ES] = std::make_pair(std::begin(ScalarInts), std::end(ScalarInts));
  auto [BH, EH] = std::make_pair(std::begin(HvxInts), std::end(HvxInts));

  auto FoundScalar = std::lower_bound(BS, ES, Scalar{Opc, 0}, CmpOpcode);
  if (FoundScalar != ES && FoundScalar->Opcode == Opc)
    return FoundScalar->IntId;

  auto FoundHvx = std::lower_bound(BH, EH, Hvx{Opc, 0, 0}, CmpOpcode);
  if (FoundHvx != EH && FoundHvx->Opcode == Opc) {
    unsigned HwLen = getVectorLength();
    if (HwLen == 64)
      return FoundHvx->Int64Id;
    if (HwLen == 128)
      return FoundHvx->Int128Id;
  }

  std::string error = "Invalid opcode (" + std::to_string(Opc) + ")";
  llvm_unreachable(error.c_str());
  return 0;
}