doxygen/LSUnit_8h_source.html

//===------------------------- LSUnit.h --------------------------*- C++-*-===//

//

// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.

// See https://llvm.org/LICENSE.txt for license information.

// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception

//

//===----------------------------------------------------------------------===//

/// \file

///

/// A Load/Store unit class that models load/store queues and that implements

/// a simple weak memory consistency model.

///

//===----------------------------------------------------------------------===//


#ifndef LLVM_MCA_HARDWAREUNITS_LSUNIT_H

#define LLVM_MCA_HARDWAREUNITS_LSUNIT_H


#include "llvm/ADT/DenseMap.h"

#include "llvm/ADT/SmallVector.h"

#include "llvm/MC/MCSchedule.h"

#include "llvm/MCA/HardwareUnits/HardwareUnit.h"

#include "llvm/MCA/Instruction.h"


namespace llvm {

namespace mca {


/// Abstract base interface for LS (load/store) units in llvm-mca.

class LSUnitBase : public HardwareUnit {
  /// Load queue size.
  ///
  /// A value of zero for this field means that the load queue is unbounded.
  /// Processor models can declare the size of a load queue via tablegen (see
  /// the definition of tablegen class LoadQueue in
  /// llvm/Target/TargetSchedule.td).
  unsigned LQSize;

  /// Store queue size.
  ///
  /// A value of zero for this field means that the store queue is unbounded.
  /// Processor models can declare the size of a store queue via tablegen (see
  /// the definition of tablegen class StoreQueue in
  /// llvm/Target/TargetSchedule.td).
  unsigned SQSize;

  /// Number of load queue entries currently acquired (see acquireLQSlot() and
  /// releaseLQSlot()).
  unsigned UsedLQEntries;

  /// Number of store queue entries currently acquired (see acquireSQSlot() and
  /// releaseSQSlot()).
  unsigned UsedSQEntries;

  /// True if loads don't alias with stores.
  ///
  /// By default, the LS unit assumes that loads and stores don't alias with
  /// each other. If this field is set to false, then loads are always assumed
  /// to alias with stores.
  const bool NoAlias;

public:
  LSUnitBase(const MCSchedModel &SM, unsigned LoadQueueSize,
             unsigned StoreQueueSize, bool AssumeNoAlias);

  virtual ~LSUnitBase();

  /// Returns the total number of entries in the load queue.
  unsigned getLoadQueueSize() const { return LQSize; }

  /// Returns the total number of entries in the store queue.
  unsigned getStoreQueueSize() const { return SQSize; }

  /// Returns the number of load queue entries currently in use.
  unsigned getUsedLQEntries() const { return UsedLQEntries; }

  /// Returns the number of store queue entries currently in use.
  unsigned getUsedSQEntries() const { return UsedSQEntries; }

  /// Reserves one entry in the load queue.
  void acquireLQSlot() { ++UsedLQEntries; }

  /// Reserves one entry in the store queue.
  void acquireSQSlot() { ++UsedSQEntries; }

  /// Frees one entry in the load queue.
  ///
  /// The counter is unsigned: an unbalanced release would wrap around and
  /// silently corrupt every subsequent "full"/"empty" query, so catch it here.
  void releaseLQSlot() {
    assert(UsedLQEntries && "Releasing a load queue slot that is not in use!");
    --UsedLQEntries;
  }

  /// Frees one entry in the store queue.
  ///
  /// See releaseLQSlot() for why the underflow check is needed.
  void releaseSQSlot() {
    assert(UsedSQEntries && "Releasing a store queue slot that is not in use!");
    --UsedSQEntries;
  }

  /// Returns the value of the `NoAlias` flag set at construction time.
  bool assumeNoAlias() const { return NoAlias; }

  /// Result of an availability query (see isAvailable()).
  enum Status {
    LSU_AVAILABLE = 0,
    LSU_LQUEUE_FULL, // Load Queue unavailable
    LSU_SQUEUE_FULL  // Store Queue unavailable
  };

  /// This method checks the availability of the load/store buffers.
  ///
  /// Returns LSU_AVAILABLE if there are enough load/store queue entries to
  /// accommodate instruction IR. By default, LSU_AVAILABLE is returned if IR is
  /// not a memory operation.
  virtual Status isAvailable(const InstRef &IR) const = 0;

  /// Allocates LS resources for instruction IR.
  ///
  /// This method assumes that a previous call to `isAvailable(IR)` succeeded
  /// with a LSUnitBase::Status value of LSU_AVAILABLE.
  /// Returns the GroupID associated with this instruction. That value will be
  /// used to set the LSUTokenID field in class Instruction.
  virtual unsigned dispatch(const InstRef &IR) = 0;

  /// Returns true if no store queue entry is currently in use.
  bool isSQEmpty() const { return !UsedSQEntries; }

  /// Returns true if no load queue entry is currently in use.
  bool isLQEmpty() const { return !UsedLQEntries; }

  /// Returns true if the store queue is bounded (non-zero size) and every
  /// entry is in use. An unbounded queue is never full.
  bool isSQFull() const { return SQSize && SQSize == UsedSQEntries; }

  /// Returns true if the load queue is bounded (non-zero size) and every
  /// entry is in use. An unbounded queue is never full.
  bool isLQFull() const { return LQSize && LQSize == UsedLQEntries; }

  /// Check if a previously dispatched instruction IR is now ready for
  /// execution.
  virtual bool isReady(const InstRef &IR) const = 0;

  /// Check if instruction IR only depends on memory instructions that are
  /// currently executing.
  virtual bool isPending(const InstRef &IR) const = 0;

  /// Check if instruction IR is still waiting on memory operations, and the
  /// wait time is still unknown.
  virtual bool isWaiting(const InstRef &IR) const = 0;

  virtual bool hasDependentUsers(const InstRef &IR) const = 0;

  virtual const CriticalDependency getCriticalPredecessor(unsigned GroupId) = 0;

  virtual void onInstructionExecuted(const InstRef &IR) = 0;

  // Loads are tracked by the LDQ (load queue) from dispatch until completion.
  // Stores are tracked by the STQ (store queue) from dispatch until commitment.
  // By default we conservatively assume that the LDQ receives a load at
  // dispatch. Loads leave the LDQ at retirement stage.
  virtual void onInstructionRetired(const InstRef &IR) = 0;

  virtual void onInstructionIssued(const InstRef &IR) = 0;

  virtual void cycleEvent() = 0;

#ifndef NDEBUG
  virtual void dump() const = 0;
#endif
};


/// Default Load/Store Unit (LS Unit) for simulated processors.

///

/// Each load (or store) consumes one entry in the load (or store) queue.

///

/// Rules are:

/// 1) A younger load is allowed to pass an older load only if there are no

///    stores nor barriers in between the two loads.

/// 2) A younger store is not allowed to pass an older store.

/// 3) A younger store is not allowed to pass an older load.

/// 4) A younger load is allowed to pass an older store only if the load does

///    not alias with the store.

///

/// This class optimistically assumes that loads don't alias store operations.

/// Under this assumption, younger loads are always allowed to pass older

/// stores (this only affects rule 4).

/// Essentially, this class doesn't perform any sort of alias analysis to

/// identify aliasing loads and stores.

///

/// To enforce aliasing between loads and stores, flag `AssumeNoAlias` must be

/// set to `false` by the constructor of LSUnit.

///

/// Note that this class doesn't know about the existence of different memory

/// types for memory operations (example: write-through, write-combining, etc.).

/// Derived classes are responsible for implementing that extra knowledge, and

/// provide different sets of rules for loads and stores by overriding method

/// `isReady()`.

/// To emulate a write-combining memory type, rule 2. must be relaxed in a

/// derived class to enable the reordering of non-aliasing store operations.

///

/// No assumptions are made by this class on the size of the store buffer.  This

/// class doesn't know how to identify cases where store-to-load forwarding may

/// occur.

///

/// LSUnit doesn't attempt to predict whether a load or store hits or misses

/// the L1 cache. To be more specific, LSUnit doesn't know anything about

/// cache hierarchy and memory types.

/// It only knows if an instruction "mayLoad" and/or "mayStore". For loads, the

/// scheduling model provides an "optimistic" load-to-use latency (which usually

/// matches the load-to-use latency for when there is a hit in the L1D).

/// Derived classes may expand this knowledge.

///

/// Class MCInstrDesc in LLVM doesn't know about serializing operations, nor

/// memory-barrier like instructions.

/// LSUnit conservatively assumes that an instruction which `mayLoad` and has

/// `unmodeled side effects` behaves like a "soft" load-barrier. That means, it

/// serializes loads without forcing a flush of the load queue.

/// Similarly, instructions that both `mayStore` and have `unmodeled side

/// effects` are treated like store barriers. A full memory

/// barrier is a 'mayLoad' and 'mayStore' instruction with unmodeled side

/// effects. This is obviously inaccurate, but this is the best that we can do

/// at the moment.

///

/// Each load/store barrier consumes one entry in the load/store queue. A

/// load/store barrier enforces ordering of loads/stores:

///  - A younger load cannot pass a load barrier.

///  - A younger store cannot pass a store barrier.

///

/// A younger load has to wait for the memory load barrier to execute.

/// A load/store barrier is "executed" when it becomes the oldest entry in

/// the load/store queue(s). That also means, all the older loads/stores have

/// already been executed.

class LSUnit : public LSUnitBase {


  // This class doesn't know about the latency of a load instruction. So, it

  // conservatively/pessimistically assumes that the latency of a load opcode

  // matches the instruction latency.

  //

  // FIXME: In the absence of cache misses (i.e. L1I/L1D/iTLB/dTLB hits/misses),

  // and load/store conflicts, the latency of a load is determined by the depth

  // of the load pipeline. So, we could use field `LoadLatency` in the

  // MCSchedModel to model that latency.

  // Field `LoadLatency` often matches the so-called 'load-to-use' latency from

  // L1D, and it usually already accounts for any extra latency due to data

  // forwarding.

  // When doing throughput analysis, `LoadLatency` is likely to

  // be a better predictor of load latency than instruction latency. This is

  // particularly true when simulating code with temporal/spatial locality of

  // memory accesses.

  // Using `LoadLatency` (instead of the instruction latency) is also expected

  // to improve the load queue allocation for long latency instructions with

  // folded memory operands (See PR39829).

  //

  // FIXME: On some processors, load/store operations are split into multiple

  // uOps. For example, X86 AMD Jaguar natively supports 128-bit data types, but

  // not 256-bit data types. So, a 256-bit load is effectively split into two

  // 128-bit loads, and each split load consumes one 'LoadQueue' entry. For

  // simplicity, this class optimistically assumes that a load instruction only

  // consumes one entry in the LoadQueue.  Similarly, store instructions only

  // consume a single entry in the StoreQueue.

  // In future, we should reassess the quality of this design, and consider

  // alternative approaches that let instructions specify the number of

  // load/store queue entries which they consume at dispatch stage (See

  // PR39830).

  //

  // An instruction that both 'mayStore' and 'HasUnmodeledSideEffects' is

  // conservatively treated as a store barrier. It forces older store to be

  // executed before newer stores are issued.

  //

  // An instruction that both 'MayLoad' and 'HasUnmodeledSideEffects' is

  // conservatively treated as a load barrier. It forces older loads to execute

  // before newer loads are issued.


protected:

  /// A node of a memory dependency graph. A MemoryGroup describes a set of

  /// instructions with same memory dependencies.

  ///

  /// By construction, instructions of a MemoryGroup don't depend on each other.

  /// At dispatch stage, instructions are mapped by the LSUnit to MemoryGroups.

  /// A Memory group identifier is then stored as a "token" in field

  /// Instruction::LSUTokenID of each dispatched instructions. That token is

  /// used internally by the LSUnit to track memory dependencies.

  class MemoryGroup {

    unsigned NumPredecessors = 0;

    unsigned NumExecutingPredecessors = 0;

    unsigned NumExecutedPredecessors = 0;


    unsigned NumInstructions = 0;

    unsigned NumExecuting = 0;

    unsigned NumExecuted = 0;

    // Successors that are in a order dependency with this group.

    SmallVector<MemoryGroup *, 4> OrderSucc;

    // Successors that are in a data dependency with this group.

    SmallVector<MemoryGroup *, 4> DataSucc;


    CriticalDependency CriticalPredecessor;

    InstRef CriticalMemoryInstruction;


    MemoryGroup(const MemoryGroup &) = delete;

    MemoryGroup &operator=(const MemoryGroup &) = delete;


  public:

    MemoryGroup() = default;

    MemoryGroup(MemoryGroup &&) = default;


    size_t getNumSuccessors() const {

      return OrderSucc.size() + DataSucc.size();

    }

    unsigned getNumPredecessors() const { return NumPredecessors; }

    unsigned getNumExecutingPredecessors() const {

      return NumExecutingPredecessors;

    }

    unsigned getNumExecutedPredecessors() const {

      return NumExecutedPredecessors;

    }

    unsigned getNumInstructions() const { return NumInstructions; }

    unsigned getNumExecuting() const { return NumExecuting; }

    unsigned getNumExecuted() const { return NumExecuted; }


    const InstRef &getCriticalMemoryInstruction() const {

      return CriticalMemoryInstruction;

    }

    const CriticalDependency &getCriticalPredecessor() const {

      return CriticalPredecessor;

    }


    void addSuccessor(MemoryGroup *Group, bool IsDataDependent) {

      // Do not need to add a dependency if there is no data

      // dependency and all instructions from this group have been

      // issued already.

      if (!IsDataDependent && isExecuting())

        return;


      Group->NumPredecessors++;

      assert(!isExecuted() && "Should have been removed!");

      if (isExecuting())

        Group->onGroupIssued(CriticalMemoryInstruction, IsDataDependent);


      if (IsDataDependent)

        DataSucc.emplace_back(Group);

      else

        OrderSucc.emplace_back(Group);

    }


    bool isWaiting() const {

      return NumPredecessors >

             (NumExecutingPredecessors + NumExecutedPredecessors);

    }

    bool isPending() const {

      return NumExecutingPredecessors &&

             ((NumExecutedPredecessors + NumExecutingPredecessors) ==

              NumPredecessors);

    }

    bool isReady() const { return NumExecutedPredecessors == NumPredecessors; }

    bool isExecuting() const {

      return NumExecuting && (NumExecuting == (NumInstructions - NumExecuted));

    }

    bool isExecuted() const { return NumInstructions == NumExecuted; }


    void onGroupIssued(const InstRef &IR, bool ShouldUpdateCriticalDep) {

      assert(!isReady() && "Unexpected group-start event!");

      NumExecutingPredecessors++;


      if (!ShouldUpdateCriticalDep)

        return;


      unsigned Cycles = IR.getInstruction()->getCyclesLeft();

      if (CriticalPredecessor.Cycles < Cycles) {

        CriticalPredecessor.IID = IR.getSourceIndex();

        CriticalPredecessor.Cycles = Cycles;

      }

    }


    void onGroupExecuted() {

      assert(!isReady() && "Inconsistent state found!");

      NumExecutingPredecessors--;

      NumExecutedPredecessors++;

    }


    void onInstructionIssued(const InstRef &IR) {

      assert(!isExecuting() && "Invalid internal state!");

      ++NumExecuting;


      // update the CriticalMemDep.

      const Instruction &IS = *IR.getInstruction();

      if ((bool)CriticalMemoryInstruction) {

        const Instruction &OtherIS =

            *CriticalMemoryInstruction.getInstruction();

        if (OtherIS.getCyclesLeft() < IS.getCyclesLeft())

          CriticalMemoryInstruction = IR;

      } else {

        CriticalMemoryInstruction = IR;

      }


      if (!isExecuting())

        return;


      // Notify successors that this group started execution.

      for (MemoryGroup *MG : OrderSucc) {

        MG->onGroupIssued(CriticalMemoryInstruction, false);

        // Release the order dependency with this group.

        MG->onGroupExecuted();

      }


      for (MemoryGroup *MG : DataSucc)

        MG->onGroupIssued(CriticalMemoryInstruction, true);

    }


    void onInstructionExecuted(const InstRef &IR) {

      assert(isReady() && !isExecuted() && "Invalid internal state!");

      --NumExecuting;

      ++NumExecuted;


      if (CriticalMemoryInstruction &&

          CriticalMemoryInstruction.getSourceIndex() == IR.getSourceIndex()) {

        CriticalMemoryInstruction.invalidate();

      }


      if (!isExecuted())

        return;


      // Notify data dependent successors that this group has finished

      // execution.

      for (MemoryGroup *MG : DataSucc)

        MG->onGroupExecuted();

    }


    void addInstruction() {

      assert(!getNumSuccessors() && "Cannot add instructions to this group!");

      ++NumInstructions;

    }


    void cycleEvent() {

      if (isWaiting() && CriticalPredecessor.Cycles)

        CriticalPredecessor.Cycles--;

    }

  };

  /// Used to map group identifiers to MemoryGroups.

  DenseMap<unsigned, std::unique_ptr<MemoryGroup>> Groups;

  unsigned NextGroupID = 1;


  unsigned CurrentLoadGroupID;

  unsigned CurrentLoadBarrierGroupID;

  unsigned CurrentStoreGroupID;

  unsigned CurrentStoreBarrierGroupID;


public:

  LSUnit(const MCSchedModel &SM)

      : LSUnit(SM, /* LQSize */ 0, /* SQSize */ 0, /* NoAlias */ false) {}

  LSUnit(const MCSchedModel &SM, unsigned LQ, unsigned SQ)

      : LSUnit(SM, LQ, SQ, /* NoAlias */ false) {}

  LSUnit(const MCSchedModel &SM, unsigned LQ, unsigned SQ, bool AssumeNoAlias)

      : LSUnitBase(SM, LQ, SQ, AssumeNoAlias), CurrentLoadGroupID(0),

        CurrentLoadBarrierGroupID(0), CurrentStoreGroupID(0),

        CurrentStoreBarrierGroupID(0) {}


  /// Returns LSU_AVAILABLE if there are enough load/store queue entries to

  /// accomodate instruction IR.

  Status isAvailable(const InstRef &IR) const override;


  bool isReady(const InstRef &IR) const override {

    unsigned GroupID = IR.getInstruction()->getLSUTokenID();

    const MemoryGroup &Group = getGroup(GroupID);

    return Group.isReady();

  }


  bool isPending(const InstRef &IR) const override {

    unsigned GroupID = IR.getInstruction()->getLSUTokenID();

    const MemoryGroup &Group = getGroup(GroupID);

    return Group.isPending();

  }


  bool isWaiting(const InstRef &IR) const override {

    unsigned GroupID = IR.getInstruction()->getLSUTokenID();

    const MemoryGroup &Group = getGroup(GroupID);

    return Group.isWaiting();

  }


  bool hasDependentUsers(const InstRef &IR) const override {

    unsigned GroupID = IR.getInstruction()->getLSUTokenID();

    const MemoryGroup &Group = getGroup(GroupID);

    return !Group.isExecuted() && Group.getNumSuccessors();

  }


  const CriticalDependency getCriticalPredecessor(unsigned GroupId) override {

    const MemoryGroup &Group = getGroup(GroupId);

    return Group.getCriticalPredecessor();

  }


  /// Allocates LS resources for instruction IR.

  ///

  /// This method assumes that a previous call to `isAvailable(IR)` succeeded

  /// returning LSU_AVAILABLE.

  ///

  /// Rules are:

  /// By default, rules are:

  /// 1. A store may not pass a previous store.

  /// 2. A load may not pass a previous store unless flag 'NoAlias' is set.

  /// 3. A load may pass a previous load.

  /// 4. A store may not pass a previous load (regardless of flag 'NoAlias').

  /// 5. A load has to wait until an older load barrier is fully executed.

  /// 6. A store has to wait until an older store barrier is fully executed.

  unsigned dispatch(const InstRef &IR) override;


  virtual void onInstructionIssued(const InstRef &IR) override {

    unsigned GroupID = IR.getInstruction()->getLSUTokenID();

    Groups[GroupID]->onInstructionIssued(IR);

  }


  virtual void onInstructionRetired(const InstRef &IR) override;


  virtual void onInstructionExecuted(const InstRef &IR) override;


  virtual void cycleEvent() override;


#ifndef NDEBUG

  virtual void dump() const override;

#endif


private:

  bool isValidGroupID(unsigned Index) const {

    return Index && Groups.contains(Index);

  }


  const MemoryGroup &getGroup(unsigned Index) const {

    assert(isValidGroupID(Index) && "Group doesn't exist!");

    return *Groups.find(Index)->second;

  }


  MemoryGroup &getGroup(unsigned Index) {

    assert(isValidGroupID(Index) && "Group doesn't exist!");

    return *Groups.find(Index)->second;

  }


  unsigned createMemoryGroup() {

    Groups.insert(std::make_pair(NextGroupID, std::make_unique<MemoryGroup>()));

    return NextGroupID++;

  }

};


} // namespace mca

} // namespace llvm


#endif // LLVM_MCA_HARDWAREUNITS_LSUNIT_H

DenseMap.h
This file defines the DenseMap class.

Index
uint32_t Index
Definition: ELFObjHandler.cpp:83

HardwareUnit.h
This file defines a base class for describing a simulated hardware unit.

IR
Legalize the Machine IR a function s Machine IR
Definition: Legalizer.cpp:80

Instruction.h
This file defines abstractions used by the Pipeline to model register reads, register writes and inst...

MCSchedule.h

assert
assert(ImpDefSCC.getReg()==AMDGPU::SCC &&ImpDefSCC.isDef())

SmallVector.h
This file defines the SmallVector class.

llvm::DenseMap
Definition: DenseMap.h:727

llvm::SmallVectorBase::size
size_t size() const
Definition: SmallVector.h:78

llvm::SmallVectorImpl::emplace_back
reference emplace_back(ArgTypes &&... Args)
Definition: SmallVector.h:937

llvm::SmallVector
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
Definition: SmallVector.h:1196

llvm::mca::HardwareUnit
Definition: HardwareUnit.h:21

llvm::mca::InstRef
An InstRef contains both a SourceMgr index and Instruction pair.
Definition: Instruction.h:720

llvm::mca::InstRef::invalidate
void invalidate()
Invalidate this reference.
Definition: Instruction.h:741

llvm::mca::InstRef::getSourceIndex
unsigned getSourceIndex() const
Definition: Instruction.h:733

llvm::mca::Instruction
An instruction propagated through the simulated instruction pipeline.
Definition: Instruction.h:600

llvm::mca::Instruction::getCyclesLeft
int getCyclesLeft() const
Definition: Instruction.h:663

llvm::mca::LSUnitBase
Abstract base interface for LS (load/store) units in llvm-mca.
Definition: LSUnit.h:28

llvm::mca::LSUnitBase::dump
virtual void dump() const =0

llvm::mca::LSUnitBase::~LSUnitBase
virtual ~LSUnitBase()

llvm::mca::LSUnitBase::dispatch
virtual unsigned dispatch(const InstRef &IR)=0
Allocates LS resources for instruction IR.

llvm::mca::LSUnitBase::isLQFull
bool isLQFull() const
Definition: LSUnit.h:100

llvm::mca::LSUnitBase::getUsedSQEntries
unsigned getUsedSQEntries() const
Definition: LSUnit.h:68

llvm::mca::LSUnitBase::acquireSQSlot
void acquireSQSlot()
Definition: LSUnit.h:70

llvm::mca::LSUnitBase::isReady
virtual bool isReady(const InstRef &IR) const =0
Check if a previously dispatched instruction IR is now ready for execution.

llvm::mca::LSUnitBase::releaseLQSlot
void releaseLQSlot()
Definition: LSUnit.h:71

llvm::mca::LSUnitBase::isAvailable
virtual Status isAvailable(const InstRef &IR) const =0
This method checks the availability of the load/store buffers.

llvm::mca::LSUnitBase::onInstructionRetired
virtual void onInstructionRetired(const InstRef &IR)=0

llvm::mca::LSUnitBase::onInstructionExecuted
virtual void onInstructionExecuted(const InstRef &IR)=0

llvm::mca::LSUnitBase::cycleEvent
virtual void cycleEvent()=0

llvm::mca::LSUnitBase::getUsedLQEntries
unsigned getUsedLQEntries() const
Definition: LSUnit.h:67

llvm::mca::LSUnitBase::isSQEmpty
bool isSQEmpty() const
Definition: LSUnit.h:97

llvm::mca::LSUnitBase::assumeNoAlias
bool assumeNoAlias() const
Definition: LSUnit.h:74

llvm::mca::LSUnitBase::getLoadQueueSize
unsigned getLoadQueueSize() const
Returns the total number of entries in the load queue.
Definition: LSUnit.h:62

llvm::mca::LSUnitBase::LSU_LQUEUE_FULL
@ LSU_LQUEUE_FULL
Definition: LSUnit.h:78

llvm::mca::LSUnitBase::LSU_AVAILABLE
@ LSU_AVAILABLE
Definition: LSUnit.h:77

llvm::mca::LSUnitBase::LSU_SQUEUE_FULL
@ LSU_SQUEUE_FULL
Definition: LSUnit.h:79

llvm::mca::LSUnitBase::isWaiting
virtual bool isWaiting(const InstRef &IR) const =0
Check if instruction IR is still waiting on memory operations, and the wait time is still unknown.

llvm::mca::LSUnitBase::isSQFull
bool isSQFull() const
Definition: LSUnit.h:99

llvm::mca::LSUnitBase::getCriticalPredecessor
virtual const CriticalDependency getCriticalPredecessor(unsigned GroupId)=0

llvm::mca::LSUnitBase::isPending
virtual bool isPending(const InstRef &IR) const =0
Check if instruction IR only depends on memory instructions that are currently executing.

llvm::mca::LSUnitBase::hasDependentUsers
virtual bool hasDependentUsers(const InstRef &IR) const =0

llvm::mca::LSUnitBase::isLQEmpty
bool isLQEmpty() const
Definition: LSUnit.h:98

llvm::mca::LSUnitBase::getStoreQueueSize
unsigned getStoreQueueSize() const
Returns the total number of entries in the store queue.
Definition: LSUnit.h:65

llvm::mca::LSUnitBase::acquireLQSlot
void acquireLQSlot()
Definition: LSUnit.h:69

llvm::mca::LSUnitBase::onInstructionIssued
virtual void onInstructionIssued(const InstRef &IR)=0

llvm::mca::LSUnitBase::releaseSQSlot
void releaseSQSlot()
Definition: LSUnit.h:72

llvm::mca::LSUnit::MemoryGroup
A node of a memory dependency graph.
Definition: LSUnit.h:245

llvm::mca::LSUnit::MemoryGroup::getNumInstructions
unsigned getNumInstructions() const
Definition: LSUnit.h:278

llvm::mca::LSUnit::MemoryGroup::getNumExecutingPredecessors
unsigned getNumExecutingPredecessors() const
Definition: LSUnit.h:272

llvm::mca::LSUnit::MemoryGroup::addInstruction
void addInstruction()
Definition: LSUnit.h:390

llvm::mca::LSUnit::MemoryGroup::getNumExecuting
unsigned getNumExecuting() const
Definition: LSUnit.h:279

llvm::mca::LSUnit::MemoryGroup::onGroupIssued
void onGroupIssued(const InstRef &IR, bool ShouldUpdateCriticalDep)
Definition: LSUnit.h:322

llvm::mca::LSUnit::MemoryGroup::getNumPredecessors
unsigned getNumPredecessors() const
Definition: LSUnit.h:271

llvm::mca::LSUnit::MemoryGroup::isExecuted
bool isExecuted() const
Definition: LSUnit.h:320

llvm::mca::LSUnit::MemoryGroup::onInstructionExecuted
void onInstructionExecuted(const InstRef &IR)
Definition: LSUnit.h:371

llvm::mca::LSUnit::MemoryGroup::isExecuting
bool isExecuting() const
Definition: LSUnit.h:317

llvm::mca::LSUnit::MemoryGroup::getCriticalPredecessor
const CriticalDependency & getCriticalPredecessor() const
Definition: LSUnit.h:285

llvm::mca::LSUnit::MemoryGroup::isPending
bool isPending() const
Definition: LSUnit.h:311

llvm::mca::LSUnit::MemoryGroup::addSuccessor
void addSuccessor(MemoryGroup *Group, bool IsDataDependent)
Definition: LSUnit.h:289

llvm::mca::LSUnit::MemoryGroup::getNumExecuted
unsigned getNumExecuted() const
Definition: LSUnit.h:280

llvm::mca::LSUnit::MemoryGroup::isWaiting
bool isWaiting() const
Definition: LSUnit.h:307

llvm::mca::LSUnit::MemoryGroup::getNumExecutedPredecessors
unsigned getNumExecutedPredecessors() const
Definition: LSUnit.h:275

llvm::mca::LSUnit::MemoryGroup::onGroupExecuted
void onGroupExecuted()
Definition: LSUnit.h:336

llvm::mca::LSUnit::MemoryGroup::isReady
bool isReady() const
Definition: LSUnit.h:316

llvm::mca::LSUnit::MemoryGroup::MemoryGroup
MemoryGroup(MemoryGroup &&)=default

llvm::mca::LSUnit::MemoryGroup::getNumSuccessors
size_t getNumSuccessors() const
Definition: LSUnit.h:268

llvm::mca::LSUnit::MemoryGroup::onInstructionIssued
void onInstructionIssued(const InstRef &IR)
Definition: LSUnit.h:342

llvm::mca::LSUnit::MemoryGroup::cycleEvent
void cycleEvent()
Definition: LSUnit.h:395

llvm::mca::LSUnit::MemoryGroup::MemoryGroup
MemoryGroup()=default

llvm::mca::LSUnit::MemoryGroup::getCriticalMemoryInstruction
const InstRef & getCriticalMemoryInstruction() const
Definition: LSUnit.h:282

llvm::mca::LSUnit
Default Load/Store Unit (LS Unit) for simulated processors.
Definition: LSUnit.h:195

llvm::mca::LSUnit::dump
virtual void dump() const override
Definition: LSUnit.cpp:50

llvm::mca::LSUnit::CurrentLoadGroupID
unsigned CurrentLoadGroupID
Definition: LSUnit.h:404

llvm::mca::LSUnit::isPending
bool isPending(const InstRef &IR) const override
Check if instruction IR only depends on memory instructions that are currently executing.
Definition: LSUnit.h:429

llvm::mca::LSUnit::isAvailable
Status isAvailable(const InstRef &IR) const override
Returns LSU_AVAILABLE if there are enough load/store queue entries to accommodate instruction IR.
Definition: LSUnit.cpp:194

llvm::mca::LSUnit::isReady
bool isReady(const InstRef &IR) const override
Check if a previously dispatched instruction IR is now ready for execution.
Definition: LSUnit.h:423

llvm::mca::LSUnit::Groups
DenseMap< unsigned, std::unique_ptr< MemoryGroup > > Groups
Used to map group identifiers to MemoryGroups.
Definition: LSUnit.h:401

llvm::mca::LSUnit::onInstructionIssued
virtual void onInstructionIssued(const InstRef &IR) override
Definition: LSUnit.h:467

llvm::mca::LSUnit::CurrentStoreGroupID
unsigned CurrentStoreGroupID
Definition: LSUnit.h:406

llvm::mca::LSUnit::cycleEvent
virtual void cycleEvent() override
Definition: LSUnit.cpp:44

llvm::mca::LSUnit::LSUnit
LSUnit(const MCSchedModel &SM, unsigned LQ, unsigned SQ, bool AssumeNoAlias)
Definition: LSUnit.h:414

llvm::mca::LSUnit::onInstructionExecuted
virtual void onInstructionExecuted(const InstRef &IR) override
Definition: LSUnit.cpp:222

llvm::mca::LSUnit::CurrentLoadBarrierGroupID
unsigned CurrentLoadBarrierGroupID
Definition: LSUnit.h:405

llvm::mca::LSUnit::NextGroupID
unsigned NextGroupID
Definition: LSUnit.h:402

llvm::mca::LSUnit::isWaiting
bool isWaiting(const InstRef &IR) const override
Check if instruction IR is still waiting on memory operations, and the wait time is still unknown.
Definition: LSUnit.h:435

llvm::mca::LSUnit::onInstructionRetired
virtual void onInstructionRetired(const InstRef &IR) override
Definition: LSUnit.cpp:203

llvm::mca::LSUnit::dispatch
unsigned dispatch(const InstRef &IR) override
Allocates LS resources for instruction IR.
Definition: LSUnit.cpp:69

llvm::mca::LSUnit::CurrentStoreBarrierGroupID
unsigned CurrentStoreBarrierGroupID
Definition: LSUnit.h:407

llvm::mca::LSUnit::LSUnit
LSUnit(const MCSchedModel &SM, unsigned LQ, unsigned SQ)
Definition: LSUnit.h:412

llvm::mca::LSUnit::getCriticalPredecessor
const CriticalDependency getCriticalPredecessor(unsigned GroupId) override
Definition: LSUnit.h:447

llvm::mca::LSUnit::hasDependentUsers
bool hasDependentUsers(const InstRef &IR) const override
Definition: LSUnit.h:441

llvm::mca::LSUnit::LSUnit
LSUnit(const MCSchedModel &SM)
Definition: LSUnit.h:410

false
Definition: StackSlotColoring.cpp:193

llvm
This is an optimization pass for GlobalISel generic memory operations.
Definition: AddressRanges.h:18

Status
Definition: SIModeRegister.cpp:29

llvm::MCSchedModel
Machine model for scheduling, bundling, and heuristics.
Definition: MCSchedule.h:256

llvm::mca::CriticalDependency
A critical data dependency descriptor.
Definition: Instruction.h:185

llvm::mca::CriticalDependency::IID
unsigned IID
Definition: Instruction.h:186

llvm::mca::CriticalDependency::Cycles
unsigned Cycles
Definition: Instruction.h:188