doxygen/AMDGPUHazardLatency_8cpp_source.html

//===--- AMDGPUHazardLatency.cpp - AMDGPU Hazard Latency Adjustment -------===//

//

// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.

// See https://llvm.org/LICENSE.txt for license information.

// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception

//

//===----------------------------------------------------------------------===//

//

/// \file This file contains a DAG scheduling mutation to adjust the

///       latency of data edges between instructions which use registers

///       potentially subject to additional hazard waits not accounted

///       for in the normal scheduling model.

///       While the scheduling model is typically still accurate in these

///       scenarios, adjusting latency of relevant edges can improve wait

///       merging and reduce pipeline impact of any required waits.

//

//===----------------------------------------------------------------------===//


#include "AMDGPUHazardLatency.h"

#include "GCNSubtarget.h"

#include "MCTargetDesc/AMDGPUMCTargetDesc.h"

#include "SIInstrInfo.h"

#include "llvm/CodeGen/ScheduleDAGInstrs.h"


using namespace llvm;


namespace {


/// DAG mutation that adjusts the latency of selected data edges; the
/// adjustment itself is implemented in apply().
///
/// The object keeps references obtained from the MachineFunction passed to the
/// constructor, so it must not outlive that function.
class HazardLatency final : public ScheduleDAGMutation {
private:
  // NOTE: declaration order matters. TRI is initialized from ST in the
  // constructor's initializer list, so ST has to be declared first.
  const GCNSubtarget &ST;
  const SIRegisterInfo &TRI;
  const MachineRegisterInfo &MRI;

public:
  /// Caches the subtarget, its register info and the function's register
  /// info. \p MF is dereferenced unconditionally and must not be null.
  ///
  /// Marked explicit so a MachineFunction pointer never converts silently
  /// into a mutation object.
  explicit HazardLatency(MachineFunction *MF)
      : ST(MF->getSubtarget<GCNSubtarget>()), TRI(*ST.getRegisterInfo()),
        MRI(MF->getRegInfo()) {}

  /// Applies the latency adjustment to \p DAG in place.
  void apply(ScheduleDAGInstrs *DAG) override;
};


/// Scales the latency of data edges that carry an SGPR from one VALU
/// instruction to another VALU instruction.
///
/// Nothing is changed unless the subtarget reports the VALU mask write hazard
/// and is running in Wave64. Producers that are V_READLANE_B32 or
/// V_READFIRSTLANE_B32 are skipped. For every remaining matching edge the
/// latency is multiplied by MaskLatencyBoost.
///
/// A dependence is recorded twice in the DAG: once in the producer's Succs
/// list and once in the consumer's Preds list. Both copies are updated here
/// so they keep reporting the same latency, and the cached height/depth of
/// the two nodes is invalidated because it may have been derived from the old
/// value.
///
/// \param DAG scheduling DAG whose SUnits are adjusted in place.
void HazardLatency::apply(ScheduleDAGInstrs *DAG) {
  constexpr unsigned MaskLatencyBoost = 3;

  // Hazard only manifests in Wave64
  if (!ST.hasVALUMaskWriteHazard() || !ST.isWave64())
    return;

  for (SUnit &SU : DAG->SUnits) {
    const MachineInstr *MI = SU.getInstr();
    if (!SIInstrInfo::isVALU(*MI))
      continue;
    if (MI->getOpcode() == AMDGPU::V_READLANE_B32 ||
        MI->getOpcode() == AMDGPU::V_READFIRSTLANE_B32)
      continue;
    for (SDep &SuccDep : SU.Succs) {
      if (SuccDep.isCtrl())
        continue;
      // Boost latency on VALU writes to SGPRs used by VALUs.
      // Reduce risk of premature VALU pipeline stall on associated reads.
      SUnit *DestSU = SuccDep.getSUnit();
      const MachineInstr *DestMI = DestSU->getInstr();
      if (!SIInstrInfo::isVALU(*DestMI))
        continue;
      Register Reg = SuccDep.getReg();
      if (!TRI.isSGPRReg(MRI, Reg))
        continue;

      // Build the mirrored edge (as stored in DestSU->Preds) *before* the
      // latency changes: SDep equality also compares latency, so the lookup
      // below has to use the old value.
      SDep BackwardDep = SuccDep;
      BackwardDep.setSUnit(&SU);

      const unsigned BoostedLatency = SuccDep.getLatency() * MaskLatencyBoost;
      SuccDep.setLatency(BoostedLatency);

      // Keep the consumer's copy of the edge in agreement with the producer's.
      for (SDep &PredDep : DestSU->Preds) {
        if (PredDep == BackwardDep) {
          PredDep.setLatency(BoostedLatency);
          break;
        }
      }

      // Height of the producer and depth of the consumer depend on this
      // edge's latency; force them to be recomputed.
      SU.setHeightDirty();
      DestSU->setDepthDirty();
    }
  }
}


} // end namespace


/// Factory for the hazard latency DAG mutation.
///
/// \param MF function the mutation will operate on; forwarded unchanged to
///           the HazardLatency constructor.
/// \returns a newly allocated HazardLatency owned by the caller.
std::unique_ptr<ScheduleDAGMutation>
llvm::createAMDGPUHazardLatencyDAGMutation(MachineFunction *MF) {
  std::unique_ptr<ScheduleDAGMutation> Mutation =
      std::make_unique<HazardLatency>(MF);
  return Mutation;
}


AMDGPUHazardLatency.h

AMDGPUMCTargetDesc.h
Provides AMDGPU specific target descriptions.

GCNSubtarget.h
AMD GCN specific subclass of TargetSubtarget.

MI
IRTranslator LLVM IR MI
Definition IRTranslator.cpp:110

Reg
Register Reg
Definition MachineSink.cpp:2126

TRI
Register const TargetRegisterInfo * TRI
Definition MachineSink.cpp:2127

Register
Promote Memory to Register
Definition Mem2Reg.cpp:110

SIInstrInfo.h
Interface definition for SIInstrInfo.

ScheduleDAGInstrs.h

llvm::GCNSubtarget::hasVALUMaskWriteHazard
bool hasVALUMaskWriteHazard() const
Definition GCNSubtarget.h:627

llvm::GCNSubtarget::isWave64
bool isWave64() const
Definition GCNSubtarget.h:911

llvm::MachineFunction
Definition MachineFunction.h:294

llvm::SDep::getSUnit
SUnit * getSUnit() const
Definition ScheduleDAG.h:509

llvm::SDep::setLatency
void setLatency(unsigned Lat)
Sets the latency for this edge.
Definition ScheduleDAG.h:147

llvm::SDep::getLatency
unsigned getLatency() const
Returns the latency value for this edge, which roughly means the minimum number of cycles that must elapse between the predecessor and the successor, given that they have this edge between them.
Definition ScheduleDAG.h:142

llvm::SDep::isCtrl
bool isCtrl() const
Shorthand for getKind() != SDep::Data.
Definition ScheduleDAG.h:161

llvm::SDep::getReg
Register getReg() const
Returns the register associated with this edge.
Definition ScheduleDAG.h:216

llvm::SIInstrInfo::isVALU
static bool isVALU(const MachineInstr &MI)
Definition SIInstrInfo.h:494

llvm::SUnit::Succs
SmallVector< SDep, 4 > Succs
All sunit successors.
Definition ScheduleDAG.h:270

llvm::SUnit::getInstr
MachineInstr * getInstr() const
Returns the representative MachineInstr for this SUnit.
Definition ScheduleDAG.h:399

llvm::ScheduleDAGInstrs
A ScheduleDAG for scheduling lists of MachineInstr.
Definition ScheduleDAGInstrs.h:118

llvm::ScheduleDAGMutation
Mutate the DAG as a postpass after normal DAG building.
Definition ScheduleDAGMutation.h:24

llvm::ScheduleDAG::SUnits
std::vector< SUnit > SUnits
The scheduling units.
Definition ScheduleDAG.h:590

llvm::cl::apply
void apply(Opt *O, const Mod &M, const Mods &... Ms)
Definition CommandLine.h:1340

llvm
This is an optimization pass for GlobalISel generic memory operations.
Definition FunctionInfo.h:25

llvm::createAMDGPUHazardLatencyDAGMutation
std::unique_ptr< ScheduleDAGMutation > createAMDGPUHazardLatencyDAGMutation(MachineFunction *MF)
Definition AMDGPUHazardLatency.cpp:75