doxygen/AMDGPUAsmBackend_8cpp_source.html

//===-- AMDGPUAsmBackend.cpp - AMDGPU Assembler Backend -------------------===//

//

// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.

// See https://llvm.org/LICENSE.txt for license information.

// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception

//

/// \file

//===----------------------------------------------------------------------===//


#include "MCTargetDesc/AMDGPUFixupKinds.h"

#include "MCTargetDesc/AMDGPUMCTargetDesc.h"

#include "Utils/AMDGPUBaseInfo.h"

#include "llvm/ADT/StringSwitch.h"

#include "llvm/BinaryFormat/ELF.h"

#include "llvm/MC/MCAsmBackend.h"

#include "llvm/MC/MCAsmInfo.h"

#include "llvm/MC/MCAssembler.h"

#include "llvm/MC/MCContext.h"

#include "llvm/MC/MCObjectWriter.h"

#include "llvm/MC/MCSubtargetInfo.h"

#include "llvm/MC/MCValue.h"

#include "llvm/MC/TargetRegistry.h"

#include "llvm/Support/EndianStream.h"

#include "llvm/TargetParser/TargetParser.h"


using namespace llvm;

using namespace llvm::AMDGPU;


namespace {


/// AMDGPU implementation of MCAsmBackend. Declares the fixup-application,
/// branch-relaxation, NOP-emission and fixup-kind lookup hooks; the bodies are
/// defined out of line later in this file.
class AMDGPUAsmBackend : public MCAsmBackend {

public:

  /// Constructs the backend with little-endian byte order. The \p T argument
  /// is not used by this constructor.
  AMDGPUAsmBackend(const Target &T) : MCAsmBackend(llvm::endianness::little) {}


  /// Records a relocation if one is needed, then ORs the adjusted fixup value
  /// into the bytes starting at \p Data.
  void applyFixup(const MCFragment &, const MCFixup &, const MCValue &Target,

                  uint8_t *Data, uint64_t Value, bool IsResolved) override;

  /// Returns true when \p Value corresponds to a branch offset of 0x3f
  /// dwords, the case the relaxation works around.
  bool fixupNeedsRelaxation(const MCFixup &Fixup,

                            uint64_t Value) const override;


  /// Rewrites \p Inst to the opcode returned by
  /// AMDGPU::getSOPPWithRelaxation, keeping only operand 0.
  void relaxInstruction(MCInst &Inst,

                        const MCSubtargetInfo &STI) const override;


  /// Returns true only if \p STI has FeatureOffset3fBug and
  /// AMDGPU::getSOPPWithRelaxation(\p Opcode) is non-negative.
  bool mayNeedRelaxation(unsigned Opcode, ArrayRef<MCOperand> Operands,

                         const MCSubtargetInfo &STI) const override;


  /// Returns 4.
  unsigned getMinimumNopSize() const override;

  /// Writes \p Count bytes of padding to \p OS: zero bytes for the unaligned
  /// remainder, then encoded `s_nop 0` words. Always returns true.
  bool writeNopData(raw_ostream &OS, uint64_t Count,

                    const MCSubtargetInfo *STI) const override;


  /// Maps a relocation name to a literal-relocation fixup kind, or
  /// std::nullopt when the name is not recognized.
  std::optional<MCFixupKind> getFixupKind(StringRef Name) const override;

  /// Returns the descriptor for \p Kind; relocation kinds yield a
  /// default-constructed MCFixupKindInfo.
  MCFixupKindInfo getFixupKindInfo(MCFixupKind Kind) const override;

};


} //End anonymous namespace


/// Replace \p Inst with its relaxed form.
///
/// The new instruction takes its opcode from AMDGPU::getSOPPWithRelaxation
/// applied to the current opcode and carries over only operand 0 of the
/// original. \p STI is not consulted here.
void AMDGPUAsmBackend::relaxInstruction(MCInst &Inst,
                                        const MCSubtargetInfo &STI) const {
  MCInst Relaxed;
  Relaxed.setOpcode(AMDGPU::getSOPPWithRelaxation(Inst.getOpcode()));
  Relaxed.addOperand(Inst.getOperand(0));
  Inst = std::move(Relaxed);
}


/// Decide whether a branch fixup must be relaxed.
///
/// gfx1010 hardware workaround: a branch whose target offset is 0x3f has to be
/// relaxed so that an `s_nop 0` is placed immediately after the branch,
/// effectively incrementing the offset.
///
/// \param Fixup unused.
/// \param Value fixup value in bytes, reinterpreted as signed.
/// \returns true when (Value / 4) - 1 equals 0x3f.
bool AMDGPUAsmBackend::fixupNeedsRelaxation(const MCFixup &Fixup,
                                            uint64_t Value) const {
  const int64_t ByteDistance = int64_t(Value);
  const int64_t BranchOffset = (ByteDistance / 4) - 1;
  return BranchOffset == 0x3f;
}


/// Report whether an instruction is a candidate for relaxation.
///
/// Only subtargets with FeatureOffset3fBug are considered, and then only
/// opcodes for which AMDGPU::getSOPPWithRelaxation returns a non-negative
/// value. \p Operands is not inspected.
bool AMDGPUAsmBackend::mayNeedRelaxation(unsigned Opcode,
                                         ArrayRef<MCOperand> Operands,
                                         const MCSubtargetInfo &STI) const {
  // The feature test comes first so the opcode lookup is skipped entirely on
  // subtargets without the bug.
  return STI.hasFeature(AMDGPU::FeatureOffset3fBug) &&
         AMDGPU::getSOPPWithRelaxation(Opcode) >= 0;
}


/// Number of bytes touched by a fixup of the given \p Kind.
///
/// Handles the generic FK_Data_* / FK_SecRel_* kinds of width 1, 2, 4 and 8
/// plus the 2-byte AMDGPU SOPP branch fixup. Any other kind is a programming
/// error.
static unsigned getFixupKindNumBytes(unsigned Kind) {
  switch (Kind) {
  case FK_Data_1:
  case FK_SecRel_1:
    return 1;

  case FK_Data_2:
  case FK_SecRel_2:
  case AMDGPU::fixup_si_sopp_br:
    return 2;

  case FK_Data_4:
  case FK_SecRel_4:
    return 4;

  case FK_Data_8:
  case FK_SecRel_8:
    return 8;

  default:
    break;
  }

  llvm_unreachable("Unknown fixup kind!");
}


/// Convert a raw fixup value into the form that is written into the encoding.
///
/// \param Fixup the fixup being applied; its kind selects the conversion.
/// \param Value the raw fixup value.
/// \param Ctx   context used for error reporting; may be null, in which case
///              the range check on branch immediates is skipped.
/// \returns for fixup_si_sopp_br, (Value - 4) / 4 computed on the signed
///          interpretation of \p Value; for FK_Data_1/2/4/8 and FK_SecRel_4,
///          \p Value unchanged. Any other kind is a programming error.
static uint64_t adjustFixupValue(const MCFixup &Fixup, uint64_t Value,
                                 MCContext *Ctx) {
  const auto Kind = Fixup.getKind();

  if (Kind == AMDGPU::fixup_si_sopp_br) {
    const int64_t Signed = static_cast<int64_t>(Value);
    const int64_t BranchImm = (Signed - 4) / 4;

    // The immediate must fit in a signed 16-bit field; diagnose otherwise but
    // still hand back the computed value.
    const bool FitsSImm16 = isInt<16>(BranchImm);
    if (Ctx && !FitsSImm16)
      Ctx->reportError(Fixup.getLoc(), "branch size exceeds simm16");

    return BranchImm;
  }

  switch (Kind) {
  case FK_Data_1:
  case FK_Data_2:
  case FK_Data_4:
  case FK_Data_8:
  case FK_SecRel_4:
    // Plain data fixups are written verbatim.
    return Value;
  default:
    break;
  }

  llvm_unreachable("unhandled fixup kind");
}


void AMDGPUAsmBackend::applyFixup(const MCFragment &F, const MCFixup &Fixup,

                                  const MCValue &Target, uint8_t *Data,

                                  uint64_t Value, bool IsResolved) {

  if (Target.getSpecifier())

    IsResolved = false;

  maybeAddReloc(F, Fixup, Target, Value, IsResolved);

  if (mc::isRelocation(Fixup.getKind()))

    return;


  Value = adjustFixupValue(Fixup, Value, &getContext());

  if (!Value)

    return; // Doesn't change encoding.


  MCFixupKindInfo Info = getFixupKindInfo(Fixup.getKind());


  // Shift the value into position.

  Value <<= Info.TargetOffset;


  unsigned NumBytes = getFixupKindNumBytes(Fixup.getKind());

  assert(Fixup.getOffset() + NumBytes <= F.getSize() &&

         "Invalid fixup offset!");


  // For each byte of the fragment that the fixup touches, mask in the bits from

  // the fixup value.

  for (unsigned i = 0; i != NumBytes; ++i)

    Data[i] |= static_cast<uint8_t>((Value >> (i * 8)) & 0xff);

}


/// Look up a fixup kind by relocation name.
///
/// Recognized names are every relocation listed in ELFRelocs/AMDGPU.def plus
/// the aliases BFD_RELOC_NONE, BFD_RELOC_32 and BFD_RELOC_64.
///
/// \returns FirstLiteralRelocationKind plus the relocation type for a known
///          name, std::nullopt otherwise.
std::optional<MCFixupKind>
AMDGPUAsmBackend::getFixupKind(StringRef Name) const {
  // Sentinel produced by the switch when no case matches.
  const unsigned NoMatch = -1u;

  const unsigned RelocType = StringSwitch<unsigned>(Name)
#define ELF_RELOC(Name, Value) .Case(#Name, Value)
#include "llvm/BinaryFormat/ELFRelocs/AMDGPU.def"
#undef ELF_RELOC
                                 .Case("BFD_RELOC_NONE", ELF::R_AMDGPU_NONE)
                                 .Case("BFD_RELOC_32", ELF::R_AMDGPU_ABS32)
                                 .Case("BFD_RELOC_64", ELF::R_AMDGPU_ABS64)
                                 .Default(NoMatch);

  if (RelocType == NoMatch)
    return std::nullopt;

  return static_cast<MCFixupKind>(FirstLiteralRelocationKind + RelocType);
}


/// Return the descriptor for fixup kind \p Kind.
///
/// Relocation kinds yield a default-constructed descriptor, generic kinds are
/// delegated to MCAsmBackend, and target kinds are looked up in a local table
/// indexed from FirstTargetFixupKind.
MCFixupKindInfo AMDGPUAsmBackend::getFixupKindInfo(MCFixupKind Kind) const {
  // One entry per AMDGPU target fixup kind.
  static const MCFixupKindInfo TargetInfos[AMDGPU::NumTargetFixupKinds] = {
      // name, offset, bits, flags
      {"fixup_si_sopp_br", 0, 16, 0},
  };

  if (mc::isRelocation(Kind))
    return {};

  const bool IsGenericKind = Kind < FirstTargetFixupKind;
  if (IsGenericKind)
    return MCAsmBackend::getFixupKindInfo(Kind);

  assert(unsigned(Kind - FirstTargetFixupKind) < AMDGPU::NumTargetFixupKinds &&
         "Invalid kind!");

  const unsigned TableIndex = unsigned(Kind - FirstTargetFixupKind);
  return TargetInfos[TableIndex];
}


/// Smallest NOP this backend reports it can emit, in bytes.
unsigned AMDGPUAsmBackend::getMinimumNopSize() const {
  constexpr unsigned MinNopBytes = 4;
  return MinNopBytes;
}


/// Emit \p Count bytes of padding to \p OS.
///
/// The part of \p Count that is not a multiple of the minimum instruction
/// alignment is written as zero bytes: an unaligned count means data is being
/// written into the text section (otherwise instructions themselves would be
/// unaligned, which is a far bigger problem). The remaining, aligned part is
/// filled with encoded `s_nop 0` instructions.
///
/// \param STI unused.
/// \returns always true.
bool AMDGPUAsmBackend::writeNopData(raw_ostream &OS, uint64_t Count,
                                    const MCSubtargetInfo *STI) const {
  const unsigned MinInstAlignment =
      getContext().getAsmInfo()->getMinInstAlignment();

  // Split the request into a zero-filled remainder and whole NOP slots.
  const uint64_t ZeroBytes = Count % MinInstAlignment;
  const uint64_t NumNops = Count / MinInstAlignment;

  OS.write_zeros(ZeroBytes);

  // FIXME: R600 support.
  // Encoding of `s_nop 0`.
  const uint32_t Encoded_S_NOP_0 = 0xbf800000;

  assert(MinInstAlignment == sizeof(Encoded_S_NOP_0));

  for (uint64_t Remaining = NumNops; Remaining != 0; --Remaining)
    support::endian::write<uint32_t>(OS, Encoded_S_NOP_0, Endian);

  return true;
}


//===----------------------------------------------------------------------===//

// ELFAMDGPUAsmBackend class

//===----------------------------------------------------------------------===//


namespace {


/// ELF flavour of the AMDGPU assembler backend. Captures the three
/// triple-derived settings that are handed to the AMDGPU ELF object writer.
class ELFAMDGPUAsmBackend : public AMDGPUAsmBackend {
  /// Set from Triple::isAMDGCN().
  bool Is64Bit;
  /// True only when the OS is AMDHSA.
  bool HasRelocationAddend;
  /// ELF OS/ABI value; stays ELFOSABI_NONE for OSes without a mapping.
  uint8_t OSABI = ELF::ELFOSABI_NONE;

  /// Map the OS component of \p TT to the matching ELF OS/ABI value.
  static uint8_t pickOSABI(const Triple &TT) {
    switch (TT.getOS()) {
    case Triple::AMDHSA:
      return ELF::ELFOSABI_AMDGPU_HSA;
    case Triple::AMDPAL:
      return ELF::ELFOSABI_AMDGPU_PAL;
    case Triple::Mesa3D:
      return ELF::ELFOSABI_AMDGPU_MESA3D;
    default:
      return ELF::ELFOSABI_NONE;
    }
  }

public:
  /// Build the backend for target \p T, deriving all settings from \p TT.
  ELFAMDGPUAsmBackend(const Target &T, const Triple &TT)
      : AMDGPUAsmBackend(T), Is64Bit(TT.isAMDGCN()),
        HasRelocationAddend(TT.getOS() == Triple::AMDHSA),
        OSABI(pickOSABI(TT)) {}

  /// Create the AMDGPU ELF object writer configured with the stored settings.
  std::unique_ptr<MCObjectTargetWriter>
  createObjectTargetWriter() const override {
    return createAMDGPUELFObjectWriter(Is64Bit, OSABI, HasRelocationAddend);
  }
};


} // end anonymous namespace


/// Factory for the AMDGPU assembler backend.
///
/// Always produces an ELFAMDGPUAsmBackend configured from the target triple of
/// \p STI. \p MRI and \p Options are not used. The returned object is
/// heap-allocated with `new`.
MCAsmBackend *llvm::createAMDGPUAsmBackend(const Target &T,
                                           const MCSubtargetInfo &STI,
                                           const MCRegisterInfo &MRI,
                                           const MCTargetOptions &Options) {
  const Triple &TargetTriple = STI.getTargetTriple();
  return new ELFAMDGPUAsmBackend(T, TargetTriple);
}


MRI
unsigned const MachineRegisterInfo * MRI
Definition AArch64AdvSIMDScalarPass.cpp:103

getFixupKindNumBytes
static unsigned getFixupKindNumBytes(unsigned Kind)
The number of bytes the fixup may change.
Definition AArch64AsmBackend.cpp:95

adjustFixupValue
static uint64_t adjustFixupValue(const MCFixup &Fixup, const MCValue &Target, uint64_t Value, MCContext &Ctx, const Triple &TheTriple, bool IsResolved)
Definition AArch64AsmBackend.cpp:140

assert
assert(UImm &&(UImm !=~static_cast< T >(0)) &&"Invalid immediate!")

AMDGPUBaseInfo.h

AMDGPUFixupKinds.h

AMDGPUMCTargetDesc.h
Provides AMDGPU specific target descriptions.

ELF.h

Info
Analysis containing CSE Info
Definition CSEInfo.cpp:27

EndianStream.h

TemplateParamKind::Type
@ Type
Definition ItaniumDemangle.h:1243

Options
static LVOptions Options
Definition LVOptions.cpp:25

MCAsmBackend.h

MCAsmInfo.h

MCAssembler.h

MCContext.h

MCObjectWriter.h

MCSubtargetInfo.h

MCValue.h

F
#define F(x, y, z)
Definition MD5.cpp:54

I
#define I(x, y, z)
Definition MD5.cpp:57

T
#define T
Definition Mips16ISelLowering.cpp:282

Fixup
PowerPC TLS Dynamic Call Fixup
Definition PPCTLSDynamicCall.cpp:336

StringSwitch.h
This file implements the StringSwitch template, which mimics a switch() statement whose cases are str...

TargetParser.h

TargetRegistry.h

llvm::MCAsmBackend
Generic interface to target specific assembler backends.
Definition MCAsmBackend.h:55

llvm::MCAsmBackend::getFixupKindInfo
virtual MCFixupKindInfo getFixupKindInfo(MCFixupKind Kind) const
Get information on a fixup kind.
Definition MCAsmBackend.cpp:89

llvm::MCContext
Context object for machine code objects.
Definition MCContext.h:83

llvm::MCFixup
Encode information on a single operation to perform on a byte sequence (e.g., an encoded instruction)...
Definition MCFixup.h:61

llvm::MCInst
Instances of this class represent a single low-level machine instruction.
Definition MCInst.h:188

llvm::MCInst::getOpcode
unsigned getOpcode() const
Definition MCInst.h:202

llvm::MCInst::addOperand
void addOperand(const MCOperand Op)
Definition MCInst.h:215

llvm::MCInst::setOpcode
void setOpcode(unsigned Op)
Definition MCInst.h:201

llvm::MCInst::getOperand
const MCOperand & getOperand(unsigned i) const
Definition MCInst.h:210

llvm::MCRegisterInfo
MCRegisterInfo base class - We assume that the target defines a static array of MCRegisterDesc object...
Definition MCRegisterInfo.h:151

llvm::MCSubtargetInfo
Generic base class for all target subtargets.
Definition MCSubtargetInfo.h:77

llvm::MCSubtargetInfo::hasFeature
bool hasFeature(unsigned Feature) const
Definition MCSubtargetInfo.h:122

llvm::MCSubtargetInfo::getTargetTriple
const Triple & getTargetTriple() const
Definition MCSubtargetInfo.h:111

llvm::MCTargetOptions
Definition MCTargetOptions.h:29

llvm::Target
Target - Wrapper for Target specific information.
Definition TargetRegistry.h:146

llvm::Value
LLVM Value Representation.
Definition Value.h:75

llvm::raw_ostream::write_zeros
raw_ostream & write_zeros(unsigned NumZeros)
write_zeros - Insert 'NumZeros' nulls.
Definition raw_ostream.cpp:490

uint64_t

llvm_unreachable
#define llvm_unreachable(msg)
Marks that the current location is not supposed to be reachable.
Definition ErrorHandling.h:164

llvm::AMDGPU::Exp::Target
Target
Definition SIDefines.h:1012

llvm::AMDGPU
Definition AMDGPUMetadataVerifier.h:34

llvm::AMDGPU::fixup_si_sopp_br
@ fixup_si_sopp_br
16-bit PC relative fixup for SOPP branch instructions.
Definition AMDGPUFixupKinds.h:18

llvm::AMDGPU::NumTargetFixupKinds
@ NumTargetFixupKinds
Definition AMDGPUFixupKinds.h:22

llvm::AMDGPU::getSOPPWithRelaxation
LLVM_READONLY int getSOPPWithRelaxation(uint16_t Opcode)

llvm::ARM::PredBlockMask::TT
@ TT
Definition ARMBaseInfo.h:107

llvm::ELF::ELFOSABI_NONE
@ ELFOSABI_NONE
Definition ELF.h:346

llvm::VE::getFixupKind
VE::Fixups getFixupKind(uint8_t S)
Definition VEMCAsmInfo.cpp:38

llvm::jitlink::aarch32::applyFixup
Error applyFixup(LinkGraph &G, Block &B, const Edge &E, const ArmConfig &ArmCfg)
Apply fixup expression for edge to block content.
Definition aarch32.h:316

llvm::lltok::Kind
Kind
Definition LLToken.h:18

llvm::mc::isRelocation
bool isRelocation(MCFixupKind FixupKind)
Definition MCFixup.h:130

llvm::sandboxir::getContext
Context & getContext() const
Definition BasicBlock.h:99

llvm::support::endian::write
void write(void *memory, value_type value, endianness endian)
Write a value to memory with a particular endianness.
Definition Endian.h:96

llvm
This is an optimization pass for GlobalISel generic memory operations.
Definition Types.h:26

llvm::Value
FunctionAddr VTableAddr Value
Definition InstrProf.h:137

llvm::isInt
constexpr bool isInt(int64_t x)
Checks if an integer fits into the given bit width.
Definition MathExtras.h:165

llvm::createAMDGPUAsmBackend
MCAsmBackend * createAMDGPUAsmBackend(const Target &T, const MCSubtargetInfo &STI, const MCRegisterInfo &MRI, const MCTargetOptions &Options)
Definition AMDGPUAsmBackend.cpp:255

llvm::createAMDGPUELFObjectWriter
std::unique_ptr< MCObjectTargetWriter > createAMDGPUELFObjectWriter(bool Is64Bit, uint8_t OSABI, bool HasRelocationAddend)
Definition AMDGPUELFObjectWriter.cpp:97

llvm::MCFixupKind
uint16_t MCFixupKind
Extensible enumeration to represent the type of a fixup.
Definition MCFixup.h:22

llvm::Count
FunctionAddr VTableAddr Count
Definition InstrProf.h:139

llvm::FirstTargetFixupKind
@ FirstTargetFixupKind
Definition MCFixup.h:44

llvm::FK_SecRel_2
@ FK_SecRel_2
A two-byte section relative fixup.
Definition MCFixup.h:40

llvm::FirstLiteralRelocationKind
@ FirstLiteralRelocationKind
Definition MCFixup.h:29

llvm::FK_Data_8
@ FK_Data_8
A eight-byte fixup.
Definition MCFixup.h:37

llvm::FK_Data_1
@ FK_Data_1
A one-byte fixup.
Definition MCFixup.h:34

llvm::FK_Data_4
@ FK_Data_4
A four-byte fixup.
Definition MCFixup.h:36

llvm::FK_SecRel_8
@ FK_SecRel_8
A eight-byte section relative fixup.
Definition MCFixup.h:42

llvm::FK_SecRel_4
@ FK_SecRel_4
A four-byte section relative fixup.
Definition MCFixup.h:41

llvm::FK_SecRel_1
@ FK_SecRel_1
A one-byte section relative fixup.
Definition MCFixup.h:39

llvm::FK_Data_2
@ FK_Data_2
A two-byte fixup.
Definition MCFixup.h:35

llvm::Data
FunctionAddr VTableAddr uintptr_t uintptr_t Data
Definition InstrProf.h:189

llvm::ArrayRef
ArrayRef(const T &OneElt) -> ArrayRef< T >

llvm::endianness
endianness
Definition bit.h:71

llvm::endianness::little
@ little
Definition bit.h:73