LLVM 17.0.0git
AMDGPUAsmBackend.cpp
Go to the documentation of this file.
1//===-- AMDGPUAsmBackend.cpp - AMDGPU Assembler Backend -------------------===//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7/// \file
8//===----------------------------------------------------------------------===//
9
15#include "llvm/MC/MCAssembler.h"
16#include "llvm/MC/MCContext.h"
23
24using namespace llvm;
25using namespace llvm::AMDGPU;
26
27namespace {
28
29class AMDGPUAsmBackend : public MCAsmBackend {
30public:
31 AMDGPUAsmBackend(const Target &T) : MCAsmBackend(support::little) {}
32
33 unsigned getNumFixupKinds() const override { return AMDGPU::NumTargetFixupKinds; };
34
35 void applyFixup(const MCAssembler &Asm, const MCFixup &Fixup,
37 uint64_t Value, bool IsResolved,
38 const MCSubtargetInfo *STI) const override;
41 const MCAsmLayout &Layout) const override;
42
43 void relaxInstruction(MCInst &Inst,
44 const MCSubtargetInfo &STI) const override;
45
46 bool mayNeedRelaxation(const MCInst &Inst,
47 const MCSubtargetInfo &STI) const override;
48
49 unsigned getMinimumNopSize() const override;
51 const MCSubtargetInfo *STI) const override;
52
53 std::optional<MCFixupKind> getFixupKind(StringRef Name) const override;
54 const MCFixupKindInfo &getFixupKindInfo(MCFixupKind Kind) const override;
55 bool shouldForceRelocation(const MCAssembler &Asm, const MCFixup &Fixup,
56 const MCValue &Target) override;
57};
58
59} //End anonymous namespace
60
61void AMDGPUAsmBackend::relaxInstruction(MCInst &Inst,
62 const MCSubtargetInfo &STI) const {
63 MCInst Res;
64 unsigned RelaxedOpcode = AMDGPU::getSOPPWithRelaxation(Inst.getOpcode());
65 Res.setOpcode(RelaxedOpcode);
66 Res.addOperand(Inst.getOperand(0));
67 Inst = std::move(Res);
68}
69
70bool AMDGPUAsmBackend::fixupNeedsRelaxation(const MCFixup &Fixup,
73 const MCAsmLayout &Layout) const {
74 // if the branch target has an offset of x3f this needs to be relaxed to
75 // add a s_nop 0 immediately after branch to effectively increment offset
76 // for hardware workaround in gfx1010
77 return (((int64_t(Value)/4)-1) == 0x3f);
78}
79
80bool AMDGPUAsmBackend::mayNeedRelaxation(const MCInst &Inst,
81 const MCSubtargetInfo &STI) const {
82 if (!STI.hasFeature(AMDGPU::FeatureOffset3fBug))
83 return false;
84
86 return true;
87
88 return false;
89}
90
91static unsigned getFixupKindNumBytes(unsigned Kind) {
92 switch (Kind) {
94 return 2;
95 case FK_SecRel_1:
96 case FK_Data_1:
97 return 1;
98 case FK_SecRel_2:
99 case FK_Data_2:
100 return 2;
101 case FK_SecRel_4:
102 case FK_Data_4:
103 case FK_PCRel_4:
104 return 4;
105 case FK_SecRel_8:
106 case FK_Data_8:
107 return 8;
108 default:
109 llvm_unreachable("Unknown fixup kind!");
110 }
111}
112
114 MCContext *Ctx) {
115 int64_t SignedValue = static_cast<int64_t>(Value);
116
117 switch (Fixup.getTargetKind()) {
119 int64_t BrImm = (SignedValue - 4) / 4;
120
121 if (Ctx && !isInt<16>(BrImm))
122 Ctx->reportError(Fixup.getLoc(), "branch size exceeds simm16");
123
124 return BrImm;
125 }
126 case FK_Data_1:
127 case FK_Data_2:
128 case FK_Data_4:
129 case FK_Data_8:
130 case FK_PCRel_4:
131 case FK_SecRel_4:
132 return Value;
133 default:
134 llvm_unreachable("unhandled fixup kind");
135 }
136}
137
138void AMDGPUAsmBackend::applyFixup(const MCAssembler &Asm, const MCFixup &Fixup,
139 const MCValue &Target,
141 bool IsResolved,
142 const MCSubtargetInfo *STI) const {
143 if (Fixup.getKind() >= FirstLiteralRelocationKind)
144 return;
145
146 Value = adjustFixupValue(Fixup, Value, &Asm.getContext());
147 if (!Value)
148 return; // Doesn't change encoding.
149
150 MCFixupKindInfo Info = getFixupKindInfo(Fixup.getKind());
151
152 // Shift the value into position.
153 Value <<= Info.TargetOffset;
154
155 unsigned NumBytes = getFixupKindNumBytes(Fixup.getKind());
156 uint32_t Offset = Fixup.getOffset();
157 assert(Offset + NumBytes <= Data.size() && "Invalid fixup offset!");
158
159 // For each byte of the fragment that the fixup touches, mask in the bits from
160 // the fixup value.
161 for (unsigned i = 0; i != NumBytes; ++i)
162 Data[Offset + i] |= static_cast<uint8_t>((Value >> (i * 8)) & 0xff);
163}
164
165std::optional<MCFixupKind>
166AMDGPUAsmBackend::getFixupKind(StringRef Name) const {
168#define ELF_RELOC(Name, Value) \
170#include "llvm/BinaryFormat/ELFRelocs/AMDGPU.def"
171#undef ELF_RELOC
172 .Default(std::nullopt);
173}
174
175const MCFixupKindInfo &AMDGPUAsmBackend::getFixupKindInfo(
176 MCFixupKind Kind) const {
177 const static MCFixupKindInfo Infos[AMDGPU::NumTargetFixupKinds] = {
178 // name offset bits flags
179 { "fixup_si_sopp_br", 0, 16, MCFixupKindInfo::FKF_IsPCRel },
180 };
181
182 if (Kind >= FirstLiteralRelocationKind)
184
185 if (Kind < FirstTargetFixupKind)
187
188 return Infos[Kind - FirstTargetFixupKind];
189}
190
191bool AMDGPUAsmBackend::shouldForceRelocation(const MCAssembler &,
192 const MCFixup &Fixup,
193 const MCValue &) {
194 return Fixup.getKind() >= FirstLiteralRelocationKind;
195}
196
197unsigned AMDGPUAsmBackend::getMinimumNopSize() const {
198 return 4;
199}
200
201bool AMDGPUAsmBackend::writeNopData(raw_ostream &OS, uint64_t Count,
202 const MCSubtargetInfo *STI) const {
203 // If the count is not 4-byte aligned, we must be writing data into the text
204 // section (otherwise we have unaligned instructions, and thus have far
205 // bigger problems), so just write zeros instead.
206 OS.write_zeros(Count % 4);
207
208 // We are properly aligned, so write NOPs as requested.
209 Count /= 4;
210
211 // FIXME: R600 support.
212 // s_nop 0
213 const uint32_t Encoded_S_NOP_0 = 0xbf800000;
214
215 for (uint64_t I = 0; I != Count; ++I)
216 support::endian::write<uint32_t>(OS, Encoded_S_NOP_0, Endian);
217
218 return true;
219}
220
221//===----------------------------------------------------------------------===//
222// ELFAMDGPUAsmBackend class
223//===----------------------------------------------------------------------===//
224
225namespace {
226
227class ELFAMDGPUAsmBackend : public AMDGPUAsmBackend {
228 bool Is64Bit;
229 bool HasRelocationAddend;
230 uint8_t OSABI = ELF::ELFOSABI_NONE;
231 uint8_t ABIVersion = 0;
232
233public:
234 ELFAMDGPUAsmBackend(const Target &T, const Triple &TT, uint8_t ABIVersion) :
235 AMDGPUAsmBackend(T), Is64Bit(TT.getArch() == Triple::amdgcn),
236 HasRelocationAddend(TT.getOS() == Triple::AMDHSA),
237 ABIVersion(ABIVersion) {
238 switch (TT.getOS()) {
239 case Triple::AMDHSA:
241 break;
242 case Triple::AMDPAL:
244 break;
245 case Triple::Mesa3D:
247 break;
248 default:
249 break;
250 }
251 }
252
253 std::unique_ptr<MCObjectTargetWriter>
254 createObjectTargetWriter() const override {
255 return createAMDGPUELFObjectWriter(Is64Bit, OSABI, HasRelocationAddend,
256 ABIVersion);
257 }
258};
259
260} // end anonymous namespace
261
263 const MCSubtargetInfo &STI,
264 const MCRegisterInfo &MRI,
265 const MCTargetOptions &Options) {
266 return new ELFAMDGPUAsmBackend(T, STI.getTargetTriple(),
267 getHsaAbiVersion(&STI).value_or(0));
268}
unsigned const MachineRegisterInfo * MRI
#define ELF_RELOC(Name, Value)
static uint64_t adjustFixupValue(const MCFixup &Fixup, uint64_t Value, MCContext *Ctx)
static unsigned getFixupKindNumBytes(unsigned Kind)
Provides AMDGPU specific target descriptions.
Analysis containing CSE Info
Definition: CSEInfo.cpp:27
static RegisterPass< DebugifyFunctionPass > DF("debugify-function", "Attach debug info to a function")
@ Default
Definition: DwarfDebug.cpp:86
std::string Name
static LVOptions Options
Definition: LVOptions.cpp:25
#define I(x, y, z)
Definition: MD5.cpp:58
PowerPC TLS Dynamic Call Fixup
assert(ImpDefSCC.getReg()==AMDGPU::SCC &&ImpDefSCC.isDef())
raw_pwrite_stream & OS
Generic interface to target specific assembler backends.
Definition: MCAsmBackend.h:41
virtual unsigned getMinimumNopSize() const
Returns the minimum size of a nop in bytes on this target.
Definition: MCAsmBackend.h:190
virtual bool writeNopData(raw_ostream &OS, uint64_t Count, const MCSubtargetInfo *STI) const =0
Write an (optimal) nop sequence of Count bytes to the given output.
virtual void relaxInstruction(MCInst &Inst, const MCSubtargetInfo &STI) const
Relax the instruction in the given fragment to the next wider instruction.
Definition: MCAsmBackend.h:171
virtual bool mayNeedRelaxation(const MCInst &Inst, const MCSubtargetInfo &STI) const
Check whether the given instruction may need relaxation.
Definition: MCAsmBackend.h:148
virtual bool fixupNeedsRelaxation(const MCFixup &Fixup, uint64_t Value, const MCRelaxableFragment *DF, const MCAsmLayout &Layout) const =0
Simple predicate for targets where !Resolved implies requiring relaxation.
virtual bool shouldForceRelocation(const MCAssembler &Asm, const MCFixup &Fixup, const MCValue &Target)
Hook to check if a relocation is needed for some target specific reason.
Definition: MCAsmBackend.h:97
virtual unsigned getNumFixupKinds() const =0
Get the number of target specific fixup kinds.
virtual const MCFixupKindInfo & getFixupKindInfo(MCFixupKind Kind) const
Get information on a fixup kind.
virtual std::optional< MCFixupKind > getFixupKind(StringRef Name) const
Map a relocation name used in .reloc to a fixup kind.
virtual void applyFixup(const MCAssembler &Asm, const MCFixup &Fixup, const MCValue &Target, MutableArrayRef< char > Data, uint64_t Value, bool IsResolved, const MCSubtargetInfo *STI) const =0
Apply the Value for given Fixup into the provided data fragment, at the offset specified by the fixup...
Encapsulates the layout of an assembly file at a particular point in time.
Definition: MCAsmLayout.h:28
Context object for machine code objects.
Definition: MCContext.h:76
void reportError(SMLoc L, const Twine &Msg)
Definition: MCContext.cpp:1049
Encode information on a single operation to perform on a byte sequence (e.g., an encoded instruction)...
Definition: MCFixup.h:71
Instances of this class represent a single low-level machine instruction.
Definition: MCInst.h:184
unsigned getOpcode() const
Definition: MCInst.h:198
void addOperand(const MCOperand Op)
Definition: MCInst.h:210
void setOpcode(unsigned Op)
Definition: MCInst.h:197
const MCOperand & getOperand(unsigned i) const
Definition: MCInst.h:206
MCRegisterInfo base class - We assume that the target defines a static array of MCRegisterDesc object...
A relaxable fragment holds on to its MCInst, since it may need to be relaxed during the assembler lay...
Definition: MCFragment.h:270
Generic base class for all target subtargets.
bool hasFeature(unsigned Feature) const
const Triple & getTargetTriple() const
This represents an "assembler immediate".
Definition: MCValue.h:36
MutableArrayRef - Represent a mutable reference to an array (0 or more elements consecutively in memo...
Definition: ArrayRef.h:305
StringRef - Represent a constant reference to a string, i.e.
Definition: StringRef.h:50
A switch()-like statement whose cases are string literals.
Definition: StringSwitch.h:44
Target - Wrapper for Target specific information.
Triple - Helper class for working with autoconf configuration names.
Definition: Triple.h:44
LLVM Value Representation.
Definition: Value.h:74
This class implements an extremely fast bulk output stream that can only output to a stream.
Definition: raw_ostream.h:52
raw_ostream & write_zeros(unsigned NumZeros)
write_zeros - Insert 'NumZeros' nulls.
#define llvm_unreachable(msg)
Marks that the current location is not supposed to be reachable.
@ fixup_si_sopp_br
16-bit PC relative fixup for SOPP branch instructions.
std::optional< uint8_t > getHsaAbiVersion(const MCSubtargetInfo *STI)
LLVM_READONLY int getSOPPWithRelaxation(uint16_t Opcode)
@ ELFOSABI_AMDGPU_HSA
Definition: ELF.h:360
@ ELFOSABI_AMDGPU_MESA3D
Definition: ELF.h:362
@ ELFOSABI_NONE
Definition: ELF.h:341
@ ELFOSABI_AMDGPU_PAL
Definition: ELF.h:361
This is an optimization pass for GlobalISel generic memory operations.
Definition: AddressRanges.h:18
@ Offset
Definition: DWP.cpp:406
MCAsmBackend * createAMDGPUAsmBackend(const Target &T, const MCSubtargetInfo &STI, const MCRegisterInfo &MRI, const MCTargetOptions &Options)
std::unique_ptr< MCObjectTargetWriter > createAMDGPUELFObjectWriter(bool Is64Bit, uint8_t OSABI, bool HasRelocationAddend, uint8_t ABIVersion)
MCFixupKind
Extensible enumeration to represent the type of a fixup.
Definition: MCFixup.h:21
@ FirstTargetFixupKind
Definition: MCFixup.h:45
@ FK_PCRel_4
A four-byte pc relative fixup.
Definition: MCFixup.h:30
@ FK_SecRel_2
A two-byte section relative fixup.
Definition: MCFixup.h:41
@ FirstLiteralRelocationKind
The range [FirstLiteralRelocationKind, MaxTargetFixupKind) is used for relocations coming from ....
Definition: MCFixup.h:50
@ FK_Data_8
A eight-byte fixup.
Definition: MCFixup.h:26
@ FK_Data_1
A one-byte fixup.
Definition: MCFixup.h:23
@ FK_Data_4
A four-byte fixup.
Definition: MCFixup.h:25
@ FK_SecRel_8
A eight-byte section relative fixup.
Definition: MCFixup.h:43
@ FK_NONE
A no-op fixup.
Definition: MCFixup.h:22
@ FK_SecRel_4
A four-byte section relative fixup.
Definition: MCFixup.h:42
@ FK_SecRel_1
A one-byte section relative fixup.
Definition: MCFixup.h:40
@ FK_Data_2
A two-byte fixup.
Definition: MCFixup.h:24
Target independent information on a fixup kind.
@ FKF_IsPCRel
Is this fixup kind PCrelative? This is used by the assembler backend to evaluate fixup values in a ta...