LLVM 22.0.0git
X86Subtarget.cpp
Go to the documentation of this file.
1//===-- X86Subtarget.cpp - X86 Subtarget Information ----------------------===//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8//
9// This file implements the X86 specific subclass of TargetSubtargetInfo.
10//
11//===----------------------------------------------------------------------===//
12
13#include "X86Subtarget.h"
18#include "X86.h"
19#include "X86MacroFusion.h"
20#include "X86TargetMachine.h"
25#include "llvm/IR/Attributes.h"
27#include "llvm/IR/Function.h"
28#include "llvm/IR/GlobalValue.h"
29#include "llvm/IR/Module.h"
33#include "llvm/Support/Debug.h"
37
38#if defined(_MSC_VER)
39#include <intrin.h>
40#endif
41
42using namespace llvm;
43
44#define DEBUG_TYPE "subtarget"
45
46#define GET_SUBTARGETINFO_TARGET_DESC
47#define GET_SUBTARGETINFO_CTOR
48#include "X86GenSubtargetInfo.inc"
49
50// Temporary option to control early if-conversion for x86 while adding machine
51// models.
52static cl::opt<bool>
53X86EarlyIfConv("x86-early-ifcvt", cl::Hidden,
54 cl::desc("Enable early if-conversion on X86"));
55
56
57/// Classify a blockaddress reference for the current subtarget according to how
58/// we should reference it in a non-pcrel context.
60 return classifyLocalReference(nullptr);
61}
62
63/// Classify a global variable reference for the current subtarget according to
64/// how we should reference it in a non-pcrel context.
65unsigned char
69
70unsigned char
72 CodeModel::Model CM = TM.getCodeModel();
73 // Tagged globals have non-zero upper bits, which makes direct references
74 // require a 64-bit immediate. With the small/medium code models this causes
75 // relocation errors, so we go through the GOT instead.
76 if (AllowTaggedGlobals && CM != CodeModel::Large && GV && !isa<Function>(GV))
78
79 // If we're not PIC, it's not very interesting.
81 return X86II::MO_NO_FLAG;
82
83 if (is64Bit()) {
84 // 64-bit ELF PIC local references may use GOTOFF relocations.
85 if (isTargetELF()) {
86 assert(CM != CodeModel::Tiny &&
87 "Tiny codesize model not supported on X86");
88 // In the large code model, all text is far from any global data, so we
89 // use GOTOFF.
90 if (CM == CodeModel::Large)
91 return X86II::MO_GOTOFF;
92 // Large GlobalValues use GOTOFF, otherwise use RIP-rel access.
93 if (GV)
94 return TM.isLargeGlobalValue(GV) ? X86II::MO_GOTOFF : X86II::MO_NO_FLAG;
95 // GV == nullptr is for all other non-GlobalValue global data like the
96 // constant pool, jump tables, labels, etc. The small and medium code
97 // models treat these as accessible with a RIP-rel access.
98 return X86II::MO_NO_FLAG;
99 }
100
101 // Otherwise, this is either a RIP-relative reference or a 64-bit movabsq,
102 // both of which use MO_NO_FLAG.
103 return X86II::MO_NO_FLAG;
104 }
105
106 // The COFF dynamic linker just patches the executable sections.
107 if (isTargetCOFF())
108 return X86II::MO_NO_FLAG;
109
110 if (isTargetDarwin()) {
111 // 32 bit macho has no relocation for a-b if a is undefined, even if
112 // b is in the section that is being relocated.
113 // This means we have to use o load even for GVs that are known to be
114 // local to the dso.
115 if (GV && (GV->isDeclarationForLinker() || GV->hasCommonLinkage()))
117
119 }
120
121 return X86II::MO_GOTOFF;
122}
123
125 const Module &M) const {
126 // The static large model never uses stubs.
127 if (TM.getCodeModel() == CodeModel::Large && !isPositionIndependent())
128 return X86II::MO_NO_FLAG;
129
130 // Absolute symbols can be referenced directly.
131 if (GV) {
132 if (std::optional<ConstantRange> CR = GV->getAbsoluteSymbolRange()) {
133 // See if we can use the 8-bit immediate form. Note that some instructions
134 // will sign extend the immediate operand, so to be conservative we only
135 // accept the range [0,128).
136 if (CR->getUnsignedMax().ult(128))
137 return X86II::MO_ABS8;
138 else
139 return X86II::MO_NO_FLAG;
140 }
141 }
142
143 if (TM.shouldAssumeDSOLocal(GV))
144 return classifyLocalReference(GV);
145
146 if (isTargetCOFF()) {
147 // ExternalSymbolSDNode like _tls_index.
148 if (!GV)
149 return X86II::MO_NO_FLAG;
150 if (GV->hasDLLImportStorageClass())
151 return X86II::MO_DLLIMPORT;
152 return X86II::MO_COFFSTUB;
153 }
154 // Some JIT users use *-win32-elf triples; these shouldn't use GOT tables.
155 if (isOSWindows())
156 return X86II::MO_NO_FLAG;
157
158 if (is64Bit()) {
159 // ELF supports a large, truly PIC code model with non-PC relative GOT
160 // references. Other object file formats do not. Use the no-flag, 64-bit
161 // reference for them.
162 if (TM.getCodeModel() == CodeModel::Large)
164 // Tagged globals have non-zero upper bits, which makes direct references
165 // require a 64-bit immediate. So we can't let the linker relax the
166 // relocation to a 32-bit RIP-relative direct reference.
167 if (AllowTaggedGlobals && GV && !isa<Function>(GV))
169 return X86II::MO_GOTPCREL;
170 }
171
172 if (isTargetDarwin()) {
176 }
177
178 // 32-bit ELF references GlobalAddress directly in static relocation model.
179 // We cannot use MO_GOT because EBX may not be set up.
180 if (TM.getRelocationModel() == Reloc::Static)
181 return X86II::MO_NO_FLAG;
182 return X86II::MO_GOT;
183}
184
185unsigned char
189
190unsigned char
192 const Module &M) const {
193 if (TM.shouldAssumeDSOLocal(GV))
194 return X86II::MO_NO_FLAG;
195
196 // Functions on COFF can be non-DSO local for three reasons:
197 // - They are intrinsic functions (!GV)
198 // - They are marked dllimport
199 // - They are extern_weak, and a stub is needed
200 if (isTargetCOFF()) {
201 if (!GV)
202 return X86II::MO_NO_FLAG;
203 if (GV->hasDLLImportStorageClass())
204 return X86II::MO_DLLIMPORT;
205 return X86II::MO_COFFSTUB;
206 }
207
209
210 if (isTargetELF()) {
211 if (is64Bit() && F && (CallingConv::X86_RegCall == F->getCallingConv()))
212 // According to psABI, PLT stub clobbers XMM8-XMM15.
213 // In Regcall calling convention those registers are used for passing
214 // parameters. Thus we need to prevent lazy binding in Regcall.
215 return X86II::MO_GOTPCREL;
216 // If PLT must be avoided then the call should be via GOTPCREL.
217 if (((F && F->hasFnAttribute(Attribute::NonLazyBind)) ||
218 (!F && M.getRtLibUseGOT())) &&
219 is64Bit())
220 return X86II::MO_GOTPCREL;
221 // Reference ExternalSymbol directly in static relocation model.
222 if (!is64Bit() && !GV && TM.getRelocationModel() == Reloc::Static)
223 return X86II::MO_NO_FLAG;
224 return X86II::MO_PLT;
225 }
226
227 if (is64Bit()) {
228 if (F && F->hasFnAttribute(Attribute::NonLazyBind))
229 // If the function is marked as non-lazy, generate an indirect call
230 // which loads from the GOT directly. This avoids runtime overhead
231 // at the cost of eager binding (and one extra byte of encoding).
232 return X86II::MO_GOTPCREL;
233 return X86II::MO_NO_FLAG;
234 }
235
236 return X86II::MO_NO_FLAG;
237}
238
239/// Return true if the subtarget allows calls to immediate address.
241 // FIXME: I386 PE/COFF supports PC relative calls using IMAGE_REL_I386_REL32
242 // but WinCOFFObjectWriter::RecordRelocation cannot emit them. Once it does,
243 // the following check for Win32 should be removed.
244 if (Is64Bit || isTargetWin32())
245 return false;
246 return isTargetELF() || TM.getRelocationModel() == Reloc::Static;
247}
248
249void X86Subtarget::initSubtargetFeatures(StringRef CPU, StringRef TuneCPU,
250 StringRef FS) {
251 if (CPU.empty())
252 CPU = "generic";
253
254 if (TuneCPU.empty())
255 TuneCPU = "i586"; // FIXME: "generic" is more modern than llc tests expect.
256
257 std::string FullFS = X86_MC::ParseX86Triple(TargetTriple);
258 assert(!FullFS.empty() && "Failed to parse X86 triple");
259
260 if (!FS.empty())
261 FullFS = (Twine(FullFS) + "," + FS).str();
262
263 // Disable 64-bit only features in non-64-bit mode.
264 StringRef FeaturesIn64BitOnly[] = {
265 "egpr", "push2pop2", "ppx", "ndd", "ccmp", "nf", "cf", "zu", "uintr"};
266 if (FullFS.find("-64bit-mode") != std::string::npos)
267 for (StringRef F : FeaturesIn64BitOnly)
268 FullFS += ",-" + F.str();
269
270 // Parse features string and set the CPU.
271 ParseSubtargetFeatures(CPU, TuneCPU, FullFS);
272
273 // All CPUs that implement SSE4.2 or SSE4A support unaligned accesses of
274 // 16-bytes and under that are reasonably fast. These features were
275 // introduced with Intel's Nehalem/Silvermont and AMD's Family10h
276 // micro-architectures respectively.
277 if (hasSSE42() || hasSSE4A())
278 IsUnalignedMem16Slow = false;
279
280 LLVM_DEBUG(dbgs() << "Subtarget features: SSELevel " << X86SSELevel
281 << ", MMX " << HasMMX << ", 64bit " << HasX86_64 << "\n");
282 if (Is64Bit && !HasX86_64)
283 reportFatalUsageError("64-bit code requested on a subtarget that doesn't "
284 "support it!");
285
286 // Stack alignment is 16 bytes on Darwin, Linux, kFreeBSD, Hurd and for all
287 // 64-bit targets. On Solaris (32-bit), stack alignment is 4 bytes
288 // following the i386 psABI, while on Illumos it is always 16 bytes.
289 if (StackAlignOverride)
290 stackAlignment = *StackAlignOverride;
291 else if (isTargetDarwin() || isTargetLinux() || isTargetKFreeBSD() ||
292 isTargetHurd() || Is64Bit)
293 stackAlignment = Align(16);
294
295 // Consume the vector width attribute or apply any target specific limit.
296 if (PreferVectorWidthOverride)
297 PreferVectorWidth = PreferVectorWidthOverride;
298 else if (Prefer128Bit)
299 PreferVectorWidth = 128;
300 else if (Prefer256Bit)
301 PreferVectorWidth = 256;
302}
303
304X86Subtarget &X86Subtarget::initializeSubtargetDependencies(StringRef CPU,
305 StringRef TuneCPU,
306 StringRef FS) {
307 initSubtargetFeatures(CPU, TuneCPU, FS);
308 return *this;
309}
310
312 StringRef FS, const X86TargetMachine &TM,
313 MaybeAlign StackAlignOverride,
314 unsigned PreferVectorWidthOverride,
315 unsigned RequiredVectorWidth)
316 : X86GenSubtargetInfo(TT, CPU, TuneCPU, FS),
317 PICStyle(PICStyles::Style::None), TM(TM), TargetTriple(TT),
318 StackAlignOverride(StackAlignOverride),
319 PreferVectorWidthOverride(PreferVectorWidthOverride),
320 RequiredVectorWidth(RequiredVectorWidth),
321 InstrInfo(initializeSubtargetDependencies(CPU, TuneCPU, FS)),
322 TLInfo(TM, *this), FrameLowering(*this, getStackAlignment()) {
323 // Determine the PICStyle based on the target selected.
324 if (!isPositionIndependent() || TM.getCodeModel() == CodeModel::Large)
325 // With the large code model, None forces all memory accesses to be indirect
326 // rather than RIP-relative.
328 else if (is64Bit())
330 else if (isTargetCOFF())
332 else if (isTargetDarwin())
334 else if (isTargetELF())
336
337 CallLoweringInfo.reset(new X86CallLowering(*getTargetLowering()));
338 Legalizer.reset(new X86LegalizerInfo(*this, TM));
339
340 auto *RBI = new X86RegisterBankInfo(*getRegisterInfo());
341 RegBankInfo.reset(RBI);
342 InstSelector.reset(createX86InstructionSelector(TM, *this, *RBI));
343}
344
345// Define the virtual destructor out-of-line for build efficiency.
347
349 return CallLoweringInfo.get();
350}
351
353 return InstSelector.get();
354}
355
357 return Legalizer.get();
358}
359
361 return RegBankInfo.get();
362}
363
367
369 std::vector<std::unique_ptr<ScheduleDAGMutation>> &Mutations) const {
370 Mutations.push_back(createX86MacroFusionDAGMutation());
371}
372
374 return TM.isPositionIndependent();
375}
assert(UImm &&(UImm !=~static_cast< T >(0)) &&"Invalid immediate!")
This file contains the simple types necessary to represent the attributes associated with functions a...
This file describes how to lower LLVM calls to machine code calls.
Module.h This file contains the declarations for the Module class.
#define F(x, y, z)
Definition MD5.cpp:54
#define LLVM_DEBUG(...)
Definition Debug.h:114
This file describes how to lower LLVM calls to machine code calls.
static bool is64Bit(const char *name)
This file declares the targeting of the Machinelegalizer class for X86.
This file declares the targeting of the RegisterBankInfo class for X86.
static cl::opt< bool > X86EarlyIfConv("x86-early-ifcvt", cl::Hidden, cl::desc("Enable early if-conversion on X86"))
bool hasDLLImportStorageClass() const
bool isDeclarationForLinker() const
Module * getParent()
Get the module that this global value is contained inside of...
LLVM_ABI std::optional< ConstantRange > getAbsoluteSymbolRange() const
If this is an absolute symbol reference, returns the range of the symbol, otherwise returns std::null...
Definition Globals.cpp:445
bool hasCommonLinkage() const
A Module instance is used to store all the information related to an LLVM module.
Definition Module.h:67
Holds all the information related to register banks.
StringRef - Represent a constant reference to a string, i.e.
Definition StringRef.h:55
constexpr bool empty() const
empty - Check if the string is empty.
Definition StringRef.h:143
Triple - Helper class for working with autoconf configuration names.
Definition Triple.h:47
Twine - A lightweight data structure for efficiently representing the concatenation of temporary valu...
Definition Twine.h:82
This class provides the information for the target register banks.
bool enableEarlyIfConversion() const override
~X86Subtarget() override
bool isOSWindows() const
bool isTargetKFreeBSD() const
bool hasSSE42() const
InstructionSelector * getInstructionSelector() const override
const X86TargetLowering * getTargetLowering() const override
bool canUseCMOV() const
bool isLegalToCallImmediateAddr() const
Return true if the subtarget allows calls to immediate address.
bool isTargetDarwin() const
const RegisterBankInfo * getRegBankInfo() const override
bool isTargetCOFF() const
Align getStackAlignment() const
Returns the minimum alignment known to hold of the stack frame on entry to the function and which mus...
bool isTargetELF() const
unsigned char classifyGlobalReference(const GlobalValue *GV, const Module &M) const
const LegalizerInfo * getLegalizerInfo() const override
bool isPositionIndependent() const
unsigned char classifyLocalReference(const GlobalValue *GV) const
Classify a global variable reference for the current subtarget according to how we should reference i...
unsigned char classifyBlockAddressReference() const
Classify a blockaddress reference for the current subtarget according to how we should reference it i...
const X86RegisterInfo * getRegisterInfo() const override
void setPICStyle(PICStyles::Style Style)
X86Subtarget(const Triple &TT, StringRef CPU, StringRef TuneCPU, StringRef FS, const X86TargetMachine &TM, MaybeAlign StackAlignOverride, unsigned PreferVectorWidthOverride, unsigned RequiredVectorWidth)
This constructor initializes the data members to match that of the specified triple.
const CallLowering * getCallLowering() const override
Methods used by Global ISel.
void ParseSubtargetFeatures(StringRef CPU, StringRef TuneCPU, StringRef FS)
ParseSubtargetFeatures - Parses features string setting specified subtarget options.
void getPostRAMutations(std::vector< std::unique_ptr< ScheduleDAGMutation > > &Mutations) const override
bool isTargetHurd() const
bool isTargetWin32() const
unsigned char classifyGlobalFunctionReference(const GlobalValue *GV, const Module &M) const
Classify a global function reference for the current subtarget.
bool isTargetLinux() const
@ X86_RegCall
Register calling convention used for parameters transfer optimization.
The X86 backend supports a number of different styles of PIC.
@ MO_GOTPCREL_NORELAX
MO_GOTPCREL_NORELAX - Same as MO_GOTPCREL except that R_X86_64_GOTPCREL relocations are guaranteed to...
@ MO_GOTOFF
MO_GOTOFF - On a symbol operand this indicates that the immediate is the offset to the location of th...
@ MO_DARWIN_NONLAZY_PIC_BASE
MO_DARWIN_NONLAZY_PIC_BASE - On a symbol operand "FOO", this indicates that the reference is actually...
@ MO_COFFSTUB
MO_COFFSTUB - On a symbol operand "FOO", this indicates that the reference is actually to the "....
@ MO_DARWIN_NONLAZY
MO_DARWIN_NONLAZY - On a symbol operand "FOO", this indicates that the reference is actually to the "...
@ MO_GOT
MO_GOT - On a symbol operand this indicates that the immediate is the offset to the GOT entry for the...
@ MO_ABS8
MO_ABS8 - On a symbol operand this indicates that the symbol is known to be an absolute symbol in ran...
@ MO_PLT
MO_PLT - On a symbol operand this indicates that the immediate is offset to the PLT entry of symbol n...
@ MO_NO_FLAG
MO_NO_FLAG - No flag for the operand.
@ MO_DLLIMPORT
MO_DLLIMPORT - On a symbol operand "FOO", this indicates that the reference is actually to the "__imp...
@ MO_PIC_BASE_OFFSET
MO_PIC_BASE_OFFSET - On a symbol operand this indicates that the immediate should get the value of th...
@ MO_GOTPCREL
MO_GOTPCREL - On a symbol operand this indicates that the immediate is offset to the GOT entry for th...
std::string ParseX86Triple(const Triple &TT)
This is an optimization pass for GlobalISel generic memory operations.
auto dyn_cast_or_null(const Y &Val)
Definition Casting.h:753
std::unique_ptr< ScheduleDAGMutation > createX86MacroFusionDAGMutation()
Note that you have to add: DAG.addMutation(createX86MacroFusionDAGMutation()); to X86TargetMachine::c...
LLVM_ABI raw_ostream & dbgs()
dbgs() - This returns a reference to a raw_ostream for debugging messages.
Definition Debug.cpp:207
bool isa(const From &Val)
isa<X> - Return true if the parameter to the template is an instance of one of the template type argu...
Definition Casting.h:547
InstructionSelector * createX86InstructionSelector(const X86TargetMachine &TM, const X86Subtarget &, const X86RegisterBankInfo &)
LLVM_ABI void reportFatalUsageError(Error Err)
Report a fatal error that does not indicate a bug in LLVM.
Definition Error.cpp:180
This struct is a compact representation of a valid (non-zero power of two) alignment.
Definition Alignment.h:39
This struct is a compact representation of a valid (power of two) or undefined (0) alignment.
Definition Alignment.h:106