LLVM 23.0.0git
SystemZTargetMachine.cpp
Go to the documentation of this file.
1//===-- SystemZTargetMachine.cpp - Define TargetMachine for SystemZ -------===//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8
11#include "SystemZ.h"
17#include "llvm/ADT/StringRef.h"
19#include "llvm/CodeGen/Passes.h"
22#include "llvm/IR/DataLayout.h"
28#include <memory>
29#include <optional>
30#include <string>
31
32using namespace llvm;
33
35 "systemz-machine-combiner",
36 cl::desc("Enable the machine combiner pass"),
37 cl::init(true), cl::Hidden);
38
40 "generic-sched", cl::Hidden, cl::init(false),
41 cl::desc("Run the generic pre-ra scheduler instead of the SystemZ "
42 "scheduler."));
43
44// NOLINTNEXTLINE(readability-identifier-naming)
61
62static std::unique_ptr<TargetLoweringObjectFile> createTLOF(const Triple &TT) {
63 if (TT.isOSzOS())
64 return std::make_unique<TargetLoweringObjectFileGOFF>();
65
66 // Note: Some times run with -triple s390x-unknown.
67 // In this case, default to ELF unless z/OS specifically provided.
68 return std::make_unique<SystemZELFTargetObjectFile>();
69}
70
71static Reloc::Model getEffectiveRelocModel(std::optional<Reloc::Model> RM) {
72 // Static code is suitable for use in a dynamic executable; there is no
73 // separate DynamicNoPIC model.
74 if (!RM || *RM == Reloc::DynamicNoPIC)
75 return Reloc::Static;
76 return *RM;
77}
78
79// For SystemZ we define the models as follows:
80//
81// Small: BRASL can call any function and will use a stub if necessary.
82// Locally-binding symbols will always be in range of LARL.
83//
84// Medium: BRASL can call any function and will use a stub if necessary.
85// GOT slots and locally-defined text will always be in range
86// of LARL, but other symbols might not be.
87//
88// Large: Equivalent to Medium for now.
89//
90// Kernel: Equivalent to Medium for now.
91//
92// This means that any PIC module smaller than 4GB meets the
93// requirements of Small, so Small seems like the best default there.
94//
95// All symbols bind locally in a non-PIC module, so the choice is less
96// obvious. There are two cases:
97//
98// - When creating an executable, PLTs and copy relocations allow
99// us to treat external symbols as part of the executable.
100// Any executable smaller than 4GB meets the requirements of Small,
101// so that seems like the best default.
102//
103// - When creating JIT code, stubs will be in range of BRASL if the
104// image is less than 4GB in size. GOT entries will likewise be
105// in range of LARL. However, the JIT environment has no equivalent
106// of copy relocs, so locally-binding data symbols might not be in
107// the range of LARL. We need the Medium model in that case.
108static CodeModel::Model
109getEffectiveSystemZCodeModel(std::optional<CodeModel::Model> CM,
110 Reloc::Model RM, bool JIT) {
111 if (CM) {
112 if (*CM == CodeModel::Tiny)
113 report_fatal_error("Target does not support the tiny CodeModel", false);
114 if (*CM == CodeModel::Kernel)
115 report_fatal_error("Target does not support the kernel CodeModel", false);
116 return *CM;
117 }
118 if (JIT)
120 return CodeModel::Small;
121}
122
124 StringRef CPU, StringRef FS,
125 const TargetOptions &Options,
126 std::optional<Reloc::Model> RM,
127 std::optional<CodeModel::Model> CM,
128 CodeGenOptLevel OL, bool JIT)
130 T, TT.computeDataLayout(), TT, CPU, FS, Options,
133 OL),
134 TLOF(createTLOF(getTargetTriple())) {
135 initAsmInfo();
136}
137
139
140const SystemZSubtarget *
142 Attribute CPUAttr = F.getFnAttribute("target-cpu");
143 Attribute TuneAttr = F.getFnAttribute("tune-cpu");
144 Attribute FSAttr = F.getFnAttribute("target-features");
145
146 std::string CPU =
147 CPUAttr.isValid() ? CPUAttr.getValueAsString().str() : TargetCPU;
148 std::string TuneCPU =
149 TuneAttr.isValid() ? TuneAttr.getValueAsString().str() : CPU;
150 std::string FS =
151 FSAttr.isValid() ? FSAttr.getValueAsString().str() : TargetFS;
152
153 // FIXME: This is related to the code below to reset the target options,
154 // we need to know whether the soft float and backchain flags are set on the
155 // function, so we can enable them as subtarget features.
156 bool SoftFloat = F.getFnAttribute("use-soft-float").getValueAsBool();
157 if (SoftFloat)
158 FS += FS.empty() ? "+soft-float" : ",+soft-float";
159 bool BackChain = F.hasFnAttribute("backchain");
160 if (BackChain)
161 FS += FS.empty() ? "+backchain" : ",+backchain";
162
163 auto &I = SubtargetMap[CPU + TuneCPU + FS];
164 if (!I) {
165 I = std::make_unique<SystemZSubtarget>(TargetTriple, CPU, TuneCPU, FS,
166 *this);
167 }
168
169 return I.get();
170}
171
174 // Use GenericScheduler if requested on CL or for Z10 which has no sched
175 // model.
176 if (GenericSched ||
177 !C->MF->getSubtarget().getSchedModel().hasInstrSchedModel())
178 return nullptr;
179
181}
182
187
188namespace {
189
190/// SystemZ Code Generator Pass Configuration Options.
191class SystemZPassConfig : public TargetPassConfig {
192public:
193 SystemZPassConfig(SystemZTargetMachine &TM, PassManagerBase &PM)
194 : TargetPassConfig(TM, PM) {}
195
196 SystemZTargetMachine &getSystemZTargetMachine() const {
198 }
199
200 void addIRPasses() override;
201 bool addInstSelector() override;
202 bool addILPOpts() override;
203 void addPreRegAlloc() override;
204 void addPostRewrite() override;
205 void addPostRegAlloc() override;
206 void addPreSched2() override;
207 void addPreEmitPass() override;
208};
209
210} // end anonymous namespace
211
212void SystemZPassConfig::addIRPasses() {
213 if (getOptLevel() != CodeGenOptLevel::None) {
214 addPass(createSystemZTDCPass());
216 }
217
219
221}
222
223bool SystemZPassConfig::addInstSelector() {
224 addPass(createSystemZISelDag(getSystemZTargetMachine(), getOptLevel()));
225
226 if (getOptLevel() != CodeGenOptLevel::None)
227 addPass(createSystemZLDCleanupPass(getSystemZTargetMachine()));
228
229 return false;
230}
231
232bool SystemZPassConfig::addILPOpts() {
233 addPass(&EarlyIfConverterLegacyID);
234
236 addPass(&MachineCombinerID);
237
238 return true;
239}
240
241void SystemZPassConfig::addPreRegAlloc() {
242 addPass(createSystemZCopyPhysRegsPass(getSystemZTargetMachine()));
243}
244
245void SystemZPassConfig::addPostRewrite() {
246 addPass(createSystemZPostRewritePass(getSystemZTargetMachine()));
247}
248
249void SystemZPassConfig::addPostRegAlloc() {
250 // PostRewrite needs to be run at -O0 also (in which case addPostRewrite()
251 // is not called).
252 if (getOptLevel() == CodeGenOptLevel::None)
253 addPass(createSystemZPostRewritePass(getSystemZTargetMachine()));
254}
255
256void SystemZPassConfig::addPreSched2() {
257 if (getOptLevel() != CodeGenOptLevel::None)
258 addPass(&IfConverterID);
259}
260
261void SystemZPassConfig::addPreEmitPass() {
262 // Do instruction shortening before compare elimination because some
263 // vector instructions will be shortened into opcodes that compare
264 // elimination recognizes.
265 if (getOptLevel() != CodeGenOptLevel::None)
266 addPass(createSystemZShortenInstPass(getSystemZTargetMachine()));
267
268 // We eliminate comparisons here rather than earlier because some
269 // transformations can change the set of available CC values and we
270 // generally want those transformations to have priority. This is
271 // especially true in the commonest case where the result of the comparison
272 // is used by a single in-range branch instruction, since we will then
273 // be able to fuse the compare and the branch instead.
274 //
275 // For example, two-address NILF can sometimes be converted into
276 // three-address RISBLG. NILF produces a CC value that indicates whether
277 // the low word is zero, but RISBLG does not modify CC at all. On the
278 // other hand, 64-bit ANDs like NILL can sometimes be converted to RISBG.
279 // The CC value produced by NILL isn't useful for our purposes, but the
280 // value produced by RISBG can be used for any comparison with zero
281 // (not just equality). So there are some transformations that lose
282 // CC values (while still being worthwhile) and others that happen to make
283 // the CC result more useful than it was originally.
284 //
285 // Another reason is that we only want to use BRANCH ON COUNT in cases
286 // where we know that the count register is not going to be spilled.
287 //
288 // Doing it so late makes it more likely that a register will be reused
289 // between the comparison and the branch, but it isn't clear whether
290 // preventing that would be a win or not.
291 if (getOptLevel() != CodeGenOptLevel::None)
292 addPass(createSystemZElimComparePass(getSystemZTargetMachine()));
293 addPass(createSystemZLongBranchPass(getSystemZTargetMachine()));
294
295 // Do final scheduling after all other optimizations, to get an
296 // optimal input for the decoder (branch relaxation must happen
297 // after block placement).
298 if (getOptLevel() != CodeGenOptLevel::None)
299 addPass(&PostMachineSchedulerID);
300}
301
303 return new SystemZPassConfig(*this, PM);
304}
305
308 return TargetTransformInfo(std::make_unique<SystemZTTIImpl>(this, F));
309}
310
static std::unique_ptr< TargetLoweringObjectFile > createTLOF(const Triple &TT)
static Reloc::Model getEffectiveRelocModel()
#define X(NUM, ENUM, NAME)
Definition ELF.h:853
#define LLVM_ABI
Definition Compiler.h:213
#define LLVM_EXTERNAL_VISIBILITY
Definition Compiler.h:132
#define F(x, y, z)
Definition MD5.cpp:54
#define I(x, y, z)
Definition MD5.cpp:57
#define T
static cl::opt< bool > EnableMachineCombinerPass("ppc-machine-combiner", cl::desc("Enable the machine combiner pass"), cl::init(true), cl::Hidden)
const GCNTargetMachine & getTM(const GCNSubtarget *STI)
static CodeModel::Model getEffectiveSystemZCodeModel(std::optional< CodeModel::Model > CM, Reloc::Model RM, bool JIT)
static cl::opt< bool > GenericSched("generic-sched", cl::Hidden, cl::init(false), cl::desc("Run the generic pre-ra scheduler instead of the SystemZ " "scheduler."))
static cl::opt< bool > EnableMachineCombinerPass("systemz-machine-combiner", cl::desc("Enable the machine combiner pass"), cl::init(true), cl::Hidden)
LLVM_ABI LLVM_EXTERNAL_VISIBILITY void LLVMInitializeSystemZTarget()
Target-Independent Code Generator Pass Configuration Options pass.
This pass exposes codegen information to IR-level passes.
static std::unique_ptr< TargetLoweringObjectFile > createTLOF()
Functions, function parameters, and return types can have attributes to indicate how they should be t...
Definition Attributes.h:105
LLVM_ABI StringRef getValueAsString() const
Return the attribute's value as a string.
bool isValid() const
Return true if the attribute is any kind of attribute.
Definition Attributes.h:261
CodeGenTargetMachineImpl(const Target &T, StringRef DataLayoutString, const Triple &TT, StringRef CPU, StringRef FS, const TargetOptions &Options, Reloc::Model RM, CodeModel::Model CM, CodeGenOptLevel OL)
static LLVM_ABI PassRegistry * getPassRegistry()
getPassRegistry - Access the global registry object, which is automatically initialized at applicatio...
A ScheduleDAG for scheduling lists of MachineInstr.
Represent a constant reference to a string, i.e.
Definition StringRef.h:56
std::string str() const
Get the contents as an std::string.
Definition StringRef.h:222
ScheduleDAGInstrs * createMachineScheduler(MachineSchedContext *C) const override
Create an instance of ScheduleDAGInstrs to be run within the standard MachineScheduler pass for this ...
const SystemZSubtarget * getSubtargetImpl() const =delete
SystemZTargetMachine(const Target &T, const Triple &TT, StringRef CPU, StringRef FS, const TargetOptions &Options, std::optional< Reloc::Model > RM, std::optional< CodeModel::Model > CM, CodeGenOptLevel OL, bool JIT)
TargetTransformInfo getTargetTransformInfo(const Function &F) const override
Get a TargetTransformInfo implementation for the target.
MachineFunctionInfo * createMachineFunctionInfo(BumpPtrAllocator &Allocator, const Function &F, const TargetSubtargetInfo *STI) const override
Create the target's instance of MachineFunctionInfo.
TargetPassConfig * createPassConfig(PassManagerBase &PM) override
Create a pass configuration object to be used by addPassToEmitX methods for generating a pipeline of ...
ScheduleDAGInstrs * createPostMachineScheduler(MachineSchedContext *C) const override
Similar to createMachineScheduler but used when postRA machine scheduling is enabled.
Triple TargetTriple
Triple string, CPU name, and target feature strings the TargetMachine instance is created with.
const Triple & getTargetTriple() const
std::unique_ptr< const MCSubtargetInfo > STI
TargetOptions Options
Target-Independent Code Generator Pass Configuration Options.
virtual void addIRPasses()
Add common target configurable passes that perform LLVM IR to IR transforms following machine indepen...
TargetSubtargetInfo - Generic base class for all target subtargets.
This pass provides access to the codegen interfaces that are needed for IR-level transformations.
Target - Wrapper for Target specific information.
Triple - Helper class for working with autoconf configuration names.
Definition Triple.h:47
PassManagerBase - An abstract interface to allow code to add passes to a pass manager without having ...
@ C
The default llvm calling convention, compatible with C.
Definition CallingConv.h:34
@ DynamicNoPIC
Definition CodeGen.h:25
initializer< Ty > init(const Ty &Val)
This is an optimization pass for GlobalISel generic memory operations.
ScheduleDAGMILive * createSchedLive(MachineSchedContext *C)
Create the standard converging machine scheduler.
Target & getTheSystemZTarget()
void initializeSystemZElimComparePass(PassRegistry &)
FunctionPass * createSystemZLongBranchPass(SystemZTargetMachine &TM)
FunctionPass * createSystemZISelDag(SystemZTargetMachine &TM, CodeGenOptLevel OptLevel)
FunctionPass * createSystemZCopyPhysRegsPass(SystemZTargetMachine &TM)
FunctionPass * createSystemZElimComparePass(SystemZTargetMachine &TM)
void initializeSystemZCopyPhysRegsPass(PassRegistry &)
LLVM_ABI char & PostMachineSchedulerID
PostMachineScheduler - This pass schedules machine instructions postRA.
void initializeSystemZLongBranchPass(PassRegistry &)
void initializeSystemZShortenInstPass(PassRegistry &)
LLVM_ABI char & EarlyIfConverterLegacyID
EarlyIfConverter - This pass performs if-conversion on SSA form by inserting cmov instructions.
LLVM_ABI char & MachineCombinerID
This pass performs instruction combining using trace metrics to estimate critical-path and resource d...
static Reloc::Model getEffectiveRelocModel(std::optional< Reloc::Model > RM)
void initializeSystemZDAGToDAGISelLegacyPass(PassRegistry &)
ScheduleDAGMI * createSchedPostRA(MachineSchedContext *C)
Create a generic scheduler with no vreg liveness or DAG mutation passes.
FunctionPass * createSystemZTDCPass()
LLVM_ABI FunctionPass * createLoopDataPrefetchPass()
LLVM_ABI void report_fatal_error(Error Err, bool gen_crash_diag=true)
Definition Error.cpp:163
FunctionPass * createSystemZShortenInstPass(SystemZTargetMachine &TM)
void initializeSystemZPostRewritePass(PassRegistry &)
CodeGenOptLevel
Code generation optimization level.
Definition CodeGen.h:82
void initializeSystemZTDCPassPass(PassRegistry &)
FunctionPass * createSystemZLDCleanupPass(SystemZTargetMachine &TM)
void initializeSystemZAsmPrinterPass(PassRegistry &)
FunctionPass * createSystemZPostRewritePass(SystemZTargetMachine &TM)
LLVM_ABI char & IfConverterID
IfConverter - This pass performs machine code if conversion.
LLVM_ABI FunctionPass * createAtomicExpandLegacyPass()
AtomicExpandPass - At IR level this pass replace atomic instructions with __atomic_* library calls,...
BumpPtrAllocatorImpl<> BumpPtrAllocator
The standard BumpPtrAllocator which just uses the default template parameters.
Definition Allocator.h:383
void initializeSystemZLDCleanupPass(PassRegistry &)
MachineFunctionInfo - This class can be derived from and used by targets to hold private target-speci...
static FuncInfoTy * create(BumpPtrAllocator &Allocator, const Function &F, const SubtargetTy *STI)
Factory function: default behavior is to call new using the supplied allocator.
MachineSchedContext provides enough context from the MachineScheduler pass for the target to instanti...
RegisterTargetMachine - Helper template for registering a target machine implementation,...