LLVM 23.0.0git
LoongArchTargetMachine.cpp
Go to the documentation of this file.
1//===-- LoongArchTargetMachine.cpp - Define TargetMachine for LoongArch ---===//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8//
9// Implements the info about LoongArch target spec.
10//
11//===----------------------------------------------------------------------===//
12
14#include "LoongArch.h"
21#include "llvm/CodeGen/Passes.h"
28#include <optional>
29
30using namespace llvm;
31
32#define DEBUG_TYPE "loongarch"
33
48
50 "loongarch-enable-dead-defs", cl::Hidden,
51 cl::desc("Enable the pass that removes dead"
52 " definitons and replaces stores to"
53 " them with stores to r0"),
54 cl::init(true));
55
56static cl::opt<bool>
57 EnableLoopDataPrefetch("loongarch-enable-loop-data-prefetch", cl::Hidden,
58 cl::desc("Enable the loop data prefetch pass"),
59 cl::init(false));
60
61static cl::opt<bool>
62 EnableMergeBaseOffset("loongarch-enable-merge-offset",
63 cl::desc("Enable the merge base offset pass"),
64 cl::init(true), cl::Hidden);
65
66static cl::opt<bool>
67 EnableSinkFold("loongarch-enable-sink-fold",
68 cl::desc("Enable sinking and folding of instruction copies"),
69 cl::init(true), cl::Hidden);
70
71static Reloc::Model getEffectiveRelocModel(std::optional<Reloc::Model> RM) {
72 return RM.value_or(Reloc::Static);
73}
74
77 std::optional<CodeModel::Model> CM) {
78 if (!CM)
79 return TT.isArch64Bit() ? CodeModel::Medium : CodeModel::Small;
80
81 switch (*CM) {
84 return *CM;
86 if (!TT.isArch64Bit())
87 report_fatal_error("Large code model requires LA64");
88 return *CM;
89 default:
91 "Only small, medium and large code models are allowed on LoongArch");
92 }
93}
94
96 const Target &T, const Triple &TT, StringRef CPU, StringRef FS,
97 const TargetOptions &Options, std::optional<Reloc::Model> RM,
98 std::optional<CodeModel::Model> CM, CodeGenOptLevel OL, bool JIT)
99 : CodeGenTargetMachineImpl(T, TT.computeDataLayout(), TT, CPU, FS, Options,
102 TLOF(std::make_unique<LoongArchELFTargetObjectFile>()) {
103 initAsmInfo();
104}
105
107
108const LoongArchSubtarget *
110 Attribute CPUAttr = F.getFnAttribute("target-cpu");
111 Attribute TuneAttr = F.getFnAttribute("tune-cpu");
112 Attribute FSAttr = F.getFnAttribute("target-features");
113
114 std::string CPU =
115 CPUAttr.isValid() ? CPUAttr.getValueAsString().str() : TargetCPU;
116 std::string TuneCPU =
117 TuneAttr.isValid() ? TuneAttr.getValueAsString().str() : CPU;
118 std::string FS =
119 FSAttr.isValid() ? FSAttr.getValueAsString().str() : TargetFS;
120
121 std::string Key = CPU + TuneCPU + FS;
122 auto &I = SubtargetMap[Key];
123 if (!I) {
124 auto ABIName = Options.MCOptions.getABIName();
125 if (const MDString *ModuleTargetABI = dyn_cast_or_null<MDString>(
126 F.getParent()->getModuleFlag("target-abi"))) {
127 auto TargetABI = LoongArchABI::getTargetABI(ABIName);
128 if (TargetABI != LoongArchABI::ABI_Unknown &&
129 ModuleTargetABI->getString() != ABIName) {
130 report_fatal_error("-target-abi option != target-abi module flag");
131 }
132 ABIName = ModuleTargetABI->getString();
133 }
134 I = std::make_unique<LoongArchSubtarget>(TargetTriple, CPU, TuneCPU, FS,
135 ABIName, *this);
136 }
137 return I.get();
138}
139
146
147namespace {
148class LoongArchPassConfig : public TargetPassConfig {
149public:
150 LoongArchPassConfig(LoongArchTargetMachine &TM, PassManagerBase &PM)
151 : TargetPassConfig(TM, PM) {
152 setEnableSinkAndFold(EnableSinkFold);
153 }
154
155 LoongArchTargetMachine &getLoongArchTargetMachine() const {
157 }
158
159 void addIRPasses() override;
160 void addCodeGenPrepare() override;
161 bool addInstSelector() override;
162 void addPreEmitPass() override;
163 void addPreEmitPass2() override;
164 void addMachineSSAOptimization() override;
165 void addPreRegAlloc() override;
166 bool addRegAssignAndRewriteFast() override;
167 bool addRegAssignAndRewriteOptimized() override;
168};
169} // end namespace
170
173 return new LoongArchPassConfig(*this, PM);
174}
175
176void LoongArchPassConfig::addIRPasses() {
177 // Run LoopDataPrefetch
178 //
179 // Run this before LSR to remove the multiplies involved in computing the
180 // pointer values N iterations ahead.
181 if (TM->getOptLevel() != CodeGenOptLevel::None && EnableLoopDataPrefetch)
184
186}
187
188void LoongArchPassConfig::addCodeGenPrepare() {
189 if (getOptLevel() != CodeGenOptLevel::None)
192}
193
194bool LoongArchPassConfig::addInstSelector() {
195 addPass(createLoongArchISelDag(getLoongArchTargetMachine(), getOptLevel()));
196
197 return false;
198}
199
202 return TargetTransformInfo(std::make_unique<LoongArchTTIImpl>(this, F));
203}
204
205void LoongArchPassConfig::addPreEmitPass() { addPass(&BranchRelaxationPassID); }
206
207void LoongArchPassConfig::addPreEmitPass2() {
209 // Schedule the expansion of AtomicPseudos at the last possible moment,
210 // avoiding the possibility for other passes to break the requirements for
211 // forward progress in the LL/SC block.
213}
214
215void LoongArchPassConfig::addMachineSSAOptimization() {
217
218 if (TM->getTargetTriple().isLoongArch64()) {
220 }
221}
222
223void LoongArchPassConfig::addPreRegAlloc() {
225 if (TM->getOptLevel() != CodeGenOptLevel::None && EnableMergeBaseOffset)
227}
228
229bool LoongArchPassConfig::addRegAssignAndRewriteFast() {
230 if (TM->getOptLevel() != CodeGenOptLevel::None &&
234}
235
236bool LoongArchPassConfig::addRegAssignAndRewriteOptimized() {
237 if (TM->getOptLevel() != CodeGenOptLevel::None &&
241}
static cl::opt< bool > EnableSinkFold("aarch64-enable-sink-fold", cl::desc("Enable sinking and folding of instruction copies"), cl::init(true), cl::Hidden)
static cl::opt< bool > EnableLoopDataPrefetch("aarch64-enable-loop-data-prefetch", cl::Hidden, cl::desc("Enable the loop data prefetch pass"), cl::init(true))
static Reloc::Model getEffectiveRelocModel()
#define X(NUM, ENUM, NAME)
Definition ELF.h:853
#define LLVM_ABI
Definition Compiler.h:213
#define LLVM_EXTERNAL_VISIBILITY
Definition Compiler.h:132
static cl::opt< bool > EnableLoongArchDeadRegisterElimination("loongarch-enable-dead-defs", cl::Hidden, cl::desc("Enable the pass that removes dead" " definitons and replaces stores to" " them with stores to r0"), cl::init(true))
static cl::opt< bool > EnableMergeBaseOffset("loongarch-enable-merge-offset", cl::desc("Enable the merge base offset pass"), cl::init(true), cl::Hidden)
static cl::opt< bool > EnableLoopDataPrefetch("loongarch-enable-loop-data-prefetch", cl::Hidden, cl::desc("Enable the loop data prefetch pass"), cl::init(false))
LLVM_ABI LLVM_EXTERNAL_VISIBILITY void LLVMInitializeLoongArchTarget()
static CodeModel::Model getEffectiveLoongArchCodeModel(const Triple &TT, std::optional< CodeModel::Model > CM)
static cl::opt< bool > EnableSinkFold("loongarch-enable-sink-fold", cl::desc("Enable sinking and folding of instruction copies"), cl::init(true), cl::Hidden)
This file a TargetTransformInfoImplBase conforming object specific to the LoongArch target machine.
#define F(x, y, z)
Definition MD5.cpp:54
#define I(x, y, z)
Definition MD5.cpp:57
#define T
const GCNTargetMachine & getTM(const GCNSubtarget *STI)
static TableGen::Emitter::Opt Y("gen-skeleton-entry", EmitSkeleton, "Generate example skeleton entry")
Target-Independent Code Generator Pass Configuration Options pass.
This pass exposes codegen information to IR-level passes.
Functions, function parameters, and return types can have attributes to indicate how they should be t...
Definition Attributes.h:105
LLVM_ABI StringRef getValueAsString() const
Return the attribute's value as a string.
bool isValid() const
Return true if the attribute is any kind of attribute.
Definition Attributes.h:261
CodeGenTargetMachineImpl(const Target &T, StringRef DataLayoutString, const Triple &TT, StringRef CPU, StringRef FS, const TargetOptions &Options, Reloc::Model RM, CodeModel::Model CM, CodeGenOptLevel OL)
This implementation is used for LoongArch ELF targets.
LoongArchTargetMachine(const Target &T, const Triple &TT, StringRef CPU, StringRef FS, const TargetOptions &Options, std::optional< Reloc::Model > RM, std::optional< CodeModel::Model > CM, CodeGenOptLevel OL, bool JIT)
const LoongArchSubtarget * getSubtargetImpl() const =delete
TargetPassConfig * createPassConfig(PassManagerBase &PM) override
Create a pass configuration object to be used by addPassToEmitX methods for generating a pipeline of ...
TargetTransformInfo getTargetTransformInfo(const Function &F) const override
Get a TargetTransformInfo implementation for the target.
MachineFunctionInfo * createMachineFunctionInfo(BumpPtrAllocator &Allocator, const Function &F, const TargetSubtargetInfo *STI) const override
Create the target's instance of MachineFunctionInfo.
A single uniqued string.
Definition Metadata.h:722
static LLVM_ABI PassRegistry * getPassRegistry()
getPassRegistry - Access the global registry object, which is automatically initialized at applicatio...
Represent a constant reference to a string, i.e.
Definition StringRef.h:56
std::string str() const
Get the contents as an std::string.
Definition StringRef.h:222
Triple TargetTriple
Triple string, CPU name, and target feature strings the TargetMachine instance is created with.
std::unique_ptr< const MCSubtargetInfo > STI
TargetOptions Options
Target-Independent Code Generator Pass Configuration Options.
virtual void addCodeGenPrepare()
Add pass to prepare the LLVM IR for code generation.
virtual bool addRegAssignAndRewriteFast()
Add core register allocator passes which do the actual register assignment and rewriting.
virtual void addIRPasses()
Add common target configurable passes that perform LLVM IR to IR transforms following machine indepen...
virtual void addMachineSSAOptimization()
addMachineSSAOptimization - Add standard passes that optimize machine instructions in SSA form.
virtual bool addRegAssignAndRewriteOptimized()
TargetSubtargetInfo - Generic base class for all target subtargets.
This pass provides access to the codegen interfaces that are needed for IR-level transformations.
Target - Wrapper for Target specific information.
Triple - Helper class for working with autoconf configuration names.
Definition Triple.h:47
PassManagerBase - An abstract interface to allow code to add passes to a pass manager without having ...
ABI getTargetABI(StringRef ABIName)
initializer< Ty > init(const Ty &Val)
This is an optimization pass for GlobalISel generic memory operations.
Target & getTheLoongArch64Target()
FunctionPass * createLoongArchExpandAtomicPseudoPass()
FunctionPass * createLoongArchDeadRegisterDefinitionsPass()
void initializeLoongArchDAGToDAGISelLegacyPass(PassRegistry &)
LLVM_ABI FunctionPass * createTypePromotionLegacyPass()
Create IR Type Promotion pass.
void initializeLoongArchPreRAExpandPseudoPass(PassRegistry &)
auto dyn_cast_or_null(const Y &Val)
Definition Casting.h:753
void initializeLoongArchMergeBaseOffsetOptPass(PassRegistry &)
static Reloc::Model getEffectiveRelocModel(std::optional< Reloc::Model > RM)
void initializeLoongArchExpandAtomicPseudoPass(PassRegistry &)
LLVM_ABI char & BranchRelaxationPassID
BranchRelaxation - This pass replaces branches that need to jump further than is supported by a branc...
void initializeLoongArchExpandPseudoPass(PassRegistry &)
FunctionPass * createLoongArchOptWInstrsPass()
LLVM_ABI FunctionPass * createLoopDataPrefetchPass()
LLVM_ABI void report_fatal_error(Error Err, bool gen_crash_diag=true)
Definition Error.cpp:163
CodeGenOptLevel
Code generation optimization level.
Definition CodeGen.h:82
LLVM_ATTRIBUTE_VISIBILITY_DEFAULT AnalysisKey InnerAnalysisManagerProxy< AnalysisManagerT, IRUnitT, ExtraArgTs... >::Key
Target & getTheLoongArch32Target()
FunctionPass * createLoongArchISelDag(LoongArchTargetMachine &TM, CodeGenOptLevel OptLevel)
FunctionPass * createLoongArchPreRAExpandPseudoPass()
void initializeLoongArchOptWInstrsPass(PassRegistry &)
FunctionPass * createLoongArchExpandPseudoPass()
LLVM_ABI FunctionPass * createAtomicExpandLegacyPass()
AtomicExpandPass - At IR level this pass replace atomic instructions with __atomic_* library calls,...
BumpPtrAllocatorImpl<> BumpPtrAllocator
The standard BumpPtrAllocator which just uses the default template parameters.
Definition Allocator.h:383
void initializeLoongArchDeadRegisterDefinitionsPass(PassRegistry &)
FunctionPass * createLoongArchMergeBaseOffsetOptPass()
Returns an instance of the Merge Base Offset Optimization pass.
Implement std::hash so that hash_code can be used in STL containers.
Definition BitVector.h:860
MachineFunctionInfo - This class can be derived from and used by targets to hold private target-speci...
static FuncInfoTy * create(BumpPtrAllocator &Allocator, const Function &F, const SubtargetTy *STI)
Factory function: default behavior is to call new using the supplied allocator.
RegisterTargetMachine - Helper template for registering a target machine implementation,...