LLVM 23.0.0git
SystemZTargetMachine.cpp
Go to the documentation of this file.
1//===-- SystemZTargetMachine.cpp - Define TargetMachine for SystemZ -------===//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8
11#include "SystemZ.h"
17#include "llvm/ADT/StringRef.h"
19#include "llvm/CodeGen/Passes.h"
22#include "llvm/IR/DataLayout.h"
28#include <memory>
29#include <optional>
30#include <string>
31
32using namespace llvm;
33
35 "systemz-machine-combiner",
36 cl::desc("Enable the machine combiner pass"),
37 cl::init(true), cl::Hidden);
38
40 "generic-sched", cl::Hidden, cl::init(false),
41 cl::desc("Run the generic pre-ra scheduler instead of the SystemZ "
42 "scheduler."));
43
44// NOLINTNEXTLINE(readability-identifier-naming)
61
62static std::unique_ptr<TargetLoweringObjectFile> createTLOF(const Triple &TT) {
63 if (TT.isOSzOS())
64 return std::make_unique<TargetLoweringObjectFileGOFF>();
65
66 // Note: Some times run with -triple s390x-unknown.
67 // In this case, default to ELF unless z/OS specifically provided.
68 return std::make_unique<SystemZELFTargetObjectFile>();
69}
70
71static Reloc::Model getEffectiveRelocModel(std::optional<Reloc::Model> RM) {
72 // Static code is suitable for use in a dynamic executable; there is no
73 // separate DynamicNoPIC model.
74 if (!RM || *RM == Reloc::DynamicNoPIC)
75 return Reloc::Static;
76 return *RM;
77}
78
79// For SystemZ we define the models as follows:
80//
81// Small: BRASL can call any function and will use a stub if necessary.
82// Locally-binding symbols will always be in range of LARL.
83//
84// Medium: BRASL can call any function and will use a stub if necessary.
85// GOT slots and locally-defined text will always be in range
86// of LARL, but other symbols might not be.
87//
88// Large: Equivalent to Medium for now.
89//
90// Kernel: Equivalent to Medium for now.
91//
92// This means that any PIC module smaller than 4GB meets the
93// requirements of Small, so Small seems like the best default there.
94//
95// All symbols bind locally in a non-PIC module, so the choice is less
96// obvious. There are two cases:
97//
98// - When creating an executable, PLTs and copy relocations allow
99// us to treat external symbols as part of the executable.
100// Any executable smaller than 4GB meets the requirements of Small,
101// so that seems like the best default.
102//
103// - When creating JIT code, stubs will be in range of BRASL if the
104// image is less than 4GB in size. GOT entries will likewise be
105// in range of LARL. However, the JIT environment has no equivalent
106// of copy relocs, so locally-binding data symbols might not be in
107// the range of LARL. We need the Medium model in that case.
108static CodeModel::Model
109getEffectiveSystemZCodeModel(std::optional<CodeModel::Model> CM,
110 Reloc::Model RM, bool JIT) {
111 if (CM) {
112 if (*CM == CodeModel::Tiny)
113 report_fatal_error("Target does not support the tiny CodeModel", false);
114 if (*CM == CodeModel::Kernel)
115 report_fatal_error("Target does not support the kernel CodeModel", false);
116 return *CM;
117 }
118 if (JIT)
120 return CodeModel::Small;
121}
122
124 StringRef CPU, StringRef FS,
125 const TargetOptions &Options,
126 std::optional<Reloc::Model> RM,
127 std::optional<CodeModel::Model> CM,
128 CodeGenOptLevel OL, bool JIT)
130 T, TT.computeDataLayout(), TT, CPU, FS, Options,
133 OL),
134 TLOF(createTLOF(getTargetTriple())) {
135 initAsmInfo();
136}
137
139
140const SystemZSubtarget *
142 Attribute CPUAttr = F.getFnAttribute("target-cpu");
143 Attribute TuneAttr = F.getFnAttribute("tune-cpu");
144 Attribute FSAttr = F.getFnAttribute("target-features");
145
146 std::string CPU =
147 CPUAttr.isValid() ? CPUAttr.getValueAsString().str() : TargetCPU;
148 std::string TuneCPU =
149 TuneAttr.isValid() ? TuneAttr.getValueAsString().str() : CPU;
150 std::string FS =
151 FSAttr.isValid() ? FSAttr.getValueAsString().str() : TargetFS;
152
153 // FIXME: This is related to the code below to reset the target options,
154 // we need to know whether the soft float and backchain flags are set on the
155 // function, so we can enable them as subtarget features.
156 bool SoftFloat = F.getFnAttribute("use-soft-float").getValueAsBool();
157 if (SoftFloat)
158 FS += FS.empty() ? "+soft-float" : ",+soft-float";
159 bool BackChain = F.hasFnAttribute("backchain");
160 if (BackChain)
161 FS += FS.empty() ? "+backchain" : ",+backchain";
162
163 auto &I = SubtargetMap[CPU + TuneCPU + FS];
164 if (!I) {
165 // This needs to be done before we create a new subtarget since any
166 // creation will depend on the TM and the code generation flags on the
167 // function that reside in TargetOptions.
169 I = std::make_unique<SystemZSubtarget>(TargetTriple, CPU, TuneCPU, FS,
170 *this);
171 }
172
173 return I.get();
174}
175
178 // Use GenericScheduler if requested on CL or for Z10 which has no sched
179 // model.
180 if (GenericSched ||
181 !C->MF->getSubtarget().getSchedModel().hasInstrSchedModel())
182 return nullptr;
183
185}
186
191
192namespace {
193
194/// SystemZ Code Generator Pass Configuration Options.
195class SystemZPassConfig : public TargetPassConfig {
196public:
197 SystemZPassConfig(SystemZTargetMachine &TM, PassManagerBase &PM)
198 : TargetPassConfig(TM, PM) {}
199
200 SystemZTargetMachine &getSystemZTargetMachine() const {
202 }
203
204 void addIRPasses() override;
205 bool addInstSelector() override;
206 bool addILPOpts() override;
207 void addPreRegAlloc() override;
208 void addPostRewrite() override;
209 void addPostRegAlloc() override;
210 void addPreSched2() override;
211 void addPreEmitPass() override;
212};
213
214} // end anonymous namespace
215
216void SystemZPassConfig::addIRPasses() {
217 if (getOptLevel() != CodeGenOptLevel::None) {
218 addPass(createSystemZTDCPass());
220 }
221
223
225}
226
227bool SystemZPassConfig::addInstSelector() {
228 addPass(createSystemZISelDag(getSystemZTargetMachine(), getOptLevel()));
229
230 if (getOptLevel() != CodeGenOptLevel::None)
231 addPass(createSystemZLDCleanupPass(getSystemZTargetMachine()));
232
233 return false;
234}
235
236bool SystemZPassConfig::addILPOpts() {
237 addPass(&EarlyIfConverterLegacyID);
238
240 addPass(&MachineCombinerID);
241
242 return true;
243}
244
245void SystemZPassConfig::addPreRegAlloc() {
246 addPass(createSystemZCopyPhysRegsPass(getSystemZTargetMachine()));
247}
248
249void SystemZPassConfig::addPostRewrite() {
250 addPass(createSystemZPostRewritePass(getSystemZTargetMachine()));
251}
252
253void SystemZPassConfig::addPostRegAlloc() {
254 // PostRewrite needs to be run at -O0 also (in which case addPostRewrite()
255 // is not called).
256 if (getOptLevel() == CodeGenOptLevel::None)
257 addPass(createSystemZPostRewritePass(getSystemZTargetMachine()));
258}
259
260void SystemZPassConfig::addPreSched2() {
261 if (getOptLevel() != CodeGenOptLevel::None)
262 addPass(&IfConverterID);
263}
264
265void SystemZPassConfig::addPreEmitPass() {
266 // Do instruction shortening before compare elimination because some
267 // vector instructions will be shortened into opcodes that compare
268 // elimination recognizes.
269 if (getOptLevel() != CodeGenOptLevel::None)
270 addPass(createSystemZShortenInstPass(getSystemZTargetMachine()));
271
272 // We eliminate comparisons here rather than earlier because some
273 // transformations can change the set of available CC values and we
274 // generally want those transformations to have priority. This is
275 // especially true in the commonest case where the result of the comparison
276 // is used by a single in-range branch instruction, since we will then
277 // be able to fuse the compare and the branch instead.
278 //
279 // For example, two-address NILF can sometimes be converted into
280 // three-address RISBLG. NILF produces a CC value that indicates whether
281 // the low word is zero, but RISBLG does not modify CC at all. On the
282 // other hand, 64-bit ANDs like NILL can sometimes be converted to RISBG.
283 // The CC value produced by NILL isn't useful for our purposes, but the
284 // value produced by RISBG can be used for any comparison with zero
285 // (not just equality). So there are some transformations that lose
286 // CC values (while still being worthwhile) and others that happen to make
287 // the CC result more useful than it was originally.
288 //
289 // Another reason is that we only want to use BRANCH ON COUNT in cases
290 // where we know that the count register is not going to be spilled.
291 //
292 // Doing it so late makes it more likely that a register will be reused
293 // between the comparison and the branch, but it isn't clear whether
294 // preventing that would be a win or not.
295 if (getOptLevel() != CodeGenOptLevel::None)
296 addPass(createSystemZElimComparePass(getSystemZTargetMachine()));
297 addPass(createSystemZLongBranchPass(getSystemZTargetMachine()));
298
299 // Do final scheduling after all other optimizations, to get an
300 // optimal input for the decoder (branch relaxation must happen
301 // after block placement).
302 if (getOptLevel() != CodeGenOptLevel::None)
303 addPass(&PostMachineSchedulerID);
304}
305
307 return new SystemZPassConfig(*this, PM);
308}
309
312 return TargetTransformInfo(std::make_unique<SystemZTTIImpl>(this, F));
313}
314
static std::unique_ptr< TargetLoweringObjectFile > createTLOF(const Triple &TT)
static Reloc::Model getEffectiveRelocModel()
#define LLVM_ABI
Definition Compiler.h:213
#define LLVM_EXTERNAL_VISIBILITY
Definition Compiler.h:132
#define F(x, y, z)
Definition MD5.cpp:54
#define I(x, y, z)
Definition MD5.cpp:57
#define T
static cl::opt< bool > EnableMachineCombinerPass("ppc-machine-combiner", cl::desc("Enable the machine combiner pass"), cl::init(true), cl::Hidden)
const GCNTargetMachine & getTM(const GCNSubtarget *STI)
static CodeModel::Model getEffectiveSystemZCodeModel(std::optional< CodeModel::Model > CM, Reloc::Model RM, bool JIT)
static cl::opt< bool > GenericSched("generic-sched", cl::Hidden, cl::init(false), cl::desc("Run the generic pre-ra scheduler instead of the SystemZ " "scheduler."))
static cl::opt< bool > EnableMachineCombinerPass("systemz-machine-combiner", cl::desc("Enable the machine combiner pass"), cl::init(true), cl::Hidden)
LLVM_ABI LLVM_EXTERNAL_VISIBILITY void LLVMInitializeSystemZTarget()
static TableGen::Emitter::OptClass< SkeletonEmitter > X("gen-skeleton-class", "Generate example skeleton class")
Target-Independent Code Generator Pass Configuration Options pass.
This pass exposes codegen information to IR-level passes.
static std::unique_ptr< TargetLoweringObjectFile > createTLOF()
Functions, function parameters, and return types can have attributes to indicate how they should be t...
Definition Attributes.h:105
LLVM_ABI StringRef getValueAsString() const
Return the attribute's value as a string.
bool isValid() const
Return true if the attribute is any kind of attribute.
Definition Attributes.h:261
CodeGenTargetMachineImpl(const Target &T, StringRef DataLayoutString, const Triple &TT, StringRef CPU, StringRef FS, const TargetOptions &Options, Reloc::Model RM, CodeModel::Model CM, CodeGenOptLevel OL)
static LLVM_ABI PassRegistry * getPassRegistry()
getPassRegistry - Access the global registry object, which is automatically initialized at applicatio...
A ScheduleDAG for scheduling lists of MachineInstr.
StringRef - Represent a constant reference to a string, i.e.
Definition StringRef.h:55
std::string str() const
str - Get the contents as an std::string.
Definition StringRef.h:222
ScheduleDAGInstrs * createMachineScheduler(MachineSchedContext *C) const override
Create an instance of ScheduleDAGInstrs to be run within the standard MachineScheduler pass for this ...
const SystemZSubtarget * getSubtargetImpl() const =delete
SystemZTargetMachine(const Target &T, const Triple &TT, StringRef CPU, StringRef FS, const TargetOptions &Options, std::optional< Reloc::Model > RM, std::optional< CodeModel::Model > CM, CodeGenOptLevel OL, bool JIT)
TargetTransformInfo getTargetTransformInfo(const Function &F) const override
Get a TargetTransformInfo implementation for the target.
MachineFunctionInfo * createMachineFunctionInfo(BumpPtrAllocator &Allocator, const Function &F, const TargetSubtargetInfo *STI) const override
Create the target's instance of MachineFunctionInfo.
TargetPassConfig * createPassConfig(PassManagerBase &PM) override
Create a pass configuration object to be used by addPassToEmitX methods for generating a pipeline of ...
ScheduleDAGInstrs * createPostMachineScheduler(MachineSchedContext *C) const override
Similar to createMachineScheduler but used when postRA machine scheduling is enabled.
Triple TargetTriple
Triple string, CPU name, and target feature strings the TargetMachine instance is created with.
const Triple & getTargetTriple() const
std::unique_ptr< const MCSubtargetInfo > STI
TargetOptions Options
void resetTargetOptions(const Function &F) const
Reset the target options based on the function's attributes.
Target-Independent Code Generator Pass Configuration Options.
virtual void addIRPasses()
Add common target configurable passes that perform LLVM IR to IR transforms following machine indepen...
TargetSubtargetInfo - Generic base class for all target subtargets.
This pass provides access to the codegen interfaces that are needed for IR-level transformations.
Target - Wrapper for Target specific information.
Triple - Helper class for working with autoconf configuration names.
Definition Triple.h:47
PassManagerBase - An abstract interface to allow code to add passes to a pass manager without having ...
@ C
The default llvm calling convention, compatible with C.
Definition CallingConv.h:34
@ DynamicNoPIC
Definition CodeGen.h:25
initializer< Ty > init(const Ty &Val)
This is an optimization pass for GlobalISel generic memory operations.
Definition Types.h:26
ScheduleDAGMILive * createSchedLive(MachineSchedContext *C)
Create the standard converging machine scheduler.
Target & getTheSystemZTarget()
void initializeSystemZElimComparePass(PassRegistry &)
FunctionPass * createSystemZLongBranchPass(SystemZTargetMachine &TM)
FunctionPass * createSystemZISelDag(SystemZTargetMachine &TM, CodeGenOptLevel OptLevel)
FunctionPass * createSystemZCopyPhysRegsPass(SystemZTargetMachine &TM)
FunctionPass * createSystemZElimComparePass(SystemZTargetMachine &TM)
void initializeSystemZCopyPhysRegsPass(PassRegistry &)
LLVM_ABI char & PostMachineSchedulerID
PostMachineScheduler - This pass schedules machine instructions postRA.
void initializeSystemZLongBranchPass(PassRegistry &)
void initializeSystemZShortenInstPass(PassRegistry &)
LLVM_ABI char & EarlyIfConverterLegacyID
EarlyIfConverter - This pass performs if-conversion on SSA form by inserting cmov instructions.
LLVM_ABI char & MachineCombinerID
This pass performs instruction combining using trace metrics to estimate critical-path and resource d...
static Reloc::Model getEffectiveRelocModel(std::optional< Reloc::Model > RM)
void initializeSystemZDAGToDAGISelLegacyPass(PassRegistry &)
ScheduleDAGMI * createSchedPostRA(MachineSchedContext *C)
Create a generic scheduler with no vreg liveness or DAG mutation passes.
FunctionPass * createSystemZTDCPass()
LLVM_ABI FunctionPass * createLoopDataPrefetchPass()
LLVM_ABI void report_fatal_error(Error Err, bool gen_crash_diag=true)
Definition Error.cpp:163
FunctionPass * createSystemZShortenInstPass(SystemZTargetMachine &TM)
void initializeSystemZPostRewritePass(PassRegistry &)
CodeGenOptLevel
Code generation optimization level.
Definition CodeGen.h:82
void initializeSystemZTDCPassPass(PassRegistry &)
FunctionPass * createSystemZLDCleanupPass(SystemZTargetMachine &TM)
void initializeSystemZAsmPrinterPass(PassRegistry &)
FunctionPass * createSystemZPostRewritePass(SystemZTargetMachine &TM)
LLVM_ABI char & IfConverterID
IfConverter - This pass performs machine code if conversion.
LLVM_ABI FunctionPass * createAtomicExpandLegacyPass()
AtomicExpandPass - At IR level this pass replace atomic instructions with __atomic_* library calls,...
BumpPtrAllocatorImpl<> BumpPtrAllocator
The standard BumpPtrAllocator which just uses the default template parameters.
Definition Allocator.h:383
void initializeSystemZLDCleanupPass(PassRegistry &)
MachineFunctionInfo - This class can be derived from and used by targets to hold private target-speci...
static FuncInfoTy * create(BumpPtrAllocator &Allocator, const Function &F, const SubtargetTy *STI)
Factory function: default behavior is to call new using the supplied allocator.
MachineSchedContext provides enough context from the MachineScheduler pass for the target to instanti...
RegisterTargetMachine - Helper template for registering a target machine implementation,...