LLVM 20.0.0git
AArch64Subtarget.h
Go to the documentation of this file.
1//===--- AArch64Subtarget.h - Define Subtarget for the AArch64 -*- C++ -*--===//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8//
9// This file declares the AArch64 specific subclass of TargetSubtarget.
10//
11//===----------------------------------------------------------------------===//
12
13#ifndef LLVM_LIB_TARGET_AARCH64_AARCH64SUBTARGET_H
14#define LLVM_LIB_TARGET_AARCH64_AARCH64SUBTARGET_H
15
17#include "AArch64ISelLowering.h"
18#include "AArch64InstrInfo.h"
19#include "AArch64PointerAuth.h"
20#include "AArch64RegisterInfo.h"
28#include "llvm/IR/DataLayout.h"
29
30#define GET_SUBTARGETINFO_HEADER
31#include "AArch64GenSubtargetInfo.inc"
32
33namespace llvm {
34class GlobalValue;
35class StringRef;
36class Triple;
37
39public:
42#define ARM_PROCESSOR_FAMILY(ENUM) ENUM,
43#include "llvm/TargetParser/AArch64TargetParserDef.inc"
44#undef ARM_PROCESSOR_FAMILY
45 };
46
47protected:
48 /// ARMProcFamily - ARM processor family: Cortex-A53, Cortex-A57, and others.
50
51 // Enable 64-bit vectorization in SLP.
53
54// Bool members corresponding to the SubtargetFeatures defined in tablegen
55#define GET_SUBTARGETINFO_MACRO(ATTRIBUTE, DEFAULT, GETTER) \
56 bool ATTRIBUTE = DEFAULT;
57#include "AArch64GenSubtargetInfo.inc"
58
63 // Default scatter/gather overhead.
64 unsigned ScatterOverhead = 10;
65 unsigned GatherOverhead = 10;
68 unsigned MaxPrefetchIterationsAhead = UINT_MAX;
73 unsigned MaxJumpTableSize = 0;
74
75 // ReserveXRegister[i] - X#i is not available as a general purpose register.
77
78 // ReserveXRegisterForRA[i] - X#i is not available for register allocator.
80
81 // CustomCallUsedXRegister[i] - X#i call saved.
83
85
88 std::optional<unsigned> StreamingHazardSize;
91 unsigned VScaleForTuning = 1;
93
95
96 /// TargetTriple - What processor and OS we're targeting.
98
103
104 /// GlobalISel related APIs.
105 std::unique_ptr<CallLowering> CallLoweringInfo;
106 std::unique_ptr<InlineAsmLowering> InlineAsmLoweringInfo;
107 std::unique_ptr<InstructionSelector> InstSelector;
108 std::unique_ptr<LegalizerInfo> Legalizer;
109 std::unique_ptr<RegisterBankInfo> RegBankInfo;
110
111private:
112 /// initializeSubtargetDependencies - Initializes using CPUString and the
113 /// passed in feature string so that we can use initializer lists for
114 /// subtarget initialization.
115 AArch64Subtarget &initializeSubtargetDependencies(StringRef FS,
116 StringRef CPUString,
117 StringRef TuneCPUString,
118 bool HasMinSize);
119
120 /// Initialize properties based on the selected processor family.
121 void initializeProperties(bool HasMinSize);
122
123public:
124 /// This constructor initializes the data members to match that
125 /// of the specified triple.
126 AArch64Subtarget(const Triple &TT, StringRef CPU, StringRef TuneCPU,
127 StringRef FS, const TargetMachine &TM, bool LittleEndian,
128 unsigned MinSVEVectorSizeInBitsOverride = 0,
129 unsigned MaxSVEVectorSizeInBitsOverride = 0,
130 bool IsStreaming = false, bool IsStreamingCompatible = false,
131 bool HasMinSize = false);
132
133// Getters for SubtargetFeatures defined in tablegen
134#define GET_SUBTARGETINFO_MACRO(ATTRIBUTE, DEFAULT, GETTER) \
135 bool GETTER() const { return ATTRIBUTE; }
136#include "AArch64GenSubtargetInfo.inc"
137
139 return &TSInfo;
140 }
141 const AArch64FrameLowering *getFrameLowering() const override {
142 return &FrameLowering;
143 }
144 const AArch64TargetLowering *getTargetLowering() const override {
145 return &TLInfo;
146 }
147 const AArch64InstrInfo *getInstrInfo() const override { return &InstrInfo; }
148 const AArch64RegisterInfo *getRegisterInfo() const override {
149 return &getInstrInfo()->getRegisterInfo();
150 }
151 const CallLowering *getCallLowering() const override;
152 const InlineAsmLowering *getInlineAsmLowering() const override;
154 const LegalizerInfo *getLegalizerInfo() const override;
155 const RegisterBankInfo *getRegBankInfo() const override;
156 const Triple &getTargetTriple() const { return TargetTriple; }
157 bool enableMachineScheduler() const override { return true; }
158 bool enablePostRAScheduler() const override { return usePostRAScheduler(); }
159 bool enableSubRegLiveness() const override { return EnableSubregLiveness; }
160
161 bool enableMachinePipeliner() const override;
162 bool useDFAforSMS() const override { return false; }
163
164 /// Returns ARM processor family.
165 /// Avoid this function! CPU specifics should be kept local to this class
166 /// and preferably modeled with SubtargetFeatures or properties in
167 /// initializeProperties().
169 return ARMProcFamily;
170 }
171
172 bool isXRaySupported() const override { return true; }
173
174 /// Returns true if the function has a streaming body.
175 bool isStreaming() const { return IsStreaming; }
176
177 /// Returns true if the function has a streaming-compatible body.
179
180 /// Returns the size of memory region that if accessed by both the CPU and
181 /// the SME unit could result in a hazard. 0 = disabled.
182 unsigned getStreamingHazardSize() const {
183 return StreamingHazardSize.value_or(
184 !hasSMEFA64() && hasSME() && hasSVE() ? 1024 : 0);
185 }
186
187 /// Returns true if the target has NEON and the function at runtime is known
188 /// to have NEON enabled (e.g. the function is known not to be in streaming-SVE
189 /// mode, which disables NEON instructions).
190 bool isNeonAvailable() const {
191 return hasNEON() &&
192 (hasSMEFA64() || (!isStreaming() && !isStreamingCompatible()));
193 }
194
195 /// Returns true if the target has SVE and can use the full range of SVE
196 /// instructions, for example because it knows the function is known not to be
197 /// in streaming-SVE mode or when the target has FEAT_FA64 enabled.
198 bool isSVEAvailable() const {
199 return hasSVE() &&
200 (hasSMEFA64() || (!isStreaming() && !isStreamingCompatible()));
201 }
202
203 /// Returns true if the target has access to the streaming-compatible subset
204 /// of SVE instructions.
205 bool isStreamingSVEAvailable() const { return hasSME() && isStreaming(); }
206
207 /// Returns true if the target has access to either the full range of SVE
208 /// instructions, or the streaming-compatible subset of SVE instructions.
210 return hasSVE() || isStreamingSVEAvailable();
211 }
212
214 // Don't assume any minimum vector size when PSTATE.SM may not be 0, because
215 // we don't yet support streaming-compatible codegen support that we trust
216 // is safe for functions that may be executed in streaming-SVE mode.
217 // By returning '0' here, we disable vectorization.
218 if (!isSVEAvailable() && !isNeonAvailable())
219 return 0;
221 }
222
223 bool isXRegisterReserved(size_t i) const { return ReserveXRegister[i]; }
224 bool isXRegisterReservedForRA(size_t i) const { return ReserveXRegisterForRA[i]; }
225 unsigned getNumXRegisterReserved() const {
226 BitVector AllReservedX(AArch64::GPR64commonRegClass.getNumRegs());
227 AllReservedX |= ReserveXRegister;
228 AllReservedX |= ReserveXRegisterForRA;
229 return AllReservedX.count();
230 }
231 bool isLRReservedForRA() const { return ReserveLRForRA; }
232 bool isXRegCustomCalleeSaved(size_t i) const {
233 return CustomCallSavedXRegs[i];
234 }
236
237 /// Return true if the CPU supports any kind of instruction fusion.
238 bool hasFusion() const {
239 return hasArithmeticBccFusion() || hasArithmeticCbzFusion() ||
240 hasFuseAES() || hasFuseArithmeticLogic() || hasFuseCCSelect() ||
241 hasFuseAdrpAdd() || hasFuseLiterals();
242 }
243
246 }
247 unsigned getMaxInterleaveFactor() const { return MaxInterleaveFactor; }
248 unsigned getVectorInsertExtractBaseCost() const;
249 unsigned getCacheLineSize() const override { return CacheLineSize; }
250 unsigned getScatterOverhead() const { return ScatterOverhead; }
251 unsigned getGatherOverhead() const { return GatherOverhead; }
252 unsigned getPrefetchDistance() const override { return PrefetchDistance; }
253 unsigned getMinPrefetchStride(unsigned NumMemAccesses,
254 unsigned NumStridedMemAccesses,
255 unsigned NumPrefetches,
256 bool HasCall) const override {
257 return MinPrefetchStride;
258 }
259 unsigned getMaxPrefetchIterationsAhead() const override {
261 }
264 }
266
269 }
270
271 unsigned getMaximumJumpTableSize() const { return MaxJumpTableSize; }
272 unsigned getMinimumJumpTableEntries() const {
274 }
275
276 /// CPU has TBI (top byte of addresses is ignored during HW address
277 /// translation) and OS enables it.
279
280 bool isLittleEndian() const { return IsLittle; }
281
282 bool isTargetDarwin() const { return TargetTriple.isOSDarwin(); }
283 bool isTargetIOS() const { return TargetTriple.isiOS(); }
284 bool isTargetLinux() const { return TargetTriple.isOSLinux(); }
285 bool isTargetWindows() const { return TargetTriple.isOSWindows(); }
286 bool isTargetAndroid() const { return TargetTriple.isAndroid(); }
287 bool isTargetFuchsia() const { return TargetTriple.isOSFuchsia(); }
289
290 bool isTargetCOFF() const { return TargetTriple.isOSBinFormatCOFF(); }
291 bool isTargetELF() const { return TargetTriple.isOSBinFormatELF(); }
293
294 bool isTargetILP32() const {
295 return TargetTriple.isArch32Bit() ||
297 }
298
299 bool useAA() const override;
300
301 bool addrSinkUsingGEPs() const override {
302 // Keeping GEPs inbounds is important for exploiting AArch64
303 // addressing-modes in ILP32 mode.
304 return useAA() || isTargetILP32();
305 }
306
307 bool useSmallAddressing() const {
310 // Kernel is currently allowed only for Fuchsia targets,
311 // where it is the same as Small for almost all purposes.
312 case CodeModel::Small:
313 return true;
314 default:
315 return false;
316 }
317 }
318
319 /// ParseSubtargetFeatures - Parses features string setting specified
320 /// subtarget options. Definition of function is auto generated by tblgen.
322
323 /// ClassifyGlobalReference - Find the target operand flags that describe
324 /// how a global value should be referenced for the current subtarget.
325 unsigned ClassifyGlobalReference(const GlobalValue *GV,
326 const TargetMachine &TM) const;
327
329 const TargetMachine &TM) const;
330
331 /// This function is design to compatible with the function def in other
332 /// targets and escape build error about the virtual function def in base
333 /// class TargetSubtargetInfo. Updeate me if AArch64 target need to use it.
334 unsigned char
336 return 0;
337 }
338
340 unsigned NumRegionInstrs) const override;
341 void adjustSchedDependency(SUnit *Def, int DefOpIdx, SUnit *Use, int UseOpIdx,
342 SDep &Dep,
343 const TargetSchedModel *SchedModel) const override;
344
345 bool enableEarlyIfConversion() const override;
346
347 std::unique_ptr<PBQPRAConstraint> getCustomPBQPConstraints() const override;
348
349 bool isCallingConvWin64(CallingConv::ID CC, bool IsVarArg) const {
350 switch (CC) {
351 case CallingConv::C:
355 return isTargetWindows();
357 return IsVarArg && isTargetWindows();
359 return true;
360 default:
361 return false;
362 }
363 }
364
365 /// Return whether FrameLowering should always set the "extended frame
366 /// present" bit in FP, or set it based on a symbol in the runtime.
368 // Older OS versions (particularly system unwinders) are confused by the
369 // Swift extended frame, so when building code that might be run on them we
370 // must dynamically query the concurrency library to determine whether
371 // extended frames should be flagged as present.
372 const Triple &TT = getTargetTriple();
373
374 unsigned Major = TT.getOSVersion().getMajor();
375 switch(TT.getOS()) {
376 default:
377 return false;
378 case Triple::IOS:
379 case Triple::TvOS:
380 return Major < 15;
381 case Triple::WatchOS:
382 return Major < 8;
383 case Triple::MacOSX:
384 case Triple::Darwin:
385 return Major < 12;
386 }
387 }
388
389 void mirFileLoaded(MachineFunction &MF) const override;
390
391 // Return the known range for the bit length of SVE data registers. A value
392 // of 0 means nothing is known about that particular limit beyong what's
393 // implied by the architecture.
394 unsigned getMaxSVEVectorSizeInBits() const {
396 "Tried to get SVE vector length without SVE support!");
398 }
399
400 unsigned getMinSVEVectorSizeInBits() const {
402 "Tried to get SVE vector length without SVE support!");
404 }
405
408 return false;
409
410 // Prefer NEON unless larger SVE registers are available.
411 return !isNeonAvailable() || getMinSVEVectorSizeInBits() >= 256;
412 }
413
416 return false;
419 }
420
421 unsigned getVScaleForTuning() const { return VScaleForTuning; }
422
424 return DefaultSVETFOpts;
425 }
426
427 /// Returns true to use the addvl/inc/dec instructions, as opposed to separate
428 /// add + cnt instructions.
429 bool useScalarIncVL() const;
430
431 const char* getChkStkName() const {
432 if (isWindowsArm64EC())
433 return "#__chkstk_arm64ec";
434 return "__chkstk";
435 }
436
437 const char* getSecurityCheckCookieName() const {
438 if (isWindowsArm64EC())
439 return "#__security_check_cookie_arm64ec";
440 return "__security_check_cookie";
441 }
442
443 /// Choose a method of checking LR before performing a tail call.
446
447 /// Compute the integer discriminator for a given BlockAddress constant, if
448 /// blockaddress signing is enabled, or std::nullopt otherwise.
449 /// Blockaddress signing is controlled by the function attribute
450 /// "ptrauth-indirect-gotos" on the parent function.
451 /// Note that this assumes the discriminator is independent of the indirect
452 /// goto branch site itself, i.e., it's the same for all BlockAddresses in
453 /// a function.
454 std::optional<uint16_t>
456};
457} // End llvm namespace
458
459#endif
This file describes how to lower LLVM calls to machine code calls.
This file describes how to lower LLVM inline asm to machine code INLINEASM.
Interface for Targets to specify which operations they can successfully select and how the others sho...
assert(ImpDefSCC.getReg()==AMDGPU::SCC &&ImpDefSCC.isDef())
const AArch64RegisterInfo & getRegisterInfo() const
getRegisterInfo - TargetInstrInfo is a superset of MRegister info.
const AArch64SelectionDAGInfo * getSelectionDAGInfo() const override
const CallLowering * getCallLowering() const override
const AArch64RegisterInfo * getRegisterInfo() const override
bool isNeonAvailable() const
Returns true if the target has NEON and the function at runtime is known to have NEON enabled (e....
bool isLRReservedForRA() const
TailFoldingOpts DefaultSVETFOpts
unsigned getMinPrefetchStride(unsigned NumMemAccesses, unsigned NumStridedMemAccesses, unsigned NumPrefetches, bool HasCall) const override
bool addrSinkUsingGEPs() const override
std::unique_ptr< InstructionSelector > InstSelector
ARMProcFamilyEnum ARMProcFamily
ARMProcFamily - ARM processor family: Cortex-A53, Cortex-A57, and others.
unsigned getMinimumJumpTableEntries() const
std::unique_ptr< RegisterBankInfo > RegBankInfo
bool useSVEForFixedLengthVectors(EVT VT) const
const AArch64InstrInfo * getInstrInfo() const override
bool useSmallAddressing() const
bool hasFusion() const
Return true if the CPU supports any kind of instruction fusion.
AArch64SelectionDAGInfo TSInfo
const char * getSecurityCheckCookieName() const
unsigned getMaximumJumpTableSize() const
std::optional< unsigned > StreamingHazardSize
void overrideSchedPolicy(MachineSchedPolicy &Policy, unsigned NumRegionInstrs) const override
AArch64FrameLowering FrameLowering
bool enableEarlyIfConversion() const override
const InlineAsmLowering * getInlineAsmLowering() const override
unsigned getCacheLineSize() const override
unsigned getVectorInsertExtractBaseCost() const
bool enableMachinePipeliner() const override
ARMProcFamilyEnum getProcFamily() const
Returns ARM processor family.
std::unique_ptr< CallLowering > CallLoweringInfo
GlobalISel related APIs.
std::optional< uint16_t > getPtrAuthBlockAddressDiscriminatorIfEnabled(const Function &ParentFn) const
Compute the integer discriminator for a given BlockAddress constant, if blockaddress signing is enabl...
unsigned getGatherOverhead() const
bool isXRegisterReservedForRA(size_t i) const
unsigned getNumXRegisterReserved() const
unsigned classifyGlobalFunctionReference(const GlobalValue *GV, const TargetMachine &TM) const
bool useAA() const override
bool isStreamingSVEAvailable() const
Returns true if the target has access to the streaming-compatible subset of SVE instructions.
const AArch64TargetLowering * getTargetLowering() const override
Align getPrefLoopAlignment() const
Align getPrefFunctionAlignment() const
unsigned getMaxBytesForLoopAlignment() const
bool supportsAddressTopByteIgnored() const
CPU has TBI (top byte of addresses is ignored during HW address translation) and OS enables it.
unsigned getMaxInterleaveFactor() const
unsigned char classifyGlobalFunctionReference(const GlobalValue *GV) const override
This function is design to compatible with the function def in other targets and escape build error a...
const Triple & getTargetTriple() const
unsigned getStreamingHazardSize() const
Returns the size of memory region that if accessed by both the CPU and the SME unit could result in a...
bool isStreamingCompatible() const
Returns true if the function has a streaming-compatible body.
const char * getChkStkName() const
bool isXRegCustomCalleeSaved(size_t i) const
void adjustSchedDependency(SUnit *Def, int DefOpIdx, SUnit *Use, int UseOpIdx, SDep &Dep, const TargetSchedModel *SchedModel) const override
void mirFileLoaded(MachineFunction &MF) const override
Triple TargetTriple
TargetTriple - What processor and OS we're targeting.
InstructionSelector * getInstructionSelector() const override
bool isSVEorStreamingSVEAvailable() const
Returns true if the target has access to either the full range of SVE instructions,...
bool enableSubRegLiveness() const override
TailFoldingOpts getSVETailFoldingDefaultOpts() const
bool useSVEForFixedLengthVectors() const
unsigned ClassifyGlobalReference(const GlobalValue *GV, const TargetMachine &TM) const
ClassifyGlobalReference - Find the target operand flags that describe how a global value should be re...
void ParseSubtargetFeatures(StringRef CPU, StringRef TuneCPU, StringRef FS)
ParseSubtargetFeatures - Parses features string setting specified subtarget options.
unsigned getMinVectorRegisterBitWidth() const
bool isStreaming() const
Returns true if the function has a streaming body.
bool isXRegisterReserved(size_t i) const
unsigned getMaxPrefetchIterationsAhead() const override
bool useScalarIncVL() const
Returns true to use the addvl/inc/dec instructions, as opposed to separate add + cnt instructions.
bool useDFAforSMS() const override
const LegalizerInfo * getLegalizerInfo() const override
bool enableMachineScheduler() const override
unsigned getScatterOverhead() const
bool enablePostRAScheduler() const override
std::unique_ptr< PBQPRAConstraint > getCustomPBQPConstraints() const override
unsigned getEpilogueVectorizationMinVF() const
unsigned getMaxSVEVectorSizeInBits() const
bool isCallingConvWin64(CallingConv::ID CC, bool IsVarArg) const
unsigned getVScaleForTuning() const
unsigned getMinSVEVectorSizeInBits() const
AArch64PAuth::AuthCheckMethod getAuthenticatedLRCheckMethod(const MachineFunction &MF) const
Choose a method of checking LR before performing a tail call.
AArch64InstrInfo InstrInfo
AArch64TargetLowering TLInfo
const RegisterBankInfo * getRegBankInfo() const override
std::unique_ptr< LegalizerInfo > Legalizer
std::unique_ptr< InlineAsmLowering > InlineAsmLoweringInfo
bool isXRaySupported() const override
bool isSVEAvailable() const
Returns true if the target has SVE and can use the full range of SVE instructions,...
bool hasCustomCallingConv() const
const AArch64FrameLowering * getFrameLowering() const override
bool swiftAsyncContextIsDynamicallySet() const
Return whether FrameLowering should always set the "extended frame present" bit in FP,...
unsigned getPrefetchDistance() const override
size_type count() const
count - Returns the number of bits which are set.
Definition: BitVector.h:162
bool any() const
any - Returns true if any bit is set.
Definition: BitVector.h:170
Holds all the information related to register banks.
Scheduling dependency.
Definition: ScheduleDAG.h:49
Scheduling unit. This is a node in the scheduling DAG.
Definition: ScheduleDAG.h:242
StringRef - Represent a constant reference to a string, i.e.
Definition: StringRef.h:51
const TargetMachine & getTargetMachine() const
Primary interface to the complete machine description for the target machine.
Definition: TargetMachine.h:77
CodeModel::Model getCodeModel() const
Returns the code model.
Provide an instruction scheduling machine model to CodeGen passes.
Triple - Helper class for working with autoconf configuration names.
Definition: Triple.h:44
bool isAndroid() const
Tests whether the target is Android.
Definition: Triple.h:797
bool isOSBinFormatMachO() const
Tests whether the environment is MachO.
Definition: Triple.h:760
bool isOSBinFormatCOFF() const
Tests whether the OS uses the COFF binary format.
Definition: Triple.h:752
EnvironmentType getEnvironment() const
Get the parsed environment type of this triple.
Definition: Triple.h:412
bool isOSWindows() const
Tests whether the OS is Windows.
Definition: Triple.h:652
bool isOSLinux() const
Tests whether the OS is Linux.
Definition: Triple.h:706
bool isOSDarwin() const
Is this a "Darwin" OS (macOS, iOS, tvOS, watchOS, XROS, or DriverKit).
Definition: Triple.h:585
bool isWindowsArm64EC() const
Definition: Triple.h:668
bool isiOS() const
Is this an iOS triple.
Definition: Triple.h:553
bool isArch32Bit() const
Test whether the architecture is 32-bit.
Definition: Triple.cpp:1718
bool isOSFuchsia() const
Definition: Triple.h:615
bool isOSBinFormatELF() const
Tests whether the OS uses the ELF binary format.
Definition: Triple.h:747
A Use represents the edge between a Value definition and its users.
Definition: Use.h:43
AuthCheckMethod
Variants of check performed on an authenticated pointer.
static constexpr unsigned SVEBitsPerBlock
@ Swift
Calling convention for Swift.
Definition: CallingConv.h:69
@ Fast
Attempts to make calls as fast as possible (e.g.
Definition: CallingConv.h:41
@ PreserveNone
Used for runtime calls that preserves none general registers.
Definition: CallingConv.h:90
@ Win64
The C convention as implemented on Windows/x86-64 and AArch64.
Definition: CallingConv.h:159
@ SwiftTail
This follows the Swift calling convention in how arguments are passed but guarantees tail calls will ...
Definition: CallingConv.h:87
@ C
The default llvm calling convention, compatible with C.
Definition: CallingConv.h:34
This is an optimization pass for GlobalISel generic memory operations.
Definition: AddressRanges.h:18
TailFoldingOpts
An enum to describe what types of loops we should attempt to tail-fold: Disabled: None Reductions: Lo...
This struct is a compact representation of a valid (non-zero power of two) alignment.
Definition: Alignment.h:39
Extended Value Type.
Definition: ValueTypes.h:35
uint64_t getFixedSizeInBits() const
Return the size of the specified fixed width value type in bits.
Definition: ValueTypes.h:376
bool isFixedLengthVector() const
Definition: ValueTypes.h:181
Define a generic scheduling policy for targets that don't provide their own MachineSchedStrategy.