LLVM 22.0.0git
AArch64Subtarget.h
Go to the documentation of this file.
1//===--- AArch64Subtarget.h - Define Subtarget for the AArch64 -*- C++ -*--===//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8//
9// This file declares the AArch64 specific subclass of TargetSubtarget.
10//
11//===----------------------------------------------------------------------===//
12
13#ifndef LLVM_LIB_TARGET_AARCH64_AARCH64SUBTARGET_H
14#define LLVM_LIB_TARGET_AARCH64_AARCH64SUBTARGET_H
15
17#include "AArch64ISelLowering.h"
18#include "AArch64InstrInfo.h"
19#include "AArch64PointerAuth.h"
20#include "AArch64RegisterInfo.h"
28#include "llvm/IR/DataLayout.h"
30
31#define GET_SUBTARGETINFO_HEADER
32#include "AArch64GenSubtargetInfo.inc"
33
34namespace llvm {
35class GlobalValue;
36class StringRef;
37
39public:
42#define ARM_PROCESSOR_FAMILY(ENUM) ENUM,
43#include "llvm/TargetParser/AArch64TargetParserDef.inc"
44#undef ARM_PROCESSOR_FAMILY
45 };
46
47protected:
48 /// ARMProcFamily - ARM processor family: Cortex-A53, Cortex-A57, and others.
50
51 // Enable 64-bit vectorization in SLP.
53
54// Bool members corresponding to the SubtargetFeatures defined in tablegen
55#define GET_SUBTARGETINFO_MACRO(ATTRIBUTE, DEFAULT, GETTER) \
56 bool ATTRIBUTE = DEFAULT;
57#include "AArch64GenSubtargetInfo.inc"
58
63 // Default scatter/gather overhead.
64 unsigned ScatterOverhead = 10;
65 unsigned GatherOverhead = 10;
68 unsigned MaxPrefetchIterationsAhead = UINT_MAX;
73 unsigned MaxJumpTableSize = 0;
74
75 // ReserveXRegister[i] - X#i is not available as a general purpose register.
77
78 // ReserveXRegisterForRA[i] - X#i is not available for register allocator.
80
81 // CustomCallUsedXRegister[i] - X#i call saved.
83
85
88 std::optional<unsigned> StreamingHazardSize;
91 unsigned VScaleForTuning = 1;
93
95
96 /// TargetTriple - What processor and OS we're targeting.
98
103
104 /// GlobalISel related APIs.
105 std::unique_ptr<CallLowering> CallLoweringInfo;
106 std::unique_ptr<InlineAsmLowering> InlineAsmLoweringInfo;
107 std::unique_ptr<InstructionSelector> InstSelector;
108 std::unique_ptr<LegalizerInfo> Legalizer;
109 std::unique_ptr<RegisterBankInfo> RegBankInfo;
110
111private:
112 /// initializeSubtargetDependencies - Initializes using CPUString and the
113 /// passed in feature string so that we can use initializer lists for
114 /// subtarget initialization.
115 AArch64Subtarget &initializeSubtargetDependencies(StringRef FS,
116 StringRef CPUString,
117 StringRef TuneCPUString,
118 bool HasMinSize);
119
120 /// Initialize properties based on the selected processor family.
121 void initializeProperties(bool HasMinSize);
122
123public:
124 /// This constructor initializes the data members to match that
125 /// of the specified triple.
126 AArch64Subtarget(const Triple &TT, StringRef CPU, StringRef TuneCPU,
127 StringRef FS, const TargetMachine &TM, bool LittleEndian,
128 unsigned MinSVEVectorSizeInBitsOverride = 0,
129 unsigned MaxSVEVectorSizeInBitsOverride = 0,
130 bool IsStreaming = false, bool IsStreamingCompatible = false,
131 bool HasMinSize = false);
132
133// Getters for SubtargetFeatures defined in tablegen
134#define GET_SUBTARGETINFO_MACRO(ATTRIBUTE, DEFAULT, GETTER) \
135 bool GETTER() const { return ATTRIBUTE; }
136#include "AArch64GenSubtargetInfo.inc"
137
139 return &TSInfo;
140 }
141 const AArch64FrameLowering *getFrameLowering() const override {
142 return &FrameLowering;
143 }
144 const AArch64TargetLowering *getTargetLowering() const override {
145 return &TLInfo;
146 }
147 const AArch64InstrInfo *getInstrInfo() const override { return &InstrInfo; }
148 const AArch64RegisterInfo *getRegisterInfo() const override {
149 return &getInstrInfo()->getRegisterInfo();
150 }
151 const CallLowering *getCallLowering() const override;
152 const InlineAsmLowering *getInlineAsmLowering() const override;
154 const LegalizerInfo *getLegalizerInfo() const override;
155 const RegisterBankInfo *getRegBankInfo() const override;
156 const Triple &getTargetTriple() const { return TargetTriple; }
157 bool enableMachineScheduler() const override { return true; }
158 bool enablePostRAScheduler() const override { return usePostRAScheduler(); }
159 bool enableSubRegLiveness() const override { return EnableSubregLiveness; }
160
161 bool enableMachinePipeliner() const override;
162 bool useDFAforSMS() const override { return false; }
163
164 /// Returns ARM processor family.
165 /// Avoid this function! CPU specifics should be kept local to this class
166 /// and preferably modeled with SubtargetFeatures or properties in
167 /// initializeProperties().
169 return ARMProcFamily;
170 }
171
172 bool isXRaySupported() const override { return true; }
173
174 /// Returns true if the function has a streaming body.
175 bool isStreaming() const { return IsStreaming; }
176
177 /// Returns true if the function has a streaming-compatible body.
179
180 /// Returns the size of memory region that if accessed by both the CPU and
181 /// the SME unit could result in a hazard. 0 = disabled.
182 unsigned getStreamingHazardSize() const {
183 return StreamingHazardSize.value_or(
184 !hasSMEFA64() && hasSME() && hasSVE() ? 1024 : 0);
185 }
186
187 /// Returns true if the target has NEON and the function at runtime is known
188 /// to have NEON enabled (e.g. the function is known not to be in streaming-SVE
189 /// mode, which disables NEON instructions).
190 bool isNeonAvailable() const {
191 return hasNEON() &&
192 (hasSMEFA64() || (!isStreaming() && !isStreamingCompatible()));
193 }
194
195 /// Returns true if the target has SVE and can use the full range of SVE
196 /// instructions, for example because it knows the function is known not to be
197 /// in streaming-SVE mode or when the target has FEAT_FA64 enabled.
198 bool isSVEAvailable() const {
199 return hasSVE() &&
200 (hasSMEFA64() || (!isStreaming() && !isStreamingCompatible()));
201 }
202
203 /// Returns true if the target has access to the streaming-compatible subset
204 /// of SVE instructions.
205 bool isStreamingSVEAvailable() const { return hasSME() && isStreaming(); }
206
207 /// Returns true if the target has access to either the full range of SVE
208 /// instructions, or the streaming-compatible subset of SVE instructions.
210 return hasSVE() || isStreamingSVEAvailable();
211 }
212
213 /// Returns true if the target has access to either the full range of SVE
214 /// instructions, or the streaming-compatible subset of SVE instructions
215 /// available to SME2.
217 return isSVEAvailable() || (isSVEorStreamingSVEAvailable() && hasSME2());
218 }
219
221 // Don't assume any minimum vector size when PSTATE.SM may not be 0, because
222 // we don't yet support streaming-compatible codegen support that we trust
223 // is safe for functions that may be executed in streaming-SVE mode.
224 // By returning '0' here, we disable vectorization.
225 if (!isSVEAvailable() && !isNeonAvailable())
226 return 0;
228 }
229
230 bool isXRegisterReserved(size_t i) const { return ReserveXRegister[i]; }
231 bool isXRegisterReservedForRA(size_t i) const { return ReserveXRegisterForRA[i]; }
232 unsigned getNumXRegisterReserved() const {
233 BitVector AllReservedX(AArch64::GPR64commonRegClass.getNumRegs());
234 AllReservedX |= ReserveXRegister;
235 AllReservedX |= ReserveXRegisterForRA;
236 return AllReservedX.count();
237 }
238 bool isLRReservedForRA() const { return ReserveLRForRA; }
239 bool isXRegCustomCalleeSaved(size_t i) const {
240 return CustomCallSavedXRegs[i];
241 }
242 bool hasCustomCallingConv() const { return CustomCallSavedXRegs.any(); }
243
244 /// Return true if the CPU supports any kind of instruction fusion.
245 bool hasFusion() const {
246 return hasArithmeticBccFusion() || hasArithmeticCbzFusion() ||
247 hasFuseAES() || hasFuseArithmeticLogic() || hasFuseCmpCSel() ||
248 hasFuseCmpCSet() || hasFuseAdrpAdd() || hasFuseLiterals();
249 }
250
253 }
254 unsigned getMaxInterleaveFactor() const { return MaxInterleaveFactor; }
255 unsigned getVectorInsertExtractBaseCost() const;
256 unsigned getCacheLineSize() const override { return CacheLineSize; }
257 unsigned getScatterOverhead() const { return ScatterOverhead; }
258 unsigned getGatherOverhead() const { return GatherOverhead; }
259 unsigned getPrefetchDistance() const override { return PrefetchDistance; }
260 unsigned getMinPrefetchStride(unsigned NumMemAccesses,
261 unsigned NumStridedMemAccesses,
262 unsigned NumPrefetches,
263 bool HasCall) const override {
264 return MinPrefetchStride;
265 }
266 unsigned getMaxPrefetchIterationsAhead() const override {
268 }
273
276 }
277
278 unsigned getMaximumJumpTableSize() const { return MaxJumpTableSize; }
279 unsigned getMinimumJumpTableEntries() const {
281 }
282
283 /// CPU has TBI (top byte of addresses is ignored during HW address
284 /// translation) and OS enables it.
286
287 bool isLittleEndian() const { return IsLittle; }
288
289 bool isTargetDarwin() const { return TargetTriple.isOSDarwin(); }
290 bool isTargetIOS() const { return TargetTriple.isiOS(); }
291 bool isTargetLinux() const { return TargetTriple.isOSLinux(); }
292 bool isTargetWindows() const { return TargetTriple.isOSWindows(); }
293 bool isTargetAndroid() const { return TargetTriple.isAndroid(); }
294 bool isTargetFuchsia() const { return TargetTriple.isOSFuchsia(); }
295 bool isWindowsArm64EC() const { return TargetTriple.isWindowsArm64EC(); }
296
297 bool isTargetCOFF() const { return TargetTriple.isOSBinFormatCOFF(); }
298 bool isTargetELF() const { return TargetTriple.isOSBinFormatELF(); }
299 bool isTargetMachO() const { return TargetTriple.isOSBinFormatMachO(); }
300
301 bool isTargetILP32() const {
302 return TargetTriple.isArch32Bit() ||
303 TargetTriple.getEnvironment() == Triple::GNUILP32;
304 }
305
306 bool useAA() const override;
307
308 bool addrSinkUsingGEPs() const override {
309 // Keeping GEPs inbounds is important for exploiting AArch64
310 // addressing-modes in ILP32 mode.
311 return useAA() || isTargetILP32();
312 }
313
314 bool useSmallAddressing() const {
315 switch (TLInfo.getTargetMachine().getCodeModel()) {
317 // Kernel is currently allowed only for Fuchsia targets,
318 // where it is the same as Small for almost all purposes.
319 case CodeModel::Small:
320 return true;
321 default:
322 return false;
323 }
324 }
325
326 /// Returns whether the operating system makes it safer to store sensitive
327 /// values in x16 and x17 as opposed to other registers.
328 bool isX16X17Safer() const;
329
330 /// ParseSubtargetFeatures - Parses features string setting specified
331 /// subtarget options. Definition of function is auto generated by tblgen.
333
334 /// ClassifyGlobalReference - Find the target operand flags that describe
335 /// how a global value should be referenced for the current subtarget.
336 unsigned ClassifyGlobalReference(const GlobalValue *GV,
337 const TargetMachine &TM) const;
338
340 const TargetMachine &TM) const;
341
342 /// This function is design to compatible with the function def in other
343 /// targets and escape build error about the virtual function def in base
344 /// class TargetSubtargetInfo. Updeate me if AArch64 target need to use it.
345 unsigned char
347 return 0;
348 }
349
351 const SchedRegion &Region) const override;
352
353 void adjustSchedDependency(SUnit *Def, int DefOpIdx, SUnit *Use, int UseOpIdx,
354 SDep &Dep,
355 const TargetSchedModel *SchedModel) const override;
356
357 bool enableEarlyIfConversion() const override;
358
359 std::unique_ptr<PBQPRAConstraint> getCustomPBQPConstraints() const override;
360
361 bool isCallingConvWin64(CallingConv::ID CC, bool IsVarArg) const {
362 switch (CC) {
363 case CallingConv::C:
367 return isTargetWindows();
369 return IsVarArg && isTargetWindows();
371 return true;
372 default:
373 return false;
374 }
375 }
376
377 /// Return whether FrameLowering should always set the "extended frame
378 /// present" bit in FP, or set it based on a symbol in the runtime.
380 // Older OS versions (particularly system unwinders) are confused by the
381 // Swift extended frame, so when building code that might be run on them we
382 // must dynamically query the concurrency library to determine whether
383 // extended frames should be flagged as present.
384 const Triple &TT = getTargetTriple();
385
386 unsigned Major = TT.getOSVersion().getMajor();
387 switch(TT.getOS()) {
388 default:
389 return false;
390 case Triple::IOS:
391 case Triple::TvOS:
392 return Major < 15;
393 case Triple::WatchOS:
394 return Major < 8;
395 case Triple::MacOSX:
396 case Triple::Darwin:
397 return Major < 12;
398 }
399 }
400
401 void mirFileLoaded(MachineFunction &MF) const override;
402
403 // Return the known range for the bit length of SVE data registers. A value
404 // of 0 means nothing is known about that particular limit beyond what's
405 // implied by the architecture.
406 unsigned getMaxSVEVectorSizeInBits() const {
408 "Tried to get SVE vector length without SVE support!");
410 }
411
412 unsigned getMinSVEVectorSizeInBits() const {
414 "Tried to get SVE vector length without SVE support!");
416 }
417
418 // Return the known bit length of SVE data registers. A value of 0 means the
419 // length is unknown beyond what's implied by the architecture.
420 unsigned getSVEVectorSizeInBits() const {
422 "Tried to get SVE vector length without SVE support!");
425 return 0;
426 }
427
430 return false;
431
432 // Prefer NEON unless larger SVE registers are available.
433 return !isNeonAvailable() || getMinSVEVectorSizeInBits() >= 256;
434 }
435
438 return false;
441 }
442
443 unsigned getVScaleForTuning() const { return VScaleForTuning; }
444
448
449 /// Returns true to use the addvl/inc/dec instructions, as opposed to separate
450 /// add + cnt instructions.
451 bool useScalarIncVL() const;
452
453 const char* getChkStkName() const {
454 if (isWindowsArm64EC())
455 return "#__chkstk_arm64ec";
456 return "__chkstk";
457 }
458
459 /// Choose a method of checking LR before performing a tail call.
462
463 /// Compute the integer discriminator for a given BlockAddress constant, if
464 /// blockaddress signing is enabled, or std::nullopt otherwise.
465 /// Blockaddress signing is controlled by the function attribute
466 /// "ptrauth-indirect-gotos" on the parent function.
467 /// Note that this assumes the discriminator is independent of the indirect
468 /// goto branch site itself, i.e., it's the same for all BlockAddresses in
469 /// a function.
470 std::optional<uint16_t>
472};
473} // End llvm namespace
474
475#endif
assert(UImm &&(UImm !=~static_cast< T >(0)) &&"Invalid immediate!")
This file describes how to lower LLVM calls to machine code calls.
This file describes how to lower LLVM inline asm to machine code INLINEASM.
Interface for Targets to specify which operations they can successfully select and how the others sho...
const AArch64RegisterInfo & getRegisterInfo() const
getRegisterInfo - TargetInstrInfo is a superset of MRegister info.
AArch64Subtarget(const Triple &TT, StringRef CPU, StringRef TuneCPU, StringRef FS, const TargetMachine &TM, bool LittleEndian, unsigned MinSVEVectorSizeInBitsOverride=0, unsigned MaxSVEVectorSizeInBitsOverride=0, bool IsStreaming=false, bool IsStreamingCompatible=false, bool HasMinSize=false)
This constructor initializes the data members to match that of the specified triple.
const AArch64SelectionDAGInfo * getSelectionDAGInfo() const override
const CallLowering * getCallLowering() const override
const AArch64RegisterInfo * getRegisterInfo() const override
bool isNeonAvailable() const
Returns true if the target has NEON and the function at runtime is known to have NEON enabled (e....
TailFoldingOpts DefaultSVETFOpts
unsigned getMinPrefetchStride(unsigned NumMemAccesses, unsigned NumStridedMemAccesses, unsigned NumPrefetches, bool HasCall) const override
bool addrSinkUsingGEPs() const override
std::unique_ptr< InstructionSelector > InstSelector
ARMProcFamilyEnum ARMProcFamily
ARMProcFamily - ARM processor family: Cortex-A53, Cortex-A57, and others.
unsigned getMinimumJumpTableEntries() const
std::unique_ptr< RegisterBankInfo > RegBankInfo
bool useSVEForFixedLengthVectors(EVT VT) const
const AArch64InstrInfo * getInstrInfo() const override
bool hasFusion() const
Return true if the CPU supports any kind of instruction fusion.
AArch64SelectionDAGInfo TSInfo
unsigned getMaximumJumpTableSize() const
std::optional< unsigned > StreamingHazardSize
AArch64FrameLowering FrameLowering
bool enableEarlyIfConversion() const override
const InlineAsmLowering * getInlineAsmLowering() const override
unsigned getCacheLineSize() const override
unsigned getVectorInsertExtractBaseCost() const
bool enableMachinePipeliner() const override
ARMProcFamilyEnum getProcFamily() const
Returns ARM processor family.
std::unique_ptr< CallLowering > CallLoweringInfo
GlobalISel related APIs.
std::optional< uint16_t > getPtrAuthBlockAddressDiscriminatorIfEnabled(const Function &ParentFn) const
Compute the integer discriminator for a given BlockAddress constant, if blockaddress signing is enabl...
unsigned getGatherOverhead() const
bool isXRegisterReservedForRA(size_t i) const
unsigned getNumXRegisterReserved() const
unsigned classifyGlobalFunctionReference(const GlobalValue *GV, const TargetMachine &TM) const
bool useAA() const override
bool isStreamingSVEAvailable() const
Returns true if the target has access to the streaming-compatible subset of SVE instructions.
const AArch64TargetLowering * getTargetLowering() const override
Align getPrefLoopAlignment() const
Align getPrefFunctionAlignment() const
unsigned getMaxBytesForLoopAlignment() const
bool isNonStreamingSVEorSME2Available() const
Returns true if the target has access to either the full range of SVE instructions,...
bool supportsAddressTopByteIgnored() const
CPU has TBI (top byte of addresses is ignored during HW address translation) and OS enables it.
unsigned getMaxInterleaveFactor() const
void overrideSchedPolicy(MachineSchedPolicy &Policy, const SchedRegion &Region) const override
unsigned char classifyGlobalFunctionReference(const GlobalValue *GV) const override
This function is design to compatible with the function def in other targets and escape build error a...
const Triple & getTargetTriple() const
unsigned getStreamingHazardSize() const
Returns the size of memory region that if accessed by both the CPU and the SME unit could result in a...
bool isStreamingCompatible() const
Returns true if the function has a streaming-compatible body.
const char * getChkStkName() const
bool isXRegCustomCalleeSaved(size_t i) const
void adjustSchedDependency(SUnit *Def, int DefOpIdx, SUnit *Use, int UseOpIdx, SDep &Dep, const TargetSchedModel *SchedModel) const override
void mirFileLoaded(MachineFunction &MF) const override
Triple TargetTriple
TargetTriple - What processor and OS we're targeting.
InstructionSelector * getInstructionSelector() const override
bool isSVEorStreamingSVEAvailable() const
Returns true if the target has access to either the full range of SVE instructions,...
bool enableSubRegLiveness() const override
TailFoldingOpts getSVETailFoldingDefaultOpts() const
bool useSVEForFixedLengthVectors() const
unsigned ClassifyGlobalReference(const GlobalValue *GV, const TargetMachine &TM) const
ClassifyGlobalReference - Find the target operand flags that describe how a global value should be re...
void ParseSubtargetFeatures(StringRef CPU, StringRef TuneCPU, StringRef FS)
ParseSubtargetFeatures - Parses features string setting specified subtarget options.
unsigned getMinVectorRegisterBitWidth() const
bool isStreaming() const
Returns true if the function has a streaming body.
bool isX16X17Safer() const
Returns whether the operating system makes it safer to store sensitive values in x16 and x17 as oppos...
unsigned getSVEVectorSizeInBits() const
bool isXRegisterReserved(size_t i) const
unsigned getMaxPrefetchIterationsAhead() const override
bool useScalarIncVL() const
Returns true to use the addvl/inc/dec instructions, as opposed to separate add + cnt instructions.
bool useDFAforSMS() const override
const LegalizerInfo * getLegalizerInfo() const override
bool enableMachineScheduler() const override
unsigned getScatterOverhead() const
bool enablePostRAScheduler() const override
std::unique_ptr< PBQPRAConstraint > getCustomPBQPConstraints() const override
unsigned getEpilogueVectorizationMinVF() const
unsigned getMaxSVEVectorSizeInBits() const
bool isCallingConvWin64(CallingConv::ID CC, bool IsVarArg) const
unsigned getVScaleForTuning() const
unsigned getMinSVEVectorSizeInBits() const
AArch64PAuth::AuthCheckMethod getAuthenticatedLRCheckMethod(const MachineFunction &MF) const
Choose a method of checking LR before performing a tail call.
AArch64InstrInfo InstrInfo
AArch64TargetLowering TLInfo
const RegisterBankInfo * getRegBankInfo() const override
std::unique_ptr< LegalizerInfo > Legalizer
std::unique_ptr< InlineAsmLowering > InlineAsmLoweringInfo
bool isXRaySupported() const override
bool isSVEAvailable() const
Returns true if the target has SVE and can use the full range of SVE instructions,...
bool hasCustomCallingConv() const
const AArch64FrameLowering * getFrameLowering() const override
bool swiftAsyncContextIsDynamicallySet() const
Return whether FrameLowering should always set the "extended framepresent" bit in FP,...
unsigned getPrefetchDistance() const override
size_type count() const
count - Returns the number of bits which are set.
Definition BitVector.h:181
Holds all the information related to register banks.
Scheduling dependency.
Definition ScheduleDAG.h:51
Scheduling unit. This is a node in the scheduling DAG.
StringRef - Represent a constant reference to a string, i.e.
Definition StringRef.h:55
Primary interface to the complete machine description for the target machine.
Provide an instruction scheduling machine model to CodeGen passes.
Triple - Helper class for working with autoconf configuration names.
Definition Triple.h:47
A Use represents the edge between a Value definition and its users.
Definition Use.h:35
AuthCheckMethod
Variants of check performed on an authenticated pointer.
static constexpr unsigned SVEBitsPerBlock
unsigned ID
LLVM IR allows to use arbitrary numbers as calling convention identifiers.
Definition CallingConv.h:24
@ Swift
Calling convention for Swift.
Definition CallingConv.h:69
@ Fast
Attempts to make calls as fast as possible (e.g.
Definition CallingConv.h:41
@ PreserveNone
Used for runtime calls that preserves none general registers.
Definition CallingConv.h:90
@ Win64
The C convention as implemented on Windows/x86-64 and AArch64.
@ SwiftTail
This follows the Swift calling convention in how arguments are passed but guarantees tail calls will ...
Definition CallingConv.h:87
@ C
The default llvm calling convention, compatible with C.
Definition CallingConv.h:34
This is an optimization pass for GlobalISel generic memory operations.
TailFoldingOpts
An enum to describe what types of loops we should attempt to tail-fold: Disabled: None Reductions: Lo...
This struct is a compact representation of a valid (non-zero power of two) alignment.
Definition Alignment.h:39
Extended Value Type.
Definition ValueTypes.h:35
uint64_t getFixedSizeInBits() const
Return the size of the specified fixed width value type in bits.
Definition ValueTypes.h:381
bool isFixedLengthVector() const
Definition ValueTypes.h:181
Define a generic scheduling policy for targets that don't provide their own MachineSchedStrategy.
A region of an MBB for scheduling.