LLVM: lib/Target/AArch64/AArch64Subtarget.cpp Source File

//===-- AArch64Subtarget.cpp - AArch64 Subtarget Information ----*- C++ -*-===//

//

// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.

// See https://llvm.org/LICENSE.txt for license information.

// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception

//

//===----------------------------------------------------------------------===//

//

// This file implements the AArch64 specific subclass of TargetSubtarget.

//

//===----------------------------------------------------------------------===//


#include "AArch64Subtarget.h"


#include "AArch64.h"

#include "AArch64InstrInfo.h"

#include "AArch64PBQPRegAlloc.h"

#include "AArch64TargetMachine.h"

#include "GISel/AArch64CallLowering.h"

#include "GISel/AArch64LegalizerInfo.h"

#include "GISel/AArch64RegisterBankInfo.h"

#include "MCTargetDesc/AArch64AddressingModes.h"

#include "llvm/CodeGen/GlobalISel/InstructionSelect.h"

#include "llvm/CodeGen/MachineFrameInfo.h"

#include "llvm/CodeGen/MachineScheduler.h"

#include "llvm/IR/GlobalValue.h"

#include "llvm/Support/SipHash.h"

#include "llvm/TargetParser/AArch64TargetParser.h"


using namespace llvm;


#define DEBUG_TYPE "aarch64-subtarget"


#define GET_SUBTARGETINFO_CTOR

#define GET_SUBTARGETINFO_TARGET_DESC

#include "AArch64GenSubtargetInfo.inc"


// Value returned by AArch64Subtarget::enableEarlyIfConversion(); defaults to
// true.
static cl::opt<bool>

EnableEarlyIfConvert("aarch64-early-ifcvt", cl::desc("Enable the early if "

                     "converter pass"), cl::init(true), cl::Hidden);


// If OS supports TBI, use this flag to enable it.

// Consulted first by supportsAddressTopByteIgnored(); when left at its default
// of false that query always answers false.
static cl::opt<bool>

UseAddressTopByteIgnored("aarch64-use-tbi", cl::desc("Assume that top byte of "

                         "an address is ignored"), cl::init(false), cl::Hidden);


// On Mach-O, classifyGlobalFunctionReference() only applies its NonLazyBind
// GOT rule when this flag is set; other object formats always apply it.
static cl::opt<bool> MachOUseNonLazyBind(

    "aarch64-macho-enable-nonlazybind",

    cl::desc("Call nonlazybind functions via direct GOT load for Mach-O"),

    cl::Hidden);


// Value returned by AArch64Subtarget::useAA(); defaults to true.
static cl::opt<bool> UseAA("aarch64-use-aa", cl::init(true),

                           cl::desc("Enable the use of AA during codegen."));


// When given on the command line, getVectorInsertExtractBaseCost() returns
// this value instead of the per-CPU VectorInsertExtractBaseCost.
static cl::opt<unsigned> OverrideVectorInsertExtractBaseCost(

    "aarch64-insert-extract-base-cost",

    cl::desc("Base cost of vector insert/extract element"), cl::Hidden);


// Reserve a list of X# registers, so they are unavailable for register

// allocator, but can still be used as ABI requests, such as passing arguments

// to function call.

// The subtarget constructor matches the listed names against X0-X28 and the
// X29/FP and X30/LR spellings, recording hits in ReserveXRegisterForRA.
static cl::list<std::string>

ReservedRegsForRA("reserve-regs-for-regalloc", cl::desc("Reserve physical "

                  "registers, so they can't be used by register allocator. "

                  "Should only be used for testing register allocator."),

                  cl::CommaSeparated, cl::Hidden);


// Explicit override consulted by getAuthenticatedLRCheckMethod(); it is only
// honoured when the option actually occurs on the command line.
static cl::opt<AArch64PAuth::AuthCheckMethod>

    AuthenticatedLRCheckMethod("aarch64-authenticated-lr-check-method",

                               cl::Hidden,

                               cl::desc("Override the variant of check applied "

                                        "to authenticated LR during tail call"),

                               cl::values(AUTH_CHECK_METHOD_CL_VALUES_LR));


// Copied into MinimumJumpTableEntries by initializeProperties() when the
// option is given explicitly or when HasMinSize is false.
static cl::opt<unsigned> AArch64MinimumJumpTableEntries(

    "aarch64-min-jump-table-entries", cl::init(13), cl::Hidden,

    cl::desc("Set minimum number of entries to use a jump table on AArch64"));


// Only an explicit occurrence of this option populates StreamingHazardSize in
// the subtarget constructor; otherwise that member is std::nullopt.
static cl::opt<unsigned> AArch64StreamingHazardSize(

    "aarch64-streaming-hazard-size",

    cl::desc("Hazard size for streaming mode memory accesses. 0 = disabled."),

    cl::init(0), cl::Hidden);


// Second spelling of -aarch64-streaming-hazard-size.
static cl::alias AArch64StreamingStackHazardSize(

    "aarch64-stack-hazard-size",

    cl::desc("alias for -aarch64-streaming-hazard-size"),

    cl::aliasopt(AArch64StreamingHazardSize));


// Read by getHwModeSet(): together with a streaming or streaming-compatible
// function it selects the SMEWithZPRPredicateSpills hardware mode.
static cl::opt<bool> EnableZPRPredicateSpills(

    "aarch64-enable-zpr-predicate-spills", cl::init(false), cl::Hidden,

    cl::desc(

        "Enables spilling/reloading SVE predicates as data vectors (ZPRs)"));


// Subreg liveness tracking is disabled by default for now until all issues

// are ironed out. This option allows the feature to be used in tests.

// The subtarget constructor copies the value into EnableSubregLiveness.
static cl::opt<bool>

    EnableSubregLivenessTracking("aarch64-enable-subreg-liveness-tracking",

                                 cl::init(false), cl::Hidden,

                                 cl::desc("Enable subreg liveness tracking"));


// An explicit setting wins in useScalarIncVL(); without one the answer is
// derived from hasSVE2() / hasSME().
static cl::opt<bool>

    UseScalarIncVL("sve-use-scalar-inc-vl", cl::init(false), cl::Hidden,

                   cl::desc("Prefer add+cnt over addvl/inc/dec"));


/// Returns the base cost of a vector insert/extract element operation.
///
/// The per-CPU VectorInsertExtractBaseCost is used unless
/// -aarch64-insert-extract-base-cost was passed explicitly, in which case the
/// command-line value takes precedence.
unsigned AArch64Subtarget::getVectorInsertExtractBaseCost() const {
  unsigned Cost = VectorInsertExtractBaseCost;
  if (OverrideVectorInsertExtractBaseCost.getNumOccurrences() > 0)
    Cost = OverrideVectorInsertExtractBaseCost;
  return Cost;
}


/// Resolves the CPU / tuning-CPU names, parses the feature string and applies
/// the per-CPU tuning properties.
///
/// \param FS            subtarget feature string.
/// \param CPUString     CPU name; an empty name is treated as "generic".
/// \param TuneCPUString tuning CPU name; an empty name falls back to the
///                      (possibly defaulted) CPU name.
/// \param HasMinSize    forwarded to initializeProperties().
/// \returns *this, so the call can be used inside a member initializer.
AArch64Subtarget &AArch64Subtarget::initializeSubtargetDependencies(
    StringRef FS, StringRef CPUString, StringRef TuneCPUString,
    bool HasMinSize) {
  // Determine default and user-specified characteristics.
  const StringRef CPUName =
      CPUString.empty() ? StringRef("generic") : CPUString;
  const StringRef TuneName = TuneCPUString.empty() ? CPUName : TuneCPUString;

  ParseSubtargetFeatures(CPUName, TuneName, FS);
  initializeProperties(HasMinSize);
  return *this;
}


/// Applies the CPU-specific tuning defaults selected by ARMProcFamily and then
/// settles the minimum jump-table entry count.
///
/// We should add a tablegen feature for these properties in the future so they
/// can be specified together with the subtarget features.
///
/// \param HasMinSize when true, -aarch64-min-jump-table-entries is applied
///        only if the option was given explicitly on the command line.
void AArch64Subtarget::initializeProperties(bool HasMinSize) {
  switch (ARMProcFamily) {
  case Generic:
    // With TuneCPU=generic, ldapur instructions are avoided to line up with
    // the CPUs that use the AvoidLDAPUR feature. This is not meant to stay on
    // forever, so it is enabled between armv8.4 and armv8.7/armv9.2.
    if (hasV8_4aOps() && !hasV8_8aOps())
      AvoidLDAPUR = true;
    break;

  case Carmel:
    CacheLineSize = 64;
    break;

  case CortexA35:
  case CortexA53:
  case CortexA55:
  case CortexR82:
  case CortexR82AE:
    PrefFunctionAlignment = Align(16);
    PrefLoopAlignment = Align(16);
    MaxBytesForLoopAlignment = 8;
    break;

  case CortexA57:
    PrefFunctionAlignment = Align(16);
    PrefLoopAlignment = Align(16);
    MaxBytesForLoopAlignment = 8;
    MaxInterleaveFactor = 4;
    break;

  case CortexA65:
    PrefFunctionAlignment = Align(8);
    break;

  case CortexA72:
  case CortexA73:
  case CortexA75:
    PrefFunctionAlignment = Align(16);
    PrefLoopAlignment = Align(16);
    MaxBytesForLoopAlignment = 8;
    break;

  case CortexA76:
  case CortexA77:
  case CortexA78:
  case CortexA78AE:
  case CortexA78C:
  case CortexX1:
    PrefFunctionAlignment = Align(16);
    PrefLoopAlignment = Align(32);
    MaxBytesForLoopAlignment = 16;
    break;

  case CortexA510:
  case CortexA520:
    PrefFunctionAlignment = Align(16);
    PrefLoopAlignment = Align(16);
    MaxBytesForLoopAlignment = 8;
    VScaleForTuning = 1;
    break;

  case CortexA710:
  case CortexA715:
  case CortexA720:
  case CortexA725:
  case CortexX2:
  case CortexX3:
  case CortexX4:
  case CortexX925:
    PrefFunctionAlignment = Align(16);
    PrefLoopAlignment = Align(32);
    MaxBytesForLoopAlignment = 16;
    VScaleForTuning = 1;
    break;

  case A64FX:
    PrefFunctionAlignment = Align(8);
    PrefLoopAlignment = Align(4);
    MaxInterleaveFactor = 4;
    VScaleForTuning = 4;
    CacheLineSize = 256;
    PrefetchDistance = 128;
    MinPrefetchStride = 1024;
    MaxPrefetchIterationsAhead = 4;
    break;

  case MONAKA:
    VScaleForTuning = 2;
    break;

  case AppleA7:
  case AppleA10:
  case AppleA11:
  case AppleA12:
  case AppleA13:
  case AppleA14:
  case AppleA15:
  case AppleA16:
  case AppleA17:
  case AppleM4:
    CacheLineSize = 64;
    PrefetchDistance = 280;
    MinPrefetchStride = 2048;
    MaxPrefetchIterationsAhead = 3;
    // Only these members of the Apple group raise the interleave factor.
    if (ARMProcFamily == AppleA14 || ARMProcFamily == AppleA15 ||
        ARMProcFamily == AppleA16 || ARMProcFamily == AppleA17 ||
        ARMProcFamily == AppleM4)
      MaxInterleaveFactor = 4;
    break;

  case ExynosM3:
    PrefFunctionAlignment = Align(32);
    PrefLoopAlignment = Align(16);
    MaxInterleaveFactor = 4;
    MaxJumpTableSize = 20;
    break;

  case Falkor:
    MaxInterleaveFactor = 4;
    // FIXME: remove this to enable 64-bit SLP if performance looks good.
    MinVectorRegisterBitWidth = 128;
    CacheLineSize = 128;
    PrefetchDistance = 820;
    MinPrefetchStride = 2048;
    MaxPrefetchIterationsAhead = 8;
    break;

  case Kryo:
    MaxInterleaveFactor = 4;
    VectorInsertExtractBaseCost = 2;
    // FIXME: remove this to enable 64-bit SLP if performance looks good.
    MinVectorRegisterBitWidth = 128;
    CacheLineSize = 128;
    PrefetchDistance = 740;
    MinPrefetchStride = 1024;
    MaxPrefetchIterationsAhead = 11;
    break;

  case NeoverseE1:
    PrefFunctionAlignment = Align(8);
    break;

  case NeoverseN1:
    PrefFunctionAlignment = Align(16);
    PrefLoopAlignment = Align(32);
    MaxBytesForLoopAlignment = 16;
    break;

  case NeoverseV2:
  case NeoverseV3:
    // V2/V3 add vectorizer knobs on top of the N2/N3 settings below.
    MaxInterleaveFactor = 4;
    EpilogueVectorizationMinVF = 8;
    ScatterOverhead = 13;
    LLVM_FALLTHROUGH;
  case NeoverseN2:
  case NeoverseN3:
    PrefFunctionAlignment = Align(16);
    PrefLoopAlignment = Align(32);
    MaxBytesForLoopAlignment = 16;
    VScaleForTuning = 1;
    break;

  case NeoverseV1:
    PrefFunctionAlignment = Align(16);
    PrefLoopAlignment = Align(32);
    MaxBytesForLoopAlignment = 16;
    VScaleForTuning = 2;
    DefaultSVETFOpts = TailFoldingOpts::Simple;
    break;

  case Neoverse512TVB:
    PrefFunctionAlignment = Align(16);
    MaxInterleaveFactor = 4;
    VScaleForTuning = 1;
    break;

  case Saphira:
    MaxInterleaveFactor = 4;
    // FIXME: remove this to enable 64-bit SLP if performance looks good.
    MinVectorRegisterBitWidth = 128;
    break;

  case ThunderX2T99:
    PrefFunctionAlignment = Align(8);
    PrefLoopAlignment = Align(4);
    MaxInterleaveFactor = 4;
    // FIXME: remove this to enable 64-bit SLP if performance looks good.
    MinVectorRegisterBitWidth = 128;
    CacheLineSize = 64;
    PrefetchDistance = 128;
    MinPrefetchStride = 1024;
    MaxPrefetchIterationsAhead = 4;
    break;

  case ThunderX:
  case ThunderXT88:
  case ThunderXT81:
  case ThunderXT83:
    PrefFunctionAlignment = Align(8);
    PrefLoopAlignment = Align(4);
    // FIXME: remove this to enable 64-bit SLP if performance looks good.
    MinVectorRegisterBitWidth = 128;
    CacheLineSize = 128;
    break;

  case TSV110:
    PrefFunctionAlignment = Align(16);
    PrefLoopAlignment = Align(4);
    CacheLineSize = 64;
    break;

  case ThunderX3T110:
    PrefFunctionAlignment = Align(16);
    PrefLoopAlignment = Align(4);
    MaxInterleaveFactor = 4;
    // FIXME: remove this to enable 64-bit SLP if performance looks good.
    MinVectorRegisterBitWidth = 128;
    CacheLineSize = 64;
    PrefetchDistance = 128;
    MinPrefetchStride = 1024;
    MaxPrefetchIterationsAhead = 4;
    break;

  case Ampere1:
  case Ampere1A:
  case Ampere1B:
    PrefFunctionAlignment = Align(64);
    PrefLoopAlignment = Align(64);
    MaxInterleaveFactor = 4;
    CacheLineSize = 64;
    break;

  case Oryon:
    PrefFunctionAlignment = Align(16);
    MaxInterleaveFactor = 4;
    CacheLineSize = 64;
    PrefetchDistance = 128;
    MinPrefetchStride = 1024;
    break;
  }

  // An explicit -aarch64-min-jump-table-entries always applies; the option's
  // default value is applied only when HasMinSize is false.
  const bool ThresholdGivenExplicitly =
      AArch64MinimumJumpTableEntries.getNumOccurrences() > 0;
  if (ThresholdGivenExplicitly || !HasMinSize)
    MinimumJumpTableEntries = AArch64MinimumJumpTableEntries;
}


/// Constructs the subtarget for triple \p TT.
///
/// The member initializers parse the CPU / feature strings (through
/// initializeSubtargetDependencies) before InstrInfo and TLInfo are built. The
/// body then creates the GlobalISel helper objects and records which X
/// registers were requested via -reserve-regs-for-regalloc.
AArch64Subtarget::AArch64Subtarget(const Triple &TT, StringRef CPU,
                                   StringRef TuneCPU, StringRef FS,
                                   const TargetMachine &TM, bool LittleEndian,
                                   unsigned MinSVEVectorSizeInBitsOverride,
                                   unsigned MaxSVEVectorSizeInBitsOverride,
                                   bool IsStreaming, bool IsStreamingCompatible,
                                   bool HasMinSize)
    : AArch64GenSubtargetInfo(TT, CPU, TuneCPU, FS),
      ReserveXRegister(AArch64::GPR64commonRegClass.getNumRegs()),
      ReserveXRegisterForRA(AArch64::GPR64commonRegClass.getNumRegs()),
      CustomCallSavedXRegs(AArch64::GPR64commonRegClass.getNumRegs()),
      IsLittle(LittleEndian), IsStreaming(IsStreaming),
      IsStreamingCompatible(IsStreamingCompatible),
      StreamingHazardSize(
          AArch64StreamingHazardSize.getNumOccurrences() > 0
              ? std::optional<unsigned>(AArch64StreamingHazardSize)
              : std::nullopt),
      MinSVEVectorSizeInBits(MinSVEVectorSizeInBitsOverride),
      MaxSVEVectorSizeInBits(MaxSVEVectorSizeInBitsOverride), TargetTriple(TT),
      InstrInfo(initializeSubtargetDependencies(FS, CPU, TuneCPU, HasMinSize)),
      TLInfo(TM, *this) {
  // Some platforms reserve X18 by default.
  if (AArch64::isX18ReservedByDefault(TT))
    ReserveXRegister.set(18);

  // GlobalISel helper objects.
  CallLoweringInfo =
      std::make_unique<AArch64CallLowering>(*getTargetLowering());
  InlineAsmLoweringInfo =
      std::make_unique<InlineAsmLowering>(getTargetLowering());
  Legalizer = std::make_unique<AArch64LegalizerInfo>(*this);

  // The register bank info is handed to the instruction selector before the
  // subtarget takes ownership of it.
  // FIXME: At this point, we can't rely on Subtarget having RBI.
  // It's awkward to mix passing RBI and the Subtarget; should we pass
  // TII/TRI as well?
  auto *BankInfo = new AArch64RegisterBankInfo(*getRegisterInfo());
  InstSelector.reset(createAArch64InstructionSelector(
      *static_cast<const AArch64TargetMachine *>(&TM), *this, *BankInfo));
  RegBankInfo.reset(BankInfo);

  // Collect the register names requested on the command line.
  StringSet<> RequestedNames;
  RequestedNames.insert(ReservedRegsForRA.begin(), ReservedRegsForRA.end());
  const auto IsRequested = [&RequestedNames](StringRef Name) {
    return RequestedNames.count(Name) != 0;
  };

  // X0..X28 can be matched through the register info's own names.
  const auto *RegInfo = getRegisterInfo();
  for (unsigned RegNo = 0; RegNo != 29; ++RegNo)
    if (IsRequested(RegInfo->getName(AArch64::X0 + RegNo)))
      ReserveXRegisterForRA.set(RegNo);

  // X30 is named LR, so the register info's name cannot be used to check X30.
  if (IsRequested("X30") || IsRequested("LR"))
    ReserveXRegisterForRA.set(30);

  // X29 is named FP, so the register info's name cannot be used to check X29.
  if (IsRequested("X29") || IsRequested("FP"))
    ReserveXRegisterForRA.set(29);

  EnableSubregLiveness = EnableSubregLivenessTracking.getValue();
}


unsigned AArch64Subtarget::getHwModeSet() const {

  AArch64HwModeBits Modes = AArch64HwModeBits::DefaultMode;


  // Use a special hardware mode in streaming[-compatible] functions with

  // aarch64-enable-zpr-predicate-spills. This changes the spill size (and

  // alignment) for the predicate register class.

  if (EnableZPRPredicateSpills.getValue() &&

      (isStreaming() || isStreamingCompatible())) {

    Modes |= AArch64HwModeBits::SMEWithZPRPredicateSpills;

  }


  return to_underlying(Modes);

}


/// GlobalISel hook: returns the call-lowering object created by the
/// constructor. The subtarget keeps ownership.
const CallLowering *AArch64Subtarget::getCallLowering() const {
  const CallLowering *Lowering = CallLoweringInfo.get();
  return Lowering;
}


/// GlobalISel hook: returns the inline-asm lowering object created by the
/// constructor. The subtarget keeps ownership.
const InlineAsmLowering *AArch64Subtarget::getInlineAsmLowering() const {
  const InlineAsmLowering *Lowering = InlineAsmLoweringInfo.get();
  return Lowering;
}


/// GlobalISel hook: returns the instruction selector created by the
/// constructor. The subtarget keeps ownership.
InstructionSelector *AArch64Subtarget::getInstructionSelector() const {
  InstructionSelector *Selector = InstSelector.get();
  return Selector;
}


/// GlobalISel hook: returns the legalizer info created by the constructor.
/// The subtarget keeps ownership.
const LegalizerInfo *AArch64Subtarget::getLegalizerInfo() const {
  const LegalizerInfo *Info = Legalizer.get();
  return Info;
}


/// GlobalISel hook: returns the register bank info created by the
/// constructor. The subtarget keeps ownership.
const RegisterBankInfo *AArch64Subtarget::getRegBankInfo() const {
  const RegisterBankInfo *Banks = RegBankInfo.get();
  return Banks;
}


/// Computes the AArch64II target operand flags that describe how the global
/// value \p GV must be referenced on this subtarget.
///
/// \param GV the global being referenced.
/// \param TM supplies the code model and the DSO-local assumption.
/// \returns a combination of AArch64II::MO_* flags.
unsigned
AArch64Subtarget::ClassifyGlobalReference(const GlobalValue *GV,
                                          const TargetMachine &TM) const {
  const auto CM = TM.getCodeModel();

  // The Mach-O large model always goes via a GOT, simply to get a single
  // 8-byte absolute relocation on all global addresses.
  if (CM == CodeModel::Large && isTargetMachO())
    return AArch64II::MO_GOT;

  // All globals dynamically protected by MTE must have their address tags
  // synthesized. The loader stashes the tag in the GOT entry, so every tagged
  // global (even one with internal linkage) is forced through the GOT.
  if (GV->isTagged())
    return AArch64II::MO_GOT;

  // Anything that may live in another DSO is reached through the GOT; on
  // Windows the access is additionally marked as dllimport or COFF stub.
  if (!TM.shouldAssumeDSOLocal(GV)) {
    unsigned Flags = AArch64II::MO_GOT;
    if (GV->hasDLLImportStorageClass())
      Flags |= AArch64II::MO_DLLIMPORT;
    else if (getTargetTriple().isOSWindows())
      Flags |= AArch64II::MO_COFFSTUB;
    return Flags;
  }

  // The small code model's direct accesses use ADRP, which cannot necessarily
  // produce the value 0 (if the code is above 4GB). The same holds for the
  // tiny code model, where a pc-relative LDR is used.
  if ((useSmallAddressing() || CM == CodeModel::Tiny) &&
      GV->hasExternalWeakLinkage())
    return AArch64II::MO_GOT;

  // References to tagged globals are marked with MO_NC | MO_TAGGED to indicate
  // that their nominal addresses are tagged and outside of the code model. In
  // AArch64ExpandPseudo::expandMI an additional instruction is emitted to set
  // the tag if necessary, based on MO_TAGGED.
  if (AllowTaggedGlobals && !isa<FunctionType>(GV->getValueType()))
    return AArch64II::MO_NC | AArch64II::MO_TAGGED;

  return AArch64II::MO_NO_FLAG;
}


/// Computes the AArch64II target operand flags to use when referencing \p GV
/// as a function (for example as a call target).
///
/// \param GV the global being referenced.
/// \param TM supplies the code model and the DSO-local assumption.
/// \returns a combination of AArch64II::MO_* flags.
unsigned AArch64Subtarget::classifyGlobalFunctionReference(
    const GlobalValue *GV, const TargetMachine &TM) const {
  // The Mach-O large model always goes via a GOT, because the relocations
  // needed to do anything else are not available.
  if (TM.getCodeModel() == CodeModel::Large && isTargetMachO() &&
      !GV->hasInternalLinkage())
    return AArch64II::MO_GOT;

  // NonLazyBind goes via the GOT unless the function is known to be available
  // locally. On Mach-O this only applies when explicitly enabled.
  const auto *Fn = dyn_cast<Function>(GV);
  const bool NonLazyBindApplies = !isTargetMachO() || MachOUseNonLazyBind;
  if (NonLazyBindApplies && Fn && Fn->hasFnAttribute(Attribute::NonLazyBind) &&
      !TM.shouldAssumeDSOLocal(GV))
    return AArch64II::MO_GOT;

  // Nothing else to decide outside of Windows.
  if (!getTargetTriple().isOSWindows())
    return AArch64II::MO_NO_FLAG;

  if (isWindowsArm64EC() && GV->getValueType()->isFunctionTy()) {
    // On Arm64EC, a symbol called directly from the import table uses
    // MO_ARM64EC_CALLMANGLE on top of the dllimport GOT access.
    if (GV->hasDLLImportStorageClass())
      return AArch64II::MO_GOT | AArch64II::MO_DLLIMPORT |
             AArch64II::MO_ARM64EC_CALLMANGLE;

    // A symbol that is called directly uses the mangled form in the call
    // instruction.
    if (GV->hasExternalLinkage())
      return AArch64II::MO_ARM64EC_CALLMANGLE;
  }

  // ClassifyGlobalReference takes care of MO_DLLIMPORT / MO_COFFSTUB.
  return ClassifyGlobalReference(GV, TM);
}


/// Adjusts the machine scheduler policy for AArch64.
///
/// \param Policy          policy object updated in place.
/// \param NumRegionInstrs not used by this implementation.
void AArch64Subtarget::overrideSchedPolicy(MachineSchedPolicy &Policy,
                                           unsigned NumRegionInstrs) const {
  // Schedule bi-directionally: an LNT run (at least on Cyclone) showed
  // reasonably significant gains for it, e.g. on 253.perlbmk.
  Policy.OnlyBottomUp = false;
  Policy.OnlyTopDown = false;

  // Enabling or disabling the latency heuristic is a close call: it seems to
  // help nearly no benchmark on out-of-order architectures, while it regresses
  // register pressure on a few benchmarks.
  Policy.DisableLatencyHeuristic = DisableLatencySchedHeuristic;
}


/// Recomputes the latency of a register data dependency when either end of it
/// is a BUNDLE, using the bundled instruction that actually defines or reads
/// the register.
///
/// \param Def, DefOpIdx defining scheduling unit and operand index.
/// \param Use, UseOpIdx using scheduling unit and operand index.
/// \param Dep           dependency whose latency is updated in place.
/// \param SchedModel    scheduling model; nothing is done when it is null.
void AArch64Subtarget::adjustSchedDependency(
    SUnit *Def, int DefOpIdx, SUnit *Use, int UseOpIdx, SDep &Dep,
    const TargetSchedModel *SchedModel) const {
  // Only register data dependencies between real instructions are adjusted.
  if (!SchedModel || Dep.getKind() != SDep::Kind::Data || !Dep.getReg())
    return;
  if (!Def->isInstr() || !Use->isInstr())
    return;

  const MachineInstr *DefMI = Def->getInstr();
  const MachineInstr *UseMI = Use->getInstr();
  const bool DefIsBundle = DefMI->getOpcode() == TargetOpcode::BUNDLE;
  const bool UseIsBundle = UseMI->getOpcode() == TargetOpcode::BUNDLE;

  // Nothing to refine unless at least one side is a bundle.
  if (!DefIsBundle && !UseIsBundle)
    return;

  // For a bundled def, pick the last instruction in the bundle that defines
  // the register (the scan deliberately runs to the end of the bundle).
  if (DefIsBundle) {
    const Register DefReg = DefMI->getOperand(DefOpIdx).getReg();
    for (const auto &MO : const_mi_bundle_ops(*DefMI)) {
      if (!MO.isReg() || !MO.isDef() || MO.getReg() != DefReg)
        continue;
      DefMI = MO.getParent();
      DefOpIdx = MO.getOperandNo();
    }
  }

  // For a bundled use, pick the first instruction that reads the register.
  if (UseIsBundle) {
    const Register UseReg = UseMI->getOperand(UseOpIdx).getReg();
    for (const auto &MO : const_mi_bundle_ops(*UseMI)) {
      if (!MO.isReg() || !MO.isUse() || MO.getReg() != UseReg)
        continue;
      UseMI = MO.getParent();
      UseOpIdx = MO.getOperandNo();
      break;
    }
  }

  Dep.setLatency(
      SchedModel->computeOperandLatency(DefMI, DefOpIdx, UseMI, UseOpIdx));
}


/// Reports whether the early if-conversion pass should run, as controlled by
/// -aarch64-early-ifcvt.
bool AArch64Subtarget::enableEarlyIfConversion() const {
  return EnableEarlyIfConvert.getValue();
}


/// Reports whether code generation may assume that the top byte of an address
/// is ignored (TBI).
///
/// This requires -aarch64-use-tbi and a target triple that is either DriverKit
/// or iOS with a version of at least 8.
bool AArch64Subtarget::supportsAddressTopByteIgnored() const {
  // Without the opt-in flag TBI is never assumed.
  if (!UseAddressTopByteIgnored)
    return false;

  if (TargetTriple.isDriverKit())
    return true;

  return TargetTriple.isiOS() &&
         TargetTriple.getiOSVersion() >= VersionTuple(8);
}


std::unique_ptr<PBQPRAConstraint>

AArch64Subtarget::getCustomPBQPConstraints() const {

  return balanceFPOps() ? std::make_unique<A57ChainingConstraint>() : nullptr;

}


/// Hook invoked after a .mir file has been loaded into \p MF.
///
/// The max call frame size is usually computed after ISel. If the .mir file
/// did not specify it, it is computed here instead. Note that this will
/// probably give bogus values once PEI has eliminated the call frame
/// setup/destroy pseudo instructions; specify the value explicitly in the
/// .mir file if it needs to be correct.
void AArch64Subtarget::mirFileLoaded(MachineFunction &MF) const {
  MachineFrameInfo &FrameInfo = MF.getFrameInfo();
  if (FrameInfo.isMaxCallFrameSizeComputed())
    return;
  FrameInfo.computeMaxCallFrameSize(MF);
}


/// Reports whether alias analysis should be used during codegen, as
/// controlled by -aarch64-use-aa.
bool AArch64Subtarget::useAA() const {
  return UseAA.getValue();
}


/// Reports whether add+cnt should be preferred over addvl/inc/dec.
///
/// An explicit -sve-use-scalar-inc-vl setting always wins. Otherwise the
/// feature is enabled by default whenever SVE2 or SME is present (that is,
/// the target is not SVE-1 only).
bool AArch64Subtarget::useScalarIncVL() const {
  if (UseScalarIncVL.getNumOccurrences() == 0)
    return hasSVE2() || hasSME();
  return UseScalarIncVL;
}


// With return address signing enabled, a tail call is emitted as:
//
// ```
//   <authenticate LR>
//   <check LR>
//   TCRETURN          ; the callee may sign and spill the LR in its prologue
// ```
//
// The explicit `<check LR>` may be required because, when FEAT_FPAC is not
// implemented and LR was tampered with, `<authenticate LR>` does not raise an
// exception on its own. If the callee later spills the signed LR value and
// neither FEAT_PAuth2 nor FEAT_EPAC is implemented, the valid PAC replaces the
// higher bits of LR and thereby hides the authentication failure.
//
// Returns the kind of check to apply to the authenticated LR in MF.
AArch64PAuth::AuthCheckMethod AArch64Subtarget::getAuthenticatedLRCheckMethod(
    const MachineFunction &MF) const {
  const Function &Fn = MF.getFunction();

  // TODO: Check subtarget for the scheme. The present variant is a default for
  // the pauthtest ABI.
  if (Fn.hasFnAttribute("ptrauth-returns") &&
      Fn.hasFnAttribute("ptrauth-auth-traps"))
    return AArch64PAuth::AuthCheckMethod::HighBitsNoTBI;

  // For now, None is the default, because checks may introduce an unexpected
  // performance regression or incompatibility with execute-only mappings.
  if (AuthenticatedLRCheckMethod.getNumOccurrences() == 0)
    return AArch64PAuth::AuthCheckMethod::None;

  // An explicit command-line choice was made.
  return AuthenticatedLRCheckMethod;
}


/// Computes the integer discriminator used for blockaddress constants that
/// belong to \p ParentFn.
///
/// \returns std::nullopt when \p ParentFn lacks the "ptrauth-indirect-gotos"
///          attribute; otherwise the stable SipHash of the function name
///          followed by " blockaddress".
std::optional<uint16_t>
AArch64Subtarget::getPtrAuthBlockAddressDiscriminatorIfEnabled(
    const Function &ParentFn) const {
  if (!ParentFn.hasFnAttribute("ptrauth-indirect-gotos"))
    return std::nullopt;

  // There is currently one simple mechanism for all targets. This isn't ABI,
  // so it can always be improved in the future.
  const std::string HashInput =
      (Twine(ParentFn.getName()) + " blockaddress").str();
  return getPointerAuthStableSipHash(HashInput);
}


/// Reports whether the machine pipeliner should run: it is enabled exactly
/// when the scheduling model has an instruction scheduling model.
bool AArch64Subtarget::enableMachinePipeliner() const {
  const auto &Model = getSchedModel();
  return Model.hasInstrSchedModel();
}

AArch64AddressingModes.h

AArch64CallLowering.h
This file describes how to lower LLVM calls to machine code calls.

UseMI
MachineInstrBuilder & UseMI
Definition: AArch64ExpandPseudoInsts.cpp:112

DefMI
MachineInstrBuilder MachineInstrBuilder & DefMI
Definition: AArch64ExpandPseudoInsts.cpp:113

AArch64InstrInfo.h

AArch64LegalizerInfo.h
This file declares the targeting of the Machinelegalizer class for AArch64.

AArch64PBQPRegAlloc.h

AUTH_CHECK_METHOD_CL_VALUES_LR
#define AUTH_CHECK_METHOD_CL_VALUES_LR
Definition: AArch64PointerAuth.h:99

AArch64RegisterBankInfo.h
This file declares the targeting of the RegisterBankInfo class for AArch64.

UseAddressTopByteIgnored
static cl::opt< bool > UseAddressTopByteIgnored("aarch64-use-tbi", cl::desc("Assume that top byte of " "an address is ignored"), cl::init(false), cl::Hidden)

MachOUseNonLazyBind
static cl::opt< bool > MachOUseNonLazyBind("aarch64-macho-enable-nonlazybind", cl::desc("Call nonlazybind functions via direct GOT load for Mach-O"), cl::Hidden)

AArch64MinimumJumpTableEntries
static cl::opt< unsigned > AArch64MinimumJumpTableEntries("aarch64-min-jump-table-entries", cl::init(13), cl::Hidden, cl::desc("Set minimum number of entries to use a jump table on AArch64"))

AuthenticatedLRCheckMethod
static cl::opt< AArch64PAuth::AuthCheckMethod > AuthenticatedLRCheckMethod("aarch64-authenticated-lr-check-method", cl::Hidden, cl::desc("Override the variant of check applied " "to authenticated LR during tail call"), cl::values(AUTH_CHECK_METHOD_CL_VALUES_LR))

EnableSubregLivenessTracking
static cl::opt< bool > EnableSubregLivenessTracking("aarch64-enable-subreg-liveness-tracking", cl::init(false), cl::Hidden, cl::desc("Enable subreg liveness tracking"))

EnableEarlyIfConvert
static cl::opt< bool > EnableEarlyIfConvert("aarch64-early-ifcvt", cl::desc("Enable the early if " "converter pass"), cl::init(true), cl::Hidden)

AArch64StreamingHazardSize
static cl::opt< unsigned > AArch64StreamingHazardSize("aarch64-streaming-hazard-size", cl::desc("Hazard size for streaming mode memory accesses. 0 = disabled."), cl::init(0), cl::Hidden)

UseAA
static cl::opt< bool > UseAA("aarch64-use-aa", cl::init(true), cl::desc("Enable the use of AA during codegen."))

AArch64StreamingStackHazardSize
static cl::alias AArch64StreamingStackHazardSize("aarch64-stack-hazard-size", cl::desc("alias for -aarch64-streaming-hazard-size"), cl::aliasopt(AArch64StreamingHazardSize))

UseScalarIncVL
static cl::opt< bool > UseScalarIncVL("sve-use-scalar-inc-vl", cl::init(false), cl::Hidden, cl::desc("Prefer add+cnt over addvl/inc/dec"))

EnableZPRPredicateSpills
static cl::opt< bool > EnableZPRPredicateSpills("aarch64-enable-zpr-predicate-spills", cl::init(false), cl::Hidden, cl::desc("Enables spilling/reloading SVE predicates as data vectors (ZPRs)"))

ReservedRegsForRA
static cl::list< std::string > ReservedRegsForRA("reserve-regs-for-regalloc", cl::desc("Reserve physical " "registers, so they can't be used by register allocator. " "Should only be used for testing register allocator."), cl::CommaSeparated, cl::Hidden)

OverrideVectorInsertExtractBaseCost
static cl::opt< unsigned > OverrideVectorInsertExtractBaseCost("aarch64-insert-extract-base-cost", cl::desc("Base cost of vector insert/extract element"), cl::Hidden)

AArch64Subtarget.h

AArch64TargetMachine.h

AArch64TargetParser.h

AArch64.h

LLVM_FALLTHROUGH
#define LLVM_FALLTHROUGH
LLVM_FALLTHROUGH - Mark fallthrough cases in switch statements.
Definition: Compiler.h:388

GlobalValue.h

InstructionSelect.h

F
#define F(x, y, z)
Definition: MD5.cpp:55

MachineFrameInfo.h

MachineScheduler.h

TRI
unsigned const TargetRegisterInfo * TRI
Definition: MachineSink.cpp:2029

SipHash.h

AArch64GenSubtargetInfo

llvm::AArch64CallLowering
Definition: AArch64CallLowering.h:30

llvm::AArch64LegalizerInfo
Definition: AArch64LegalizerInfo.h:26

llvm::AArch64RegisterBankInfo
This class provides the information for the target register banks.
Definition: AArch64RegisterBankInfo.h:105

llvm::AArch64Subtarget
Definition: AArch64Subtarget.h:38

llvm::AArch64Subtarget::AArch64Subtarget
AArch64Subtarget(const Triple &TT, StringRef CPU, StringRef TuneCPU, StringRef FS, const TargetMachine &TM, bool LittleEndian, unsigned MinSVEVectorSizeInBitsOverride=0, unsigned MaxSVEVectorSizeInBitsOverride=0, bool IsStreaming=false, bool IsStreamingCompatible=false, bool HasMinSize=false)
This constructor initializes the data members to match that of the specified triple.
Definition: AArch64Subtarget.cpp:358

llvm::AArch64Subtarget::ReserveXRegisterForRA
BitVector ReserveXRegisterForRA
Definition: AArch64Subtarget.h:79

llvm::AArch64Subtarget::ReserveXRegister
BitVector ReserveXRegister
Definition: AArch64Subtarget.h:76

llvm::AArch64Subtarget::getCallLowering
const CallLowering * getCallLowering() const override
Definition: AArch64Subtarget.cpp:427

llvm::AArch64Subtarget::getRegisterInfo
const AArch64RegisterInfo * getRegisterInfo() const override
Definition: AArch64Subtarget.h:150

llvm::AArch64Subtarget::DefaultSVETFOpts
TailFoldingOpts DefaultSVETFOpts
Definition: AArch64Subtarget.h:92

llvm::AArch64Subtarget::InstSelector
std::unique_ptr< InstructionSelector > InstSelector
Definition: AArch64Subtarget.h:107

llvm::AArch64Subtarget::ARMProcFamily
ARMProcFamilyEnum ARMProcFamily
ARMProcFamily - ARM processor family: Cortex-A53, Cortex-A57, and others.
Definition: AArch64Subtarget.h:49

llvm::AArch64Subtarget::Generic
@ Generic
Definition: AArch64Subtarget.h:41

llvm::AArch64Subtarget::RegBankInfo
std::unique_ptr< RegisterBankInfo > RegBankInfo
Definition: AArch64Subtarget.h:109

llvm::AArch64Subtarget::VScaleForTuning
unsigned VScaleForTuning
Definition: AArch64Subtarget.h:91

llvm::AArch64Subtarget::useSmallAddressing
bool useSmallAddressing() const
Definition: AArch64Subtarget.h:309

llvm::AArch64Subtarget::EpilogueVectorizationMinVF
unsigned EpilogueVectorizationMinVF
Definition: AArch64Subtarget.h:59

llvm::AArch64Subtarget::overrideSchedPolicy
void overrideSchedPolicy(MachineSchedPolicy &Policy, unsigned NumRegionInstrs) const override
Definition: AArch64Subtarget.cpp:526

llvm::AArch64Subtarget::enableEarlyIfConversion
bool enableEarlyIfConversion() const override
Definition: AArch64Subtarget.cpp:577

llvm::AArch64Subtarget::getInlineAsmLowering
const InlineAsmLowering * getInlineAsmLowering() const override
Definition: AArch64Subtarget.cpp:431

llvm::AArch64Subtarget::MaxPrefetchIterationsAhead
unsigned MaxPrefetchIterationsAhead
Definition: AArch64Subtarget.h:68

llvm::AArch64Subtarget::getVectorInsertExtractBaseCost
unsigned getVectorInsertExtractBaseCost() const
Definition: AArch64Subtarget.cpp:105

llvm::AArch64Subtarget::enableMachinePipeliner
bool enableMachinePipeliner() const override
Definition: AArch64Subtarget.cpp:658

llvm::AArch64Subtarget::CallLoweringInfo
std::unique_ptr< CallLowering > CallLoweringInfo
GlobalISel related APIs.
Definition: AArch64Subtarget.h:105

llvm::AArch64Subtarget::getPtrAuthBlockAddressDiscriminatorIfEnabled
std::optional< uint16_t > getPtrAuthBlockAddressDiscriminatorIfEnabled(const Function &ParentFn) const
Compute the integer discriminator for a given BlockAddress constant, if blockaddress signing is enabled, or std::nullopt otherwise.
Definition: AArch64Subtarget.cpp:648

llvm::AArch64Subtarget::PrefLoopAlignment
Align PrefLoopAlignment
Definition: AArch64Subtarget.h:70

llvm::AArch64Subtarget::classifyGlobalFunctionReference
unsigned classifyGlobalFunctionReference(const GlobalValue *GV, const TargetMachine &TM) const
Definition: AArch64Subtarget.cpp:490

llvm::AArch64Subtarget::useAA
bool useAA() const override
Definition: AArch64Subtarget.cpp:609

llvm::AArch64Subtarget::VectorInsertExtractBaseCost
uint8_t VectorInsertExtractBaseCost
Definition: AArch64Subtarget.h:61

llvm::AArch64Subtarget::getTargetLowering
const AArch64TargetLowering * getTargetLowering() const override
Definition: AArch64Subtarget.h:146

llvm::AArch64Subtarget::isTargetMachO
bool isTargetMachO() const
Definition: AArch64Subtarget.h:294

llvm::AArch64Subtarget::PrefetchDistance
uint16_t PrefetchDistance
Definition: AArch64Subtarget.h:66

llvm::AArch64Subtarget::supportsAddressTopByteIgnored
bool supportsAddressTopByteIgnored() const
CPU has TBI (top byte of addresses is ignored during HW address translation) and OS enables it.
Definition: AArch64Subtarget.cpp:581

llvm::AArch64Subtarget::PrefFunctionAlignment
Align PrefFunctionAlignment
Definition: AArch64Subtarget.h:69

llvm::AArch64Subtarget::getTargetTriple
const Triple & getTargetTriple() const
Definition: AArch64Subtarget.h:158

llvm::AArch64Subtarget::MinVectorRegisterBitWidth
unsigned MinVectorRegisterBitWidth
Definition: AArch64Subtarget.h:52

llvm::AArch64Subtarget::isStreamingCompatible
bool isStreamingCompatible() const
Returns true if the function has a streaming-compatible body.
Definition: AArch64Subtarget.h:180

llvm::AArch64Subtarget::adjustSchedDependency
void adjustSchedDependency(SUnit *Def, int DefOpIdx, SUnit *Use, int UseOpIdx, SDep &Dep, const TargetSchedModel *SchedModel) const override
Definition: AArch64Subtarget.cpp:538

llvm::AArch64Subtarget::mirFileLoaded
void mirFileLoaded(MachineFunction &MF) const override
Definition: AArch64Subtarget.cpp:599

llvm::AArch64Subtarget::TargetTriple
Triple TargetTriple
TargetTriple - What processor and OS we're targeting.
Definition: AArch64Subtarget.h:97

llvm::AArch64Subtarget::getInstructionSelector
InstructionSelector * getInstructionSelector() const override
Definition: AArch64Subtarget.cpp:435

llvm::AArch64Subtarget::MinPrefetchStride
uint16_t MinPrefetchStride
Definition: AArch64Subtarget.h:67

llvm::AArch64Subtarget::CacheLineSize
uint16_t CacheLineSize
Definition: AArch64Subtarget.h:62

llvm::AArch64Subtarget::ClassifyGlobalReference
unsigned ClassifyGlobalReference(const GlobalValue *GV, const TargetMachine &TM) const
ClassifyGlobalReference - Find the target operand flags that describe how a global value should be referenced for the current subtarget.
Definition: AArch64Subtarget.cpp:450

llvm::AArch64Subtarget::ParseSubtargetFeatures
void ParseSubtargetFeatures(StringRef CPU, StringRef TuneCPU, StringRef FS)
ParseSubtargetFeatures - Parses features string setting specified subtarget options.

llvm::AArch64Subtarget::MaxJumpTableSize
unsigned MaxJumpTableSize
Definition: AArch64Subtarget.h:73

llvm::AArch64Subtarget::isWindowsArm64EC
bool isWindowsArm64EC() const
Definition: AArch64Subtarget.h:290

llvm::AArch64Subtarget::isStreaming
bool isStreaming() const
Returns true if the function has a streaming body.
Definition: AArch64Subtarget.h:177

llvm::AArch64Subtarget::getHwModeSet
virtual unsigned getHwModeSet() const override
Definition: AArch64Subtarget.cpp:413

llvm::AArch64Subtarget::useScalarIncVL
bool useScalarIncVL() const
Returns true to use the addvl/inc/dec instructions, as opposed to separate add + cnt instructions.
Definition: AArch64Subtarget.cpp:611

llvm::AArch64Subtarget::MinimumJumpTableEntries
unsigned MinimumJumpTableEntries
Definition: AArch64Subtarget.h:72

llvm::AArch64Subtarget::getLegalizerInfo
const LegalizerInfo * getLegalizerInfo() const override
Definition: AArch64Subtarget.cpp:439

llvm::AArch64Subtarget::EnableSubregLiveness
bool EnableSubregLiveness
Definition: AArch64Subtarget.h:94

llvm::AArch64Subtarget::getCustomPBQPConstraints
std::unique_ptr< PBQPRAConstraint > getCustomPBQPConstraints() const override
Definition: AArch64Subtarget.cpp:595

llvm::AArch64Subtarget::MaxInterleaveFactor
uint8_t MaxInterleaveFactor
Definition: AArch64Subtarget.h:60

llvm::AArch64Subtarget::ScatterOverhead
unsigned ScatterOverhead
Definition: AArch64Subtarget.h:64

llvm::AArch64Subtarget::getAuthenticatedLRCheckMethod
AArch64PAuth::AuthCheckMethod getAuthenticatedLRCheckMethod(const MachineFunction &MF) const
Choose a method of checking LR before performing a tail call.
Definition: AArch64Subtarget.cpp:632

llvm::AArch64Subtarget::getRegBankInfo
const RegisterBankInfo * getRegBankInfo() const override
Definition: AArch64Subtarget.cpp:443

llvm::AArch64Subtarget::MaxBytesForLoopAlignment
unsigned MaxBytesForLoopAlignment
Definition: AArch64Subtarget.h:71

llvm::AArch64Subtarget::InlineAsmLoweringInfo
std::unique_ptr< InlineAsmLowering > InlineAsmLoweringInfo
Definition: AArch64Subtarget.h:106

llvm::AArch64TargetMachine
Definition: AArch64TargetMachine.h:24

llvm::BitVector::set
BitVector & set()
Definition: BitVector.h:351

llvm::CallLowering
Definition: CallLowering.h:44

llvm::DWARFExpression::Operation
This class represents an Operation in the Expression.
Definition: DWARFExpression.h:32

llvm::Function
Definition: Function.h:63

llvm::Function::hasFnAttribute
bool hasFnAttribute(Attribute::AttrKind Kind) const
Return true if the function has the attribute.
Definition: Function.cpp:731

llvm::GlobalValue
Definition: GlobalValue.h:48

llvm::GlobalValue::hasExternalLinkage
bool hasExternalLinkage() const
Definition: GlobalValue.h:512

llvm::GlobalValue::isTagged
bool isTagged() const
Definition: GlobalValue.h:366

llvm::GlobalValue::hasExternalWeakLinkage
bool hasExternalWeakLinkage() const
Definition: GlobalValue.h:530

llvm::GlobalValue::hasDLLImportStorageClass
bool hasDLLImportStorageClass() const
Definition: GlobalValue.h:279

llvm::GlobalValue::hasInternalLinkage
bool hasInternalLinkage() const
Definition: GlobalValue.h:527

llvm::GlobalValue::getValueType
Type * getValueType() const
Definition: GlobalValue.h:297

llvm::InlineAsmLowering
Definition: InlineAsmLowering.h:28

llvm::InstructionSelector
Definition: InstructionSelector.h:21

llvm::LegalizerInfo
Definition: LegalizerInfo.h:1308

llvm::Legalizer
Definition: Legalizer.h:37

llvm::MachineFrameInfo
The MachineFrameInfo class represents an abstract stack frame until prolog/epilog code is inserted.
Definition: MachineFrameInfo.h:106

llvm::MachineFrameInfo::computeMaxCallFrameSize
void computeMaxCallFrameSize(MachineFunction &MF, std::vector< MachineBasicBlock::iterator > *FrameSDOps=nullptr)
Computes the maximum size of a callframe.
Definition: MachineFrameInfo.cpp:187

llvm::MachineFrameInfo::isMaxCallFrameSizeComputed
bool isMaxCallFrameSizeComputed() const
Definition: MachineFrameInfo.h:673

llvm::MachineFunction
Definition: MachineFunction.h:267

llvm::MachineFunction::getFrameInfo
MachineFrameInfo & getFrameInfo()
getFrameInfo - Return the frame info object for the current function.
Definition: MachineFunction.h:749

llvm::MachineFunction::getFunction
Function & getFunction()
Return the LLVM function that this machine code represents.
Definition: MachineFunction.h:704

llvm::MachineInstr
Representation of each machine instruction.
Definition: MachineInstr.h:71

llvm::MachineInstr::getOpcode
unsigned getOpcode() const
Returns the opcode of this MachineInstr.
Definition: MachineInstr.h:577

llvm::MachineInstr::getOperand
const MachineOperand & getOperand(unsigned i) const
Definition: MachineInstr.h:587

llvm::MachineOperand::getReg
Register getReg() const
getReg - Returns the register number.
Definition: MachineOperand.h:365

llvm::RegisterBankInfo
Holds all the information related to register banks.
Definition: RegisterBankInfo.h:40

llvm::Register
Wrapper class representing virtual and physical registers.
Definition: Register.h:19

llvm::SDep
Scheduling dependency.
Definition: ScheduleDAG.h:49

llvm::SDep::getKind
Kind getKind() const
Returns an enum value representing the kind of the dependence.
Definition: ScheduleDAG.h:504

llvm::SDep::Data
@ Data
Regular data dependence (aka true-dependence).
Definition: ScheduleDAG.h:53

llvm::SDep::setLatency
void setLatency(unsigned Lat)
Sets the latency for this edge.
Definition: ScheduleDAG.h:147

llvm::SDep::getReg
unsigned getReg() const
Returns the register associated with this edge.
Definition: ScheduleDAG.h:218

llvm::SUnit
Scheduling unit. This is a node in the scheduling DAG.
Definition: ScheduleDAG.h:242

llvm::StringMap::count
size_type count(StringRef Key) const
count - Return 1 if the element is in the map, 0 otherwise.
Definition: StringMap.h:276

llvm::StringRef
StringRef - Represent a constant reference to a string, i.e. a character array and a length, which need not be null terminated.
Definition: StringRef.h:51

llvm::StringRef::empty
constexpr bool empty() const
empty - Check if the string is empty.
Definition: StringRef.h:147

llvm::StringSet
StringSet - A wrapper for StringMap that provides set-like functionality.
Definition: StringSet.h:23

llvm::StringSet::insert
std::pair< typename Base::iterator, bool > insert(StringRef key)
Definition: StringSet.h:38

llvm::TargetMachine
Primary interface to the complete machine description for the target machine.
Definition: TargetMachine.h:81

llvm::TargetSchedModel
Provide an instruction scheduling machine model to CodeGen passes.
Definition: TargetSchedule.h:30

llvm::TargetSchedModel::computeOperandLatency
unsigned computeOperandLatency(const MachineInstr *DefMI, unsigned DefOperIdx, const MachineInstr *UseMI, unsigned UseOperIdx) const
Compute operand latency based on the available machine model.
Definition: TargetSchedule.cpp:172

llvm::Triple
Triple - Helper class for working with autoconf configuration names.
Definition: Triple.h:44

llvm::Triple::isDriverKit
bool isDriverKit() const
Is this an Apple DriverKit triple.
Definition: Triple.h:578

llvm::Triple::isiOS
bool isiOS() const
Is this an iOS triple.
Definition: Triple.h:556

llvm::Triple::getiOSVersion
VersionTuple getiOSVersion() const
Parse the version number as with getOSVersion.
Definition: Triple.cpp:1472

llvm::Twine
Twine - A lightweight data structure for efficiently representing the concatenation of temporary values as strings.
Definition: Twine.h:81

llvm::Type::isFunctionTy
bool isFunctionTy() const
True if this is an instance of FunctionType.
Definition: Type.h:255

llvm::Use
A Use represents the edge between a Value definition and its users.
Definition: Use.h:35

llvm::Value::getName
StringRef getName() const
Return a constant reference to the value's name.
Definition: Value.cpp:309

llvm::VersionTuple
Represents a version number in the form major[.minor[.subminor[.build]]].
Definition: VersionTuple.h:29

llvm::cl::Option::getNumOccurrences
int getNumOccurrences() const
Definition: CommandLine.h:399

llvm::cl::alias
Definition: CommandLine.h:1913

llvm::cl::list
Definition: CommandLine.h:1655

llvm::cl::opt_storage::getValue
DataType & getValue()
Definition: CommandLine.h:1352

llvm::cl::opt
Definition: CommandLine.h:1423

unsigned

llvm::AArch64II::MO_DLLIMPORT
@ MO_DLLIMPORT
MO_DLLIMPORT - On a symbol operand, this represents that the reference to the symbol is for an import stub.
Definition: AArch64BaseInfo.h:843

llvm::AArch64II::MO_NC
@ MO_NC
MO_NC - Indicates whether the linker is expected to check the symbol reference for overflow.
Definition: AArch64BaseInfo.h:832

llvm::AArch64II::MO_GOT
@ MO_GOT
MO_GOT - This flag indicates that a symbol operand represents the address of the GOT entry for the symbol, rather than the address of the symbol itself.
Definition: AArch64BaseInfo.h:827

llvm::AArch64II::MO_NO_FLAG
@ MO_NO_FLAG
Definition: AArch64BaseInfo.h:784

llvm::AArch64II::MO_ARM64EC_CALLMANGLE
@ MO_ARM64EC_CALLMANGLE
MO_ARM64EC_CALLMANGLE - Operand refers to the Arm64EC-mangled version of a symbol, not the original.
Definition: AArch64BaseInfo.h:865

llvm::AArch64II::MO_TAGGED
@ MO_TAGGED
MO_TAGGED - With MO_PAGE, indicates that the page includes a memory tag in bits 56-63.
Definition: AArch64BaseInfo.h:859

llvm::AArch64II::MO_COFFSTUB
@ MO_COFFSTUB
MO_COFFSTUB - On a symbol operand "FOO", this indicates that the reference is actually to the ".refptr.FOO" symbol.
Definition: AArch64BaseInfo.h:822

llvm::AArch64PAuth::AuthCheckMethod
AuthCheckMethod
Variants of check performed on an authenticated pointer.
Definition: AArch64PointerAuth.h:44

llvm::AArch64PAuth::AuthCheckMethod::HighBitsNoTBI
@ HighBitsNoTBI
Check by comparing bits 62 and 61 of the authenticated address.

llvm::AArch64PAuth::AuthCheckMethod::None
@ None
Do not check the value at all.

llvm::AArch64::isX18ReservedByDefault
bool isX18ReservedByDefault(const Triple &TT)
Definition: AArch64TargetParser.cpp:139

llvm::CodeModel::Large
@ Large
Definition: CodeGen.h:31

llvm::CodeModel::Tiny
@ Tiny
Definition: CodeGen.h:31

llvm::cl::Hidden
@ Hidden
Definition: CommandLine.h:137

llvm::cl::values
ValuesClass values(OptsTy... Options)
Helper to build a ValuesClass by forwarding a variable number of arguments as an initializer list to the ValuesClass constructor.
Definition: CommandLine.h:711

llvm::cl::init
initializer< Ty > init(const Ty &Val)
Definition: CommandLine.h:443

llvm::cl::CommaSeparated
@ CommaSeparated
Definition: CommandLine.h:163

llvm
This is an optimization pass for GlobalISel generic memory operations.
Definition: AddressRanges.h:18

llvm::TailFoldingOpts::Simple
@ Simple

llvm::createAArch64InstructionSelector
InstructionSelector * createAArch64InstructionSelector(const AArch64TargetMachine &, const AArch64Subtarget &, const AArch64RegisterBankInfo &)
Definition: AArch64InstructionSelector.cpp:8091

llvm::to_underlying
constexpr std::underlying_type_t< Enum > to_underlying(Enum E)
Returns underlying integer value of an enum.
Definition: STLForwardCompat.h:66

llvm::const_mi_bundle_ops
iterator_range< ConstMIBundleOperands > const_mi_bundle_ops(const MachineInstr &MI)
Definition: MachineInstrBundle.h:205

llvm::getPointerAuthStableSipHash
uint16_t getPointerAuthStableSipHash(StringRef S)
Compute a stable non-zero 16-bit hash of the given string.
Definition: SipHash.cpp:168

std
Implement std::hash so that hash_code can be used in STL containers.
Definition: BitVector.h:858

llvm::Align
This struct is a compact representation of a valid (non-zero power of two) alignment.
Definition: Alignment.h:39

llvm::MachineSchedPolicy
Define a generic scheduling policy for targets that don't provide their own MachineSchedStrategy.
Definition: MachineScheduler.h:198

llvm::MachineSchedPolicy::OnlyTopDown
bool OnlyTopDown
Definition: MachineScheduler.h:207

llvm::MachineSchedPolicy::DisableLatencyHeuristic
bool DisableLatencyHeuristic
Definition: MachineScheduler.h:212

llvm::MachineSchedPolicy::OnlyBottomUp
bool OnlyBottomUp
Definition: MachineScheduler.h:208

llvm::cl::aliasopt
Definition: CommandLine.h:1972

llvm::cl::desc
Definition: CommandLine.h:409