// LLVM: lib/Target/AMDGPU/SIMachineFunctionInfo.h Source File

//==- SIMachineFunctionInfo.h - SIMachineFunctionInfo interface --*- C++ -*-==//

//

// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.

// See https://llvm.org/LICENSE.txt for license information.

// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception

//

//===----------------------------------------------------------------------===//

//

/// \file

//

//===----------------------------------------------------------------------===//


#ifndef LLVM_LIB_TARGET_AMDGPU_SIMACHINEFUNCTIONINFO_H

#define LLVM_LIB_TARGET_AMDGPU_SIMACHINEFUNCTIONINFO_H


#include "AMDGPUArgumentUsageInfo.h"

#include "AMDGPUMachineFunction.h"

#include "AMDGPUTargetMachine.h"

#include "GCNSubtarget.h"

#include "MCTargetDesc/AMDGPUMCTargetDesc.h"

#include "SIInstrInfo.h"

#include "SIModeRegisterDefaults.h"

#include "llvm/ADT/SetVector.h"

#include "llvm/ADT/SmallVector.h"

#include "llvm/CodeGen/MIRYamlMapping.h"

#include "llvm/CodeGen/PseudoSourceValue.h"

#include "llvm/Support/raw_ostream.h"

#include <optional>


namespace llvm {


class MachineFrameInfo;

class MachineFunction;

class SIMachineFunctionInfo;

class SIRegisterInfo;

class TargetRegisterClass;


/// Base class for the AMDGPU-specific pseudo source values. Its kind values
/// are numbered starting at PseudoSourceValue::TargetCustom.
class AMDGPUPseudoSourceValue : public PseudoSourceValue {
public:
  enum AMDGPUPSVKind : unsigned {
    PSVImage = PseudoSourceValue::TargetCustom,
    GWSResource
  };

  /// Conservatively answers "not constant"; this should probably be true for
  /// most images.
  bool isConstant(const MachineFrameInfo *) const override { return false; }

  /// Always answers true.
  bool isAliased(const MachineFrameInfo *) const override { return true; }

  /// Always answers true.
  bool mayAlias(const MachineFrameInfo *) const override { return true; }

protected:
  /// Only derived classes may construct this type; \p Kind and \p TM are
  /// forwarded unchanged to the PseudoSourceValue constructor.
  AMDGPUPseudoSourceValue(unsigned Kind, const AMDGPUTargetMachine &TM)
      : PseudoSourceValue(Kind, TM) {}
};


/// Pseudo source value whose kind is GWSResource. It is inaccessible memory
/// from IR, so both alias queries answer false.
class AMDGPUGWSResourcePseudoSourceValue final : public AMDGPUPseudoSourceValue {
public:
  explicit AMDGPUGWSResourcePseudoSourceValue(const AMDGPUTargetMachine &TM)
      : AMDGPUPseudoSourceValue(GWSResource, TM) {}

  /// Type test: true when \p V has kind GWSResource.
  static bool classof(const PseudoSourceValue *V) {
    return V->kind() == GWSResource;
  }

  /// Inaccessible memory from IR, hence never aliased.
  bool isAliased(const MachineFrameInfo *) const override { return false; }

  /// Inaccessible memory from IR, hence cannot alias.
  bool mayAlias(const MachineFrameInfo *) const override { return false; }

  /// Prints the fixed tag "GWSResource" to \p OS.
  void printCustom(raw_ostream &OS) const override { OS << "GWSResource"; }
};


namespace yaml {


/// YAML-side description of one argument: either a register name or a stack
/// offset, plus an optional mask. IsRegister records which member of the
/// anonymous union is currently live, so the special member functions below
/// construct and destroy RegisterName by hand.
struct SIArgument {
  // Union discriminator: true selects RegisterName, false selects StackOffset.
  bool IsRegister;
  union {
    StringValue RegisterName;
    unsigned StackOffset;
  };
  std::optional<unsigned> Mask;

  // Default constructor, which creates a stack argument.
  SIArgument() : IsRegister(false), StackOffset(0) {}
  // Copy constructor. No union member is alive yet, so RegisterName has to be
  // created with placement new when Other holds a register.
  SIArgument(const SIArgument &Other) {
    IsRegister = Other.IsRegister;
    if (IsRegister)
      new (&RegisterName) StringValue(Other.RegisterName);
    else
      StackOffset = Other.StackOffset;
    Mask = Other.Mask;
  }
  // Copy assignment. The live union member is switched first (if the two
  // objects differ in kind) so that the assignment further down always
  // targets a constructed member.
  SIArgument &operator=(const SIArgument &Other) {
    // Default-construct or destruct the old RegisterName in case of switching
    // union members
    if (IsRegister != Other.IsRegister) {
      if (Other.IsRegister)
        new (&RegisterName) StringValue();
      else
        RegisterName.~StringValue();
    }
    IsRegister = Other.IsRegister;
    if (IsRegister)
      RegisterName = Other.RegisterName;
    else
      StackOffset = Other.StackOffset;
    Mask = Other.Mask;
    return *this;
  }
  // RegisterName is only destroyed when it is the live union member.
  ~SIArgument() {
    if (IsRegister)
      RegisterName.~StringValue();
  }

  // Helper to create a register or stack argument.
  static inline SIArgument createArgument(bool IsReg) {
    if (IsReg)
      return SIArgument(IsReg);
    return SIArgument();
  }

private:
  // Construct a register argument. The bool parameter's value is ignored; it
  // only distinguishes this overload from the default constructor.
  SIArgument(bool) : IsRegister(true), RegisterName() {}
};


/// YAML mapping for SIArgument, emitted in flow style. Exactly one of the
/// keys "reg" / "offset" is mapped, followed by the optional "mask".
template <> struct MappingTraits<SIArgument> {
  static const bool flow = true;

  static void mapping(IO &YamlIO, SIArgument &A) {
    if (!YamlIO.outputting()) {
      // Reading: the keys present in the input decide the argument kind.
      const auto Keys = YamlIO.keys();
      if (is_contained(Keys, "reg")) {
        A = SIArgument::createArgument(true);
        YamlIO.mapRequired("reg", A.RegisterName);
      } else if (is_contained(Keys, "offset")) {
        YamlIO.mapRequired("offset", A.StackOffset);
      } else {
        YamlIO.setError("missing required key 'reg' or 'offset'");
      }
    } else if (A.IsRegister) {
      // Writing a register argument.
      YamlIO.mapRequired("reg", A.RegisterName);
    } else {
      // Writing a stack argument.
      YamlIO.mapRequired("offset", A.StackOffset);
    }

    // The mask is mapped on every path, including after an error was set.
    YamlIO.mapOptional("mask", A.Mask);
  }
};


/// YAML-side collection of optional SIArgument entries, one per named input.
/// Each field is serialized by MappingTraits<SIArgumentInfo> under a key
/// derived from the field name; an empty optional means the entry is absent.
struct SIArgumentInfo {
  std::optional<SIArgument> PrivateSegmentBuffer;
  std::optional<SIArgument> DispatchPtr;
  std::optional<SIArgument> QueuePtr;
  std::optional<SIArgument> KernargSegmentPtr;
  std::optional<SIArgument> DispatchID;
  std::optional<SIArgument> FlatScratchInit;
  std::optional<SIArgument> PrivateSegmentSize;

  // Work-group related entries.
  std::optional<SIArgument> WorkGroupIDX;
  std::optional<SIArgument> WorkGroupIDY;
  std::optional<SIArgument> WorkGroupIDZ;
  std::optional<SIArgument> WorkGroupInfo;
  std::optional<SIArgument> LDSKernelId;
  std::optional<SIArgument> PrivateSegmentWaveByteOffset;

  // Implicit pointer entries.
  std::optional<SIArgument> ImplicitArgPtr;
  std::optional<SIArgument> ImplicitBufferPtr;

  // Work-item related entries.
  std::optional<SIArgument> WorkItemIDX;
  std::optional<SIArgument> WorkItemIDY;
  std::optional<SIArgument> WorkItemIDZ;
};


template <> struct MappingTraits<SIArgumentInfo> {

  static void mapping(IO &YamlIO, SIArgumentInfo &AI) {

    YamlIO.mapOptional("privateSegmentBuffer", AI.PrivateSegmentBuffer);

    YamlIO.mapOptional("dispatchPtr", AI.DispatchPtr);

    YamlIO.mapOptional("queuePtr", AI.QueuePtr);

    YamlIO.mapOptional("kernargSegmentPtr", AI.KernargSegmentPtr);

    YamlIO.mapOptional("dispatchID", AI.DispatchID);

    YamlIO.mapOptional("flatScratchInit", AI.FlatScratchInit);

    YamlIO.mapOptional("privateSegmentSize", AI.PrivateSegmentSize);


    YamlIO.mapOptional("workGroupIDX", AI.WorkGroupIDX);

    YamlIO.mapOptional("workGroupIDY", AI.WorkGroupIDY);

    YamlIO.mapOptional("workGroupIDZ", AI.WorkGroupIDZ);

    YamlIO.mapOptional("workGroupInfo", AI.WorkGroupInfo);

    YamlIO.mapOptional("LDSKernelId", AI.LDSKernelId);

    YamlIO.mapOptional("privateSegmentWaveByteOffset",

                       AI.PrivateSegmentWaveByteOffset);


    YamlIO.mapOptional("implicitArgPtr", AI.ImplicitArgPtr);

    YamlIO.mapOptional("implicitBufferPtr", AI.ImplicitBufferPtr);


    YamlIO.mapOptional("workItemIDX", AI.WorkItemIDX);

    YamlIO.mapOptional("workItemIDY", AI.WorkItemIDY);

    YamlIO.mapOptional("workItemIDZ", AI.WorkItemIDZ);

  }

};


/// YAML-side view of the mode settings as six booleans. Every flag defaults
/// to true.
struct SIMode {
  bool IEEE = true;
  bool DX10Clamp = true;
  bool FP32InputDenormals = true;
  bool FP32OutputDenormals = true;
  bool FP64FP16InputDenormals = true;
  bool FP64FP16OutputDenormals = true;

  SIMode() = default;

  /// Builds the boolean view from \p Mode. A denormal flag is true whenever
  /// the corresponding setting is anything other than PreserveSign.
  SIMode(const SIModeRegisterDefaults &Mode)
      : IEEE(Mode.IEEE), DX10Clamp(Mode.DX10Clamp),
        FP32InputDenormals(Mode.FP32Denormals.Input !=
                           DenormalMode::PreserveSign),
        FP32OutputDenormals(Mode.FP32Denormals.Output !=
                            DenormalMode::PreserveSign),
        FP64FP16InputDenormals(Mode.FP64FP16Denormals.Input !=
                               DenormalMode::PreserveSign),
        FP64FP16OutputDenormals(Mode.FP64FP16Denormals.Output !=
                                DenormalMode::PreserveSign) {}

  /// Field-wise equality over all six flags.
  bool operator ==(const SIMode Other) const {
    if (IEEE != Other.IEEE)
      return false;
    if (DX10Clamp != Other.DX10Clamp)
      return false;
    if (FP32InputDenormals != Other.FP32InputDenormals)
      return false;
    if (FP32OutputDenormals != Other.FP32OutputDenormals)
      return false;
    if (FP64FP16InputDenormals != Other.FP64FP16InputDenormals)
      return false;
    return FP64FP16OutputDenormals == Other.FP64FP16OutputDenormals;
  }
};


template <> struct MappingTraits<SIMode> {

  static void mapping(IO &YamlIO, SIMode &Mode) {

    YamlIO.mapOptional("ieee", Mode.IEEE, true);

    YamlIO.mapOptional("dx10-clamp", Mode.DX10Clamp, true);

    YamlIO.mapOptional("fp32-input-denormals", Mode.FP32InputDenormals, true);

    YamlIO.mapOptional("fp32-output-denormals", Mode.FP32OutputDenormals, true);

    YamlIO.mapOptional("fp64-fp16-input-denormals", Mode.FP64FP16InputDenormals, true);

    YamlIO.mapOptional("fp64-fp16-output-denormals", Mode.FP64FP16OutputDenormals, true);

  }

};


/// YAML-serializable counterpart of llvm::SIMachineFunctionInfo. It can be
/// constructed from an llvm::SIMachineFunctionInfo (see the second
/// constructor) and is mapped to YAML through mappingImpl(). The in-class
/// initializers below are the values a default-constructed object holds.
struct SIMachineFunctionInfo final : public yaml::MachineFunctionInfo {
  uint64_t ExplicitKernArgSize = 0;
  Align MaxKernArgAlign;
  uint32_t LDSSize = 0;
  uint32_t GDSSize = 0;
  Align DynLDSAlign;
  bool IsEntryFunction = false;
  bool IsChainFunction = false;
  bool NoSignedZerosFPMath = false;
  bool MemoryBound = false;
  bool WaveLimiter = false;
  bool HasSpilledSGPRs = false;
  bool HasSpilledVGPRs = false;
  uint16_t NumWaveDispatchSGPRs = 0;
  uint16_t NumWaveDispatchVGPRs = 0;
  uint32_t HighBitsOf32BitAddress = 0;

  // TODO: 10 may be a better default since it's the maximum.
  unsigned Occupancy = 0;

  // Register lists, stored by name.
  SmallVector<StringValue, 2> SpillPhysVGPRS;
  SmallVector<StringValue> WWMReservedRegs;

  // Register names; the defaults are placeholder register names.
  StringValue ScratchRSrcReg = "$private_rsrc_reg";
  StringValue FrameOffsetReg = "$fp_reg";
  StringValue StackPtrOffsetReg = "$sp_reg";

  unsigned BytesInStackArgArea = 0;
  bool ReturnsVoid = true;

  // Absent unless argument information was provided.
  std::optional<SIArgumentInfo> ArgInfo;

  unsigned PSInputAddr = 0;
  unsigned PSInputEnable = 0;
  unsigned MaxMemoryClusterDWords = DefaultMemoryClusterDWordsLimit;

  SIMode Mode;
  std::optional<FrameIndex> ScavengeFI;
  // Register names that default to an empty StringValue.
  StringValue VGPRForAGPRCopy;
  StringValue SGPRForEXECCopy;
  StringValue LongBranchReservedReg;

  bool HasInitWholeWave = false;
  bool IsWholeWaveFunction = false;

  unsigned DynamicVGPRBlockSize = 0;
  unsigned ScratchReservedForDynamicVGPRs = 0;

  SIMachineFunctionInfo() = default;
  // Builds the YAML form from an existing llvm::SIMachineFunctionInfo.
  // Declared here only; the definition is outside this header.
  SIMachineFunctionInfo(const llvm::SIMachineFunctionInfo &,
                        const TargetRegisterInfo &TRI,
                        const llvm::MachineFunction &MF);

  // Maps this object through \p YamlIO; defined outside this header.
  void mappingImpl(yaml::IO &YamlIO) override;
  ~SIMachineFunctionInfo() = default;
};


/// YAML mapping for yaml::SIMachineFunctionInfo. Every key is optional. When
/// a default is supplied, it is the value assumed for a missing key on input,
/// and a field equal to it is not printed on output.
///
/// Defaults for integer fields are written as unsigned integer literals so
/// that each default has the same kind of type as the field it describes;
/// the values are the same as before (false and 0 both convert to zero).
template <> struct MappingTraits<SIMachineFunctionInfo> {
  static void mapping(IO &YamlIO, SIMachineFunctionInfo &MFI) {
    YamlIO.mapOptional("explicitKernArgSize", MFI.ExplicitKernArgSize,
                       UINT64_C(0));
    // No default is given for this key, unlike "dynLDSAlign" below.
    YamlIO.mapOptional("maxKernArgAlign", MFI.MaxKernArgAlign);
    YamlIO.mapOptional("ldsSize", MFI.LDSSize, 0u);
    YamlIO.mapOptional("gdsSize", MFI.GDSSize, 0u);
    YamlIO.mapOptional("dynLDSAlign", MFI.DynLDSAlign, Align());
    YamlIO.mapOptional("isEntryFunction", MFI.IsEntryFunction, false);
    YamlIO.mapOptional("isChainFunction", MFI.IsChainFunction, false);
    YamlIO.mapOptional("noSignedZerosFPMath", MFI.NoSignedZerosFPMath, false);
    YamlIO.mapOptional("memoryBound", MFI.MemoryBound, false);
    YamlIO.mapOptional("waveLimiter", MFI.WaveLimiter, false);
    YamlIO.mapOptional("hasSpilledSGPRs", MFI.HasSpilledSGPRs, false);
    YamlIO.mapOptional("hasSpilledVGPRs", MFI.HasSpilledVGPRs, false);
    // These two fields are uint16_t counters, not flags.
    YamlIO.mapOptional("numWaveDispatchSGPRs", MFI.NumWaveDispatchSGPRs, 0u);
    YamlIO.mapOptional("numWaveDispatchVGPRs", MFI.NumWaveDispatchVGPRs, 0u);
    YamlIO.mapOptional("scratchRSrcReg", MFI.ScratchRSrcReg,
                       StringValue("$private_rsrc_reg"));
    YamlIO.mapOptional("frameOffsetReg", MFI.FrameOffsetReg,
                       StringValue("$fp_reg"));
    YamlIO.mapOptional("stackPtrOffsetReg", MFI.StackPtrOffsetReg,
                       StringValue("$sp_reg"));
    YamlIO.mapOptional("bytesInStackArgArea", MFI.BytesInStackArgArea, 0u);
    YamlIO.mapOptional("returnsVoid", MFI.ReturnsVoid, true);
    YamlIO.mapOptional("argumentInfo", MFI.ArgInfo);
    YamlIO.mapOptional("psInputAddr", MFI.PSInputAddr, 0u);
    YamlIO.mapOptional("psInputEnable", MFI.PSInputEnable, 0u);
    YamlIO.mapOptional("maxMemoryClusterDWords", MFI.MaxMemoryClusterDWords,
                       DefaultMemoryClusterDWordsLimit);
    YamlIO.mapOptional("mode", MFI.Mode, SIMode());
    YamlIO.mapOptional("highBitsOf32BitAddress",
                       MFI.HighBitsOf32BitAddress, 0u);
    YamlIO.mapOptional("occupancy", MFI.Occupancy, 0u);
    YamlIO.mapOptional("spillPhysVGPRs", MFI.SpillPhysVGPRS);
    YamlIO.mapOptional("wwmReservedRegs", MFI.WWMReservedRegs);
    YamlIO.mapOptional("scavengeFI", MFI.ScavengeFI);
    YamlIO.mapOptional("vgprForAGPRCopy", MFI.VGPRForAGPRCopy,
                       StringValue()); // Don't print out when it's empty.
    YamlIO.mapOptional("sgprForEXECCopy", MFI.SGPRForEXECCopy,
                       StringValue()); // Don't print out when it's empty.
    YamlIO.mapOptional("longBranchReservedReg", MFI.LongBranchReservedReg,
                       StringValue());
    YamlIO.mapOptional("hasInitWholeWave", MFI.HasInitWholeWave, false);
    // DynamicVGPRBlockSize is an unsigned size, not a flag.
    YamlIO.mapOptional("dynamicVGPRBlockSize", MFI.DynamicVGPRBlockSize, 0u);
    YamlIO.mapOptional("scratchReservedForDynamicVGPRs",
                       MFI.ScratchReservedForDynamicVGPRs, 0u);
    YamlIO.mapOptional("isWholeWaveFunction", MFI.IsWholeWaveFunction, false);
  }
};


} // end namespace yaml


// A CSR SGPR value can be preserved inside a callee using one of the following
// methods.
//   1. Copy to an unused scratch SGPR.
//   2. Spill to a VGPR lane.
//   3. Spill to memory via a scratch VGPR.
// class PrologEpilogSGPRSaveRestoreInfo represents the save/restore method used
// for an SGPR at function prolog/epilog.
enum class SGPRSaveKind : uint8_t {
  COPY_TO_SCRATCH_SGPR, // Method 1 above.
  SPILL_TO_VGPR_LANE,   // Method 2 above.
  SPILL_TO_MEM          // Method 3 above.
};


/// Records how one SGPR is saved and restored: the save kind together with
/// either an integer index or a register, which share storage. The accessors
/// do not check which of the two was stored.
class PrologEpilogSGPRSaveRestoreInfo {
  SGPRSaveKind Kind;
  union {
    int Index;
    Register Reg;
  };

public:
  /// Creates an entry that stores the register \p R.
  PrologEpilogSGPRSaveRestoreInfo(SGPRSaveKind K, Register R)
      : Kind(K), Reg(R) {}

  /// Creates an entry that stores the index \p I.
  PrologEpilogSGPRSaveRestoreInfo(SGPRSaveKind K, int I) : Kind(K), Index(I) {}

  SGPRSaveKind getKind() const { return Kind; }

  /// Reads the shared storage as an index.
  int getIndex() const { return Index; }

  /// Reads the shared storage as a register.
  Register getReg() const { return Reg; }
};


struct VGPRBlock2IndexFunctor {

  using argument_type = Register;

  unsigned operator()(Register Reg) const {

    assert(AMDGPU::VReg_1024RegClass.contains(Reg) && "Expecting a VGPR block");


    const MCRegister FirstVGPRBlock = AMDGPU::VReg_1024RegClass.getRegister(0);

    return Reg - FirstVGPRBlock;

  }

};


/// This class keeps track of the SPI_PS_INPUT_ADDR config register, which
/// tells the hardware which interpolation parameters to load.

class SIMachineFunctionInfo final : public AMDGPUMachineFunction,

                                    private MachineRegisterInfo::Delegate {

  // GCNTargetMachine is granted access to the private members.
  friend class GCNTargetMachine;

  // State of MODE register, assumed FP mode.
  SIModeRegisterDefaults Mode;

  // Registers that may be reserved for spilling purposes. These may be the same
  // as the input registers.
  Register ScratchRSrcReg = AMDGPU::PRIVATE_RSRC_REG;

  // This is the unswizzled offset from the current dispatch's scratch wave
  // base to the beginning of the current function's frame.
  Register FrameOffsetReg = AMDGPU::FP_REG;

  // This is an ABI register used in the non-entry calling convention to
  // communicate the unswizzled offset from the current dispatch's scratch wave
  // base to the beginning of the new function's frame.
  Register StackPtrOffsetReg = AMDGPU::SP_REG;

  // Registers that may be reserved when RA doesn't allocate enough
  // registers to plan for the case where an indirect branch ends up
  // being needed during branch relaxation.
  Register LongBranchReservedReg;

  // Argument descriptors; written by the add*/set* helpers of this class.
  AMDGPUFunctionArgInfo ArgInfo;

  // Graphics info.
  unsigned PSInputAddr = 0;
  unsigned PSInputEnable = 0;

  /// Number of bytes of arguments this function has on the stack. If the callee
  /// is expected to restore the argument stack this should be a multiple of 16,
  /// all usable during a tail call.
  ///
  /// The alternative would forbid tail call optimisation in some cases: if we
  /// want to transfer control from a function with 8-bytes of stack-argument
  /// space to a function with 16-bytes then misalignment of this value would
  /// make a stack adjustment necessary, which could not be undone by the
  /// callee.
  unsigned BytesInStackArgArea = 0;

  bool ReturnsVoid = true;

  // A pair of default/requested minimum/maximum flat work group sizes.
  // Minimum - first, maximum - second.
  std::pair<unsigned, unsigned> FlatWorkGroupSizes = {0, 0};

  // A pair of default/requested minimum/maximum number of waves per execution
  // unit. Minimum - first, maximum - second.
  std::pair<unsigned, unsigned> WavesPerEU = {0, 0};

  // Pseudo source value object of the GWS resource kind owned by this object.
  const AMDGPUGWSResourcePseudoSourceValue GWSResourcePSV;

  // Default/requested number of work groups for the function.
  SmallVector<unsigned> MaxNumWorkGroups = {0, 0, 0};


private:
  // Running counts of user / system SGPRs handed out so far; incremented by
  // the add* helpers of this class.
  unsigned NumUserSGPRs = 0;
  unsigned NumSystemSGPRs = 0;

  unsigned NumWaveDispatchSGPRs = 0;
  unsigned NumWaveDispatchVGPRs = 0;

  bool HasSpilledSGPRs = false;
  bool HasSpilledVGPRs = false;
  bool HasNonSpillStackObjects = false;
  bool IsStackRealigned = false;

  unsigned NumSpilledSGPRs = 0;
  unsigned NumSpilledVGPRs = 0;

  // Zero means dynamic VGPRs are disabled (see isDynamicVGPREnabled()).
  unsigned DynamicVGPRBlockSize = 0;

  // The size in bytes of the scratch space reserved for the CWSR trap handler
  // to spill some of the dynamic VGPRs.
  unsigned ScratchReservedForDynamicVGPRs = 0;

  // Tracks information about user SGPRs that will be setup by hardware which
  // will apply to all wavefronts of the grid.
  GCNUserSGPRUsageInfo UserSGPRInfo;

  // Feature bits required for inputs passed in system SGPRs.
  bool WorkGroupIDX : 1; // Always initialized.
  bool WorkGroupIDY : 1;
  bool WorkGroupIDZ : 1;
  bool WorkGroupInfo : 1;
  bool LDSKernelId : 1;
  bool PrivateSegmentWaveByteOffset : 1;

  bool WorkItemIDX : 1; // Always initialized.
  bool WorkItemIDY : 1;
  bool WorkItemIDZ : 1;

  // Pointer to where the ABI inserts special kernel arguments separate from the
  // user arguments. This is an offset from the KernargSegmentPtr.
  bool ImplicitArgPtr : 1;

  bool MayNeedAGPRs : 1;

  // The hard-wired high half of the address of the global information table
  // for AMDPAL OS type. 0xffffffff represents no hard-wired high half, since
  // current hardware only allows a 16 bit value.
  unsigned GITPtrHigh;

  // No in-class initializer; presumably set by a constructor defined outside
  // this header - TODO confirm.
  unsigned HighBitsOf32BitAddress;

  // Flags associated with the virtual registers.
  IndexedMap<uint8_t, VirtReg2IndexFunctor> VRegFlags;

  // Current recorded maximum possible occupancy.
  unsigned Occupancy;

  // Maximum number of dwords that can be clustered during instruction
  // scheduler stage.
  unsigned MaxMemoryClusterDWords = DefaultMemoryClusterDWordsLimit;


  // Returns the next user SGPR to hand out. Declared here only; the
  // definition is outside this header.
  MCPhysReg getNextUserSGPR() const;

  // Returns the next system SGPR to hand out. Declared here only; the
  // definition is outside this header.
  MCPhysReg getNextSystemSGPR() const;

  // MachineRegisterInfo callback functions to notify events.
  void MRI_NoteNewVirtualRegister(Register Reg) override;
  void MRI_NoteCloneVirtualRegister(Register NewReg, Register SrcReg) override;


public:

  // Per-frame-index record stored in VGPRToAGPRSpills.
  struct VGPRSpillToAGPR {
    // One physical register per lane; indexed by lane in
    // getVGPRToAGPRSpill().
    SmallVector<MCPhysReg, 32> Lanes;
    bool FullyAllocated = false;
    // Set to true by setVGPRToAGPRSpillDead().
    bool IsDead = false;
  };


private:

  // To track virtual VGPR + lane index for each subregister of the SGPR spilled
  // to frameindex key during SILowerSGPRSpills pass.
  DenseMap<int, std::vector<SIRegisterInfo::SpilledReg>>
      SGPRSpillsToVirtualVGPRLanes;
  // To track physical VGPR + lane index for CSR SGPR spills and special SGPRs
  // like Frame Pointer identified during PrologEpilogInserter.
  DenseMap<int, std::vector<SIRegisterInfo::SpilledReg>>
      SGPRSpillsToPhysicalVGPRLanes;
  unsigned NumVirtualVGPRSpillLanes = 0;
  unsigned NumPhysicalVGPRSpillLanes = 0;
  // Exposed through getSGPRSpillVGPRs() / getSGPRSpillPhysVGPRs().
  SmallVector<Register, 2> SpillVGPRs;
  SmallVector<Register, 2> SpillPhysVGPRs;
  using WWMSpillsMap = MapVector<Register, int>;
  // To track the registers used in instructions that can potentially modify the
  // inactive lanes. The WWM instructions and the writelane instructions for
  // spilling SGPRs to VGPRs fall under such category of operations. The VGPRs
  // modified by them should be spilled/restored at function prolog/epilog to
  // avoid any undesired outcome. Each entry in this map holds a pair of values,
  // the VGPR and its stack slot index.
  WWMSpillsMap WWMSpills;

  // Before allocation, the VGPR registers are partitioned into two distinct
  // sets, the first one for WWM-values and the second set for non-WWM values.
  // The latter set should be reserved during WWM-regalloc.
  BitVector NonWWMRegMask;

  using ReservedRegSet = SmallSetVector<Register, 8>;
  // To track the VGPRs reserved for WWM instructions. They get stack slots
  // later during PrologEpilogInserter and get added into the superset WWMSpills
  // for actual spilling. A separate set makes the register reserved part and
  // the serialization easier.
  ReservedRegSet WWMReservedRegs;

  bool IsWholeWaveFunction = false;

  using PrologEpilogSGPRSpill =
      std::pair<Register, PrologEpilogSGPRSaveRestoreInfo>;
  // To track the SGPR spill method used for a CSR SGPR register during
  // frame lowering. Even though the SGPR spills are handled during
  // SILowerSGPRSpills pass, some special handling needed later during the
  // PrologEpilogInserter.
  // The vector is kept sorted by register (see addToPrologEpilogSGPRSpills()).
  SmallVector<PrologEpilogSGPRSpill, 3> PrologEpilogSGPRSpills;

  // To save/restore EXEC MASK around WWM spills and copies.
  Register SGPRForEXECCopy;

  // Keyed by frame index.
  DenseMap<int, VGPRSpillToAGPR> VGPRToAGPRSpills;

  // AGPRs used for VGPR spills.
  SmallVector<MCPhysReg, 32> SpillAGPR;

  // VGPRs used for AGPR spills.
  SmallVector<MCPhysReg, 32> SpillVGPR;

  // Emergency stack slot. Sometimes, we create this before finalizing the stack
  // frame, so save it here and add it to the RegScavenger later.
  std::optional<int> ScavengeFI;

  // Map each VGPR CSR to the mask needed to save and restore it using block
  // load/store instructions. Only used if the subtarget feature for VGPR block
  // load/store is enabled.
  IndexedMap<uint32_t, VGPRBlock2IndexFunctor> MaskForVGPRBlockOps;


private:

  // Read and written through getVGPRForAGPRCopy() / setVGPRForAGPRCopy().
  Register VGPRForAGPRCopy;

  // Private allocation helpers for SGPR spills into virtual / physical VGPR
  // lanes. Declared here only; the definitions are outside this header.
  bool allocateVirtualVGPRForSGPRSpills(MachineFunction &MF, int FI,
                                        unsigned LaneIndex);
  bool allocatePhysicalVGPRForSGPRSpills(MachineFunction &MF, int FI,
                                         unsigned LaneIndex,
                                         bool IsPrologEpilog);


public:

  /// Returns the stored VGPRForAGPRCopy register.
  Register getVGPRForAGPRCopy() const { return VGPRForAGPRCopy; }

  /// Overwrites the stored VGPRForAGPRCopy register with
  /// \p NewVGPRForAGPRCopy.
  void setVGPRForAGPRCopy(Register NewVGPRForAGPRCopy) {
    VGPRForAGPRCopy = NewVGPRForAGPRCopy;
  }


  // Declared here only; the definition is outside this header. Presumably
  // tests whether \p Reg appears in the list \p CSRegs - TODO confirm.
  bool isCalleeSavedReg(const MCPhysReg *CSRegs, MCPhysReg Reg) const;


  /// Stores \p Mask as the block-operation mask for \p RegisterBlock.
  void setMaskForVGPRBlockOps(Register RegisterBlock, uint32_t Mask) {
    // Grow the map first so that the indexed store below is in bounds.
    MaskForVGPRBlockOps.grow(RegisterBlock);
    MaskForVGPRBlockOps[RegisterBlock] = Mask;
  }


  /// Returns the mask stored for \p RegisterBlock. No bounds check is done
  /// here; use hasMaskForVGPRBlockOps() first.
  uint32_t getMaskForVGPRBlockOps(Register RegisterBlock) const {
    const uint32_t Mask = MaskForVGPRBlockOps[RegisterBlock];
    return Mask;
  }

  /// True when \p RegisterBlock lies within the bounds of the mask map.
  bool hasMaskForVGPRBlockOps(Register RegisterBlock) const {
    const bool InRange = MaskForVGPRBlockOps.inBounds(RegisterBlock);
    return InRange;
  }


public:

  // Member-wise copy.
  SIMachineFunctionInfo(const SIMachineFunctionInfo &MFI) = default;
  // Declared here only; the definition is outside this header.
  SIMachineFunctionInfo(const Function &F, const GCNSubtarget *STI);

  // Override of the MachineFunctionInfo cloning hook; defined outside this
  // header.
  MachineFunctionInfo *
  clone(BumpPtrAllocator &Allocator, MachineFunction &DestMF,
        const DenseMap<MachineBasicBlock *, MachineBasicBlock *> &Src2DstMBB)
      const override;

  // Initializes this object from its YAML form \p YamlMFI; defined outside
  // this header. NOTE(review): the meaning of the bool result is not visible
  // here - confirm against the definition.
  bool initializeBaseYamlFields(const yaml::SIMachineFunctionInfo &YamlMFI,
                                const MachineFunction &MF,
                                PerFunctionMIParsingState &PFS,
                                SMDiagnostic &Error, SMRange &SourceRange);


  /// Adds \p Reg to the set of WWM-reserved registers.
  void reserveWWMRegister(Register Reg) { WWMReservedRegs.insert(Reg); }

  /// A virtual register is a WWM register when its WWM_REG flag is set; any
  /// other register is one when it is in the WWM-reserved set.
  bool isWWMReg(Register Reg) const {
    if (Reg.isVirtual())
      return checkFlag(Reg, AMDGPU::VirtRegFlag::WWM_REG);
    return WWMReservedRegs.contains(Reg);
  }


  void updateNonWWMRegMask(BitVector &RegMask) { NonWWMRegMask = RegMask; }

  BitVector getNonWWMRegMask() const { return NonWWMRegMask; }

  void clearNonWWMRegAllocMask() { NonWWMRegMask.clear(); }


  /// Returns a copy of the stored mode register defaults.
  SIModeRegisterDefaults getMode() const { return Mode; }


  /// Returns the virtual-VGPR lane assignments recorded for \p FrameIndex,
  /// or an empty array when nothing is recorded for it.
  ArrayRef<SIRegisterInfo::SpilledReg>
  getSGPRSpillToVirtualVGPRLanes(int FrameIndex) const {
    const auto Found = SGPRSpillsToVirtualVGPRLanes.find(FrameIndex);
    if (Found == SGPRSpillsToVirtualVGPRLanes.end())
      return ArrayRef<SIRegisterInfo::SpilledReg>();
    return ArrayRef(Found->second);
  }


  // Read-only views of the SpillVGPRs / SpillPhysVGPRs vectors.
  ArrayRef<Register> getSGPRSpillVGPRs() const { return SpillVGPRs; }
  ArrayRef<Register> getSGPRSpillPhysVGPRs() const { return SpillPhysVGPRs; }

  // Read-only access to the WWM spill map and the WWM-reserved register set.
  const WWMSpillsMap &getWWMSpills() const { return WWMSpills; }
  const ReservedRegSet &getWWMReservedRegs() const { return WWMReservedRegs; }

  // True when \p Reg is in the WWM-reserved register set.
  bool isWWMReservedRegister(Register Reg) const {
    return WWMReservedRegs.contains(Reg);
  }

  bool isWholeWaveFunction() const { return IsWholeWaveFunction; }


  // Returns a read-only view of the prolog/epilog SGPR spill entries. In
  // assert-enabled builds this checks that the entries are sorted by their
  // first element (the register).
  ArrayRef<PrologEpilogSGPRSpill> getPrologEpilogSGPRSpills() const {
    assert(is_sorted(PrologEpilogSGPRSpills, llvm::less_first()));
    return PrologEpilogSGPRSpills;
  }

  // Mutable access to the user SGPR usage information.
  GCNUserSGPRUsageInfo &getUserSGPRInfo() { return UserSGPRInfo; }

  // Read-only access to the user SGPR usage information.
  const GCNUserSGPRUsageInfo &getUserSGPRInfo() const { return UserSGPRInfo; }


  /// Records the save/restore method \p SI for \p Reg. \p Reg must not have an
  /// entry yet (asserted).
  void addToPrologEpilogSGPRSpills(Register Reg,
                                   PrologEpilogSGPRSaveRestoreInfo SI) {
    assert(!hasPrologEpilogSGPRSpillEntry(Reg));

    // Find the first entry whose register orders after Reg so that inserting
    // there keeps the vector sorted. The vector is expected to be very short,
    // which makes the insertion cheap.
    auto *InsertPos = upper_bound(
        PrologEpilogSGPRSpills, Reg,
        [](const auto &Key, const auto &Entry) { return Key < Entry.first; });
    PrologEpilogSGPRSpills.insert(InsertPos, std::make_pair(Reg, SI));
  }


  // Returns true when PrologEpilogSGPRSpills holds an entry for \p Reg and
  // false otherwise.
  bool hasPrologEpilogSGPRSpillEntry(Register Reg) const {
    return llvm::any_of(PrologEpilogSGPRSpills,
                        [Reg](const PrologEpilogSGPRSpill &Entry) {
                          return Entry.first == Reg;
                        });
  }


  // Returns the scratch SGPR that \p Reg is copied to, or AMDGPU::NoRegister
  // when \p Reg has no entry or its entry uses a different save kind.
  Register getScratchSGPRCopyDstReg(Register Reg) const {
    const PrologEpilogSGPRSpill *Found =
        find_if(PrologEpilogSGPRSpills,
                [Reg](const PrologEpilogSGPRSpill &Entry) {
                  return Entry.first == Reg;
                });

    if (Found == PrologEpilogSGPRSpills.end() ||
        Found->second.getKind() != SGPRSaveKind::COPY_TO_SCRATCH_SGPR)
      return AMDGPU::NoRegister;

    return Found->second.getReg();
  }


  // Appends to \p Regs the destination register of every entry whose save
  // kind is COPY_TO_SCRATCH_SGPR, in entry order.
  void getAllScratchSGPRCopyDstRegs(SmallVectorImpl<Register> &Regs) const {
    for (const PrologEpilogSGPRSpill &Entry : PrologEpilogSGPRSpills) {
      const PrologEpilogSGPRSaveRestoreInfo &Info = Entry.second;
      if (Info.getKind() != SGPRSaveKind::COPY_TO_SCRATCH_SGPR)
        continue;
      Regs.push_back(Info.getReg());
    }
  }


  // Check if \p FI is allocated for any SGPR spill to a VGPR lane during PEI.

  bool checkIndexInPrologEpilogSGPRSpills(int FI) const {

    return find_if(PrologEpilogSGPRSpills,

                   [FI](const std::pair<Register,

                                        PrologEpilogSGPRSaveRestoreInfo> &SI) {

                     return SI.second.getKind() ==

                                SGPRSaveKind::SPILL_TO_VGPR_LANE &&

                            SI.second.getIndex() == FI;

                   }) != PrologEpilogSGPRSpills.end();

  }


  /// Returns the save/restore information recorded for \p Reg. An entry for
  /// \p Reg must exist (asserted).
  const PrologEpilogSGPRSaveRestoreInfo &
  getPrologEpilogSGPRSaveRestoreInfo(Register Reg) const {
    const PrologEpilogSGPRSpill *Found =
        find_if(PrologEpilogSGPRSpills,
                [Reg](const PrologEpilogSGPRSpill &Entry) {
                  return Entry.first == Reg;
                });
    assert(Found != PrologEpilogSGPRSpills.end());

    return Found->second;
  }


  /// Returns the physical-VGPR lane assignments recorded for \p FrameIndex,
  /// or an empty array when nothing is recorded for it.
  ArrayRef<SIRegisterInfo::SpilledReg>
  getSGPRSpillToPhysicalVGPRLanes(int FrameIndex) const {
    const auto Found = SGPRSpillsToPhysicalVGPRLanes.find(FrameIndex);
    if (Found == SGPRSpillsToPhysicalVGPRLanes.end())
      return ArrayRef<SIRegisterInfo::SpilledReg>();
    return ArrayRef(Found->second);
  }


  /// ORs \p Flag into the flags of the virtual register \p Reg. Nothing is
  /// changed when \p Reg is outside the bounds of the flag map.
  void setFlag(Register Reg, uint8_t Flag) {
    assert(Reg.isVirtual());
    if (!VRegFlags.inBounds(Reg))
      return;
    VRegFlags[Reg] |= Flag;
  }


  /// True when any bit of \p Flag is set in the flags stored for \p Reg.
  /// Physical registers and registers outside the bounds of the flag map
  /// always yield false.
  bool checkFlag(Register Reg, uint8_t Flag) const {
    if (Reg.isPhysical() || !VRegFlags.inBounds(Reg))
      return false;
    return (VRegFlags[Reg] & Flag) != 0;
  }


  bool hasVRegFlags() { return VRegFlags.size(); }


  // Declared here only; the definition is outside this header. \p Size
  // defaults to 4 and \p Alignment to Align(4).
  void allocateWWMSpill(MachineFunction &MF, Register VGPR, uint64_t Size = 4,
                        Align Alignment = Align(4));

  // Declared here only; the definition is outside this header. Judging by the
  // parameter names, the results are returned through \p CalleeSavedRegs and
  // \p ScratchRegs - TODO confirm against the definition.
  void splitWWMSpillRegisters(
      MachineFunction &MF,
      SmallVectorImpl<std::pair<Register, int>> &CalleeSavedRegs,
      SmallVectorImpl<std::pair<Register, int>> &ScratchRegs) const;


  // Returns a read-only view of SpillAGPR.
  // NOTE(review): the member comment describes SpillAGPR as "AGPRs used for
  // VGPR spills", which reads opposite to this accessor's name - confirm the
  // intended naming with the callers.
  ArrayRef<MCPhysReg> getAGPRSpillVGPRs() const {
    return SpillAGPR;
  }

  // Returns the register stored for EXEC copies.
  Register getSGPRForEXECCopy() const { return SGPRForEXECCopy; }

  // Overwrites the register stored for EXEC copies.
  void setSGPRForEXECCopy(Register Reg) { SGPRForEXECCopy = Reg; }

  // Returns a read-only view of SpillVGPR.
  // NOTE(review): the member comment describes SpillVGPR as "VGPRs used for
  // AGPR spills", which reads opposite to this accessor's name - confirm the
  // intended naming with the callers.
  ArrayRef<MCPhysReg> getVGPRSpillAGPRs() const {
    return SpillVGPR;
  }


  /// Returns the register recorded for lane \p Lane of \p FrameIndex, or
  /// AMDGPU::NoRegister when \p FrameIndex has no entry. \p Lane is not
  /// range-checked here.
  MCPhysReg getVGPRToAGPRSpill(int FrameIndex, unsigned Lane) const {
    const auto Entry = VGPRToAGPRSpills.find(FrameIndex);
    if (Entry == VGPRToAGPRSpills.end())
      return static_cast<MCPhysReg>(AMDGPU::NoRegister);
    return Entry->second.Lanes[Lane];
  }


  /// Marks the entry recorded for \p FrameIndex as dead. Does nothing when no
  /// entry exists.
  void setVGPRToAGPRSpillDead(int FrameIndex) {
    if (auto Entry = VGPRToAGPRSpills.find(FrameIndex);
        Entry != VGPRToAGPRSpills.end())
      Entry->second.IsDead = true;
  }


  // To bring the allocated WWM registers in \p WWMVGPRs to the lowest available
  // range.
  // Declared here only; the definition is outside this header.
  void shiftWwmVGPRsToLowestRange(MachineFunction &MF,
                                  SmallVectorImpl<Register> &WWMVGPRs,
                                  BitVector &SavedVGPRs);

  // Allocation entry points for spills, keyed by frame index \p FI. Declared
  // here only. NOTE(review): the meaning of the bool results is not visible
  // in this header - confirm against the definitions.
  bool allocateSGPRSpillToVGPRLane(MachineFunction &MF, int FI,
                                   bool SpillToPhysVGPRLane = false,
                                   bool IsPrologEpilog = false);
  bool allocateVGPRSpillToAGPR(MachineFunction &MF, int FI, bool isAGPRtoVGPR);

  /// If \p ResetSGPRSpillStackIDs is true, reset the stack ID from sgpr-spill
  /// to the default stack.
  bool removeDeadFrameIndices(MachineFrameInfo &MFI,
                              bool ResetSGPRSpillStackIDs);

  // Declared here only; the definition is outside this header.
  int getScavengeFI(MachineFrameInfo &MFI, const SIRegisterInfo &TRI);
  // Returns the stored scavenging frame index, which may be empty.
  std::optional<int> getOptionalScavengeFI() const { return ScavengeFI; }


  /// Returns the stored number of bytes of stack arguments.
  unsigned getBytesInStackArgArea() const { return BytesInStackArgArea; }

  /// Overwrites the stored number of bytes of stack arguments with \p Bytes.
  void setBytesInStackArgArea(unsigned Bytes) { BytesInStackArgArea = Bytes; }


  /// Dynamic VGPRs count as enabled when the block size is non-zero.
  bool isDynamicVGPREnabled() const { return DynamicVGPRBlockSize != 0; }

  /// Returns the stored dynamic VGPR block size.
  unsigned getDynamicVGPRBlockSize() const { return DynamicVGPRBlockSize; }

  /// Returns the stored scratch size reserved for dynamic VGPRs. This is only
  /// used if we need to save any dynamic VGPRs in scratch.
  unsigned getScratchReservedForDynamicVGPRs() const {
    const unsigned Reserved = ScratchReservedForDynamicVGPRs;
    return Reserved;
  }

  /// Overwrites the stored scratch size reserved for dynamic VGPRs with
  /// \p SizeInBytes.
  void setScratchReservedForDynamicVGPRs(unsigned SizeInBytes) {
    ScratchReservedForDynamicVGPRs = SizeInBytes;
  }


  // Add user SGPRs.
  // All of the following are declared here only; their definitions are
  // outside this header. Each one returns a Register.
  Register addPrivateSegmentBuffer(const SIRegisterInfo &TRI);
  Register addDispatchPtr(const SIRegisterInfo &TRI);
  Register addQueuePtr(const SIRegisterInfo &TRI);
  Register addKernargSegmentPtr(const SIRegisterInfo &TRI);
  Register addDispatchID(const SIRegisterInfo &TRI);
  Register addFlatScratchInit(const SIRegisterInfo &TRI);
  Register addPrivateSegmentSize(const SIRegisterInfo &TRI);
  Register addImplicitBufferPtr(const SIRegisterInfo &TRI);
  Register addLDSKernelId();
  // NOTE(review): ownership and nullability of the returned pointer are not
  // visible in this header - confirm against the definition.
  SmallVectorImpl<MCRegister> *
  addPreloadedKernArg(const SIRegisterInfo &TRI, const TargetRegisterClass *RC,
                      unsigned AllocSizeDWord, int KernArgIdx,
                      int PaddingSGPRs);


  /// Reserve one user SGPR that is used only to pad the argument list.
  /// \returns the register reported by getNextUserSGPR() before NumUserSGPRs
  /// is incremented.
  Register addReservedUserSGPR() {
    Register Reserved = getNextUserSGPR();
    NumUserSGPRs += 1;
    return Reserved;
  }


  // Add system SGPRs.

  /// Bind ArgInfo.WorkGroupIDX to the register returned by
  /// getNextSystemSGPR() and count one more system SGPR.
  /// \returns the register now recorded in ArgInfo.WorkGroupIDX.
  Register addWorkGroupIDX() {
    auto &Desc = ArgInfo.WorkGroupIDX;
    Desc = ArgDescriptor::createRegister(getNextSystemSGPR());
    ++NumSystemSGPRs;
    return Desc.getRegister();
  }


  /// Bind ArgInfo.WorkGroupIDY to the register returned by
  /// getNextSystemSGPR() and count one more system SGPR.
  /// \returns the register now recorded in ArgInfo.WorkGroupIDY.
  Register addWorkGroupIDY() {
    auto &Desc = ArgInfo.WorkGroupIDY;
    Desc = ArgDescriptor::createRegister(getNextSystemSGPR());
    ++NumSystemSGPRs;
    return Desc.getRegister();
  }


  /// Bind ArgInfo.WorkGroupIDZ to the register returned by
  /// getNextSystemSGPR() and count one more system SGPR.
  /// \returns the register now recorded in ArgInfo.WorkGroupIDZ.
  Register addWorkGroupIDZ() {
    auto &Desc = ArgInfo.WorkGroupIDZ;
    Desc = ArgDescriptor::createRegister(getNextSystemSGPR());
    ++NumSystemSGPRs;
    return Desc.getRegister();
  }


  /// Bind ArgInfo.WorkGroupInfo to the register returned by
  /// getNextSystemSGPR() and count one more system SGPR.
  /// \returns the register now recorded in ArgInfo.WorkGroupInfo.
  Register addWorkGroupInfo() {
    auto &Desc = ArgInfo.WorkGroupInfo;
    Desc = ArgDescriptor::createRegister(getNextSystemSGPR());
    ++NumSystemSGPRs;
    return Desc.getRegister();
  }


  /// \returns the LDSKernelId flag.
  bool hasLDSKernelId() const {
    return LDSKernelId;
  }


  // Add special VGPR inputs

  /// Record \p Arg as the descriptor stored in ArgInfo.WorkItemIDX.
  void setWorkItemIDX(ArgDescriptor Arg) { ArgInfo.WorkItemIDX = Arg; }


  /// Record \p Arg as the descriptor stored in ArgInfo.WorkItemIDY.
  void setWorkItemIDY(ArgDescriptor Arg) { ArgInfo.WorkItemIDY = Arg; }


  /// Record \p Arg as the descriptor stored in ArgInfo.WorkItemIDZ.
  void setWorkItemIDZ(ArgDescriptor Arg) { ArgInfo.WorkItemIDZ = Arg; }


  /// Bind ArgInfo.PrivateSegmentWaveByteOffset to the register returned by
  /// getNextSystemSGPR() and count one more system SGPR.
  /// \returns the register now recorded in that descriptor.
  Register addPrivateSegmentWaveByteOffset() {
    auto &Desc = ArgInfo.PrivateSegmentWaveByteOffset;
    Desc = ArgDescriptor::createRegister(getNextSystemSGPR());
    ++NumSystemSGPRs;
    return Desc.getRegister();
  }


  /// Replace ArgInfo.PrivateSegmentWaveByteOffset with a register descriptor
  /// for \p Reg. The system SGPR count is left untouched.
  void setPrivateSegmentWaveByteOffset(Register Reg) {
    auto &Desc = ArgInfo.PrivateSegmentWaveByteOffset;
    Desc = ArgDescriptor::createRegister(Reg);
  }


  /// \returns the WorkGroupIDX flag.
  bool hasWorkGroupIDX() const { return WorkGroupIDX; }


  /// \returns the WorkGroupIDY flag.
  bool hasWorkGroupIDY() const { return WorkGroupIDY; }


  /// \returns the WorkGroupIDZ flag.
  bool hasWorkGroupIDZ() const { return WorkGroupIDZ; }


  /// \returns the WorkGroupInfo flag.
  bool hasWorkGroupInfo() const { return WorkGroupInfo; }


  /// \returns the PrivateSegmentWaveByteOffset flag.
  bool hasPrivateSegmentWaveByteOffset() const { return PrivateSegmentWaveByteOffset; }


  /// \returns the WorkItemIDX flag.
  bool hasWorkItemIDX() const { return WorkItemIDX; }


  /// \returns the WorkItemIDY flag.
  bool hasWorkItemIDY() const { return WorkItemIDY; }


  /// \returns the WorkItemIDZ flag.
  bool hasWorkItemIDZ() const { return WorkItemIDZ; }


  /// \returns the ImplicitArgPtr flag.
  bool hasImplicitArgPtr() const { return ImplicitArgPtr; }


  /// \returns a mutable reference to the ArgInfo member.
  AMDGPUFunctionArgInfo &getArgInfo() { return ArgInfo; }


  /// \returns a read-only reference to the ArgInfo member.
  const AMDGPUFunctionArgInfo &getArgInfo() const { return ArgInfo; }


  /// Forward the query for \p Value to ArgInfo.getPreloadedValue().
  /// \returns the (descriptor, register class, LLT) tuple it produces.
  std::tuple<const ArgDescriptor *, const TargetRegisterClass *, LLT>
  getPreloadedValue(AMDGPUFunctionArgInfo::PreloadedValue Value) const {
    auto Result = ArgInfo.getPreloadedValue(Value);
    return Result;
  }


  /// Look up the descriptor for \p Value through ArgInfo.getPreloadedValue().
  /// \returns the descriptor's register, or a default-constructed MCRegister
  /// when the lookup yields a null descriptor.
  MCRegister getPreloadedReg(AMDGPUFunctionArgInfo::PreloadedValue Value) const {
    const ArgDescriptor *Desc = std::get<0>(ArgInfo.getPreloadedValue(Value));
    if (!Desc)
      return MCRegister();
    return Desc->getRegister();
  }


  /// \returns the stored GITPtrHigh value.
  unsigned getGITPtrHigh() const { return GITPtrHigh; }


  // Declared here and defined out of line; returns a Register for \p MF.
  // NOTE(review): how the register is chosen is not visible from this header.
  Register getGITPtrLoReg(const MachineFunction &MF) const;


  /// \returns the stored HighBitsOf32BitAddress value.
  uint32_t get32BitAddressHighBits() const { return HighBitsOf32BitAddress; }


  /// \returns the current NumUserSGPRs count.
  unsigned getNumUserSGPRs() const { return NumUserSGPRs; }


  /// \returns the sum of the user and system SGPR counts.
  unsigned getNumPreloadedSGPRs() const {
    const unsigned Total = NumUserSGPRs + NumSystemSGPRs;
    return Total;
  }


  /// \returns the count reported by UserSGPRInfo.getNumKernargPreloadSGPRs().
  unsigned getNumKernargPreloadedSGPRs() const { return UserSGPRInfo.getNumKernargPreloadSGPRs(); }


  /// \returns the stored NumWaveDispatchSGPRs value.
  unsigned getNumWaveDispatchSGPRs() const {
    return NumWaveDispatchSGPRs;
  }


  /// Store \p Count as the new NumWaveDispatchSGPRs value.
  void setNumWaveDispatchSGPRs(unsigned Count) {
    NumWaveDispatchSGPRs = Count;
  }


  /// \returns the stored NumWaveDispatchVGPRs value.
  unsigned getNumWaveDispatchVGPRs() const {
    return NumWaveDispatchVGPRs;
  }


  /// Store \p Count as the new NumWaveDispatchVGPRs value.
  void setNumWaveDispatchVGPRs(unsigned Count) {
    NumWaveDispatchVGPRs = Count;
  }


  /// \returns the register held by ArgInfo.PrivateSegmentWaveByteOffset.
  Register getPrivateSegmentWaveByteOffsetSystemSGPR() const {
    const auto &Desc = ArgInfo.PrivateSegmentWaveByteOffset;
    return Desc.getRegister();
  }


  /// \returns the physical register reserved for use as the resource
  /// descriptor for scratch accesses (the stored ScratchRSrcReg).
  Register getScratchRSrcReg() const { return ScratchRSrcReg; }


  /// Store \p Reg as ScratchRSrcReg. In assert-enabled builds a zero
  /// register is rejected before the store.
  void setScratchRSrcReg(Register Reg) {
    assert(Reg != 0 && "Should never be unset");
    this->ScratchRSrcReg = Reg;
  }


  /// \returns the stored FrameOffsetReg.
  Register getFrameOffsetReg() const { return FrameOffsetReg; }


  /// Store \p Reg as FrameOffsetReg. In assert-enabled builds a zero
  /// register is rejected before the store.
  void setFrameOffsetReg(Register Reg) {
    assert(Reg != 0 && "Should never be unset");
    this->FrameOffsetReg = Reg;
  }


  /// Store \p Reg as StackPtrOffsetReg. In assert-enabled builds a zero
  /// register is rejected before the store.
  void setStackPtrOffsetReg(Register Reg) {
    assert(Reg != 0 && "Should never be unset");
    this->StackPtrOffsetReg = Reg;
  }


  /// Store \p Reg as LongBranchReservedReg; no validity check is performed.
  void setLongBranchReservedReg(Register Reg) {
    LongBranchReservedReg = Reg;
  }


  /// \returns the stored StackPtrOffsetReg.
  ///
  /// The "unset" value of this register is AMDGPU::SP_REG, not NoRegister.
  /// That is mostly a workaround for MIR tests, where state that cannot be
  /// directly computed from the function is not preserved in serialized MIR.
  Register getStackPtrOffsetReg() const { return StackPtrOffsetReg; }


  /// \returns the stored LongBranchReservedReg.
  Register getLongBranchReservedReg() const {
    return LongBranchReservedReg;
  }


  /// \returns the register held by ArgInfo.QueuePtr.
  Register getQueuePtrUserSGPR() const {
    const auto &Desc = ArgInfo.QueuePtr;
    return Desc.getRegister();
  }


  /// \returns the register held by ArgInfo.ImplicitBufferPtr.
  Register getImplicitBufferPtrUserSGPR() const {
    const auto &Desc = ArgInfo.ImplicitBufferPtr;
    return Desc.getRegister();
  }


  /// \returns the HasSpilledSGPRs flag.
  bool hasSpilledSGPRs() const { return HasSpilledSGPRs; }


  /// Set the HasSpilledSGPRs flag to \p Spill (true when omitted).
  void setHasSpilledSGPRs(bool Spill = true) { HasSpilledSGPRs = Spill; }


  /// \returns the HasSpilledVGPRs flag.
  bool hasSpilledVGPRs() const { return HasSpilledVGPRs; }


  /// Set the HasSpilledVGPRs flag to \p Spill (true when omitted).
  void setHasSpilledVGPRs(bool Spill = true) { HasSpilledVGPRs = Spill; }


  /// \returns the HasNonSpillStackObjects flag.
  bool hasNonSpillStackObjects() const { return HasNonSpillStackObjects; }


  /// Set the HasNonSpillStackObjects flag to \p StackObject (true when
  /// omitted).
  void setHasNonSpillStackObjects(bool StackObject = true) { HasNonSpillStackObjects = StackObject; }


  /// \returns the IsStackRealigned flag.
  bool isStackRealigned() const { return IsStackRealigned; }


  /// Set the IsStackRealigned flag to \p Realigned (true when omitted).
  void setIsStackRealigned(bool Realigned = true) { IsStackRealigned = Realigned; }


  /// \returns the running NumSpilledSGPRs total.
  unsigned getNumSpilledSGPRs() const { return NumSpilledSGPRs; }


  /// \returns the running NumSpilledVGPRs total.
  unsigned getNumSpilledVGPRs() const { return NumSpilledVGPRs; }


  /// Add \p num to the running NumSpilledSGPRs total.
  void addToSpilledSGPRs(unsigned num) { NumSpilledSGPRs += num; }


  /// Add \p num to the running NumSpilledVGPRs total.
  void addToSpilledVGPRs(unsigned num) { NumSpilledVGPRs += num; }


  /// \returns the stored PSInputAddr bit mask.
  unsigned getPSInputAddr() const { return PSInputAddr; }


  /// \returns the stored PSInputEnable bit mask.
  unsigned getPSInputEnable() const { return PSInputEnable; }


  /// \returns true if bit \p Index is set in PSInputAddr.
  ///
  /// The mask is built from an unsigned one so that the shift is never
  /// performed on a signed int (with a plain `1`, Index 31 would shift into
  /// the sign bit). \p Index must be smaller than the bit width of unsigned.
  bool isPSInputAllocated(unsigned Index) const {
    return (PSInputAddr & (1u << Index)) != 0;
  }


  /// Set bit \p Index in PSInputAddr.
  ///
  /// The mask is built from an unsigned one so that the shift is never
  /// performed on a signed int (with a plain `1`, Index 31 would shift into
  /// the sign bit). \p Index must be smaller than the bit width of unsigned.
  void markPSInputAllocated(unsigned Index) {
    PSInputAddr |= 1u << Index;
  }


  /// Set bit \p Index in PSInputEnable.
  ///
  /// The mask is built from an unsigned one so that the shift is never
  /// performed on a signed int (with a plain `1`, Index 31 would shift into
  /// the sign bit). \p Index must be smaller than the bit width of unsigned.
  void markPSInputEnabled(unsigned Index) {
    PSInputEnable |= 1u << Index;
  }


  /// \returns the ReturnsVoid flag.
  bool returnsVoid() const { return ReturnsVoid; }


  /// Set the ReturnsVoid flag to \p Value.
  void setIfReturnsVoid(bool Value) { ReturnsVoid = Value; }


  /// \returns the default/requested (minimum, maximum) flat work group sizes
  /// for this function, as a pair.
  std::pair<unsigned, unsigned> getFlatWorkGroupSizes() const { return FlatWorkGroupSizes; }


  /// \returns the default/requested minimum flat work group size for this
  /// function (first element of FlatWorkGroupSizes).
  unsigned getMinFlatWorkGroupSize() const { return FlatWorkGroupSizes.first; }


  /// \returns the default/requested maximum flat work group size for this
  /// function (second element of FlatWorkGroupSizes).
  unsigned getMaxFlatWorkGroupSize() const { return FlatWorkGroupSizes.second; }


  /// \returns the default/requested (minimum, maximum) number of waves per
  /// execution unit, as a pair.
  std::pair<unsigned, unsigned> getWavesPerEU() const { return WavesPerEU; }


  /// \returns the default/requested minimum number of waves per execution
  /// unit (first element of WavesPerEU).
  unsigned getMinWavesPerEU() const { return WavesPerEU.first; }


  /// \returns the default/requested maximum number of waves per execution
  /// unit (second element of WavesPerEU).
  unsigned getMaxWavesPerEU() const { return WavesPerEU.second; }


  /// \returns the address of the GWSResourcePSV member. \p TM is accepted
  /// but not read by this accessor.
  const AMDGPUGWSResourcePseudoSourceValue *
  getGWSPSV(const AMDGPUTargetMachine &TM) {
    const AMDGPUGWSResourcePseudoSourceValue *PSV = &GWSResourcePSV;
    return PSV;
  }


  /// \returns the stored Occupancy value.
  unsigned getOccupancy() const { return Occupancy; }


  /// \returns Occupancy, capped at 4 when the function is memory bound or
  /// needs the wave limiter; otherwise Occupancy unchanged.
  unsigned getMinAllowedOccupancy() const {
    const bool Capped = isMemoryBound() || needsWaveLimiter();
    if (Capped && Occupancy >= 4)
      return 4;
    return Occupancy;
  }


  // Overload taking the function itself; declared here and defined out of line.
  // NOTE(review): presumably derives a limit from \p MF and clamps Occupancy to
  // it -- confirm against the definition.
  void limitOccupancy(const MachineFunction &MF);


  /// Lower Occupancy to \p Limit if it currently exceeds it; a smaller or
  /// equal Occupancy is left unchanged.
  void limitOccupancy(unsigned Limit) {
    if (Limit < Occupancy)
      Occupancy = Limit;
  }


  /// Raise Occupancy to \p Limit if it is currently below it, then apply
  /// limitOccupancy(MF) to the result.
  void increaseOccupancy(const MachineFunction &MF, unsigned Limit) {
    if (Limit > Occupancy)
      Occupancy = Limit;

    limitOccupancy(MF);
  }


  /// \returns the stored MaxMemoryClusterDWords value.
  unsigned getMaxMemoryClusterDWords() const {
    return MaxMemoryClusterDWords;
  }


  /// \returns the MayNeedAGPRs flag.
  bool mayNeedAGPRs() const { return MayNeedAGPRs; }


  /// \returns true if a function has a use of AGPRs via inline asm or
  /// has a call which may use it.

  bool mayUseAGPRs(const Function &F) const;


  /// \returns a copy of the default/requested number of work groups for this
  /// function (the MaxNumWorkGroups vector).
  SmallVector<unsigned> getMaxNumWorkGroups() const {
    return MaxNumWorkGroups;
  }


  /// \returns element 0 of MaxNumWorkGroups.
  unsigned getMaxNumWorkGroupsX() const {
    return MaxNumWorkGroups[0];
  }

  /// \returns element 1 of MaxNumWorkGroups.
  unsigned getMaxNumWorkGroupsY() const {
    return MaxNumWorkGroups[1];
  }

  /// \returns element 2 of MaxNumWorkGroups.
  unsigned getMaxNumWorkGroupsZ() const {
    return MaxNumWorkGroups[2];
  }

};


} // end namespace llvm


#endif // LLVM_LIB_TARGET_AMDGPU_SIMACHINEFUNCTIONINFO_H

assert
assert(UImm &&(UImm !=~static_cast< T >(0)) &&"Invalid immediate!")

AMDGPUArgumentUsageInfo.h

AMDGPUMCTargetDesc.h
Provides AMDGPU specific target descriptions.

AMDGPUMachineFunction.h

AMDGPUTargetMachine.h
The AMDGPU TargetMachine interface definition for hw codegen targets.

A
static GCRegistry::Add< ErlangGC > A("erlang", "erlang-compatible garbage collector")

Index
uint32_t Index
Definition: ELFObjHandler.cpp:83

Size
uint64_t Size
Definition: ELFObjHandler.cpp:81

YamlIO
IO & YamlIO
Definition: ELFYAML.cpp:1327

GCNSubtarget.h
AMD GCN specific subclass of TargetSubtarget.

F
#define F(x, y, z)
Definition: MD5.cpp:55

I
#define I(x, y, z)
Definition: MD5.cpp:58

MIRYamlMapping.h

Reg
Register Reg
Definition: MachineSink.cpp:2117

TRI
Register const TargetRegisterInfo * TRI
Definition: MachineSink.cpp:2118

Register
Promote Memory to Register
Definition: Mem2Reg.cpp:110

PseudoSourceValue.h

Allocator
Basic Register Allocator
Definition: RegAllocBasic.cpp:59

Mode
static cl::opt< RegAllocEvictionAdvisorAnalysisLegacy::AdvisorMode > Mode("regalloc-enable-advisor", cl::Hidden, cl::init(RegAllocEvictionAdvisorAnalysisLegacy::AdvisorMode::Default), cl::desc("Enable regalloc advisor mode"), cl::values(clEnumValN(RegAllocEvictionAdvisorAnalysisLegacy::AdvisorMode::Default, "default", "Default"), clEnumValN(RegAllocEvictionAdvisorAnalysisLegacy::AdvisorMode::Release, "release", "precompiled"), clEnumValN(RegAllocEvictionAdvisorAnalysisLegacy::AdvisorMode::Development, "development", "for training")))

SIInstrInfo.h
Interface definition for SIInstrInfo.

SIModeRegisterDefaults.h

OS
raw_pwrite_stream & OS
Definition: SampleProfWriter.cpp:51

contains
static bool contains(SmallPtrSetImpl< ConstantExpr * > &Cache, ConstantExpr *Expr, Constant *C)
Definition: Value.cpp:480

SetVector.h
This file implements a set that has insertion order iteration characteristics.

SmallVector.h
This file defines the SmallVector class.

RHS
Value * RHS
Definition: X86PartialReduction.cpp:74

LHS
Value * LHS
Definition: X86PartialReduction.cpp:73

llvm::AMDGPUGWSResourcePseudoSourceValue
Definition: SIMachineFunctionInfo.h:65

llvm::AMDGPUGWSResourcePseudoSourceValue::printCustom
void printCustom(raw_ostream &OS) const override
Implement printing for PseudoSourceValue.
Definition: SIMachineFunctionInfo.h:84

llvm::AMDGPUGWSResourcePseudoSourceValue::classof
static bool classof(const PseudoSourceValue *V)
Definition: SIMachineFunctionInfo.h:70

llvm::AMDGPUGWSResourcePseudoSourceValue::AMDGPUGWSResourcePseudoSourceValue
AMDGPUGWSResourcePseudoSourceValue(const AMDGPUTargetMachine &TM)
Definition: SIMachineFunctionInfo.h:67

llvm::AMDGPUGWSResourcePseudoSourceValue::mayAlias
bool mayAlias(const MachineFrameInfo *) const override
Return true if the memory pointed to by this PseudoSourceValue can ever alias an LLVM IR Value.
Definition: SIMachineFunctionInfo.h:80

llvm::AMDGPUGWSResourcePseudoSourceValue::isAliased
bool isAliased(const MachineFrameInfo *) const override
Test whether the memory pointed to by this PseudoSourceValue may also be pointed to by an LLVM IR Val...
Definition: SIMachineFunctionInfo.h:75

llvm::AMDGPUMachineFunction
Definition: AMDGPUMachineFunction.h:24

llvm::AMDGPUMachineFunction::isMemoryBound
bool isMemoryBound() const
Definition: AMDGPUMachineFunction.h:114

llvm::AMDGPUMachineFunction::needsWaveLimiter
bool needsWaveLimiter() const
Definition: AMDGPUMachineFunction.h:118

llvm::AMDGPUPseudoSourceValue
Definition: SIMachineFunctionInfo.h:38

llvm::AMDGPUPseudoSourceValue::isConstant
bool isConstant(const MachineFrameInfo *) const override
Test whether the memory pointed to by this PseudoSourceValue has a constant value.
Definition: SIMachineFunctionInfo.h:50

llvm::AMDGPUPseudoSourceValue::AMDGPUPseudoSourceValue
AMDGPUPseudoSourceValue(unsigned Kind, const AMDGPUTargetMachine &TM)
Definition: SIMachineFunctionInfo.h:46

llvm::AMDGPUPseudoSourceValue::mayAlias
bool mayAlias(const MachineFrameInfo *) const override
Return true if the memory pointed to by this PseudoSourceValue can ever alias an LLVM IR Value.
Definition: SIMachineFunctionInfo.h:60

llvm::AMDGPUPseudoSourceValue::isAliased
bool isAliased(const MachineFrameInfo *) const override
Test whether the memory pointed to by this PseudoSourceValue may also be pointed to by an LLVM IR Val...
Definition: SIMachineFunctionInfo.h:56

llvm::AMDGPUPseudoSourceValue::AMDGPUPSVKind
AMDGPUPSVKind
Definition: SIMachineFunctionInfo.h:40

llvm::AMDGPUPseudoSourceValue::PSVImage
@ PSVImage
Definition: SIMachineFunctionInfo.h:41

llvm::AMDGPUPseudoSourceValue::GWSResource
@ GWSResource
Definition: SIMachineFunctionInfo.h:42

llvm::AMDGPUTargetMachine
Definition: AMDGPUTargetMachine.h:30

llvm::ArrayRef
ArrayRef - Represent a constant reference to an array (0 or more elements consecutively in memory),...
Definition: ArrayRef.h:41

llvm::BitVector
Definition: BitVector.h:82

llvm::BitVector::clear
void clear()
clear - Removes all bits from the bitvector.
Definition: BitVector.h:335

llvm::BumpPtrAllocatorImpl
Allocate memory in an ever growing pool, as if by bump-pointer.
Definition: Allocator.h:67

llvm::DenseMapBase::find
iterator find(const_arg_type_t< KeyT > Val)
Definition: DenseMap.h:177

llvm::DenseMapBase::end
iterator end()
Definition: DenseMap.h:87

llvm::DenseMap
Definition: DenseMap.h:730

llvm::Error
Lightweight error class with error context and mandatory checking.
Definition: Error.h:159

llvm::Function
Definition: Function.h:64

llvm::GCNSubtarget
Definition: GCNSubtarget.h:34

llvm::GCNTargetMachine
Definition: AMDGPUTargetMachine.h:81

llvm::GCNUserSGPRUsageInfo
Definition: GCNSubtarget.h:1837

llvm::IndexedMap
Definition: IndexedMap.h:31

llvm::IndexedMap::grow
void grow(IndexT n)
Definition: IndexedMap.h:69

llvm::IndexedMap::inBounds
bool inBounds(IndexT n) const
Definition: IndexedMap.h:75

llvm::MCRegister
Wrapper class representing physical registers. Should be passed by value.
Definition: MCRegister.h:33

llvm::MachineFrameInfo
The MachineFrameInfo class represents an abstract stack frame until prolog/epilog code is inserted.
Definition: MachineFrameInfo.h:108

llvm::MachineFunction
Definition: MachineFunction.h:286

llvm::MachineRegisterInfo::Delegate
Definition: MachineRegisterInfo.h:55

llvm::MapVector< Register, int >

llvm::PrologEpilogSGPRSaveRestoreInfo
Definition: SIMachineFunctionInfo.h:383

llvm::PrologEpilogSGPRSaveRestoreInfo::Index
int Index
Definition: SIMachineFunctionInfo.h:386

llvm::PrologEpilogSGPRSaveRestoreInfo::PrologEpilogSGPRSaveRestoreInfo
PrologEpilogSGPRSaveRestoreInfo(SGPRSaveKind K, Register R)
Definition: SIMachineFunctionInfo.h:392

llvm::PrologEpilogSGPRSaveRestoreInfo::PrologEpilogSGPRSaveRestoreInfo
PrologEpilogSGPRSaveRestoreInfo(SGPRSaveKind K, int I)
Definition: SIMachineFunctionInfo.h:391

llvm::PrologEpilogSGPRSaveRestoreInfo::getIndex
int getIndex() const
Definition: SIMachineFunctionInfo.h:395

llvm::PrologEpilogSGPRSaveRestoreInfo::getKind
SGPRSaveKind getKind() const
Definition: SIMachineFunctionInfo.h:396

llvm::PrologEpilogSGPRSaveRestoreInfo::Reg
Register Reg
Definition: SIMachineFunctionInfo.h:387

llvm::PrologEpilogSGPRSaveRestoreInfo::getReg
Register getReg() const
Definition: SIMachineFunctionInfo.h:394

llvm::PseudoSourceValue
Special value supplied for machine level alias analysis.
Definition: PseudoSourceValue.h:33

llvm::PseudoSourceValue::TargetCustom
@ TargetCustom
Definition: PseudoSourceValue.h:43

llvm::Register
Wrapper class representing virtual and physical registers.
Definition: Register.h:19

llvm::SIMachineFunctionInfo
This class keeps track of the SPI_SP_INPUT_ADDR config register, which tells the hardware which inter...
Definition: SIMachineFunctionInfo.h:412

llvm::SIMachineFunctionInfo::getNumWaveDispatchVGPRs
unsigned getNumWaveDispatchVGPRs() const
Definition: SIMachineFunctionInfo.h:1005

llvm::SIMachineFunctionInfo::hasNonSpillStackObjects
bool hasNonSpillStackObjects() const
Definition: SIMachineFunctionInfo.h:1074

llvm::SIMachineFunctionInfo::getPrologEpilogSGPRSpills
ArrayRef< PrologEpilogSGPRSpill > getPrologEpilogSGPRSpills() const
Definition: SIMachineFunctionInfo.h:686

llvm::SIMachineFunctionInfo::getWWMSpills
const WWMSpillsMap & getWWMSpills() const
Definition: SIMachineFunctionInfo.h:677

llvm::SIMachineFunctionInfo::isPSInputAllocated
bool isPSInputAllocated(unsigned Index) const
Definition: SIMachineFunctionInfo.h:1114

llvm::SIMachineFunctionInfo::getAllScratchSGPRCopyDstRegs
void getAllScratchSGPRCopyDstRegs(SmallVectorImpl< Register > &Regs) const
Definition: SIMachineFunctionInfo.h:730

llvm::SIMachineFunctionInfo::getAGPRSpillVGPRs
ArrayRef< MCPhysReg > getAGPRSpillVGPRs() const
Definition: SIMachineFunctionInfo.h:789

llvm::SIMachineFunctionInfo::setSGPRForEXECCopy
void setSGPRForEXECCopy(Register Reg)
Definition: SIMachineFunctionInfo.h:795

llvm::SIMachineFunctionInfo::initializeBaseYamlFields
bool initializeBaseYamlFields(const yaml::SIMachineFunctionInfo &YamlMFI, const MachineFunction &MF, PerFunctionMIParsingState &PFS, SMDiagnostic &Error, SMRange &SourceRange)
Definition: SIMachineFunctionInfo.cpp:770

llvm::SIMachineFunctionInfo::getOccupancy
unsigned getOccupancy() const
Definition: SIMachineFunctionInfo.h:1171

llvm::SIMachineFunctionInfo::getNumPreloadedSGPRs
unsigned getNumPreloadedSGPRs() const
Definition: SIMachineFunctionInfo.h:993

llvm::SIMachineFunctionInfo::shiftWwmVGPRsToLowestRange
void shiftWwmVGPRsToLowestRange(MachineFunction &MF, SmallVectorImpl< Register > &WWMVGPRs, BitVector &SavedVGPRs)
Definition: SIMachineFunctionInfo.cpp:356

llvm::SIMachineFunctionInfo::setWorkItemIDY
void setWorkItemIDY(ArgDescriptor Arg)
Definition: SIMachineFunctionInfo.h:906

llvm::SIMachineFunctionInfo::getNumSpilledVGPRs
unsigned getNumSpilledVGPRs() const
Definition: SIMachineFunctionInfo.h:1094

llvm::SIMachineFunctionInfo::hasLDSKernelId
bool hasLDSKernelId() const
Definition: SIMachineFunctionInfo.h:899

llvm::SIMachineFunctionInfo::increaseOccupancy
void increaseOccupancy(const MachineFunction &MF, unsigned Limit)
Definition: SIMachineFunctionInfo.h:1188

llvm::SIMachineFunctionInfo::getNumWaveDispatchSGPRs
unsigned getNumWaveDispatchSGPRs() const
Definition: SIMachineFunctionInfo.h:1001

llvm::SIMachineFunctionInfo::addPrivateSegmentSize
Register addPrivateSegmentSize(const SIRegisterInfo &TRI)
Definition: SIMachineFunctionInfo.cpp:258

llvm::SIMachineFunctionInfo::setWorkItemIDZ
void setWorkItemIDZ(ArgDescriptor Arg)
Definition: SIMachineFunctionInfo.h:910

llvm::SIMachineFunctionInfo::getWavesPerEU
std::pair< unsigned, unsigned > getWavesPerEU() const
Definition: SIMachineFunctionInfo.h:1152

llvm::SIMachineFunctionInfo::setMaskForVGPRBlockOps
void setMaskForVGPRBlockOps(Register RegisterBlock, uint32_t Mask)
Definition: SIMachineFunctionInfo.h:627

llvm::SIMachineFunctionInfo::getMaxNumWorkGroupsZ
unsigned getMaxNumWorkGroupsZ() const
Definition: SIMachineFunctionInfo.h:1209

llvm::SIMachineFunctionInfo::getVGPRToAGPRSpill
MCPhysReg getVGPRToAGPRSpill(int FrameIndex, unsigned Lane) const
Definition: SIMachineFunctionInfo.h:801

llvm::SIMachineFunctionInfo::getNumSpilledSGPRs
unsigned getNumSpilledSGPRs() const
Definition: SIMachineFunctionInfo.h:1090

llvm::SIMachineFunctionInfo::getUserSGPRInfo
GCNUserSGPRUsageInfo & getUserSGPRInfo()
Definition: SIMachineFunctionInfo.h:691

llvm::SIMachineFunctionInfo::allocateWWMSpill
void allocateWWMSpill(MachineFunction &MF, Register VGPR, uint64_t Size=4, Align Alignment=Align(4))
Definition: SIMachineFunctionInfo.cpp:308

llvm::SIMachineFunctionInfo::addDispatchPtr
Register addDispatchPtr(const SIRegisterInfo &TRI)
Definition: SIMachineFunctionInfo.cpp:222

llvm::SIMachineFunctionInfo::getLongBranchReservedReg
Register getLongBranchReservedReg() const
Definition: SIMachineFunctionInfo.h:1048

llvm::SIMachineFunctionInfo::getDynamicVGPRBlockSize
unsigned getDynamicVGPRBlockSize() const
Definition: SIMachineFunctionInfo.h:841

llvm::SIMachineFunctionInfo::hasSpilledVGPRs
bool hasSpilledVGPRs() const
Definition: SIMachineFunctionInfo.h:1066

llvm::SIMachineFunctionInfo::setFlag
void setFlag(Register Reg, uint8_t Flag)
Definition: SIMachineFunctionInfo.h:766

llvm::SIMachineFunctionInfo::setVGPRToAGPRSpillDead
void setVGPRToAGPRSpillDead(int FrameIndex)
Definition: SIMachineFunctionInfo.h:807

llvm::SIMachineFunctionInfo::getMaxFlatWorkGroupSize
unsigned getMaxFlatWorkGroupSize() const
Definition: SIMachineFunctionInfo.h:1146

llvm::SIMachineFunctionInfo::isWholeWaveFunction
bool isWholeWaveFunction() const
Definition: SIMachineFunctionInfo.h:684

llvm::SIMachineFunctionInfo::getFlatWorkGroupSizes
std::pair< unsigned, unsigned > getFlatWorkGroupSizes() const
Definition: SIMachineFunctionInfo.h:1136

llvm::SIMachineFunctionInfo::getStackPtrOffsetReg
Register getStackPtrOffsetReg() const
Definition: SIMachineFunctionInfo.h:1044

llvm::SIMachineFunctionInfo::isStackRealigned
bool isStackRealigned() const
Definition: SIMachineFunctionInfo.h:1082

llvm::SIMachineFunctionInfo::addFlatScratchInit
Register addFlatScratchInit(const SIRegisterInfo &TRI)
Definition: SIMachineFunctionInfo.cpp:251

llvm::SIMachineFunctionInfo::getScratchRSrcReg
Register getScratchRSrcReg() const
Returns the physical register reserved for use as the resource descriptor for scratch accesses.
Definition: SIMachineFunctionInfo.h:1015

llvm::SIMachineFunctionInfo::returnsVoid
bool returnsVoid() const
Definition: SIMachineFunctionInfo.h:1126

llvm::SIMachineFunctionInfo::getMaxWavesPerEU
unsigned getMaxWavesPerEU() const
Definition: SIMachineFunctionInfo.h:1162

llvm::SIMachineFunctionInfo::setStackPtrOffsetReg
void setStackPtrOffsetReg(Register Reg)
Definition: SIMachineFunctionInfo.h:1033

llvm::SIMachineFunctionInfo::addReservedUserSGPR
Register addReservedUserSGPR()
Increment user SGPRs used for padding the argument list only.
Definition: SIMachineFunctionInfo.h:868

llvm::SIMachineFunctionInfo::getVGPRSpillAGPRs
ArrayRef< MCPhysReg > getVGPRSpillAGPRs() const
Definition: SIMachineFunctionInfo.h:797

llvm::SIMachineFunctionInfo::getSGPRSpillPhysVGPRs
ArrayRef< Register > getSGPRSpillPhysVGPRs() const
Definition: SIMachineFunctionInfo.h:675

llvm::SIMachineFunctionInfo::getScavengeFI
int getScavengeFI(MachineFrameInfo &MFI, const SIRegisterInfo &TRI)
Definition: SIMachineFunctionInfo.cpp:606

llvm::SIMachineFunctionInfo::addQueuePtr
Register addQueuePtr(const SIRegisterInfo &TRI)
Definition: SIMachineFunctionInfo.cpp:229

llvm::SIMachineFunctionInfo::hasWorkGroupIDZ
bool hasWorkGroupIDZ() const
Definition: SIMachineFunctionInfo.h:933

llvm::SIMachineFunctionInfo::getQueuePtrUserSGPR
Register getQueuePtrUserSGPR() const
Definition: SIMachineFunctionInfo.h:1050

llvm::SIMachineFunctionInfo::getSGPRSpillToVirtualVGPRLanes
ArrayRef< SIRegisterInfo::SpilledReg > getSGPRSpillToVirtualVGPRLanes(int FrameIndex) const
Definition: SIMachineFunctionInfo.h:667

llvm::SIMachineFunctionInfo::getMaskForVGPRBlockOps
uint32_t getMaskForVGPRBlockOps(Register RegisterBlock) const
Definition: SIMachineFunctionInfo.h:632

llvm::SIMachineFunctionInfo::getMaxMemoryClusterDWords
unsigned getMaxMemoryClusterDWords() const
Definition: SIMachineFunctionInfo.h:1194

llvm::SIMachineFunctionInfo::SIMachineFunctionInfo
SIMachineFunctionInfo(const SIMachineFunctionInfo &MFI)=default

llvm::SIMachineFunctionInfo::hasMaskForVGPRBlockOps
bool hasMaskForVGPRBlockOps(Register RegisterBlock) const
Definition: SIMachineFunctionInfo.h:636

llvm::SIMachineFunctionInfo::getMaxNumWorkGroups
SmallVector< unsigned > getMaxNumWorkGroups() const
Definition: SIMachineFunctionInfo.h:1205

llvm::SIMachineFunctionInfo::clearNonWWMRegAllocMask
void clearNonWWMRegAllocMask()
Definition: SIMachineFunctionInfo.h:662

llvm::SIMachineFunctionInfo::hasPrologEpilogSGPRSpillEntry
bool hasPrologEpilogSGPRSpillEntry(Register Reg) const
Definition: SIMachineFunctionInfo.h:710

llvm::SIMachineFunctionInfo::getGITPtrLoReg
Register getGITPtrLoReg(const MachineFunction &MF) const
Definition: SIMachineFunctionInfo.cpp:637

llvm::SIMachineFunctionInfo::hasWorkGroupIDY
bool hasWorkGroupIDY() const
Definition: SIMachineFunctionInfo.h:929

llvm::SIMachineFunctionInfo::setVGPRForAGPRCopy
void setVGPRForAGPRCopy(Register NewVGPRForAGPRCopy)
Definition: SIMachineFunctionInfo.h:621

llvm::SIMachineFunctionInfo::allocateVGPRSpillToAGPR
bool allocateVGPRSpillToAGPR(MachineFunction &MF, int FI, bool isAGPRtoVGPR)
Reserve AGPRs or VGPRs to support spilling for FrameIndex FI.
Definition: SIMachineFunctionInfo.cpp:495

llvm::SIMachineFunctionInfo::addWorkGroupIDY
Register addWorkGroupIDY()
Definition: SIMachineFunctionInfo.h:881

llvm::SIMachineFunctionInfo::splitWWMSpillRegisters
void splitWWMSpillRegisters(MachineFunction &MF, SmallVectorImpl< std::pair< Register, int > > &CalleeSavedRegs, SmallVectorImpl< std::pair< Register, int > > &ScratchRegs) const
Definition: SIMachineFunctionInfo.cpp:333

llvm::SIMachineFunctionInfo::setBytesInStackArgArea
void setBytesInStackArgArea(unsigned Bytes)
Definition: SIMachineFunctionInfo.h:836

llvm::SIMachineFunctionInfo::setNumWaveDispatchSGPRs
void setNumWaveDispatchSGPRs(unsigned Count)
Definition: SIMachineFunctionInfo.h:1003

llvm::SIMachineFunctionInfo::getMode
SIModeRegisterDefaults getMode() const
Definition: SIMachineFunctionInfo.h:664

llvm::SIMachineFunctionInfo::getSGPRForEXECCopy
Register getSGPRForEXECCopy() const
Definition: SIMachineFunctionInfo.h:793

llvm::SIMachineFunctionInfo::setFrameOffsetReg
void setFrameOffsetReg(Register Reg)
Definition: SIMachineFunctionInfo.h:1028

llvm::SIMachineFunctionInfo::isWWMReservedRegister
bool isWWMReservedRegister(Register Reg) const
Definition: SIMachineFunctionInfo.h:680

llvm::SIMachineFunctionInfo::getSGPRSpillToPhysicalVGPRLanes
ArrayRef< SIRegisterInfo::SpilledReg > getSGPRSpillToPhysicalVGPRLanes(int FrameIndex) const
Definition: SIMachineFunctionInfo.h:759

llvm::SIMachineFunctionInfo::addPrivateSegmentWaveByteOffset
Register addPrivateSegmentWaveByteOffset()
Definition: SIMachineFunctionInfo.h:914

llvm::SIMachineFunctionInfo::getPreloadedValue
std::tuple< const ArgDescriptor *, const TargetRegisterClass *, LLT > getPreloadedValue(AMDGPUFunctionArgInfo::PreloadedValue Value) const
Definition: SIMachineFunctionInfo.h:970

llvm::SIMachineFunctionInfo::hasWorkGroupInfo
bool hasWorkGroupInfo() const
Definition: SIMachineFunctionInfo.h:937

llvm::SIMachineFunctionInfo::mayUseAGPRs
bool mayUseAGPRs(const Function &F) const
Definition: SIMachineFunctionInfo.cpp:815

llvm::SIMachineFunctionInfo::isCalleeSavedReg
bool isCalleeSavedReg(const MCPhysReg *CSRegs, MCPhysReg Reg) const
Definition: SIMachineFunctionInfo.cpp:346

llvm::SIMachineFunctionInfo::hasWorkItemIDY
bool hasWorkItemIDY() const
Definition: SIMachineFunctionInfo.h:949

llvm::SIMachineFunctionInfo::getMinFlatWorkGroupSize
unsigned getMinFlatWorkGroupSize() const
Definition: SIMachineFunctionInfo.h:1141

llvm::SIMachineFunctionInfo::addLDSKernelId
Register addLDSKernelId()
Definition: SIMachineFunctionInfo.cpp:271

llvm::SIMachineFunctionInfo::getVGPRForAGPRCopy
Register getVGPRForAGPRCopy() const
Definition: SIMachineFunctionInfo.h:617

llvm::SIMachineFunctionInfo::getUserSGPRInfo
const GCNUserSGPRUsageInfo & getUserSGPRInfo() const
Definition: SIMachineFunctionInfo.h:693

llvm::SIMachineFunctionInfo::allocateSGPRSpillToVGPRLane
bool allocateSGPRSpillToVGPRLane(MachineFunction &MF, int FI, bool SpillToPhysVGPRLane=false, bool IsPrologEpilog=false)
Definition: SIMachineFunctionInfo.cpp:448

llvm::SIMachineFunctionInfo::setPrivateSegmentWaveByteOffset
void setPrivateSegmentWaveByteOffset(Register Reg)
Definition: SIMachineFunctionInfo.h:921

llvm::SIMachineFunctionInfo::getMinWavesPerEU
unsigned getMinWavesPerEU() const
Definition: SIMachineFunctionInfo.h:1157

llvm::SIMachineFunctionInfo::getFrameOffsetReg
Register getFrameOffsetReg() const
Definition: SIMachineFunctionInfo.h:1024

llvm::SIMachineFunctionInfo::setLongBranchReservedReg
void setLongBranchReservedReg(Register Reg)
Definition: SIMachineFunctionInfo.h:1038

llvm::SIMachineFunctionInfo::hasWorkGroupIDX
bool hasWorkGroupIDX() const
Definition: SIMachineFunctionInfo.h:925

llvm::SIMachineFunctionInfo::getArgInfo
const AMDGPUFunctionArgInfo & getArgInfo() const
Definition: SIMachineFunctionInfo.h:965

llvm::SIMachineFunctionInfo::getMaxNumWorkGroupsX
unsigned getMaxNumWorkGroupsX() const
Definition: SIMachineFunctionInfo.h:1207

llvm::SIMachineFunctionInfo::getBytesInStackArgArea
unsigned getBytesInStackArgArea() const
Definition: SIMachineFunctionInfo.h:832

llvm::SIMachineFunctionInfo::addKernargSegmentPtr
Register addKernargSegmentPtr(const SIRegisterInfo &TRI)
Definition: SIMachineFunctionInfo.cpp:236

llvm::SIMachineFunctionInfo::addDispatchID
Register addDispatchID(const SIRegisterInfo &TRI)
Definition: SIMachineFunctionInfo.cpp:244

llvm::SIMachineFunctionInfo::setHasSpilledVGPRs
void setHasSpilledVGPRs(bool Spill=true)
Definition: SIMachineFunctionInfo.h:1070

llvm::SIMachineFunctionInfo::setIfReturnsVoid
void setIfReturnsVoid(bool Value)
Definition: SIMachineFunctionInfo.h:1130

llvm::SIMachineFunctionInfo::limitOccupancy
void limitOccupancy(unsigned Limit)
Definition: SIMachineFunctionInfo.h:1183

llvm::SIMachineFunctionInfo::removeDeadFrameIndices
bool removeDeadFrameIndices(MachineFrameInfo &MFI, bool ResetSGPRSpillStackIDs)
If ResetSGPRSpillStackIDs is true, reset the stack ID from sgpr-spill to the default stack.
Definition: SIMachineFunctionInfo.cpp:561

llvm::SIMachineFunctionInfo::setScratchReservedForDynamicVGPRs
void setScratchReservedForDynamicVGPRs(unsigned SizeInBytes)
Definition: SIMachineFunctionInfo.h:848

llvm::SIMachineFunctionInfo::getNonWWMRegMask
BitVector getNonWWMRegMask() const
Definition: SIMachineFunctionInfo.h:661

llvm::SIMachineFunctionInfo::markPSInputAllocated
void markPSInputAllocated(unsigned Index)
Definition: SIMachineFunctionInfo.h:1118

llvm::SIMachineFunctionInfo::setWorkItemIDX
void setWorkItemIDX(ArgDescriptor Arg)
Definition: SIMachineFunctionInfo.h:902

llvm::SIMachineFunctionInfo::isWWMReg
bool isWWMReg(Register Reg) const
Definition: SIMachineFunctionInfo.h:655

llvm::SIMachineFunctionInfo::clone
MachineFunctionInfo * clone(BumpPtrAllocator &Allocator, MachineFunction &DestMF, const DenseMap< MachineBasicBlock *, MachineBasicBlock * > &Src2DstMBB) const override
Make a functionally equivalent copy of this MachineFunctionInfo in MF.
Definition: SIMachineFunctionInfo.cpp:200

llvm::SIMachineFunctionInfo::hasVRegFlags
bool hasVRegFlags()
Definition: SIMachineFunctionInfo.h:779

llvm::SIMachineFunctionInfo::checkFlag
bool checkFlag(Register Reg, uint8_t Flag) const
Definition: SIMachineFunctionInfo.h:772

llvm::SIMachineFunctionInfo::setNumWaveDispatchVGPRs
void setNumWaveDispatchVGPRs(unsigned Count)
Definition: SIMachineFunctionInfo.h:1007

llvm::SIMachineFunctionInfo::markPSInputEnabled
void markPSInputEnabled(unsigned Index)
Definition: SIMachineFunctionInfo.h:1122

llvm::SIMachineFunctionInfo::addToSpilledVGPRs
void addToSpilledVGPRs(unsigned num)
Definition: SIMachineFunctionInfo.h:1102

llvm::SIMachineFunctionInfo::getPreloadedReg
MCRegister getPreloadedReg(AMDGPUFunctionArgInfo::PreloadedValue Value) const
Definition: SIMachineFunctionInfo.h:974

llvm::SIMachineFunctionInfo::get32BitAddressHighBits
uint32_t get32BitAddressHighBits() const
Definition: SIMachineFunctionInfo.h:985

llvm::SIMachineFunctionInfo::getMinAllowedOccupancy
unsigned getMinAllowedOccupancy() const
Definition: SIMachineFunctionInfo.h:1175

llvm::SIMachineFunctionInfo::setHasSpilledSGPRs
void setHasSpilledSGPRs(bool Spill=true)
Definition: SIMachineFunctionInfo.h:1062

llvm::SIMachineFunctionInfo::checkIndexInPrologEpilogSGPRSpills
bool checkIndexInPrologEpilogSGPRSpills(int FI) const
Definition: SIMachineFunctionInfo.h:738

llvm::SIMachineFunctionInfo::updateNonWWMRegMask
void updateNonWWMRegMask(BitVector &RegMask)
Definition: SIMachineFunctionInfo.h:660

llvm::SIMachineFunctionInfo::getNumKernargPreloadedSGPRs
unsigned getNumKernargPreloadedSGPRs() const
Definition: SIMachineFunctionInfo.h:997

llvm::SIMachineFunctionInfo::addPrivateSegmentBuffer
Register addPrivateSegmentBuffer(const SIRegisterInfo &TRI)
Definition: SIMachineFunctionInfo.cpp:213

llvm::SIMachineFunctionInfo::hasWorkItemIDX
bool hasWorkItemIDX() const
Definition: SIMachineFunctionInfo.h:945

llvm::SIMachineFunctionInfo::getNumUserSGPRs
unsigned getNumUserSGPRs() const
Definition: SIMachineFunctionInfo.h:989

llvm::SIMachineFunctionInfo::getScratchReservedForDynamicVGPRs
unsigned getScratchReservedForDynamicVGPRs() const
Definition: SIMachineFunctionInfo.h:844

llvm::SIMachineFunctionInfo::getWWMReservedRegs
const ReservedRegSet & getWWMReservedRegs() const
Definition: SIMachineFunctionInfo.h:678

llvm::SIMachineFunctionInfo::getImplicitBufferPtrUserSGPR
Register getImplicitBufferPtrUserSGPR() const
Definition: SIMachineFunctionInfo.h:1054

llvm::SIMachineFunctionInfo::getOptionalScavengeFI
std::optional< int > getOptionalScavengeFI() const
Definition: SIMachineFunctionInfo.h:830

llvm::SIMachineFunctionInfo::addImplicitBufferPtr
Register addImplicitBufferPtr(const SIRegisterInfo &TRI)
Definition: SIMachineFunctionInfo.cpp:264

llvm::SIMachineFunctionInfo::getArgInfo
AMDGPUFunctionArgInfo & getArgInfo()
Definition: SIMachineFunctionInfo.h:961

llvm::SIMachineFunctionInfo::getPrologEpilogSGPRSaveRestoreInfo
const PrologEpilogSGPRSaveRestoreInfo & getPrologEpilogSGPRSaveRestoreInfo(Register Reg) const
Definition: SIMachineFunctionInfo.h:749

llvm::SIMachineFunctionInfo::isDynamicVGPREnabled
bool isDynamicVGPREnabled() const
Definition: SIMachineFunctionInfo.h:840

llvm::SIMachineFunctionInfo::setHasNonSpillStackObjects
void setHasNonSpillStackObjects(bool StackObject=true)
Definition: SIMachineFunctionInfo.h:1078

llvm::SIMachineFunctionInfo::setIsStackRealigned
void setIsStackRealigned(bool Realigned=true)
Definition: SIMachineFunctionInfo.h:1086

llvm::SIMachineFunctionInfo::getGITPtrHigh
unsigned getGITPtrHigh() const
Definition: SIMachineFunctionInfo.h:979

llvm::SIMachineFunctionInfo::limitOccupancy
void limitOccupancy(const MachineFunction &MF)
Definition: SIMachineFunctionInfo.cpp:207

llvm::SIMachineFunctionInfo::hasSpilledSGPRs
bool hasSpilledSGPRs() const
Definition: SIMachineFunctionInfo.h:1058

llvm::SIMachineFunctionInfo::getSGPRSpillVGPRs
ArrayRef< Register > getSGPRSpillVGPRs() const
Definition: SIMachineFunctionInfo.h:674

llvm::SIMachineFunctionInfo::getPSInputAddr
unsigned getPSInputAddr() const
Definition: SIMachineFunctionInfo.h:1106

llvm::SIMachineFunctionInfo::addPreloadedKernArg
SmallVectorImpl< MCRegister > * addPreloadedKernArg(const SIRegisterInfo &TRI, const TargetRegisterClass *RC, unsigned AllocSizeDWord, int KernArgIdx, int PaddingSGPRs)
Definition: SIMachineFunctionInfo.cpp:277

llvm::SIMachineFunctionInfo::addToPrologEpilogSGPRSpills
void addToPrologEpilogSGPRSpills(Register Reg, PrologEpilogSGPRSaveRestoreInfo SI)
Definition: SIMachineFunctionInfo.h:695

llvm::SIMachineFunctionInfo::getScratchSGPRCopyDstReg
Register getScratchSGPRCopyDstReg(Register Reg) const
Definition: SIMachineFunctionInfo.h:718

llvm::SIMachineFunctionInfo::getPrivateSegmentWaveByteOffsetSystemSGPR
Register getPrivateSegmentWaveByteOffsetSystemSGPR() const
Definition: SIMachineFunctionInfo.h:1009

llvm::SIMachineFunctionInfo::hasImplicitArgPtr
bool hasImplicitArgPtr() const
Definition: SIMachineFunctionInfo.h:957

llvm::SIMachineFunctionInfo::addWorkGroupIDZ
Register addWorkGroupIDZ()
Definition: SIMachineFunctionInfo.h:887

llvm::SIMachineFunctionInfo::mayNeedAGPRs
bool mayNeedAGPRs() const
Definition: SIMachineFunctionInfo.h:1196

llvm::SIMachineFunctionInfo::addWorkGroupInfo
Register addWorkGroupInfo()
Definition: SIMachineFunctionInfo.h:893

llvm::SIMachineFunctionInfo::hasWorkItemIDZ
bool hasWorkItemIDZ() const
Definition: SIMachineFunctionInfo.h:953

llvm::SIMachineFunctionInfo::getMaxNumWorkGroupsY
unsigned getMaxNumWorkGroupsY() const
Definition: SIMachineFunctionInfo.h:1208

llvm::SIMachineFunctionInfo::getPSInputEnable
unsigned getPSInputEnable() const
Definition: SIMachineFunctionInfo.h:1110

llvm::SIMachineFunctionInfo::setScratchRSrcReg
void setScratchRSrcReg(Register Reg)
Definition: SIMachineFunctionInfo.h:1019

llvm::SIMachineFunctionInfo::addToSpilledSGPRs
void addToSpilledSGPRs(unsigned num)
Definition: SIMachineFunctionInfo.h:1098

llvm::SIMachineFunctionInfo::getGWSPSV
const AMDGPUGWSResourcePseudoSourceValue * getGWSPSV(const AMDGPUTargetMachine &TM)
Definition: SIMachineFunctionInfo.h:1167

llvm::SIMachineFunctionInfo::reserveWWMRegister
void reserveWWMRegister(Register Reg)
Definition: SIMachineFunctionInfo.h:654

llvm::SIMachineFunctionInfo::hasPrivateSegmentWaveByteOffset
bool hasPrivateSegmentWaveByteOffset() const
Definition: SIMachineFunctionInfo.h:941

llvm::SIMachineFunctionInfo::addWorkGroupIDX
Register addWorkGroupIDX()
Definition: SIMachineFunctionInfo.h:875

llvm::SIRegisterInfo
Definition: SIRegisterInfo.h:40

llvm::SMDiagnostic
Instances of this class encapsulate one diagnostic report, allowing printing to a raw_ostream as a caret diagnostic.
Definition: SourceMgr.h:282

llvm::SMRange
Represents a range in source code.
Definition: SMLoc.h:48

llvm::SetVector::insert
bool insert(const value_type &X)
Insert a new element into the SetVector.
Definition: SetVector.h:168

llvm::SetVector::contains
bool contains(const key_type &key) const
Check if the SetVector contains the given key.
Definition: SetVector.h:269

llvm::SmallSetVector< Register, 8 >

llvm::SmallVectorImpl
This class consists of common code factored out of the SmallVector class to reduce code duplication based on the SmallVector 'N' template parameter.
Definition: SmallVector.h:574

llvm::SmallVectorImpl::insert
iterator insert(iterator I, T &&Elt)
Definition: SmallVector.h:806

llvm::SmallVectorTemplateBase::push_back
void push_back(const T &Elt)
Definition: SmallVector.h:414

llvm::SmallVectorTemplateCommon::end
iterator end()
Definition: SmallVector.h:270

llvm::SmallVector
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
Definition: SmallVector.h:1197

llvm::StackOffset
StackOffset holds a fixed and a scalable offset in bytes.
Definition: TypeSize.h:34

llvm::TargetRegisterClass
Definition: TargetRegisterInfo.h:45

llvm::TargetRegisterInfo
TargetRegisterInfo base class - We assume that the target defines a static array of TargetRegisterDesc objects that represent all of the machine registers that the target has.
Definition: TargetRegisterInfo.h:237

llvm::Value
LLVM Value Representation.
Definition: Value.h:75

llvm::raw_ostream
This class implements an extremely fast bulk output stream that can only output to a stream.
Definition: raw_ostream.h:53

uint16_t

uint32_t

uint64_t

uint8_t

false
Definition: MachinePipeliner.cpp:239

llvm::AMDGPU::VirtRegFlag::WWM_REG
@ WWM_REG
Definition: SIDefines.h:1088

llvm
This is an optimization pass for GlobalISel generic memory operations.
Definition: AddressRanges.h:18

llvm::MCPhysReg
uint16_t MCPhysReg
An unsigned integer type large enough to represent all physical registers, but not necessarily virtual registers.
Definition: MCRegister.h:21

llvm::SGPRSaveKind
SGPRSaveKind
Definition: SIMachineFunctionInfo.h:377

llvm::SGPRSaveKind::SPILL_TO_MEM
@ SPILL_TO_MEM

llvm::SGPRSaveKind::SPILL_TO_VGPR_LANE
@ SPILL_TO_VGPR_LANE

llvm::SGPRSaveKind::COPY_TO_SCRATCH_SGPR
@ COPY_TO_SCRATCH_SGPR

llvm::upper_bound
auto upper_bound(R &&Range, T &&Value)
Provide wrappers to std::upper_bound which take ranges instead of having to pass begin/end explicitly.
Definition: STLExtras.h:2026

llvm::is_sorted
bool is_sorted(R &&Range, Compare C)
Wrapper function around std::is_sorted to check if elements in a range R are sorted with respect to a comparator C.
Definition: STLExtras.h:1939

llvm::IRMemLocation::Other
@ Other
Any other memory.

llvm::DefaultMemoryClusterDWordsLimit
constexpr unsigned DefaultMemoryClusterDWordsLimit
Definition: SIInstrInfo.h:40

llvm::find_if
auto find_if(R &&Range, UnaryPredicate P)
Provide wrappers to std::find_if which take ranges instead of having to pass begin/end explicitly.
Definition: STLExtras.h:1777

llvm::is_contained
bool is_contained(R &&Range, const E &Element)
Returns true if Element is found in Range.
Definition: STLExtras.h:1916

true
Definition: SPIRVConvergenceRegionAnalysis.cpp:40

raw_ostream.h

llvm::AMDGPUFunctionArgInfo
Definition: AMDGPUArgumentUsageInfo.h:103

llvm::AMDGPUFunctionArgInfo::PreloadedValue
PreloadedValue
Definition: AMDGPUArgumentUsageInfo.h:105

llvm::Align
This struct is a compact representation of a valid (non-zero power of two) alignment.
Definition: Alignment.h:39

llvm::ArgDescriptor
Definition: AMDGPUArgumentUsageInfo.h:25

llvm::ArgDescriptor::createRegister
static ArgDescriptor createRegister(Register Reg, unsigned Mask=~0u)
Definition: AMDGPUArgumentUsageInfo.h:46

llvm::ArgInfo
Helper struct shared between Function Specialization and SCCP Solver.
Definition: SCCPSolver.h:42

llvm::DenormalMode::PreserveSign
@ PreserveSign
The sign of a flushed-to-zero number is preserved in the sign of 0.
Definition: FloatingPointMode.h:81

llvm::MachineFunctionInfo
MachineFunctionInfo - This class can be derived from and used by targets to hold private target-specific information for each MachineFunction.
Definition: MachineFunction.h:104

llvm::PerFunctionMIParsingState
Definition: MIParser.h:165

llvm::SIMachineFunctionInfo::VGPRSpillToAGPR
Definition: SIMachineFunctionInfo.h:537

llvm::SIMachineFunctionInfo::VGPRSpillToAGPR::IsDead
bool IsDead
Definition: SIMachineFunctionInfo.h:540

llvm::SIMachineFunctionInfo::VGPRSpillToAGPR::FullyAllocated
bool FullyAllocated
Definition: SIMachineFunctionInfo.h:539

llvm::SIMachineFunctionInfo::VGPRSpillToAGPR::Lanes
SmallVector< MCPhysReg, 32 > Lanes
Definition: SIMachineFunctionInfo.h:538

llvm::SIModeRegisterDefaults
Definition: SIModeRegisterDefaults.h:20

llvm::VGPRBlock2IndexFunctor
Definition: SIMachineFunctionInfo.h:399

llvm::VGPRBlock2IndexFunctor::operator()
unsigned operator()(Register Reg) const
Definition: SIMachineFunctionInfo.h:401

llvm::less_first
Function object to check whether the first component of a container supported by std::get (like std::pair and std::tuple) compares less than the first component of another container.
Definition: STLExtras.h:1472

llvm::yaml::MachineFunctionInfo
Targets should override this in a way that mirrors the implementation of llvm::MachineFunctionInfo.
Definition: MIRYamlMapping.h:758

llvm::yaml::MappingTraits< SIArgumentInfo >::mapping
static void mapping(IO &YamlIO, SIArgumentInfo &AI)
Definition: SIMachineFunctionInfo.h:190

llvm::yaml::MappingTraits< SIArgument >::mapping
static void mapping(IO &YamlIO, SIArgument &A)
Definition: SIMachineFunctionInfo.h:144

llvm::yaml::MappingTraits< SIMachineFunctionInfo >::mapping
static void mapping(IO &YamlIO, SIMachineFunctionInfo &MFI)
Definition: SIMachineFunctionInfo.h:318

llvm::yaml::MappingTraits< SIMode >::mapping
static void mapping(IO &YamlIO, SIMode &Mode)
Definition: SIMachineFunctionInfo.h:250

llvm::yaml::MappingTraits
Definition: ModuleSummaryIndex.h:57

llvm::yaml::SIArgumentInfo
Definition: SIMachineFunctionInfo.h:165

llvm::yaml::SIArgumentInfo::PrivateSegmentWaveByteOffset
std::optional< SIArgument > PrivateSegmentWaveByteOffset
Definition: SIMachineFunctionInfo.h:179

llvm::yaml::SIArgumentInfo::WorkGroupIDY
std::optional< SIArgument > WorkGroupIDY
Definition: SIMachineFunctionInfo.h:175

llvm::yaml::SIArgumentInfo::FlatScratchInit
std::optional< SIArgument > FlatScratchInit
Definition: SIMachineFunctionInfo.h:171

llvm::yaml::SIArgumentInfo::DispatchPtr
std::optional< SIArgument > DispatchPtr
Definition: SIMachineFunctionInfo.h:167

llvm::yaml::SIArgumentInfo::DispatchID
std::optional< SIArgument > DispatchID
Definition: SIMachineFunctionInfo.h:170

llvm::yaml::SIArgumentInfo::WorkItemIDY
std::optional< SIArgument > WorkItemIDY
Definition: SIMachineFunctionInfo.h:185

llvm::yaml::SIArgumentInfo::WorkGroupIDX
std::optional< SIArgument > WorkGroupIDX
Definition: SIMachineFunctionInfo.h:174

llvm::yaml::SIArgumentInfo::ImplicitArgPtr
std::optional< SIArgument > ImplicitArgPtr
Definition: SIMachineFunctionInfo.h:181

llvm::yaml::SIArgumentInfo::QueuePtr
std::optional< SIArgument > QueuePtr
Definition: SIMachineFunctionInfo.h:168

llvm::yaml::SIArgumentInfo::WorkGroupInfo
std::optional< SIArgument > WorkGroupInfo
Definition: SIMachineFunctionInfo.h:177

llvm::yaml::SIArgumentInfo::LDSKernelId
std::optional< SIArgument > LDSKernelId
Definition: SIMachineFunctionInfo.h:178

llvm::yaml::SIArgumentInfo::ImplicitBufferPtr
std::optional< SIArgument > ImplicitBufferPtr
Definition: SIMachineFunctionInfo.h:182

llvm::yaml::SIArgumentInfo::WorkItemIDX
std::optional< SIArgument > WorkItemIDX
Definition: SIMachineFunctionInfo.h:184

llvm::yaml::SIArgumentInfo::KernargSegmentPtr
std::optional< SIArgument > KernargSegmentPtr
Definition: SIMachineFunctionInfo.h:169

llvm::yaml::SIArgumentInfo::WorkItemIDZ
std::optional< SIArgument > WorkItemIDZ
Definition: SIMachineFunctionInfo.h:186

llvm::yaml::SIArgumentInfo::PrivateSegmentSize
std::optional< SIArgument > PrivateSegmentSize
Definition: SIMachineFunctionInfo.h:172

llvm::yaml::SIArgumentInfo::PrivateSegmentBuffer
std::optional< SIArgument > PrivateSegmentBuffer
Definition: SIMachineFunctionInfo.h:166

llvm::yaml::SIArgumentInfo::WorkGroupIDZ
std::optional< SIArgument > WorkGroupIDZ
Definition: SIMachineFunctionInfo.h:176

llvm::yaml::SIArgument
Definition: SIMachineFunctionInfo.h:91

llvm::yaml::SIArgument::StackOffset
unsigned StackOffset
Definition: SIMachineFunctionInfo.h:95

llvm::yaml::SIArgument::Mask
std::optional< unsigned > Mask
Definition: SIMachineFunctionInfo.h:97

llvm::yaml::SIArgument::~SIArgument
~SIArgument()
Definition: SIMachineFunctionInfo.h:126

llvm::yaml::SIArgument::SIArgument
SIArgument()
Definition: SIMachineFunctionInfo.h:100

llvm::yaml::SIArgument::SIArgument
SIArgument(const SIArgument &Other)
Definition: SIMachineFunctionInfo.h:101

llvm::yaml::SIArgument::RegisterName
StringValue RegisterName
Definition: SIMachineFunctionInfo.h:94

llvm::yaml::SIArgument::operator=
SIArgument & operator=(const SIArgument &Other)
Definition: SIMachineFunctionInfo.h:109

llvm::yaml::SIArgument::createArgument
static SIArgument createArgument(bool IsReg)
Definition: SIMachineFunctionInfo.h:132

llvm::yaml::SIArgument::IsRegister
bool IsRegister
Definition: SIMachineFunctionInfo.h:92

llvm::yaml::SIMachineFunctionInfo
Definition: SIMachineFunctionInfo.h:260

llvm::yaml::SIMachineFunctionInfo::MaxMemoryClusterDWords
unsigned MaxMemoryClusterDWords
Definition: SIMachineFunctionInfo.h:294

llvm::yaml::SIMachineFunctionInfo::HasSpilledVGPRs
bool HasSpilledVGPRs
Definition: SIMachineFunctionInfo.h:272

llvm::yaml::SIMachineFunctionInfo::SGPRForEXECCopy
StringValue SGPRForEXECCopy
Definition: SIMachineFunctionInfo.h:299

llvm::yaml::SIMachineFunctionInfo::HasSpilledSGPRs
bool HasSpilledSGPRs
Definition: SIMachineFunctionInfo.h:271

llvm::yaml::SIMachineFunctionInfo::ReturnsVoid
bool ReturnsVoid
Definition: SIMachineFunctionInfo.h:288

llvm::yaml::SIMachineFunctionInfo::DynLDSAlign
Align DynLDSAlign
Definition: SIMachineFunctionInfo.h:265

llvm::yaml::SIMachineFunctionInfo::WWMReservedRegs
SmallVector< StringValue > WWMReservedRegs
Definition: SIMachineFunctionInfo.h:281

llvm::yaml::SIMachineFunctionInfo::HighBitsOf32BitAddress
uint32_t HighBitsOf32BitAddress
Definition: SIMachineFunctionInfo.h:275

llvm::yaml::SIMachineFunctionInfo::GDSSize
uint32_t GDSSize
Definition: SIMachineFunctionInfo.h:264

llvm::yaml::SIMachineFunctionInfo::MemoryBound
bool MemoryBound
Definition: SIMachineFunctionInfo.h:269

llvm::yaml::SIMachineFunctionInfo::Occupancy
unsigned Occupancy
Definition: SIMachineFunctionInfo.h:278

llvm::yaml::SIMachineFunctionInfo::PSInputEnable
unsigned PSInputEnable
Definition: SIMachineFunctionInfo.h:293

llvm::yaml::SIMachineFunctionInfo::MaxKernArgAlign
Align MaxKernArgAlign
Definition: SIMachineFunctionInfo.h:262

llvm::yaml::SIMachineFunctionInfo::SIMachineFunctionInfo
SIMachineFunctionInfo()=default

llvm::yaml::SIMachineFunctionInfo::FrameOffsetReg
StringValue FrameOffsetReg
Definition: SIMachineFunctionInfo.h:284

llvm::yaml::SIMachineFunctionInfo::LongBranchReservedReg
StringValue LongBranchReservedReg
Definition: SIMachineFunctionInfo.h:300

llvm::yaml::SIMachineFunctionInfo::ExplicitKernArgSize
uint64_t ExplicitKernArgSize
Definition: SIMachineFunctionInfo.h:261

llvm::yaml::SIMachineFunctionInfo::LDSSize
uint32_t LDSSize
Definition: SIMachineFunctionInfo.h:263

llvm::yaml::SIMachineFunctionInfo::WaveLimiter
bool WaveLimiter
Definition: SIMachineFunctionInfo.h:270

llvm::yaml::SIMachineFunctionInfo::PSInputAddr
unsigned PSInputAddr
Definition: SIMachineFunctionInfo.h:292

llvm::yaml::SIMachineFunctionInfo::IsWholeWaveFunction
bool IsWholeWaveFunction
Definition: SIMachineFunctionInfo.h:303

llvm::yaml::SIMachineFunctionInfo::NumWaveDispatchSGPRs
uint16_t NumWaveDispatchSGPRs
Definition: SIMachineFunctionInfo.h:273

llvm::yaml::SIMachineFunctionInfo::mappingImpl
void mappingImpl(yaml::IO &YamlIO) override
Definition: SIMachineFunctionInfo.cpp:766

llvm::yaml::SIMachineFunctionInfo::~SIMachineFunctionInfo
~SIMachineFunctionInfo()=default

llvm::yaml::SIMachineFunctionInfo::NoSignedZerosFPMath
bool NoSignedZerosFPMath
Definition: SIMachineFunctionInfo.h:268

llvm::yaml::SIMachineFunctionInfo::IsEntryFunction
bool IsEntryFunction
Definition: SIMachineFunctionInfo.h:266

llvm::yaml::SIMachineFunctionInfo::DynamicVGPRBlockSize
unsigned DynamicVGPRBlockSize
Definition: SIMachineFunctionInfo.h:305

llvm::yaml::SIMachineFunctionInfo::VGPRForAGPRCopy
StringValue VGPRForAGPRCopy
Definition: SIMachineFunctionInfo.h:298

llvm::yaml::SIMachineFunctionInfo::Mode
SIMode Mode
Definition: SIMachineFunctionInfo.h:296

llvm::yaml::SIMachineFunctionInfo::IsChainFunction
bool IsChainFunction
Definition: SIMachineFunctionInfo.h:267

llvm::yaml::SIMachineFunctionInfo::HasInitWholeWave
bool HasInitWholeWave
Definition: SIMachineFunctionInfo.h:302

llvm::yaml::SIMachineFunctionInfo::ArgInfo
std::optional< SIArgumentInfo > ArgInfo
Definition: SIMachineFunctionInfo.h:290

llvm::yaml::SIMachineFunctionInfo::SpillPhysVGPRS
SmallVector< StringValue, 2 > SpillPhysVGPRS
Definition: SIMachineFunctionInfo.h:280

llvm::yaml::SIMachineFunctionInfo::ScavengeFI
std::optional< FrameIndex > ScavengeFI
Definition: SIMachineFunctionInfo.h:297

llvm::yaml::SIMachineFunctionInfo::NumWaveDispatchVGPRs
uint16_t NumWaveDispatchVGPRs
Definition: SIMachineFunctionInfo.h:274

llvm::yaml::SIMachineFunctionInfo::BytesInStackArgArea
unsigned BytesInStackArgArea
Definition: SIMachineFunctionInfo.h:287

llvm::yaml::SIMachineFunctionInfo::ScratchReservedForDynamicVGPRs
unsigned ScratchReservedForDynamicVGPRs
Definition: SIMachineFunctionInfo.h:306

llvm::yaml::SIMachineFunctionInfo::ScratchRSrcReg
StringValue ScratchRSrcReg
Definition: SIMachineFunctionInfo.h:283

llvm::yaml::SIMachineFunctionInfo::StackPtrOffsetReg
StringValue StackPtrOffsetReg
Definition: SIMachineFunctionInfo.h:285

llvm::yaml::SIMode
Definition: SIMachineFunctionInfo.h:217

llvm::yaml::SIMode::IEEE
bool IEEE
Definition: SIMachineFunctionInfo.h:218

llvm::yaml::SIMode::SIMode
SIMode()=default

llvm::yaml::SIMode::SIMode
SIMode(const SIModeRegisterDefaults &Mode)
Definition: SIMachineFunctionInfo.h:227

llvm::yaml::SIMode::DX10Clamp
bool DX10Clamp
Definition: SIMachineFunctionInfo.h:219

llvm::yaml::SIMode::FP64FP16OutputDenormals
bool FP64FP16OutputDenormals
Definition: SIMachineFunctionInfo.h:223

llvm::yaml::SIMode::FP64FP16InputDenormals
bool FP64FP16InputDenormals
Definition: SIMachineFunctionInfo.h:222

llvm::yaml::SIMode::FP32OutputDenormals
bool FP32OutputDenormals
Definition: SIMachineFunctionInfo.h:221

llvm::yaml::SIMode::FP32InputDenormals
bool FP32InputDenormals
Definition: SIMachineFunctionInfo.h:220

llvm::yaml::StringValue
A wrapper around std::string which contains a source range that's being set during parsing.
Definition: MIRYamlMapping.h:34