LLVM: lib/Target/AMDGPU/AMDGPUISelLowering.h Source File

//===-- AMDGPUISelLowering.h - AMDGPU Lowering Interface --------*- C++ -*-===//

//

// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.

// See https://llvm.org/LICENSE.txt for license information.

// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception

//

//===----------------------------------------------------------------------===//

//

/// \file

/// Interface definition of the TargetLowering class that is common

/// to all AMD GPUs.

//

//===----------------------------------------------------------------------===//


#ifndef LLVM_LIB_TARGET_AMDGPU_AMDGPUISELLOWERING_H

#define LLVM_LIB_TARGET_AMDGPU_AMDGPUISELLOWERING_H


#include "llvm/CodeGen/CallingConvLower.h"

#include "llvm/CodeGen/TargetLowering.h"


namespace llvm {


class AMDGPUMachineFunction;

class AMDGPUSubtarget;

struct ArgDescriptor;


/// TargetLowering interface that is common to all AMD GPUs (see the file
/// header). It declares the custom lowering helpers, DAG combine helpers and
/// TargetLowering hook overrides shared by the AMDGPU targets.
///
/// PostISelFolding is declared pure virtual, so this class is abstract and
/// must be subclassed.
class AMDGPUTargetLowering : public TargetLowering {
private:
  const AMDGPUSubtarget *Subtarget;

  /// \returns AMDGPUISD::FFBH_U32 node if the incoming \p Op may have been
  /// legalized from a smaller type VT. Need to match pre-legalized type because
  /// the generic legalization inserts the add/sub between the select and
  /// compare.
  SDValue getFFBX_U32(SelectionDAG &DAG, SDValue Op, const SDLoc &DL, unsigned Opc) const;

public:
  /// \returns The minimum number of bits needed to store the value of \p Op as
  /// an unsigned integer. Truncating to this size and then zero-extending to
  /// the original size will not change the value.
  static unsigned numBitsUnsigned(SDValue Op, SelectionDAG &DAG);

  /// \returns The minimum number of bits needed to store the value of \p Op as
  /// a signed integer. Truncating to this size and then sign-extending to the
  /// original size will not change the value.
  static unsigned numBitsSigned(SDValue Op, SelectionDAG &DAG);

protected:
  SDValue LowerEXTRACT_SUBVECTOR(SDValue Op, SelectionDAG &DAG) const;
  SDValue LowerCONCAT_VECTORS(SDValue Op, SelectionDAG &DAG) const;
  // NOTE(review): The description below is orphaned -- no declaration in this
  // class matches it -- so it is kept as a plain comment to stop Doxygen from
  // attaching it to LowerFREM:
  //   Split a vector store into multiple scalar stores.
  //   \returns The resulting chain.

  SDValue LowerFREM(SDValue Op, SelectionDAG &DAG) const;
  SDValue LowerFCEIL(SDValue Op, SelectionDAG &DAG) const;
  SDValue LowerFTRUNC(SDValue Op, SelectionDAG &DAG) const;
  SDValue LowerFRINT(SDValue Op, SelectionDAG &DAG) const;
  SDValue LowerFNEARBYINT(SDValue Op, SelectionDAG &DAG) const;

  SDValue LowerFROUNDEVEN(SDValue Op, SelectionDAG &DAG) const;
  SDValue LowerFROUND(SDValue Op, SelectionDAG &DAG) const;
  SDValue LowerFFLOOR(SDValue Op, SelectionDAG &DAG) const;

  static bool allowApproxFunc(const SelectionDAG &DAG, SDNodeFlags Flags);
  static bool needsDenormHandlingF32(const SelectionDAG &DAG, SDValue Src,
                                     SDNodeFlags Flags);
  SDValue getIsLtSmallestNormal(SelectionDAG &DAG, SDValue Op,
                                SDNodeFlags Flags) const;
  SDValue getIsFinite(SelectionDAG &DAG, SDValue Op, SDNodeFlags Flags) const;
  // NOTE(review): SL is taken by value here, unlike the `const SDLoc &`
  // parameters used by the neighbouring helpers -- confirm whether that is
  // intentional before changing it (the definition must change in step).
  std::pair<SDValue, SDValue> getScaledLogInput(SelectionDAG &DAG,
                                                const SDLoc SL, SDValue Op,
                                                SDNodeFlags Flags) const;

  SDValue LowerFLOG2(SDValue Op, SelectionDAG &DAG) const;
  SDValue LowerFLOGCommon(SDValue Op, SelectionDAG &DAG) const;
  SDValue LowerFLOG10(SDValue Op, SelectionDAG &DAG) const;
  SDValue LowerFLOGUnsafe(SDValue Op, const SDLoc &SL, SelectionDAG &DAG,
                          bool IsLog10, SDNodeFlags Flags) const;
  SDValue lowerFEXP2(SDValue Op, SelectionDAG &DAG) const;

  SDValue lowerFEXPUnsafe(SDValue Op, const SDLoc &SL, SelectionDAG &DAG,
                          SDNodeFlags Flags) const;
  SDValue lowerFEXP10Unsafe(SDValue Op, const SDLoc &SL, SelectionDAG &DAG,
                            SDNodeFlags Flags) const;
  SDValue lowerFEXP(SDValue Op, SelectionDAG &DAG) const;

  SDValue lowerCTLZResults(SDValue Op, SelectionDAG &DAG) const;

  SDValue LowerCTLZ_CTTZ(SDValue Op, SelectionDAG &DAG) const;

  SDValue LowerINT_TO_FP32(SDValue Op, SelectionDAG &DAG, bool Signed) const;
  SDValue LowerINT_TO_FP64(SDValue Op, SelectionDAG &DAG, bool Signed) const;
  SDValue LowerUINT_TO_FP(SDValue Op, SelectionDAG &DAG) const;
  SDValue LowerSINT_TO_FP(SDValue Op, SelectionDAG &DAG) const;

  SDValue LowerFP_TO_INT64(SDValue Op, SelectionDAG &DAG, bool Signed) const;
  SDValue LowerFP_TO_FP16(SDValue Op, SelectionDAG &DAG) const;
  SDValue LowerFP_TO_INT(SDValue Op, SelectionDAG &DAG) const;

  SDValue LowerF64ToF16Safe(SDValue Src, const SDLoc &DL,
                            SelectionDAG &DAG) const;

  SDValue LowerSIGN_EXTEND_INREG(SDValue Op, SelectionDAG &DAG) const;

// NOTE(review): this access specifier repeats the `protected:` already in
// effect above; it has no effect on access and only separates the two groups.
protected:
  bool shouldCombineMemoryType(EVT VT) const;
  SDValue performLoadCombine(SDNode *N, DAGCombinerInfo &DCI) const;
  SDValue performStoreCombine(SDNode *N, DAGCombinerInfo &DCI) const;
  SDValue performAssertSZExtCombine(SDNode *N, DAGCombinerInfo &DCI) const;
  SDValue performIntrinsicWOChainCombine(SDNode *N, DAGCombinerInfo &DCI) const;

  SDValue splitBinaryBitConstantOpImpl(DAGCombinerInfo &DCI, const SDLoc &SL,
                                       unsigned Opc, SDValue LHS,
                                       uint32_t ValLo, uint32_t ValHi) const;
  SDValue performShlCombine(SDNode *N, DAGCombinerInfo &DCI) const;
  SDValue performSraCombine(SDNode *N, DAGCombinerInfo &DCI) const;
  SDValue performSrlCombine(SDNode *N, DAGCombinerInfo &DCI) const;
  SDValue performTruncateCombine(SDNode *N, DAGCombinerInfo &DCI) const;
  SDValue performMulCombine(SDNode *N, DAGCombinerInfo &DCI) const;
  SDValue performMulLoHiCombine(SDNode *N, DAGCombinerInfo &DCI) const;
  SDValue performMulhsCombine(SDNode *N, DAGCombinerInfo &DCI) const;
  SDValue performMulhuCombine(SDNode *N, DAGCombinerInfo &DCI) const;
  SDValue performCtlz_CttzCombine(const SDLoc &SL, SDValue Cond, SDValue LHS,
                             SDValue RHS, DAGCombinerInfo &DCI) const;

  SDValue foldFreeOpFromSelect(TargetLowering::DAGCombinerInfo &DCI,
                               SDValue N) const;
  SDValue performSelectCombine(SDNode *N, DAGCombinerInfo &DCI) const;

  TargetLowering::NegatibleCost
  getConstantNegateCost(const ConstantFPSDNode *C) const;

  bool isConstantCostlierToNegate(SDValue N) const;
  bool isConstantCheaperToNegate(SDValue N) const;
  SDValue performFNegCombine(SDNode *N, DAGCombinerInfo &DCI) const;
  SDValue performFAbsCombine(SDNode *N, DAGCombinerInfo &DCI) const;
  SDValue performRcpCombine(SDNode *N, DAGCombinerInfo &DCI) const;

  static EVT getEquivalentMemType(LLVMContext &Context, EVT VT);

  // Virtual (not an override of a TargetLowering hook in this declaration), so
  // derived lowering classes can replace it.
  virtual SDValue LowerGlobalAddress(AMDGPUMachineFunction *MFI, SDValue Op,
                                     SelectionDAG &DAG) const;

  /// Return 64-bit value Op as two 32-bit integers.
  std::pair<SDValue, SDValue> split64BitValue(SDValue Op,
                                              SelectionDAG &DAG) const;
  SDValue getLoHalf64(SDValue Op, SelectionDAG &DAG) const;
  SDValue getHiHalf64(SDValue Op, SelectionDAG &DAG) const;

  /// Split a vector type into two parts. The first part is a power of two
  /// vector. The second part is whatever is left over, and is a scalar if it
  /// would otherwise be a 1-vector.
  std::pair<EVT, EVT> getSplitDestVTs(const EVT &VT, SelectionDAG &DAG) const;

  /// Split a vector value into two parts of types \p LoVT and \p HighVT.
  /// \p HighVT could be scalar.
  std::pair<SDValue, SDValue> splitVector(const SDValue &N, const SDLoc &DL,
                                          const EVT &LoVT, const EVT &HighVT,
                                          SelectionDAG &DAG) const;

  /// Split a vector load into 2 loads of half the vector.
  SDValue SplitVectorLoad(SDValue Op, SelectionDAG &DAG) const;

  /// Widen a suitably aligned v3 load. For all other cases, split the input
  /// vector load.
  SDValue WidenOrSplitVectorLoad(SDValue Op, SelectionDAG &DAG) const;

  /// Split a vector store into 2 stores of half the vector.
  SDValue SplitVectorStore(SDValue Op, SelectionDAG &DAG) const;

  SDValue LowerSTORE(SDValue Op, SelectionDAG &DAG) const;
  SDValue LowerSDIVREM(SDValue Op, SelectionDAG &DAG) const;
  SDValue LowerUDIVREM(SDValue Op, SelectionDAG &DAG) const;
  SDValue LowerDIVREM24(SDValue Op, SelectionDAG &DAG, bool sign) const;
  // Unlike the other Lower* helpers this one returns nothing; its output is
  // delivered through the \p Results vector.
  void LowerUDIVREM64(SDValue Op, SelectionDAG &DAG,
                                    SmallVectorImpl<SDValue> &Results) const;

  void analyzeFormalArgumentsCompute(
    CCState &State,
    const SmallVectorImpl<ISD::InputArg> &Ins) const;

public:
  AMDGPUTargetLowering(const TargetMachine &TM, const AMDGPUSubtarget &STI);

  bool mayIgnoreSignedZero(SDValue Op) const;

  /// \returns operand 0 of \p Val if \p Val is an ISD::BITCAST node, otherwise
  /// \p Val itself. Only one level of bitcast is looked through.
  static inline SDValue stripBitcast(SDValue Val) {
    return Val.getOpcode() == ISD::BITCAST ? Val.getOperand(0) : Val;
  }

  static bool shouldFoldFNegIntoSrc(SDNode *FNeg, SDValue FNegSrc);
  static bool allUsesHaveSourceMods(const SDNode *N,
                                    unsigned CostThreshold = 4);
  bool isFAbsFree(EVT VT) const override;
  bool isFNegFree(EVT VT) const override;
  bool isTruncateFree(EVT Src, EVT Dest) const override;
  bool isTruncateFree(Type *Src, Type *Dest) const override;

  bool isZExtFree(Type *Src, Type *Dest) const override;
  bool isZExtFree(EVT Src, EVT Dest) const override;

  SDValue getNegatedExpression(SDValue Op, SelectionDAG &DAG,
                               bool LegalOperations, bool ForCodeSize,
                               NegatibleCost &Cost,
                               unsigned Depth) const override;

  bool isNarrowingProfitable(SDNode *N, EVT SrcVT, EVT DestVT) const override;

  bool isDesirableToCommuteWithShift(const SDNode *N,
                                     CombineLevel Level) const override;

  EVT getTypeForExtReturn(LLVMContext &Context, EVT VT,
                          ISD::NodeType ExtendKind) const override;

  unsigned getVectorIdxWidth(const DataLayout &) const override;
  bool isSelectSupported(SelectSupportKind) const override;

  bool isFPImmLegal(const APFloat &Imm, EVT VT,
                    bool ForCodeSize) const override;
  bool ShouldShrinkFPConstant(EVT VT) const override;
  bool shouldReduceLoadWidth(SDNode *Load, ISD::LoadExtType ExtType, EVT ExtVT,
                             std::optional<unsigned> ByteOffset) const override;

  // Declared `final`: classes deriving from this one cannot override it.
  bool isLoadBitCastBeneficial(EVT, EVT, const SelectionDAG &DAG,
                               const MachineMemOperand &MMO) const final;

  bool storeOfVectorConstantIsCheap(bool IsZero, EVT MemVT,
                                    unsigned NumElem,
                                    unsigned AS) const override;
  bool aggressivelyPreferBuildVectorSources(EVT VecVT) const override;
  bool isCheapToSpeculateCttz(Type *Ty) const override;
  bool isCheapToSpeculateCtlz(Type *Ty) const override;

  bool isSDNodeAlwaysUniform(const SDNode *N) const override;

  // FIXME: This hook should not exist
  // Always answers AtomicExpansionKind::None, independent of \p LI.
  AtomicExpansionKind shouldCastAtomicLoadInIR(LoadInst *LI) const override {
    return AtomicExpansionKind::None;
  }

  // Always answers AtomicExpansionKind::None, independent of \p SI.
  AtomicExpansionKind shouldCastAtomicStoreInIR(StoreInst *SI) const override {
    return AtomicExpansionKind::None;
  }

  // Always answers AtomicExpansionKind::None, independent of the instruction.
  AtomicExpansionKind shouldCastAtomicRMWIInIR(AtomicRMWInst *) const override {
    return AtomicExpansionKind::None;
  }

  static CCAssignFn *CCAssignFnForCall(CallingConv::ID CC, bool IsVarArg);
  static CCAssignFn *CCAssignFnForReturn(CallingConv::ID CC, bool IsVarArg);

  SDValue LowerReturn(SDValue Chain, CallingConv::ID CallConv, bool isVarArg,
                      const SmallVectorImpl<ISD::OutputArg> &Outs,
                      const SmallVectorImpl<SDValue> &OutVals, const SDLoc &DL,
                      SelectionDAG &DAG) const override;

  SDValue addTokenForArgument(SDValue Chain,
                              SelectionDAG &DAG,
                              MachineFrameInfo &MFI,
                              int ClobberedFI) const;

  SDValue lowerUnhandledCall(CallLoweringInfo &CLI,
                             SmallVectorImpl<SDValue> &InVals,
                             StringRef Reason) const;
  SDValue LowerCall(CallLoweringInfo &CLI,
                    SmallVectorImpl<SDValue> &InVals) const override;

  SDValue LowerDYNAMIC_STACKALLOC(SDValue Op, SelectionDAG &DAG) const;
  SDValue LowerOperation(SDValue Op, SelectionDAG &DAG) const override;
  SDValue PerformDAGCombine(SDNode *N, DAGCombinerInfo &DCI) const override;
  void ReplaceNodeResults(SDNode * N,
                          SmallVectorImpl<SDValue> &Results,
                          SelectionDAG &DAG) const override;

  SDValue combineFMinMaxLegacyImpl(const SDLoc &DL, EVT VT, SDValue LHS,
                                   SDValue RHS, SDValue True, SDValue False,
                                   SDValue CC, DAGCombinerInfo &DCI) const;

  SDValue combineFMinMaxLegacy(const SDLoc &DL, EVT VT, SDValue LHS,
                               SDValue RHS, SDValue True, SDValue False,
                               SDValue CC, DAGCombinerInfo &DCI) const;

  const char* getTargetNodeName(unsigned Opcode) const override;

  // FIXME: Turn off MergeConsecutiveStores() before Instruction Selection for
  // AMDGPU.  Commit r319036,
  // (https://github.com/llvm/llvm-project/commit/db77e57ea86d941a4262ef60261692f4cb6893e6)
  // turned on MergeConsecutiveStores() before Instruction Selection for all
  // targets.  Enough AMDGPU compiles go into an infinite loop (
  // MergeConsecutiveStores() merges two stores; LegalizeStoreOps() un-merges;
  // MergeConsecutiveStores() re-merges, etc. ) to warrant turning it off for
  // now.
  bool mergeStoresAfterLegalization(EVT) const override { return false; }

  // Unconditionally reports true; neither \p Operand nor \p DAG is consulted.
  bool isFsqrtCheap(SDValue Operand, SelectionDAG &DAG) const override {
    return true;
  }
  SDValue getSqrtEstimate(SDValue Operand, SelectionDAG &DAG, int Enabled,
                           int &RefinementSteps, bool &UseOneConstNR,
                           bool Reciprocal) const override;
  SDValue getRecipEstimate(SDValue Operand, SelectionDAG &DAG, int Enabled,
                           int &RefinementSteps) const override;

  // Pure virtual: every concrete subclass has to implement this.
  virtual SDNode *PostISelFolding(MachineSDNode *N,
                                  SelectionDAG &DAG) const = 0;

  /// Determine which bits of \p Op are known to be either zero or one and
  /// return them in \p Known.
  void computeKnownBitsForTargetNode(const SDValue Op,
                                     KnownBits &Known,
                                     const APInt &DemandedElts,
                                     const SelectionDAG &DAG,
                                     unsigned Depth = 0) const override;

  unsigned ComputeNumSignBitsForTargetNode(SDValue Op, const APInt &DemandedElts,
                                           const SelectionDAG &DAG,
                                           unsigned Depth = 0) const override;

  unsigned computeNumSignBitsForTargetInstr(GISelValueTracking &Analysis,
                                            Register R,
                                            const APInt &DemandedElts,
                                            const MachineRegisterInfo &MRI,
                                            unsigned Depth = 0) const override;

  bool canCreateUndefOrPoisonForTargetNode(SDValue Op,
                                           const APInt &DemandedElts,
                                           const SelectionDAG &DAG,
                                           bool PoisonOnly, bool ConsiderFlags,
                                           unsigned Depth) const override;

  bool isKnownNeverNaNForTargetNode(SDValue Op, const APInt &DemandedElts,
                                    const SelectionDAG &DAG, bool SNaN = false,
                                    unsigned Depth = 0) const override;

  bool isReassocProfitable(MachineRegisterInfo &MRI, Register N0,
                           Register N1) const override;

  /// Helper function that adds Reg to the LiveIn list of the DAG's
  /// MachineFunction.
  ///
  /// \returns a RegisterSDNode representing Reg if \p RawReg is true, otherwise
  /// a copy from the register.
  SDValue CreateLiveInRegister(SelectionDAG &DAG,
                               const TargetRegisterClass *RC,
                               Register Reg, EVT VT,
                               const SDLoc &SL,
                               bool RawReg = false) const;
  /// Convenience overload: forwards to the overload above with the SDLoc of
  /// the DAG's entry node and the default \p RawReg (false).
  SDValue CreateLiveInRegister(SelectionDAG &DAG,
                               const TargetRegisterClass *RC,
                               Register Reg, EVT VT) const {
    return CreateLiveInRegister(DAG, RC, Reg, VT, SDLoc(DAG.getEntryNode()));
  }

  // Returns the raw live in register rather than a copy from it. Forwards to
  // CreateLiveInRegister with the entry node's SDLoc and RawReg = true.
  SDValue CreateLiveInRegisterRaw(SelectionDAG &DAG,
                                  const TargetRegisterClass *RC,
                                  Register Reg, EVT VT) const {
    return CreateLiveInRegister(DAG, RC, Reg, VT, SDLoc(DAG.getEntryNode()), true);
  }

  /// Similar to CreateLiveInRegister, except the value may be loaded from a
  /// stack slot rather than passed in a register.
  SDValue loadStackInputValue(SelectionDAG &DAG,
                              EVT VT,
                              const SDLoc &SL,
                              int64_t Offset) const;

  SDValue storeStackInputValue(SelectionDAG &DAG,
                               const SDLoc &SL,
                               SDValue Chain,
                               SDValue ArgVal,
                               int64_t Offset) const;

  SDValue loadInputValue(SelectionDAG &DAG,
                         const TargetRegisterClass *RC,
                         EVT VT, const SDLoc &SL,
                         const ArgDescriptor &Arg) const;

  /// Selects which implicit parameter getImplicitParameterOffset should
  /// report the offset of.
  enum ImplicitParameter {
    FIRST_IMPLICIT,
    PRIVATE_BASE,
    SHARED_BASE,
    QUEUE_PTR,
  };

  /// Helper function that returns the byte offset of the given
  /// type of implicit parameter.
  uint32_t getImplicitParameterOffset(const MachineFunction &MF,
                                      const ImplicitParameter Param) const;
  uint32_t getImplicitParameterOffset(const uint64_t ExplicitKernArgSize,
                                      const ImplicitParameter Param) const;

  // The fence operand type is always MVT::i32; \p DL is not consulted.
  MVT getFenceOperandTy(const DataLayout &DL) const override {
    return MVT::i32;
  }

  // Unconditionally true for every \p VT; see the FIXME for why this is only
  // an approximation.
  bool hasMultipleConditionRegisters(EVT VT) const override {
    // FIXME: This is only partially true. If we have to do vector compares, any
    // SGPR pair can be a condition register. If we have a uniform condition, we
    // are better off doing SALU operations, where there is only one SCC. For
    // now, we don't have a way of knowing during instruction selection if a
    // condition will be uniform and we always use vector compares. Assume we
    // are using vector compares until that is fixed.
    return true;
  }
};


namespace AMDGPUISD {


/// AMDGPU-specific SelectionDAG node opcodes.
///
/// Numbering starts at ISD::BUILTIN_OP_END (FIRST_NUMBER) and every other
/// enumerator takes the next consecutive value, so the declaration order is
/// significant: inserting or reordering entries renumbers everything after
/// them. FIRST_MEMORY_OPCODE and LAST_MEMORY_OPCODE alias LOAD_D16_HI and
/// BUFFER_ATOMIC_COND_SUB_U32 respectively, bracketing a contiguous range.
enum NodeType : unsigned {
  // AMDIL ISD Opcodes
  FIRST_NUMBER = ISD::BUILTIN_OP_END,
  BRANCH_COND,
  // End AMDIL ISD Opcodes

  // Function call.
  CALL,
  TC_RETURN,
  TC_RETURN_GFX,
  TC_RETURN_CHAIN,
  TC_RETURN_CHAIN_DVGPR,
  TRAP,

  // Masked control flow nodes.
  IF,
  ELSE,
  LOOP,

  // A uniform kernel return that terminates the wavefront.
  ENDPGM,

  // s_endpgm, but we may want to insert it in the middle of the block.
  ENDPGM_TRAP,

  // "s_trap 2" equivalent on hardware that does not support it.
  SIMULATED_TRAP,

  // Return to a shader part's epilog code.
  RETURN_TO_EPILOG,

  // Return with values from a non-entry function.
  RET_GLUE,

  // Convert an unswizzled wave uniform stack address to an address compatible
  // with a vector offset for use in stack access.
  WAVE_ADDRESS,

  DWORDADDR,
  FRACT,

  /// CLAMP value between 0.0 and 1.0. NaN clamped to 0, following clamp output
  /// modifier behavior with dx10_enable.
  CLAMP,

  // This is SETCC with the full mask result which is used for a compare with a
  // result bit per item in the wavefront.
  SETCC,

  DENORM_MODE,

  // FP ops with input and output chain.
  FMA_W_CHAIN,
  FMUL_W_CHAIN,

  // SIN_HW, COS_HW - f32 for SI, 1 ULP max error, valid from -100 pi to 100 pi.
  // Denormals handled on some parts.
  COS_HW,
  SIN_HW,
  FMAX_LEGACY,
  FMIN_LEGACY,

  FMAX3,
  SMAX3,
  UMAX3,
  FMIN3,
  SMIN3,
  UMIN3,
  FMED3,
  SMED3,
  UMED3,
  FMAXIMUM3,
  FMINIMUM3,
  FDOT2,
  URECIP,
  DIV_SCALE,
  DIV_FMAS,
  DIV_FIXUP,
  // For emitting ISD::FMAD when f32 denormals are enabled because mac/mad is
  // treated as an illegal operation.
  FMAD_FTZ,

  // RCP, RSQ - For f32, 1 ULP max error, no denormal handling.
  //            For f64, max error 2^29 ULP, handles denormals.
  RCP,
  RSQ,
  RCP_LEGACY,
  RCP_IFLAG,

  // log2, no denormal handling for f32.
  LOG,

  // exp2, no denormal handling for f32.
  EXP,

  FMUL_LEGACY,
  RSQ_CLAMP,
  FP_CLASS,
  DOT4,
  CARRY,
  BORROW,
  BFE_U32,  // Extract range of bits with zero extension to 32-bits.
  BFE_I32,  // Extract range of bits with sign extension to 32-bits.
  BFI,      // (src0 & src1) | (~src0 & src2)
  BFM,      // Insert a range of bits into a 32-bit word.
  FFBH_U32, // ctlz with -1 if input is zero.
  FFBH_I32,
  FFBL_B32, // cttz with -1 if input is zero.
  MUL_U24,
  MUL_I24,
  MULHI_U24,
  MULHI_I24,
  MAD_U24,
  MAD_I24,
  MAD_U64_U32,
  MAD_I64_I32,
  PERM,
  TEXTURE_FETCH,
  R600_EXPORT,
  CONST_ADDRESS,
  REGISTER_LOAD,
  REGISTER_STORE,

  // These cvt_f32_ubyte* nodes need to remain consecutive and in order.
  CVT_F32_UBYTE0,
  CVT_F32_UBYTE1,
  CVT_F32_UBYTE2,
  CVT_F32_UBYTE3,

  // Convert two float 32 numbers into a single register holding two packed f16
  // with round to zero.
  CVT_PKRTZ_F16_F32,
  CVT_PKNORM_I16_F32,
  CVT_PKNORM_U16_F32,
  CVT_PK_I16_I32,
  CVT_PK_U16_U32,

  // Same as the standard node, except the high bits of the resulting integer
  // are known 0.
  FP_TO_FP16,

  /// This node is for VLIW targets and it is used to represent a vector
  /// that is stored in consecutive registers with the same channel.
  /// For example:
  ///   |X  |Y|Z|W|
  /// T0|v.x| | | |
  /// T1|v.y| | | |
  /// T2|v.z| | | |
  /// T3|v.w| | | |
  BUILD_VERTICAL_VECTOR,
  /// Pointer to the start of the shader's constant data.
  CONST_DATA_PTR,
  PC_ADD_REL_OFFSET,
  PC_ADD_REL_OFFSET64,
  LDS,

  DUMMY_CHAIN,

  // Start of the contiguous range closed by LAST_MEMORY_OPCODE below.
  // FIRST_MEMORY_OPCODE is a marker sharing its value with LOAD_D16_HI.
  FIRST_MEMORY_OPCODE,
  LOAD_D16_HI = FIRST_MEMORY_OPCODE,
  LOAD_D16_LO,
  LOAD_D16_HI_I8,
  LOAD_D16_HI_U8,
  LOAD_D16_LO_I8,
  LOAD_D16_LO_U8,

  STORE_MSKOR,
  TBUFFER_STORE_FORMAT,
  TBUFFER_STORE_FORMAT_D16,
  TBUFFER_LOAD_FORMAT,
  TBUFFER_LOAD_FORMAT_D16,
  DS_ORDERED_COUNT,
  ATOMIC_CMP_SWAP,
  BUFFER_LOAD,
  BUFFER_LOAD_UBYTE,
  BUFFER_LOAD_USHORT,
  BUFFER_LOAD_BYTE,
  BUFFER_LOAD_SHORT,
  BUFFER_LOAD_TFE,
  BUFFER_LOAD_UBYTE_TFE,
  BUFFER_LOAD_USHORT_TFE,
  BUFFER_LOAD_BYTE_TFE,
  BUFFER_LOAD_SHORT_TFE,
  BUFFER_LOAD_FORMAT,
  BUFFER_LOAD_FORMAT_TFE,
  BUFFER_LOAD_FORMAT_D16,
  SBUFFER_LOAD,
  SBUFFER_LOAD_BYTE,
  SBUFFER_LOAD_UBYTE,
  SBUFFER_LOAD_SHORT,
  SBUFFER_LOAD_USHORT,
  SBUFFER_PREFETCH_DATA,
  BUFFER_STORE,
  BUFFER_STORE_BYTE,
  BUFFER_STORE_SHORT,
  BUFFER_STORE_FORMAT,
  BUFFER_STORE_FORMAT_D16,
  BUFFER_ATOMIC_SWAP,
  BUFFER_ATOMIC_ADD,
  BUFFER_ATOMIC_SUB,
  BUFFER_ATOMIC_SMIN,
  BUFFER_ATOMIC_UMIN,
  BUFFER_ATOMIC_SMAX,
  BUFFER_ATOMIC_UMAX,
  BUFFER_ATOMIC_AND,
  BUFFER_ATOMIC_OR,
  BUFFER_ATOMIC_XOR,
  BUFFER_ATOMIC_INC,
  BUFFER_ATOMIC_DEC,
  BUFFER_ATOMIC_CMPSWAP,
  BUFFER_ATOMIC_CSUB,
  BUFFER_ATOMIC_FADD,
  BUFFER_ATOMIC_FMIN,
  BUFFER_ATOMIC_FMAX,
  BUFFER_ATOMIC_COND_SUB_U32,
  // End marker of the range opened by FIRST_MEMORY_OPCODE; it must keep
  // aliasing whichever enumerator is last in that range.
  LAST_MEMORY_OPCODE = BUFFER_ATOMIC_COND_SUB_U32,

  // Set up a whole wave function.
  WHOLE_WAVE_SETUP,

  // Return from a whole wave function.
  WHOLE_WAVE_RETURN,
};


} // End namespace AMDGPUISD


} // End namespace llvm


#endif

MRI
unsigned const MachineRegisterInfo * MRI
Definition: AArch64AdvSIMDScalarPass.cpp:103

AMDGPUSubtarget
#define AMDGPUSubtarget
Definition: AMDGPUInstructionSelector.cpp:38

DL
MachineBasicBlock MachineBasicBlock::iterator DebugLoc DL
Definition: ARMSLSHardening.cpp:73

Results
Function Alias Analysis Results
Definition: AliasAnalysis.cpp:722

Analysis
block Block Frequency Analysis
Definition: BlockFrequencyInfo.cpp:300

CallingConvLower.h

Reg
Register Reg
Definition: MachineSink.cpp:2117

Context
@ Context
Definition: MemProfContextDisambiguation.cpp:124

Cond
const SmallVectorImpl< MachineOperand > & Cond
Definition: RISCVRedundantCopyElimination.cpp:71

Opc
auto Opc
Definition: RISCVRedundantCopyElimination.cpp:75

TargetLowering.h
This file describes how to lower LLVM code to machine code.

UndefPoisonKind::PoisonOnly
@ PoisonOnly

RHS
Value * RHS
Definition: X86PartialReduction.cpp:74

LHS
Value * LHS
Definition: X86PartialReduction.cpp:73

llvm::AMDGPUMachineFunction
Definition: AMDGPUMachineFunction.h:24

llvm::AMDGPUSubtarget
Definition: AMDGPUSubtarget.h:30

llvm::AMDGPUTargetLowering
Definition: AMDGPUISelLowering.h:27

llvm::AMDGPUTargetLowering::numBitsSigned
static unsigned numBitsSigned(SDValue Op, SelectionDAG &DAG)
Definition: AMDGPUISelLowering.cpp:55

llvm::AMDGPUTargetLowering::combineFMinMaxLegacy
SDValue combineFMinMaxLegacy(const SDLoc &DL, EVT VT, SDValue LHS, SDValue RHS, SDValue True, SDValue False, SDValue CC, DAGCombinerInfo &DCI) const
Generate Min/Max node.
Definition: AMDGPUISelLowering.cpp:1721

llvm::AMDGPUTargetLowering::ComputeNumSignBitsForTargetNode
unsigned ComputeNumSignBitsForTargetNode(SDValue Op, const APInt &DemandedElts, const SelectionDAG &DAG, unsigned Depth=0) const override
This method can be implemented by targets that want to expose additional information about sign bits ...
Definition: AMDGPUISelLowering.cpp:6037

llvm::AMDGPUTargetLowering::performMulhuCombine
SDValue performMulhuCombine(SDNode *N, DAGCombinerInfo &DCI) const
Definition: AMDGPUISelLowering.cpp:4671

llvm::AMDGPUTargetLowering::getTypeForExtReturn
EVT getTypeForExtReturn(LLVMContext &Context, EVT VT, ISD::NodeType ExtendKind) const override
Return the type that should be used to zero or sign extend a zeroext/signext integer return value.
Definition: AMDGPUISelLowering.cpp:788

llvm::AMDGPUTargetLowering::SplitVectorLoad
SDValue SplitVectorLoad(SDValue Op, SelectionDAG &DAG) const
Split a vector load into 2 loads of half the vector.
Definition: AMDGPUISelLowering.cpp:1844

llvm::AMDGPUTargetLowering::LowerCONCAT_VECTORS
SDValue LowerCONCAT_VECTORS(SDValue Op, SelectionDAG &DAG) const
Definition: AMDGPUISelLowering.cpp:1564

llvm::AMDGPUTargetLowering::performLoadCombine
SDValue performLoadCombine(SDNode *N, DAGCombinerInfo &DCI) const
Definition: AMDGPUISelLowering.cpp:3881

llvm::AMDGPUTargetLowering::analyzeFormalArgumentsCompute
void analyzeFormalArgumentsCompute(CCState &State, const SmallVectorImpl< ISD::InputArg > &Ins) const
The SelectionDAGBuilder will automatically promote function arguments with illegal types.
Definition: AMDGPUISelLowering.cpp:1202

llvm::AMDGPUTargetLowering::LowerF64ToF16Safe
SDValue LowerF64ToF16Safe(SDValue Src, const SDLoc &DL, SelectionDAG &DAG) const
Definition: AMDGPUISelLowering.cpp:3612

llvm::AMDGPUTargetLowering::LowerFROUND
SDValue LowerFROUND(SDValue Op, SelectionDAG &DAG) const
Definition: AMDGPUISelLowering.cpp:2575

llvm::AMDGPUTargetLowering::storeStackInputValue
SDValue storeStackInputValue(SelectionDAG &DAG, const SDLoc &SL, SDValue Chain, SDValue ArgVal, int64_t Offset) const
Definition: AMDGPUISelLowering.cpp:5593

llvm::AMDGPUTargetLowering::storeOfVectorConstantIsCheap
bool storeOfVectorConstantIsCheap(bool IsZero, EVT MemVT, unsigned NumElem, unsigned AS) const override
Return true if it is expected to be cheaper to do a store of vector constant with the given size and ...
Definition: AMDGPUISelLowering.cpp:968

llvm::AMDGPUTargetLowering::LowerEXTRACT_SUBVECTOR
SDValue LowerEXTRACT_SUBVECTOR(SDValue Op, SelectionDAG &DAG) const
Definition: AMDGPUISelLowering.cpp:1599

llvm::AMDGPUTargetLowering::computeKnownBitsForTargetNode
void computeKnownBitsForTargetNode(const SDValue Op, KnownBits &Known, const APInt &DemandedElts, const SelectionDAG &DAG, unsigned Depth=0) const override
Determine which of the bits specified in Mask are known to be either zero or one and return them in t...
Definition: AMDGPUISelLowering.cpp:5872

llvm::AMDGPUTargetLowering::shouldCombineMemoryType
bool shouldCombineMemoryType(EVT VT) const
Definition: AMDGPUISelLowering.cpp:3860

llvm::AMDGPUTargetLowering::splitBinaryBitConstantOpImpl
SDValue splitBinaryBitConstantOpImpl(DAGCombinerInfo &DCI, const SDLoc &SL, unsigned Opc, SDValue LHS, uint32_t ValLo, uint32_t ValHi) const
Split the 64-bit value LHS into two 32-bit components, and perform the binary operation Opc to it wit...
Definition: AMDGPUISelLowering.cpp:4052

llvm::AMDGPUTargetLowering::lowerUnhandledCall
SDValue lowerUnhandledCall(CallLoweringInfo &CLI, SmallVectorImpl< SDValue > &InVals, StringRef Reason) const
Definition: AMDGPUISelLowering.cpp:1377

llvm::AMDGPUTargetLowering::performAssertSZExtCombine
SDValue performAssertSZExtCombine(SDNode *N, DAGCombinerInfo &DCI) const
Definition: AMDGPUISelLowering.cpp:3991

llvm::AMDGPUTargetLowering::LowerSTORE
SDValue LowerSTORE(SDValue Op, SelectionDAG &DAG) const

llvm::AMDGPUTargetLowering::isTruncateFree
bool isTruncateFree(EVT Src, EVT Dest) const override
Definition: AMDGPUISelLowering.cpp:986

llvm::AMDGPUTargetLowering::aggressivelyPreferBuildVectorSources
bool aggressivelyPreferBuildVectorSources(EVT VecVT) const override
Definition: AMDGPUISelLowering.cpp:974

llvm::AMDGPUTargetLowering::LowerFCEIL
SDValue LowerFCEIL(SDValue Op, SelectionDAG &DAG) const
Definition: AMDGPUISelLowering.cpp:2441

llvm::AMDGPUTargetLowering::getConstantNegateCost
TargetLowering::NegatibleCost getConstantNegateCost(const ConstantFPSDNode *C) const
Definition: AMDGPUISelLowering.cpp:4924

llvm::AMDGPUTargetLowering::LowerFLOGUnsafe
SDValue LowerFLOGUnsafe(SDValue Op, const SDLoc &SL, SelectionDAG &DAG, bool IsLog10, SDNodeFlags Flags) const
Definition: AMDGPUISelLowering.cpp:2866

llvm::AMDGPUTargetLowering::canCreateUndefOrPoisonForTargetNode
bool canCreateUndefOrPoisonForTargetNode(SDValue Op, const APInt &DemandedElts, const SelectionDAG &DAG, bool PoisonOnly, bool ConsiderFlags, unsigned Depth) const override
Return true if Op can create undef or poison from non-undef & non-poison operands.
Definition: AMDGPUISelLowering.cpp:6134

llvm::AMDGPUTargetLowering::performMulhsCombine
SDValue performMulhsCombine(SDNode *N, DAGCombinerInfo &DCI) const
Definition: AMDGPUISelLowering.cpp:4638

llvm::AMDGPUTargetLowering::isSDNodeAlwaysUniform
bool isSDNodeAlwaysUniform(const SDNode *N) const override
Definition: AMDGPUISelLowering.cpp:894

llvm::AMDGPUTargetLowering::isDesirableToCommuteWithShift
bool isDesirableToCommuteWithShift(const SDNode *N, CombineLevel Level) const override
Return true if it is profitable to move this shift by a constant amount through its operand,...
Definition: AMDGPUISelLowering.cpp:1074

llvm::AMDGPUTargetLowering::LowerFREM
SDValue LowerFREM(SDValue Op, SelectionDAG &DAG) const
Split a vector store into multiple scalar stores.
Definition: AMDGPUISelLowering.cpp:2427

llvm::AMDGPUTargetLowering::PostISelFolding
virtual SDNode * PostISelFolding(MachineSDNode *N, SelectionDAG &DAG) const =0

llvm::AMDGPUTargetLowering::performShlCombine
SDValue performShlCombine(SDNode *N, DAGCombinerInfo &DCI) const
Definition: AMDGPUISelLowering.cpp:4075

llvm::AMDGPUTargetLowering::isCheapToSpeculateCtlz
bool isCheapToSpeculateCtlz(Type *Ty) const override
Return true if it is cheap to speculate a call to intrinsic ctlz.
Definition: AMDGPUISelLowering.cpp:890

llvm::AMDGPUTargetLowering::LowerSDIVREM
SDValue LowerSDIVREM(SDValue Op, SelectionDAG &DAG) const
Definition: AMDGPUISelLowering.cpp:2366

llvm::AMDGPUTargetLowering::isFNegFree
bool isFNegFree(EVT VT) const override
Return true if an fneg operation is free to the point where it is never worthwhile to replace it with...
Definition: AMDGPUISelLowering.cpp:961

llvm::AMDGPUTargetLowering::LowerFLOG10
SDValue LowerFLOG10(SDValue Op, SelectionDAG &DAG) const
Definition: AMDGPUISelLowering.cpp:2860

llvm::AMDGPUTargetLowering::LowerINT_TO_FP64
SDValue LowerINT_TO_FP64(SDValue Op, SelectionDAG &DAG, bool Signed) const
Definition: AMDGPUISelLowering.cpp:3406

llvm::AMDGPUTargetLowering::computeNumSignBitsForTargetInstr
unsigned computeNumSignBitsForTargetInstr(GISelValueTracking &Analysis, Register R, const APInt &DemandedElts, const MachineRegisterInfo &MRI, unsigned Depth=0) const override
This method can be implemented by targets that want to expose additional information about sign bits ...
Definition: AMDGPUISelLowering.cpp:6098

llvm::AMDGPUTargetLowering::LowerOperation
SDValue LowerOperation(SDValue Op, SelectionDAG &DAG) const override
This callback is invoked for operations that are unsupported by the target, which are registered to u...
Definition: AMDGPUISelLowering.cpp:1418

llvm::AMDGPUTargetLowering::LowerFP_TO_FP16
SDValue LowerFP_TO_FP16(SDValue Op, SelectionDAG &DAG) const
Definition: AMDGPUISelLowering.cpp:3595

llvm::AMDGPUTargetLowering::addTokenForArgument
SDValue addTokenForArgument(SDValue Chain, SelectionDAG &DAG, MachineFrameInfo &MFI, int ClobberedFI) const
Definition: AMDGPUISelLowering.cpp:1343

llvm::AMDGPUTargetLowering::isConstantCheaperToNegate
bool isConstantCheaperToNegate(SDValue N) const
Definition: AMDGPUISelLowering.cpp:4940

llvm::AMDGPUTargetLowering::isReassocProfitable
bool isReassocProfitable(MachineRegisterInfo &MRI, Register N0, Register N1) const override
Definition: AMDGPUISelLowering.cpp:6262

llvm::AMDGPUTargetLowering::isKnownNeverNaNForTargetNode
bool isKnownNeverNaNForTargetNode(SDValue Op, const APInt &DemandedElts, const SelectionDAG &DAG, bool SNaN=false, unsigned Depth=0) const override
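If SNaN is false, returns true if Op is known to never be any NaN; if SNaN is true, returns true if Op is known to never be a signaling NaN.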
Definition: AMDGPUISelLowering.cpp:6147

llvm::AMDGPUTargetLowering::needsDenormHandlingF32
static bool needsDenormHandlingF32(const SelectionDAG &DAG, SDValue Src, SDNodeFlags Flags)
Definition: AMDGPUISelLowering.cpp:2656

llvm::AMDGPUTargetLowering::getFenceOperandTy
MVT getFenceOperandTy(const DataLayout &DL) const override
Return the type for operands of fence.
Definition: AMDGPUISelLowering.h:394

llvm::AMDGPUTargetLowering::getImplicitParameterOffset
uint32_t getImplicitParameterOffset(const MachineFunction &MF, const ImplicitParameter Param) const
Helper function that returns the byte offset of the given type of implicit parameter.
Definition: AMDGPUISelLowering.cpp:5652

llvm::AMDGPUTargetLowering::LowerFFLOOR
SDValue LowerFFLOOR(SDValue Op, SelectionDAG &DAG) const
Definition: AMDGPUISelLowering.cpp:2602

llvm::AMDGPUTargetLowering::performSelectCombine
SDValue performSelectCombine(SDNode *N, DAGCombinerInfo &DCI) const
Definition: AMDGPUISelLowering.cpp:4865

llvm::AMDGPUTargetLowering::performFNegCombine
SDValue performFNegCombine(SDNode *N, DAGCombinerInfo &DCI) const
Definition: AMDGPUISelLowering.cpp:4994

llvm::AMDGPUTargetLowering::LowerFP_TO_INT
SDValue LowerFP_TO_INT(SDValue Op, SelectionDAG &DAG) const
Definition: AMDGPUISelLowering.cpp:3700

llvm::AMDGPUTargetLowering::LowerGlobalAddress
virtual SDValue LowerGlobalAddress(AMDGPUMachineFunction *MFI, SDValue Op, SelectionDAG &DAG) const
Definition: AMDGPUISelLowering.cpp:1506

llvm::AMDGPUTargetLowering::isConstantCostlierToNegate
bool isConstantCostlierToNegate(SDValue N) const
Definition: AMDGPUISelLowering.cpp:4934

llvm::AMDGPUTargetLowering::loadInputValue
SDValue loadInputValue(SelectionDAG &DAG, const TargetRegisterClass *RC, EVT VT, const SDLoc &SL, const ArgDescriptor &Arg) const
Definition: AMDGPUISelLowering.cpp:5612

llvm::AMDGPUTargetLowering::LowerDIVREM24
SDValue LowerDIVREM24(SDValue Op, SelectionDAG &DAG, bool sign) const
Definition: AMDGPUISelLowering.cpp:1982

llvm::AMDGPUTargetLowering::lowerFEXP10Unsafe
SDValue lowerFEXP10Unsafe(SDValue Op, const SDLoc &SL, SelectionDAG &DAG, SDNodeFlags Flags) const
Emit approx-funcs appropriate lowering for exp10.
Definition: AMDGPUISelLowering.cpp:2996

llvm::AMDGPUTargetLowering::shouldReduceLoadWidth
bool shouldReduceLoadWidth(SDNode *Load, ISD::LoadExtType ExtType, EVT ExtVT, std::optional< unsigned > ByteOffset) const override
Return true if it is profitable to reduce a load to a smaller type.
Definition: AMDGPUISelLowering.cpp:822

llvm::AMDGPUTargetLowering::LowerUINT_TO_FP
SDValue LowerUINT_TO_FP(SDValue Op, SelectionDAG &DAG) const
Definition: AMDGPUISelLowering.cpp:3425

llvm::AMDGPUTargetLowering::CreateLiveInRegisterRaw
SDValue CreateLiveInRegisterRaw(SelectionDAG &DAG, const TargetRegisterClass *RC, Register Reg, EVT VT) const
Definition: AMDGPUISelLowering.h:356

llvm::AMDGPUTargetLowering::isCheapToSpeculateCttz
bool isCheapToSpeculateCttz(Type *Ty) const override
Return true if it is cheap to speculate a call to intrinsic cttz.
Definition: AMDGPUISelLowering.cpp:886

llvm::AMDGPUTargetLowering::performCtlz_CttzCombine
SDValue performCtlz_CttzCombine(const SDLoc &SL, SDValue Cond, SDValue LHS, SDValue RHS, DAGCombinerInfo &DCI) const
Definition: AMDGPUISelLowering.cpp:4731

llvm::AMDGPUTargetLowering::performSraCombine
SDValue performSraCombine(SDNode *N, DAGCombinerInfo &DCI) const
Definition: AMDGPUISelLowering.cpp:4177

llvm::AMDGPUTargetLowering::isSelectSupported
bool isSelectSupported(SelectSupportKind) const override
Definition: AMDGPUISelLowering.cpp:803

llvm::AMDGPUTargetLowering::isZExtFree
bool isZExtFree(Type *Src, Type *Dest) const override
Return true if any actual instruction that defines a value of type FromTy implicitly zero-extends the...
Definition: AMDGPUISelLowering.cpp:1007

llvm::AMDGPUTargetLowering::lowerFEXP2
SDValue lowerFEXP2(SDValue Op, SelectionDAG &DAG) const
Definition: AMDGPUISelLowering.cpp:2905

llvm::AMDGPUTargetLowering::LowerCall
SDValue LowerCall(CallLoweringInfo &CLI, SmallVectorImpl< SDValue > &InVals) const override
This hook must be implemented to lower calls into the specified DAG.
Definition: AMDGPUISelLowering.cpp:1403

llvm::AMDGPUTargetLowering::shouldCastAtomicLoadInIR
AtomicExpansionKind shouldCastAtomicLoadInIR(LoadInst *LI) const override
Returns how the given (atomic) load should be cast by the IR-level AtomicExpand pass.
Definition: AMDGPUISelLowering.h:237

llvm::AMDGPUTargetLowering::performSrlCombine
SDValue performSrlCombine(SDNode *N, DAGCombinerInfo &DCI) const
Definition: AMDGPUISelLowering.cpp:4278

llvm::AMDGPUTargetLowering::lowerFEXP
SDValue lowerFEXP(SDValue Op, SelectionDAG &DAG) const
Definition: AMDGPUISelLowering.cpp:3049

llvm::AMDGPUTargetLowering::getIsLtSmallestNormal
SDValue getIsLtSmallestNormal(SelectionDAG &DAG, SDValue Op, SDNodeFlags Flags) const
Definition: AMDGPUISelLowering.cpp:2665

llvm::AMDGPUTargetLowering::mayIgnoreSignedZero
bool mayIgnoreSignedZero(SDValue Op) const
Definition: AMDGPUISelLowering.cpp:633

llvm::AMDGPUTargetLowering::getIsFinite
SDValue getIsFinite(SelectionDAG &DAG, SDValue Op, SDNodeFlags Flags) const
Definition: AMDGPUISelLowering.cpp:2683

llvm::AMDGPUTargetLowering::isLoadBitCastBeneficial
bool isLoadBitCastBeneficial(EVT, EVT, const SelectionDAG &DAG, const MachineMemOperand &MMO) const final
Return true if the following transform is beneficial: fold (conv (load x)) -> (load (conv*)x) On arch...
Definition: AMDGPUISelLowering.cpp:862

llvm::AMDGPUTargetLowering::splitVector
std::pair< SDValue, SDValue > splitVector(const SDValue &N, const SDLoc &DL, const EVT &LoVT, const EVT &HighVT, SelectionDAG &DAG) const
Split a vector value into two parts of types LoVT and HighVT.
Definition: AMDGPUISelLowering.cpp:1809

llvm::AMDGPUTargetLowering::LowerFLOGCommon
SDValue LowerFLOGCommon(SDValue Op, SelectionDAG &DAG) const
Definition: AMDGPUISelLowering.cpp:2764

llvm::AMDGPUTargetLowering::foldFreeOpFromSelect
SDValue foldFreeOpFromSelect(TargetLowering::DAGCombinerInfo &DCI, SDValue N) const
Definition: AMDGPUISelLowering.cpp:4788

llvm::AMDGPUTargetLowering::LowerINT_TO_FP32
SDValue LowerINT_TO_FP32(SDValue Op, SelectionDAG &DAG, bool Signed) const
Definition: AMDGPUISelLowering.cpp:3280

llvm::AMDGPUTargetLowering::isFAbsFree
bool isFAbsFree(EVT VT) const override
Return true if an fabs operation is free to the point where it is never worthwhile to replace it with...
Definition: AMDGPUISelLowering.cpp:953

llvm::AMDGPUTargetLowering::loadStackInputValue
SDValue loadStackInputValue(SelectionDAG &DAG, EVT VT, const SDLoc &SL, int64_t Offset) const
Similar to CreateLiveInRegister, except value may be loaded from a stack slot rather than passed in a ...
Definition: AMDGPUISelLowering.cpp:5577

llvm::AMDGPUTargetLowering::LowerFLOG2
SDValue LowerFLOG2(SDValue Op, SelectionDAG &DAG) const
Definition: AMDGPUISelLowering.cpp:2723

llvm::AMDGPUTargetLowering::getEquivalentMemType
static EVT getEquivalentMemType(LLVMContext &Context, EVT VT)
Definition: AMDGPUISelLowering.cpp:40

llvm::AMDGPUTargetLowering::getSqrtEstimate
SDValue getSqrtEstimate(SDValue Operand, SelectionDAG &DAG, int Enabled, int &RefinementSteps, bool &UseOneConstNR, bool Reciprocal) const override
Hooks for building estimates in place of slower divisions and square roots.
Definition: AMDGPUISelLowering.cpp:5820

llvm::AMDGPUTargetLowering::performTruncateCombine
SDValue performTruncateCombine(SDNode *N, DAGCombinerInfo &DCI) const
Definition: AMDGPUISelLowering.cpp:4382

llvm::AMDGPUTargetLowering::LowerSINT_TO_FP
SDValue LowerSINT_TO_FP(SDValue Op, SelectionDAG &DAG) const
Definition: AMDGPUISelLowering.cpp:3471

llvm::AMDGPUTargetLowering::ImplicitParameter
ImplicitParameter
Definition: AMDGPUISelLowering.h:380

llvm::AMDGPUTargetLowering::SHARED_BASE
@ SHARED_BASE
Definition: AMDGPUISelLowering.h:383

llvm::AMDGPUTargetLowering::PRIVATE_BASE
@ PRIVATE_BASE
Definition: AMDGPUISelLowering.h:382

llvm::AMDGPUTargetLowering::FIRST_IMPLICIT
@ FIRST_IMPLICIT
Definition: AMDGPUISelLowering.h:381

llvm::AMDGPUTargetLowering::QUEUE_PTR
@ QUEUE_PTR
Definition: AMDGPUISelLowering.h:384

llvm::AMDGPUTargetLowering::stripBitcast
static SDValue stripBitcast(SDValue Val)
Definition: AMDGPUISelLowering.h:187

llvm::AMDGPUTargetLowering::CreateLiveInRegister
SDValue CreateLiveInRegister(SelectionDAG &DAG, const TargetRegisterClass *RC, Register Reg, EVT VT, const SDLoc &SL, bool RawReg=false) const
Helper function that adds Reg to the LiveIn list of the DAG's MachineFunction.
Definition: AMDGPUISelLowering.cpp:5541

llvm::AMDGPUTargetLowering::SplitVectorStore
SDValue SplitVectorStore(SDValue Op, SelectionDAG &DAG) const
Split a vector store into 2 stores of half the vector.
Definition: AMDGPUISelLowering.cpp:1938

llvm::AMDGPUTargetLowering::LowerCTLZ_CTTZ
SDValue LowerCTLZ_CTTZ(SDValue Op, SelectionDAG &DAG) const
Definition: AMDGPUISelLowering.cpp:3220

llvm::AMDGPUTargetLowering::getNegatedExpression
SDValue getNegatedExpression(SDValue Op, SelectionDAG &DAG, bool LegalOperations, bool ForCodeSize, NegatibleCost &Cost, unsigned Depth) const override
Return the newly negated expression if the cost is not expensive and set the cost in Cost to indicate...
Definition: AMDGPUISelLowering.cpp:918

llvm::AMDGPUTargetLowering::shouldCastAtomicStoreInIR
AtomicExpansionKind shouldCastAtomicStoreInIR(StoreInst *SI) const override
Returns how the given (atomic) store should be cast by the IR-level AtomicExpand pass.
Definition: AMDGPUISelLowering.h:241

llvm::AMDGPUTargetLowering::split64BitValue
std::pair< SDValue, SDValue > split64BitValue(SDValue Op, SelectionDAG &DAG) const
Return 64-bit value Op as two 32-bit integers.
Definition: AMDGPUISelLowering.cpp:1760

llvm::AMDGPUTargetLowering::performMulCombine
SDValue performMulCombine(SDNode *N, DAGCombinerInfo &DCI) const
Definition: AMDGPUISelLowering.cpp:4504

llvm::AMDGPUTargetLowering::getRecipEstimate
SDValue getRecipEstimate(SDValue Operand, SelectionDAG &DAG, int Enabled, int &RefinementSteps) const override
Return a reciprocal estimate value for the input operand.
Definition: AMDGPUISelLowering.cpp:5838

llvm::AMDGPUTargetLowering::CreateLiveInRegister
SDValue CreateLiveInRegister(SelectionDAG &DAG, const TargetRegisterClass *RC, Register Reg, EVT VT) const
Definition: AMDGPUISelLowering.h:349

llvm::AMDGPUTargetLowering::hasMultipleConditionRegisters
bool hasMultipleConditionRegisters(EVT VT) const override
Does the target have multiple (allocatable) condition registers that can be used to store the results...
Definition: AMDGPUISelLowering.h:398

llvm::AMDGPUTargetLowering::LowerFNEARBYINT
SDValue LowerFNEARBYINT(SDValue Op, SelectionDAG &DAG) const
Definition: AMDGPUISelLowering.cpp:2555

llvm::AMDGPUTargetLowering::getTargetNodeName
const char * getTargetNodeName(unsigned Opcode) const override
This method returns the name of a target specific DAG node.
Definition: AMDGPUISelLowering.cpp:5660

llvm::AMDGPUTargetLowering::LowerSIGN_EXTEND_INREG
SDValue LowerSIGN_EXTEND_INREG(SDValue Op, SelectionDAG &DAG) const
Definition: AMDGPUISelLowering.cpp:3744

llvm::AMDGPUTargetLowering::CCAssignFnForReturn
static CCAssignFn * CCAssignFnForReturn(CallingConv::ID CC, bool IsVarArg)
Definition: AMDGPUISelLowering.cpp:1338

llvm::AMDGPUTargetLowering::getScaledLogInput
std::pair< SDValue, SDValue > getScaledLogInput(SelectionDAG &DAG, const SDLoc SL, SDValue Op, SDNodeFlags Flags) const
If denormal handling is required return the scaled input to FLOG2, and the check for denormal range.
Definition: AMDGPUISelLowering.cpp:2700

llvm::AMDGPUTargetLowering::CCAssignFnForCall
static CCAssignFn * CCAssignFnForCall(CallingConv::ID CC, bool IsVarArg)
Selects the correct CCAssignFn for a given CallingConvention value.
Definition: AMDGPUISelLowering.cpp:1333

llvm::AMDGPUTargetLowering::allUsesHaveSourceMods
static bool allUsesHaveSourceMods(const SDNode *N, unsigned CostThreshold=4)
Definition: AMDGPUISelLowering.cpp:762

llvm::AMDGPUTargetLowering::LowerFROUNDEVEN
SDValue LowerFROUNDEVEN(SDValue Op, SelectionDAG &DAG) const
Definition: AMDGPUISelLowering.cpp:2527

llvm::AMDGPUTargetLowering::isFPImmLegal
bool isFPImmLegal(const APFloat &Imm, EVT VT, bool ForCodeSize) const override
Returns true if the target can instruction select the specified FP immediate natively.
Definition: AMDGPUISelLowering.cpp:809

llvm::AMDGPUTargetLowering::numBitsUnsigned
static unsigned numBitsUnsigned(SDValue Op, SelectionDAG &DAG)
Definition: AMDGPUISelLowering.cpp:51

llvm::AMDGPUTargetLowering::lowerFEXPUnsafe
SDValue lowerFEXPUnsafe(SDValue Op, const SDLoc &SL, SelectionDAG &DAG, SDNodeFlags Flags) const
Definition: AMDGPUISelLowering.cpp:2956

llvm::AMDGPUTargetLowering::LowerFTRUNC
SDValue LowerFTRUNC(SDValue Op, SelectionDAG &DAG) const
Definition: AMDGPUISelLowering.cpp:2481

llvm::AMDGPUTargetLowering::LowerDYNAMIC_STACKALLOC
SDValue LowerDYNAMIC_STACKALLOC(SDValue Op, SelectionDAG &DAG) const
Definition: AMDGPUISelLowering.cpp:1408

llvm::AMDGPUTargetLowering::allowApproxFunc
static bool allowApproxFunc(const SelectionDAG &DAG, SDNodeFlags Flags)
Definition: AMDGPUISelLowering.cpp:2651

llvm::AMDGPUTargetLowering::ShouldShrinkFPConstant
bool ShouldShrinkFPConstant(EVT VT) const override
If true, then instruction selection should seek to shrink the FP constant of the specified type to a ...
Definition: AMDGPUISelLowering.cpp:817

llvm::AMDGPUTargetLowering::LowerReturn
SDValue LowerReturn(SDValue Chain, CallingConv::ID CallConv, bool isVarArg, const SmallVectorImpl< ISD::OutputArg > &Outs, const SmallVectorImpl< SDValue > &OutVals, const SDLoc &DL, SelectionDAG &DAG) const override
This hook must be implemented to lower outgoing return values, described by the Outs array,...
Definition: AMDGPUISelLowering.cpp:1316

llvm::AMDGPUTargetLowering::performStoreCombine
SDValue performStoreCombine(SDNode *N, DAGCombinerInfo &DCI) const
Definition: AMDGPUISelLowering.cpp:3934

llvm::AMDGPUTargetLowering::ReplaceNodeResults
void ReplaceNodeResults(SDNode *N, SmallVectorImpl< SDValue > &Results, SelectionDAG &DAG) const override
This callback is invoked when a node result type is illegal for the target, and the operation was reg...
Definition: AMDGPUISelLowering.cpp:1466

llvm::AMDGPUTargetLowering::performRcpCombine
SDValue performRcpCombine(SDNode *N, DAGCombinerInfo &DCI) const
Definition: AMDGPUISelLowering.cpp:5283

llvm::AMDGPUTargetLowering::getLoHalf64
SDValue getLoHalf64(SDValue Op, SelectionDAG &DAG) const
Definition: AMDGPUISelLowering.cpp:1774

llvm::AMDGPUTargetLowering::lowerCTLZResults
SDValue lowerCTLZResults(SDValue Op, SelectionDAG &DAG) const
Definition: AMDGPUISelLowering.cpp:3190

llvm::AMDGPUTargetLowering::performFAbsCombine
SDValue performFAbsCombine(SDNode *N, DAGCombinerInfo &DCI) const
Definition: AMDGPUISelLowering.cpp:5258

llvm::AMDGPUTargetLowering::LowerFP_TO_INT64
SDValue LowerFP_TO_INT64(SDValue Op, SelectionDAG &DAG, bool Signed) const
Definition: AMDGPUISelLowering.cpp:3520

llvm::AMDGPUTargetLowering::shouldFoldFNegIntoSrc
static bool shouldFoldFNegIntoSrc(SDNode *FNeg, SDValue FNegSrc)
Definition: AMDGPUISelLowering.cpp:4975

llvm::AMDGPUTargetLowering::isNarrowingProfitable
bool isNarrowingProfitable(SDNode *N, EVT SrcVT, EVT DestVT) const override
Return true if it's profitable to narrow operations of type SrcVT to DestVT.
Definition: AMDGPUISelLowering.cpp:1029

llvm::AMDGPUTargetLowering::LowerFRINT
SDValue LowerFRINT(SDValue Op, SelectionDAG &DAG) const
Definition: AMDGPUISelLowering.cpp:2564

llvm::AMDGPUTargetLowering::performIntrinsicWOChainCombine
SDValue performIntrinsicWOChainCombine(SDNode *N, DAGCombinerInfo &DCI) const
Definition: AMDGPUISelLowering.cpp:4014

llvm::AMDGPUTargetLowering::LowerUDIVREM
SDValue LowerUDIVREM(SDValue Op, SelectionDAG &DAG) const
Definition: AMDGPUISelLowering.cpp:2311

llvm::AMDGPUTargetLowering::performMulLoHiCombine
SDValue performMulLoHiCombine(SDNode *N, DAGCombinerInfo &DCI) const
Definition: AMDGPUISelLowering.cpp:4589

llvm::AMDGPUTargetLowering::shouldCastAtomicRMWIInIR
AtomicExpansionKind shouldCastAtomicRMWIInIR(AtomicRMWInst *) const override
Returns how the given atomicrmw should be cast by the IR-level AtomicExpand pass.
Definition: AMDGPUISelLowering.h:245

llvm::AMDGPUTargetLowering::PerformDAGCombine
SDValue PerformDAGCombine(SDNode *N, DAGCombinerInfo &DCI) const override
This method will be invoked for all target nodes and for any target-independent nodes that the target...
Definition: AMDGPUISelLowering.cpp:5295

llvm::AMDGPUTargetLowering::LowerUDIVREM64
void LowerUDIVREM64(SDValue Op, SelectionDAG &DAG, SmallVectorImpl< SDValue > &Results) const
Definition: AMDGPUISelLowering.cpp:2097

llvm::AMDGPUTargetLowering::WidenOrSplitVectorLoad
SDValue WidenOrSplitVectorLoad(SDValue Op, SelectionDAG &DAG) const
Widen a suitably aligned v3 load.
Definition: AMDGPUISelLowering.cpp:1904

llvm::AMDGPUTargetLowering::mergeStoresAfterLegalization
bool mergeStoresAfterLegalization(EVT) const override
Allow store merging for the specified type after legalization in addition to before legalization.
Definition: AMDGPUISelLowering.h:293

llvm::AMDGPUTargetLowering::getSplitDestVTs
std::pair< EVT, EVT > getSplitDestVTs(const EVT &VT, SelectionDAG &DAG) const
Split a vector type into two parts.
Definition: AMDGPUISelLowering.cpp:1794

llvm::AMDGPUTargetLowering::getHiHalf64
SDValue getHiHalf64(SDValue Op, SelectionDAG &DAG) const
Definition: AMDGPUISelLowering.cpp:1782

llvm::AMDGPUTargetLowering::isFsqrtCheap
bool isFsqrtCheap(SDValue Operand, SelectionDAG &DAG) const override
Return true if SQRT(X) shouldn't be replaced with X*RSQRT(X).
Definition: AMDGPUISelLowering.h:295

llvm::AMDGPUTargetLowering::combineFMinMaxLegacyImpl
SDValue combineFMinMaxLegacyImpl(const SDLoc &DL, EVT VT, SDValue LHS, SDValue RHS, SDValue True, SDValue False, SDValue CC, DAGCombinerInfo &DCI) const
Definition: AMDGPUISelLowering.cpp:1652

llvm::AMDGPUTargetLowering::getVectorIdxWidth
unsigned getVectorIdxWidth(const DataLayout &) const override
Returns the type to be used for the index operand of vector operations.
Definition: AMDGPUISelLowering.cpp:799

llvm::APFloat
Definition: APFloat.h:900

llvm::APInt
Class for arbitrary precision integers.
Definition: APInt.h:78

llvm::AtomicRMWInst
an instruction that atomically reads a memory location, combines it with another value,...
Definition: Instructions.h:709

llvm::CCState
CCState - This class holds information needed while lowering arguments and return values.
Definition: CallingConvLower.h:171

llvm::ConstantFPSDNode
Definition: SelectionDAGNodes.h:1795

llvm::DWARFExpression::Operation
This class represents an Operation in the Expression.
Definition: DWARFExpression.h:33

llvm::DataLayout
A parsed version of the target data layout string and methods for querying it.
Definition: DataLayout.h:63

llvm::GISelValueTracking
Definition: GISelValueTracking.h:34

llvm::InstructionCost
Definition: InstructionCost.h:30

llvm::LLVMContext
This is an important class for using LLVM in a threaded context.
Definition: LLVMContext.h:68

llvm::LoadInst
An instruction for reading from memory.
Definition: Instructions.h:180

llvm::MVT
Machine Value Type.
Definition: MachineValueType.h:36

llvm::MachineFrameInfo
The MachineFrameInfo class represents an abstract stack frame until prolog/epilog code is inserted.
Definition: MachineFrameInfo.h:108

llvm::MachineFunction
Definition: MachineFunction.h:286

llvm::MachineMemOperand
A description of a memory reference used in the backend.
Definition: MachineMemOperand.h:130

llvm::MachineRegisterInfo
MachineRegisterInfo - Keep track of information for virtual and physical registers,...
Definition: MachineRegisterInfo.h:53

llvm::MachineSDNode
An SDNode that represents everything that will be needed to construct a MachineInstr.
Definition: SelectionDAGNodes.h:3143

llvm::Register
Wrapper class representing virtual and physical registers.
Definition: Register.h:19

llvm::SDLoc
Wrapper class for IR location info (IR ordering and DebugLoc) to be passed into SDNode creation funct...
Definition: SelectionDAGNodes.h:1225

llvm::SDNode
Represents one node in the SelectionDAG.
Definition: SelectionDAGNodes.h:501

llvm::SDValue
Unlike LLVM values, Selection DAG nodes may return multiple values as the result of a computation.
Definition: SelectionDAGNodes.h:147

llvm::SDValue::getOperand
const SDValue & getOperand(unsigned i) const
Definition: SelectionDAGNodes.h:1268

llvm::SDValue::getOpcode
unsigned getOpcode() const
Definition: SelectionDAGNodes.h:1256

llvm::SelectionDAG
This is used to represent a portion of an LLVM function in a low-level Data Dependence DAG representa...
Definition: SelectionDAG.h:229

llvm::SelectionDAG::getEntryNode
SDValue getEntryNode() const
Return the token chain corresponding to the entry of the function.
Definition: SelectionDAG.h:581

llvm::SmallVectorImpl
This class consists of common code factored out of the SmallVector class to reduce code duplication b...
Definition: SmallVector.h:574

llvm::StoreInst
An instruction for storing to memory.
Definition: Instructions.h:296

llvm::StringRef
StringRef - Represent a constant reference to a string, i.e.
Definition: StringRef.h:55

llvm::TargetLoweringBase::Enabled
@ Enabled
Definition: TargetLowering.h:603

llvm::TargetLoweringBase::SelectSupportKind
SelectSupportKind
Enum that describes what type of support for selects the target has.
Definition: TargetLowering.h:244

llvm::TargetLoweringBase::AtomicExpansionKind
AtomicExpansionKind
Enum that specifies what an atomic load/AtomicRMWInst is expanded to, if at all.
Definition: TargetLowering.h:256

llvm::TargetLoweringBase::AtomicExpansionKind::None
@ None

llvm::TargetLoweringBase::NegatibleCost
NegatibleCost
Enum that specifies when a float negation is beneficial.
Definition: TargetLowering.h:286

llvm::TargetLowering
This class defines information used to lower LLVM code to legal SelectionDAG operators that the targe...
Definition: TargetLowering.h:3937

llvm::TargetMachine
Primary interface to the complete machine description for the target machine.
Definition: TargetMachine.h:83

llvm::TargetRegisterClass
Definition: TargetRegisterInfo.h:45

llvm::Type
The instances of the Type class are immutable: once they are created, they are never changed.
Definition: Type.h:45

uint32_t

uint64_t

unsigned

llvm::AMDGPUISD::NodeType
NodeType
Definition: AMDGPUISelLowering.h:411

llvm::AMDGPUISD::ELSE
@ ELSE
Definition: AMDGPUISelLowering.h:427

llvm::AMDGPUISD::BUFFER_STORE
@ BUFFER_STORE
Definition: AMDGPUISelLowering.h:603

llvm::AMDGPUISD::REGISTER_STORE
@ REGISTER_STORE
Definition: AMDGPUISelLowering.h:532

llvm::AMDGPUISD::MUL_I24
@ MUL_I24
Definition: AMDGPUISelLowering.h:520

llvm::AMDGPUISD::CVT_PKRTZ_F16_F32
@ CVT_PKRTZ_F16_F32
Definition: AMDGPUISelLowering.h:542

llvm::AMDGPUISD::DIV_SCALE
@ DIV_SCALE
Definition: AMDGPUISelLowering.h:486

llvm::AMDGPUISD::BUFFER_ATOMIC_COND_SUB_U32
@ BUFFER_ATOMIC_COND_SUB_U32
Definition: AMDGPUISelLowering.h:625

llvm::AMDGPUISD::TEXTURE_FETCH
@ TEXTURE_FETCH
Definition: AMDGPUISelLowering.h:528

llvm::AMDGPUISD::PC_ADD_REL_OFFSET64
@ PC_ADD_REL_OFFSET64
Definition: AMDGPUISelLowering.h:564

llvm::AMDGPUISD::TBUFFER_LOAD_FORMAT_D16
@ TBUFFER_LOAD_FORMAT_D16
Definition: AMDGPUISelLowering.h:581

llvm::AMDGPUISD::LOG
@ LOG
Definition: AMDGPUISelLowering.h:501

llvm::AMDGPUISD::FFBL_B32
@ FFBL_B32
Definition: AMDGPUISelLowering.h:518

llvm::AMDGPUISD::UMAX3
@ UMAX3
Definition: AMDGPUISelLowering.h:475

llvm::AMDGPUISD::BUILD_VERTICAL_VECTOR
@ BUILD_VERTICAL_VECTOR
This node is for VLIW targets and it is used to represent a vector that is stored in consecutive regi...
Definition: AMDGPUISelLowering.h:560

llvm::AMDGPUISD::URECIP
@ URECIP
Definition: AMDGPUISelLowering.h:485

llvm::AMDGPUISD::FFBH_I32
@ FFBH_I32
Definition: AMDGPUISelLowering.h:517

llvm::AMDGPUISD::MULHI_U24
@ MULHI_U24
Definition: AMDGPUISelLowering.h:521

llvm::AMDGPUISD::CONST_ADDRESS
@ CONST_ADDRESS
Definition: AMDGPUISelLowering.h:530

llvm::AMDGPUISD::TC_RETURN_CHAIN
@ TC_RETURN_CHAIN
Definition: AMDGPUISelLowering.h:421

llvm::AMDGPUISD::BUFFER_LOAD_FORMAT_D16
@ BUFFER_LOAD_FORMAT_D16
Definition: AMDGPUISelLowering.h:596

llvm::AMDGPUISD::LDS
@ LDS
Definition: AMDGPUISelLowering.h:565

llvm::AMDGPUISD::FMUL_LEGACY
@ FMUL_LEGACY
Definition: AMDGPUISelLowering.h:506

llvm::AMDGPUISD::REGISTER_LOAD
@ REGISTER_LOAD
Definition: AMDGPUISelLowering.h:531

llvm::AMDGPUISD::CARRY
@ CARRY
Definition: AMDGPUISelLowering.h:510

llvm::AMDGPUISD::MAD_U24
@ MAD_U24
Definition: AMDGPUISelLowering.h:523

llvm::AMDGPUISD::SBUFFER_LOAD_UBYTE
@ SBUFFER_LOAD_UBYTE
Definition: AMDGPUISelLowering.h:599

llvm::AMDGPUISD::FMAXIMUM3
@ FMAXIMUM3
Definition: AMDGPUISelLowering.h:482

llvm::AMDGPUISD::BRANCH_COND
@ BRANCH_COND
Definition: AMDGPUISelLowering.h:414

llvm::AMDGPUISD::SBUFFER_LOAD_USHORT
@ SBUFFER_LOAD_USHORT
Definition: AMDGPUISelLowering.h:601

llvm::AMDGPUISD::BUFFER_LOAD
@ BUFFER_LOAD
Definition: AMDGPUISelLowering.h:584

llvm::AMDGPUISD::BUFFER_LOAD_FORMAT
@ BUFFER_LOAD_FORMAT
Definition: AMDGPUISelLowering.h:594

llvm::AMDGPUISD::CVT_PKNORM_I16_F32
@ CVT_PKNORM_I16_F32
Definition: AMDGPUISelLowering.h:543

llvm::AMDGPUISD::TBUFFER_STORE_FORMAT_D16
@ TBUFFER_STORE_FORMAT_D16
Definition: AMDGPUISelLowering.h:579

llvm::AMDGPUISD::BUFFER_ATOMIC_SMAX
@ BUFFER_ATOMIC_SMAX
Definition: AMDGPUISelLowering.h:613

llvm::AMDGPUISD::RSQ_CLAMP
@ RSQ_CLAMP
Definition: AMDGPUISelLowering.h:507

llvm::AMDGPUISD::DIV_FMAS
@ DIV_FMAS
Definition: AMDGPUISelLowering.h:487

llvm::AMDGPUISD::UMED3
@ UMED3
Definition: AMDGPUISelLowering.h:481

llvm::AMDGPUISD::BUFFER_LOAD_UBYTE_TFE
@ BUFFER_LOAD_UBYTE_TFE
Definition: AMDGPUISelLowering.h:590

llvm::AMDGPUISD::FFBH_U32
@ FFBH_U32
Definition: AMDGPUISelLowering.h:516

llvm::AMDGPUISD::RCP
@ RCP
Definition: AMDGPUISelLowering.h:495

llvm::AMDGPUISD::SETCC
@ SETCC
Definition: AMDGPUISelLowering.h:458

llvm::AMDGPUISD::RET_GLUE
@ RET_GLUE
Definition: AMDGPUISelLowering.h:443

llvm::AMDGPUISD::COS_HW
@ COS_HW
Definition: AMDGPUISelLowering.h:468

llvm::AMDGPUISD::FMAD_FTZ
@ FMAD_FTZ
Definition: AMDGPUISelLowering.h:491

llvm::AMDGPUISD::BUFFER_ATOMIC_UMIN
@ BUFFER_ATOMIC_UMIN
Definition: AMDGPUISelLowering.h:612

llvm::AMDGPUISD::RCP_IFLAG
@ RCP_IFLAG
Definition: AMDGPUISelLowering.h:498

llvm::AMDGPUISD::SIMULATED_TRAP
@ SIMULATED_TRAP
Definition: AMDGPUISelLowering.h:437

llvm::AMDGPUISD::DOT4
@ DOT4
Definition: AMDGPUISelLowering.h:509

llvm::AMDGPUISD::BUFFER_ATOMIC_OR
@ BUFFER_ATOMIC_OR
Definition: AMDGPUISelLowering.h:616

llvm::AMDGPUISD::BUFFER_LOAD_UBYTE
@ BUFFER_LOAD_UBYTE
Definition: AMDGPUISelLowering.h:585

llvm::AMDGPUISD::BUFFER_ATOMIC_FMIN
@ BUFFER_ATOMIC_FMIN
Definition: AMDGPUISelLowering.h:623

llvm::AMDGPUISD::BUFFER_LOAD_SHORT
@ BUFFER_LOAD_SHORT
Definition: AMDGPUISelLowering.h:588

llvm::AMDGPUISD::PERM
@ PERM
Definition: AMDGPUISelLowering.h:527

llvm::AMDGPUISD::DIV_FIXUP
@ DIV_FIXUP
Definition: AMDGPUISelLowering.h:488

llvm::AMDGPUISD::LOOP
@ LOOP
Definition: AMDGPUISelLowering.h:428

llvm::AMDGPUISD::DWORDADDR
@ DWORDADDR
Definition: AMDGPUISelLowering.h:449

llvm::AMDGPUISD::CVT_PK_U16_U32
@ CVT_PK_U16_U32
Definition: AMDGPUISelLowering.h:546

llvm::AMDGPUISD::LOAD_D16_LO_I8
@ LOAD_D16_LO_I8
Definition: AMDGPUISelLowering.h:574

llvm::AMDGPUISD::BUFFER_ATOMIC_SUB
@ BUFFER_ATOMIC_SUB
Definition: AMDGPUISelLowering.h:610

llvm::AMDGPUISD::BUFFER_STORE_SHORT
@ BUFFER_STORE_SHORT
Definition: AMDGPUISelLowering.h:605

llvm::AMDGPUISD::BUFFER_ATOMIC_CMPSWAP
@ BUFFER_ATOMIC_CMPSWAP
Definition: AMDGPUISelLowering.h:620

llvm::AMDGPUISD::BUFFER_STORE_BYTE
@ BUFFER_STORE_BYTE
Definition: AMDGPUISelLowering.h:604

llvm::AMDGPUISD::BUFFER_LOAD_SHORT_TFE
@ BUFFER_LOAD_SHORT_TFE
Definition: AMDGPUISelLowering.h:593

llvm::AMDGPUISD::RSQ
@ RSQ
Definition: AMDGPUISelLowering.h:496

llvm::AMDGPUISD::WHOLE_WAVE_RETURN
@ WHOLE_WAVE_RETURN
Definition: AMDGPUISelLowering.h:632

llvm::AMDGPUISD::FMA_W_CHAIN
@ FMA_W_CHAIN
Definition: AMDGPUISelLowering.h:463

llvm::AMDGPUISD::BUFFER_ATOMIC_FMAX
@ BUFFER_ATOMIC_FMAX
Definition: AMDGPUISelLowering.h:624

llvm::AMDGPUISD::CALL
@ CALL
Definition: AMDGPUISelLowering.h:418

llvm::AMDGPUISD::FMAX_LEGACY
@ FMAX_LEGACY
Definition: AMDGPUISelLowering.h:470

llvm::AMDGPUISD::MAD_U64_U32
@ MAD_U64_U32
Definition: AMDGPUISelLowering.h:525

llvm::AMDGPUISD::LOAD_D16_HI_U8
@ LOAD_D16_HI_U8
Definition: AMDGPUISelLowering.h:573

llvm::AMDGPUISD::FRACT
@ FRACT
Definition: AMDGPUISelLowering.h:450

llvm::AMDGPUISD::TBUFFER_STORE_FORMAT
@ TBUFFER_STORE_FORMAT
Definition: AMDGPUISelLowering.h:578

llvm::AMDGPUISD::PC_ADD_REL_OFFSET
@ PC_ADD_REL_OFFSET
Definition: AMDGPUISelLowering.h:563

llvm::AMDGPUISD::BUFFER_STORE_FORMAT
@ BUFFER_STORE_FORMAT
Definition: AMDGPUISelLowering.h:606

llvm::AMDGPUISD::CONST_DATA_PTR
@ CONST_DATA_PTR
Pointer to the start of the shader's constant data.
Definition: AMDGPUISelLowering.h:562

llvm::AMDGPUISD::EXP
@ EXP
Definition: AMDGPUISelLowering.h:504

llvm::AMDGPUISD::TRAP
@ TRAP
Definition: AMDGPUISelLowering.h:423

llvm::AMDGPUISD::SBUFFER_PREFETCH_DATA
@ SBUFFER_PREFETCH_DATA
Definition: AMDGPUISelLowering.h:602

llvm::AMDGPUISD::CVT_F32_UBYTE1
@ CVT_F32_UBYTE1
Definition: AMDGPUISelLowering.h:536

llvm::AMDGPUISD::LOAD_D16_HI_I8
@ LOAD_D16_HI_I8
Definition: AMDGPUISelLowering.h:572

llvm::AMDGPUISD::FIRST_NUMBER
@ FIRST_NUMBER
Definition: AMDGPUISelLowering.h:413

llvm::AMDGPUISD::FP_CLASS
@ FP_CLASS
Definition: AMDGPUISelLowering.h:508

llvm::AMDGPUISD::FDOT2
@ FDOT2
Definition: AMDGPUISelLowering.h:484

llvm::AMDGPUISD::CVT_PK_I16_I32
@ CVT_PK_I16_I32
Definition: AMDGPUISelLowering.h:545

llvm::AMDGPUISD::BUFFER_LOAD_FORMAT_TFE
@ BUFFER_LOAD_FORMAT_TFE
Definition: AMDGPUISelLowering.h:595

llvm::AMDGPUISD::TC_RETURN
@ TC_RETURN
Definition: AMDGPUISelLowering.h:419

llvm::AMDGPUISD::LAST_MEMORY_OPCODE
@ LAST_MEMORY_OPCODE
Definition: AMDGPUISelLowering.h:626

llvm::AMDGPUISD::FMED3
@ FMED3
Definition: AMDGPUISelLowering.h:479

llvm::AMDGPUISD::SBUFFER_LOAD_BYTE
@ SBUFFER_LOAD_BYTE
Definition: AMDGPUISelLowering.h:598

llvm::AMDGPUISD::BUFFER_ATOMIC_XOR
@ BUFFER_ATOMIC_XOR
Definition: AMDGPUISelLowering.h:617

llvm::AMDGPUISD::FMIN3
@ FMIN3
Definition: AMDGPUISelLowering.h:476

llvm::AMDGPUISD::BFE_I32
@ BFE_I32
Definition: AMDGPUISelLowering.h:513

llvm::AMDGPUISD::LOAD_D16_LO
@ LOAD_D16_LO
Definition: AMDGPUISelLowering.h:571

llvm::AMDGPUISD::ENDPGM
@ ENDPGM
Definition: AMDGPUISelLowering.h:431

llvm::AMDGPUISD::BUFFER_ATOMIC_SWAP
@ BUFFER_ATOMIC_SWAP
Definition: AMDGPUISelLowering.h:608

llvm::AMDGPUISD::BFM
@ BFM
Definition: AMDGPUISelLowering.h:515

llvm::AMDGPUISD::STORE_MSKOR
@ STORE_MSKOR
Definition: AMDGPUISelLowering.h:577

llvm::AMDGPUISD::BUFFER_ATOMIC_FADD
@ BUFFER_ATOMIC_FADD
Definition: AMDGPUISelLowering.h:622

llvm::AMDGPUISD::FP_TO_FP16
@ FP_TO_FP16
Definition: AMDGPUISelLowering.h:550

llvm::AMDGPUISD::BUFFER_STORE_FORMAT_D16
@ BUFFER_STORE_FORMAT_D16
Definition: AMDGPUISelLowering.h:607

llvm::AMDGPUISD::FMUL_W_CHAIN
@ FMUL_W_CHAIN
Definition: AMDGPUISelLowering.h:464

llvm::AMDGPUISD::SMED3
@ SMED3
Definition: AMDGPUISelLowering.h:480

llvm::AMDGPUISD::LOAD_D16_HI
@ LOAD_D16_HI
Definition: AMDGPUISelLowering.h:570

llvm::AMDGPUISD::BUFFER_ATOMIC_DEC
@ BUFFER_ATOMIC_DEC
Definition: AMDGPUISelLowering.h:619

llvm::AMDGPUISD::DENORM_MODE
@ DENORM_MODE
Definition: AMDGPUISelLowering.h:460

llvm::AMDGPUISD::TC_RETURN_CHAIN_DVGPR
@ TC_RETURN_CHAIN_DVGPR
Definition: AMDGPUISelLowering.h:422

llvm::AMDGPUISD::BUFFER_ATOMIC_AND
@ BUFFER_ATOMIC_AND
Definition: AMDGPUISelLowering.h:615

llvm::AMDGPUISD::ATOMIC_CMP_SWAP
@ ATOMIC_CMP_SWAP
Definition: AMDGPUISelLowering.h:583

llvm::AMDGPUISD::CVT_F32_UBYTE2
@ CVT_F32_UBYTE2
Definition: AMDGPUISelLowering.h:537

llvm::AMDGPUISD::FMIN_LEGACY
@ FMIN_LEGACY
Definition: AMDGPUISelLowering.h:471

llvm::AMDGPUISD::RETURN_TO_EPILOG
@ RETURN_TO_EPILOG
Definition: AMDGPUISelLowering.h:440

llvm::AMDGPUISD::BUFFER_LOAD_BYTE_TFE
@ BUFFER_LOAD_BYTE_TFE
Definition: AMDGPUISelLowering.h:592

llvm::AMDGPUISD::BUFFER_ATOMIC_CSUB
@ BUFFER_ATOMIC_CSUB
Definition: AMDGPUISelLowering.h:621

llvm::AMDGPUISD::UMIN3
@ UMIN3
Definition: AMDGPUISelLowering.h:478

llvm::AMDGPUISD::DS_ORDERED_COUNT
@ DS_ORDERED_COUNT
Definition: AMDGPUISelLowering.h:582

llvm::AMDGPUISD::BUFFER_ATOMIC_UMAX
@ BUFFER_ATOMIC_UMAX
Definition: AMDGPUISelLowering.h:614

llvm::AMDGPUISD::BUFFER_LOAD_TFE
@ BUFFER_LOAD_TFE
Definition: AMDGPUISelLowering.h:589

llvm::AMDGPUISD::LOAD_D16_LO_U8
@ LOAD_D16_LO_U8
Definition: AMDGPUISelLowering.h:575

llvm::AMDGPUISD::WHOLE_WAVE_SETUP
@ WHOLE_WAVE_SETUP
Definition: AMDGPUISelLowering.h:629

llvm::AMDGPUISD::IF
@ IF
Definition: AMDGPUISelLowering.h:426

llvm::AMDGPUISD::FIRST_MEMORY_OPCODE
@ FIRST_MEMORY_OPCODE
Definition: AMDGPUISelLowering.h:569

llvm::AMDGPUISD::BUFFER_ATOMIC_INC
@ BUFFER_ATOMIC_INC
Definition: AMDGPUISelLowering.h:618

llvm::AMDGPUISD::DUMMY_CHAIN
@ DUMMY_CHAIN
Definition: AMDGPUISelLowering.h:567

llvm::AMDGPUISD::SBUFFER_LOAD
@ SBUFFER_LOAD
Definition: AMDGPUISelLowering.h:597

llvm::AMDGPUISD::BFE_U32
@ BFE_U32
Definition: AMDGPUISelLowering.h:512

llvm::AMDGPUISD::MUL_U24
@ MUL_U24
Definition: AMDGPUISelLowering.h:519

llvm::AMDGPUISD::MULHI_I24
@ MULHI_I24
Definition: AMDGPUISelLowering.h:522

llvm::AMDGPUISD::SBUFFER_LOAD_SHORT
@ SBUFFER_LOAD_SHORT
Definition: AMDGPUISelLowering.h:600

llvm::AMDGPUISD::SIN_HW
@ SIN_HW
Definition: AMDGPUISelLowering.h:469

llvm::AMDGPUISD::CVT_F32_UBYTE3
@ CVT_F32_UBYTE3
Definition: AMDGPUISelLowering.h:538

llvm::AMDGPUISD::MAD_I24
@ MAD_I24
Definition: AMDGPUISelLowering.h:524

llvm::AMDGPUISD::CVT_F32_UBYTE0
@ CVT_F32_UBYTE0
Definition: AMDGPUISelLowering.h:535

llvm::AMDGPUISD::BUFFER_LOAD_USHORT
@ BUFFER_LOAD_USHORT
Definition: AMDGPUISelLowering.h:586

llvm::AMDGPUISD::MAD_I64_I32
@ MAD_I64_I32
Definition: AMDGPUISelLowering.h:526

llvm::AMDGPUISD::BORROW
@ BORROW
Definition: AMDGPUISelLowering.h:511

llvm::AMDGPUISD::BUFFER_ATOMIC_ADD
@ BUFFER_ATOMIC_ADD
Definition: AMDGPUISelLowering.h:609

llvm::AMDGPUISD::SMIN3
@ SMIN3
Definition: AMDGPUISelLowering.h:477

llvm::AMDGPUISD::FMAX3
@ FMAX3
Definition: AMDGPUISelLowering.h:473

llvm::AMDGPUISD::TBUFFER_LOAD_FORMAT
@ TBUFFER_LOAD_FORMAT
Definition: AMDGPUISelLowering.h:580

llvm::AMDGPUISD::BUFFER_ATOMIC_SMIN
@ BUFFER_ATOMIC_SMIN
Definition: AMDGPUISelLowering.h:611

llvm::AMDGPUISD::R600_EXPORT
@ R600_EXPORT
Definition: AMDGPUISelLowering.h:529

llvm::AMDGPUISD::BUFFER_LOAD_USHORT_TFE
@ BUFFER_LOAD_USHORT_TFE
Definition: AMDGPUISelLowering.h:591

llvm::AMDGPUISD::ENDPGM_TRAP
@ ENDPGM_TRAP
Definition: AMDGPUISelLowering.h:434

llvm::AMDGPUISD::RCP_LEGACY
@ RCP_LEGACY
Definition: AMDGPUISelLowering.h:497

llvm::AMDGPUISD::TC_RETURN_GFX
@ TC_RETURN_GFX
Definition: AMDGPUISelLowering.h:420

llvm::AMDGPUISD::CVT_PKNORM_U16_F32
@ CVT_PKNORM_U16_F32
Definition: AMDGPUISelLowering.h:544

llvm::AMDGPUISD::SMAX3
@ SMAX3
Definition: AMDGPUISelLowering.h:474

llvm::AMDGPUISD::BUFFER_LOAD_BYTE
@ BUFFER_LOAD_BYTE
Definition: AMDGPUISelLowering.h:587

llvm::AMDGPUISD::FMINIMUM3
@ FMINIMUM3
Definition: AMDGPUISelLowering.h:483

llvm::AMDGPUISD::BFI
@ BFI
Definition: AMDGPUISelLowering.h:514

llvm::AMDGPUISD::WAVE_ADDRESS
@ WAVE_ADDRESS
Definition: AMDGPUISelLowering.h:447

llvm::AMDGPUISD::CLAMP
@ CLAMP
CLAMP value between 0.0 and 1.0.
Definition: AMDGPUISelLowering.h:454

llvm::CallingConv::C
@ C
The default llvm calling convention, compatible with C.
Definition: CallingConv.h:34

llvm::ISD::NodeType
NodeType
ISD::NodeType enum - This enum defines the target-independent operators for a SelectionDAG.
Definition: ISDOpcodes.h:41

llvm::ISD::BITCAST
@ BITCAST
BITCAST - This operator converts between integer, vector and FP values, as if the value was stored to...
Definition: ISDOpcodes.h:975

llvm::ISD::BUILTIN_OP_END
@ BUILTIN_OP_END
BUILTIN_OP_END - This must be the last enum value in this list.
Definition: ISDOpcodes.h:1568

llvm::ISD::LoadExtType
LoadExtType
LoadExtType enum - This enum defines the three variants of LOADEXT (load with extension).
Definition: ISDOpcodes.h:1665

llvm
This is an optimization pass for GlobalISel generic memory operations.
Definition: AddressRanges.h:18

llvm::Offset
@ Offset
Definition: DWP.cpp:477

llvm::Depth
@ Depth
Definition: SIMachineScheduler.h:36

llvm::CCAssignFn
bool CCAssignFn(unsigned ValNo, MVT ValVT, MVT LocVT, CCValAssign::LocInfo LocInfo, ISD::ArgFlagsTy ArgFlags, Type *OrigTy, CCState &State)
CCAssignFn - This function assigns a location for Val, updating State to reflect the change.
Definition: CallingConvLower.h:157

llvm::CombineLevel
CombineLevel
Definition: DAGCombine.h:15

llvm::LEB128Sign::Signed
@ Signed

llvm::CostThreshold
static cl::opt< int > CostThreshold("sbvec-cost-threshold", cl::init(0), cl::Hidden, cl::desc("Vectorization cost threshold."))

N
#define N

llvm::ArgDescriptor
Definition: AMDGPUArgumentUsageInfo.h:25

llvm::EVT
Extended Value Type.
Definition: ValueTypes.h:35

llvm::KnownBits
Definition: KnownBits.h:24

llvm::SDNodeFlags
These are IR-level optimization flags that may be propagated to SDNodes.
Definition: SelectionDAGNodes.h:384

llvm::TargetLowering::DAGCombinerInfo
Definition: TargetLowering.h:4398