LLVM: lib/Target/WebAssembly/WebAssemblyTargetTransformInfo.cpp Source File

//===-- WebAssemblyTargetTransformInfo.cpp - WebAssembly-specific TTI -----===//

//

// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.

// See https://llvm.org/LICENSE.txt for license information.

// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception

//

//===----------------------------------------------------------------------===//

///

/// \file

/// This file defines the WebAssembly-specific TargetTransformInfo

/// implementation.

///

//===----------------------------------------------------------------------===//


#include "WebAssemblyTargetTransformInfo.h"


#include "llvm/CodeGen/CostTable.h"

using namespace llvm;


#define DEBUG_TYPE "wasmtti"


/// Report how well population count is supported for an integer that is
/// \p TyWidth bits wide. \p TyWidth must be a power of two.
TargetTransformInfo::PopcntSupportKind
WebAssemblyTTIImpl::getPopcntSupport(unsigned TyWidth) const {
  assert(isPowerOf2_32(TyWidth) && "Ty width must be power of 2");

  // The answer does not depend on the width: every valid width is reported as
  // having fast hardware support.
  return TTI::PSK_FastHardware;
}


/// Return the number of registers assumed for register class \p ClassID.
///
/// The generic answer is used as-is, except for the vector class (ID 1),
/// where at least 16 registers are reported as a rough guess for SIMD.
unsigned WebAssemblyTTIImpl::getNumberOfRegisters(unsigned ClassID) const {
  const unsigned GenericCount = BaseT::getNumberOfRegisters(ClassID);

  // Only the vector register class gets the SIMD lower bound.
  if (ClassID != 1)
    return GenericCount;

  return std::max(GenericCount, 16u);
}


/// Return the register width, in bits, for the register kind \p K.
///
/// Scalars are 64 bits wide. Fixed-width vectors are 128 bits wide when the
/// subtarget has SIMD128 and 64 bits otherwise. Scalable vectors are reported
/// with a scalable size of zero.
TypeSize WebAssemblyTTIImpl::getRegisterBitWidth(
    TargetTransformInfo::RegisterKind K) const {
  switch (K) {
  case TargetTransformInfo::RGK_ScalableVector:
    return TypeSize::getScalable(0);
  case TargetTransformInfo::RGK_FixedWidthVector: {
    const unsigned VectorBits = getST()->hasSIMD128() ? 128 : 64;
    return TypeSize::getFixed(VectorBits);
  }
  case TargetTransformInfo::RGK_Scalar:
    return TypeSize::getFixed(64);
  }

  llvm_unreachable("Unsupported register kind");
}


/// Estimate the cost of the arithmetic instruction \p Opcode on type \p Ty.
///
/// The generic cost is returned unchanged except for vector shifts whose
/// shift amount (described by \p Op2Info) is not uniform. Those are modelled
/// as a per-element extract / scalar op / insert sequence.
InstructionCost WebAssemblyTTIImpl::getArithmeticInstrCost(
    unsigned Opcode, Type *Ty, TTI::TargetCostKind CostKind,
    TTI::OperandValueInfo Op1Info, TTI::OperandValueInfo Op2Info,
    ArrayRef<const Value *> Args, const Instruction *CxtI) const {

  const InstructionCost GenericCost =
      BasicTTIImplBase<WebAssemblyTTIImpl>::getArithmeticInstrCost(
          Opcode, Ty, CostKind, Op1Info, Op2Info);

  // Scalar operations are never adjusted.
  auto *VecTy = dyn_cast<VectorType>(Ty);
  if (!VecTy)
    return GenericCost;

  const bool IsShift = Opcode == Instruction::LShr ||
                       Opcode == Instruction::AShr ||
                       Opcode == Instruction::Shl;
  if (!IsShift || Op2Info.isUniform())
    return GenericCost;

  // SIMD128's shifts currently only accept a scalar shift count, so each
  // element needs an extract, the scalar operation and an insert. This is a
  // rough approximation.
  const unsigned NumLanes = cast<FixedVectorType>(VecTy)->getNumElements();
  const InstructionCost PerLaneCost =
      TargetTransformInfo::TCC_Basic +
      getArithmeticInstrCost(Opcode, VecTy->getElementType(), CostKind) +
      TargetTransformInfo::TCC_Basic;
  return NumLanes * PerLaneCost;
}


/// Estimate the cost of casting \p Src to \p Dst with the cast \p Opcode.
///
/// With SIMD128 and simple value types on both sides, integer extensions are
/// priced specially:
///  - an extension whose single user is a multiply is free (or costs 1 when
///    an intermediate extension is still needed), modelling extmul_low;
///  - other listed extensions are priced from a table modelling extend_low.
/// Every other case defers to the generic implementation.
InstructionCost WebAssemblyTTIImpl::getCastInstrCost(
    unsigned Opcode, Type *Dst, Type *Src, TTI::CastContextHint CCH,
    TTI::TargetCostKind CostKind, const Instruction *I) const {
  const int CastISD = TLI->InstructionOpcodeToISD(Opcode);
  const EVT SrcEVT = TLI->getValueType(DL, Src);
  const EVT DstEVT = TLI->getValueType(DL, Dst);

  // Without simple types or SIMD128 there is nothing target-specific to add.
  if (!SrcEVT.isSimple() || !DstEVT.isSimple() || !ST->hasSIMD128())
    return BaseT::getCastInstrCost(Opcode, Dst, Src, CCH, CostKind, I);

  const MVT DstVT = DstEVT.getSimpleVT();
  const MVT SrcVT = SrcEVT.getSimpleVT();

  if (I && I->hasOneUser()) {
    const auto *OnlyUser = cast<Instruction>(*I->user_begin());
    const int UserISD = TLI->InstructionOpcodeToISD(OnlyUser->getOpcode());
    const bool IsIntExtend =
        CastISD == ISD::ZERO_EXTEND || CastISD == ISD::SIGN_EXTEND;

    // extmul_low support
    if (UserISD == ISD::MUL && IsIntExtend) {
      // Free low extensions.
      const bool IsSingleStep =
          (SrcVT == MVT::v8i8 && DstVT == MVT::v8i16) ||
          (SrcVT == MVT::v4i16 && DstVT == MVT::v4i32) ||
          (SrcVT == MVT::v2i32 && DstVT == MVT::v2i64);
      if (IsSingleStep)
        return 0;

      // Will require an additional extlow operation for the intermediate
      // i16/i32 value.
      const bool IsDoubleStep =
          (SrcVT == MVT::v4i8 && DstVT == MVT::v4i32) ||
          (SrcVT == MVT::v2i16 && DstVT == MVT::v2i64);
      if (IsDoubleStep)
        return 1;
    }
  }

  // extend_low: one instruction per doubling of the element width.
  static constexpr TypeConversionCostTblEntry ExtendLowTbl[] = {
      // Single-step extensions.
      {ISD::SIGN_EXTEND, MVT::v2i64, MVT::v2i32, 1},
      {ISD::ZERO_EXTEND, MVT::v2i64, MVT::v2i32, 1},
      {ISD::SIGN_EXTEND, MVT::v4i32, MVT::v4i16, 1},
      {ISD::ZERO_EXTEND, MVT::v4i32, MVT::v4i16, 1},
      {ISD::SIGN_EXTEND, MVT::v8i16, MVT::v8i8, 1},
      {ISD::ZERO_EXTEND, MVT::v8i16, MVT::v8i8, 1},
      // Two-step extensions.
      {ISD::SIGN_EXTEND, MVT::v2i64, MVT::v2i16, 2},
      {ISD::ZERO_EXTEND, MVT::v2i64, MVT::v2i16, 2},
      {ISD::SIGN_EXTEND, MVT::v4i32, MVT::v4i8, 2},
      {ISD::ZERO_EXTEND, MVT::v4i32, MVT::v4i8, 2},
  };

  const auto *Match =
      ConvertCostTableLookup(ExtendLowTbl, CastISD, DstVT, SrcVT);
  if (Match)
    return Match->Cost;

  return BaseT::getCastInstrCost(Opcode, Dst, Src, CCH, CostKind, I);
}


/// Build the options that control inline expansion of memcmp.
///
/// Overlapping loads are allowed. Load sizes are 8, 4, 2 and 1 bytes, with a
/// 16-byte load listed first when SIMD128 is available. The load budget comes
/// from the target lowering for \p OptSize, and a single block may use the
/// whole budget.
WebAssemblyTTIImpl::TTI::MemCmpExpansionOptions
WebAssemblyTTIImpl::enableMemCmpExpansion(bool OptSize, bool IsZeroCmp) const {
  TTI::MemCmpExpansionOptions Opts;
  Opts.AllowOverlappingLoads = true;

  // Widest load first.
  if (ST->hasSIMD128())
    Opts.LoadSizes.push_back(16);
  Opts.LoadSizes.append({8, 4, 2, 1});

  const unsigned LoadBudget = TLI->getMaxExpandSizeMemcmp(OptSize);
  Opts.MaxNumLoads = LoadBudget;
  Opts.NumLoadsPerBlock = LoadBudget;

  return Opts;
}


/// Estimate the cost of the load or store \p Opcode on type \p Ty.
///
/// Only fixed-width vectors on SIMD128 subtargets are priced specially:
/// loads of 32, 64 or 128 bits and stores of 8, 16, 32, 64 or 128 bits cost
/// 2. An invalid type-legalization cost yields an invalid cost. Everything
/// else uses the generic implementation.
InstructionCost WebAssemblyTTIImpl::getMemoryOpCost(
    unsigned Opcode, Type *Ty, Align Alignment, unsigned AddressSpace,
    TTI::TargetCostKind CostKind, TTI::OperandValueInfo OpInfo,
    const Instruction *I) const {
  // Shared fallback for every case that is not special-cased below.
  const auto GenericCost = [&]() -> InstructionCost {
    return BaseT::getMemoryOpCost(Opcode, Ty, Alignment, AddressSpace,
                                  CostKind);
  };

  if (!ST->hasSIMD128() || !isa<FixedVectorType>(Ty))
    return GenericCost();

  // Type legalization can't handle structs
  const EVT VT = TLI->getValueType(DL, Ty, true);
  if (VT == MVT::Other)
    return GenericCost();

  if (!getTypeLegalizationCost(Ty).first.isValid())
    return InstructionCost::getInvalid();

  const unsigned BitWidth = VT.getSizeInBits();
  const bool IsWordOrWider =
      BitWidth == 32 || BitWidth == 64 || BitWidth == 128;

  switch (TLI->InstructionOpcodeToISD(Opcode)) {
  case ISD::LOAD:
    // 128-bit loads are a single instruction. 32-bit and 64-bit vector loads
    // can be lowered to load32_zero and load64_zero respectively. Assume SIMD
    // loads are twice as expensive as scalar.
    if (IsWordOrWider)
      return 2;
    break;
  case ISD::STORE:
    // For stores, we can use store lane operations, which also cover the
    // 8-bit and 16-bit widths.
    if (IsWordOrWider || BitWidth == 8 || BitWidth == 16)
      return 2;
    break;
  default:
    break;
  }

  return GenericCost();
}


/// Estimate the cost of an interleaved load or store group.
///
/// \param Opcode         Load or store opcode of the group.
/// \param Ty             The wide vector type covering all interleaved
///                       members; must be a vector type.
/// \param Factor         Interleave factor; must be at least 2.
/// \param Indices        Member indices, forwarded to the generic model.
/// \param UseMaskForCond Forwarded to the generic model; if set, the generic
///                       cost is returned.
/// \param UseMaskForGaps Forwarded to the generic model; if set, the generic
///                       cost is returned.
///
/// \returns an invalid cost when SIMD128 is unavailable, \p Ty is not a
/// fixed-width vector, the element count is smaller than 2 or not a multiple
/// of \p Factor, or the element size is not 8/16/32/64 bits. For factors up
/// to 4 whose per-member sub-vector type appears in the shuffle table, the
/// result is the table's shuffle cost plus the cost of the memory accesses.
/// Otherwise the generic cost is returned.
InstructionCost WebAssemblyTTIImpl::getInterleavedMemoryOpCost(
    unsigned Opcode, Type *Ty, unsigned Factor, ArrayRef<unsigned> Indices,
    Align Alignment, unsigned AddressSpace, TTI::TargetCostKind CostKind,
    bool UseMaskForCond, bool UseMaskForGaps) const {
  assert(Factor >= 2 && "Invalid interleave factor");

  auto *VecTy = cast<VectorType>(Ty);
  if (!ST->hasSIMD128() || !isa<FixedVectorType>(VecTy)) {
    return InstructionCost::getInvalid();
  }

  // Masked groups are not modelled here.
  if (UseMaskForCond || UseMaskForGaps)
    return BaseT::getInterleavedMemoryOpCost(Opcode, Ty, Factor, Indices,
                                             Alignment, AddressSpace, CostKind,
                                             UseMaskForCond, UseMaskForGaps);

  constexpr unsigned MaxInterleaveFactor = 4;
  if (Factor <= MaxInterleaveFactor) {
    unsigned MinElts = VecTy->getElementCount().getKnownMinValue();
    // Ensure the number of vector elements is greater than 1 and that the
    // vector splits evenly into Factor members.
    if (MinElts < 2 || MinElts % Factor != 0)
      return InstructionCost::getInvalid();

    unsigned ElSize = DL.getTypeSizeInBits(VecTy->getElementType());
    // Ensure the element type is legal.
    if (ElSize != 8 && ElSize != 16 && ElSize != 32 && ElSize != 64)
      return InstructionCost::getInvalid();

    // The type of one de-interleaved member.
    auto *SubVecTy =
        VectorType::get(VecTy->getElementType(),
                        VecTy->getElementCount().divideCoefficientBy(Factor));
    InstructionCost MemCost =
        getMemoryOpCost(Opcode, SubVecTy, Alignment, AddressSpace, CostKind);

    // NOTE(review): the rounding term uses MaxVecSize while the divisor is the
    // sub-vector size; kept as-is, but worth confirming this is intended.
    unsigned VecSize = DL.getTypeSizeInBits(SubVecTy);
    unsigned MaxVecSize = 128;
    unsigned NumAccesses =
        std::max<unsigned>(1, (MinElts * ElSize + MaxVecSize - 1) / VecSize);

    // A stride of two is commonly supported via dedicated instructions, so it
    // should be relatively cheap for all element sizes. A stride of four is
    // more expensive as it will likely require more shuffles. Using two
    // simd128 inputs is considered more expensive and we mainly account for
    // shuffling two inputs (32 bytes), but we do model 4 x v4i32 to enable
    // arithmetic kernels.
    static const CostTblEntry ShuffleCostTbl[] = {
        // One reg.
        {2, MVT::v2i8, 1},  // interleave 2 x 2i8 into 4i8
        {2, MVT::v4i8, 1},  // interleave 2 x 4i8 into 8i8
        {2, MVT::v8i8, 1},  // interleave 2 x 8i8 into 16i8
        {2, MVT::v2i16, 1}, // interleave 2 x 2i16 into 4i16
        {2, MVT::v4i16, 1}, // interleave 2 x 4i16 into 8i16
        {2, MVT::v2i32, 1}, // interleave 2 x 2i32 into 4i32

        // Two regs.
        {2, MVT::v16i8, 2}, // interleave 2 x 16i8 into 32i8
        {2, MVT::v8i16, 2}, // interleave 2 x 8i16 into 16i16
        {2, MVT::v4i32, 2}, // interleave 2 x 4i32 into 8i32

        // One reg.
        {4, MVT::v2i8, 4},  // interleave 4 x 2i8 into 8i8
        {4, MVT::v4i8, 4},  // interleave 4 x 4i8 into 16i8
        {4, MVT::v2i16, 4}, // interleave 4 x 2i16 into 8i16

        // Two regs.
        {4, MVT::v8i8, 16}, // interleave 4 x 8i8 into 32i8
        {4, MVT::v4i16, 8}, // interleave 4 x 4i16 into 16i16
        {4, MVT::v2i32, 4}, // interleave 4 x 2i32 into 8i32

        // Four regs.
        {4, MVT::v4i32, 16}, // interleave 4 x 4i32 into 16i32
    };

    // The sub-vector may have no simple MVT (e.g. an odd element count).
    // getSimpleVT() must only be called on simple types, so such types skip
    // the table and take the generic path below.
    EVT ETy = TLI->getValueType(DL, SubVecTy);
    if (ETy.isSimple()) {
      if (const auto *Entry =
              CostTableLookup(ShuffleCostTbl, Factor, ETy.getSimpleVT()))
        return Entry->Cost + (NumAccesses * MemCost);
    }
  }

  return BaseT::getInterleavedMemoryOpCost(Opcode, VecTy, Factor, Indices,
                                           Alignment, AddressSpace, CostKind,
                                           UseMaskForCond, UseMaskForGaps);
}


/// Estimate the cost of an insert/extract element instruction on \p Val.
///
/// The generic cost is used, with a large penalty added when \p Index is -1u,
/// since SIMD128's insert/extract currently only take constant indices.
InstructionCost WebAssemblyTTIImpl::getVectorInstrCost(
    unsigned Opcode, Type *Val, TTI::TargetCostKind CostKind, unsigned Index,
    const Value *Op0, const Value *Op1) const {
  const InstructionCost GenericCost = BasicTTIImplBase::getVectorInstrCost(
      Opcode, Val, CostKind, Index, Op0, Op1);

  const bool HasNoConstantIndex = (Index == -1u);
  if (!HasNoConstantIndex)
    return GenericCost;

  return GenericCost + 25 * TargetTransformInfo::TCC_Expensive;
}


/// Estimate the cost of a partial reduction.
///
/// Only an add-of-multiply reduction into an i32 accumulator is supported,
/// and only for reciprocal-throughput costing, a fixed \p VF, SIMD128, equal
/// input types and equal extension kinds. Supported shapes are 8 x i16 and
/// 16 x i8 inputs; anything else yields an invalid cost.
InstructionCost WebAssemblyTTIImpl::getPartialReductionCost(
    unsigned Opcode, Type *InputTypeA, Type *InputTypeB, Type *AccumType,
    ElementCount VF, TTI::PartialReductionExtendKind OpAExtend,
    TTI::PartialReductionExtendKind OpBExtend, std::optional<unsigned> BinOp,
    TTI::TargetCostKind CostKind) const {
  const InstructionCost Invalid = InstructionCost::getInvalid();
  const InstructionCost UnitCost(TTI::TCC_Basic);

  if (!VF.isFixed() || !ST->hasSIMD128() ||
      CostKind != TTI::TCK_RecipThroughput)
    return Invalid;

  // Possible options:
  // - i16x8.extadd_pairwise_i8x16_sx
  // - i32x4.extadd_pairwise_i16x8_sx
  // - i32x4.dot_i16x8_s
  // Only try to support dot, for now.
  const bool IsAddOfMul = Opcode == Instruction::Add && BinOp &&
                          *BinOp == Instruction::Mul;
  if (!IsAddOfMul)
    return Invalid;

  // Both multiplicands must have the same type and the same extension.
  if (InputTypeA != InputTypeB || OpAExtend != OpBExtend)
    return Invalid;

  const EVT InputEVT = EVT::getEVT(InputTypeA);
  const EVT AccumEVT = EVT::getEVT(AccumType);

  // TODO: Add i64 accumulator.
  if (AccumEVT != MVT::i32)
    return Invalid;

  const bool IsSignExtended = OpAExtend == TTI::PR_SignExtend;

  // Signed inputs can lower to dot
  if (InputEVT == MVT::i16 && VF.getFixedValue() == 8)
    return IsSignExtended ? UnitCost : UnitCost * 2;

  // Double the size of the lowered sequence.
  if (InputEVT == MVT::i8 && VF.getFixedValue() == 16)
    return IsSignExtended ? UnitCost * 2 : UnitCost * 4;

  return Invalid;
}


/// Choose the shuffle pattern used when expanding the reduction intrinsic
/// \p II: pairwise for vector_reduce_fadd, split-half for everything else.
TTI::ReductionShuffle WebAssemblyTTIImpl::getPreferredExpandedReductionShuffle(
    const IntrinsicInst *II) const {
  const bool IsFAddReduction =
      II->getIntrinsicID() == Intrinsic::vector_reduce_fadd;

  if (IsFAddReduction)
    return TTI::ReductionShuffle::Pairwise;
  return TTI::ReductionShuffle::SplitHalf;
}


/// Fill in \p UP with the unrolling preferences for loop \p L.
///
/// \p UP is left untouched if the loop contains a call or invoke whose known
/// callee is lowered to a real call. Otherwise partial, runtime and
/// upper-bound unrolling are enabled with a partial threshold of 30, and
/// unrolling is disabled when optimizing for size.
void WebAssemblyTTIImpl::getUnrollingPreferences(
    Loop *L, ScalarEvolution &SE, TTI::UnrollingPreferences &UP,
    OptimizationRemarkEmitter *ORE) const {
  // Scan the loop: don't unroll loops with calls. This is a standard approach
  // for most (all?) targets.
  for (BasicBlock *Block : L->blocks()) {
    for (Instruction &Inst : *Block) {
      if (!isa<CallInst>(Inst) && !isa<InvokeInst>(Inst))
        continue;

      // Calls without a known callee do not block unrolling.
      const Function *Callee = cast<CallBase>(Inst).getCalledFunction();
      if (Callee && isLoweredToCall(Callee))
        return;
    }
  }

  // The chosen threshold is within the range of 'LoopMicroOpBufferSize' of
  // the various microarchitectures that use the BasicTTI implementation and
  // has been selected through heuristics across multiple cores and runtimes.
  UP.UpperBound = true;
  UP.Runtime = true;
  UP.Partial = true;
  UP.PartialThreshold = 30;

  // Avoid unrolling when optimizing for size.
  UP.PartialOptSizeThreshold = 0;
  UP.OptSizeThreshold = 0;

  // Set number of instructions optimized when "back edge"
  // becomes "fall through" to default value of 2.
  UP.BEInsns = 2;
}


/// Return true if the subtarget reports tail-call support.
bool WebAssemblyTTIImpl::supportsTailCalls() const {
  const auto *Subtarget = getST();
  return Subtarget->hasTailCall();
}


/// Decide whether operands of \p I should be sunk next to it.
///
/// Only vector shifts are considered. If the shift amount is a non-constant
/// shuffle with a zero mask of an insertelement at index zero, the uses of
/// the insert and of the shuffle are appended to \p Ops and true is returned.
/// In every other case \p Ops is left unchanged and false is returned.
bool WebAssemblyTTIImpl::isProfitableToSinkOperands(
    Instruction *I, SmallVectorImpl<Use *> &Ops) const {
  using namespace llvm::PatternMatch;

  const bool IsVectorShift = I->getType()->isVectorTy() && I->isShift();
  if (!IsVectorShift)
    return false;

  Value *ShiftAmount = I->getOperand(1);
  // We don't need to sink a constant splat.
  if (isa<Constant>(ShiftAmount))
    return false;

  const bool IsSplatOfInsert =
      match(ShiftAmount,
            m_Shuffle(m_InsertElt(m_Value(), m_Value(), m_ZeroInt()),
                      m_Value(), m_ZeroMask()));
  if (!IsSplatOfInsert)
    return false;

  // Sink insert
  Ops.push_back(&cast<Instruction>(ShiftAmount)->getOperandUse(0));
  // Sink shuffle
  Ops.push_back(&I->getOperandUse(1));
  return true;
}

assert
assert(UImm &&(UImm !=~static_cast< T >(0)) &&"Invalid immediate!")

CostKind
static cl::opt< OutputCostKind > CostKind("cost-kind", cl::desc("Target cost kind"), cl::init(OutputCostKind::RecipThroughput), cl::values(clEnumValN(OutputCostKind::RecipThroughput, "throughput", "Reciprocal throughput"), clEnumValN(OutputCostKind::Latency, "latency", "Instruction latency"), clEnumValN(OutputCostKind::CodeSize, "code-size", "Code size"), clEnumValN(OutputCostKind::SizeAndLatency, "size-latency", "Code size and latency"), clEnumValN(OutputCostKind::All, "all", "Print all cost kinds")))

CostTable.h
Cost tables and simple lookup functions.

MaxVecSize
static const int MaxVecSize
Definition: DXILDataScalarization.cpp:28

Options
static LVOptions Options
Definition: LVOptions.cpp:25

MaxInterleaveFactor
static const unsigned MaxInterleaveFactor
Maximum vectorization interleave count.
Definition: LoopVectorizationLegality.cpp:85

F
#define F(x, y, z)
Definition: MD5.cpp:55

I
#define I(x, y, z)
Definition: MD5.cpp:58

getCalledFunction
static const Function * getCalledFunction(const Value *V)
Definition: MemoryBuiltins.cpp:159

II
uint64_t IntrinsicInst * II
Definition: NVVMIntrRange.cpp:46

WebAssemblyTargetTransformInfo.h
This file defines a TargetTransformInfoImplBase conforming object specific to the WebAssembly target machine.

llvm::ArrayRef
ArrayRef - Represent a constant reference to an array (0 or more elements consecutively in memory),...
Definition: ArrayRef.h:41

llvm::BasicBlock
LLVM Basic Block Representation.
Definition: BasicBlock.h:62

llvm::BasicTTIImplBase< WebAssemblyTTIImpl >::getInterleavedMemoryOpCost
InstructionCost getInterleavedMemoryOpCost(unsigned Opcode, Type *VecTy, unsigned Factor, ArrayRef< unsigned > Indices, Align Alignment, unsigned AddressSpace, TTI::TargetCostKind CostKind, bool UseMaskForCond=false, bool UseMaskForGaps=false) const override
Definition: BasicTTIImpl.h:1589

llvm::BasicTTIImplBase::getVectorInstrCost
InstructionCost getVectorInstrCost(unsigned Opcode, Type *Val, TTI::TargetCostKind CostKind, unsigned Index, const Value *Op0, const Value *Op1) const override
Definition: BasicTTIImpl.h:1423

llvm::BasicTTIImplBase::getArithmeticInstrCost
InstructionCost getArithmeticInstrCost(unsigned Opcode, Type *Ty, TTI::TargetCostKind CostKind, TTI::OperandValueInfo Opd1Info={TTI::OK_AnyValue, TTI::OP_None}, TTI::OperandValueInfo Opd2Info={TTI::OK_AnyValue, TTI::OP_None}, ArrayRef< const Value * > Args={}, const Instruction *CxtI=nullptr) const override
Definition: BasicTTIImpl.h:1033

llvm::BasicTTIImplBase< WebAssemblyTTIImpl >::getCastInstrCost
InstructionCost getCastInstrCost(unsigned Opcode, Type *Dst, Type *Src, TTI::CastContextHint CCH, TTI::TargetCostKind CostKind, const Instruction *I=nullptr) const override
Definition: BasicTTIImpl.h:1196

llvm::BasicTTIImplBase< WebAssemblyTTIImpl >::getTypeLegalizationCost
std::pair< InstructionCost, MVT > getTypeLegalizationCost(Type *Ty) const
Estimate the cost of type-legalization and the legalized type.
Definition: BasicTTIImpl.h:997

llvm::BasicTTIImplBase< WebAssemblyTTIImpl >::DL
const DataLayout & DL
Definition: TargetTransformInfoImpl.h:39

llvm::BasicTTIImplBase< WebAssemblyTTIImpl >::getMemoryOpCost
InstructionCost getMemoryOpCost(unsigned Opcode, Type *Src, Align Alignment, unsigned AddressSpace, TTI::TargetCostKind CostKind, TTI::OperandValueInfo OpInfo={TTI::OK_AnyValue, TTI::OP_None}, const Instruction *I=nullptr) const override
Definition: BasicTTIImpl.h:1503

llvm::DataLayout::getTypeSizeInBits
TypeSize getTypeSizeInBits(Type *Ty) const
Size examples:
Definition: DataLayout.h:674

llvm::ElementCount
Definition: TypeSize.h:301

llvm::Function
Definition: Function.h:64

llvm::InstructionCost
Definition: InstructionCost.h:30

llvm::InstructionCost::getInvalid
static InstructionCost getInvalid(CostType Val=0)
Definition: InstructionCost.h:74

llvm::Instruction
Definition: Instruction.h:69

llvm::IntrinsicInst
A wrapper class for inspecting calls to intrinsic functions.
Definition: IntrinsicInst.h:49

llvm::Loop
Represents a single loop in the control flow graph.
Definition: LoopInfo.h:40

llvm::OptimizationRemarkEmitter
The optimization diagnostic interface.
Definition: OptimizationRemarkEmitter.h:33

llvm::ScalarEvolution
The main scalar evolution driver.
Definition: ScalarEvolution.h:448

llvm::SmallVectorImpl
This class consists of common code factored out of the SmallVector class to reduce code duplication b...
Definition: SmallVector.h:574

llvm::SmallVectorTemplateBase::push_back
void push_back(const T &Elt)
Definition: SmallVector.h:414

llvm::TargetLoweringBase::InstructionOpcodeToISD
int InstructionOpcodeToISD(unsigned Opcode) const
Get the ISD node that corresponds to the Instruction class opcode.
Definition: TargetLoweringBase.cpp:1841

llvm::TargetLoweringBase::getValueType
EVT getValueType(const DataLayout &DL, Type *Ty, bool AllowUnknown=false) const
Return the EVT corresponding to this LLVM type.
Definition: TargetLowering.h:1726

llvm::TargetLoweringBase::getMaxExpandSizeMemcmp
unsigned getMaxExpandSizeMemcmp(bool OptSize) const
Get maximum # of load operations permitted for memcmp.
Definition: TargetLowering.h:1947

llvm::TargetTransformInfoImplBase::getNumberOfRegisters
virtual unsigned getNumberOfRegisters(unsigned ClassID) const
Definition: TargetTransformInfoImpl.h:561

llvm::TargetTransformInfoImplBase::isLoweredToCall
virtual bool isLoweredToCall(const Function *F) const
Definition: TargetTransformInfoImpl.h:174

llvm::TargetTransformInfo::ReductionShuffle
ReductionShuffle
Definition: TargetTransformInfo.h:1849

llvm::TargetTransformInfo::ReductionShuffle::Pairwise
@ Pairwise

llvm::TargetTransformInfo::ReductionShuffle::SplitHalf
@ SplitHalf

llvm::TargetTransformInfo::TargetCostKind
TargetCostKind
The kind of cost model.
Definition: TargetTransformInfo.h:271

llvm::TargetTransformInfo::TCK_RecipThroughput
@ TCK_RecipThroughput
Reciprocal throughput.
Definition: TargetTransformInfo.h:272

llvm::TargetTransformInfo::RegisterKind
RegisterKind
Definition: TargetTransformInfo.h:1206

llvm::TargetTransformInfo::RGK_FixedWidthVector
@ RGK_FixedWidthVector
Definition: TargetTransformInfo.h:1206

llvm::TargetTransformInfo::RGK_ScalableVector
@ RGK_ScalableVector
Definition: TargetTransformInfo.h:1206

llvm::TargetTransformInfo::RGK_Scalar
@ RGK_Scalar
Definition: TargetTransformInfo.h:1206

llvm::TargetTransformInfo::PopcntSupportKind
PopcntSupportKind
Flags indicating the kind of support for population count.
Definition: TargetTransformInfo.h:735

llvm::TargetTransformInfo::PSK_FastHardware
@ PSK_FastHardware
Definition: TargetTransformInfo.h:735

llvm::TargetTransformInfo::PartialReductionExtendKind
PartialReductionExtendKind
Definition: TargetTransformInfo.h:221

llvm::TargetTransformInfo::PR_SignExtend
@ PR_SignExtend
Definition: TargetTransformInfo.h:221

llvm::TargetTransformInfo::TCC_Expensive
@ TCC_Expensive
The cost of a 'div' instruction on x86.
Definition: TargetTransformInfo.h:299

llvm::TargetTransformInfo::TCC_Basic
@ TCC_Basic
The cost of a typical 'add' instruction.
Definition: TargetTransformInfo.h:298

llvm::TargetTransformInfo::CastContextHint
CastContextHint
Represents a hint about the context in which a cast is used.
Definition: TargetTransformInfo.h:1428

llvm::TypeSize
Definition: TypeSize.h:335

llvm::TypeSize::getFixed
static constexpr TypeSize getFixed(ScalarTy ExactSize)
Definition: TypeSize.h:346

llvm::TypeSize::getScalable
static constexpr TypeSize getScalable(ScalarTy MinimumSize)
Definition: TypeSize.h:349

llvm::Type
The instances of the Type class are immutable: once they are created, they are never changed.
Definition: Type.h:45

llvm::Value
LLVM Value Representation.
Definition: Value.h:75

llvm::VectorType::get
static LLVM_ABI VectorType * get(Type *ElementType, ElementCount EC)
This static method is the primary way to construct a VectorType.

llvm::WebAssemblySubtarget::hasTailCall
bool hasTailCall() const
Definition: WebAssemblySubtarget.h:115

llvm::WebAssemblySubtarget::hasSIMD128
bool hasSIMD128() const
Definition: WebAssemblySubtarget.h:114

llvm::WebAssemblyTTIImpl::getInterleavedMemoryOpCost
InstructionCost getInterleavedMemoryOpCost(unsigned Opcode, Type *Ty, unsigned Factor, ArrayRef< unsigned > Indices, Align Alignment, unsigned AddressSpace, TTI::TargetCostKind CostKind, bool UseMaskForCond, bool UseMaskForGaps) const override
Definition: WebAssemblyTargetTransformInfo.cpp:210

llvm::WebAssemblyTTIImpl::supportsTailCalls
bool supportsTailCalls() const override
Definition: WebAssemblyTargetTransformInfo.cpp:396

llvm::WebAssemblyTTIImpl::getMemoryOpCost
InstructionCost getMemoryOpCost(unsigned Opcode, Type *Src, Align Alignment, unsigned AddressSpace, TTI::TargetCostKind CostKind, TTI::OperandValueInfo OpInfo={TTI::OK_AnyValue, TTI::OP_None}, const Instruction *I=nullptr) const override
Definition: WebAssemblyTargetTransformInfo.cpp:160

llvm::WebAssemblyTTIImpl::getPopcntSupport
TTI::PopcntSupportKind getPopcntSupport(unsigned TyWidth) const override
Definition: WebAssemblyTargetTransformInfo.cpp:23

llvm::WebAssemblyTTIImpl::getRegisterBitWidth
TypeSize getRegisterBitWidth(TargetTransformInfo::RegisterKind K) const override
Definition: WebAssemblyTargetTransformInfo.cpp:39

llvm::WebAssemblyTTIImpl::getArithmeticInstrCost
InstructionCost getArithmeticInstrCost(unsigned Opcode, Type *Ty, TTI::TargetCostKind CostKind, TTI::OperandValueInfo Op1Info={TTI::OK_AnyValue, TTI::OP_None}, TTI::OperandValueInfo Op2Info={TTI::OK_AnyValue, TTI::OP_None}, ArrayRef< const Value * > Args={}, const Instruction *CxtI=nullptr) const override
Definition: WebAssemblyTargetTransformInfo.cpp:53

llvm::WebAssemblyTTIImpl::isProfitableToSinkOperands
bool isProfitableToSinkOperands(Instruction *I, SmallVectorImpl< Use * > &Ops) const override
Definition: WebAssemblyTargetTransformInfo.cpp:400

llvm::WebAssemblyTTIImpl::getPartialReductionCost
InstructionCost getPartialReductionCost(unsigned Opcode, Type *InputTypeA, Type *InputTypeB, Type *AccumType, ElementCount VF, TTI::PartialReductionExtendKind OpAExtend, TTI::PartialReductionExtendKind OpBExtend, std::optional< unsigned > BinOp, TTI::TargetCostKind CostKind) const override
Definition: WebAssemblyTargetTransformInfo.cpp:307

llvm::WebAssemblyTTIImpl::getVectorInstrCost
InstructionCost getVectorInstrCost(unsigned Opcode, Type *Val, TTI::TargetCostKind CostKind, unsigned Index, const Value *Op0, const Value *Op1) const override
Definition: WebAssemblyTargetTransformInfo.cpp:294

llvm::WebAssemblyTTIImpl::getPreferredExpandedReductionShuffle
TTI::ReductionShuffle getPreferredExpandedReductionShuffle(const IntrinsicInst *II) const override
Definition: WebAssemblyTargetTransformInfo.cpp:357

llvm::WebAssemblyTTIImpl::getUnrollingPreferences
void getUnrollingPreferences(Loop *L, ScalarEvolution &SE, TTI::UnrollingPreferences &UP, OptimizationRemarkEmitter *ORE) const override
Definition: WebAssemblyTargetTransformInfo.cpp:369

llvm::WebAssemblyTTIImpl::enableMemCmpExpansion
TTI::MemCmpExpansionOptions enableMemCmpExpansion(bool OptSize, bool IsZeroCmp) const override
Definition: WebAssemblyTargetTransformInfo.cpp:145

llvm::WebAssemblyTTIImpl::getCastInstrCost
InstructionCost getCastInstrCost(unsigned Opcode, Type *Dst, Type *Src, TTI::CastContextHint CCH, TTI::TargetCostKind CostKind, const Instruction *I=nullptr) const override
Definition: WebAssemblyTargetTransformInfo.cpp:82

llvm::WebAssemblyTTIImpl::getNumberOfRegisters
unsigned getNumberOfRegisters(unsigned ClassID) const override
Definition: WebAssemblyTargetTransformInfo.cpp:28

llvm::details::FixedOrScalableQuantity::getFixedValue
constexpr ScalarTy getFixedValue() const
Definition: TypeSize.h:203

llvm::details::FixedOrScalableQuantity::isFixed
constexpr bool isFixed() const
Returns true if the quantity is not scaled by vscale.
Definition: TypeSize.h:175

llvm_unreachable
#define llvm_unreachable(msg)
Marks that the current location is not supposed to be reachable.
Definition: ErrorHandling.h:164

llvm::ISD::STORE
@ STORE
Definition: ISDOpcodes.h:1142

llvm::ISD::LOAD
@ LOAD
LOAD and STORE have token chains as their first operand, then the same operands as an LLVM load/store...
Definition: ISDOpcodes.h:1141

llvm::ISD::SIGN_EXTEND
@ SIGN_EXTEND
Conversion operators.
Definition: ISDOpcodes.h:826

llvm::ISD::ZERO_EXTEND
@ ZERO_EXTEND
ZERO_EXTEND - Used for integer types, zeroing the new bits.
Definition: ISDOpcodes.h:832

llvm::ISD::MUL
@ MUL
Definition: ISDOpcodes.h:261

llvm::MIPatternMatch::m_ZeroInt
SpecificConstantMatch m_ZeroInt()
Convenience matchers for specific integer values.
Definition: MIPatternMatch.h:277

llvm::NVPTXAS::AddressSpace
AddressSpace
Definition: NVPTXAddrSpace.h:21

llvm::PatternMatch
Definition: PatternMatch.h:47

llvm::PatternMatch::match
bool match(Val *V, const Pattern &P)
Definition: PatternMatch.h:49

llvm::PatternMatch::m_Shuffle
TwoOps_match< V1_t, V2_t, Instruction::ShuffleVector > m_Shuffle(const V1_t &v1, const V2_t &v2)
Matches ShuffleVectorInst independently of mask value.
Definition: PatternMatch.h:2040

llvm::PatternMatch::m_Value
class_match< Value > m_Value()
Match an arbitrary value and ignore it.
Definition: PatternMatch.h:92

llvm::PatternMatch::m_InsertElt
ThreeOps_match< Val_t, Elt_t, Idx_t, Instruction::InsertElement > m_InsertElt(const Val_t &Val, const Elt_t &Elt, const Idx_t &Idx)
Matches InsertElementInst.
Definition: PatternMatch.h:1958

llvm
This is an optimization pass for GlobalISel generic memory operations.
Definition: AddressRanges.h:18

llvm::CostTableLookup
const CostTblEntryT< CostType > * CostTableLookup(ArrayRef< CostTblEntryT< CostType > > Tbl, int ISD, MVT Ty)
Find in cost table.
Definition: CostTable.h:35

llvm::isPowerOf2_32
constexpr bool isPowerOf2_32(uint32_t Value)
Return true if the argument is a power of two > 0.
Definition: MathExtras.h:288

llvm::Cost
InstructionCost Cost
Definition: FunctionSpecialization.h:103

llvm::VFParamKind::Vector
@ Vector

llvm::Invalid
@ Invalid
Definition: PGOCtxProfWriter.h:24

llvm::ConvertCostTableLookup
const TypeConversionCostTblEntryT< CostType > * ConvertCostTableLookup(ArrayRef< TypeConversionCostTblEntryT< CostType > > Tbl, int ISD, MVT Dst, MVT Src)
Find in type conversion cost table.
Definition: CostTable.h:66

llvm::Align
This struct is a compact representation of a valid (non-zero power of two) alignment.
Definition: Alignment.h:39

llvm::CostTblEntryT
Cost Table Entry.
Definition: CostTable.h:25

llvm::EVT
Extended Value Type.
Definition: ValueTypes.h:35

llvm::EVT::getSizeInBits
TypeSize getSizeInBits() const
Return the size of the specified value type in bits.
Definition: ValueTypes.h:368

llvm::EVT::getEVT
static LLVM_ABI EVT getEVT(Type *Ty, bool HandleUnknown=false)
Return the value type corresponding to the specified type.
Definition: ValueTypes.cpp:299

llvm::EVT::getSimpleVT
MVT getSimpleVT() const
Return the SimpleValueType held in the specified simple EVT.
Definition: ValueTypes.h:311

llvm::PatternMatch::m_ZeroMask
Definition: PatternMatch.h:1997

llvm::TargetTransformInfo::MemCmpExpansionOptions
Returns options for expansion of memcmp. IsZeroCmp is true if this is the expansion of memcmp(p1, p2, s) == 0.
Definition: TargetTransformInfo.h:985

llvm::TargetTransformInfo::OperandValueInfo
Definition: TargetTransformInfo.h:1160

llvm::TargetTransformInfo::OperandValueInfo::isUniform
bool isUniform() const
Definition: TargetTransformInfo.h:1167

llvm::TargetTransformInfo::UnrollingPreferences
Parameters that control the generic loop unrolling transformation.
Definition: TargetTransformInfo.h:547

llvm::TargetTransformInfo::UnrollingPreferences::UpperBound
bool UpperBound
Allow using trip count upper bound to unroll loops.
Definition: TargetTransformInfo.h:618

llvm::TargetTransformInfo::UnrollingPreferences::PartialOptSizeThreshold
unsigned PartialOptSizeThreshold
The cost threshold for the unrolled loop when optimizing for size, like OptSizeThreshold,...
Definition: TargetTransformInfo.h:576

llvm::TargetTransformInfo::UnrollingPreferences::BEInsns
unsigned BEInsns
Definition: TargetTransformInfo.h:601

llvm::TargetTransformInfo::UnrollingPreferences::PartialThreshold
unsigned PartialThreshold
The cost threshold for the unrolled loop, like Threshold, but used for partial/runtime unrolling (set...
Definition: TargetTransformInfo.h:572

llvm::TargetTransformInfo::UnrollingPreferences::Runtime
bool Runtime
Allow runtime unrolling (unrolling of loops to expand the size of the loop body even when the number ...
Definition: TargetTransformInfo.h:608

llvm::TargetTransformInfo::UnrollingPreferences::Partial
bool Partial
Allow partial unrolling (unrolling of loops to expand the size of the loop body, not only to eliminat...
Definition: TargetTransformInfo.h:604

llvm::TargetTransformInfo::UnrollingPreferences::OptSizeThreshold
unsigned OptSizeThreshold
The cost threshold for the unrolled loop when optimizing for size (set to UINT_MAX to disable).
Definition: TargetTransformInfo.h:569

llvm::TypeConversionCostTblEntryT
Type Conversion Cost Table.
Definition: CostTable.h:55