LLVM: lib/Target/WebAssembly/WebAssemblyISelLowering.cpp Source File

//=- WebAssemblyISelLowering.cpp - WebAssembly DAG Lowering Implementation -==//

//

// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.

// See https://llvm.org/LICENSE.txt for license information.

// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception

//

//===----------------------------------------------------------------------===//

///

/// \file

/// This file implements the WebAssemblyTargetLowering class.

///

//===----------------------------------------------------------------------===//


#include "WebAssemblyISelLowering.h"

#include "MCTargetDesc/WebAssemblyMCTargetDesc.h"

#include "Utils/WebAssemblyTypeUtilities.h"

#include "WebAssemblyMachineFunctionInfo.h"

#include "WebAssemblySubtarget.h"

#include "WebAssemblyTargetMachine.h"

#include "WebAssemblyUtilities.h"

#include "llvm/CodeGen/CallingConvLower.h"

#include "llvm/CodeGen/MachineFrameInfo.h"

#include "llvm/CodeGen/MachineInstrBuilder.h"

#include "llvm/CodeGen/MachineJumpTableInfo.h"

#include "llvm/CodeGen/MachineModuleInfo.h"

#include "llvm/CodeGen/MachineRegisterInfo.h"

#include "llvm/CodeGen/SDPatternMatch.h"

#include "llvm/CodeGen/SelectionDAG.h"

#include "llvm/CodeGen/SelectionDAGNodes.h"

#include "llvm/IR/DiagnosticInfo.h"

#include "llvm/IR/DiagnosticPrinter.h"

#include "llvm/IR/Function.h"

#include "llvm/IR/IntrinsicInst.h"

#include "llvm/IR/Intrinsics.h"

#include "llvm/IR/IntrinsicsWebAssembly.h"

#include "llvm/Support/ErrorHandling.h"

#include "llvm/Support/KnownBits.h"

#include "llvm/Support/MathExtras.h"

#include "llvm/Target/TargetOptions.h"

using namespace llvm;


#define DEBUG_TYPE "wasm-lower"


WebAssemblyTargetLowering::WebAssemblyTargetLowering(

    const TargetMachine &TM, const WebAssemblySubtarget &STI)

    : TargetLowering(TM), Subtarget(&STI) {

  auto MVTPtr = Subtarget->hasAddr64() ? MVT::i64 : MVT::i32;


  // Set the load count for memcmp expand optimization

  MaxLoadsPerMemcmp = 8;

  MaxLoadsPerMemcmpOptSize = 4;


  // Booleans always contain 0 or 1.

  setBooleanContents(ZeroOrOneBooleanContent);

  // Except in SIMD vectors

  setBooleanVectorContents(ZeroOrNegativeOneBooleanContent);

  // We don't know the microarchitecture here, so just reduce register pressure.

  setSchedulingPreference(Sched::RegPressure);

  // Tell ISel that we have a stack pointer.

  setStackPointerRegisterToSaveRestore(

      Subtarget->hasAddr64() ? WebAssembly::SP64 : WebAssembly::SP32);

  // Set up the register classes.

  addRegisterClass(MVT::i32, &WebAssembly::I32RegClass);

  addRegisterClass(MVT::i64, &WebAssembly::I64RegClass);

  addRegisterClass(MVT::f32, &WebAssembly::F32RegClass);

  addRegisterClass(MVT::f64, &WebAssembly::F64RegClass);

  if (Subtarget->hasSIMD128()) {

    addRegisterClass(MVT::v16i8, &WebAssembly::V128RegClass);

    addRegisterClass(MVT::v8i16, &WebAssembly::V128RegClass);

    addRegisterClass(MVT::v4i32, &WebAssembly::V128RegClass);

    addRegisterClass(MVT::v4f32, &WebAssembly::V128RegClass);

    addRegisterClass(MVT::v2i64, &WebAssembly::V128RegClass);

    addRegisterClass(MVT::v2f64, &WebAssembly::V128RegClass);

  }

  if (Subtarget->hasFP16()) {

    addRegisterClass(MVT::v8f16, &WebAssembly::V128RegClass);

  }

  if (Subtarget->hasReferenceTypes()) {

    addRegisterClass(MVT::externref, &WebAssembly::EXTERNREFRegClass);

    addRegisterClass(MVT::funcref, &WebAssembly::FUNCREFRegClass);

    if (Subtarget->hasExceptionHandling()) {

      addRegisterClass(MVT::exnref, &WebAssembly::EXNREFRegClass);

    }

  }

  // Compute derived properties from the register classes.

  computeRegisterProperties(Subtarget->getRegisterInfo());


  // Transform loads and stores to pointers in address space 1 to loads and

  // stores to WebAssembly global variables, outside linear memory.

  for (auto T : {MVT::i32, MVT::i64, MVT::f32, MVT::f64}) {

    setOperationAction(ISD::LOAD, T, Custom);

    setOperationAction(ISD::STORE, T, Custom);

  }

  if (Subtarget->hasSIMD128()) {

    for (auto T : {MVT::v16i8, MVT::v8i16, MVT::v4i32, MVT::v4f32, MVT::v2i64,

                   MVT::v2f64}) {

      setOperationAction(ISD::LOAD, T, Custom);

      setOperationAction(ISD::STORE, T, Custom);

    }

  }

  if (Subtarget->hasFP16()) {

    setOperationAction(ISD::LOAD, MVT::v8f16, Custom);

    setOperationAction(ISD::STORE, MVT::v8f16, Custom);

  }

  if (Subtarget->hasReferenceTypes()) {

    // We need custom load and store lowering for both externref, funcref and

    // Other. The MVT::Other here represents tables of reference types.

    for (auto T : {MVT::externref, MVT::funcref, MVT::Other}) {

      setOperationAction(ISD::LOAD, T, Custom);

      setOperationAction(ISD::STORE, T, Custom);

    }

  }


  setOperationAction(ISD::GlobalAddress, MVTPtr, Custom);

  setOperationAction(ISD::GlobalTLSAddress, MVTPtr, Custom);

  setOperationAction(ISD::ExternalSymbol, MVTPtr, Custom);

  setOperationAction(ISD::JumpTable, MVTPtr, Custom);

  setOperationAction(ISD::BlockAddress, MVTPtr, Custom);

  setOperationAction(ISD::BRIND, MVT::Other, Custom);

  setOperationAction(ISD::CLEAR_CACHE, MVT::Other, Custom);


  // Take the default expansion for va_arg, va_copy, and va_end. There is no

  // default action for va_start, so we do that custom.

  setOperationAction(ISD::VASTART, MVT::Other, Custom);

  setOperationAction(ISD::VAARG, MVT::Other, Expand);

  setOperationAction(ISD::VACOPY, MVT::Other, Expand);

  setOperationAction(ISD::VAEND, MVT::Other, Expand);


  for (auto T : {MVT::f32, MVT::f64, MVT::v4f32, MVT::v2f64, MVT::v8f16}) {

    if (!Subtarget->hasFP16() && T == MVT::v8f16) {

      continue;

    }

    // Don't expand the floating-point types to constant pools.

    setOperationAction(ISD::ConstantFP, T, Legal);

    // Expand floating-point comparisons.

    for (auto CC : {ISD::SETO, ISD::SETUO, ISD::SETUEQ, ISD::SETONE,

                    ISD::SETULT, ISD::SETULE, ISD::SETUGT, ISD::SETUGE})

      setCondCodeAction(CC, T, Expand);

    // Expand floating-point library function operators.

    for (auto Op :

         {ISD::FSIN, ISD::FCOS, ISD::FSINCOS, ISD::FPOW, ISD::FREM, ISD::FMA})

      setOperationAction(Op, T, Expand);

    // Note supported floating-point library function operators that otherwise

    // default to expand.

    for (auto Op : {ISD::FCEIL, ISD::FFLOOR, ISD::FTRUNC, ISD::FNEARBYINT,

                    ISD::FRINT, ISD::FROUNDEVEN})

      setOperationAction(Op, T, Legal);

    // Support minimum and maximum, which otherwise default to expand.

    setOperationAction(ISD::FMINIMUM, T, Legal);

    setOperationAction(ISD::FMAXIMUM, T, Legal);

    // When experimental v8f16 support is enabled these instructions don't need

    // to be expanded.

    if (T != MVT::v8f16) {

      setOperationAction(ISD::FP16_TO_FP, T, Expand);

      setOperationAction(ISD::FP_TO_FP16, T, Expand);

    }

    setLoadExtAction(ISD::EXTLOAD, T, MVT::f16, Expand);

    setTruncStoreAction(T, MVT::f16, Expand);

  }


  // Expand unavailable integer operations.

  for (auto Op :

       {ISD::BSWAP, ISD::SMUL_LOHI, ISD::UMUL_LOHI, ISD::MULHS, ISD::MULHU,

        ISD::SDIVREM, ISD::UDIVREM, ISD::SHL_PARTS, ISD::SRA_PARTS,

        ISD::SRL_PARTS, ISD::ADDC, ISD::ADDE, ISD::SUBC, ISD::SUBE}) {

    for (auto T : {MVT::i32, MVT::i64})

      setOperationAction(Op, T, Expand);

    if (Subtarget->hasSIMD128())

      for (auto T : {MVT::v16i8, MVT::v8i16, MVT::v4i32, MVT::v2i64})

        setOperationAction(Op, T, Expand);

  }


  if (Subtarget->hasWideArithmetic()) {

    setOperationAction(ISD::ADD, MVT::i128, Custom);

    setOperationAction(ISD::SUB, MVT::i128, Custom);

    setOperationAction(ISD::SMUL_LOHI, MVT::i64, Custom);

    setOperationAction(ISD::UMUL_LOHI, MVT::i64, Custom);

    setOperationAction(ISD::UADDO, MVT::i64, Custom);

  }


  if (Subtarget->hasNontrappingFPToInt())

    for (auto Op : {ISD::FP_TO_SINT_SAT, ISD::FP_TO_UINT_SAT})

      for (auto T : {MVT::i32, MVT::i64})

        setOperationAction(Op, T, Custom);


  // SIMD-specific configuration

  if (Subtarget->hasSIMD128()) {


    // Combine partial.reduce.add before legalization gets confused.

    setTargetDAGCombine(ISD::INTRINSIC_WO_CHAIN);


    // Combine wide-vector muls, with extend inputs, to extmul_half.

    setTargetDAGCombine(ISD::MUL);


    // Combine vector mask reductions into alltrue/anytrue

    setTargetDAGCombine(ISD::SETCC);


    // Convert vector to integer bitcasts to bitmask

    setTargetDAGCombine(ISD::BITCAST);


    // Hoist bitcasts out of shuffles

    setTargetDAGCombine(ISD::VECTOR_SHUFFLE);


    // Combine extends of extract_subvectors into widening ops

    setTargetDAGCombine({ISD::SIGN_EXTEND, ISD::ZERO_EXTEND});


    // Combine int_to_fp or fp_extend of extract_vectors and vice versa into

    // conversions ops

    setTargetDAGCombine({ISD::SINT_TO_FP, ISD::UINT_TO_FP, ISD::FP_EXTEND,

                         ISD::EXTRACT_SUBVECTOR});


    // Combine fp_to_{s,u}int_sat or fp_round of concat_vectors or vice versa

    // into conversion ops

    setTargetDAGCombine({ISD::FP_TO_SINT_SAT, ISD::FP_TO_UINT_SAT,

                         ISD::FP_ROUND, ISD::CONCAT_VECTORS});


    setTargetDAGCombine(ISD::TRUNCATE);


    // Support saturating add/sub for i8x16 and i16x8

    for (auto Op : {ISD::SADDSAT, ISD::UADDSAT, ISD::SSUBSAT, ISD::USUBSAT})

      for (auto T : {MVT::v16i8, MVT::v8i16})

        setOperationAction(Op, T, Legal);


    // Support integer abs

    for (auto T : {MVT::v16i8, MVT::v8i16, MVT::v4i32, MVT::v2i64})

      setOperationAction(ISD::ABS, T, Legal);


    // Custom lower BUILD_VECTORs to minimize number of replace_lanes

    for (auto T : {MVT::v16i8, MVT::v8i16, MVT::v4i32, MVT::v4f32, MVT::v2i64,

                   MVT::v2f64})

      setOperationAction(ISD::BUILD_VECTOR, T, Custom);


    if (Subtarget->hasFP16())

      setOperationAction(ISD::BUILD_VECTOR, MVT::f16, Custom);


    // We have custom shuffle lowering to expose the shuffle mask

    for (auto T : {MVT::v16i8, MVT::v8i16, MVT::v4i32, MVT::v4f32, MVT::v2i64,

                   MVT::v2f64})

      setOperationAction(ISD::VECTOR_SHUFFLE, T, Custom);


    if (Subtarget->hasFP16())

      setOperationAction(ISD::VECTOR_SHUFFLE, MVT::v8f16, Custom);


    // Support splatting

    for (auto T : {MVT::v16i8, MVT::v8i16, MVT::v4i32, MVT::v4f32, MVT::v2i64,

                   MVT::v2f64})

      setOperationAction(ISD::SPLAT_VECTOR, T, Legal);


    setOperationAction(ISD::AVGCEILU, {MVT::v8i16, MVT::v16i8}, Legal);


    // Custom lowering since wasm shifts must have a scalar shift amount

    for (auto Op : {ISD::SHL, ISD::SRA, ISD::SRL})

      for (auto T : {MVT::v16i8, MVT::v8i16, MVT::v4i32, MVT::v2i64})

        setOperationAction(Op, T, Custom);


    // Custom lower lane accesses to expand out variable indices

    for (auto Op : {ISD::EXTRACT_VECTOR_ELT, ISD::INSERT_VECTOR_ELT})

      for (auto T : {MVT::v16i8, MVT::v8i16, MVT::v4i32, MVT::v4f32, MVT::v2i64,

                     MVT::v2f64})

        setOperationAction(Op, T, Custom);


    // There is no i8x16.mul instruction

    setOperationAction(ISD::MUL, MVT::v16i8, Expand);


    // There is no vector conditional select instruction

    for (auto T : {MVT::v16i8, MVT::v8i16, MVT::v4i32, MVT::v4f32, MVT::v2i64,

                   MVT::v2f64})

      setOperationAction(ISD::SELECT_CC, T, Expand);


    // Expand integer operations supported for scalars but not SIMD

    for (auto Op :

         {ISD::SDIV, ISD::UDIV, ISD::SREM, ISD::UREM, ISD::ROTL, ISD::ROTR})

      for (auto T : {MVT::v16i8, MVT::v8i16, MVT::v4i32, MVT::v2i64})

        setOperationAction(Op, T, Expand);


    // But we do have integer min and max operations

    for (auto Op : {ISD::SMIN, ISD::SMAX, ISD::UMIN, ISD::UMAX})

      for (auto T : {MVT::v16i8, MVT::v8i16, MVT::v4i32})

        setOperationAction(Op, T, Legal);


    // And we have popcnt for i8x16. It can be used to expand ctlz/cttz.

    setOperationAction(ISD::CTPOP, MVT::v16i8, Legal);

    setOperationAction(ISD::CTLZ, MVT::v16i8, Expand);

    setOperationAction(ISD::CTTZ, MVT::v16i8, Expand);


    // Custom lower bit counting operations for other types to scalarize them.

    for (auto Op : {ISD::CTLZ, ISD::CTTZ, ISD::CTPOP})

      for (auto T : {MVT::v8i16, MVT::v4i32, MVT::v2i64})

        setOperationAction(Op, T, Custom);


    // Expand float operations supported for scalars but not SIMD

    for (auto Op : {ISD::FCOPYSIGN, ISD::FLOG, ISD::FLOG2, ISD::FLOG10,

                    ISD::FEXP, ISD::FEXP2, ISD::FEXP10})

      for (auto T : {MVT::v4f32, MVT::v2f64})

        setOperationAction(Op, T, Expand);


    // Unsigned comparison operations are unavailable for i64x2 vectors.

    for (auto CC : {ISD::SETUGT, ISD::SETUGE, ISD::SETULT, ISD::SETULE})

      setCondCodeAction(CC, MVT::v2i64, Custom);


    // 64x2 conversions are not in the spec

    for (auto Op :

         {ISD::SINT_TO_FP, ISD::UINT_TO_FP, ISD::FP_TO_SINT, ISD::FP_TO_UINT})

      for (auto T : {MVT::v2i64, MVT::v2f64})

        setOperationAction(Op, T, Expand);


    // But saturating fp_to_int converstions are

    for (auto Op : {ISD::FP_TO_SINT_SAT, ISD::FP_TO_UINT_SAT}) {

      setOperationAction(Op, MVT::v4i32, Custom);

      if (Subtarget->hasFP16()) {

        setOperationAction(Op, MVT::v8i16, Custom);

      }

    }


    // Support vector extending

    for (auto T : MVT::integer_fixedlen_vector_valuetypes()) {

      setOperationAction(ISD::SIGN_EXTEND_VECTOR_INREG, T, Custom);

      setOperationAction(ISD::ZERO_EXTEND_VECTOR_INREG, T, Custom);

    }

  }


  // As a special case, these operators use the type to mean the type to

  // sign-extend from.

  setOperationAction(ISD::SIGN_EXTEND_INREG, MVT::i1, Expand);

  if (!Subtarget->hasSignExt()) {

    // Sign extends are legal only when extending a vector extract

    auto Action = Subtarget->hasSIMD128() ? Custom : Expand;

    for (auto T : {MVT::i8, MVT::i16, MVT::i32})

      setOperationAction(ISD::SIGN_EXTEND_INREG, T, Action);

  }

  for (auto T : MVT::integer_fixedlen_vector_valuetypes())

    setOperationAction(ISD::SIGN_EXTEND_INREG, T, Expand);


  // Dynamic stack allocation: use the default expansion.

  setOperationAction(ISD::STACKSAVE, MVT::Other, Expand);

  setOperationAction(ISD::STACKRESTORE, MVT::Other, Expand);

  setOperationAction(ISD::DYNAMIC_STACKALLOC, MVTPtr, Expand);


  setOperationAction(ISD::FrameIndex, MVT::i32, Custom);

  setOperationAction(ISD::FrameIndex, MVT::i64, Custom);

  setOperationAction(ISD::CopyToReg, MVT::Other, Custom);


  // Expand these forms; we pattern-match the forms that we can handle in isel.

  for (auto T : {MVT::i32, MVT::i64, MVT::f32, MVT::f64})

    for (auto Op : {ISD::BR_CC, ISD::SELECT_CC})

      setOperationAction(Op, T, Expand);


  // We have custom switch handling.

  setOperationAction(ISD::BR_JT, MVT::Other, Custom);


  // WebAssembly doesn't have:

  //  - Floating-point extending loads.

  //  - Floating-point truncating stores.

  //  - i1 extending loads.

  //  - truncating SIMD stores and most extending loads

  setLoadExtAction(ISD::EXTLOAD, MVT::f64, MVT::f32, Expand);

  setTruncStoreAction(MVT::f64, MVT::f32, Expand);

  for (auto T : MVT::integer_valuetypes())

    for (auto Ext : {ISD::EXTLOAD, ISD::ZEXTLOAD, ISD::SEXTLOAD})

      setLoadExtAction(Ext, T, MVT::i1, Promote);

  if (Subtarget->hasSIMD128()) {

    for (auto T : {MVT::v16i8, MVT::v8i16, MVT::v4i32, MVT::v2i64, MVT::v4f32,

                   MVT::v2f64}) {

      for (auto MemT : MVT::fixedlen_vector_valuetypes()) {

        if (MVT(T) != MemT) {

          setTruncStoreAction(T, MemT, Expand);

          for (auto Ext : {ISD::EXTLOAD, ISD::ZEXTLOAD, ISD::SEXTLOAD})

            setLoadExtAction(Ext, T, MemT, Expand);

        }

      }

    }

    // But some vector extending loads are legal

    for (auto Ext : {ISD::EXTLOAD, ISD::SEXTLOAD, ISD::ZEXTLOAD}) {

      setLoadExtAction(Ext, MVT::v8i16, MVT::v8i8, Legal);

      setLoadExtAction(Ext, MVT::v4i32, MVT::v4i16, Legal);

      setLoadExtAction(Ext, MVT::v2i64, MVT::v2i32, Legal);

    }

    setLoadExtAction(ISD::EXTLOAD, MVT::v2f64, MVT::v2f32, Legal);

  }


  // Don't do anything clever with build_pairs

  setOperationAction(ISD::BUILD_PAIR, MVT::i64, Expand);


  // Trap lowers to wasm unreachable

  setOperationAction(ISD::TRAP, MVT::Other, Legal);

  setOperationAction(ISD::DEBUGTRAP, MVT::Other, Legal);


  // Exception handling intrinsics

  setOperationAction(ISD::INTRINSIC_WO_CHAIN, MVT::Other, Custom);

  setOperationAction(ISD::INTRINSIC_W_CHAIN, MVT::Other, Custom);

  setOperationAction(ISD::INTRINSIC_VOID, MVT::Other, Custom);


  setMaxAtomicSizeInBitsSupported(64);


  // Always convert switches to br_tables unless there is only one case, which

  // is equivalent to a simple branch. This reduces code size for wasm, and we

  // defer possible jump table optimizations to the VM.

  setMinimumJumpTableEntries(2);

}


MVT WebAssemblyTargetLowering::getPointerTy(const DataLayout &DL,

                                            uint32_t AS) const {

  if (AS == WebAssembly::WasmAddressSpace::WASM_ADDRESS_SPACE_EXTERNREF)

    return MVT::externref;

  if (AS == WebAssembly::WasmAddressSpace::WASM_ADDRESS_SPACE_FUNCREF)

    return MVT::funcref;

  return TargetLowering::getPointerTy(DL, AS);

}


MVT WebAssemblyTargetLowering::getPointerMemTy(const DataLayout &DL,

                                               uint32_t AS) const {

  if (AS == WebAssembly::WasmAddressSpace::WASM_ADDRESS_SPACE_EXTERNREF)

    return MVT::externref;

  if (AS == WebAssembly::WasmAddressSpace::WASM_ADDRESS_SPACE_FUNCREF)

    return MVT::funcref;

  return TargetLowering::getPointerMemTy(DL, AS);

}


bool WebAssemblyTargetLowering::shouldExpandPartialReductionIntrinsic(

    const IntrinsicInst *I) const {

  if (I->getIntrinsicID() != Intrinsic::experimental_vector_partial_reduce_add)

    return true;


  EVT VT = EVT::getEVT(I->getType());

  auto Op1 = I->getOperand(1);


  if (auto *InputInst = dyn_cast<Instruction>(Op1)) {

    if (InstructionOpcodeToISD(InputInst->getOpcode()) != ISD::MUL)

      return true;


    if (isa<Instruction>(InputInst->getOperand(0)) &&

        isa<Instruction>(InputInst->getOperand(1))) {

      // dot only supports signed inputs but also support lowering unsigned.

      if (cast<Instruction>(InputInst->getOperand(0))->getOpcode() !=

          cast<Instruction>(InputInst->getOperand(1))->getOpcode())

        return true;


      EVT Op1VT = EVT::getEVT(Op1->getType());

      if (Op1VT.getVectorElementType() == VT.getVectorElementType() &&

          ((VT.getVectorElementCount() * 2 == Op1VT.getVectorElementCount()) ||

           (VT.getVectorElementCount() * 4 == Op1VT.getVectorElementCount())))

        return false;

    }

  }

  return true;

}


TargetLowering::AtomicExpansionKind

WebAssemblyTargetLowering::shouldExpandAtomicRMWInIR(AtomicRMWInst *AI) const {

  // We have wasm instructions for these

  switch (AI->getOperation()) {

  case AtomicRMWInst::Add:

  case AtomicRMWInst::Sub:

  case AtomicRMWInst::And:

  case AtomicRMWInst::Or:

  case AtomicRMWInst::Xor:

  case AtomicRMWInst::Xchg:

    return AtomicExpansionKind::None;

  default:

    break;

  }

  return AtomicExpansionKind::CmpXChg;

}


bool WebAssemblyTargetLowering::shouldScalarizeBinop(SDValue VecOp) const {

  // Implementation copied from X86TargetLowering.

  unsigned Opc = VecOp.getOpcode();


  // Assume target opcodes can't be scalarized.

  // TODO - do we have any exceptions?

  if (Opc >= ISD::BUILTIN_OP_END || !isBinOp(Opc))

    return false;


  // If the vector op is not supported, try to convert to scalar.

  EVT VecVT = VecOp.getValueType();

  if (!isOperationLegalOrCustomOrPromote(Opc, VecVT))

    return true;


  // If the vector op is supported, but the scalar op is not, the transform may

  // not be worthwhile.

  EVT ScalarVT = VecVT.getScalarType();

  return isOperationLegalOrCustomOrPromote(Opc, ScalarVT);

}


FastISel *WebAssemblyTargetLowering::createFastISel(

    FunctionLoweringInfo &FuncInfo, const TargetLibraryInfo *LibInfo) const {

  return WebAssembly::createFastISel(FuncInfo, LibInfo);

}


MVT WebAssemblyTargetLowering::getScalarShiftAmountTy(const DataLayout & /*DL*/,

                                                      EVT VT) const {

  unsigned BitWidth = NextPowerOf2(VT.getSizeInBits() - 1);

  if (BitWidth > 1 && BitWidth < 8)

    BitWidth = 8;


  if (BitWidth > 64) {

    // The shift will be lowered to a libcall, and compiler-rt libcalls expect

    // the count to be an i32.

    BitWidth = 32;

    assert(BitWidth >= Log2_32_Ceil(VT.getSizeInBits()) &&

           "32-bit shift counts ought to be enough for anyone");

  }


  MVT Result = MVT::getIntegerVT(BitWidth);

  assert(Result != MVT::INVALID_SIMPLE_VALUE_TYPE &&

         "Unable to represent scalar shift amount type");

  return Result;

}


// Lower an fp-to-int conversion operator from the LLVM opcode, which has an

// undefined result on invalid/overflow, to the WebAssembly opcode, which

// traps on invalid/overflow.

static MachineBasicBlock *LowerFPToInt(MachineInstr &MI, DebugLoc DL,

                                       MachineBasicBlock *BB,

                                       const TargetInstrInfo &TII,

                                       bool IsUnsigned, bool Int64,

                                       bool Float64, unsigned LoweredOpcode) {

  MachineRegisterInfo &MRI = BB->getParent()->getRegInfo();


  Register OutReg = MI.getOperand(0).getReg();

  Register InReg = MI.getOperand(1).getReg();


  unsigned Abs = Float64 ? WebAssembly::ABS_F64 : WebAssembly::ABS_F32;

  unsigned FConst = Float64 ? WebAssembly::CONST_F64 : WebAssembly::CONST_F32;

  unsigned LT = Float64 ? WebAssembly::LT_F64 : WebAssembly::LT_F32;

  unsigned GE = Float64 ? WebAssembly::GE_F64 : WebAssembly::GE_F32;

  unsigned IConst = Int64 ? WebAssembly::CONST_I64 : WebAssembly::CONST_I32;

  unsigned Eqz = WebAssembly::EQZ_I32;

  unsigned And = WebAssembly::AND_I32;

  int64_t Limit = Int64 ? INT64_MIN : INT32_MIN;

  int64_t Substitute = IsUnsigned ? 0 : Limit;

  double CmpVal = IsUnsigned ? -(double)Limit * 2.0 : -(double)Limit;

  auto &Context = BB->getParent()->getFunction().getContext();

  Type *Ty = Float64 ? Type::getDoubleTy(Context) : Type::getFloatTy(Context);


  const BasicBlock *LLVMBB = BB->getBasicBlock();

  MachineFunction *F = BB->getParent();

  MachineBasicBlock *TrueMBB = F->CreateMachineBasicBlock(LLVMBB);

  MachineBasicBlock *FalseMBB = F->CreateMachineBasicBlock(LLVMBB);

  MachineBasicBlock *DoneMBB = F->CreateMachineBasicBlock(LLVMBB);


  MachineFunction::iterator It = ++BB->getIterator();

  F->insert(It, FalseMBB);

  F->insert(It, TrueMBB);

  F->insert(It, DoneMBB);


  // Transfer the remainder of BB and its successor edges to DoneMBB.

  DoneMBB->splice(DoneMBB->begin(), BB, std::next(MI.getIterator()), BB->end());

  DoneMBB->transferSuccessorsAndUpdatePHIs(BB);


  BB->addSuccessor(TrueMBB);

  BB->addSuccessor(FalseMBB);

  TrueMBB->addSuccessor(DoneMBB);

  FalseMBB->addSuccessor(DoneMBB);


  unsigned Tmp0, Tmp1, CmpReg, EqzReg, FalseReg, TrueReg;

  Tmp0 = MRI.createVirtualRegister(MRI.getRegClass(InReg));

  Tmp1 = MRI.createVirtualRegister(MRI.getRegClass(InReg));

  CmpReg = MRI.createVirtualRegister(&WebAssembly::I32RegClass);

  EqzReg = MRI.createVirtualRegister(&WebAssembly::I32RegClass);

  FalseReg = MRI.createVirtualRegister(MRI.getRegClass(OutReg));

  TrueReg = MRI.createVirtualRegister(MRI.getRegClass(OutReg));


  MI.eraseFromParent();

  // For signed numbers, we can do a single comparison to determine whether

  // fabs(x) is within range.

  if (IsUnsigned) {

    Tmp0 = InReg;

  } else {

    BuildMI(BB, DL, TII.get(Abs), Tmp0).addReg(InReg);

  }

  BuildMI(BB, DL, TII.get(FConst), Tmp1)

      .addFPImm(cast<ConstantFP>(ConstantFP::get(Ty, CmpVal)));

  BuildMI(BB, DL, TII.get(LT), CmpReg).addReg(Tmp0).addReg(Tmp1);


  // For unsigned numbers, we have to do a separate comparison with zero.

  if (IsUnsigned) {

    Tmp1 = MRI.createVirtualRegister(MRI.getRegClass(InReg));

    Register SecondCmpReg =

        MRI.createVirtualRegister(&WebAssembly::I32RegClass);

    Register AndReg = MRI.createVirtualRegister(&WebAssembly::I32RegClass);

    BuildMI(BB, DL, TII.get(FConst), Tmp1)

        .addFPImm(cast<ConstantFP>(ConstantFP::get(Ty, 0.0)));

    BuildMI(BB, DL, TII.get(GE), SecondCmpReg).addReg(Tmp0).addReg(Tmp1);

    BuildMI(BB, DL, TII.get(And), AndReg).addReg(CmpReg).addReg(SecondCmpReg);

    CmpReg = AndReg;

  }


  BuildMI(BB, DL, TII.get(Eqz), EqzReg).addReg(CmpReg);


  // Create the CFG diamond to select between doing the conversion or using

  // the substitute value.

  BuildMI(BB, DL, TII.get(WebAssembly::BR_IF)).addMBB(TrueMBB).addReg(EqzReg);

  BuildMI(FalseMBB, DL, TII.get(LoweredOpcode), FalseReg).addReg(InReg);

  BuildMI(FalseMBB, DL, TII.get(WebAssembly::BR)).addMBB(DoneMBB);

  BuildMI(TrueMBB, DL, TII.get(IConst), TrueReg).addImm(Substitute);

  BuildMI(*DoneMBB, DoneMBB->begin(), DL, TII.get(TargetOpcode::PHI), OutReg)

      .addReg(FalseReg)

      .addMBB(FalseMBB)

      .addReg(TrueReg)

      .addMBB(TrueMBB);


  return DoneMBB;

}


// Lower a `MEMCPY` instruction into a CFG triangle around a `MEMORY_COPY`

// instuction to handle the zero-length case.

static MachineBasicBlock *LowerMemcpy(MachineInstr &MI, DebugLoc DL,

                                      MachineBasicBlock *BB,

                                      const TargetInstrInfo &TII, bool Int64) {

  MachineRegisterInfo &MRI = BB->getParent()->getRegInfo();


  MachineOperand DstMem = MI.getOperand(0);

  MachineOperand SrcMem = MI.getOperand(1);

  MachineOperand Dst = MI.getOperand(2);

  MachineOperand Src = MI.getOperand(3);

  MachineOperand Len = MI.getOperand(4);


  // We're going to add an extra use to `Len` to test if it's zero; that

  // use shouldn't be a kill, even if the original use is.

  MachineOperand NoKillLen = Len;

  NoKillLen.setIsKill(false);


  // Decide on which `MachineInstr` opcode we're going to use.

  unsigned Eqz = Int64 ? WebAssembly::EQZ_I64 : WebAssembly::EQZ_I32;

  unsigned MemoryCopy =

      Int64 ? WebAssembly::MEMORY_COPY_A64 : WebAssembly::MEMORY_COPY_A32;


  // Create two new basic blocks; one for the new `memory.fill` that we can

  // branch over, and one for the rest of the instructions after the original

  // `memory.fill`.

  const BasicBlock *LLVMBB = BB->getBasicBlock();

  MachineFunction *F = BB->getParent();

  MachineBasicBlock *TrueMBB = F->CreateMachineBasicBlock(LLVMBB);

  MachineBasicBlock *DoneMBB = F->CreateMachineBasicBlock(LLVMBB);


  MachineFunction::iterator It = ++BB->getIterator();

  F->insert(It, TrueMBB);

  F->insert(It, DoneMBB);


  // Transfer the remainder of BB and its successor edges to DoneMBB.

  DoneMBB->splice(DoneMBB->begin(), BB, std::next(MI.getIterator()), BB->end());

  DoneMBB->transferSuccessorsAndUpdatePHIs(BB);


  // Connect the CFG edges.

  BB->addSuccessor(TrueMBB);

  BB->addSuccessor(DoneMBB);

  TrueMBB->addSuccessor(DoneMBB);


  // Create a virtual register for the `Eqz` result.

  unsigned EqzReg;

  EqzReg = MRI.createVirtualRegister(&WebAssembly::I32RegClass);


  // Erase the original `memory.copy`.

  MI.eraseFromParent();


  // Test if `Len` is zero.

  BuildMI(BB, DL, TII.get(Eqz), EqzReg).add(NoKillLen);


  // Insert a new `memory.copy`.

  BuildMI(TrueMBB, DL, TII.get(MemoryCopy))

      .add(DstMem)

      .add(SrcMem)

      .add(Dst)

      .add(Src)

      .add(Len);


  // Create the CFG triangle.

  BuildMI(BB, DL, TII.get(WebAssembly::BR_IF)).addMBB(DoneMBB).addReg(EqzReg);

  BuildMI(TrueMBB, DL, TII.get(WebAssembly::BR)).addMBB(DoneMBB);


  return DoneMBB;

}


// Lower a `MEMSET` instruction into a CFG triangle around a `MEMORY_FILL`

// instuction to handle the zero-length case.

static MachineBasicBlock *LowerMemset(MachineInstr &MI, DebugLoc DL,

                                      MachineBasicBlock *BB,

                                      const TargetInstrInfo &TII, bool Int64) {

  MachineRegisterInfo &MRI = BB->getParent()->getRegInfo();


  MachineOperand Mem = MI.getOperand(0);

  MachineOperand Dst = MI.getOperand(1);

  MachineOperand Val = MI.getOperand(2);

  MachineOperand Len = MI.getOperand(3);


  // We're going to add an extra use to `Len` to test if it's zero; that

  // use shouldn't be a kill, even if the original use is.

  MachineOperand NoKillLen = Len;

  NoKillLen.setIsKill(false);


  // Decide on which `MachineInstr` opcode we're going to use.

  unsigned Eqz = Int64 ? WebAssembly::EQZ_I64 : WebAssembly::EQZ_I32;

  unsigned MemoryFill =

      Int64 ? WebAssembly::MEMORY_FILL_A64 : WebAssembly::MEMORY_FILL_A32;


  // Create two new basic blocks; one for the new `memory.fill` that we can

  // branch over, and one for the rest of the instructions after the original

  // `memory.fill`.

  const BasicBlock *LLVMBB = BB->getBasicBlock();

  MachineFunction *F = BB->getParent();

  MachineBasicBlock *TrueMBB = F->CreateMachineBasicBlock(LLVMBB);

  MachineBasicBlock *DoneMBB = F->CreateMachineBasicBlock(LLVMBB);


  MachineFunction::iterator It = ++BB->getIterator();

  F->insert(It, TrueMBB);

  F->insert(It, DoneMBB);


  // Transfer the remainder of BB and its successor edges to DoneMBB.

  DoneMBB->splice(DoneMBB->begin(), BB, std::next(MI.getIterator()), BB->end());

  DoneMBB->transferSuccessorsAndUpdatePHIs(BB);


  // Connect the CFG edges.

  BB->addSuccessor(TrueMBB);

  BB->addSuccessor(DoneMBB);

  TrueMBB->addSuccessor(DoneMBB);


  // Create a virtual register for the `Eqz` result.

  unsigned EqzReg;

  EqzReg = MRI.createVirtualRegister(&WebAssembly::I32RegClass);


  // Erase the original `memory.fill`.

  MI.eraseFromParent();


  // Test if `Len` is zero.

  BuildMI(BB, DL, TII.get(Eqz), EqzReg).add(NoKillLen);


  // Insert a new `memory.copy`.

  BuildMI(TrueMBB, DL, TII.get(MemoryFill)).add(Mem).add(Dst).add(Val).add(Len);


  // Create the CFG triangle.

  BuildMI(BB, DL, TII.get(WebAssembly::BR_IF)).addMBB(DoneMBB).addReg(EqzReg);

  BuildMI(TrueMBB, DL, TII.get(WebAssembly::BR)).addMBB(DoneMBB);


  return DoneMBB;

}


static MachineBasicBlock *

LowerCallResults(MachineInstr &CallResults, DebugLoc DL, MachineBasicBlock *BB,

                 const WebAssemblySubtarget *Subtarget,

                 const TargetInstrInfo &TII) {

  MachineInstr &CallParams = *CallResults.getPrevNode();

  assert(CallParams.getOpcode() == WebAssembly::CALL_PARAMS);

  assert(CallResults.getOpcode() == WebAssembly::CALL_RESULTS ||

         CallResults.getOpcode() == WebAssembly::RET_CALL_RESULTS);


  bool IsIndirect =

      CallParams.getOperand(0).isReg() || CallParams.getOperand(0).isFI();

  bool IsRetCall = CallResults.getOpcode() == WebAssembly::RET_CALL_RESULTS;


  bool IsFuncrefCall = false;

  if (IsIndirect && CallParams.getOperand(0).isReg()) {

    Register Reg = CallParams.getOperand(0).getReg();

    const MachineFunction *MF = BB->getParent();

    const MachineRegisterInfo &MRI = MF->getRegInfo();

    const TargetRegisterClass *TRC = MRI.getRegClass(Reg);

    IsFuncrefCall = (TRC == &WebAssembly::FUNCREFRegClass);

    assert(!IsFuncrefCall || Subtarget->hasReferenceTypes());

  }


  unsigned CallOp;

  if (IsIndirect && IsRetCall) {

    CallOp = WebAssembly::RET_CALL_INDIRECT;

  } else if (IsIndirect) {

    CallOp = WebAssembly::CALL_INDIRECT;

  } else if (IsRetCall) {

    CallOp = WebAssembly::RET_CALL;

  } else {

    CallOp = WebAssembly::CALL;

  }


  MachineFunction &MF = *BB->getParent();

  const MCInstrDesc &MCID = TII.get(CallOp);

  MachineInstrBuilder MIB(MF, MF.CreateMachineInstr(MCID, DL));


  // Move the function pointer to the end of the arguments for indirect calls

  if (IsIndirect) {

    auto FnPtr = CallParams.getOperand(0);

    CallParams.removeOperand(0);


    // For funcrefs, call_indirect is done through __funcref_call_table and the

    // funcref is always installed in slot 0 of the table, therefore instead of

    // having the function pointer added at the end of the params list, a zero

    // (the index in

    // __funcref_call_table is added).

    if (IsFuncrefCall) {

      Register RegZero =

          MF.getRegInfo().createVirtualRegister(&WebAssembly::I32RegClass);

      MachineInstrBuilder MIBC0 =

          BuildMI(MF, DL, TII.get(WebAssembly::CONST_I32), RegZero).addImm(0);


      BB->insert(CallResults.getIterator(), MIBC0);

      MachineInstrBuilder(MF, CallParams).addReg(RegZero);

    } else

      CallParams.addOperand(FnPtr);

  }


  for (auto Def : CallResults.defs())

    MIB.add(Def);


  if (IsIndirect) {

    // Placeholder for the type index.

    // This gets replaced with the correct value in WebAssemblyMCInstLower.cpp

    MIB.addImm(0);

    // The table into which this call_indirect indexes.

    MCSymbolWasm *Table = IsFuncrefCall

                              ? WebAssembly::getOrCreateFuncrefCallTableSymbol(

                                    MF.getContext(), Subtarget)

                              : WebAssembly::getOrCreateFunctionTableSymbol(

                                    MF.getContext(), Subtarget);

    if (Subtarget->hasCallIndirectOverlong()) {

      MIB.addSym(Table);

    } else {

      // For the MVP there is at most one table whose number is 0, but we can't

      // write a table symbol or issue relocations.  Instead we just ensure the

      // table is live and write a zero.

      Table->setNoStrip();

      MIB.addImm(0);

    }

  }


  for (auto Use : CallParams.uses())

    MIB.add(Use);


  BB->insert(CallResults.getIterator(), MIB);

  CallParams.eraseFromParent();

  CallResults.eraseFromParent();


  // If this is a funcref call, to avoid hidden GC roots, we need to clear the

  // table slot with ref.null upon call_indirect return.

  //

  // This generates the following code, which comes right after a call_indirect

  // of a funcref:

  //

  //    i32.const 0

  //    ref.null func

  //    table.set __funcref_call_table

  if (IsIndirect && IsFuncrefCall) {

    MCSymbolWasm *Table = WebAssembly::getOrCreateFuncrefCallTableSymbol(

        MF.getContext(), Subtarget);

    Register RegZero =

        MF.getRegInfo().createVirtualRegister(&WebAssembly::I32RegClass);

    MachineInstr *Const0 =

        BuildMI(MF, DL, TII.get(WebAssembly::CONST_I32), RegZero).addImm(0);

    BB->insertAfter(MIB.getInstr()->getIterator(), Const0);


    Register RegFuncref =

        MF.getRegInfo().createVirtualRegister(&WebAssembly::FUNCREFRegClass);

    MachineInstr *RefNull =

        BuildMI(MF, DL, TII.get(WebAssembly::REF_NULL_FUNCREF), RegFuncref);

    BB->insertAfter(Const0->getIterator(), RefNull);


    MachineInstr *TableSet =

        BuildMI(MF, DL, TII.get(WebAssembly::TABLE_SET_FUNCREF))

            .addSym(Table)

            .addReg(RegZero)

            .addReg(RegFuncref);

    BB->insertAfter(RefNull->getIterator(), TableSet);

  }


  return BB;

}


MachineBasicBlock *WebAssemblyTargetLowering::EmitInstrWithCustomInserter(

    MachineInstr &MI, MachineBasicBlock *BB) const {

  const TargetInstrInfo &TII = *Subtarget->getInstrInfo();

  DebugLoc DL = MI.getDebugLoc();


  switch (MI.getOpcode()) {

  default:

    llvm_unreachable("Unexpected instr type to insert");

  case WebAssembly::FP_TO_SINT_I32_F32:

    return LowerFPToInt(MI, DL, BB, TII, false, false, false,

                        WebAssembly::I32_TRUNC_S_F32);

  case WebAssembly::FP_TO_UINT_I32_F32:

    return LowerFPToInt(MI, DL, BB, TII, true, false, false,

                        WebAssembly::I32_TRUNC_U_F32);

  case WebAssembly::FP_TO_SINT_I64_F32:

    return LowerFPToInt(MI, DL, BB, TII, false, true, false,

                        WebAssembly::I64_TRUNC_S_F32);

  case WebAssembly::FP_TO_UINT_I64_F32:

    return LowerFPToInt(MI, DL, BB, TII, true, true, false,

                        WebAssembly::I64_TRUNC_U_F32);

  case WebAssembly::FP_TO_SINT_I32_F64:

    return LowerFPToInt(MI, DL, BB, TII, false, false, true,

                        WebAssembly::I32_TRUNC_S_F64);

  case WebAssembly::FP_TO_UINT_I32_F64:

    return LowerFPToInt(MI, DL, BB, TII, true, false, true,

                        WebAssembly::I32_TRUNC_U_F64);

  case WebAssembly::FP_TO_SINT_I64_F64:

    return LowerFPToInt(MI, DL, BB, TII, false, true, true,

                        WebAssembly::I64_TRUNC_S_F64);

  case WebAssembly::FP_TO_UINT_I64_F64:

    return LowerFPToInt(MI, DL, BB, TII, true, true, true,

                        WebAssembly::I64_TRUNC_U_F64);

  case WebAssembly::MEMCPY_A32:

    return LowerMemcpy(MI, DL, BB, TII, false);

  case WebAssembly::MEMCPY_A64:

    return LowerMemcpy(MI, DL, BB, TII, true);

  case WebAssembly::MEMSET_A32:

    return LowerMemset(MI, DL, BB, TII, false);

  case WebAssembly::MEMSET_A64:

    return LowerMemset(MI, DL, BB, TII, true);

  case WebAssembly::CALL_RESULTS:

  case WebAssembly::RET_CALL_RESULTS:

    return LowerCallResults(MI, DL, BB, Subtarget, TII);

  }

}


const char *

WebAssemblyTargetLowering::getTargetNodeName(unsigned Opcode) const {

  switch (static_cast<WebAssemblyISD::NodeType>(Opcode)) {

  case WebAssemblyISD::FIRST_NUMBER:

    break;

#define HANDLE_NODETYPE(NODE)                                                  \

  case WebAssemblyISD::NODE:                                                   \

    return "WebAssemblyISD::" #NODE;

#include "WebAssemblyISD.def"

#undef HANDLE_NODETYPE

  }

  return nullptr;

}


std::pair<unsigned, const TargetRegisterClass *>

WebAssemblyTargetLowering::getRegForInlineAsmConstraint(

    const TargetRegisterInfo *TRI, StringRef Constraint, MVT VT) const {

  // First, see if this is a constraint that directly corresponds to a

  // WebAssembly register class.

  if (Constraint.size() == 1) {

    switch (Constraint[0]) {

    case 'r':

      assert(VT != MVT::iPTR && "Pointer MVT not expected here");

      if (Subtarget->hasSIMD128() && VT.isVector()) {

        if (VT.getSizeInBits() == 128)

          return std::make_pair(0U, &WebAssembly::V128RegClass);

      }

      if (VT.isInteger() && !VT.isVector()) {

        if (VT.getSizeInBits() <= 32)

          return std::make_pair(0U, &WebAssembly::I32RegClass);

        if (VT.getSizeInBits() <= 64)

          return std::make_pair(0U, &WebAssembly::I64RegClass);

      }

      if (VT.isFloatingPoint() && !VT.isVector()) {

        switch (VT.getSizeInBits()) {

        case 32:

          return std::make_pair(0U, &WebAssembly::F32RegClass);

        case 64:

          return std::make_pair(0U, &WebAssembly::F64RegClass);

        default:

          break;

        }

      }

      break;

    default:

      break;

    }

  }


  return TargetLowering::getRegForInlineAsmConstraint(TRI, Constraint, VT);

}


bool WebAssemblyTargetLowering::isCheapToSpeculateCttz(Type *Ty) const {

  // Assume ctz is a relatively cheap operation.

  return true;

}


bool WebAssemblyTargetLowering::isCheapToSpeculateCtlz(Type *Ty) const {

  // Assume clz is a relatively cheap operation.

  return true;

}


bool WebAssemblyTargetLowering::isLegalAddressingMode(const DataLayout &DL,

                                                      const AddrMode &AM,

                                                      Type *Ty, unsigned AS,

                                                      Instruction *I) const {

  // WebAssembly offsets are added as unsigned without wrapping. The

  // isLegalAddressingMode gives us no way to determine if wrapping could be

  // happening, so we approximate this by accepting only non-negative offsets.

  if (AM.BaseOffs < 0)

    return false;


  // WebAssembly has no scale register operands.

  if (AM.Scale != 0)

    return false;


  // Everything else is legal.

  return true;

}


bool WebAssemblyTargetLowering::allowsMisalignedMemoryAccesses(

    EVT /*VT*/, unsigned /*AddrSpace*/, Align /*Align*/,

    MachineMemOperand::Flags /*Flags*/, unsigned *Fast) const {

  // WebAssembly supports unaligned accesses, though it should be declared

  // with the p2align attribute on loads and stores which do so, and there

  // may be a performance impact. We tell LLVM they're "fast" because

  // for the kinds of things that LLVM uses this for (merging adjacent stores

  // of constants, etc.), WebAssembly implementations will either want the

  // unaligned access or they'll split anyway.

  if (Fast)

    *Fast = 1;

  return true;

}


bool WebAssemblyTargetLowering::isIntDivCheap(EVT VT,

                                              AttributeList Attr) const {

  // The current thinking is that wasm engines will perform this optimization,

  // so we can save on code size.

  return true;

}


bool WebAssemblyTargetLowering::isVectorLoadExtDesirable(SDValue ExtVal) const {

  EVT ExtT = ExtVal.getValueType();

  EVT MemT = cast<LoadSDNode>(ExtVal->getOperand(0))->getValueType(0);

  return (ExtT == MVT::v8i16 && MemT == MVT::v8i8) ||

         (ExtT == MVT::v4i32 && MemT == MVT::v4i16) ||

         (ExtT == MVT::v2i64 && MemT == MVT::v2i32);

}


bool WebAssemblyTargetLowering::isOffsetFoldingLegal(

    const GlobalAddressSDNode *GA) const {

  // Wasm doesn't support function addresses with offsets

  const GlobalValue *GV = GA->getGlobal();

  return isa<Function>(GV) ? false : TargetLowering::isOffsetFoldingLegal(GA);

}


EVT WebAssemblyTargetLowering::getSetCCResultType(const DataLayout &DL,

                                                  LLVMContext &C,

                                                  EVT VT) const {

  if (VT.isVector())

    return VT.changeVectorElementTypeToInteger();


  // So far, all branch instructions in Wasm take an I32 condition.

  // The default TargetLowering::getSetCCResultType returns the pointer size,

  // which would be useful to reduce instruction counts when testing

  // against 64-bit pointers/values if at some point Wasm supports that.

  return EVT::getIntegerVT(C, 32);

}


bool WebAssemblyTargetLowering::getTgtMemIntrinsic(IntrinsicInfo &Info,

                                                   const CallInst &I,

                                                   MachineFunction &MF,

                                                   unsigned Intrinsic) const {

  switch (Intrinsic) {

  case Intrinsic::wasm_memory_atomic_notify:

    Info.opc = ISD::INTRINSIC_W_CHAIN;

    Info.memVT = MVT::i32;

    Info.ptrVal = I.getArgOperand(0);

    Info.offset = 0;

    Info.align = Align(4);

    // atomic.notify instruction does not really load the memory specified with

    // this argument, but MachineMemOperand should either be load or store, so

    // we set this to a load.

    // FIXME Volatile isn't really correct, but currently all LLVM atomic

    // instructions are treated as volatiles in the backend, so we should be

    // consistent. The same applies for wasm_atomic_wait intrinsics too.

    Info.flags = MachineMemOperand::MOVolatile | MachineMemOperand::MOLoad;

    return true;

  case Intrinsic::wasm_memory_atomic_wait32:

    Info.opc = ISD::INTRINSIC_W_CHAIN;

    Info.memVT = MVT::i32;

    Info.ptrVal = I.getArgOperand(0);

    Info.offset = 0;

    Info.align = Align(4);

    Info.flags = MachineMemOperand::MOVolatile | MachineMemOperand::MOLoad;

    return true;

  case Intrinsic::wasm_memory_atomic_wait64:

    Info.opc = ISD::INTRINSIC_W_CHAIN;

    Info.memVT = MVT::i64;

    Info.ptrVal = I.getArgOperand(0);

    Info.offset = 0;

    Info.align = Align(8);

    Info.flags = MachineMemOperand::MOVolatile | MachineMemOperand::MOLoad;

    return true;

  case Intrinsic::wasm_loadf16_f32:

    Info.opc = ISD::INTRINSIC_W_CHAIN;

    Info.memVT = MVT::f16;

    Info.ptrVal = I.getArgOperand(0);

    Info.offset = 0;

    Info.align = Align(2);

    Info.flags = MachineMemOperand::MOLoad;

    return true;

  case Intrinsic::wasm_storef16_f32:

    Info.opc = ISD::INTRINSIC_VOID;

    Info.memVT = MVT::f16;

    Info.ptrVal = I.getArgOperand(1);

    Info.offset = 0;

    Info.align = Align(2);

    Info.flags = MachineMemOperand::MOStore;

    return true;

  default:

    return false;

  }

}


void WebAssemblyTargetLowering::computeKnownBitsForTargetNode(

    const SDValue Op, KnownBits &Known, const APInt &DemandedElts,

    const SelectionDAG &DAG, unsigned Depth) const {

  switch (Op.getOpcode()) {

  default:

    break;

  case ISD::INTRINSIC_WO_CHAIN: {

    unsigned IntNo = Op.getConstantOperandVal(0);

    switch (IntNo) {

    default:

      break;

    case Intrinsic::wasm_bitmask: {

      unsigned BitWidth = Known.getBitWidth();

      EVT VT = Op.getOperand(1).getSimpleValueType();

      unsigned PossibleBits = VT.getVectorNumElements();

      APInt ZeroMask = APInt::getHighBitsSet(BitWidth, BitWidth - PossibleBits);

      Known.Zero |= ZeroMask;

      break;

    }

    }

    break;

  }


  // For 128-bit addition if the upper bits are all zero then it's known that

  // the upper bits of the result will have all bits guaranteed zero except the

  // first.

  case WebAssemblyISD::I64_ADD128:

    if (Op.getResNo() == 1) {

      SDValue LHS_HI = Op.getOperand(1);

      SDValue RHS_HI = Op.getOperand(3);

      if (isNullConstant(LHS_HI) && isNullConstant(RHS_HI))

        Known.Zero.setBitsFrom(1);

    }

    break;

  }

}


TargetLoweringBase::LegalizeTypeAction

WebAssemblyTargetLowering::getPreferredVectorAction(MVT VT) const {

  if (VT.isFixedLengthVector()) {

    MVT EltVT = VT.getVectorElementType();

    // We have legal vector types with these lane types, so widening the

    // vector would let us use some of the lanes directly without having to

    // extend or truncate values.

    if (EltVT == MVT::i8 || EltVT == MVT::i16 || EltVT == MVT::i32 ||

        EltVT == MVT::i64 || EltVT == MVT::f32 || EltVT == MVT::f64)

      return TypeWidenVector;

  }


  return TargetLoweringBase::getPreferredVectorAction(VT);

}


bool WebAssemblyTargetLowering::shouldSimplifyDemandedVectorElts(

    SDValue Op, const TargetLoweringOpt &TLO) const {

  // ISel process runs DAGCombiner after legalization; this step is called

  // SelectionDAG optimization phase. This post-legalization combining process

  // runs DAGCombiner on each node, and if there was a change to be made,

  // re-runs legalization again on it and its user nodes to make sure

  // everythiing is in a legalized state.

  //

  // The legalization calls lowering routines, and we do our custom lowering for

  // build_vectors (LowerBUILD_VECTOR), which converts undef vector elements

  // into zeros. But there is a set of routines in DAGCombiner that turns unused

  // (= not demanded) nodes into undef, among which SimplifyDemandedVectorElts

  // turns unused vector elements into undefs. But this routine does not work

  // with our custom LowerBUILD_VECTOR, which turns undefs into zeros. This

  // combination can result in a infinite loop, in which undefs are converted to

  // zeros in legalization and back to undefs in combining.

  //

  // So after DAG is legalized, we prevent SimplifyDemandedVectorElts from

  // running for build_vectors.

  if (Op.getOpcode() == ISD::BUILD_VECTOR && TLO.LegalOps && TLO.LegalTys)

    return false;

  return true;

}


//===----------------------------------------------------------------------===//

// WebAssembly Lowering private implementation.

//===----------------------------------------------------------------------===//


//===----------------------------------------------------------------------===//

// Lowering Code

//===----------------------------------------------------------------------===//


static void fail(const SDLoc &DL, SelectionDAG &DAG, const char *Msg) {

  MachineFunction &MF = DAG.getMachineFunction();

  DAG.getContext()->diagnose(

      DiagnosticInfoUnsupported(MF.getFunction(), Msg, DL.getDebugLoc()));

}


// Test whether the given calling convention is supported.

static bool callingConvSupported(CallingConv::ID CallConv) {

  // We currently support the language-independent target-independent

  // conventions. We don't yet have a way to annotate calls with properties like

  // "cold", and we don't have any call-clobbered registers, so these are mostly

  // all handled the same.

  return CallConv == CallingConv::C || CallConv == CallingConv::Fast ||

         CallConv == CallingConv::Cold ||

         CallConv == CallingConv::PreserveMost ||

         CallConv == CallingConv::PreserveAll ||

         CallConv == CallingConv::CXX_FAST_TLS ||

         CallConv == CallingConv::WASM_EmscriptenInvoke ||

         CallConv == CallingConv::Swift;

}


SDValue

WebAssemblyTargetLowering::LowerCall(CallLoweringInfo &CLI,

                                     SmallVectorImpl<SDValue> &InVals) const {

  SelectionDAG &DAG = CLI.DAG;

  SDLoc DL = CLI.DL;

  SDValue Chain = CLI.Chain;

  SDValue Callee = CLI.Callee;

  MachineFunction &MF = DAG.getMachineFunction();

  auto Layout = MF.getDataLayout();


  CallingConv::ID CallConv = CLI.CallConv;

  if (!callingConvSupported(CallConv))

    fail(DL, DAG,

         "WebAssembly doesn't support language-specific or target-specific "

         "calling conventions yet");

  if (CLI.IsPatchPoint)

    fail(DL, DAG, "WebAssembly doesn't support patch point yet");


  if (CLI.IsTailCall) {

    auto NoTail = [&](const char *Msg) {

      if (CLI.CB && CLI.CB->isMustTailCall())

        fail(DL, DAG, Msg);

      CLI.IsTailCall = false;

    };


    if (!Subtarget->hasTailCall())

      NoTail("WebAssembly 'tail-call' feature not enabled");


    // Varargs calls cannot be tail calls because the buffer is on the stack

    if (CLI.IsVarArg)

      NoTail("WebAssembly does not support varargs tail calls");


    // Do not tail call unless caller and callee return types match

    const Function &F = MF.getFunction();

    const TargetMachine &TM = getTargetMachine();

    Type *RetTy = F.getReturnType();

    SmallVector<MVT, 4> CallerRetTys;

    SmallVector<MVT, 4> CalleeRetTys;

    computeLegalValueVTs(F, TM, RetTy, CallerRetTys);

    computeLegalValueVTs(F, TM, CLI.RetTy, CalleeRetTys);

    bool TypesMatch = CallerRetTys.size() == CalleeRetTys.size() &&

                      std::equal(CallerRetTys.begin(), CallerRetTys.end(),

                                 CalleeRetTys.begin());

    if (!TypesMatch)

      NoTail("WebAssembly tail call requires caller and callee return types to "

             "match");


    // If pointers to local stack values are passed, we cannot tail call

    if (CLI.CB) {

      for (auto &Arg : CLI.CB->args()) {

        Value *Val = Arg.get();

        // Trace the value back through pointer operations

        while (true) {

          Value *Src = Val->stripPointerCastsAndAliases();

          if (auto *GEP = dyn_cast<GetElementPtrInst>(Src))

            Src = GEP->getPointerOperand();

          if (Val == Src)

            break;

          Val = Src;

        }

        if (isa<AllocaInst>(Val)) {

          NoTail(

              "WebAssembly does not support tail calling with stack arguments");

          break;

        }

      }

    }

  }


  SmallVectorImpl<ISD::InputArg> &Ins = CLI.Ins;

  SmallVectorImpl<ISD::OutputArg> &Outs = CLI.Outs;

  SmallVectorImpl<SDValue> &OutVals = CLI.OutVals;


  // The generic code may have added an sret argument. If we're lowering an

  // invoke function, the ABI requires that the function pointer be the first

  // argument, so we may have to swap the arguments.

  if (CallConv == CallingConv::WASM_EmscriptenInvoke && Outs.size() >= 2 &&

      Outs[0].Flags.isSRet()) {

    std::swap(Outs[0], Outs[1]);

    std::swap(OutVals[0], OutVals[1]);

  }


  bool HasSwiftSelfArg = false;

  bool HasSwiftErrorArg = false;

  unsigned NumFixedArgs = 0;

  for (unsigned I = 0; I < Outs.size(); ++I) {

    const ISD::OutputArg &Out = Outs[I];

    SDValue &OutVal = OutVals[I];

    HasSwiftSelfArg |= Out.Flags.isSwiftSelf();

    HasSwiftErrorArg |= Out.Flags.isSwiftError();

    if (Out.Flags.isNest())

      fail(DL, DAG, "WebAssembly hasn't implemented nest arguments");

    if (Out.Flags.isInAlloca())

      fail(DL, DAG, "WebAssembly hasn't implemented inalloca arguments");

    if (Out.Flags.isInConsecutiveRegs())

      fail(DL, DAG, "WebAssembly hasn't implemented cons regs arguments");

    if (Out.Flags.isInConsecutiveRegsLast())

      fail(DL, DAG, "WebAssembly hasn't implemented cons regs last arguments");

    if (Out.Flags.isByVal() && Out.Flags.getByValSize() != 0) {

      auto &MFI = MF.getFrameInfo();

      int FI = MFI.CreateStackObject(Out.Flags.getByValSize(),

                                     Out.Flags.getNonZeroByValAlign(),

                                     /*isSS=*/false);

      SDValue SizeNode =

          DAG.getConstant(Out.Flags.getByValSize(), DL, MVT::i32);

      SDValue FINode = DAG.getFrameIndex(FI, getPointerTy(Layout));

      Chain = DAG.getMemcpy(Chain, DL, FINode, OutVal, SizeNode,

                            Out.Flags.getNonZeroByValAlign(),

                            /*isVolatile*/ false, /*AlwaysInline=*/false,

                            /*CI=*/nullptr, std::nullopt, MachinePointerInfo(),

                            MachinePointerInfo());

      OutVal = FINode;

    }

    // Count the number of fixed args *after* legalization.

    NumFixedArgs += !Out.Flags.isVarArg();

  }


  bool IsVarArg = CLI.IsVarArg;

  auto PtrVT = getPointerTy(Layout);


  // For swiftcc, emit additional swiftself and swifterror arguments

  // if there aren't. These additional arguments are also added for callee

  // signature They are necessary to match callee and caller signature for

  // indirect call.

  if (CallConv == CallingConv::Swift) {

    Type *PtrTy = PointerType::getUnqual(*DAG.getContext());

    if (!HasSwiftSelfArg) {

      NumFixedArgs++;

      ISD::ArgFlagsTy Flags;

      Flags.setSwiftSelf();

      ISD::OutputArg Arg(Flags, PtrVT, EVT(PtrVT), PtrTy, 0, 0);

      CLI.Outs.push_back(Arg);

      SDValue ArgVal = DAG.getUNDEF(PtrVT);

      CLI.OutVals.push_back(ArgVal);

    }

    if (!HasSwiftErrorArg) {

      NumFixedArgs++;

      ISD::ArgFlagsTy Flags;

      Flags.setSwiftError();

      ISD::OutputArg Arg(Flags, PtrVT, EVT(PtrVT), PtrTy, 0, 0);

      CLI.Outs.push_back(Arg);

      SDValue ArgVal = DAG.getUNDEF(PtrVT);

      CLI.OutVals.push_back(ArgVal);

    }

  }


  // Analyze operands of the call, assigning locations to each operand.

  SmallVector<CCValAssign, 16> ArgLocs;

  CCState CCInfo(CallConv, IsVarArg, MF, ArgLocs, *DAG.getContext());


  if (IsVarArg) {

    // Outgoing non-fixed arguments are placed in a buffer. First

    // compute their offsets and the total amount of buffer space needed.

    for (unsigned I = NumFixedArgs; I < Outs.size(); ++I) {

      const ISD::OutputArg &Out = Outs[I];

      SDValue &Arg = OutVals[I];

      EVT VT = Arg.getValueType();

      assert(VT != MVT::iPTR && "Legalized args should be concrete");

      Type *Ty = VT.getTypeForEVT(*DAG.getContext());

      Align Alignment =

          std::max(Out.Flags.getNonZeroOrigAlign(), Layout.getABITypeAlign(Ty));

      unsigned Offset =

          CCInfo.AllocateStack(Layout.getTypeAllocSize(Ty), Alignment);

      CCInfo.addLoc(CCValAssign::getMem(ArgLocs.size(), VT.getSimpleVT(),

                                        Offset, VT.getSimpleVT(),

                                        CCValAssign::Full));

    }

  }


  unsigned NumBytes = CCInfo.getAlignedCallFrameSize();


  SDValue FINode;

  if (IsVarArg && NumBytes) {

    // For non-fixed arguments, next emit stores to store the argument values

    // to the stack buffer at the offsets computed above.

    MaybeAlign StackAlign = Layout.getStackAlignment();

    assert(StackAlign && "data layout string is missing stack alignment");

    int FI = MF.getFrameInfo().CreateStackObject(NumBytes, *StackAlign,

                                                 /*isSS=*/false);

    unsigned ValNo = 0;

    SmallVector<SDValue, 8> Chains;

    for (SDValue Arg : drop_begin(OutVals, NumFixedArgs)) {

      assert(ArgLocs[ValNo].getValNo() == ValNo &&

             "ArgLocs should remain in order and only hold varargs args");

      unsigned Offset = ArgLocs[ValNo++].getLocMemOffset();

      FINode = DAG.getFrameIndex(FI, getPointerTy(Layout));

      SDValue Add = DAG.getNode(ISD::ADD, DL, PtrVT, FINode,

                                DAG.getConstant(Offset, DL, PtrVT));

      Chains.push_back(

          DAG.getStore(Chain, DL, Arg, Add,

                       MachinePointerInfo::getFixedStack(MF, FI, Offset)));

    }

    if (!Chains.empty())

      Chain = DAG.getNode(ISD::TokenFactor, DL, MVT::Other, Chains);

  } else if (IsVarArg) {

    FINode = DAG.getIntPtrConstant(0, DL);

  }


  if (Callee->getOpcode() == ISD::GlobalAddress) {

    // If the callee is a GlobalAddress node (quite common, every direct call

    // is) turn it into a TargetGlobalAddress node so that LowerGlobalAddress

    // doesn't at MO_GOT which is not needed for direct calls.

    GlobalAddressSDNode *GA = cast<GlobalAddressSDNode>(Callee);

    Callee = DAG.getTargetGlobalAddress(GA->getGlobal(), DL,

                                        getPointerTy(DAG.getDataLayout()),

                                        GA->getOffset());

    Callee = DAG.getNode(WebAssemblyISD::Wrapper, DL,

                         getPointerTy(DAG.getDataLayout()), Callee);

  }


  // Compute the operands for the CALLn node.

  SmallVector<SDValue, 16> Ops;

  Ops.push_back(Chain);

  Ops.push_back(Callee);


  // Add all fixed arguments. Note that for non-varargs calls, NumFixedArgs

  // isn't reliable.

  Ops.append(OutVals.begin(),

             IsVarArg ? OutVals.begin() + NumFixedArgs : OutVals.end());

  // Add a pointer to the vararg buffer.

  if (IsVarArg)

    Ops.push_back(FINode);


  SmallVector<EVT, 8> InTys;

  for (const auto &In : Ins) {

    assert(!In.Flags.isByVal() && "byval is not valid for return values");

    assert(!In.Flags.isNest() && "nest is not valid for return values");

    if (In.Flags.isInAlloca())

      fail(DL, DAG, "WebAssembly hasn't implemented inalloca return values");

    if (In.Flags.isInConsecutiveRegs())

      fail(DL, DAG, "WebAssembly hasn't implemented cons regs return values");

    if (In.Flags.isInConsecutiveRegsLast())

      fail(DL, DAG,

           "WebAssembly hasn't implemented cons regs last return values");

    // Ignore In.getNonZeroOrigAlign() because all our arguments are passed in

    // registers.

    InTys.push_back(In.VT);

  }


  // Lastly, if this is a call to a funcref we need to add an instruction

  // table.set to the chain and transform the call.

  if (CLI.CB && WebAssembly::isWebAssemblyFuncrefType(

                    CLI.CB->getCalledOperand()->getType())) {

    // In the absence of function references proposal where a funcref call is

    // lowered to call_ref, using reference types we generate a table.set to set

    // the funcref to a special table used solely for this purpose, followed by

    // a call_indirect. Here we just generate the table set, and return the

    // SDValue of the table.set so that LowerCall can finalize the lowering by

    // generating the call_indirect.

    SDValue Chain = Ops[0];


    MCSymbolWasm *Table = WebAssembly::getOrCreateFuncrefCallTableSymbol(

        MF.getContext(), Subtarget);

    SDValue Sym = DAG.getMCSymbol(Table, PtrVT);

    SDValue TableSlot = DAG.getConstant(0, DL, MVT::i32);

    SDValue TableSetOps[] = {Chain, Sym, TableSlot, Callee};

    SDValue TableSet = DAG.getMemIntrinsicNode(

        WebAssemblyISD::TABLE_SET, DL, DAG.getVTList(MVT::Other), TableSetOps,

        MVT::funcref,

        // Machine Mem Operand args

        MachinePointerInfo(

            WebAssembly::WasmAddressSpace::WASM_ADDRESS_SPACE_FUNCREF),

        CLI.CB->getCalledOperand()->getPointerAlignment(DAG.getDataLayout()),

        MachineMemOperand::MOStore);


    Ops[0] = TableSet; // The new chain is the TableSet itself

  }


  if (CLI.IsTailCall) {

    // ret_calls do not return values to the current frame

    SDVTList NodeTys = DAG.getVTList(MVT::Other, MVT::Glue);

    return DAG.getNode(WebAssemblyISD::RET_CALL, DL, NodeTys, Ops);

  }


  InTys.push_back(MVT::Other);

  SDVTList InTyList = DAG.getVTList(InTys);

  SDValue Res = DAG.getNode(WebAssemblyISD::CALL, DL, InTyList, Ops);


  for (size_t I = 0; I < Ins.size(); ++I)

    InVals.push_back(Res.getValue(I));


  // Return the chain

  return Res.getValue(Ins.size());

}


bool WebAssemblyTargetLowering::CanLowerReturn(

    CallingConv::ID /*CallConv*/, MachineFunction & /*MF*/, bool /*IsVarArg*/,

    const SmallVectorImpl<ISD::OutputArg> &Outs, LLVMContext & /*Context*/,

    const Type *RetTy) const {

  // WebAssembly can only handle returning tuples with multivalue enabled

  return WebAssembly::canLowerReturn(Outs.size(), Subtarget);

}


SDValue WebAssemblyTargetLowering::LowerReturn(

    SDValue Chain, CallingConv::ID CallConv, bool /*IsVarArg*/,

    const SmallVectorImpl<ISD::OutputArg> &Outs,

    const SmallVectorImpl<SDValue> &OutVals, const SDLoc &DL,

    SelectionDAG &DAG) const {

  assert(WebAssembly::canLowerReturn(Outs.size(), Subtarget) &&

         "MVP WebAssembly can only return up to one value");

  if (!callingConvSupported(CallConv))

    fail(DL, DAG, "WebAssembly doesn't support non-C calling conventions");


  SmallVector<SDValue, 4> RetOps(1, Chain);

  RetOps.append(OutVals.begin(), OutVals.end());

  Chain = DAG.getNode(WebAssemblyISD::RETURN, DL, MVT::Other, RetOps);


  // Record the number and types of the return values.

  for (const ISD::OutputArg &Out : Outs) {

    assert(!Out.Flags.isByVal() && "byval is not valid for return values");

    assert(!Out.Flags.isNest() && "nest is not valid for return values");

    assert(!Out.Flags.isVarArg() && "non-fixed return value is not valid");

    if (Out.Flags.isInAlloca())

      fail(DL, DAG, "WebAssembly hasn't implemented inalloca results");

    if (Out.Flags.isInConsecutiveRegs())

      fail(DL, DAG, "WebAssembly hasn't implemented cons regs results");

    if (Out.Flags.isInConsecutiveRegsLast())

      fail(DL, DAG, "WebAssembly hasn't implemented cons regs last results");

  }


  return Chain;

}


SDValue WebAssemblyTargetLowering::LowerFormalArguments(

    SDValue Chain, CallingConv::ID CallConv, bool IsVarArg,

    const SmallVectorImpl<ISD::InputArg> &Ins, const SDLoc &DL,

    SelectionDAG &DAG, SmallVectorImpl<SDValue> &InVals) const {

  if (!callingConvSupported(CallConv))

    fail(DL, DAG, "WebAssembly doesn't support non-C calling conventions");


  MachineFunction &MF = DAG.getMachineFunction();

  auto *MFI = MF.getInfo<WebAssemblyFunctionInfo>();


  // Set up the incoming ARGUMENTS value, which serves to represent the liveness

  // of the incoming values before they're represented by virtual registers.

  MF.getRegInfo().addLiveIn(WebAssembly::ARGUMENTS);


  bool HasSwiftErrorArg = false;

  bool HasSwiftSelfArg = false;

  for (const ISD::InputArg &In : Ins) {

    HasSwiftSelfArg |= In.Flags.isSwiftSelf();

    HasSwiftErrorArg |= In.Flags.isSwiftError();

    if (In.Flags.isInAlloca())

      fail(DL, DAG, "WebAssembly hasn't implemented inalloca arguments");

    if (In.Flags.isNest())

      fail(DL, DAG, "WebAssembly hasn't implemented nest arguments");

    if (In.Flags.isInConsecutiveRegs())

      fail(DL, DAG, "WebAssembly hasn't implemented cons regs arguments");

    if (In.Flags.isInConsecutiveRegsLast())

      fail(DL, DAG, "WebAssembly hasn't implemented cons regs last arguments");

    // Ignore In.getNonZeroOrigAlign() because all our arguments are passed in

    // registers.

    InVals.push_back(In.Used ? DAG.getNode(WebAssemblyISD::ARGUMENT, DL, In.VT,

                                           DAG.getTargetConstant(InVals.size(),

                                                                 DL, MVT::i32))

                             : DAG.getUNDEF(In.VT));


    // Record the number and types of arguments.

    MFI->addParam(In.VT);

  }


  // For swiftcc, emit additional swiftself and swifterror arguments

  // if there aren't. These additional arguments are also added for callee

  // signature They are necessary to match callee and caller signature for

  // indirect call.

  auto PtrVT = getPointerTy(MF.getDataLayout());

  if (CallConv == CallingConv::Swift) {

    if (!HasSwiftSelfArg) {

      MFI->addParam(PtrVT);

    }

    if (!HasSwiftErrorArg) {

      MFI->addParam(PtrVT);

    }

  }

  // Varargs are copied into a buffer allocated by the caller, and a pointer to

  // the buffer is passed as an argument.

  if (IsVarArg) {

    MVT PtrVT = getPointerTy(MF.getDataLayout());

    Register VarargVreg =

        MF.getRegInfo().createVirtualRegister(getRegClassFor(PtrVT));

    MFI->setVarargBufferVreg(VarargVreg);

    Chain = DAG.getCopyToReg(

        Chain, DL, VarargVreg,

        DAG.getNode(WebAssemblyISD::ARGUMENT, DL, PtrVT,

                    DAG.getTargetConstant(Ins.size(), DL, MVT::i32)));

    MFI->addParam(PtrVT);

  }


  // Record the number and types of arguments and results.

  SmallVector<MVT, 4> Params;

  SmallVector<MVT, 4> Results;

  computeSignatureVTs(MF.getFunction().getFunctionType(), &MF.getFunction(),

                      MF.getFunction(), DAG.getTarget(), Params, Results);

  for (MVT VT : Results)

    MFI->addResult(VT);

  // TODO: Use signatures in WebAssemblyMachineFunctionInfo too and unify

  // the param logic here with ComputeSignatureVTs

  assert(MFI->getParams().size() == Params.size() &&

         std::equal(MFI->getParams().begin(), MFI->getParams().end(),

                    Params.begin()));


  return Chain;

}


void WebAssemblyTargetLowering::ReplaceNodeResults(

    SDNode *N, SmallVectorImpl<SDValue> &Results, SelectionDAG &DAG) const {

  switch (N->getOpcode()) {

  case ISD::SIGN_EXTEND_INREG:

    // Do not add any results, signifying that N should not be custom lowered

    // after all. This happens because simd128 turns on custom lowering for

    // SIGN_EXTEND_INREG, but for non-vector sign extends the result might be an

    // illegal type.

    break;

  case ISD::SIGN_EXTEND_VECTOR_INREG:

  case ISD::ZERO_EXTEND_VECTOR_INREG:

    // Do not add any results, signifying that N should not be custom lowered.

    // EXTEND_VECTOR_INREG is implemented for some vectors, but not all.

    break;

  case ISD::ADD:

  case ISD::SUB:

    Results.push_back(Replace128Op(N, DAG));

    break;

  default:

    llvm_unreachable(

        "ReplaceNodeResults not implemented for this op for WebAssembly!");

  }

}


//===----------------------------------------------------------------------===//

//  Custom lowering hooks.

//===----------------------------------------------------------------------===//


SDValue WebAssemblyTargetLowering::LowerOperation(SDValue Op,

                                                  SelectionDAG &DAG) const {

  SDLoc DL(Op);

  switch (Op.getOpcode()) {

  default:

    llvm_unreachable("unimplemented operation lowering");

    return SDValue();

  case ISD::FrameIndex:

    return LowerFrameIndex(Op, DAG);

  case ISD::GlobalAddress:

    return LowerGlobalAddress(Op, DAG);

  case ISD::GlobalTLSAddress:

    return LowerGlobalTLSAddress(Op, DAG);

  case ISD::ExternalSymbol:

    return LowerExternalSymbol(Op, DAG);

  case ISD::JumpTable:

    return LowerJumpTable(Op, DAG);

  case ISD::BR_JT:

    return LowerBR_JT(Op, DAG);

  case ISD::VASTART:

    return LowerVASTART(Op, DAG);

  case ISD::BlockAddress:

  case ISD::BRIND:

    fail(DL, DAG, "WebAssembly hasn't implemented computed gotos");

    return SDValue();

  case ISD::RETURNADDR:

    return LowerRETURNADDR(Op, DAG);

  case ISD::FRAMEADDR:

    return LowerFRAMEADDR(Op, DAG);

  case ISD::CopyToReg:

    return LowerCopyToReg(Op, DAG);

  case ISD::EXTRACT_VECTOR_ELT:

  case ISD::INSERT_VECTOR_ELT:

    return LowerAccessVectorElement(Op, DAG);

  case ISD::INTRINSIC_VOID:

  case ISD::INTRINSIC_WO_CHAIN:

  case ISD::INTRINSIC_W_CHAIN:

    return LowerIntrinsic(Op, DAG);

  case ISD::SIGN_EXTEND_INREG:

    return LowerSIGN_EXTEND_INREG(Op, DAG);

  case ISD::ZERO_EXTEND_VECTOR_INREG:

  case ISD::SIGN_EXTEND_VECTOR_INREG:

    return LowerEXTEND_VECTOR_INREG(Op, DAG);

  case ISD::BUILD_VECTOR:

    return LowerBUILD_VECTOR(Op, DAG);

  case ISD::VECTOR_SHUFFLE:

    return LowerVECTOR_SHUFFLE(Op, DAG);

  case ISD::SETCC:

    return LowerSETCC(Op, DAG);

  case ISD::SHL:

  case ISD::SRA:

  case ISD::SRL:

    return LowerShift(Op, DAG);

  case ISD::FP_TO_SINT_SAT:

  case ISD::FP_TO_UINT_SAT:

    return LowerFP_TO_INT_SAT(Op, DAG);

  case ISD::LOAD:

    return LowerLoad(Op, DAG);

  case ISD::STORE:

    return LowerStore(Op, DAG);

  case ISD::CTPOP:

  case ISD::CTLZ:

  case ISD::CTTZ:

    return DAG.UnrollVectorOp(Op.getNode());

  case ISD::CLEAR_CACHE:

    report_fatal_error("llvm.clear_cache is not supported on wasm");

  case ISD::SMUL_LOHI:

  case ISD::UMUL_LOHI:

    return LowerMUL_LOHI(Op, DAG);

  case ISD::UADDO:

    return LowerUADDO(Op, DAG);

  }

}


static bool IsWebAssemblyGlobal(SDValue Op) {

  if (const GlobalAddressSDNode *GA = dyn_cast<GlobalAddressSDNode>(Op))

    return WebAssembly::isWasmVarAddressSpace(GA->getAddressSpace());


  return false;

}


static std::optional<unsigned> IsWebAssemblyLocal(SDValue Op,

                                                  SelectionDAG &DAG) {

  const FrameIndexSDNode *FI = dyn_cast<FrameIndexSDNode>(Op);

  if (!FI)

    return std::nullopt;


  auto &MF = DAG.getMachineFunction();

  return WebAssemblyFrameLowering::getLocalForStackObject(MF, FI->getIndex());

}


SDValue WebAssemblyTargetLowering::LowerStore(SDValue Op,

                                              SelectionDAG &DAG) const {

  SDLoc DL(Op);

  StoreSDNode *SN = cast<StoreSDNode>(Op.getNode());

  const SDValue &Value = SN->getValue();

  const SDValue &Base = SN->getBasePtr();

  const SDValue &Offset = SN->getOffset();


  if (IsWebAssemblyGlobal(Base)) {

    if (!Offset->isUndef())

      report_fatal_error("unexpected offset when storing to webassembly global",

                         false);


    SDVTList Tys = DAG.getVTList(MVT::Other);

    SDValue Ops[] = {SN->getChain(), Value, Base};

    return DAG.getMemIntrinsicNode(WebAssemblyISD::GLOBAL_SET, DL, Tys, Ops,

                                   SN->getMemoryVT(), SN->getMemOperand());

  }


  if (std::optional<unsigned> Local = IsWebAssemblyLocal(Base, DAG)) {

    if (!Offset->isUndef())

      report_fatal_error("unexpected offset when storing to webassembly local",

                         false);


    SDValue Idx = DAG.getTargetConstant(*Local, Base, MVT::i32);

    SDVTList Tys = DAG.getVTList(MVT::Other); // The chain.

    SDValue Ops[] = {SN->getChain(), Idx, Value};

    return DAG.getNode(WebAssemblyISD::LOCAL_SET, DL, Tys, Ops);

  }


  if (WebAssembly::isWasmVarAddressSpace(SN->getAddressSpace()))

    report_fatal_error(

        "Encountered an unlowerable store to the wasm_var address space",

        false);


  return Op;

}


SDValue WebAssemblyTargetLowering::LowerLoad(SDValue Op,

                                             SelectionDAG &DAG) const {

  SDLoc DL(Op);

  LoadSDNode *LN = cast<LoadSDNode>(Op.getNode());

  const SDValue &Base = LN->getBasePtr();

  const SDValue &Offset = LN->getOffset();


  if (IsWebAssemblyGlobal(Base)) {

    if (!Offset->isUndef())

      report_fatal_error(

          "unexpected offset when loading from webassembly global", false);


    SDVTList Tys = DAG.getVTList(LN->getValueType(0), MVT::Other);

    SDValue Ops[] = {LN->getChain(), Base};

    return DAG.getMemIntrinsicNode(WebAssemblyISD::GLOBAL_GET, DL, Tys, Ops,

                                   LN->getMemoryVT(), LN->getMemOperand());

  }


  if (std::optional<unsigned> Local = IsWebAssemblyLocal(Base, DAG)) {

    if (!Offset->isUndef())

      report_fatal_error(

          "unexpected offset when loading from webassembly local", false);


    SDValue Idx = DAG.getTargetConstant(*Local, Base, MVT::i32);

    EVT LocalVT = LN->getValueType(0);

    SDValue LocalGet = DAG.getNode(WebAssemblyISD::LOCAL_GET, DL, LocalVT,

                                   {LN->getChain(), Idx});

    SDValue Result = DAG.getMergeValues({LocalGet, LN->getChain()}, DL);

    assert(Result->getNumValues() == 2 && "Loads must carry a chain!");

    return Result;

  }


  if (WebAssembly::isWasmVarAddressSpace(LN->getAddressSpace()))

    report_fatal_error(

        "Encountered an unlowerable load from the wasm_var address space",

        false);


  return Op;

}


SDValue WebAssemblyTargetLowering::LowerMUL_LOHI(SDValue Op,

                                                 SelectionDAG &DAG) const {

  assert(Subtarget->hasWideArithmetic());

  assert(Op.getValueType() == MVT::i64);

  SDLoc DL(Op);

  unsigned Opcode;

  switch (Op.getOpcode()) {

  case ISD::UMUL_LOHI:

    Opcode = WebAssemblyISD::I64_MUL_WIDE_U;

    break;

  case ISD::SMUL_LOHI:

    Opcode = WebAssemblyISD::I64_MUL_WIDE_S;

    break;

  default:

    llvm_unreachable("unexpected opcode");

  }

  SDValue LHS = Op.getOperand(0);

  SDValue RHS = Op.getOperand(1);

  SDValue Lo =

      DAG.getNode(Opcode, DL, DAG.getVTList(MVT::i64, MVT::i64), LHS, RHS);

  SDValue Hi(Lo.getNode(), 1);

  SDValue Ops[] = {Lo, Hi};

  return DAG.getMergeValues(Ops, DL);

}


// Lowers `UADDO` intrinsics to an `i64.add128` instruction when it's enabled.

//

// This enables generating a single wasm instruction for this operation where

// the upper half of both operands are constant zeros. The upper half of the

// result is then whether the overflow happened.

SDValue WebAssemblyTargetLowering::LowerUADDO(SDValue Op,

                                              SelectionDAG &DAG) const {

  assert(Subtarget->hasWideArithmetic());

  assert(Op.getValueType() == MVT::i64);

  assert(Op.getOpcode() == ISD::UADDO);

  SDLoc DL(Op);

  SDValue LHS = Op.getOperand(0);

  SDValue RHS = Op.getOperand(1);

  SDValue Zero = DAG.getConstant(0, DL, MVT::i64);

  SDValue Result =

      DAG.getNode(WebAssemblyISD::I64_ADD128, DL,

                  DAG.getVTList(MVT::i64, MVT::i64), LHS, Zero, RHS, Zero);

  SDValue CarryI64(Result.getNode(), 1);

  SDValue CarryI32 = DAG.getNode(ISD::TRUNCATE, DL, MVT::i32, CarryI64);

  SDValue Ops[] = {Result, CarryI32};

  return DAG.getMergeValues(Ops, DL);

}


SDValue WebAssemblyTargetLowering::Replace128Op(SDNode *N,

                                                SelectionDAG &DAG) const {

  assert(Subtarget->hasWideArithmetic());

  assert(N->getValueType(0) == MVT::i128);

  SDLoc DL(N);

  unsigned Opcode;

  switch (N->getOpcode()) {

  case ISD::ADD:

    Opcode = WebAssemblyISD::I64_ADD128;

    break;

  case ISD::SUB:

    Opcode = WebAssemblyISD::I64_SUB128;

    break;

  default:

    llvm_unreachable("unexpected opcode");

  }

  SDValue LHS = N->getOperand(0);

  SDValue RHS = N->getOperand(1);


  SDValue C0 = DAG.getConstant(0, DL, MVT::i64);

  SDValue C1 = DAG.getConstant(1, DL, MVT::i64);

  SDValue LHS_0 = DAG.getNode(ISD::EXTRACT_ELEMENT, DL, MVT::i64, LHS, C0);

  SDValue LHS_1 = DAG.getNode(ISD::EXTRACT_ELEMENT, DL, MVT::i64, LHS, C1);

  SDValue RHS_0 = DAG.getNode(ISD::EXTRACT_ELEMENT, DL, MVT::i64, RHS, C0);

  SDValue RHS_1 = DAG.getNode(ISD::EXTRACT_ELEMENT, DL, MVT::i64, RHS, C1);

  SDValue Result_LO = DAG.getNode(Opcode, DL, DAG.getVTList(MVT::i64, MVT::i64),

                                  LHS_0, LHS_1, RHS_0, RHS_1);

  SDValue Result_HI(Result_LO.getNode(), 1);

  return DAG.getNode(ISD::BUILD_PAIR, DL, N->getVTList(), Result_LO, Result_HI);

}


SDValue WebAssemblyTargetLowering::LowerCopyToReg(SDValue Op,

                                                  SelectionDAG &DAG) const {

  SDValue Src = Op.getOperand(2);

  if (isa<FrameIndexSDNode>(Src.getNode())) {

    // CopyToReg nodes don't support FrameIndex operands. Other targets select

    // the FI to some LEA-like instruction, but since we don't have that, we

    // need to insert some kind of instruction that can take an FI operand and

    // produces a value usable by CopyToReg (i.e. in a vreg). So insert a dummy

    // local.copy between Op and its FI operand.

    SDValue Chain = Op.getOperand(0);

    SDLoc DL(Op);

    Register Reg = cast<RegisterSDNode>(Op.getOperand(1))->getReg();

    EVT VT = Src.getValueType();

    SDValue Copy(DAG.getMachineNode(VT == MVT::i32 ? WebAssembly::COPY_I32

                                                   : WebAssembly::COPY_I64,

                                    DL, VT, Src),

                 0);

    return Op.getNode()->getNumValues() == 1

               ? DAG.getCopyToReg(Chain, DL, Reg, Copy)

               : DAG.getCopyToReg(Chain, DL, Reg, Copy,

                                  Op.getNumOperands() == 4 ? Op.getOperand(3)

                                                           : SDValue());

  }

  return SDValue();

}


SDValue WebAssemblyTargetLowering::LowerFrameIndex(SDValue Op,

                                                   SelectionDAG &DAG) const {

  int FI = cast<FrameIndexSDNode>(Op)->getIndex();

  return DAG.getTargetFrameIndex(FI, Op.getValueType());

}


SDValue WebAssemblyTargetLowering::LowerRETURNADDR(SDValue Op,

                                                   SelectionDAG &DAG) const {

  SDLoc DL(Op);


  if (!Subtarget->getTargetTriple().isOSEmscripten()) {

    fail(DL, DAG,

         "Non-Emscripten WebAssembly hasn't implemented "

         "__builtin_return_address");

    return SDValue();

  }


  unsigned Depth = Op.getConstantOperandVal(0);

  MakeLibCallOptions CallOptions;

  return makeLibCall(DAG, RTLIB::RETURN_ADDRESS, Op.getValueType(),

                     {DAG.getConstant(Depth, DL, MVT::i32)}, CallOptions, DL)

      .first;

}


SDValue WebAssemblyTargetLowering::LowerFRAMEADDR(SDValue Op,

                                                  SelectionDAG &DAG) const {

  // Non-zero depths are not supported by WebAssembly currently. Use the

  // legalizer's default expansion, which is to return 0 (what this function is

  // documented to do).

  if (Op.getConstantOperandVal(0) > 0)

    return SDValue();


  DAG.getMachineFunction().getFrameInfo().setFrameAddressIsTaken(true);

  EVT VT = Op.getValueType();

  Register FP =

      Subtarget->getRegisterInfo()->getFrameRegister(DAG.getMachineFunction());

  return DAG.getCopyFromReg(DAG.getEntryNode(), SDLoc(Op), FP, VT);

}


SDValue

WebAssemblyTargetLowering::LowerGlobalTLSAddress(SDValue Op,

                                                 SelectionDAG &DAG) const {

  SDLoc DL(Op);

  const auto *GA = cast<GlobalAddressSDNode>(Op);


  MachineFunction &MF = DAG.getMachineFunction();

  if (!MF.getSubtarget<WebAssemblySubtarget>().hasBulkMemory())

    report_fatal_error("cannot use thread-local storage without bulk memory",

                       false);


  const GlobalValue *GV = GA->getGlobal();


  // Currently only Emscripten supports dynamic linking with threads. Therefore,

  // on other targets, if we have thread-local storage, only the local-exec

  // model is possible.

  auto model = Subtarget->getTargetTriple().isOSEmscripten()

                   ? GV->getThreadLocalMode()

                   : GlobalValue::LocalExecTLSModel;


  // Unsupported TLS modes

  assert(model != GlobalValue::NotThreadLocal);

  assert(model != GlobalValue::InitialExecTLSModel);


  if (model == GlobalValue::LocalExecTLSModel ||

      model == GlobalValue::LocalDynamicTLSModel ||

      (model == GlobalValue::GeneralDynamicTLSModel &&

       getTargetMachine().shouldAssumeDSOLocal(GV))) {

    // For DSO-local TLS variables we use offset from __tls_base


    MVT PtrVT = getPointerTy(DAG.getDataLayout());

    auto GlobalGet = PtrVT == MVT::i64 ? WebAssembly::GLOBAL_GET_I64

                                       : WebAssembly::GLOBAL_GET_I32;

    const char *BaseName = MF.createExternalSymbolName("__tls_base");


    SDValue BaseAddr(

        DAG.getMachineNode(GlobalGet, DL, PtrVT,

                           DAG.getTargetExternalSymbol(BaseName, PtrVT)),

        0);


    SDValue TLSOffset = DAG.getTargetGlobalAddress(

        GV, DL, PtrVT, GA->getOffset(), WebAssemblyII::MO_TLS_BASE_REL);

    SDValue SymOffset =

        DAG.getNode(WebAssemblyISD::WrapperREL, DL, PtrVT, TLSOffset);


    return DAG.getNode(ISD::ADD, DL, PtrVT, BaseAddr, SymOffset);

  }


  assert(model == GlobalValue::GeneralDynamicTLSModel);


  EVT VT = Op.getValueType();

  return DAG.getNode(WebAssemblyISD::Wrapper, DL, VT,

                     DAG.getTargetGlobalAddress(GA->getGlobal(), DL, VT,

                                                GA->getOffset(),

                                                WebAssemblyII::MO_GOT_TLS));

}


SDValue WebAssemblyTargetLowering::LowerGlobalAddress(SDValue Op,

                                                      SelectionDAG &DAG) const {

  SDLoc DL(Op);

  const auto *GA = cast<GlobalAddressSDNode>(Op);

  EVT VT = Op.getValueType();

  assert(GA->getTargetFlags() == 0 &&

         "Unexpected target flags on generic GlobalAddressSDNode");

  if (!WebAssembly::isValidAddressSpace(GA->getAddressSpace()))

    fail(DL, DAG, "Invalid address space for WebAssembly target");


  unsigned OperandFlags = 0;

  const GlobalValue *GV = GA->getGlobal();

  // Since WebAssembly tables cannot yet be shared accross modules, we don't

  // need special treatment for tables in PIC mode.

  if (isPositionIndependent() &&

      !WebAssembly::isWebAssemblyTableType(GV->getValueType())) {

    if (getTargetMachine().shouldAssumeDSOLocal(GV)) {

      MachineFunction &MF = DAG.getMachineFunction();

      MVT PtrVT = getPointerTy(MF.getDataLayout());

      const char *BaseName;

      if (GV->getValueType()->isFunctionTy()) {

        BaseName = MF.createExternalSymbolName("__table_base");

        OperandFlags = WebAssemblyII::MO_TABLE_BASE_REL;

      } else {

        BaseName = MF.createExternalSymbolName("__memory_base");

        OperandFlags = WebAssemblyII::MO_MEMORY_BASE_REL;

      }

      SDValue BaseAddr =

          DAG.getNode(WebAssemblyISD::Wrapper, DL, PtrVT,

                      DAG.getTargetExternalSymbol(BaseName, PtrVT));


      SDValue SymAddr = DAG.getNode(

          WebAssemblyISD::WrapperREL, DL, VT,

          DAG.getTargetGlobalAddress(GA->getGlobal(), DL, VT, GA->getOffset(),

                                     OperandFlags));


      return DAG.getNode(ISD::ADD, DL, VT, BaseAddr, SymAddr);

    }

    OperandFlags = WebAssemblyII::MO_GOT;

  }


  return DAG.getNode(WebAssemblyISD::Wrapper, DL, VT,

                     DAG.getTargetGlobalAddress(GA->getGlobal(), DL, VT,

                                                GA->getOffset(), OperandFlags));

}


SDValue

WebAssemblyTargetLowering::LowerExternalSymbol(SDValue Op,

                                               SelectionDAG &DAG) const {

  SDLoc DL(Op);

  const auto *ES = cast<ExternalSymbolSDNode>(Op);

  EVT VT = Op.getValueType();

  assert(ES->getTargetFlags() == 0 &&

         "Unexpected target flags on generic ExternalSymbolSDNode");

  return DAG.getNode(WebAssemblyISD::Wrapper, DL, VT,

                     DAG.getTargetExternalSymbol(ES->getSymbol(), VT));

}


SDValue WebAssemblyTargetLowering::LowerJumpTable(SDValue Op,

                                                  SelectionDAG &DAG) const {

  // There's no need for a Wrapper node because we always incorporate a jump

  // table operand into a BR_TABLE instruction, rather than ever

  // materializing it in a register.

  const JumpTableSDNode *JT = cast<JumpTableSDNode>(Op);

  return DAG.getTargetJumpTable(JT->getIndex(), Op.getValueType(),

                                JT->getTargetFlags());

}


SDValue WebAssemblyTargetLowering::LowerBR_JT(SDValue Op,

                                              SelectionDAG &DAG) const {

  SDLoc DL(Op);

  SDValue Chain = Op.getOperand(0);

  const auto *JT = cast<JumpTableSDNode>(Op.getOperand(1));

  SDValue Index = Op.getOperand(2);

  assert(JT->getTargetFlags() == 0 && "WebAssembly doesn't set target flags");


  SmallVector<SDValue, 8> Ops;

  Ops.push_back(Chain);

  Ops.push_back(Index);


  MachineJumpTableInfo *MJTI = DAG.getMachineFunction().getJumpTableInfo();

  const auto &MBBs = MJTI->getJumpTables()[JT->getIndex()].MBBs;


  // Add an operand for each case.

  for (auto *MBB : MBBs)

    Ops.push_back(DAG.getBasicBlock(MBB));


  // Add the first MBB as a dummy default target for now. This will be replaced

  // with the proper default target (and the preceding range check eliminated)

  // if possible by WebAssemblyFixBrTableDefaults.

  Ops.push_back(DAG.getBasicBlock(*MBBs.begin()));

  return DAG.getNode(WebAssemblyISD::BR_TABLE, DL, MVT::Other, Ops);

}


SDValue WebAssemblyTargetLowering::LowerVASTART(SDValue Op,

                                                SelectionDAG &DAG) const {

  SDLoc DL(Op);

  EVT PtrVT = getPointerTy(DAG.getMachineFunction().getDataLayout());


  auto *MFI = DAG.getMachineFunction().getInfo<WebAssemblyFunctionInfo>();

  const Value *SV = cast<SrcValueSDNode>(Op.getOperand(2))->getValue();


  SDValue ArgN = DAG.getCopyFromReg(DAG.getEntryNode(), DL,

                                    MFI->getVarargBufferVreg(), PtrVT);

  return DAG.getStore(Op.getOperand(0), DL, ArgN, Op.getOperand(1),

                      MachinePointerInfo(SV));

}


// Try to lower partial.reduce.add to a dot or fallback to a sequence with

// extmul and adds.

SDValue performLowerPartialReduction(SDNode *N, SelectionDAG &DAG) {

  assert(N->getOpcode() == ISD::INTRINSIC_WO_CHAIN);

  if (N->getConstantOperandVal(0) !=

      Intrinsic::experimental_vector_partial_reduce_add)

    return SDValue();


  assert(N->getValueType(0) == MVT::v4i32 && "can only support v4i32");

  SDLoc DL(N);

  SDValue Mul = N->getOperand(2);

  assert(Mul->getOpcode() == ISD::MUL && "expected mul input");


  SDValue ExtendLHS = Mul->getOperand(0);

  SDValue ExtendRHS = Mul->getOperand(1);

  assert((ISD::isExtOpcode(ExtendLHS.getOpcode()) &&

          ISD::isExtOpcode(ExtendRHS.getOpcode())) &&

         "expected widening mul");

  assert(ExtendLHS.getOpcode() == ExtendRHS.getOpcode() &&

         "expected mul to use the same extend for both operands");


  SDValue ExtendInLHS = ExtendLHS->getOperand(0);

  SDValue ExtendInRHS = ExtendRHS->getOperand(0);

  bool IsSigned = ExtendLHS->getOpcode() == ISD::SIGN_EXTEND;


  if (ExtendInLHS->getValueType(0) == MVT::v8i16) {

    if (IsSigned) {

      // i32x4.dot_i16x8_s

      SDValue Dot = DAG.getNode(WebAssemblyISD::DOT, DL, MVT::v4i32,

                                ExtendInLHS, ExtendInRHS);

      return DAG.getNode(ISD::ADD, DL, MVT::v4i32, N->getOperand(1), Dot);

    }


    unsigned LowOpc = WebAssemblyISD::EXTEND_LOW_U;

    unsigned HighOpc = WebAssemblyISD::EXTEND_HIGH_U;


    // (add (add (extmul_low_sx lhs, rhs), (extmul_high_sx lhs, rhs)))

    SDValue LowLHS = DAG.getNode(LowOpc, DL, MVT::v4i32, ExtendInLHS);

    SDValue LowRHS = DAG.getNode(LowOpc, DL, MVT::v4i32, ExtendInRHS);

    SDValue HighLHS = DAG.getNode(HighOpc, DL, MVT::v4i32, ExtendInLHS);

    SDValue HighRHS = DAG.getNode(HighOpc, DL, MVT::v4i32, ExtendInRHS);


    SDValue MulLow = DAG.getNode(ISD::MUL, DL, MVT::v4i32, LowLHS, LowRHS);

    SDValue MulHigh = DAG.getNode(ISD::MUL, DL, MVT::v4i32, HighLHS, HighRHS);

    SDValue Add = DAG.getNode(ISD::ADD, DL, MVT::v4i32, MulLow, MulHigh);

    return DAG.getNode(ISD::ADD, DL, MVT::v4i32, N->getOperand(1), Add);

  } else {

    assert(ExtendInLHS->getValueType(0) == MVT::v16i8 &&

           "expected v16i8 input types");

    // Lower to a wider tree, using twice the operations compared to above.

    if (IsSigned) {

      // Use two dots

      unsigned LowOpc = WebAssemblyISD::EXTEND_LOW_S;

      unsigned HighOpc = WebAssemblyISD::EXTEND_HIGH_S;

      SDValue LowLHS = DAG.getNode(LowOpc, DL, MVT::v8i16, ExtendInLHS);

      SDValue LowRHS = DAG.getNode(LowOpc, DL, MVT::v8i16, ExtendInRHS);

      SDValue HighLHS = DAG.getNode(HighOpc, DL, MVT::v8i16, ExtendInLHS);

      SDValue HighRHS = DAG.getNode(HighOpc, DL, MVT::v8i16, ExtendInRHS);

      SDValue DotLHS =

          DAG.getNode(WebAssemblyISD::DOT, DL, MVT::v4i32, LowLHS, LowRHS);

      SDValue DotRHS =

          DAG.getNode(WebAssemblyISD::DOT, DL, MVT::v4i32, HighLHS, HighRHS);

      SDValue Add = DAG.getNode(ISD::ADD, DL, MVT::v4i32, DotLHS, DotRHS);

      return DAG.getNode(ISD::ADD, DL, MVT::v4i32, N->getOperand(1), Add);

    }


    unsigned LowOpc = WebAssemblyISD::EXTEND_LOW_U;

    unsigned HighOpc = WebAssemblyISD::EXTEND_HIGH_U;

    SDValue LowLHS = DAG.getNode(LowOpc, DL, MVT::v8i16, ExtendInLHS);

    SDValue LowRHS = DAG.getNode(LowOpc, DL, MVT::v8i16, ExtendInRHS);

    SDValue HighLHS = DAG.getNode(HighOpc, DL, MVT::v8i16, ExtendInLHS);

    SDValue HighRHS = DAG.getNode(HighOpc, DL, MVT::v8i16, ExtendInRHS);


    SDValue MulLow = DAG.getNode(ISD::MUL, DL, MVT::v8i16, LowLHS, LowRHS);

    SDValue MulHigh = DAG.getNode(ISD::MUL, DL, MVT::v8i16, HighLHS, HighRHS);


    SDValue LowLow = DAG.getNode(LowOpc, DL, MVT::v4i32, MulLow);

    SDValue LowHigh = DAG.getNode(LowOpc, DL, MVT::v4i32, MulHigh);

    SDValue HighLow = DAG.getNode(HighOpc, DL, MVT::v4i32, MulLow);

    SDValue HighHigh = DAG.getNode(HighOpc, DL, MVT::v4i32, MulHigh);


    SDValue AddLow = DAG.getNode(ISD::ADD, DL, MVT::v4i32, LowLow, HighLow);

    SDValue AddHigh = DAG.getNode(ISD::ADD, DL, MVT::v4i32, LowHigh, HighHigh);

    SDValue Add = DAG.getNode(ISD::ADD, DL, MVT::v4i32, AddLow, AddHigh);

    return DAG.getNode(ISD::ADD, DL, MVT::v4i32, N->getOperand(1), Add);

  }

}


SDValue WebAssemblyTargetLowering::LowerIntrinsic(SDValue Op,

                                                  SelectionDAG &DAG) const {

  MachineFunction &MF = DAG.getMachineFunction();

  unsigned IntNo;

  switch (Op.getOpcode()) {

  case ISD::INTRINSIC_VOID:

  case ISD::INTRINSIC_W_CHAIN:

    IntNo = Op.getConstantOperandVal(1);

    break;

  case ISD::INTRINSIC_WO_CHAIN:

    IntNo = Op.getConstantOperandVal(0);

    break;

  default:

    llvm_unreachable("Invalid intrinsic");

  }

  SDLoc DL(Op);


  switch (IntNo) {

  default:

    return SDValue(); // Don't custom lower most intrinsics.


  case Intrinsic::wasm_lsda: {

    auto PtrVT = getPointerTy(MF.getDataLayout());

    const char *SymName = MF.createExternalSymbolName(

        "GCC_except_table" + std::to_string(MF.getFunctionNumber()));

    if (isPositionIndependent()) {

      SDValue Node = DAG.getTargetExternalSymbol(

          SymName, PtrVT, WebAssemblyII::MO_MEMORY_BASE_REL);

      const char *BaseName = MF.createExternalSymbolName("__memory_base");

      SDValue BaseAddr =

          DAG.getNode(WebAssemblyISD::Wrapper, DL, PtrVT,

                      DAG.getTargetExternalSymbol(BaseName, PtrVT));

      SDValue SymAddr =

          DAG.getNode(WebAssemblyISD::WrapperREL, DL, PtrVT, Node);

      return DAG.getNode(ISD::ADD, DL, PtrVT, BaseAddr, SymAddr);

    }

    SDValue Node = DAG.getTargetExternalSymbol(SymName, PtrVT);

    return DAG.getNode(WebAssemblyISD::Wrapper, DL, PtrVT, Node);

  }


  case Intrinsic::wasm_shuffle: {

    // Drop in-chain and replace undefs, but otherwise pass through unchanged

    SDValue Ops[18];

    size_t OpIdx = 0;

    Ops[OpIdx++] = Op.getOperand(1);

    Ops[OpIdx++] = Op.getOperand(2);

    while (OpIdx < 18) {

      const SDValue &MaskIdx = Op.getOperand(OpIdx + 1);

      if (MaskIdx.isUndef() || MaskIdx.getNode()->getAsZExtVal() >= 32) {

        bool isTarget = MaskIdx.getNode()->getOpcode() == ISD::TargetConstant;

        Ops[OpIdx++] = DAG.getConstant(0, DL, MVT::i32, isTarget);

      } else {

        Ops[OpIdx++] = MaskIdx;

      }

    }

    return DAG.getNode(WebAssemblyISD::SHUFFLE, DL, Op.getValueType(), Ops);

  }


  case Intrinsic::thread_pointer: {

    MVT PtrVT = getPointerTy(DAG.getDataLayout());

    auto GlobalGet = PtrVT == MVT::i64 ? WebAssembly::GLOBAL_GET_I64

                                       : WebAssembly::GLOBAL_GET_I32;

    const char *TlsBase = MF.createExternalSymbolName("__tls_base");

    return SDValue(

        DAG.getMachineNode(GlobalGet, DL, PtrVT,

                           DAG.getTargetExternalSymbol(TlsBase, PtrVT)),

        0);

  }

  }

}


SDValue

WebAssemblyTargetLowering::LowerSIGN_EXTEND_INREG(SDValue Op,

                                                  SelectionDAG &DAG) const {

  SDLoc DL(Op);

  // If sign extension operations are disabled, allow sext_inreg only if operand

  // is a vector extract of an i8 or i16 lane. SIMD does not depend on sign

  // extension operations, but allowing sext_inreg in this context lets us have

  // simple patterns to select extract_lane_s instructions. Expanding sext_inreg

  // everywhere would be simpler in this file, but would necessitate large and

  // brittle patterns to undo the expansion and select extract_lane_s

  // instructions.

  assert(!Subtarget->hasSignExt() && Subtarget->hasSIMD128());

  if (Op.getOperand(0).getOpcode() != ISD::EXTRACT_VECTOR_ELT)

    return SDValue();


  const SDValue &Extract = Op.getOperand(0);

  MVT VecT = Extract.getOperand(0).getSimpleValueType();

  if (VecT.getVectorElementType().getSizeInBits() > 32)

    return SDValue();

  MVT ExtractedLaneT =

      cast<VTSDNode>(Op.getOperand(1).getNode())->getVT().getSimpleVT();

  MVT ExtractedVecT =

      MVT::getVectorVT(ExtractedLaneT, 128 / ExtractedLaneT.getSizeInBits());

  if (ExtractedVecT == VecT)

    return Op;


  // Bitcast vector to appropriate type to ensure ISel pattern coverage

  const SDNode *Index = Extract.getOperand(1).getNode();

  if (!isa<ConstantSDNode>(Index))

    return SDValue();

  unsigned IndexVal = Index->getAsZExtVal();

  unsigned Scale =

      ExtractedVecT.getVectorNumElements() / VecT.getVectorNumElements();

  assert(Scale > 1);

  SDValue NewIndex =

      DAG.getConstant(IndexVal * Scale, DL, Index->getValueType(0));

  SDValue NewExtract = DAG.getNode(

      ISD::EXTRACT_VECTOR_ELT, DL, Extract.getValueType(),

      DAG.getBitcast(ExtractedVecT, Extract.getOperand(0)), NewIndex);

  return DAG.getNode(ISD::SIGN_EXTEND_INREG, DL, Op.getValueType(), NewExtract,

                     Op.getOperand(1));

}


static SDValue GetExtendHigh(SDValue Op, unsigned UserOpc, EVT VT,

                             SelectionDAG &DAG) {

  if (Op.getOpcode() != ISD::VECTOR_SHUFFLE)

    return SDValue();


  assert((UserOpc == WebAssemblyISD::EXTEND_LOW_U ||

          UserOpc == WebAssemblyISD::EXTEND_LOW_S) &&

         "expected extend_low");

  auto *Shuffle = cast<ShuffleVectorSDNode>(Op.getNode());


  ArrayRef<int> Mask = Shuffle->getMask();

  // Look for a shuffle which moves from the high half to the low half.

  size_t FirstIdx = Mask.size() / 2;

  for (size_t i = 0; i < Mask.size() / 2; ++i) {

    if (Mask[i] != static_cast<int>(FirstIdx + i)) {

      return SDValue();

    }

  }


  SDLoc DL(Op);

  unsigned Opc = UserOpc == WebAssemblyISD::EXTEND_LOW_S

                     ? WebAssemblyISD::EXTEND_HIGH_S

                     : WebAssemblyISD::EXTEND_HIGH_U;

  return DAG.getNode(Opc, DL, VT, Shuffle->getOperand(0));

}


SDValue

WebAssemblyTargetLowering::LowerEXTEND_VECTOR_INREG(SDValue Op,

                                                    SelectionDAG &DAG) const {

  SDLoc DL(Op);

  EVT VT = Op.getValueType();

  SDValue Src = Op.getOperand(0);

  EVT SrcVT = Src.getValueType();


  if (SrcVT.getVectorElementType() == MVT::i1 ||

      SrcVT.getVectorElementType() == MVT::i64)

    return SDValue();


  assert(VT.getScalarSizeInBits() % SrcVT.getScalarSizeInBits() == 0 &&

         "Unexpected extension factor.");

  unsigned Scale = VT.getScalarSizeInBits() / SrcVT.getScalarSizeInBits();


  if (Scale != 2 && Scale != 4 && Scale != 8)

    return SDValue();


  unsigned Ext;

  switch (Op.getOpcode()) {

  case ISD::ZERO_EXTEND_VECTOR_INREG:

    Ext = WebAssemblyISD::EXTEND_LOW_U;

    break;

  case ISD::SIGN_EXTEND_VECTOR_INREG:

    Ext = WebAssemblyISD::EXTEND_LOW_S;

    break;

  }


  if (Scale == 2) {

    // See if we can use EXTEND_HIGH.

    if (auto ExtendHigh = GetExtendHigh(Op.getOperand(0), Ext, VT, DAG))

      return ExtendHigh;

  }


  SDValue Ret = Src;

  while (Scale != 1) {

    Ret = DAG.getNode(Ext, DL,

                      Ret.getValueType()

                          .widenIntegerVectorElementType(*DAG.getContext())

                          .getHalfNumVectorElementsVT(*DAG.getContext()),

                      Ret);

    Scale /= 2;

  }

  assert(Ret.getValueType() == VT);

  return Ret;

}


static SDValue LowerConvertLow(SDValue Op, SelectionDAG &DAG) {

  SDLoc DL(Op);

  if (Op.getValueType() != MVT::v2f64)

    return SDValue();


  auto GetConvertedLane = [](SDValue Op, unsigned &Opcode, SDValue &SrcVec,

                             unsigned &Index) -> bool {

    switch (Op.getOpcode()) {

    case ISD::SINT_TO_FP:

      Opcode = WebAssemblyISD::CONVERT_LOW_S;

      break;

    case ISD::UINT_TO_FP:

      Opcode = WebAssemblyISD::CONVERT_LOW_U;

      break;

    case ISD::FP_EXTEND:

      Opcode = WebAssemblyISD::PROMOTE_LOW;

      break;

    default:

      return false;

    }


    auto ExtractVector = Op.getOperand(0);

    if (ExtractVector.getOpcode() != ISD::EXTRACT_VECTOR_ELT)

      return false;


    if (!isa<ConstantSDNode>(ExtractVector.getOperand(1).getNode()))

      return false;


    SrcVec = ExtractVector.getOperand(0);

    Index = ExtractVector.getConstantOperandVal(1);

    return true;

  };


  unsigned LHSOpcode, RHSOpcode, LHSIndex, RHSIndex;

  SDValue LHSSrcVec, RHSSrcVec;

  if (!GetConvertedLane(Op.getOperand(0), LHSOpcode, LHSSrcVec, LHSIndex) ||

      !GetConvertedLane(Op.getOperand(1), RHSOpcode, RHSSrcVec, RHSIndex))

    return SDValue();


  if (LHSOpcode != RHSOpcode)

    return SDValue();


  MVT ExpectedSrcVT;

  switch (LHSOpcode) {

  case WebAssemblyISD::CONVERT_LOW_S:

  case WebAssemblyISD::CONVERT_LOW_U:

    ExpectedSrcVT = MVT::v4i32;

    break;

  case WebAssemblyISD::PROMOTE_LOW:

    ExpectedSrcVT = MVT::v4f32;

    break;

  }

  if (LHSSrcVec.getValueType() != ExpectedSrcVT)

    return SDValue();


  auto Src = LHSSrcVec;

  if (LHSIndex != 0 || RHSIndex != 1 || LHSSrcVec != RHSSrcVec) {

    // Shuffle the source vector so that the converted lanes are the low lanes.

    Src = DAG.getVectorShuffle(

        ExpectedSrcVT, DL, LHSSrcVec, RHSSrcVec,

        {static_cast<int>(LHSIndex), static_cast<int>(RHSIndex) + 4, -1, -1});

  }

  return DAG.getNode(LHSOpcode, DL, MVT::v2f64, Src);

}


SDValue WebAssemblyTargetLowering::LowerBUILD_VECTOR(SDValue Op,

                                                     SelectionDAG &DAG) const {

  MVT VT = Op.getSimpleValueType();

  if (VT == MVT::v8f16) {

    // BUILD_VECTOR can't handle FP16 operands since Wasm doesn't have a scaler

    // FP16 type, so cast them to I16s.

    MVT IVT = VT.changeVectorElementType(MVT::i16);

    SmallVector<SDValue, 8> NewOps;

    for (unsigned I = 0, E = Op.getNumOperands(); I < E; ++I)

      NewOps.push_back(DAG.getBitcast(MVT::i16, Op.getOperand(I)));

    SDValue Res = DAG.getNode(ISD::BUILD_VECTOR, SDLoc(), IVT, NewOps);

    return DAG.getBitcast(VT, Res);

  }


  if (auto ConvertLow = LowerConvertLow(Op, DAG))

    return ConvertLow;


  SDLoc DL(Op);

  const EVT VecT = Op.getValueType();

  const EVT LaneT = Op.getOperand(0).getValueType();

  const size_t Lanes = Op.getNumOperands();

  bool CanSwizzle = VecT == MVT::v16i8;


  // BUILD_VECTORs are lowered to the instruction that initializes the highest

  // possible number of lanes at once followed by a sequence of replace_lane

  // instructions to individually initialize any remaining lanes.


  // TODO: Tune this. For example, lanewise swizzling is very expensive, so

  // swizzled lanes should be given greater weight.


  // TODO: Investigate looping rather than always extracting/replacing specific

  // lanes to fill gaps.


  auto IsConstant = [](const SDValue &V) {

    return V.getOpcode() == ISD::Constant || V.getOpcode() == ISD::ConstantFP;

  };


  // Returns the source vector and index vector pair if they exist. Checks for:

  //   (extract_vector_elt

  //     $src,

  //     (sign_extend_inreg (extract_vector_elt $indices, $i))

  //   )

  auto GetSwizzleSrcs = [](size_t I, const SDValue &Lane) {

    auto Bail = std::make_pair(SDValue(), SDValue());

    if (Lane->getOpcode() != ISD::EXTRACT_VECTOR_ELT)

      return Bail;

    const SDValue &SwizzleSrc = Lane->getOperand(0);

    const SDValue &IndexExt = Lane->getOperand(1);

    if (IndexExt->getOpcode() != ISD::SIGN_EXTEND_INREG)

      return Bail;

    const SDValue &Index = IndexExt->getOperand(0);

    if (Index->getOpcode() != ISD::EXTRACT_VECTOR_ELT)

      return Bail;

    const SDValue &SwizzleIndices = Index->getOperand(0);

    if (SwizzleSrc.getValueType() != MVT::v16i8 ||

        SwizzleIndices.getValueType() != MVT::v16i8 ||

        Index->getOperand(1)->getOpcode() != ISD::Constant ||

        Index->getConstantOperandVal(1) != I)

      return Bail;

    return std::make_pair(SwizzleSrc, SwizzleIndices);

  };


  // If the lane is extracted from another vector at a constant index, return

  // that vector. The source vector must not have more lanes than the dest

  // because the shufflevector indices are in terms of the destination lanes and

  // would not be able to address the smaller individual source lanes.

  auto GetShuffleSrc = [&](const SDValue &Lane) {

    if (Lane->getOpcode() != ISD::EXTRACT_VECTOR_ELT)

      return SDValue();

    if (!isa<ConstantSDNode>(Lane->getOperand(1).getNode()))

      return SDValue();

    if (Lane->getOperand(0).getValueType().getVectorNumElements() >

        VecT.getVectorNumElements())

      return SDValue();

    return Lane->getOperand(0);

  };


  using ValueEntry = std::pair<SDValue, size_t>;

  SmallVector<ValueEntry, 16> SplatValueCounts;


  using SwizzleEntry = std::pair<std::pair<SDValue, SDValue>, size_t>;

  SmallVector<SwizzleEntry, 16> SwizzleCounts;


  using ShuffleEntry = std::pair<SDValue, size_t>;

  SmallVector<ShuffleEntry, 16> ShuffleCounts;


  auto AddCount = [](auto &Counts, const auto &Val) {

    auto CountIt =

        llvm::find_if(Counts, [&Val](auto E) { return E.first == Val; });

    if (CountIt == Counts.end()) {

      Counts.emplace_back(Val, 1);

    } else {

      CountIt->second++;

    }

  };


  auto GetMostCommon = [](auto &Counts) {

    auto CommonIt = llvm::max_element(Counts, llvm::less_second());

    assert(CommonIt != Counts.end() && "Unexpected all-undef build_vector");

    return *CommonIt;

  };


  size_t NumConstantLanes = 0;


  // Count eligible lanes for each type of vector creation op

  for (size_t I = 0; I < Lanes; ++I) {

    const SDValue &Lane = Op->getOperand(I);

    if (Lane.isUndef())

      continue;


    AddCount(SplatValueCounts, Lane);


    if (IsConstant(Lane))

      NumConstantLanes++;

    if (auto ShuffleSrc = GetShuffleSrc(Lane))

      AddCount(ShuffleCounts, ShuffleSrc);

    if (CanSwizzle) {

      auto SwizzleSrcs = GetSwizzleSrcs(I, Lane);

      if (SwizzleSrcs.first)

        AddCount(SwizzleCounts, SwizzleSrcs);

    }

  }


  SDValue SplatValue;

  size_t NumSplatLanes;

  std::tie(SplatValue, NumSplatLanes) = GetMostCommon(SplatValueCounts);


  SDValue SwizzleSrc;

  SDValue SwizzleIndices;

  size_t NumSwizzleLanes = 0;

  if (SwizzleCounts.size())

    std::forward_as_tuple(std::tie(SwizzleSrc, SwizzleIndices),

                          NumSwizzleLanes) = GetMostCommon(SwizzleCounts);


  // Shuffles can draw from up to two vectors, so find the two most common

  // sources.

  SDValue ShuffleSrc1, ShuffleSrc2;

  size_t NumShuffleLanes = 0;

  if (ShuffleCounts.size()) {

    std::tie(ShuffleSrc1, NumShuffleLanes) = GetMostCommon(ShuffleCounts);

    llvm::erase_if(ShuffleCounts,

                   [&](const auto &Pair) { return Pair.first == ShuffleSrc1; });

  }

  if (ShuffleCounts.size()) {

    size_t AdditionalShuffleLanes;

    std::tie(ShuffleSrc2, AdditionalShuffleLanes) =

        GetMostCommon(ShuffleCounts);

    NumShuffleLanes += AdditionalShuffleLanes;

  }


  // Predicate returning true if the lane is properly initialized by the

  // original instruction

  std::function<bool(size_t, const SDValue &)> IsLaneConstructed;

  SDValue Result;

  // Prefer swizzles over shuffles over vector consts over splats

  if (NumSwizzleLanes >= NumShuffleLanes &&

      NumSwizzleLanes >= NumConstantLanes && NumSwizzleLanes >= NumSplatLanes) {

    Result = DAG.getNode(WebAssemblyISD::SWIZZLE, DL, VecT, SwizzleSrc,

                         SwizzleIndices);

    auto Swizzled = std::make_pair(SwizzleSrc, SwizzleIndices);

    IsLaneConstructed = [&, Swizzled](size_t I, const SDValue &Lane) {

      return Swizzled == GetSwizzleSrcs(I, Lane);

    };

  } else if (NumShuffleLanes >= NumConstantLanes &&

             NumShuffleLanes >= NumSplatLanes) {

    size_t DestLaneSize = VecT.getVectorElementType().getFixedSizeInBits() / 8;

    size_t DestLaneCount = VecT.getVectorNumElements();

    size_t Scale1 = 1;

    size_t Scale2 = 1;

    SDValue Src1 = ShuffleSrc1;

    SDValue Src2 = ShuffleSrc2 ? ShuffleSrc2 : DAG.getUNDEF(VecT);

    if (Src1.getValueType() != VecT) {

      size_t LaneSize =

          Src1.getValueType().getVectorElementType().getFixedSizeInBits() / 8;

      assert(LaneSize > DestLaneSize);

      Scale1 = LaneSize / DestLaneSize;

      Src1 = DAG.getBitcast(VecT, Src1);

    }

    if (Src2.getValueType() != VecT) {

      size_t LaneSize =

          Src2.getValueType().getVectorElementType().getFixedSizeInBits() / 8;

      assert(LaneSize > DestLaneSize);

      Scale2 = LaneSize / DestLaneSize;

      Src2 = DAG.getBitcast(VecT, Src2);

    }


    int Mask[16];

    assert(DestLaneCount <= 16);

    for (size_t I = 0; I < DestLaneCount; ++I) {

      const SDValue &Lane = Op->getOperand(I);

      SDValue Src = GetShuffleSrc(Lane);

      if (Src == ShuffleSrc1) {

        Mask[I] = Lane->getConstantOperandVal(1) * Scale1;

      } else if (Src && Src == ShuffleSrc2) {

        Mask[I] = DestLaneCount + Lane->getConstantOperandVal(1) * Scale2;

      } else {

        Mask[I] = -1;

      }

    }

    ArrayRef<int> MaskRef(Mask, DestLaneCount);

    Result = DAG.getVectorShuffle(VecT, DL, Src1, Src2, MaskRef);

    IsLaneConstructed = [&](size_t, const SDValue &Lane) {

      auto Src = GetShuffleSrc(Lane);

      return Src == ShuffleSrc1 || (Src && Src == ShuffleSrc2);

    };

  } else if (NumConstantLanes >= NumSplatLanes) {

    SmallVector<SDValue, 16> ConstLanes;

    for (const SDValue &Lane : Op->op_values()) {

      if (IsConstant(Lane)) {

        // Values may need to be fixed so that they will sign extend to be

        // within the expected range during ISel. Check whether the value is in

        // bounds based on the lane bit width and if it is out of bounds, lop

        // off the extra bits and subtract 2^n to reflect giving the high bit

        // value -2^(n-1) rather than +2^(n-1). Skip the i64 case because it

        // cannot possibly be out of range.

        auto *Const = dyn_cast<ConstantSDNode>(Lane.getNode());

        int64_t Val = Const ? Const->getSExtValue() : 0;

        uint64_t LaneBits = 128 / Lanes;

        assert((LaneBits == 64 || Val >= -(1ll << (LaneBits - 1))) &&

               "Unexpected out of bounds negative value");

        if (Const && LaneBits != 64 && Val > (1ll << (LaneBits - 1)) - 1) {

          uint64_t Mask = (1ll << LaneBits) - 1;

          auto NewVal = (((uint64_t)Val & Mask) - (1ll << LaneBits)) & Mask;

          ConstLanes.push_back(DAG.getConstant(NewVal, SDLoc(Lane), LaneT));

        } else {

          ConstLanes.push_back(Lane);

        }

      } else if (LaneT.isFloatingPoint()) {

        ConstLanes.push_back(DAG.getConstantFP(0, DL, LaneT));

      } else {

        ConstLanes.push_back(DAG.getConstant(0, DL, LaneT));

      }

    }

    Result = DAG.getBuildVector(VecT, DL, ConstLanes);

    IsLaneConstructed = [&IsConstant](size_t _, const SDValue &Lane) {

      return IsConstant(Lane);

    };

  } else {

    size_t DestLaneSize = VecT.getVectorElementType().getFixedSizeInBits();

    if (NumSplatLanes == 1 && Op->getOperand(0) == SplatValue &&

        (DestLaneSize == 32 || DestLaneSize == 64)) {

      // Could be selected to load_zero.

      Result = DAG.getNode(ISD::SCALAR_TO_VECTOR, DL, VecT, SplatValue);

    } else {

      // Use a splat (which might be selected as a load splat)

      Result = DAG.getSplatBuildVector(VecT, DL, SplatValue);

    }

    IsLaneConstructed = [&SplatValue](size_t _, const SDValue &Lane) {

      return Lane == SplatValue;

    };

  }


  assert(Result);

  assert(IsLaneConstructed);


  // Add replace_lane instructions for any unhandled values

  for (size_t I = 0; I < Lanes; ++I) {

    const SDValue &Lane = Op->getOperand(I);

    if (!Lane.isUndef() && !IsLaneConstructed(I, Lane))

      Result = DAG.getNode(ISD::INSERT_VECTOR_ELT, DL, VecT, Result, Lane,

                           DAG.getConstant(I, DL, MVT::i32));

  }


  return Result;

}


SDValue

WebAssemblyTargetLowering::LowerVECTOR_SHUFFLE(SDValue Op,

                                               SelectionDAG &DAG) const {

  SDLoc DL(Op);

  ArrayRef<int> Mask = cast<ShuffleVectorSDNode>(Op.getNode())->getMask();

  MVT VecType = Op.getOperand(0).getSimpleValueType();

  assert(VecType.is128BitVector() && "Unexpected shuffle vector type");

  size_t LaneBytes = VecType.getVectorElementType().getSizeInBits() / 8;


  // Space for two vector args and sixteen mask indices

  SDValue Ops[18];

  size_t OpIdx = 0;

  Ops[OpIdx++] = Op.getOperand(0);

  Ops[OpIdx++] = Op.getOperand(1);


  // Expand mask indices to byte indices and materialize them as operands

  for (int M : Mask) {

    for (size_t J = 0; J < LaneBytes; ++J) {

      // Lower undefs (represented by -1 in mask) to {0..J}, which use a

      // whole lane of vector input, to allow further reduction at VM. E.g.

      // match an 8x16 byte shuffle to an equivalent cheaper 32x4 shuffle.

      uint64_t ByteIndex = M == -1 ? J : (uint64_t)M * LaneBytes + J;

      Ops[OpIdx++] = DAG.getConstant(ByteIndex, DL, MVT::i32);

    }

  }


  return DAG.getNode(WebAssemblyISD::SHUFFLE, DL, Op.getValueType(), Ops);

}


SDValue WebAssemblyTargetLowering::LowerSETCC(SDValue Op,

                                              SelectionDAG &DAG) const {

  SDLoc DL(Op);

  // The legalizer does not know how to expand the unsupported comparison modes

  // of i64x2 vectors, so we manually unroll them here.

  assert(Op->getOperand(0)->getSimpleValueType(0) == MVT::v2i64);

  SmallVector<SDValue, 2> LHS, RHS;

  DAG.ExtractVectorElements(Op->getOperand(0), LHS);

  DAG.ExtractVectorElements(Op->getOperand(1), RHS);

  const SDValue &CC = Op->getOperand(2);

  auto MakeLane = [&](unsigned I) {

    return DAG.getNode(ISD::SELECT_CC, DL, MVT::i64, LHS[I], RHS[I],

                       DAG.getConstant(uint64_t(-1), DL, MVT::i64),

                       DAG.getConstant(uint64_t(0), DL, MVT::i64), CC);

  };

  return DAG.getBuildVector(Op->getValueType(0), DL,

                            {MakeLane(0), MakeLane(1)});

}


SDValue

WebAssemblyTargetLowering::LowerAccessVectorElement(SDValue Op,

                                                    SelectionDAG &DAG) const {

  // Allow constant lane indices, expand variable lane indices

  SDNode *IdxNode = Op.getOperand(Op.getNumOperands() - 1).getNode();

  if (isa<ConstantSDNode>(IdxNode)) {

    // Ensure the index type is i32 to match the tablegen patterns

    uint64_t Idx = IdxNode->getAsZExtVal();

    SmallVector<SDValue, 3> Ops(Op.getNode()->ops());

    Ops[Op.getNumOperands() - 1] =

        DAG.getConstant(Idx, SDLoc(IdxNode), MVT::i32);

    return DAG.getNode(Op.getOpcode(), SDLoc(Op), Op.getValueType(), Ops);

  }

  // Perform default expansion

  return SDValue();

}


static SDValue unrollVectorShift(SDValue Op, SelectionDAG &DAG) {

  EVT LaneT = Op.getSimpleValueType().getVectorElementType();

  // 32-bit and 64-bit unrolled shifts will have proper semantics

  if (LaneT.bitsGE(MVT::i32))

    return DAG.UnrollVectorOp(Op.getNode());

  // Otherwise mask the shift value to get proper semantics from 32-bit shift

  SDLoc DL(Op);

  size_t NumLanes = Op.getSimpleValueType().getVectorNumElements();

  SDValue Mask = DAG.getConstant(LaneT.getSizeInBits() - 1, DL, MVT::i32);

  unsigned ShiftOpcode = Op.getOpcode();

  SmallVector<SDValue, 16> ShiftedElements;

  DAG.ExtractVectorElements(Op.getOperand(0), ShiftedElements, 0, 0, MVT::i32);

  SmallVector<SDValue, 16> ShiftElements;

  DAG.ExtractVectorElements(Op.getOperand(1), ShiftElements, 0, 0, MVT::i32);

  SmallVector<SDValue, 16> UnrolledOps;

  for (size_t i = 0; i < NumLanes; ++i) {

    SDValue MaskedShiftValue =

        DAG.getNode(ISD::AND, DL, MVT::i32, ShiftElements[i], Mask);

    SDValue ShiftedValue = ShiftedElements[i];

    if (ShiftOpcode == ISD::SRA)

      ShiftedValue = DAG.getNode(ISD::SIGN_EXTEND_INREG, DL, MVT::i32,

                                 ShiftedValue, DAG.getValueType(LaneT));

    UnrolledOps.push_back(

        DAG.getNode(ShiftOpcode, DL, MVT::i32, ShiftedValue, MaskedShiftValue));

  }

  return DAG.getBuildVector(Op.getValueType(), DL, UnrolledOps);

}


SDValue WebAssemblyTargetLowering::LowerShift(SDValue Op,

                                              SelectionDAG &DAG) const {

  SDLoc DL(Op);


  // Only manually lower vector shifts

  assert(Op.getSimpleValueType().isVector());


  uint64_t LaneBits = Op.getValueType().getScalarSizeInBits();

  auto ShiftVal = Op.getOperand(1);


  // Try to skip bitmask operation since it is implied inside shift instruction

  auto SkipImpliedMask = [](SDValue MaskOp, uint64_t MaskBits) {

    if (MaskOp.getOpcode() != ISD::AND)

      return MaskOp;

    SDValue LHS = MaskOp.getOperand(0);

    SDValue RHS = MaskOp.getOperand(1);

    if (MaskOp.getValueType().isVector()) {

      APInt MaskVal;

      if (!ISD::isConstantSplatVector(RHS.getNode(), MaskVal))

        std::swap(LHS, RHS);


      if (ISD::isConstantSplatVector(RHS.getNode(), MaskVal) &&

          MaskVal == MaskBits)

        MaskOp = LHS;

    } else {

      if (!isa<ConstantSDNode>(RHS.getNode()))

        std::swap(LHS, RHS);


      auto ConstantRHS = dyn_cast<ConstantSDNode>(RHS.getNode());

      if (ConstantRHS && ConstantRHS->getAPIntValue() == MaskBits)

        MaskOp = LHS;

    }


    return MaskOp;

  };


  // Skip vector and operation

  ShiftVal = SkipImpliedMask(ShiftVal, LaneBits - 1);

  ShiftVal = DAG.getSplatValue(ShiftVal);

  if (!ShiftVal)

    return unrollVectorShift(Op, DAG);


  // Skip scalar and operation

  ShiftVal = SkipImpliedMask(ShiftVal, LaneBits - 1);

  // Use anyext because none of the high bits can affect the shift

  ShiftVal = DAG.getAnyExtOrTrunc(ShiftVal, DL, MVT::i32);


  unsigned Opcode;

  switch (Op.getOpcode()) {

  case ISD::SHL:

    Opcode = WebAssemblyISD::VEC_SHL;

    break;

  case ISD::SRA:

    Opcode = WebAssemblyISD::VEC_SHR_S;

    break;

  case ISD::SRL:

    Opcode = WebAssemblyISD::VEC_SHR_U;

    break;

  default:

    llvm_unreachable("unexpected opcode");

  }


  return DAG.getNode(Opcode, DL, Op.getValueType(), Op.getOperand(0), ShiftVal);

}


SDValue WebAssemblyTargetLowering::LowerFP_TO_INT_SAT(SDValue Op,

                                                      SelectionDAG &DAG) const {

  EVT ResT = Op.getValueType();

  EVT SatVT = cast<VTSDNode>(Op.getOperand(1))->getVT();


  if ((ResT == MVT::i32 || ResT == MVT::i64) &&

      (SatVT == MVT::i32 || SatVT == MVT::i64))

    return Op;


  if (ResT == MVT::v4i32 && SatVT == MVT::i32)

    return Op;


  if (ResT == MVT::v8i16 && SatVT == MVT::i16)

    return Op;


  return SDValue();

}


//===----------------------------------------------------------------------===//

//   Custom DAG combine hooks

//===----------------------------------------------------------------------===//

static SDValue

performVECTOR_SHUFFLECombine(SDNode *N, TargetLowering::DAGCombinerInfo &DCI) {

  auto &DAG = DCI.DAG;

  auto Shuffle = cast<ShuffleVectorSDNode>(N);


  // Hoist vector bitcasts that don't change the number of lanes out of unary

  // shuffles, where they are less likely to get in the way of other combines.

  // (shuffle (vNxT1 (bitcast (vNxT0 x))), undef, mask) ->

  //  (vNxT1 (bitcast (vNxT0 (shuffle x, undef, mask))))

  SDValue Bitcast = N->getOperand(0);

  if (Bitcast.getOpcode() != ISD::BITCAST)

    return SDValue();

  if (!N->getOperand(1).isUndef())

    return SDValue();

  SDValue CastOp = Bitcast.getOperand(0);

  EVT SrcType = CastOp.getValueType();

  EVT DstType = Bitcast.getValueType();

  if (!SrcType.is128BitVector() ||

      SrcType.getVectorNumElements() != DstType.getVectorNumElements())

    return SDValue();

  SDValue NewShuffle = DAG.getVectorShuffle(

      SrcType, SDLoc(N), CastOp, DAG.getUNDEF(SrcType), Shuffle->getMask());

  return DAG.getBitcast(DstType, NewShuffle);

}


/// Convert ({u,s}itofp vec) --> ({u,s}itofp ({s,z}ext vec)) so it doesn't get

/// split up into scalar instructions during legalization, and the vector

/// extending instructions are selected in performVectorExtendCombine below.

static SDValue

performVectorExtendToFPCombine(SDNode *N,

                               TargetLowering::DAGCombinerInfo &DCI) {

  auto &DAG = DCI.DAG;

  assert(N->getOpcode() == ISD::UINT_TO_FP ||

         N->getOpcode() == ISD::SINT_TO_FP);


  EVT InVT = N->getOperand(0)->getValueType(0);

  EVT ResVT = N->getValueType(0);

  MVT ExtVT;

  if (ResVT == MVT::v4f32 && (InVT == MVT::v4i16 || InVT == MVT::v4i8))

    ExtVT = MVT::v4i32;

  else if (ResVT == MVT::v2f64 && (InVT == MVT::v2i16 || InVT == MVT::v2i8))

    ExtVT = MVT::v2i32;

  else

    return SDValue();


  unsigned Op =

      N->getOpcode() == ISD::UINT_TO_FP ? ISD::ZERO_EXTEND : ISD::SIGN_EXTEND;

  SDValue Conv = DAG.getNode(Op, SDLoc(N), ExtVT, N->getOperand(0));

  return DAG.getNode(N->getOpcode(), SDLoc(N), ResVT, Conv);

}


static SDValue

performVectorNonNegToFPCombine(SDNode *N,

                               TargetLowering::DAGCombinerInfo &DCI) {

  auto &DAG = DCI.DAG;


  SDNodeFlags Flags = N->getFlags();

  SDValue Op0 = N->getOperand(0);

  EVT VT = N->getValueType(0);


  // Optimize uitofp to sitofp when the sign bit is known to be zero.

  // Depending on the target (runtime) backend, this might be performance

  // neutral (e.g. AArch64) or a significant improvement (e.g. x86_64).

  if (VT.isVector() && (Flags.hasNonNeg() || DAG.SignBitIsZero(Op0))) {

    return DAG.getNode(ISD::SINT_TO_FP, SDLoc(N), VT, Op0);

  }


  return SDValue();

}


static SDValue

performVectorExtendCombine(SDNode *N, TargetLowering::DAGCombinerInfo &DCI) {

  auto &DAG = DCI.DAG;

  assert(N->getOpcode() == ISD::SIGN_EXTEND ||

         N->getOpcode() == ISD::ZERO_EXTEND);


  // Combine ({s,z}ext (extract_subvector src, i)) into a widening operation if

  // possible before the extract_subvector can be expanded.

  auto Extract = N->getOperand(0);

  if (Extract.getOpcode() != ISD::EXTRACT_SUBVECTOR)

    return SDValue();

  auto Source = Extract.getOperand(0);

  auto *IndexNode = dyn_cast<ConstantSDNode>(Extract.getOperand(1));

  if (IndexNode == nullptr)

    return SDValue();

  auto Index = IndexNode->getZExtValue();


  // Only v8i8, v4i16, and v2i32 extracts can be widened, and only if the

  // extracted subvector is the low or high half of its source.

  EVT ResVT = N->getValueType(0);

  if (ResVT == MVT::v8i16) {

    if (Extract.getValueType() != MVT::v8i8 ||

        Source.getValueType() != MVT::v16i8 || (Index != 0 && Index != 8))

      return SDValue();

  } else if (ResVT == MVT::v4i32) {

    if (Extract.getValueType() != MVT::v4i16 ||

        Source.getValueType() != MVT::v8i16 || (Index != 0 && Index != 4))

      return SDValue();

  } else if (ResVT == MVT::v2i64) {

    if (Extract.getValueType() != MVT::v2i32 ||

        Source.getValueType() != MVT::v4i32 || (Index != 0 && Index != 2))

      return SDValue();

  } else {

    return SDValue();

  }


  bool IsSext = N->getOpcode() == ISD::SIGN_EXTEND;

  bool IsLow = Index == 0;


  unsigned Op = IsSext ? (IsLow ? WebAssemblyISD::EXTEND_LOW_S

                                : WebAssemblyISD::EXTEND_HIGH_S)

                       : (IsLow ? WebAssemblyISD::EXTEND_LOW_U

                                : WebAssemblyISD::EXTEND_HIGH_U);


  return DAG.getNode(Op, SDLoc(N), ResVT, Source);

}


static SDValue

performVectorTruncZeroCombine(SDNode *N, TargetLowering::DAGCombinerInfo &DCI) {

  auto &DAG = DCI.DAG;


  auto GetWasmConversionOp = [](unsigned Op) {

    switch (Op) {

    case ISD::FP_TO_SINT_SAT:

      return WebAssemblyISD::TRUNC_SAT_ZERO_S;

    case ISD::FP_TO_UINT_SAT:

      return WebAssemblyISD::TRUNC_SAT_ZERO_U;

    case ISD::FP_ROUND:

      return WebAssemblyISD::DEMOTE_ZERO;

    }

    llvm_unreachable("unexpected op");

  };


  auto IsZeroSplat = [](SDValue SplatVal) {

    auto *Splat = dyn_cast<BuildVectorSDNode>(SplatVal.getNode());

    APInt SplatValue, SplatUndef;

    unsigned SplatBitSize;

    bool HasAnyUndefs;

    // Endianness doesn't matter in this context because we are looking for

    // an all-zero value.

    return Splat &&

           Splat->isConstantSplat(SplatValue, SplatUndef, SplatBitSize,

                                  HasAnyUndefs) &&

           SplatValue == 0;

  };


  if (N->getOpcode() == ISD::CONCAT_VECTORS) {

    // Combine this:

    //

    //   (concat_vectors (v2i32 (fp_to_{s,u}int_sat $x, 32)), (v2i32 (splat 0)))

    //

    // into (i32x4.trunc_sat_f64x2_zero_{s,u} $x).

    //

    // Or this:

    //

    //   (concat_vectors (v2f32 (fp_round (v2f64 $x))), (v2f32 (splat 0)))

    //

    // into (f32x4.demote_zero_f64x2 $x).

    EVT ResVT;

    EVT ExpectedConversionType;

    auto Conversion = N->getOperand(0);

    auto ConversionOp = Conversion.getOpcode();

    switch (ConversionOp) {

    case ISD::FP_TO_SINT_SAT:

    case ISD::FP_TO_UINT_SAT:

      ResVT = MVT::v4i32;

      ExpectedConversionType = MVT::v2i32;

      break;

    case ISD::FP_ROUND:

      ResVT = MVT::v4f32;

      ExpectedConversionType = MVT::v2f32;

      break;

    default:

      return SDValue();

    }


    if (N->getValueType(0) != ResVT)

      return SDValue();


    if (Conversion.getValueType() != ExpectedConversionType)

      return SDValue();


    auto Source = Conversion.getOperand(0);

    if (Source.getValueType() != MVT::v2f64)

      return SDValue();


    if (!IsZeroSplat(N->getOperand(1)) ||

        N->getOperand(1).getValueType() != ExpectedConversionType)

      return SDValue();


    unsigned Op = GetWasmConversionOp(ConversionOp);

    return DAG.getNode(Op, SDLoc(N), ResVT, Source);

  }


  // Combine this:

  //

  //   (fp_to_{s,u}int_sat (concat_vectors $x, (v2f64 (splat 0))), 32)

  //

  // into (i32x4.trunc_sat_f64x2_zero_{s,u} $x).

  //

  // Or this:

  //

  //   (v4f32 (fp_round (concat_vectors $x, (v2f64 (splat 0)))))

  //

  // into (f32x4.demote_zero_f64x2 $x).

  EVT ResVT;

  auto ConversionOp = N->getOpcode();

  switch (ConversionOp) {

  case ISD::FP_TO_SINT_SAT:

  case ISD::FP_TO_UINT_SAT:

    ResVT = MVT::v4i32;

    break;

  case ISD::FP_ROUND:

    ResVT = MVT::v4f32;

    break;

  default:

    llvm_unreachable("unexpected op");

  }


  if (N->getValueType(0) != ResVT)

    return SDValue();


  auto Concat = N->getOperand(0);

  if (Concat.getValueType() != MVT::v4f64)

    return SDValue();


  auto Source = Concat.getOperand(0);

  if (Source.getValueType() != MVT::v2f64)

    return SDValue();


  if (!IsZeroSplat(Concat.getOperand(1)) ||

      Concat.getOperand(1).getValueType() != MVT::v2f64)

    return SDValue();


  unsigned Op = GetWasmConversionOp(ConversionOp);

  return DAG.getNode(Op, SDLoc(N), ResVT, Source);

}


// Helper to extract VectorWidth bits from Vec, starting from IdxVal.

static SDValue extractSubVector(SDValue Vec, unsigned IdxVal, SelectionDAG &DAG,

                                const SDLoc &DL, unsigned VectorWidth) {

  EVT VT = Vec.getValueType();

  EVT ElVT = VT.getVectorElementType();

  unsigned Factor = VT.getSizeInBits() / VectorWidth;

  EVT ResultVT = EVT::getVectorVT(*DAG.getContext(), ElVT,

                                  VT.getVectorNumElements() / Factor);


  // Extract the relevant VectorWidth bits.  Generate an EXTRACT_SUBVECTOR

  unsigned ElemsPerChunk = VectorWidth / ElVT.getSizeInBits();

  assert(isPowerOf2_32(ElemsPerChunk) && "Elements per chunk not power of 2");


  // This is the index of the first element of the VectorWidth-bit chunk

  // we want. Since ElemsPerChunk is a power of 2 just need to clear bits.

  IdxVal &= ~(ElemsPerChunk - 1);


  // If the input is a buildvector just emit a smaller one.

  if (Vec.getOpcode() == ISD::BUILD_VECTOR)

    return DAG.getBuildVector(ResultVT, DL,

                              Vec->ops().slice(IdxVal, ElemsPerChunk));


  SDValue VecIdx = DAG.getIntPtrConstant(IdxVal, DL);

  return DAG.getNode(ISD::EXTRACT_SUBVECTOR, DL, ResultVT, Vec, VecIdx);

}


// Helper to recursively truncate vector elements in half with NARROW_U. DstVT

// is the expected destination value type after recursion. In is the initial

// input. Note that the input should have enough leading zero bits to prevent

// NARROW_U from saturating results.

static SDValue truncateVectorWithNARROW(EVT DstVT, SDValue In, const SDLoc &DL,

                                        SelectionDAG &DAG) {

  EVT SrcVT = In.getValueType();


  // No truncation required, we might get here due to recursive calls.

  if (SrcVT == DstVT)

    return In;


  unsigned SrcSizeInBits = SrcVT.getSizeInBits();

  unsigned NumElems = SrcVT.getVectorNumElements();

  if (!isPowerOf2_32(NumElems))

    return SDValue();

  assert(DstVT.getVectorNumElements() == NumElems && "Illegal truncation");

  assert(SrcSizeInBits > DstVT.getSizeInBits() && "Illegal truncation");


  LLVMContext &Ctx = *DAG.getContext();

  EVT PackedSVT = EVT::getIntegerVT(Ctx, SrcVT.getScalarSizeInBits() / 2);


  // Narrow to the largest type possible:

  // vXi64/vXi32 -> i16x8.narrow_i32x4_u and vXi16 -> i8x16.narrow_i16x8_u.

  EVT InVT = MVT::i16, OutVT = MVT::i8;

  if (SrcVT.getScalarSizeInBits() > 16) {

    InVT = MVT::i32;

    OutVT = MVT::i16;

  }

  unsigned SubSizeInBits = SrcSizeInBits / 2;

  InVT = EVT::getVectorVT(Ctx, InVT, SubSizeInBits / InVT.getSizeInBits());

  OutVT = EVT::getVectorVT(Ctx, OutVT, SubSizeInBits / OutVT.getSizeInBits());


  // Split lower/upper subvectors.

  SDValue Lo = extractSubVector(In, 0, DAG, DL, SubSizeInBits);

  SDValue Hi = extractSubVector(In, NumElems / 2, DAG, DL, SubSizeInBits);


  // 256bit -> 128bit truncate - Narrow lower/upper 128-bit subvectors.

  if (SrcVT.is256BitVector() && DstVT.is128BitVector()) {

    Lo = DAG.getBitcast(InVT, Lo);

    Hi = DAG.getBitcast(InVT, Hi);

    SDValue Res = DAG.getNode(WebAssemblyISD::NARROW_U, DL, OutVT, Lo, Hi);

    return DAG.getBitcast(DstVT, Res);

  }


  // Recursively narrow lower/upper subvectors, concat result and narrow again.

  EVT PackedVT = EVT::getVectorVT(Ctx, PackedSVT, NumElems / 2);

  Lo = truncateVectorWithNARROW(PackedVT, Lo, DL, DAG);

  Hi = truncateVectorWithNARROW(PackedVT, Hi, DL, DAG);


  PackedVT = EVT::getVectorVT(Ctx, PackedSVT, NumElems);

  SDValue Res = DAG.getNode(ISD::CONCAT_VECTORS, DL, PackedVT, Lo, Hi);

  return truncateVectorWithNARROW(DstVT, Res, DL, DAG);

}


static SDValue performTruncateCombine(SDNode *N,

                                      TargetLowering::DAGCombinerInfo &DCI) {

  auto &DAG = DCI.DAG;


  SDValue In = N->getOperand(0);

  EVT InVT = In.getValueType();

  if (!InVT.isSimple())

    return SDValue();


  EVT OutVT = N->getValueType(0);

  if (!OutVT.isVector())

    return SDValue();


  EVT OutSVT = OutVT.getVectorElementType();

  EVT InSVT = InVT.getVectorElementType();

  // Currently only cover truncate to v16i8 or v8i16.

  if (!((InSVT == MVT::i16 || InSVT == MVT::i32 || InSVT == MVT::i64) &&

        (OutSVT == MVT::i8 || OutSVT == MVT::i16) && OutVT.is128BitVector()))

    return SDValue();


  SDLoc DL(N);

  APInt Mask = APInt::getLowBitsSet(InVT.getScalarSizeInBits(),

                                    OutVT.getScalarSizeInBits());

  In = DAG.getNode(ISD::AND, DL, InVT, In, DAG.getConstant(Mask, DL, InVT));

  return truncateVectorWithNARROW(OutVT, In, DL, DAG);

}


static SDValue performBitcastCombine(SDNode *N,

                                     TargetLowering::DAGCombinerInfo &DCI) {

  using namespace llvm::SDPatternMatch;

  auto &DAG = DCI.DAG;

  SDLoc DL(N);

  SDValue Src = N->getOperand(0);

  EVT VT = N->getValueType(0);

  EVT SrcVT = Src.getValueType();


  if (!(DCI.isBeforeLegalize() && VT.isScalarInteger() &&

        SrcVT.isFixedLengthVector() && SrcVT.getScalarType() == MVT::i1))

    return SDValue();


  unsigned NumElts = SrcVT.getVectorNumElements();

  EVT Width = MVT::getIntegerVT(128 / NumElts);


  // bitcast <N x i1> to iN, where N = 2, 4, 8, 16 (legal)

  //   ==> bitmask

  if (NumElts == 2 || NumElts == 4 || NumElts == 8 || NumElts == 16) {

    return DAG.getZExtOrTrunc(

        DAG.getNode(ISD::INTRINSIC_WO_CHAIN, DL, MVT::i32,

                    {DAG.getConstant(Intrinsic::wasm_bitmask, DL, MVT::i32),

                     DAG.getSExtOrTrunc(N->getOperand(0), DL,

                                        SrcVT.changeVectorElementType(Width))}),

        DL, VT);

  }


  // bitcast <N x i1>(setcc ...) to concat iN, where N = 32 and 64 (illegal)

  if (NumElts == 32 || NumElts == 64) {

    // Strategy: We will setcc them seperately in v16i8 -> v16i1

    // Bitcast them to i16, extend them to either i32 or i64.

    // Add them together, shifting left 1 by 1.

    SDValue Concat, SetCCVector;

    ISD::CondCode SetCond;


    if (!sd_match(N, m_BitCast(m_c_SetCC(m_Value(Concat), m_Value(SetCCVector),

                                         m_CondCode(SetCond)))))

      return SDValue();

    if (Concat.getOpcode() != ISD::CONCAT_VECTORS)

      return SDValue();


    uint64_t ElementWidth =

        SetCCVector.getValueType().getVectorElementType().getFixedSizeInBits();


    SmallVector<SDValue> VectorsToShuffle;

    for (size_t I = 0; I < Concat->ops().size(); I++) {

      VectorsToShuffle.push_back(DAG.getBitcast(

          MVT::i16,

          DAG.getSetCC(DL, MVT::v16i1, Concat->ops()[I],

                       extractSubVector(SetCCVector, I * (128 / ElementWidth),

                                        DAG, DL, 128),

                       SetCond)));

    }


    MVT ReturnType = VectorsToShuffle.size() == 2 ? MVT::i32 : MVT::i64;

    SDValue ReturningInteger = DAG.getConstant(0, DL, ReturnType);


    for (SDValue V : VectorsToShuffle) {

      ReturningInteger = DAG.getNode(

          ISD::SHL, DL, ReturnType,

          {DAG.getShiftAmountConstant(16, ReturnType, DL), ReturningInteger});


      SDValue ExtendedV = DAG.getZExtOrTrunc(V, DL, ReturnType);

      ReturningInteger =

          DAG.getNode(ISD::ADD, DL, ReturnType, {ReturningInteger, ExtendedV});

    }


    return ReturningInteger;

  }


  return SDValue();

}


static SDValue performAnyAllCombine(SDNode *N, SelectionDAG &DAG) {

  // any_true (setcc <X>, 0, eq) => (not (all_true X))

  // all_true (setcc <X>, 0, eq) => (not (any_true X))

  // any_true (setcc <X>, 0, ne) => (any_true X)

  // all_true (setcc <X>, 0, ne) => (all_true X)

  assert(N->getOpcode() == ISD::INTRINSIC_WO_CHAIN);

  using namespace llvm::SDPatternMatch;


  SDValue LHS;

  if (!sd_match(N->getOperand(1),

                m_c_SetCC(m_Value(LHS), m_Zero(), m_CondCode())))

    return SDValue();

  EVT LT = LHS.getValueType();

  if (LT.getScalarSizeInBits() > 128 / LT.getVectorNumElements())

    return SDValue();


  auto CombineSetCC = [&N, &DAG](Intrinsic::WASMIntrinsics InPre,

                                 ISD::CondCode SetType,

                                 Intrinsic::WASMIntrinsics InPost) {

    if (N->getConstantOperandVal(0) != InPre)

      return SDValue();


    SDValue LHS;

    if (!sd_match(N->getOperand(1), m_c_SetCC(m_Value(LHS), m_Zero(),

                                              m_SpecificCondCode(SetType))))

      return SDValue();


    SDLoc DL(N);

    SDValue Ret = DAG.getZExtOrTrunc(

        DAG.getNode(ISD::INTRINSIC_WO_CHAIN, DL, MVT::i32,

                    {DAG.getConstant(InPost, DL, MVT::i32), LHS}),

        DL, MVT::i1);

    if (SetType == ISD::SETEQ)

      Ret = DAG.getNOT(DL, Ret, MVT::i1);

    return DAG.getZExtOrTrunc(Ret, DL, N->getValueType(0));

  };


  if (SDValue AnyTrueEQ = CombineSetCC(Intrinsic::wasm_anytrue, ISD::SETEQ,

                                       Intrinsic::wasm_alltrue))

    return AnyTrueEQ;

  if (SDValue AllTrueEQ = CombineSetCC(Intrinsic::wasm_alltrue, ISD::SETEQ,

                                       Intrinsic::wasm_anytrue))

    return AllTrueEQ;

  if (SDValue AnyTrueNE = CombineSetCC(Intrinsic::wasm_anytrue, ISD::SETNE,

                                       Intrinsic::wasm_anytrue))

    return AnyTrueNE;

  if (SDValue AllTrueNE = CombineSetCC(Intrinsic::wasm_alltrue, ISD::SETNE,

                                       Intrinsic::wasm_alltrue))

    return AllTrueNE;


  return SDValue();

}


template <int MatchRHS, ISD::CondCode MatchCond, bool RequiresNegate,

          Intrinsic::ID Intrin>

static SDValue TryMatchTrue(SDNode *N, EVT VecVT, SelectionDAG &DAG) {

  SDValue LHS = N->getOperand(0);

  SDValue RHS = N->getOperand(1);

  SDValue Cond = N->getOperand(2);

  if (MatchCond != cast<CondCodeSDNode>(Cond)->get())

    return SDValue();


  if (MatchRHS != cast<ConstantSDNode>(RHS)->getSExtValue())

    return SDValue();


  SDLoc DL(N);

  SDValue Ret = DAG.getZExtOrTrunc(

      DAG.getNode(ISD::INTRINSIC_WO_CHAIN, DL, MVT::i32,

                  {DAG.getConstant(Intrin, DL, MVT::i32),

                   DAG.getSExtOrTrunc(LHS->getOperand(0), DL, VecVT)}),

      DL, MVT::i1);

  if (RequiresNegate)

    Ret = DAG.getNOT(DL, Ret, MVT::i1);

  return DAG.getZExtOrTrunc(Ret, DL, N->getValueType(0));

}


/// Try to convert a i128 comparison to a v16i8 comparison before type

/// legalization splits it up into chunks

static SDValue

combineVectorSizedSetCCEquality(SDNode *N, TargetLowering::DAGCombinerInfo &DCI,

                                const WebAssemblySubtarget *Subtarget) {


  SDLoc DL(N);

  SDValue X = N->getOperand(0);

  SDValue Y = N->getOperand(1);

  EVT VT = N->getValueType(0);

  EVT OpVT = X.getValueType();


  SelectionDAG &DAG = DCI.DAG;

  if (DCI.DAG.getMachineFunction().getFunction().hasFnAttribute(

          Attribute::NoImplicitFloat))

    return SDValue();


  ISD::CondCode CC = cast<CondCodeSDNode>(N->getOperand(2))->get();

  // We're looking for an oversized integer equality comparison with SIMD

  if (!OpVT.isScalarInteger() || !OpVT.isByteSized() || OpVT != MVT::i128 ||

      !Subtarget->hasSIMD128() || !isIntEqualitySetCC(CC))

    return SDValue();


  // Don't perform this combine if constructing the vector will be expensive.

  auto IsVectorBitCastCheap = [](SDValue X) {

    X = peekThroughBitcasts(X);

    return isa<ConstantSDNode>(X) || X.getOpcode() == ISD::LOAD;

  };


  if (!IsVectorBitCastCheap(X) || !IsVectorBitCastCheap(Y))

    return SDValue();


  SDValue VecX = DAG.getBitcast(MVT::v16i8, X);

  SDValue VecY = DAG.getBitcast(MVT::v16i8, Y);

  SDValue Cmp = DAG.getSetCC(DL, MVT::v16i8, VecX, VecY, CC);


  SDValue Intr =

      DAG.getNode(ISD::INTRINSIC_WO_CHAIN, DL, MVT::i32,

                  {DAG.getConstant(CC == ISD::SETEQ ? Intrinsic::wasm_alltrue

                                                    : Intrinsic::wasm_anytrue,

                                   DL, MVT::i32),

                   Cmp});


  return DAG.getSetCC(DL, VT, Intr, DAG.getConstant(0, DL, MVT::i32),

                      ISD::SETNE);

}


static SDValue performSETCCCombine(SDNode *N,

                                   TargetLowering::DAGCombinerInfo &DCI,

                                   const WebAssemblySubtarget *Subtarget) {

  if (!DCI.isBeforeLegalize())

    return SDValue();


  EVT VT = N->getValueType(0);

  if (!VT.isScalarInteger())

    return SDValue();


  if (SDValue V = combineVectorSizedSetCCEquality(N, DCI, Subtarget))

    return V;


  SDValue LHS = N->getOperand(0);

  if (LHS->getOpcode() != ISD::BITCAST)

    return SDValue();


  EVT FromVT = LHS->getOperand(0).getValueType();

  if (!FromVT.isFixedLengthVector() || FromVT.getVectorElementType() != MVT::i1)

    return SDValue();


  unsigned NumElts = FromVT.getVectorNumElements();

  if (NumElts != 2 && NumElts != 4 && NumElts != 8 && NumElts != 16)

    return SDValue();


  if (!cast<ConstantSDNode>(N->getOperand(1)))

    return SDValue();


  EVT VecVT = FromVT.changeVectorElementType(MVT::getIntegerVT(128 / NumElts));

  auto &DAG = DCI.DAG;

  // setcc (iN (bitcast (vNi1 X))), 0, ne

  //   ==> any_true (vNi1 X)

  if (auto Match = TryMatchTrue<0, ISD::SETNE, false, Intrinsic::wasm_anytrue>(

          N, VecVT, DAG)) {

    return Match;

  }

  // setcc (iN (bitcast (vNi1 X))), 0, eq

  //   ==> xor (any_true (vNi1 X)), -1

  if (auto Match = TryMatchTrue<0, ISD::SETEQ, true, Intrinsic::wasm_anytrue>(

          N, VecVT, DAG)) {

    return Match;

  }

  // setcc (iN (bitcast (vNi1 X))), -1, eq

  //   ==> all_true (vNi1 X)

  if (auto Match = TryMatchTrue<-1, ISD::SETEQ, false, Intrinsic::wasm_alltrue>(

          N, VecVT, DAG)) {

    return Match;

  }

  // setcc (iN (bitcast (vNi1 X))), -1, ne

  //   ==> xor (all_true (vNi1 X)), -1

  if (auto Match = TryMatchTrue<-1, ISD::SETNE, true, Intrinsic::wasm_alltrue>(

          N, VecVT, DAG)) {

    return Match;

  }

  return SDValue();

}


static SDValue TryWideExtMulCombine(SDNode *N, SelectionDAG &DAG) {

  EVT VT = N->getValueType(0);

  if (VT != MVT::v8i32 && VT != MVT::v16i32)

    return SDValue();


  // Mul with extending inputs.

  SDValue LHS = N->getOperand(0);

  SDValue RHS = N->getOperand(1);

  if (LHS.getOpcode() != RHS.getOpcode())

    return SDValue();


  if (LHS.getOpcode() != ISD::SIGN_EXTEND &&

      LHS.getOpcode() != ISD::ZERO_EXTEND)

    return SDValue();


  if (LHS->getOperand(0).getValueType() != RHS->getOperand(0).getValueType())

    return SDValue();


  EVT FromVT = LHS->getOperand(0).getValueType();

  EVT EltTy = FromVT.getVectorElementType();

  if (EltTy != MVT::i8)

    return SDValue();


  // For an input DAG that looks like this

  // %a = input_type

  // %b = input_type

  // %lhs = extend %a to output_type

  // %rhs = extend %b to output_type

  // %mul = mul %lhs, %rhs


  // input_type | output_type | instructions

  // v16i8      | v16i32      | %low = i16x8.extmul_low_i8x16_ %a, %b

  //            |             | %high = i16x8.extmul_high_i8x16_, %a, %b

  //            |             | %low_low = i32x4.ext_low_i16x8_ %low

  //            |             | %low_high = i32x4.ext_high_i16x8_ %low

  //            |             | %high_low = i32x4.ext_low_i16x8_ %high

  //            |             | %high_high = i32x4.ext_high_i16x8_ %high

  //            |             | %res = concat_vector(...)

  // v8i8       | v8i32       | %low = i16x8.extmul_low_i8x16_ %a, %b

  //            |             | %low_low = i32x4.ext_low_i16x8_ %low

  //            |             | %low_high = i32x4.ext_high_i16x8_ %low

  //            |             | %res = concat_vector(%low_low, %low_high)


  SDLoc DL(N);

  unsigned NumElts = VT.getVectorNumElements();

  SDValue ExtendInLHS = LHS->getOperand(0);

  SDValue ExtendInRHS = RHS->getOperand(0);

  bool IsSigned = LHS->getOpcode() == ISD::SIGN_EXTEND;

  unsigned ExtendLowOpc =

      IsSigned ? WebAssemblyISD::EXTEND_LOW_S : WebAssemblyISD::EXTEND_LOW_U;

  unsigned ExtendHighOpc =

      IsSigned ? WebAssemblyISD::EXTEND_HIGH_S : WebAssemblyISD::EXTEND_HIGH_U;


  auto GetExtendLow = [&DAG, &DL, &ExtendLowOpc](EVT VT, SDValue Op) {

    return DAG.getNode(ExtendLowOpc, DL, VT, Op);

  };

  auto GetExtendHigh = [&DAG, &DL, &ExtendHighOpc](EVT VT, SDValue Op) {

    return DAG.getNode(ExtendHighOpc, DL, VT, Op);

  };


  if (NumElts == 16) {

    SDValue LowLHS = GetExtendLow(MVT::v8i16, ExtendInLHS);

    SDValue LowRHS = GetExtendLow(MVT::v8i16, ExtendInRHS);

    SDValue MulLow = DAG.getNode(ISD::MUL, DL, MVT::v8i16, LowLHS, LowRHS);

    SDValue HighLHS = GetExtendHigh(MVT::v8i16, ExtendInLHS);

    SDValue HighRHS = GetExtendHigh(MVT::v8i16, ExtendInRHS);

    SDValue MulHigh = DAG.getNode(ISD::MUL, DL, MVT::v8i16, HighLHS, HighRHS);

    SDValue SubVectors[] = {

        GetExtendLow(MVT::v4i32, MulLow),

        GetExtendHigh(MVT::v4i32, MulLow),

        GetExtendLow(MVT::v4i32, MulHigh),

        GetExtendHigh(MVT::v4i32, MulHigh),

    };

    return DAG.getNode(ISD::CONCAT_VECTORS, DL, VT, SubVectors);

  } else {

    assert(NumElts == 8);

    SDValue LowLHS = DAG.getNode(LHS->getOpcode(), DL, MVT::v8i16, ExtendInLHS);

    SDValue LowRHS = DAG.getNode(RHS->getOpcode(), DL, MVT::v8i16, ExtendInRHS);

    SDValue MulLow = DAG.getNode(ISD::MUL, DL, MVT::v8i16, LowLHS, LowRHS);

    SDValue Lo = GetExtendLow(MVT::v4i32, MulLow);

    SDValue Hi = GetExtendHigh(MVT::v4i32, MulLow);

    return DAG.getNode(ISD::CONCAT_VECTORS, DL, VT, Lo, Hi);

  }

  return SDValue();

}


static SDValue performMulCombine(SDNode *N,

                                 TargetLowering::DAGCombinerInfo &DCI) {

  assert(N->getOpcode() == ISD::MUL);

  EVT VT = N->getValueType(0);

  if (!VT.isVector())

    return SDValue();


  if (auto Res = TryWideExtMulCombine(N, DCI.DAG))

    return Res;


  // We don't natively support v16i8 or v8i8 mul, but we do support v8i16. So,

  // extend them to v8i16. Only do this before legalization in case a narrow

  // vector is widened and may be simplified later.

  if (!DCI.isBeforeLegalize() || (VT != MVT::v8i8 && VT != MVT::v16i8))

    return SDValue();


  SDLoc DL(N);

  SelectionDAG &DAG = DCI.DAG;

  SDValue LHS = N->getOperand(0);

  SDValue RHS = N->getOperand(1);

  EVT MulVT = MVT::v8i16;


  if (VT == MVT::v8i8) {

    SDValue PromotedLHS = DAG.getNode(ISD::CONCAT_VECTORS, DL, MVT::v16i8, LHS,

                                      DAG.getUNDEF(MVT::v8i8));

    SDValue PromotedRHS = DAG.getNode(ISD::CONCAT_VECTORS, DL, MVT::v16i8, RHS,

                                      DAG.getUNDEF(MVT::v8i8));

    SDValue LowLHS =

        DAG.getNode(WebAssemblyISD::EXTEND_LOW_U, DL, MulVT, PromotedLHS);

    SDValue LowRHS =

        DAG.getNode(WebAssemblyISD::EXTEND_LOW_U, DL, MulVT, PromotedRHS);

    SDValue MulLow = DAG.getBitcast(

        MVT::v16i8, DAG.getNode(ISD::MUL, DL, MulVT, LowLHS, LowRHS));

    // Take the low byte of each lane.

    SDValue Shuffle = DAG.getVectorShuffle(

        MVT::v16i8, DL, MulLow, DAG.getUNDEF(MVT::v16i8),

        {0, 2, 4, 6, 8, 10, 12, 14, -1, -1, -1, -1, -1, -1, -1, -1});

    return extractSubVector(Shuffle, 0, DAG, DL, 64);

  } else {

    assert(VT == MVT::v16i8 && "Expected v16i8");

    SDValue LowLHS = DAG.getNode(WebAssemblyISD::EXTEND_LOW_U, DL, MulVT, LHS);

    SDValue LowRHS = DAG.getNode(WebAssemblyISD::EXTEND_LOW_U, DL, MulVT, RHS);

    SDValue HighLHS =

        DAG.getNode(WebAssemblyISD::EXTEND_HIGH_U, DL, MulVT, LHS);

    SDValue HighRHS =

        DAG.getNode(WebAssemblyISD::EXTEND_HIGH_U, DL, MulVT, RHS);


    SDValue MulLow =

        DAG.getBitcast(VT, DAG.getNode(ISD::MUL, DL, MulVT, LowLHS, LowRHS));

    SDValue MulHigh =

        DAG.getBitcast(VT, DAG.getNode(ISD::MUL, DL, MulVT, HighLHS, HighRHS));


    // Take the low byte of each lane.

    return DAG.getVectorShuffle(

        VT, DL, MulLow, MulHigh,

        {0, 2, 4, 6, 8, 10, 12, 14, 16, 18, 20, 22, 24, 26, 28, 30});

  }

}


SDValue

WebAssemblyTargetLowering::PerformDAGCombine(SDNode *N,

                                             DAGCombinerInfo &DCI) const {

  switch (N->getOpcode()) {

  default:

    return SDValue();

  case ISD::BITCAST:

    return performBitcastCombine(N, DCI);

  case ISD::SETCC:

    return performSETCCCombine(N, DCI, Subtarget);

  case ISD::VECTOR_SHUFFLE:

    return performVECTOR_SHUFFLECombine(N, DCI);

  case ISD::SIGN_EXTEND:

  case ISD::ZERO_EXTEND:

    return performVectorExtendCombine(N, DCI);

  case ISD::UINT_TO_FP:

    if (auto ExtCombine = performVectorExtendToFPCombine(N, DCI))

      return ExtCombine;

    return performVectorNonNegToFPCombine(N, DCI);

  case ISD::SINT_TO_FP:

    return performVectorExtendToFPCombine(N, DCI);

  case ISD::FP_TO_SINT_SAT:

  case ISD::FP_TO_UINT_SAT:

  case ISD::FP_ROUND:

  case ISD::CONCAT_VECTORS:

    return performVectorTruncZeroCombine(N, DCI);

  case ISD::TRUNCATE:

    return performTruncateCombine(N, DCI);

  case ISD::INTRINSIC_WO_CHAIN: {

    if (auto AnyAllCombine = performAnyAllCombine(N, DCI.DAG))

      return AnyAllCombine;

    return performLowerPartialReduction(N, DCI.DAG);

  }

  case ISD::MUL:

    return performMulCombine(N, DCI);

  }

}

MRI
unsigned const MachineRegisterInfo * MRI
Definition: AArch64AdvSIMDScalarPass.cpp:103

SelectTypeKind::FP
@ FP

performMulCombine
static SDValue performMulCombine(SDNode *N, SelectionDAG &DAG, TargetLowering::DAGCombinerInfo &DCI, const AArch64Subtarget *Subtarget)
Definition: AArch64ISelLowering.cpp:19141

performTruncateCombine
static SDValue performTruncateCombine(SDNode *N, SelectionDAG &DAG, TargetLowering::DAGCombinerInfo &DCI)
Definition: AArch64ISelLowering.cpp:21287

performSETCCCombine
static SDValue performSETCCCombine(SDNode *N, TargetLowering::DAGCombinerInfo &DCI, SelectionDAG &DAG)
Definition: AArch64ISelLowering.cpp:25629

assert
assert(UImm &&(UImm !=~static_cast< T >(0)) &&"Invalid immediate!")

Intr
unsigned Intr
Definition: AMDGPUBaseInfo.cpp:3279

MBB
MachineBasicBlock & MBB
Definition: ARMSLSHardening.cpp:71

DL
MachineBasicBlock MachineBasicBlock::iterator DebugLoc DL
Definition: ARMSLSHardening.cpp:73

Results
Function Alias Analysis Results
Definition: AliasAnalysis.cpp:722

fail
static void fail(const SDLoc &DL, SelectionDAG &DAG, const Twine &Msg, SDValue Val={})
Definition: BPFISelLowering.cpp:41

Info
Analysis containing CSE Info
Definition: CSEInfo.cpp:27

CallingConvLower.h

RetTy
return RetTy
Definition: DeadArgumentElimination.cpp:355

Idx
Returns the sub type a function will return at a given Idx Should correspond to the result type of an ExtractValue instruction executed with just that one unsigned Idx
Definition: DeadArgumentElimination.cpp:347

DiagnosticInfo.h

DiagnosticPrinter.h

Sym
Symbol * Sym
Definition: ELF_riscv.cpp:479

X
static GCMetadataPrinterRegistry::Add< ErlangGCPrinter > X("erlang", "erlang-compatible garbage collector")

HashFunctionMode::Local
@ Local

GEP
Hexagon Common GEP
Definition: HexagonCommonGEP.cpp:164

TII
const HexagonInstrInfo * TII
Definition: HexagonCopyToCombine.cpp:118

_
#define _
Definition: HexagonMCCodeEmitter.cpp:47

MI
IRTranslator LLVM IR MI
Definition: IRTranslator.cpp:110

Function.h

IntrinsicInst.h

Intrinsics.h

KnownBits.h

F
#define F(x, y, z)
Definition: MD5.cpp:55

I
#define I(x, y, z)
Definition: MD5.cpp:58

AddrMode
AddrMode
Definition: MSP430Disassembler.cpp:138

MachineFrameInfo.h

MachineInstrBuilder.h

MachineJumpTableInfo.h

MachineModuleInfo.h

MachineRegisterInfo.h

TRI
Register const TargetRegisterInfo * TRI
Definition: MachineSink.cpp:2118

MathExtras.h

Context
@ Context
Definition: MemProfContextDisambiguation.cpp:124

OpIdx
MachineInstr unsigned OpIdx
Definition: NVPTXPrologEpilogPass.cpp:56

Y
static GCMetadataPrinterRegistry::Add< OcamlGCMetadataPrinter > Y("ocaml", "ocaml 3.10-compatible collector")

performVECTOR_SHUFFLECombine
static SDValue performVECTOR_SHUFFLECombine(SDNode *N, SelectionDAG &DAG, const RISCVSubtarget &Subtarget, const RISCVTargetLowering &TLI)
Definition: RISCVISelLowering.cpp:19279

combineVectorSizedSetCCEquality
static SDValue combineVectorSizedSetCCEquality(EVT VT, SDValue X, SDValue Y, ISD::CondCode CC, const SDLoc &DL, SelectionDAG &DAG, const RISCVSubtarget &Subtarget)
Try to map an integer comparison with size > XLEN to vector instructions before type legalization spl...
Definition: RISCVISelLowering.cpp:16564

Cond
const SmallVectorImpl< MachineOperand > & Cond
Definition: RISCVRedundantCopyElimination.cpp:71

Opc
auto Opc
Definition: RISCVRedundantCopyElimination.cpp:75

SDPatternMatch.h
Contains matchers for matching SelectionDAG nodes and values.

SelectionDAGNodes.h

SelectionDAG.h

Int64
@ Int64
Definition: TargetLibraryInfo.cpp:69

TargetOptions.h

LowerFPToInt
static MachineBasicBlock * LowerFPToInt(MachineInstr &MI, DebugLoc DL, MachineBasicBlock *BB, const TargetInstrInfo &TII, bool IsUnsigned, bool Int64, bool Float64, unsigned LoweredOpcode)
Definition: WebAssemblyISelLowering.cpp:513

callingConvSupported
static bool callingConvSupported(CallingConv::ID CallConv)
Definition: WebAssemblyISelLowering.cpp:1186

TryWideExtMulCombine
static SDValue TryWideExtMulCombine(SDNode *N, SelectionDAG &DAG)
Definition: WebAssemblyISelLowering.cpp:3495

LowerMemcpy
static MachineBasicBlock * LowerMemcpy(MachineInstr &MI, DebugLoc DL, MachineBasicBlock *BB, const TargetInstrInfo &TII, bool Int64)
Definition: WebAssemblyISelLowering.cpp:608

IsWebAssemblyLocal
static std::optional< unsigned > IsWebAssemblyLocal(SDValue Op, SelectionDAG &DAG)
Definition: WebAssemblyISelLowering.cpp:1713

performVectorExtendCombine
static SDValue performVectorExtendCombine(SDNode *N, TargetLowering::DAGCombinerInfo &DCI)
Definition: WebAssemblyISelLowering.cpp:2967

performVectorNonNegToFPCombine
static SDValue performVectorNonNegToFPCombine(SDNode *N, TargetLowering::DAGCombinerInfo &DCI)
Definition: WebAssemblyISelLowering.cpp:2948

unrollVectorShift
static SDValue unrollVectorShift(SDValue Op, SelectionDAG &DAG)
Definition: WebAssemblyISelLowering.cpp:2782

performAnyAllCombine
static SDValue performAnyAllCombine(SDNode *N, SelectionDAG &DAG)
Definition: WebAssemblyISelLowering.cpp:3315

LowerCallResults
static MachineBasicBlock * LowerCallResults(MachineInstr &CallResults, DebugLoc DL, MachineBasicBlock *BB, const WebAssemblySubtarget *Subtarget, const TargetInstrInfo &TII)
Definition: WebAssemblyISelLowering.cpp:739

TryMatchTrue
static SDValue TryMatchTrue(SDNode *N, EVT VecVT, SelectionDAG &DAG)
Definition: WebAssemblyISelLowering.cpp:3370

GetExtendHigh
static SDValue GetExtendHigh(SDValue Op, unsigned UserOpc, EVT VT, SelectionDAG &DAG)
Definition: WebAssemblyISelLowering.cpp:2312

performVectorTruncZeroCombine
static SDValue performVectorTruncZeroCombine(SDNode *N, TargetLowering::DAGCombinerInfo &DCI)
Definition: WebAssemblyISelLowering.cpp:3014

IsWebAssemblyGlobal
static bool IsWebAssemblyGlobal(SDValue Op)
Definition: WebAssemblyISelLowering.cpp:1706

LowerMemset
static MachineBasicBlock * LowerMemset(MachineInstr &MI, DebugLoc DL, MachineBasicBlock *BB, const TargetInstrInfo &TII, bool Int64)
Definition: WebAssemblyISelLowering.cpp:677

performVectorExtendToFPCombine
static SDValue performVectorExtendToFPCombine(SDNode *N, TargetLowering::DAGCombinerInfo &DCI)
Convert ({u,s}itofp vec) --> ({u,s}itofp ({s,z}ext vec)) so it doesn't get split up into scalar instr...
Definition: WebAssemblyISelLowering.cpp:2925

LowerConvertLow
static SDValue LowerConvertLow(SDValue Op, SelectionDAG &DAG)
Definition: WebAssemblyISelLowering.cpp:2386

performLowerPartialReduction
SDValue performLowerPartialReduction(SDNode *N, SelectionDAG &DAG)
Definition: WebAssemblyISelLowering.cpp:2112

extractSubVector
static SDValue extractSubVector(SDValue Vec, unsigned IdxVal, SelectionDAG &DAG, const SDLoc &DL, unsigned VectorWidth)
Definition: WebAssemblyISelLowering.cpp:3135

performBitcastCombine
static SDValue performBitcastCombine(SDNode *N, TargetLowering::DAGCombinerInfo &DCI)
Definition: WebAssemblyISelLowering.cpp:3242

truncateVectorWithNARROW
static SDValue truncateVectorWithNARROW(EVT DstVT, SDValue In, const SDLoc &DL, SelectionDAG &DAG)
Definition: WebAssemblyISelLowering.cpp:3164

WebAssemblyISelLowering.h
This file defines the interfaces that WebAssembly uses to lower LLVM code into a selection DAG.

WebAssemblyMCTargetDesc.h
This file provides WebAssembly-specific target descriptions.

WebAssemblyMachineFunctionInfo.h
This file declares WebAssembly-specific per-machine-function information.

WebAssemblySubtarget.h
This file declares the WebAssembly-specific subclass of TargetSubtarget.

WebAssemblyTargetMachine.h
This file declares the WebAssembly-specific subclass of TargetMachine.

WebAssemblyTypeUtilities.h
This file contains the declaration of the WebAssembly-specific type parsing utility functions.

WebAssemblyUtilities.h
This file contains the declaration of the WebAssembly-specific utility functions.

Conversion
X86 cmov Conversion
Definition: X86CmovConversion.cpp:890

Concat
static constexpr int Concat[]
Definition: X86InterleavedAccess.cpp:232

RHS
Value * RHS
Definition: X86PartialReduction.cpp:74

LHS
Value * LHS
Definition: X86PartialReduction.cpp:73

Node
Definition: ItaniumDemangle.h:166

T

bool

llvm::APInt
Class for arbitrary precision integers.
Definition: APInt.h:78

llvm::APInt::setBitsFrom
void setBitsFrom(unsigned loBit)
Set the top bits starting from loBit.
Definition: APInt.h:1385

llvm::APInt::getLowBitsSet
static APInt getLowBitsSet(unsigned numBits, unsigned loBitsSet)
Constructs an APInt value that has the bottom loBitsSet bits set.
Definition: APInt.h:306

llvm::APInt::getHighBitsSet
static APInt getHighBitsSet(unsigned numBits, unsigned hiBitsSet)
Constructs an APInt value that has the top hiBitsSet bits set.
Definition: APInt.h:296

llvm::ArrayRef
ArrayRef - Represent a constant reference to an array (0 or more elements consecutively in memory),...
Definition: ArrayRef.h:41

llvm::AtomicRMWInst
an instruction that atomically reads a memory location, combines it with another value,...
Definition: Instructions.h:709

llvm::AtomicRMWInst::Add
@ Add
*p = old + v
Definition: Instructions.h:725

llvm::AtomicRMWInst::Or
@ Or
*p = old | v
Definition: Instructions.h:733

llvm::AtomicRMWInst::Sub
@ Sub
*p = old - v
Definition: Instructions.h:727

llvm::AtomicRMWInst::And
@ And
*p = old & v
Definition: Instructions.h:729

llvm::AtomicRMWInst::Xor
@ Xor
*p = old ^ v
Definition: Instructions.h:735

llvm::AtomicRMWInst::Xchg
@ Xchg
*p = v
Definition: Instructions.h:723

llvm::AtomicRMWInst::getOperation
BinOp getOperation() const
Definition: Instructions.h:819

llvm::AttributeList
Definition: Attributes.h:506

llvm::BasicBlock
LLVM Basic Block Representation.
Definition: BasicBlock.h:62

llvm::CCState
CCState - This class holds information needed while lowering arguments and return values.
Definition: CallingConvLower.h:171

llvm::CCValAssign::Full
@ Full
Definition: CallingConvLower.h:37

llvm::CCValAssign::getMem
static CCValAssign getMem(unsigned ValNo, MVT ValVT, int64_t Offset, MVT LocVT, LocInfo HTP, bool IsCustom=false)
Definition: CallingConvLower.h:97

llvm::CallInst
This class represents a function call, abstracting a target machine's calling convention.
Definition: Instructions.h:1510

llvm::DWARFExpression::Operation
This class represents an Operation in the Expression.
Definition: DWARFExpression.h:33

llvm::DWARFExpression::Operation::getNumOperands
uint64_t getNumOperands() const
Definition: DWARFExpression.h:93

llvm::DataLayout
A parsed version of the target data layout string in and methods for querying it.
Definition: DataLayout.h:63

llvm::DebugLoc
A debug info location.
Definition: DebugLoc.h:124

llvm::DiagnosticInfoUnsupported
Diagnostic information for unsupported feature in backend.
Definition: DiagnosticInfo.h:1101

llvm::FastISel
This is a fast-path instruction selection class that generates poor code and doesn't support illegal ...
Definition: FastISel.h:66

llvm::FrameIndexSDNode
Definition: SelectionDAGNodes.h:1983

llvm::FrameIndexSDNode::getIndex
int getIndex() const
Definition: SelectionDAGNodes.h:1994

llvm::FunctionLoweringInfo
FunctionLoweringInfo - This contains information that is global to a function that is used when lower...
Definition: FunctionLoweringInfo.h:56

llvm::Function
Definition: Function.h:64

llvm::Function::getFunctionType
FunctionType * getFunctionType() const
Returns the FunctionType for me.
Definition: Function.h:209

llvm::Function::getContext
LLVMContext & getContext() const
getContext - Return a reference to the LLVMContext associated with this function.
Definition: Function.cpp:359

llvm::Function::hasFnAttribute
bool hasFnAttribute(Attribute::AttrKind Kind) const
Return true if the function has the attribute.
Definition: Function.cpp:727

llvm::GlobalAddressSDNode
Definition: SelectionDAGNodes.h:1955

llvm::GlobalAddressSDNode::getOffset
int64_t getOffset() const
Definition: SelectionDAGNodes.h:1970

llvm::GlobalAddressSDNode::getAddressSpace
LLVM_ABI unsigned getAddressSpace() const
Definition: SelectionDAG.cpp:13499

llvm::GlobalAddressSDNode::getTargetFlags
unsigned getTargetFlags() const
Definition: SelectionDAGNodes.h:1971

llvm::GlobalAddressSDNode::getGlobal
const GlobalValue * getGlobal() const
Definition: SelectionDAGNodes.h:1969

llvm::GlobalValue
Definition: GlobalValue.h:49

llvm::GlobalValue::LocalExecTLSModel
@ LocalExecTLSModel
Definition: GlobalValue.h:202

llvm::GlobalValue::GeneralDynamicTLSModel
@ GeneralDynamicTLSModel
Definition: GlobalValue.h:199

llvm::GlobalValue::NotThreadLocal
@ NotThreadLocal
Definition: GlobalValue.h:198

llvm::GlobalValue::InitialExecTLSModel
@ InitialExecTLSModel
Definition: GlobalValue.h:201

llvm::GlobalValue::LocalDynamicTLSModel
@ LocalDynamicTLSModel
Definition: GlobalValue.h:200

llvm::GlobalValue::getThreadLocalMode
ThreadLocalMode getThreadLocalMode() const
Definition: GlobalValue.h:273

llvm::GlobalValue::getValueType
Type * getValueType() const
Definition: GlobalValue.h:298

llvm::Instruction
Definition: Instruction.h:69

llvm::IntrinsicInst
A wrapper class for inspecting calls to intrinsic functions.
Definition: IntrinsicInst.h:49

llvm::JumpTableSDNode
Definition: SelectionDAGNodes.h:2048

llvm::LLVMContext
This is an important class for using LLVM in a threaded context.
Definition: LLVMContext.h:68

llvm::LLVMContext::diagnose
LLVM_ABI void diagnose(const DiagnosticInfo &DI)
Report a message to the currently installed diagnostic handler.
Definition: LLVMContext.cpp:245

llvm::LoadSDNode
This class is used to represent ISD::LOAD nodes.
Definition: SelectionDAGNodes.h:2533

llvm::LoadSDNode::getBasePtr
const SDValue & getBasePtr() const
Definition: SelectionDAGNodes.h:2552

llvm::LoadSDNode::getOffset
const SDValue & getOffset() const
Definition: SelectionDAGNodes.h:2553

llvm::MCInstrDesc
Describe properties that are true of each instruction in the target description file.
Definition: MCInstrDesc.h:199

llvm::MCSymbolWasm
Definition: MCSymbolWasm.h:17

llvm::MCSymbolWasm::setNoStrip
void setNoStrip() const
Definition: MCSymbolWasm.h:67

llvm::MVT
Machine Value Type.
Definition: MachineValueType.h:36

llvm::MVT::is128BitVector
bool is128BitVector() const
Return true if this is a 128-bit vector type.
Definition: MachineValueType.h:157

llvm::MVT::INVALID_SIMPLE_VALUE_TYPE
@ INVALID_SIMPLE_VALUE_TYPE
Definition: MachineValueType.h:41

llvm::MVT::integer_fixedlen_vector_valuetypes
static auto integer_fixedlen_vector_valuetypes()
Definition: MachineValueType.h:555

llvm::MVT::changeVectorElementType
MVT changeVectorElementType(MVT EltVT) const
Return a VT for a vector type whose attributes match ourselves with the exception of the element type...
Definition: MachineValueType.h:208

llvm::MVT::getVectorNumElements
unsigned getVectorNumElements() const
Definition: MachineValueType.h:295

llvm::MVT::isVector
bool isVector() const
Return true if this is a vector value type.
Definition: MachineValueType.h:107

llvm::MVT::isInteger
bool isInteger() const
Return true if this is an integer or a vector integer type.
Definition: MachineValueType.h:91

llvm::MVT::getVT
static LLVM_ABI MVT getVT(Type *Ty, bool HandleUnknown=false)
Return the value type corresponding to the specified type.
Definition: ValueTypes.cpp:247

llvm::MVT::integer_valuetypes
static auto integer_valuetypes()
Definition: MachineValueType.h:526

llvm::MVT::getSizeInBits
TypeSize getSizeInBits() const
Returns the size of the specified MVT in bits.
Definition: MachineValueType.h:309

llvm::MVT::fixedlen_vector_valuetypes
static auto fixedlen_vector_valuetypes()
Definition: MachineValueType.h:543

llvm::MVT::isFixedLengthVector
bool isFixedLengthVector() const
Definition: MachineValueType.h:136

llvm::MVT::getVectorVT
static MVT getVectorVT(MVT VT, unsigned NumElements)
Definition: MachineValueType.h:452

llvm::MVT::getVectorElementType
MVT getVectorElementType() const
Definition: MachineValueType.h:264

llvm::MVT::isFloatingPoint
bool isFloatingPoint() const
Return true if this is a FP or a vector FP type.
Definition: MachineValueType.h:81

llvm::MVT::getIntegerVT
static MVT getIntegerVT(unsigned BitWidth)
Definition: MachineValueType.h:442

llvm::MachineBasicBlock
Definition: MachineBasicBlock.h:122

llvm::MachineBasicBlock::transferSuccessorsAndUpdatePHIs
LLVM_ABI void transferSuccessorsAndUpdatePHIs(MachineBasicBlock *FromMBB)
Transfers all the successors, as in transferSuccessors, and update PHI operands in the successor bloc...
Definition: MachineBasicBlock.cpp:935

llvm::MachineBasicBlock::insert
LLVM_ABI instr_iterator insert(instr_iterator I, MachineInstr *M)
Insert MI into the instruction list before I, possibly inside a bundle.
Definition: MachineBasicBlock.cpp:1463

llvm::MachineBasicBlock::getBasicBlock
const BasicBlock * getBasicBlock() const
Return the LLVM basic block that this instance corresponded to originally.
Definition: MachineBasicBlock.h:253

llvm::MachineBasicBlock::addSuccessor
LLVM_ABI void addSuccessor(MachineBasicBlock *Succ, BranchProbability Prob=BranchProbability::getUnknown())
Add Succ as a successor of this MachineBasicBlock.
Definition: MachineBasicBlock.cpp:796

llvm::MachineBasicBlock::begin
iterator begin()
Definition: MachineBasicBlock.h:377

llvm::MachineBasicBlock::end
iterator end()
Definition: MachineBasicBlock.h:379

llvm::MachineBasicBlock::getParent
const MachineFunction * getParent() const
Return the MachineFunction containing this basic block.
Definition: MachineBasicBlock.h:323

llvm::MachineBasicBlock::insertAfter
iterator insertAfter(iterator I, MachineInstr *MI)
Insert MI into the instruction list after I.
Definition: MachineBasicBlock.h:1070

llvm::MachineBasicBlock::splice
void splice(iterator Where, MachineBasicBlock *Other, iterator From)
Take an instruction from MBB 'Other' at the position From, and insert it into this MBB right before '...
Definition: MachineBasicBlock.h:1149

llvm::MachineFrameInfo::CreateStackObject
LLVM_ABI int CreateStackObject(uint64_t Size, Align Alignment, bool isSpillSlot, const AllocaInst *Alloca=nullptr, uint8_t ID=0)
Create a new statically sized stack object, returning a nonnegative identifier to represent it.
Definition: MachineFrameInfo.cpp:51

llvm::MachineFrameInfo::setFrameAddressIsTaken
void setFrameAddressIsTaken(bool T)
Definition: MachineFrameInfo.h:376

llvm::MachineFunction
Definition: MachineFunction.h:286

llvm::MachineFunction::getFunctionNumber
unsigned getFunctionNumber() const
getFunctionNumber - Return a unique ID for the current function.
Definition: MachineFunction.h:742

llvm::MachineFunction::getSubtarget
const TargetSubtargetInfo & getSubtarget() const
getSubtarget - Return the subtarget for which this machine code is being compiled.
Definition: MachineFunction.h:762

llvm::MachineFunction::CreateMachineInstr
MachineInstr * CreateMachineInstr(const MCInstrDesc &MCID, DebugLoc DL, bool NoImplicit=false)
CreateMachineInstr - Allocate a new MachineInstr.
Definition: MachineFunction.cpp:429

llvm::MachineFunction::getFrameInfo
MachineFrameInfo & getFrameInfo()
getFrameInfo - Return the frame info object for the current function.
Definition: MachineFunction.h:778

llvm::MachineFunction::createExternalSymbolName
const char * createExternalSymbolName(StringRef Name)
Allocate a string and populate it with the given external symbol name.
Definition: MachineFunction.cpp:618

llvm::MachineFunction::getContext
MCContext & getContext() const
Definition: MachineFunction.h:719

llvm::MachineFunction::getRegInfo
MachineRegisterInfo & getRegInfo()
getRegInfo - Return information about the registers currently in use.
Definition: MachineFunction.h:772

llvm::MachineFunction::getDataLayout
const DataLayout & getDataLayout() const
Return the DataLayout attached to the Module associated to this MF.
Definition: MachineFunction.cpp:309

llvm::MachineFunction::getFunction
Function & getFunction()
Return the LLVM function that this machine code represents.
Definition: MachineFunction.h:733

llvm::MachineFunction::getInfo
Ty * getInfo()
getInfo - Keep track of various per-function pieces of information for backends that would like to do...
Definition: MachineFunction.h:860

llvm::MachineFunction::getJumpTableInfo
const MachineJumpTableInfo * getJumpTableInfo() const
getJumpTableInfo - Return the jump table info object for the current function.
Definition: MachineFunction.h:785

llvm::MachineInstrBuilder
Definition: MachineInstrBuilder.h:98

llvm::MachineInstrBuilder::addImm
const MachineInstrBuilder & addImm(int64_t Val) const
Add a new immediate operand.
Definition: MachineInstrBuilder.h:160

llvm::MachineInstrBuilder::add
const MachineInstrBuilder & add(const MachineOperand &MO) const
Definition: MachineInstrBuilder.h:253

llvm::MachineInstrBuilder::addSym
const MachineInstrBuilder & addSym(MCSymbol *Sym, unsigned char TargetFlags=0) const
Definition: MachineInstrBuilder.h:295

llvm::MachineInstrBuilder::addReg
const MachineInstrBuilder & addReg(Register RegNo, unsigned flags=0, unsigned SubReg=0) const
Add a new virtual register operand.
Definition: MachineInstrBuilder.h:126

llvm::MachineInstrBuilder::addFPImm
const MachineInstrBuilder & addFPImm(const ConstantFP *Val) const
Definition: MachineInstrBuilder.h:170

llvm::MachineInstrBuilder::addMBB
const MachineInstrBuilder & addMBB(MachineBasicBlock *MBB, unsigned TargetFlags=0) const
Definition: MachineInstrBuilder.h:175

llvm::MachineInstrBuilder::getInstr
MachineInstr * getInstr() const
If conversion operators fail, use this method to get the MachineInstr explicitly.
Definition: MachineInstrBuilder.h:118

llvm::MachineInstr
Representation of each machine instruction.
Definition: MachineInstr.h:72

llvm::MachineInstr::defs
mop_range defs()
Returns all explicit operands that are register definitions.
Definition: MachineInstr.h:724

llvm::MachineInstr::getOpcode
unsigned getOpcode() const
Returns the opcode of this MachineInstr.
Definition: MachineInstr.h:587

llvm::MachineInstr::addOperand
LLVM_ABI void addOperand(MachineFunction &MF, const MachineOperand &Op)
Add the specified operand to the instruction.
Definition: MachineInstr.cpp:206

llvm::MachineInstr::uses
mop_range uses()
Returns all operands which may be register uses.
Definition: MachineInstr.h:731

llvm::MachineInstr::eraseFromParent
LLVM_ABI void eraseFromParent()
Unlink 'this' from the containing basic block and delete it.
Definition: MachineInstr.cpp:770

llvm::MachineInstr::removeOperand
LLVM_ABI void removeOperand(unsigned OpNo)
Erase an operand from an instruction, leaving it with one fewer operand than it started with.
Definition: MachineInstr.cpp:296

llvm::MachineInstr::getOperand
const MachineOperand & getOperand(unsigned i) const
Definition: MachineInstr.h:595

llvm::MachineJumpTableInfo
Definition: MachineJumpTableInfo.h:48

llvm::MachineJumpTableInfo::getJumpTables
const std::vector< MachineJumpTableEntry > & getJumpTables() const
Definition: MachineJumpTableInfo.h:113

llvm::MachineMemOperand::Flags
Flags
Flags values. These may be or'd together.
Definition: MachineMemOperand.h:133

llvm::MachineMemOperand::MOVolatile
@ MOVolatile
The memory access is volatile.
Definition: MachineMemOperand.h:141

llvm::MachineMemOperand::MOLoad
@ MOLoad
The memory access reads data.
Definition: MachineMemOperand.h:137

llvm::MachineMemOperand::MOStore
@ MOStore
The memory access writes data.
Definition: MachineMemOperand.h:139

llvm::MachineOperand
MachineOperand class - Representation of each machine instruction operand.
Definition: MachineOperand.h:48

llvm::MachineOperand::isReg
bool isReg() const
isReg - Tests if this is a MO_Register operand.
Definition: MachineOperand.h:328

llvm::MachineOperand::setIsKill
void setIsKill(bool Val=true)
Definition: MachineOperand.h:519

llvm::MachineOperand::getReg
Register getReg() const
getReg - Returns the register number.
Definition: MachineOperand.h:368

llvm::MachineOperand::isFI
bool isFI() const
isFI - Tests if this is a MO_FrameIndex operand.
Definition: MachineOperand.h:338

llvm::MachineRegisterInfo
MachineRegisterInfo - Keep track of information for virtual and physical registers,...
Definition: MachineRegisterInfo.h:53

llvm::MachineRegisterInfo::createVirtualRegister
LLVM_ABI Register createVirtualRegister(const TargetRegisterClass *RegClass, StringRef Name="")
createVirtualRegister - Create and return a new virtual register in the function with the specified r...
Definition: MachineRegisterInfo.cpp:156

llvm::MachineRegisterInfo::addLiveIn
void addLiveIn(MCRegister Reg, Register vreg=Register())
addLiveIn - Add the specified register as a live-in.
Definition: MachineRegisterInfo.h:1000

llvm::MemSDNode::getAddressSpace
unsigned getAddressSpace() const
Return the address space for the associated pointer.
Definition: SelectionDAGNodes.h:1488

llvm::MemSDNode::getMemOperand
MachineMemOperand * getMemOperand() const
Return a MachineMemOperand object describing the memory reference performed by operation.
Definition: SelectionDAGNodes.h:1481

llvm::MemSDNode::getChain
const SDValue & getChain() const
Definition: SelectionDAGNodes.h:1508

llvm::MemSDNode::getMemoryVT
EVT getMemoryVT() const
Return the type of the in-memory value.
Definition: SelectionDAGNodes.h:1477

llvm::PointerType::getUnqual
static PointerType * getUnqual(Type *ElementType)
This constructs a pointer to an object of the specified type in the default address space (address sp...
Definition: DerivedTypes.h:720

llvm::Register
Wrapper class representing virtual and physical registers.
Definition: Register.h:19

llvm::SDLoc
Wrapper class for IR location info (IR ordering and DebugLoc) to be passed into SDNode creation funct...
Definition: SelectionDAGNodes.h:1225

llvm::SDNode
Represents one node in the SelectionDAG.
Definition: SelectionDAGNodes.h:501

llvm::SDNode::ops
ArrayRef< SDUse > ops() const
Definition: SelectionDAGNodes.h:1043

llvm::SDNode::getOpcode
unsigned getOpcode() const
Return the SelectionDAG opcode value for this node.
Definition: SelectionDAGNodes.h:692

llvm::SDNode::getAsZExtVal
uint64_t getAsZExtVal() const
Helper method returns the zero-extended integer value of a ConstantSDNode.
Definition: SelectionDAGNodes.h:1783

llvm::SDNode::getOperand
const SDValue & getOperand(unsigned Num) const
Definition: SelectionDAGNodes.h:1034

llvm::SDNode::getConstantOperandVal
uint64_t getConstantOperandVal(unsigned Num) const
Helper method returns the integer value of a ConstantSDNode operand.
Definition: SelectionDAGNodes.h:1779

llvm::SDNode::getValueType
EVT getValueType(unsigned ResNo) const
Return the type of a specified result.
Definition: SelectionDAGNodes.h:1104

llvm::SDValue
Unlike LLVM values, Selection DAG nodes may return multiple values as the result of a computation.
Definition: SelectionDAGNodes.h:147

llvm::SDValue::isUndef
bool isUndef() const
Definition: SelectionDAGNodes.h:1292

llvm::SDValue::getNode
SDNode * getNode() const
get the SDNode which holds the desired result
Definition: SelectionDAGNodes.h:161

llvm::SDValue::getValue
SDValue getValue(unsigned R) const
Definition: SelectionDAGNodes.h:181

llvm::SDValue::getValueType
EVT getValueType() const
Return the ValueType of the referenced return value.
Definition: SelectionDAGNodes.h:1260

llvm::SDValue::getOperand
const SDValue & getOperand(unsigned i) const
Definition: SelectionDAGNodes.h:1268

llvm::SDValue::getSimpleValueType
MVT getSimpleValueType() const
Return the simple ValueType of the referenced return value.
Definition: SelectionDAGNodes.h:192

llvm::SDValue::getOpcode
unsigned getOpcode() const
Definition: SelectionDAGNodes.h:1256

llvm::SelectionDAG
This is used to represent a portion of an LLVM function in a low-level Data Dependence DAG representa...
Definition: SelectionDAG.h:229

llvm::SelectionDAG::getTargetGlobalAddress
SDValue getTargetGlobalAddress(const GlobalValue *GV, const SDLoc &DL, EVT VT, int64_t offset=0, unsigned TargetFlags=0)
Definition: SelectionDAG.h:758

llvm::SelectionDAG::getCopyToReg
SDValue getCopyToReg(SDValue Chain, const SDLoc &dl, Register Reg, SDValue N)
Definition: SelectionDAG.h:813

llvm::SelectionDAG::getMergeValues
LLVM_ABI SDValue getMergeValues(ArrayRef< SDValue > Ops, const SDLoc &dl)
Create a MERGE_VALUES node from the given operands.
Definition: SelectionDAG.cpp:9490

llvm::SelectionDAG::getVTList
LLVM_ABI SDVTList getVTList(EVT VT)
Return an SDVTList that represents the list of values specified.
Definition: SelectionDAG.cpp:11150

llvm::SelectionDAG::getShiftAmountConstant
LLVM_ABI SDValue getShiftAmountConstant(uint64_t Val, EVT VT, const SDLoc &DL)
Definition: SelectionDAG.cpp:1806

llvm::SelectionDAG::getSplatValue
LLVM_ABI SDValue getSplatValue(SDValue V, bool LegalTypes=false)
If V is a splat vector, return its scalar source operand by extracting that element from the source v...
Definition: SelectionDAG.cpp:3236

llvm::SelectionDAG::getMachineNode
LLVM_ABI MachineSDNode * getMachineNode(unsigned Opcode, const SDLoc &dl, EVT VT)
These are used for target selectors to create a new node with specified return type(s),...
Definition: SelectionDAG.cpp:11591

llvm::SelectionDAG::ExtractVectorElements
LLVM_ABI void ExtractVectorElements(SDValue Op, SmallVectorImpl< SDValue > &Args, unsigned Start=0, unsigned Count=0, EVT EltVT=EVT())
Append the extracted elements from Start to Count out of the vector Op in Args.
Definition: SelectionDAG.cpp:13483

llvm::SelectionDAG::getSetCC
SDValue getSetCC(const SDLoc &DL, EVT VT, SDValue LHS, SDValue RHS, ISD::CondCode Cond, SDValue Chain=SDValue(), bool IsSignaling=false)
Helper function to make it easier to build SetCC's if you just have an ISD::CondCode instead of an SD...
Definition: SelectionDAG.h:1311

llvm::SelectionDAG::UnrollVectorOp
LLVM_ABI SDValue UnrollVectorOp(SDNode *N, unsigned ResNE=0)
Utility function used by legalize and lowering to "unroll" a vector operation by splitting out the sc...
Definition: SelectionDAG.cpp:13154

llvm::SelectionDAG::getConstantFP
LLVM_ABI SDValue getConstantFP(double Val, const SDLoc &DL, EVT VT, bool isTarget=false)
Create a ConstantFPSDNode wrapping a constant value.
Definition: SelectionDAG.cpp:1868

llvm::SelectionDAG::getMemIntrinsicNode
LLVM_ABI SDValue getMemIntrinsicNode(unsigned Opcode, const SDLoc &dl, SDVTList VTList, ArrayRef< SDValue > Ops, EVT MemVT, MachinePointerInfo PtrInfo, Align Alignment, MachineMemOperand::Flags Flags=MachineMemOperand::MOLoad|MachineMemOperand::MOStore, LocationSize Size=LocationSize::precise(0), const AAMDNodes &AAInfo=AAMDNodes())
Creates a MemIntrinsicNode that may produce a result and takes a list of operands.
Definition: SelectionDAG.cpp:9501

llvm::SelectionDAG::getMemcpy
LLVM_ABI SDValue getMemcpy(SDValue Chain, const SDLoc &dl, SDValue Dst, SDValue Src, SDValue Size, Align Alignment, bool isVol, bool AlwaysInline, const CallInst *CI, std::optional< bool > OverrideTailCall, MachinePointerInfo DstPtrInfo, MachinePointerInfo SrcPtrInfo, const AAMDNodes &AAInfo=AAMDNodes(), BatchAAResults *BatchAA=nullptr)
Definition: SelectionDAG.cpp:9067

llvm::SelectionDAG::getNOT
LLVM_ABI SDValue getNOT(const SDLoc &DL, SDValue Val, EVT VT)
Create a bitwise NOT operation as (XOR Val, -1).
Definition: SelectionDAG.cpp:1617

llvm::SelectionDAG::getTargetJumpTable
SDValue getTargetJumpTable(int JTI, EVT VT, unsigned TargetFlags=0)
Definition: SelectionDAG.h:768

llvm::SelectionDAG::getUNDEF
SDValue getUNDEF(EVT VT)
Return an UNDEF node. UNDEF does not have a useful SDLoc.
Definition: SelectionDAG.h:1175

llvm::SelectionDAG::getBuildVector
SDValue getBuildVector(EVT VT, const SDLoc &DL, ArrayRef< SDValue > Ops)
Return an ISD::BUILD_VECTOR node.
Definition: SelectionDAG.h:868

llvm::SelectionDAG::getBitcast
LLVM_ABI SDValue getBitcast(EVT VT, SDValue V)
Return a bitcast using the SDLoc of the value operand, and casting to the provided type.
Definition: SelectionDAG.cpp:2428

llvm::SelectionDAG::getCopyFromReg
SDValue getCopyFromReg(SDValue Chain, const SDLoc &dl, Register Reg, EVT VT)
Definition: SelectionDAG.h:839

llvm::SelectionDAG::getDataLayout
const DataLayout & getDataLayout() const
Definition: SelectionDAG.h:498

llvm::SelectionDAG::getTargetFrameIndex
SDValue getTargetFrameIndex(int FI, EVT VT)
Definition: SelectionDAG.h:763

llvm::SelectionDAG::getConstant
LLVM_ABI SDValue getConstant(uint64_t Val, const SDLoc &DL, EVT VT, bool isTarget=false, bool isOpaque=false)
Create a ConstantSDNode wrapping a constant value.
Definition: SelectionDAG.cpp:1661

llvm::SelectionDAG::getStore
LLVM_ABI SDValue getStore(SDValue Chain, const SDLoc &dl, SDValue Val, SDValue Ptr, MachinePointerInfo PtrInfo, Align Alignment, MachineMemOperand::Flags MMOFlags=MachineMemOperand::MONone, const AAMDNodes &AAInfo=AAMDNodes())
Helper function to build ISD::STORE nodes.
Definition: SelectionDAG.cpp:9780

llvm::SelectionDAG::SignBitIsZero
LLVM_ABI bool SignBitIsZero(SDValue Op, unsigned Depth=0) const
Return true if the sign bit of Op is known to be zero.
Definition: SelectionDAG.cpp:2919

llvm::SelectionDAG::getBasicBlock
LLVM_ABI SDValue getBasicBlock(MachineBasicBlock *MBB)
Definition: SelectionDAG.cpp:2019

llvm::SelectionDAG::getTarget
const TargetMachine & getTarget() const
Definition: SelectionDAG.h:499

llvm::SelectionDAG::getAnyExtOrTrunc
LLVM_ABI SDValue getAnyExtOrTrunc(SDValue Op, const SDLoc &DL, EVT VT)
Convert Op, which must be of integer type, to the integer type VT, by either any-extending or truncat...
Definition: SelectionDAG.cpp:1491

llvm::SelectionDAG::getIntPtrConstant
LLVM_ABI SDValue getIntPtrConstant(uint64_t Val, const SDLoc &DL, bool isTarget=false)
Definition: SelectionDAG.cpp:1801

llvm::SelectionDAG::getValueType
LLVM_ABI SDValue getValueType(EVT)
Definition: SelectionDAG.cpp:2033

llvm::SelectionDAG::getNode
LLVM_ABI SDValue getNode(unsigned Opcode, const SDLoc &DL, EVT VT, ArrayRef< SDUse > Ops)
Gets or creates the specified node.
Definition: SelectionDAG.cpp:10781

llvm::SelectionDAG::getTargetConstant
SDValue getTargetConstant(uint64_t Val, const SDLoc &DL, EVT VT, bool isOpaque=false)
Definition: SelectionDAG.h:707

llvm::SelectionDAG::getMachineFunction
MachineFunction & getMachineFunction() const
Definition: SelectionDAG.h:493

llvm::SelectionDAG::getSplatBuildVector
SDValue getSplatBuildVector(EVT VT, const SDLoc &DL, SDValue Op)
Return a splat ISD::BUILD_VECTOR node, consisting of Op splatted to all elements.
Definition: SelectionDAG.h:885

llvm::SelectionDAG::getFrameIndex
LLVM_ABI SDValue getFrameIndex(int FI, EVT VT, bool isTarget=false)
Definition: SelectionDAG.cpp:1920

llvm::SelectionDAG::getZExtOrTrunc
LLVM_ABI SDValue getZExtOrTrunc(SDValue Op, const SDLoc &DL, EVT VT)
Convert Op, which must be of integer type, to the integer type VT, by either zero-extending or trunca...
Definition: SelectionDAG.cpp:1503

llvm::SelectionDAG::getContext
LLVMContext * getContext() const
Definition: SelectionDAG.h:511

llvm::SelectionDAG::getTargetExternalSymbol
LLVM_ABI SDValue getTargetExternalSymbol(const char *Sym, EVT VT, unsigned TargetFlags=0)
Definition: SelectionDAG.cpp:2064

llvm::SelectionDAG::getMCSymbol
LLVM_ABI SDValue getMCSymbol(MCSymbol *Sym, EVT VT)
Definition: SelectionDAG.cpp:2055

llvm::SelectionDAG::getEntryNode
SDValue getEntryNode() const
Return the token chain corresponding to the entry of the function.
Definition: SelectionDAG.h:581

llvm::SelectionDAG::getVectorShuffle
LLVM_ABI SDValue getVectorShuffle(EVT VT, const SDLoc &dl, SDValue N1, SDValue N2, ArrayRef< int > Mask)
Return an ISD::VECTOR_SHUFFLE node.
Definition: SelectionDAG.cpp:2142

llvm::SmallVectorBase::empty
bool empty() const
Definition: SmallVector.h:82

llvm::SmallVectorBase::size
size_t size() const
Definition: SmallVector.h:79

llvm::SmallVectorImpl
This class consists of common code factored out of the SmallVector class to reduce code duplication b...
Definition: SmallVector.h:574

llvm::SmallVectorImpl::append
void append(ItTy in_start, ItTy in_end)
Add the specified range to the end of the SmallVector.
Definition: SmallVector.h:684

llvm::SmallVectorTemplateBase::push_back
void push_back(const T &Elt)
Definition: SmallVector.h:414

llvm::SmallVectorTemplateCommon::end
iterator end()
Definition: SmallVector.h:270

llvm::SmallVectorTemplateCommon::begin
iterator begin()
Definition: SmallVector.h:268

llvm::SmallVector
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
Definition: SmallVector.h:1197

llvm::StoreSDNode
This class is used to represent ISD::STORE nodes.
Definition: SelectionDAGNodes.h:2561

llvm::StoreSDNode::getBasePtr
const SDValue & getBasePtr() const
Definition: SelectionDAGNodes.h:2580

llvm::StoreSDNode::getOffset
const SDValue & getOffset() const
Definition: SelectionDAGNodes.h:2581

llvm::StoreSDNode::getValue
const SDValue & getValue() const
Definition: SelectionDAGNodes.h:2579

llvm::StringRef
StringRef - Represent a constant reference to a string, i.e.
Definition: StringRef.h:55

llvm::StringRef::size
constexpr size_t size() const
size - Get the string size.
Definition: StringRef.h:154

llvm::TargetInstrInfo
TargetInstrInfo - Interface to description of machine instruction set.
Definition: TargetInstrInfo.h:114

llvm::TargetLibraryInfo
Provides information about what library functions are available for the current target.
Definition: TargetLibraryInfo.h:285

llvm::TargetLoweringBase::InstructionOpcodeToISD
int InstructionOpcodeToISD(unsigned Opcode) const
Get the ISD node that corresponds to the Instruction class opcode.
Definition: TargetLoweringBase.cpp:1841

llvm::TargetLoweringBase::setBooleanVectorContents
void setBooleanVectorContents(BooleanContent Ty)
Specify how the target extends the result of a vector boolean value from a vector of i1 to a wider ty...
Definition: TargetLowering.h:2566

llvm::TargetLoweringBase::setOperationAction
void setOperationAction(unsigned Op, MVT VT, LegalizeAction Action)
Indicate that the specified operation does not work with the specified type and indicate what to do a...
Definition: TargetLowering.h:2626

llvm::TargetLoweringBase::Custom
@ Custom
Definition: TargetLowering.h:207

llvm::TargetLoweringBase::Expand
@ Expand
Definition: TargetLowering.h:205

llvm::TargetLoweringBase::Promote
@ Promote
Definition: TargetLowering.h:204

llvm::TargetLoweringBase::getRegClassFor
virtual const TargetRegisterClass * getRegClassFor(MVT VT, bool isDivergent=false) const
Return the register class that should be used for the specified value type.
Definition: TargetLowering.h:1069

llvm::TargetLoweringBase::getTargetMachine
const TargetMachine & getTargetMachine() const
Definition: TargetLowering.h:373

llvm::TargetLoweringBase::MaxLoadsPerMemcmp
unsigned MaxLoadsPerMemcmp
Specify maximum number of load instructions per memcmp call.
Definition: TargetLowering.h:3894

llvm::TargetLoweringBase::LegalizeTypeAction
LegalizeTypeAction
This enum indicates whether a types are legal for a target, and if not, what action should be used to...
Definition: TargetLowering.h:212

llvm::TargetLoweringBase::TypeWidenVector
@ TypeWidenVector
Definition: TargetLowering.h:220

llvm::TargetLoweringBase::setMaxAtomicSizeInBitsSupported
void setMaxAtomicSizeInBitsSupported(unsigned SizeInBits)
Set the maximum atomic operation size supported by the backend.
Definition: TargetLowering.h:2849

llvm::TargetLoweringBase::getPreferredVectorAction
virtual TargetLoweringBase::LegalizeTypeAction getPreferredVectorAction(MVT VT) const
Return the preferred vector type legalization action.
Definition: TargetLowering.h:544

llvm::TargetLoweringBase::setBooleanContents
void setBooleanContents(BooleanContent Ty)
Specify how the target extends the result of integer and floating point boolean values from i1 to a w...
Definition: TargetLowering.h:2552

llvm::TargetLoweringBase::computeRegisterProperties
void computeRegisterProperties(const TargetRegisterInfo *TRI)
Once all of the register classes are added, this allows us to compute derived properties we expose.
Definition: TargetLoweringBase.cpp:1351

llvm::TargetLoweringBase::addRegisterClass
void addRegisterClass(MVT VT, const TargetRegisterClass *RC)
Add the specified register class as an available regclass for the specified value type.
Definition: TargetLowering.h:2609

llvm::TargetLoweringBase::getPointerTy
virtual MVT getPointerTy(const DataLayout &DL, uint32_t AS=0) const
Return the pointer type for the given address space, defaults to the pointer type from the data layou...
Definition: TargetLowering.h:380

llvm::TargetLoweringBase::setMinimumJumpTableEntries
void setMinimumJumpTableEntries(unsigned Val)
Indicate the minimum number of blocks to generate jump tables.
Definition: TargetLoweringBase.cpp:2103

llvm::TargetLoweringBase::setTruncStoreAction
void setTruncStoreAction(MVT ValVT, MVT MemVT, LegalizeAction Action)
Indicate that the specified truncating store does not work with the specified type and indicate what ...
Definition: TargetLowering.h:2689

llvm::TargetLoweringBase::ZeroOrOneBooleanContent
@ ZeroOrOneBooleanContent
Definition: TargetLowering.h:239

llvm::TargetLoweringBase::ZeroOrNegativeOneBooleanContent
@ ZeroOrNegativeOneBooleanContent
Definition: TargetLowering.h:240

llvm::TargetLoweringBase::MaxLoadsPerMemcmpOptSize
unsigned MaxLoadsPerMemcmpOptSize
Likewise for functions with the OptSize attribute.
Definition: TargetLowering.h:3896

llvm::TargetLoweringBase::isBinOp
virtual bool isBinOp(unsigned Opcode) const
Return true if the node is a math/logic binary operator.
Definition: TargetLowering.h:3024

llvm::TargetLoweringBase::setStackPointerRegisterToSaveRestore
void setStackPointerRegisterToSaveRestore(Register R)
If set to a physical register, this specifies the register that llvm.savestack/llvm....
Definition: TargetLowering.h:2584

llvm::TargetLoweringBase::AtomicExpansionKind
AtomicExpansionKind
Enum that specifies what an atomic load/AtomicRMWInst is expanded to, if at all.
Definition: TargetLowering.h:256

llvm::TargetLoweringBase::AtomicExpansionKind::CmpXChg
@ CmpXChg

llvm::TargetLoweringBase::AtomicExpansionKind::None
@ None

llvm::TargetLoweringBase::setCondCodeAction
void setCondCodeAction(ArrayRef< ISD::CondCode > CCs, MVT VT, LegalizeAction Action)
Indicate that the specified condition code is or isn't supported on the target and indicate what to d...
Definition: TargetLowering.h:2750

llvm::TargetLoweringBase::setTargetDAGCombine
void setTargetDAGCombine(ArrayRef< ISD::NodeType > NTs)
Targets should invoke this method for each target independent node that they want to provide a custom...
Definition: TargetLowering.h:2814

llvm::TargetLoweringBase::setLoadExtAction
void setLoadExtAction(unsigned ExtType, MVT ValVT, MVT MemVT, LegalizeAction Action)
Indicate that the specified load with extension does not work with the specified type and indicate wh...
Definition: TargetLowering.h:2643

llvm::TargetLoweringBase::getPointerMemTy
virtual MVT getPointerMemTy(const DataLayout &DL, uint32_t AS=0) const
Return the in-memory pointer type for the given address space, defaults to the pointer type from the ...
Definition: TargetLowering.h:387

llvm::TargetLoweringBase::setSchedulingPreference
void setSchedulingPreference(Sched::Preference Pref)
Specify the target scheduling preference.
Definition: TargetLowering.h:2571

llvm::TargetLoweringBase::isOperationLegalOrCustomOrPromote
bool isOperationLegalOrCustomOrPromote(unsigned Op, EVT VT, bool LegalOnly=false) const
Return true if the specified operation is legal on this target or can be made legal with custom lower...
Definition: TargetLowering.h:1394

llvm::TargetLowering
This class defines information used to lower LLVM code to legal SelectionDAG operators that the targe...
Definition: TargetLowering.h:3937

llvm::TargetLowering::makeLibCall
std::pair< SDValue, SDValue > makeLibCall(SelectionDAG &DAG, RTLIB::Libcall LC, EVT RetVT, ArrayRef< SDValue > Ops, MakeLibCallOptions CallOptions, const SDLoc &dl, SDValue Chain=SDValue()) const
Returns a pair of (return value, chain).
Definition: TargetLowering.cpp:154

llvm::TargetLowering::isPositionIndependent
bool isPositionIndependent() const
Definition: TargetLowering.cpp:54

llvm::TargetLowering::getRegForInlineAsmConstraint
virtual std::pair< unsigned, const TargetRegisterClass * > getRegForInlineAsmConstraint(const TargetRegisterInfo *TRI, StringRef Constraint, MVT VT) const
Given a physical register constraint (e.g.
Definition: TargetLowering.cpp:5873

llvm::TargetLowering::isOffsetFoldingLegal
virtual bool isOffsetFoldingLegal(const GlobalAddressSDNode *GA) const
Return true if folding a constant offset with the given GlobalAddress is legal.
Definition: TargetLowering.cpp:518

llvm::TargetMachine
Primary interface to the complete machine description for the target machine.
Definition: TargetMachine.h:83

llvm::TargetRegisterClass
Definition: TargetRegisterInfo.h:45

llvm::TargetRegisterInfo
TargetRegisterInfo base class - We assume that the target defines a static array of TargetRegisterDes...
Definition: TargetRegisterInfo.h:237

llvm::Triple::isOSEmscripten
bool isOSEmscripten() const
Tests whether the OS is Emscripten.
Definition: Triple.h:745

llvm::Type
The instances of the Type class are immutable: once they are created, they are never changed.
Definition: Type.h:45

llvm::Type::getFloatTy
static LLVM_ABI Type * getFloatTy(LLVMContext &C)

llvm::Type::getDoubleTy
static LLVM_ABI Type * getDoubleTy(LLVMContext &C)

llvm::Type::isFunctionTy
bool isFunctionTy() const
True if this is an instance of FunctionType.
Definition: Type.h:258

llvm::Use
A Use represents the edge between a Value definition and its users.
Definition: Use.h:35

llvm::Value
LLVM Value Representation.
Definition: Value.h:75

llvm::Value::stripPointerCastsAndAliases
LLVM_ABI const Value * stripPointerCastsAndAliases() const
Strip off pointer casts, all-zero GEPs, address space casts, and aliases.
Definition: Value.cpp:705

llvm::WebAssemblyFrameLowering::getLocalForStackObject
static std::optional< unsigned > getLocalForStackObject(MachineFunction &MF, int FrameIndex)
Definition: WebAssemblyFrameLowering.cpp:52

llvm::WebAssemblyFunctionInfo
This class is derived from MachineFunctionInfo and contains private WebAssembly-specific information ...
Definition: WebAssemblyMachineFunctionInfo.h:34

llvm::WebAssemblyRegisterInfo::getFrameRegister
Register getFrameRegister(const MachineFunction &MF) const override
Definition: WebAssemblyRegisterInfo.cpp:138

llvm::WebAssemblySubtarget
Definition: WebAssemblySubtarget.h:35

llvm::WebAssemblySubtarget::hasCallIndirectOverlong
bool hasCallIndirectOverlong() const
Definition: WebAssemblySubtarget.h:102

llvm::WebAssemblySubtarget::hasFP16
bool hasFP16() const
Definition: WebAssemblySubtarget.h:105

llvm::WebAssemblySubtarget::hasTailCall
bool hasTailCall() const
Definition: WebAssemblySubtarget.h:115

llvm::WebAssemblySubtarget::getTargetTriple
const Triple & getTargetTriple() const
Definition: WebAssemblySubtarget.h:91

llvm::WebAssemblySubtarget::getInstrInfo
const WebAssemblyInstrInfo * getInstrInfo() const override
Definition: WebAssemblySubtarget.h:85

llvm::WebAssemblySubtarget::hasAddr64
bool hasAddr64() const
Definition: WebAssemblySubtarget.h:98

llvm::WebAssemblySubtarget::hasBulkMemory
bool hasBulkMemory() const
Definition: WebAssemblySubtarget.h:100

llvm::WebAssemblySubtarget::getRegisterInfo
const WebAssemblyRegisterInfo * getRegisterInfo() const override
Definition: WebAssemblySubtarget.h:88

llvm::WebAssemblySubtarget::hasWideArithmetic
bool hasWideArithmetic() const
Definition: WebAssemblySubtarget.h:116

llvm::WebAssemblySubtarget::hasReferenceTypes
bool hasReferenceTypes() const
Definition: WebAssemblySubtarget.h:110

llvm::WebAssemblySubtarget::hasSIMD128
bool hasSIMD128() const
Definition: WebAssemblySubtarget.h:114

llvm::WebAssemblySubtarget::hasExceptionHandling
bool hasExceptionHandling() const
Definition: WebAssemblySubtarget.h:103

llvm::WebAssemblySubtarget::hasSignExt
bool hasSignExt() const
Definition: WebAssemblySubtarget.h:113

llvm::WebAssemblySubtarget::hasNontrappingFPToInt
bool hasNontrappingFPToInt() const
Definition: WebAssemblySubtarget.h:109

llvm::WebAssemblyTargetLowering::WebAssemblyTargetLowering
WebAssemblyTargetLowering(const TargetMachine &TM, const WebAssemblySubtarget &STI)
Definition: WebAssemblyISelLowering.cpp:44

llvm::WebAssemblyTargetLowering::getPointerTy
MVT getPointerTy(const DataLayout &DL, uint32_t AS=0) const override
Return the pointer type for the given address space, defaults to the pointer type from the data layou...
Definition: WebAssemblyISelLowering.cpp:401

llvm::WebAssemblyTargetLowering::getPointerMemTy
MVT getPointerMemTy(const DataLayout &DL, uint32_t AS=0) const override
Return the in-memory pointer type for the given address space, defaults to the pointer type from the ...
Definition: WebAssemblyISelLowering.cpp:410

llvm::ilist_node_impl::getIterator
self_iterator getIterator()
Definition: ilist_node.h:134

llvm::ilist_node_with_parent::getPrevNode
NodeTy * getPrevNode()
Definition: ilist_node.h:345

uint32_t

uint64_t

unsigned

INT64_MIN
#define INT64_MIN
Definition: DataTypes.h:74

ErrorHandling.h

llvm_unreachable
#define llvm_unreachable(msg)
Marks that the current location is not supposed to be reachable.
Definition: ErrorHandling.h:164

false
Definition: MachinePipeliner.cpp:239

llvm::ARM::ProfileKind::M
@ M

llvm::BitmaskEnumDetail::Mask
constexpr std::underlying_type_t< E > Mask()
Get a bitmask with 1s in all places up to the high-order bit of E's largest value.
Definition: BitmaskEnum.h:126

llvm::CallingConv::Swift
@ Swift
Calling convention for Swift.
Definition: CallingConv.h:69

llvm::CallingConv::PreserveMost
@ PreserveMost
Used for runtime calls that preserves most registers.
Definition: CallingConv.h:63

llvm::CallingConv::CXX_FAST_TLS
@ CXX_FAST_TLS
Used for access functions.
Definition: CallingConv.h:72

llvm::CallingConv::WASM_EmscriptenInvoke
@ WASM_EmscriptenInvoke
For emscripten __invoke_* functions.
Definition: CallingConv.h:229

llvm::CallingConv::Cold
@ Cold
Attempts to make code in the caller as efficient as possible under the assumption that the call is no...
Definition: CallingConv.h:47

llvm::CallingConv::PreserveAll
@ PreserveAll
Used for runtime calls that preserves (almost) all registers.
Definition: CallingConv.h:66

llvm::CallingConv::Fast
@ Fast
Attempts to make calls as fast as possible (e.g.
Definition: CallingConv.h:41

llvm::CallingConv::C
@ C
The default llvm calling convention, compatible with C.
Definition: CallingConv.h:34

llvm::HexagonISD::JT
@ JT
Definition: HexagonISelLowering.h:53

llvm::IRSimilarity::Legal
@ Legal
Definition: IRSimilarityIdentifier.h:77

llvm::ISD::SETCC
@ SETCC
SetCC operator - This evaluates to a true value iff the condition is true.
Definition: ISDOpcodes.h:801

llvm::ISD::STACKRESTORE
@ STACKRESTORE
STACKRESTORE has two operands, an input chain and a pointer to restore to it returns an output chain.
Definition: ISDOpcodes.h:1236

llvm::ISD::STACKSAVE
@ STACKSAVE
STACKSAVE - STACKSAVE has one operand, an input chain.
Definition: ISDOpcodes.h:1232

llvm::ISD::STORE
@ STORE
Definition: ISDOpcodes.h:1142

llvm::ISD::JumpTable
@ JumpTable
Definition: ISDOpcodes.h:91

llvm::ISD::FLOG10
@ FLOG10
Definition: ISDOpcodes.h:1029

llvm::ISD::SREM
@ SREM
Definition: ISDOpcodes.h:264

llvm::ISD::SMUL_LOHI
@ SMUL_LOHI
SMUL_LOHI/UMUL_LOHI - Multiply two integers of type iN, producing a signed/unsigned value of type i[2...
Definition: ISDOpcodes.h:270

llvm::ISD::UDIV
@ UDIV
Definition: ISDOpcodes.h:263

llvm::ISD::UINT_TO_FP
@ UINT_TO_FP
Definition: ISDOpcodes.h:863

llvm::ISD::UMIN
@ UMIN
Definition: ISDOpcodes.h:720

llvm::ISD::BSWAP
@ BSWAP
Byte Swap and Counting operators.
Definition: ISDOpcodes.h:765

llvm::ISD::ROTR
@ ROTR
Definition: ISDOpcodes.h:760

llvm::ISD::FPOW
@ FPOW
Definition: ISDOpcodes.h:1015

llvm::ISD::VAEND
@ VAEND
VAEND, VASTART - VAEND and VASTART have three operands: an input chain, pointer, and a SRCVALUE.
Definition: ISDOpcodes.h:1265

llvm::ISD::ConstantFP
@ ConstantFP
Definition: ISDOpcodes.h:87

llvm::ISD::UADDO
@ UADDO
Definition: ISDOpcodes.h:344

llvm::ISD::FTRUNC
@ FTRUNC
Definition: ISDOpcodes.h:1034

llvm::ISD::SDIV
@ SDIV
Definition: ISDOpcodes.h:262

llvm::ISD::ADDC
@ ADDC
Carry-setting nodes for multiple precision addition and subtraction.
Definition: ISDOpcodes.h:289

llvm::ISD::ADD
@ ADD
Simple integer binary arithmetic operators.
Definition: ISDOpcodes.h:259

llvm::ISD::LOAD
@ LOAD
LOAD and STORE have token chains as their first operand, then the same operands as an LLVM load/store...
Definition: ISDOpcodes.h:1141

llvm::ISD::FMA
@ FMA
FMA - Perform a * b + c with no intermediate rounding step.
Definition: ISDOpcodes.h:511

llvm::ISD::SUBC
@ SUBC
Definition: ISDOpcodes.h:290

llvm::ISD::FNEARBYINT
@ FNEARBYINT
Definition: ISDOpcodes.h:1036

llvm::ISD::INTRINSIC_VOID
@ INTRINSIC_VOID
OUTCHAIN = INTRINSIC_VOID(INCHAIN, INTRINSICID, arg1, arg2, ...) This node represents a target intrin...
Definition: ISDOpcodes.h:215

llvm::ISD::RETURNADDR
@ RETURNADDR
Definition: ISDOpcodes.h:111

llvm::ISD::GlobalAddress
@ GlobalAddress
Definition: ISDOpcodes.h:88

llvm::ISD::SINT_TO_FP
@ SINT_TO_FP
[SU]INT_TO_FP - These operators convert integers (whose interpreted sign depends on the first letter)...
Definition: ISDOpcodes.h:862

llvm::ISD::CONCAT_VECTORS
@ CONCAT_VECTORS
CONCAT_VECTORS(VECTOR0, VECTOR1, ...) - Given a number of values of vector type with the same length ...
Definition: ISDOpcodes.h:571

llvm::ISD::ABS
@ ABS
ABS - Determine the unsigned absolute value of a signed integer value of the same bitwidth.
Definition: ISDOpcodes.h:738

llvm::ISD::FEXP10
@ FEXP10
Definition: ISDOpcodes.h:1032

llvm::ISD::SIGN_EXTEND_VECTOR_INREG
@ SIGN_EXTEND_VECTOR_INREG
SIGN_EXTEND_VECTOR_INREG(Vector) - This operator represents an in-register sign-extension of the low ...
Definition: ISDOpcodes.h:892

llvm::ISD::FP_TO_FP16
@ FP_TO_FP16
Definition: ISDOpcodes.h:986

llvm::ISD::UDIVREM
@ UDIVREM
Definition: ISDOpcodes.h:276

llvm::ISD::SDIVREM
@ SDIVREM
SDIVREM/UDIVREM - Divide two integers and produce both a quotient and remainder result.
Definition: ISDOpcodes.h:275

llvm::ISD::SRL
@ SRL
Definition: ISDOpcodes.h:758

llvm::ISD::FMAXIMUM
@ FMAXIMUM
Definition: ISDOpcodes.h:1082

llvm::ISD::FP16_TO_FP
@ FP16_TO_FP
FP16_TO_FP, FP_TO_FP16 - These operators are used to perform promotions and truncation for half-preci...
Definition: ISDOpcodes.h:985

llvm::ISD::BITCAST
@ BITCAST
BITCAST - This operator converts between integer, vector and FP values, as if the value was stored to...
Definition: ISDOpcodes.h:975

llvm::ISD::BUILD_PAIR
@ BUILD_PAIR
BUILD_PAIR - This is the opposite of EXTRACT_ELEMENT in some ways.
Definition: ISDOpcodes.h:249

llvm::ISD::FFLOOR
@ FFLOOR
Definition: ISDOpcodes.h:1039

llvm::ISD::BUILTIN_OP_END
@ BUILTIN_OP_END
BUILTIN_OP_END - This must be the last enum value in this list.
Definition: ISDOpcodes.h:1568

llvm::ISD::GlobalTLSAddress
@ GlobalTLSAddress
Definition: ISDOpcodes.h:89

llvm::ISD::SRA
@ SRA
Definition: ISDOpcodes.h:757

llvm::ISD::FrameIndex
@ FrameIndex
Definition: ISDOpcodes.h:90

llvm::ISD::SIGN_EXTEND
@ SIGN_EXTEND
Conversion operators.
Definition: ISDOpcodes.h:826

llvm::ISD::FLOG2
@ FLOG2
Definition: ISDOpcodes.h:1028

llvm::ISD::SCALAR_TO_VECTOR
@ SCALAR_TO_VECTOR
SCALAR_TO_VECTOR(VAL) - This represents the operation of loading a scalar value into element 0 of the...
Definition: ISDOpcodes.h:656

llvm::ISD::UADDSAT
@ UADDSAT
Definition: ISDOpcodes.h:361

llvm::ISD::FRINT
@ FRINT
Definition: ISDOpcodes.h:1035

llvm::ISD::FSINCOS
@ FSINCOS
FSINCOS - Compute both fsin and fcos as a single operation.
Definition: ISDOpcodes.h:1090

llvm::ISD::BR_CC
@ BR_CC
BR_CC - Conditional branch.
Definition: ISDOpcodes.h:1187

llvm::ISD::CTTZ
@ CTTZ
Definition: ISDOpcodes.h:766

llvm::ISD::FP_TO_UINT
@ FP_TO_UINT
Definition: ISDOpcodes.h:909

llvm::ISD::BRIND
@ BRIND
BRIND - Indirect branch.
Definition: ISDOpcodes.h:1162

llvm::ISD::BR_JT
@ BR_JT
BR_JT - Jumptable branch.
Definition: ISDOpcodes.h:1166

llvm::ISD::SSUBSAT
@ SSUBSAT
RESULT = [US]SUBSAT(LHS, RHS) - Perform saturation subtraction on 2 integers with the same bit width ...
Definition: ISDOpcodes.h:369

llvm::ISD::SRA_PARTS
@ SRA_PARTS
Definition: ISDOpcodes.h:816

llvm::ISD::UMUL_LOHI
@ UMUL_LOHI
Definition: ISDOpcodes.h:271

llvm::ISD::EXTRACT_ELEMENT
@ EXTRACT_ELEMENT
EXTRACT_ELEMENT - This is used to get the lower or upper (determined by a Constant,...
Definition: ISDOpcodes.h:242

llvm::ISD::SPLAT_VECTOR
@ SPLAT_VECTOR
SPLAT_VECTOR(VAL) - Returns a vector with the scalar value VAL duplicated in all lanes.
Definition: ISDOpcodes.h:663

llvm::ISD::VACOPY
@ VACOPY
VACOPY - VACOPY has 5 operands: an input chain, a destination pointer, a source pointer,...
Definition: ISDOpcodes.h:1261

llvm::ISD::AVGCEILU
@ AVGCEILU
Definition: ISDOpcodes.h:707

llvm::ISD::USUBSAT
@ USUBSAT
Definition: ISDOpcodes.h:370

llvm::ISD::MULHU
@ MULHU
MULHU/MULHS - Multiply high - Multiply two integers of type iN, producing an unsigned/signed value of...
Definition: ISDOpcodes.h:695

llvm::ISD::SHL
@ SHL
Shift and rotation operations.
Definition: ISDOpcodes.h:756

llvm::ISD::VECTOR_SHUFFLE
@ VECTOR_SHUFFLE
VECTOR_SHUFFLE(VEC1, VEC2) - Returns a vector, of the same type as VEC1/VEC2.
Definition: ISDOpcodes.h:636

llvm::ISD::EXTRACT_SUBVECTOR
@ EXTRACT_SUBVECTOR
EXTRACT_SUBVECTOR(VECTOR, IDX) - Returns a subvector from VECTOR.
Definition: ISDOpcodes.h:601

llvm::ISD::FCOS
@ FCOS
Definition: ISDOpcodes.h:1007

llvm::ISD::EXTRACT_VECTOR_ELT
@ EXTRACT_VECTOR_ELT
EXTRACT_VECTOR_ELT(VECTOR, IDX) - Returns a single element from VECTOR identified by the (potentially...
Definition: ISDOpcodes.h:563

llvm::ISD::CopyToReg
@ CopyToReg
CopyToReg - This node has three operands: a chain, a register number to set to this value,...
Definition: ISDOpcodes.h:219

llvm::ISD::ZERO_EXTEND
@ ZERO_EXTEND
ZERO_EXTEND - Used for integer types, zeroing the new bits.
Definition: ISDOpcodes.h:832

llvm::ISD::DEBUGTRAP
@ DEBUGTRAP
DEBUGTRAP - Trap intended to get the attention of a debugger.
Definition: ISDOpcodes.h:1321

llvm::ISD::FP_TO_UINT_SAT
@ FP_TO_UINT_SAT
Definition: ISDOpcodes.h:928

llvm::ISD::CTPOP
@ CTPOP
Definition: ISDOpcodes.h:768

llvm::ISD::SELECT_CC
@ SELECT_CC
Select with condition operator - This selects between a true value and a false value (ops #2 and #3) ...
Definition: ISDOpcodes.h:793

llvm::ISD::SRL_PARTS
@ SRL_PARTS
Definition: ISDOpcodes.h:817

llvm::ISD::SUB
@ SUB
Definition: ISDOpcodes.h:260

llvm::ISD::MULHS
@ MULHS
Definition: ISDOpcodes.h:696

llvm::ISD::DYNAMIC_STACKALLOC
@ DYNAMIC_STACKALLOC
DYNAMIC_STACKALLOC - Allocate some number of bytes on the stack aligned to a specified boundary.
Definition: ISDOpcodes.h:1151

llvm::ISD::SIGN_EXTEND_INREG
@ SIGN_EXTEND_INREG
SIGN_EXTEND_INREG - This operator atomically performs a SHL/SRA pair to sign extend a small value in ...
Definition: ISDOpcodes.h:870

llvm::ISD::SMIN
@ SMIN
[US]{MIN/MAX} - Binary minimum or maximum of signed or unsigned integers.
Definition: ISDOpcodes.h:718

llvm::ISD::Constant
@ Constant
Definition: ISDOpcodes.h:86

llvm::ISD::FP_EXTEND
@ FP_EXTEND
X = FP_EXTEND(Y) - Extend a smaller FP type into a larger FP type.
Definition: ISDOpcodes.h:960

llvm::ISD::FROUNDEVEN
@ FROUNDEVEN
Definition: ISDOpcodes.h:1038

llvm::ISD::FRAMEADDR
@ FRAMEADDR
FRAMEADDR, RETURNADDR - These nodes represent llvm.frameaddress and llvm.returnaddress on the DAG.
Definition: ISDOpcodes.h:110

llvm::ISD::FREM
@ FREM
Definition: ISDOpcodes.h:414

llvm::ISD::FMINIMUM
@ FMINIMUM
FMINIMUM/FMAXIMUM - NaN-propagating minimum/maximum that also treat -0.0 as less than 0....
Definition: ISDOpcodes.h:1081

llvm::ISD::FP_TO_SINT
@ FP_TO_SINT
FP_TO_[US]INT - Convert a floating point value to a signed or unsigned integer.
Definition: ISDOpcodes.h:908

llvm::ISD::TargetConstant
@ TargetConstant
TargetConstant* - Like Constant*, but the DAG does not do any folding, simplification,...
Definition: ISDOpcodes.h:174

llvm::ISD::AND
@ AND
Bitwise operators - logical and, logical or, logical xor.
Definition: ISDOpcodes.h:730

llvm::ISD::TRAP
@ TRAP
TRAP - Trapping instruction.
Definition: ISDOpcodes.h:1318

llvm::ISD::INTRINSIC_WO_CHAIN
@ INTRINSIC_WO_CHAIN
RESULT = INTRINSIC_WO_CHAIN(INTRINSICID, arg1, arg2, ...) This node represents a target intrinsic fun...
Definition: ISDOpcodes.h:200

llvm::ISD::FLOG
@ FLOG
Definition: ISDOpcodes.h:1027

llvm::ISD::SUBE
@ SUBE
Definition: ISDOpcodes.h:300

llvm::ISD::ADDE
@ ADDE
Carry-using nodes for multiple precision addition and subtraction.
Definition: ISDOpcodes.h:299

llvm::ISD::UREM
@ UREM
Definition: ISDOpcodes.h:265

llvm::ISD::INSERT_VECTOR_ELT
@ INSERT_VECTOR_ELT
INSERT_VECTOR_ELT(VECTOR, VAL, IDX) - Returns VECTOR with the element at IDX replaced with VAL.
Definition: ISDOpcodes.h:552

llvm::ISD::TokenFactor
@ TokenFactor
TokenFactor - This node takes multiple tokens as input and produces a single token result.
Definition: ISDOpcodes.h:53

llvm::ISD::FSIN
@ FSIN
Definition: ISDOpcodes.h:1006

llvm::ISD::FEXP
@ FEXP
Definition: ISDOpcodes.h:1030

llvm::ISD::FCEIL
@ FCEIL
Definition: ISDOpcodes.h:1033

llvm::ISD::ExternalSymbol
@ ExternalSymbol
Definition: ISDOpcodes.h:93

llvm::ISD::MUL
@ MUL
Definition: ISDOpcodes.h:261

llvm::ISD::FP_ROUND
@ FP_ROUND
X = FP_ROUND(Y, TRUNC) - Rounding 'Y' from a larger floating point type down to the precision of the ...
Definition: ISDOpcodes.h:941

llvm::ISD::CTLZ
@ CTLZ
Definition: ISDOpcodes.h:767

llvm::ISD::CLEAR_CACHE
@ CLEAR_CACHE
Definition: ISDOpcodes.h:1564

llvm::ISD::ZERO_EXTEND_VECTOR_INREG
@ ZERO_EXTEND_VECTOR_INREG
ZERO_EXTEND_VECTOR_INREG(Vector) - This operator represents an in-register zero-extension of the low ...
Definition: ISDOpcodes.h:903

llvm::ISD::VASTART
@ VASTART
Definition: ISDOpcodes.h:1266

llvm::ISD::FP_TO_SINT_SAT
@ FP_TO_SINT_SAT
FP_TO_[US]INT_SAT - Convert floating point value in operand 0 to a signed or unsigned scalar integer ...
Definition: ISDOpcodes.h:927

llvm::ISD::TRUNCATE
@ TRUNCATE
TRUNCATE - Completely drop the high bits.
Definition: ISDOpcodes.h:838

llvm::ISD::VAARG
@ VAARG
VAARG - VAARG has four operands: an input chain, a pointer, a SRCVALUE, and the alignment.
Definition: ISDOpcodes.h:1256

llvm::ISD::ROTL
@ ROTL
Definition: ISDOpcodes.h:759

llvm::ISD::BlockAddress
@ BlockAddress
Definition: ISDOpcodes.h:94

llvm::ISD::SHL_PARTS
@ SHL_PARTS
SHL_PARTS/SRA_PARTS/SRL_PARTS - These operators are used for expanded integer shift operations.
Definition: ISDOpcodes.h:815

llvm::ISD::FCOPYSIGN
@ FCOPYSIGN
FCOPYSIGN(X, Y) - Return the value of X with the sign of Y.
Definition: ISDOpcodes.h:521

llvm::ISD::SADDSAT
@ SADDSAT
RESULT = [US]ADDSAT(LHS, RHS) - Perform saturation addition on 2 integers with the same bit width (W)...
Definition: ISDOpcodes.h:360

llvm::ISD::FEXP2
@ FEXP2
Definition: ISDOpcodes.h:1031

llvm::ISD::SMAX
@ SMAX
Definition: ISDOpcodes.h:719

llvm::ISD::UMAX
@ UMAX
Definition: ISDOpcodes.h:721

llvm::ISD::INTRINSIC_W_CHAIN
@ INTRINSIC_W_CHAIN
RESULT,OUTCHAIN = INTRINSIC_W_CHAIN(INCHAIN, INTRINSICID, arg1, ...) This node represents a target in...
Definition: ISDOpcodes.h:208

llvm::ISD::BUILD_VECTOR
@ BUILD_VECTOR
BUILD_VECTOR(ELT0, ELT1, ELT2, ELT3,...) - Return a fixed-width vector with the specified,...
Definition: ISDOpcodes.h:543

llvm::ISD::isExtOpcode
bool isExtOpcode(unsigned Opcode)
Definition: ISDOpcodes.h:1756

llvm::ISD::isConstantSplatVector
LLVM_ABI bool isConstantSplatVector(const SDNode *N, APInt &SplatValue)
Node predicates.
Definition: SelectionDAG.cpp:151

llvm::ISD::CondCode
CondCode
ISD::CondCode enum - These are ordered carefully to make the bitfields below work out,...
Definition: ISDOpcodes.h:1685

llvm::ISD::SETUEQ
@ SETUEQ
Definition: ISDOpcodes.h:1696

llvm::ISD::SETNE
@ SETNE
Definition: ISDOpcodes.h:1710

llvm::ISD::SETUGT
@ SETUGT
Definition: ISDOpcodes.h:1697

llvm::ISD::SETULT
@ SETULT
Definition: ISDOpcodes.h:1699

llvm::ISD::SETUO
@ SETUO
Definition: ISDOpcodes.h:1695

llvm::ISD::SETONE
@ SETONE
Definition: ISDOpcodes.h:1693

llvm::ISD::SETO
@ SETO
Definition: ISDOpcodes.h:1694

llvm::ISD::SETUGE
@ SETUGE
Definition: ISDOpcodes.h:1698

llvm::ISD::SETULE
@ SETULE
Definition: ISDOpcodes.h:1700

llvm::ISD::SETEQ
@ SETEQ
Definition: ISDOpcodes.h:1705

llvm::ISD::SEXTLOAD
@ SEXTLOAD
Definition: ISDOpcodes.h:1665

llvm::ISD::ZEXTLOAD
@ ZEXTLOAD
Definition: ISDOpcodes.h:1665

llvm::ISD::EXTLOAD
@ EXTLOAD
Definition: ISDOpcodes.h:1665

llvm::M68k::MemAddrModeKind::V
@ V

llvm::MCOI::OperandFlags
OperandFlags
These are flags set on operands, but should be considered private, all access should go through the M...
Definition: MCInstrDesc.h:51

llvm::MipsISD::Ret
@ Ret
Definition: MipsISelLowering.h:117

llvm::MipsISD::Ext
@ Ext
Definition: MipsISelLowering.h:157

llvm::MipsISD::Ins
@ Ins
Definition: MipsISelLowering.h:158

llvm::NVPTX::Const
@ Const
Definition: NVPTX.h:185

llvm::PatternMatch::m_BitCast
CastOperator_match< OpTy, Instruction::BitCast > m_BitCast(const OpTy &Op)
Matches BitCast.
Definition: PatternMatch.h:2150

llvm::PatternMatch::m_Value
class_match< Value > m_Value()
Match an arbitrary value and ignore it.
Definition: PatternMatch.h:92

llvm::PatternMatch::m_Zero
is_zero m_Zero()
Match any null constant or a vector with all elements equal to 0.
Definition: PatternMatch.h:612

llvm::SDPatternMatch
Definition: SDPatternMatch.h:25

llvm::Sched::RegPressure
@ RegPressure
Definition: TargetLowering.h:106

llvm::SystemZISD::TM
@ TM
Definition: SystemZISelLowering.h:66

llvm::WebAssemblyII::MO_TABLE_BASE_REL
@ MO_TABLE_BASE_REL
Definition: WebAssemblyMCTargetDesc.h:116

llvm::WebAssemblyII::MO_MEMORY_BASE_REL
@ MO_MEMORY_BASE_REL
Definition: WebAssemblyMCTargetDesc.h:106

llvm::WebAssemblyII::MO_TLS_BASE_REL
@ MO_TLS_BASE_REL
Definition: WebAssemblyMCTargetDesc.h:111

llvm::WebAssemblyII::MO_GOT
@ MO_GOT
Definition: WebAssemblyMCTargetDesc.h:98

llvm::WebAssemblyII::MO_GOT_TLS
@ MO_GOT_TLS
Definition: WebAssemblyMCTargetDesc.h:101

llvm::WebAssemblyISD::NodeType
NodeType
Definition: WebAssemblyISelLowering.h:24

llvm::WebAssemblyISD::FIRST_NUMBER
@ FIRST_NUMBER
Definition: WebAssemblyISelLowering.h:25

llvm::WebAssembly::getOrCreateFunctionTableSymbol
MCSymbolWasm * getOrCreateFunctionTableSymbol(MCContext &Ctx, const WebAssemblySubtarget *Subtarget)
Returns the __indirect_function_table, for use in call_indirect and in function bitcasts.
Definition: WebAssemblyUtilities.cpp:104

llvm::WebAssembly::WASM_ADDRESS_SPACE_EXTERNREF
@ WASM_ADDRESS_SPACE_EXTERNREF
Definition: WasmAddressSpaces.h:29

llvm::WebAssembly::WASM_ADDRESS_SPACE_FUNCREF
@ WASM_ADDRESS_SPACE_FUNCREF
Definition: WasmAddressSpaces.h:31

llvm::WebAssembly::isWebAssemblyFuncrefType
bool isWebAssemblyFuncrefType(const Type *Ty)
Return true if this is a WebAssembly Funcref Type.
Definition: WebAssemblyTypeUtilities.h:37

llvm::WebAssembly::isWebAssemblyTableType
bool isWebAssemblyTableType(const Type *Ty)
Return true if the table represents a WebAssembly table type.
Definition: WebAssemblyTypeUtilities.h:49

llvm::WebAssembly::getOrCreateFuncrefCallTableSymbol
MCSymbolWasm * getOrCreateFuncrefCallTableSymbol(MCContext &Ctx, const WebAssemblySubtarget *Subtarget)
Returns the __funcref_call_table, for use in funcref calls when lowered to table.set + call_indirect.
Definition: WebAssemblyUtilities.cpp:123

llvm::WebAssembly::createFastISel
FastISel * createFastISel(FunctionLoweringInfo &funcInfo, const TargetLibraryInfo *libInfo)
Definition: WebAssemblyFastISel.cpp:1451

llvm::WebAssembly::isValidAddressSpace
bool isValidAddressSpace(unsigned AS)
Definition: WasmAddressSpaces.h:40

llvm::WebAssembly::canLowerReturn
bool canLowerReturn(size_t ResultSize, const WebAssemblySubtarget *Subtarget)
Returns true if the function's return value(s) can be lowered directly, i.e., not indirectly via a po...
Definition: WebAssemblyUtilities.cpp:193

llvm::WebAssembly::isWasmVarAddressSpace
bool isWasmVarAddressSpace(unsigned AS)
Definition: WasmAddressSpaces.h:37

llvm::X86Disassembler::Reg
Reg
All possible values of the reg field in the ModR/M byte.
Definition: X86DisassemblerDecoder.h:621

llvm::codeview::FrameCookieKind::Copy
@ Copy

llvm::codeview::ExportFlags::IsConstant
@ IsConstant

llvm::dwarf::Index
Index
Definition: Dwarf.h:889

llvm::logicalview::LVAttributeKind::Zero
@ Zero

llvm::ms_demangle::QualifierMangleMode::Result
@ Result

llvm::omp::RTLDependInfoFields::BaseAddr
@ BaseAddr

llvm::pdb::PDB_SymType::Callee
@ Callee

llvm::sampleprof::Base
@ Base
Definition: Discriminator.h:58

llvm::sframe::Flags
Flags
Definition: SFrame.h:39

llvm::tgtok::In
@ In
Definition: TGLexer.h:84

llvm
This is an optimization pass for GlobalISel generic memory operations.
Definition: AddressRanges.h:18

llvm::drop_begin
auto drop_begin(T &&RangeOrContainer, size_t N=1)
Return a range covering RangeOrContainer with the first N elements excluded.
Definition: STLExtras.h:338

llvm::Log2_32_Ceil
unsigned Log2_32_Ceil(uint32_t Value)
Return the ceil log base 2 of the specified value, 32 if the value is zero.
Definition: MathExtras.h:349

llvm::Offset
@ Offset
Definition: DWP.cpp:477

llvm::computeSignatureVTs
void computeSignatureVTs(const FunctionType *Ty, const Function *TargetFunc, const Function &ContextFunc, const TargetMachine &TM, SmallVectorImpl< MVT > &Params, SmallVectorImpl< MVT > &Results)
Definition: WebAssemblyMachineFunctionInfo.cpp:64

llvm::size
auto size(R &&Range, std::enable_if_t< std::is_base_of< std::random_access_iterator_tag, typename std::iterator_traits< decltype(Range.begin())>::iterator_category >::value, void > *=nullptr)
Get the size of a range.
Definition: STLExtras.h:1702

llvm::BuildMI
MachineInstrBuilder BuildMI(MachineFunction &MF, const MIMetadata &MIMD, const MCInstrDesc &MCID)
Builder interface. Specify how to create the initial instruction itself.
Definition: MachineInstrBuilder.h:369

llvm::isNullConstant
LLVM_ABI bool isNullConstant(SDValue V)
Returns true if V is a constant integer zero.
Definition: SelectionDAG.cpp:12647

llvm::Depth
@ Depth
Definition: SIMachineScheduler.h:36

llvm::peekThroughBitcasts
LLVM_ABI SDValue peekThroughBitcasts(SDValue V)
Return the non-bitcasted source operand of V if it exists.
Definition: SelectionDAG.cpp:12739

llvm::isPowerOf2_32
constexpr bool isPowerOf2_32(uint32_t Value)
Return true if the argument is a power of two > 0.
Definition: MathExtras.h:288

llvm::get
decltype(auto) get(const PointerIntPair< PointerTy, IntBits, IntType, PtrTraits, Info > &Pair)
Definition: PointerIntPair.h:269

llvm::ComplexDeinterleavingOperation::Splat
@ Splat

llvm::report_fatal_error
LLVM_ABI void report_fatal_error(Error Err, bool gen_crash_diag=true)
Definition: Error.cpp:167

llvm::PackElem::Hi
@ Hi

llvm::PackElem::Lo
@ Lo

llvm::RecurKind::Mul
@ Mul
Product of integers.

llvm::RecurKind::Add
@ Add
Sum of integers.

llvm::Op
DWARFExpression::Operation Op
Definition: DWARFExpressionPrinter.cpp:22

llvm::max_element
auto max_element(R &&Range)
Provide wrappers to std::max_element which take ranges instead of having to pass begin/end explicitly...
Definition: STLExtras.h:2049

llvm::BitWidth
constexpr unsigned BitWidth
Definition: BitmaskEnum.h:223

llvm::find_if
auto find_if(R &&Range, UnaryPredicate P)
Provide wrappers to std::find_if which take ranges instead of having to pass begin/end explicitly.
Definition: STLExtras.h:1777

llvm::erase_if
void erase_if(Container &C, UnaryPredicate P)
Provide a container algorithm similar to C++ Library Fundamentals v2's erase_if which is equivalent t...
Definition: STLExtras.h:2139

llvm::computeLegalValueVTs
void computeLegalValueVTs(const WebAssemblyTargetLowering &TLI, LLVMContext &Ctx, const DataLayout &DL, Type *Ty, SmallVectorImpl< MVT > &ValueVTs)
Definition: WebAssemblyMachineFunctionInfo.cpp:42

llvm::NextPowerOf2
constexpr uint64_t NextPowerOf2(uint64_t A)
Returns the next power of two (in 64-bits) that is strictly greater than A.
Definition: MathExtras.h:378

std::swap
void swap(llvm::BitVector &LHS, llvm::BitVector &RHS)
Implement std::swap in terms of BitVector swap.
Definition: BitVector.h:858

N
#define N

llvm::Align
This struct is a compact representation of a valid (non-zero power of two) alignment.
Definition: Alignment.h:39

llvm::EVT
Extended Value Type.
Definition: ValueTypes.h:35

llvm::EVT::changeVectorElementTypeToInteger
EVT changeVectorElementTypeToInteger() const
Return a vector with the same number of elements as this vector, but with the element type converted ...
Definition: ValueTypes.h:94

llvm::EVT::isSimple
bool isSimple() const
Test if the given EVT is simple (as opposed to being extended).
Definition: ValueTypes.h:137

llvm::EVT::getVectorVT
static EVT getVectorVT(LLVMContext &Context, EVT VT, unsigned NumElements, bool IsScalable=false)
Returns the EVT that represents a vector NumElements in length, where each element is of type VT.
Definition: ValueTypes.h:74

llvm::EVT::isFloatingPoint
bool isFloatingPoint() const
Return true if this is a FP or a vector FP type.
Definition: ValueTypes.h:147

llvm::EVT::getVectorElementCount
ElementCount getVectorElementCount() const
Definition: ValueTypes.h:345

llvm::EVT::getSizeInBits
TypeSize getSizeInBits() const
Return the size of the specified value type in bits.
Definition: ValueTypes.h:368

llvm::EVT::isByteSized
bool isByteSized() const
Return true if the bit size is a multiple of 8.
Definition: ValueTypes.h:238

llvm::EVT::getScalarSizeInBits
uint64_t getScalarSizeInBits() const
Definition: ValueTypes.h:380

llvm::EVT::getEVT
static LLVM_ABI EVT getEVT(Type *Ty, bool HandleUnknown=false)
Return the value type corresponding to the specified type.
Definition: ValueTypes.cpp:299

llvm::EVT::getSimpleVT
MVT getSimpleVT() const
Return the SimpleValueType held in the specified simple EVT.
Definition: ValueTypes.h:311

llvm::EVT::is128BitVector
bool is128BitVector() const
Return true if this is a 128-bit vector type.
Definition: ValueTypes.h:207

llvm::EVT::getIntegerVT
static EVT getIntegerVT(LLVMContext &Context, unsigned BitWidth)
Returns the EVT that represents an integer with the given number of bits.
Definition: ValueTypes.h:65

llvm::EVT::getFixedSizeInBits
uint64_t getFixedSizeInBits() const
Return the size of the specified fixed width value type in bits.
Definition: ValueTypes.h:376

llvm::EVT::isFixedLengthVector
bool isFixedLengthVector() const
Definition: ValueTypes.h:181

llvm::EVT::isVector
bool isVector() const
Return true if this is a vector value type.
Definition: ValueTypes.h:168

llvm::EVT::getScalarType
EVT getScalarType() const
If this is a vector type, return the element type, otherwise return this.
Definition: ValueTypes.h:318

llvm::EVT::bitsGE
bool bitsGE(EVT VT) const
Return true if this has no less bits than VT.
Definition: ValueTypes.h:287

llvm::EVT::is256BitVector
bool is256BitVector() const
Return true if this is a 256-bit vector type.
Definition: ValueTypes.h:212

llvm::EVT::getTypeForEVT
LLVM_ABI Type * getTypeForEVT(LLVMContext &Context) const
This method returns an LLVM type corresponding to the specified EVT.
Definition: ValueTypes.cpp:216

llvm::EVT::getVectorElementType
EVT getVectorElementType() const
Given a vector type, return the type of each element.
Definition: ValueTypes.h:323

llvm::EVT::isScalarInteger
bool isScalarInteger() const
Return true if this is an integer, but not a vector.
Definition: ValueTypes.h:157

llvm::EVT::changeVectorElementType
EVT changeVectorElementType(EVT EltVT) const
Return a VT for a vector type whose attributes match ourselves with the exception of the element type...
Definition: ValueTypes.h:102

llvm::EVT::getVectorNumElements
unsigned getVectorNumElements() const
Given a vector type, return the number of elements it contains.
Definition: ValueTypes.h:331

llvm::ISD::ArgFlagsTy
Definition: TargetCallingConv.h:27

llvm::ISD::ArgFlagsTy::isNest
bool isNest() const
Definition: TargetCallingConv.h:124

llvm::ISD::ArgFlagsTy::isInConsecutiveRegs
bool isInConsecutiveRegs() const
Definition: TargetCallingConv.h:130

llvm::ISD::ArgFlagsTy::isInAlloca
bool isInAlloca() const
Definition: TargetCallingConv.h:97

llvm::ISD::ArgFlagsTy::getNonZeroOrigAlign
Align getNonZeroOrigAlign() const
Definition: TargetCallingConv.h:169

llvm::ISD::ArgFlagsTy::isSwiftSelf
bool isSwiftSelf() const
Definition: TargetCallingConv.h:103

llvm::ISD::ArgFlagsTy::isSwiftError
bool isSwiftError() const
Definition: TargetCallingConv.h:109

llvm::ISD::ArgFlagsTy::getByValSize
unsigned getByValSize() const
Definition: TargetCallingConv.h:178

llvm::ISD::ArgFlagsTy::isByVal
bool isByVal() const
Definition: TargetCallingConv.h:91

llvm::ISD::ArgFlagsTy::isInConsecutiveRegsLast
bool isInConsecutiveRegsLast() const
Definition: TargetCallingConv.h:133

llvm::ISD::ArgFlagsTy::isVarArg
bool isVarArg() const
Definition: TargetCallingConv.h:150

llvm::ISD::ArgFlagsTy::getNonZeroByValAlign
Align getNonZeroByValAlign() const
Definition: TargetCallingConv.h:162

llvm::ISD::InputArg
InputArg - This struct carries flags and type information about a single incoming (formal) argument o...
Definition: TargetCallingConv.h:204

llvm::ISD::OutputArg
OutputArg - This struct carries flags and a value for a single outgoing (actual) argument or outgoing...
Definition: TargetCallingConv.h:246

llvm::ISD::OutputArg::Flags
ArgFlagsTy Flags
Definition: TargetCallingConv.h:247

llvm::KnownBits
Definition: KnownBits.h:24

llvm::KnownBits::getBitWidth
unsigned getBitWidth() const
Get the bit width of this value.
Definition: KnownBits.h:44

llvm::KnownBits::Zero
APInt Zero
Definition: KnownBits.h:25

llvm::MIPatternMatch::And
Matching combinators.
Definition: MIPatternMatch.h:313

llvm::MachinePointerInfo
This class contains a discriminated union of information about pointers in memory operands,...
Definition: MachineMemOperand.h:42

llvm::MachinePointerInfo::getFixedStack
static LLVM_ABI MachinePointerInfo getFixedStack(MachineFunction &MF, int FI, int64_t Offset=0)
Return a MachinePointerInfo record that refers to the specified FrameIndex.
Definition: MachineOperand.cpp:1064

llvm::MaybeAlign
This struct is a compact representation of a valid (power of two) or undefined (0) alignment.
Definition: Alignment.h:117

llvm::SDNodeFlags
These are IR-level optimization flags that may be propagated to SDNodes.
Definition: SelectionDAGNodes.h:384

llvm::SDVTList
This represents a list of ValueType's that has been intern'd by a SelectionDAG.
Definition: SelectionDAGNodes.h:80

llvm::TargetLowering::DAGCombinerInfo
Definition: TargetLowering.h:4398

llvm::TargetLowering::DAGCombinerInfo::isBeforeLegalize
bool isBeforeLegalize() const
Definition: TargetLowering.h:4409

llvm::TargetLowering::DAGCombinerInfo::DAG
SelectionDAG & DAG
Definition: TargetLowering.h:4404

llvm::less_second
Function object to check whether the second component of a container supported by std::get (like std:...
Definition: STLExtras.h:1481