LLVM: lib/CodeGen/SelectionDAG/LegalizeVectorOps.cpp Source File

//===- LegalizeVectorOps.cpp - Implement SelectionDAG::LegalizeVectors ----===//

//

// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.

// See https://llvm.org/LICENSE.txt for license information.

// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception

//

//===----------------------------------------------------------------------===//

//

// This file implements the SelectionDAG::LegalizeVectors method.

//

// The vector legalizer looks for vector operations which might need to be

// scalarized and legalizes them. This is a separate step from Legalize because

// scalarizing can introduce illegal types.  For example, suppose we have an

// ISD::SDIV of type v2i64 on x86-32.  The type is legal (for example, addition

// on a v2i64 is legal), but ISD::SDIV isn't legal, so we have to unroll the

// operation, which introduces nodes with the illegal type i64 which must be

// expanded.  Similarly, suppose we have an ISD::SRA of type v16i8 on PowerPC;

// the operation must be unrolled, which introduces nodes with the illegal

// type i8 which must be promoted.

//

// This does not legalize vector manipulations like ISD::BUILD_VECTOR,

// or operations that happen to take a vector which are custom-lowered;

// the legalization for such operations never produces nodes

// with illegal types, so it's okay to put off legalizing them until

// SelectionDAG::Legalize runs.

//

//===----------------------------------------------------------------------===//


#include "llvm/ADT/DenseMap.h"

#include "llvm/ADT/SmallVector.h"

#include "llvm/Analysis/TargetLibraryInfo.h"

#include "llvm/Analysis/VectorUtils.h"

#include "llvm/CodeGen/ISDOpcodes.h"

#include "llvm/CodeGen/SelectionDAG.h"

#include "llvm/CodeGen/SelectionDAGNodes.h"

#include "llvm/CodeGen/TargetLowering.h"

#include "llvm/CodeGen/ValueTypes.h"

#include "llvm/CodeGenTypes/MachineValueType.h"

#include "llvm/IR/DataLayout.h"

#include "llvm/Support/Casting.h"

#include "llvm/Support/Compiler.h"

#include "llvm/Support/Debug.h"

#include "llvm/Support/ErrorHandling.h"

#include <cassert>

#include <cstdint>

#include <iterator>

#include <utility>


using namespace llvm;


#define DEBUG_TYPE "legalizevectorops"


namespace {


class VectorLegalizer {
  SelectionDAG &DAG;
  const TargetLowering &TLI;
  bool Changed = false; // Becomes true once any node has been rewritten.

  /// Translation cache. Once a value has been legalized its replacement is
  /// remembered here, so a node with several users is only processed once and
  /// every user picks up the same regularized operand.
  SmallDenseMap<SDValue, SDValue, 64> LegalizedNodes;

  /// Remember in the translation cache that \p From is now represented by
  /// \p To.
  void AddLegalizedOperand(SDValue From, SDValue To) {
    LegalizedNodes.try_emplace(From, To);
    // The replacement may itself be handed to LegalizeOp later on; make that
    // lookup resolve to the replacement itself.
    if (!(From == To))
      LegalizedNodes.try_emplace(To, To);
  }

  /// Legalize a single value and return its replacement.
  SDValue LegalizeOp(SDValue Op);

  /// For a node that is kept as is: register all values of \p Result as the
  /// legalized form of the corresponding values of \p Op.
  SDValue TranslateLegalizeResults(SDValue Op, SDNode *Result);

  /// Legalize the replacement values in \p Results themselves and enter them
  /// into the translation cache.
  SDValue RecursivelyLegalizeResults(SDValue Op,
                                     MutableArrayRef<SDValue> Results);

  /// Adapter between LowerOperation and a vector of Results.
  /// A return value of false means the target wants the default expansion.
  /// A return value of true with empty Results means the target wants the
  /// input node left untouched.
  bool LowerOperationWrapper(SDNode *N, SmallVectorImpl<SDValue> &Results);

  /// Unroll a VSETCC.
  SDValue UnrollVSETCC(SDNode *Node);

  /// Expand-based legalization of vector operations.
  ///
  /// High-level dispatcher that routes each operation to the code path that
  /// knows how to legalize it.
  void Expand(SDNode *Node, SmallVectorImpl<SDValue> &Results);

  /// Expansion for FP_TO_UINT; uses UnrollVectorOp as the fallback when
  /// FP_TO_SINT isn't legal.
  void ExpandFP_TO_UINT(SDNode *Node, SmallVectorImpl<SDValue> &Results);

  /// Expansion for UINT_TO_FLOAT; uses UnrollVectorOp as the fallback when
  /// SINT_TO_FLOAT and SHR on vectors isn't legal.
  void ExpandUINT_TO_FLOAT(SDNode *Node, SmallVectorImpl<SDValue> &Results);

  /// Expansion for SIGN_EXTEND_INREG by means of SRL and SRA.
  SDValue ExpandSEXTINREG(SDNode *Node);

  /// Expansion for ANY_EXTEND_VECTOR_INREG.
  ///
  /// The low lanes of the operand are shuffled into place and the result is
  /// bitcast to the proper type. The bits in the extended part of each
  /// element are undef.
  SDValue ExpandANY_EXTEND_VECTOR_INREG(SDNode *Node);

  /// Expansion for SIGN_EXTEND_VECTOR_INREG.
  ///
  /// The low lanes of the operand are shuffled into place and bitcast to the
  /// proper type; a left shift followed by an arithmetic right shift then
  /// introduces the sign extension.
  SDValue ExpandSIGN_EXTEND_VECTOR_INREG(SDNode *Node);

  /// Expansion for ZERO_EXTEND_VECTOR_INREG.
  ///
  /// The low lanes of the operand are shuffled into place with zeros blended
  /// into the remaining lanes, followed by a bitcast to the proper type.
  SDValue ExpandZERO_EXTEND_VECTOR_INREG(SDNode *Node);

  /// Turn a vector bswap into a shuffle if that is legal.
  SDValue ExpandBSWAP(SDNode *Node);

  /// Express vselect through XOR, AND and OR for targets that do not support
  /// blend.
  SDValue ExpandVSELECT(SDNode *Node);

  // Further per-opcode expansion helpers; each is named after the operation
  // it handles.
  SDValue ExpandVP_SELECT(SDNode *Node);
  SDValue ExpandVP_MERGE(SDNode *Node);
  SDValue ExpandVP_REM(SDNode *Node);
  SDValue ExpandVP_FNEG(SDNode *Node);
  SDValue ExpandVP_FABS(SDNode *Node);
  SDValue ExpandVP_FCOPYSIGN(SDNode *Node);
  SDValue ExpandSELECT(SDNode *Node);
  std::pair<SDValue, SDValue> ExpandLoad(SDNode *N);
  SDValue ExpandStore(SDNode *N);
  SDValue ExpandFNEG(SDNode *Node);
  SDValue ExpandFABS(SDNode *Node);
  SDValue ExpandFCOPYSIGN(SDNode *Node);
  void ExpandFSUB(SDNode *Node, SmallVectorImpl<SDValue> &Results);
  void ExpandSETCC(SDNode *Node, SmallVectorImpl<SDValue> &Results);
  SDValue ExpandBITREVERSE(SDNode *Node);
  void ExpandUADDSUBO(SDNode *Node, SmallVectorImpl<SDValue> &Results);
  void ExpandSADDSUBO(SDNode *Node, SmallVectorImpl<SDValue> &Results);
  void ExpandMULO(SDNode *Node, SmallVectorImpl<SDValue> &Results);
  void ExpandFixedPointDiv(SDNode *Node, SmallVectorImpl<SDValue> &Results);
  void ExpandStrictFPOp(SDNode *Node, SmallVectorImpl<SDValue> &Results);
  void ExpandREM(SDNode *Node, SmallVectorImpl<SDValue> &Results);

  // Library-call based expansion: one overload takes a single libcall, the
  // other one libcall per floating-point format.
  bool tryExpandVecMathCall(SDNode *Node, RTLIB::Libcall LC,
                            SmallVectorImpl<SDValue> &Results);
  bool tryExpandVecMathCall(SDNode *Node, RTLIB::Libcall Call_F32,
                            RTLIB::Libcall Call_F64, RTLIB::Libcall Call_F80,
                            RTLIB::Libcall Call_F128,
                            RTLIB::Libcall Call_PPCF128,
                            SmallVectorImpl<SDValue> &Results);

  void UnrollStrictFPOp(SDNode *Node, SmallVectorImpl<SDValue> &Results);

  /// Vector promotion.
  ///
  /// In essence the operands are bitcast to a different type and the result
  /// is bitcast back to the original type.
  void Promote(SDNode *Node, SmallVectorImpl<SDValue> &Results);

  /// [SU]INT_TO_FP vector promotion.
  ///
  /// The input operand is [zs]ext'ed to a larger integer type.
  void PromoteINT_TO_FP(SDNode *Node, SmallVectorImpl<SDValue> &Results);

  /// FP_TO_[SU]INT vector promotion of the result type.
  ///
  /// The operation is carried out in a larger integer type and the result is
  /// truncated back to the original type afterwards.
  void PromoteFP_TO_INT(SDNode *Node, SmallVectorImpl<SDValue> &Results);

  /// Vector setcc promotion.
  ///
  /// Every vector operand is promoted to a vector type with a larger element
  /// type.
  void PromoteSETCC(SDNode *Node, SmallVectorImpl<SDValue> &Results);

  void PromoteSTRICT(SDNode *Node, SmallVectorImpl<SDValue> &Results);

  /// Compute the reduction in a type of higher precision and round the result
  /// to the original type. \p NonArithmetic states that rounding the result
  /// does not affect its value.
  void PromoteFloatVECREDUCE(SDNode *Node, SmallVectorImpl<SDValue> &Results,
                             bool NonArithmetic);

public:
  VectorLegalizer(SelectionDAG &dag)
      : DAG(dag), TLI(dag.getTargetLoweringInfo()) {}

  /// Begin legalizing the vector operations in the DAG.
  bool Run();
};


} // end anonymous namespace


bool VectorLegalizer::Run() {

  // Before we start legalizing vector nodes, check if there are any vectors.

  bool HasVectors = false;

  for (SelectionDAG::allnodes_iterator I = DAG.allnodes_begin(),

       E = std::prev(DAG.allnodes_end()); I != std::next(E); ++I) {

    // Check if the values of the nodes contain vectors. We don't need to check

    // the operands because we are going to check their values at some point.

    HasVectors = llvm::any_of(I->values(), [](EVT T) { return T.isVector(); });


    // If we found a vector node we can start the legalization.

    if (HasVectors)

      break;

  }


  // If this basic block has no vectors then no need to legalize vectors.

  if (!HasVectors)

    return false;


  // The legalize process is inherently a bottom-up recursive process (users

  // legalize their uses before themselves).  Given infinite stack space, we

  // could just start legalizing on the root and traverse the whole graph.  In

  // practice however, this causes us to run out of stack space on large basic

  // blocks.  To avoid this problem, compute an ordering of the nodes where each

  // node is only legalized after all of its operands are legalized.

  DAG.AssignTopologicalOrder();

  for (SelectionDAG::allnodes_iterator I = DAG.allnodes_begin(),

       E = std::prev(DAG.allnodes_end()); I != std::next(E); ++I)

    LegalizeOp(SDValue(&*I, 0));


  // Finally, it's possible the root changed.  Get the new root.

  SDValue OldRoot = DAG.getRoot();

  assert(LegalizedNodes.count(OldRoot) && "Root didn't get legalized?");

  DAG.setRoot(LegalizedNodes[OldRoot]);


  LegalizedNodes.clear();


  // Remove dead nodes now.

  DAG.RemoveDeadNodes();


  return Changed;

}


/// Register every value of \p Result as the legalized form of the value of
/// \p Op with the same result number, and return the value of \p Result that
/// corresponds to \p Op's own result number.
SDValue VectorLegalizer::TranslateLegalizeResults(SDValue Op, SDNode *Result) {
  const unsigned NumVals = Op->getNumValues();
  assert(NumVals == Result->getNumValues() &&
         "Unexpected number of results");
  // Generic legalization: the values are simply passed through.
  for (unsigned ResNo = 0; ResNo < NumVals; ++ResNo)
    AddLegalizedOperand(Op.getValue(ResNo), SDValue(Result, ResNo));
  return SDValue(Result, Op.getResNo());
}


/// Legalize each replacement value in \p Results in place, record it in the
/// translation cache as the legalized form of the matching value of \p Op,
/// and return the entry that corresponds to \p Op's result number.
SDValue
VectorLegalizer::RecursivelyLegalizeResults(SDValue Op,
                                            MutableArrayRef<SDValue> Results) {
  assert(Results.size() == Op->getNumValues() &&
         "Unexpected number of results");
  // The code that was just generated has to be legal as well.
  unsigned ResNo = 0;
  for (SDValue &Res : Results) {
    Res = LegalizeOp(Res);
    AddLegalizedOperand(Op.getValue(ResNo), Res);
    ++ResNo;
  }

  return Results[Op.getResNo()];
}


/// Legalize one value of the DAG and return its replacement.
///
/// A cached result is returned directly. Otherwise the operands of the node
/// are legalized first and the node is updated to use them. Nodes that neither
/// produce nor consume a vector, and opcodes that are not listed in the switch
/// below, are passed through unchanged. For all other nodes the target is
/// asked for a legalize action, and the node is handed to Promote,
/// LowerOperationWrapper or Expand accordingly. Every path records its outcome
/// in the translation cache.
SDValue VectorLegalizer::LegalizeOp(SDValue Op) {
  // Note that LegalizeOp may be reentered even from single-use nodes, which
  // means that we always must cache transformed nodes.
  DenseMap<SDValue, SDValue>::iterator I = LegalizedNodes.find(Op);
  if (I != LegalizedNodes.end()) return I->second;

  // Legalize the operands
  SmallVector<SDValue, 8> Ops;
  for (const SDValue &Oper : Op->op_values())
    Ops.push_back(LegalizeOp(Oper));

  // From here on work with the node that carries the legalized operands.
  SDNode *Node = DAG.UpdateNodeOperands(Op.getNode(), Ops);

  // Nodes without any vector result or vector operand are not handled here.
  bool HasVectorValueOrOp =
      llvm::any_of(Node->values(), [](EVT T) { return T.isVector(); }) ||
      llvm::any_of(Node->op_values(),
                   [](SDValue O) { return O.getValueType().isVector(); });
  if (!HasVectorValueOrOp)
    return TranslateLegalizeResults(Op, Node);

  // Determine the legalize action. It stays Legal unless one of the cases
  // below queries the target and gets a different answer.
  TargetLowering::LegalizeAction Action = TargetLowering::Legal;
  EVT ValVT;
  switch (Op.getOpcode()) {
  default:
    // Opcodes not listed here are passed through unchanged.
    return TranslateLegalizeResults(Op, Node);
  case ISD::LOAD: {
    // Only extending loads of a vector memory type are queried.
    LoadSDNode *LD = cast<LoadSDNode>(Node);
    ISD::LoadExtType ExtType = LD->getExtensionType();
    EVT LoadedVT = LD->getMemoryVT();
    if (LoadedVT.isVector() && ExtType != ISD::NON_EXTLOAD)
      Action = TLI.getLoadExtAction(ExtType, LD->getValueType(0), LoadedVT);
    break;
  }
  case ISD::STORE: {
    // Only truncating stores of a vector memory type are queried.
    // Note: this ValVT is local to the case and shadows the outer ValVT.
    StoreSDNode *ST = cast<StoreSDNode>(Node);
    EVT StVT = ST->getMemoryVT();
    MVT ValVT = ST->getValue().getSimpleValueType();
    if (StVT.isVector() && ST->isTruncatingStore())
      Action = TLI.getTruncStoreAction(ValVT, StVT);
    break;
  }
  case ISD::MERGE_VALUES:
    Action = TLI.getOperationAction(Node->getOpcode(), Node->getValueType(0));
    // This operation lies about being legal: when it claims to be legal,
    // it should actually be expanded.
    if (Action == TargetLowering::Legal)
      Action = TargetLowering::Expand;
    break;
  // The macro below turns every entry of ConstrainedOps.def into a case label
  // for the corresponding ISD::STRICT_* opcode; all of them share the code
  // that follows the include.
#define DAG_INSTRUCTION(NAME, NARG, ROUND_MODE, INTRINSIC, DAGN)               \
  case ISD::STRICT_##DAGN:
#include "llvm/IR/ConstrainedOps.def"
    // The type to query is the first result type, except for the strict
    // int-to-fp conversions where it is the type of operand 1.
    ValVT = Node->getValueType(0);
    if (Op.getOpcode() == ISD::STRICT_SINT_TO_FP ||
        Op.getOpcode() == ISD::STRICT_UINT_TO_FP)
      ValVT = Node->getOperand(1).getValueType();
    if (Op.getOpcode() == ISD::STRICT_FSETCC ||
        Op.getOpcode() == ISD::STRICT_FSETCCS) {
      // Strict compares: check the condition code (operand 3) on the type of
      // operand 1 first, and only then the operation itself.
      MVT OpVT = Node->getOperand(1).getSimpleValueType();
      ISD::CondCode CCCode = cast<CondCodeSDNode>(Node->getOperand(3))->get();
      Action = TLI.getCondCodeAction(CCCode, OpVT);
      if (Action == TargetLowering::Legal)
        Action = TLI.getOperationAction(Node->getOpcode(), OpVT);
    } else {
      Action = TLI.getOperationAction(Node->getOpcode(), ValVT);
    }
    // If we're asked to expand a strict vector floating-point operation,
    // by default we're going to simply unroll it.  That is usually the
    // best approach, except in the case where the resulting strict (scalar)
    // operations would themselves use the fallback mutation to non-strict.
    // In that specific case, just do the fallback on the vector op.
    if (Action == TargetLowering::Expand && !TLI.isStrictFPEnabled() &&
        TLI.getStrictFPOperationAction(Node->getOpcode(), ValVT) ==
            TargetLowering::Legal) {
      EVT EltVT = ValVT.getVectorElementType();
      if (TLI.getOperationAction(Node->getOpcode(), EltVT)
          == TargetLowering::Expand &&
          TLI.getStrictFPOperationAction(Node->getOpcode(), EltVT)
          == TargetLowering::Legal)
        Action = TargetLowering::Legal;
    }
    break;
  // Operations whose action is looked up with the type of result 0.
  case ISD::ADD:
  case ISD::SUB:
  case ISD::MUL:
  case ISD::MULHS:
  case ISD::MULHU:
  case ISD::SDIV:
  case ISD::UDIV:
  case ISD::SREM:
  case ISD::UREM:
  case ISD::SDIVREM:
  case ISD::UDIVREM:
  case ISD::FADD:
  case ISD::FSUB:
  case ISD::FMUL:
  case ISD::FDIV:
  case ISD::FREM:
  case ISD::AND:
  case ISD::OR:
  case ISD::XOR:
  case ISD::SHL:
  case ISD::SRA:
  case ISD::SRL:
  case ISD::FSHL:
  case ISD::FSHR:
  case ISD::ROTL:
  case ISD::ROTR:
  case ISD::ABS:
  case ISD::ABDS:
  case ISD::ABDU:
  case ISD::AVGCEILS:
  case ISD::AVGCEILU:
  case ISD::AVGFLOORS:
  case ISD::AVGFLOORU:
  case ISD::BSWAP:
  case ISD::BITREVERSE:
  case ISD::CTLZ:
  case ISD::CTTZ:
  case ISD::CTLZ_ZERO_UNDEF:
  case ISD::CTTZ_ZERO_UNDEF:
  case ISD::CTPOP:
  case ISD::SELECT:
  case ISD::VSELECT:
  case ISD::SELECT_CC:
  case ISD::ZERO_EXTEND:
  case ISD::ANY_EXTEND:
  case ISD::TRUNCATE:
  case ISD::SIGN_EXTEND:
  case ISD::FP_TO_SINT:
  case ISD::FP_TO_UINT:
  case ISD::FNEG:
  case ISD::FABS:
  case ISD::FMINNUM:
  case ISD::FMAXNUM:
  case ISD::FMINNUM_IEEE:
  case ISD::FMAXNUM_IEEE:
  case ISD::FMINIMUM:
  case ISD::FMAXIMUM:
  case ISD::FMINIMUMNUM:
  case ISD::FMAXIMUMNUM:
  case ISD::FCOPYSIGN:
  case ISD::FSQRT:
  case ISD::FSIN:
  case ISD::FCOS:
  case ISD::FTAN:
  case ISD::FASIN:
  case ISD::FACOS:
  case ISD::FATAN:
  case ISD::FATAN2:
  case ISD::FSINH:
  case ISD::FCOSH:
  case ISD::FTANH:
  case ISD::FLDEXP:
  case ISD::FPOWI:
  case ISD::FPOW:
  case ISD::FLOG:
  case ISD::FLOG2:
  case ISD::FLOG10:
  case ISD::FEXP:
  case ISD::FEXP2:
  case ISD::FEXP10:
  case ISD::FCEIL:
  case ISD::FTRUNC:
  case ISD::FRINT:
  case ISD::FNEARBYINT:
  case ISD::FROUND:
  case ISD::FROUNDEVEN:
  case ISD::FFLOOR:
  case ISD::FP_ROUND:
  case ISD::FP_EXTEND:
  case ISD::FPTRUNC_ROUND:
  case ISD::FMA:
  case ISD::SIGN_EXTEND_INREG:
  case ISD::ANY_EXTEND_VECTOR_INREG:
  case ISD::SIGN_EXTEND_VECTOR_INREG:
  case ISD::ZERO_EXTEND_VECTOR_INREG:
  case ISD::SMIN:
  case ISD::SMAX:
  case ISD::UMIN:
  case ISD::UMAX:
  case ISD::SMUL_LOHI:
  case ISD::UMUL_LOHI:
  case ISD::SADDO:
  case ISD::UADDO:
  case ISD::SSUBO:
  case ISD::USUBO:
  case ISD::SMULO:
  case ISD::UMULO:
  case ISD::FCANONICALIZE:
  case ISD::FFREXP:
  case ISD::FMODF:
  case ISD::FSINCOS:
  case ISD::FSINCOSPI:
  case ISD::SADDSAT:
  case ISD::UADDSAT:
  case ISD::SSUBSAT:
  case ISD::USUBSAT:
  case ISD::SSHLSAT:
  case ISD::USHLSAT:
  case ISD::FP_TO_SINT_SAT:
  case ISD::FP_TO_UINT_SAT:
  case ISD::MGATHER:
  case ISD::VECTOR_COMPRESS:
  case ISD::SCMP:
  case ISD::UCMP:
    Action = TLI.getOperationAction(Node->getOpcode(), Node->getValueType(0));
    break;
  // Fixed-point operations: the scale (constant operand 2) is part of the
  // query.
  case ISD::SMULFIX:
  case ISD::SMULFIXSAT:
  case ISD::UMULFIX:
  case ISD::UMULFIXSAT:
  case ISD::SDIVFIX:
  case ISD::SDIVFIXSAT:
  case ISD::UDIVFIX:
  case ISD::UDIVFIXSAT: {
    unsigned Scale = Node->getConstantOperandVal(2);
    Action = TLI.getFixedPointOperationAction(Node->getOpcode(),
                                              Node->getValueType(0), Scale);
    break;
  }
  // Operations whose action is looked up with the type of operand 0 instead
  // of the result type.
  case ISD::LROUND:
  case ISD::LLROUND:
  case ISD::LRINT:
  case ISD::LLRINT:
  case ISD::SINT_TO_FP:
  case ISD::UINT_TO_FP:
  case ISD::VECREDUCE_ADD:
  case ISD::VECREDUCE_MUL:
  case ISD::VECREDUCE_AND:
  case ISD::VECREDUCE_OR:
  case ISD::VECREDUCE_XOR:
  case ISD::VECREDUCE_SMAX:
  case ISD::VECREDUCE_SMIN:
  case ISD::VECREDUCE_UMAX:
  case ISD::VECREDUCE_UMIN:
  case ISD::VECREDUCE_FADD:
  case ISD::VECREDUCE_FMAX:
  case ISD::VECREDUCE_FMAXIMUM:
  case ISD::VECREDUCE_FMIN:
  case ISD::VECREDUCE_FMINIMUM:
  case ISD::VECREDUCE_FMUL:
  case ISD::VECTOR_FIND_LAST_ACTIVE:
    Action = TLI.getOperationAction(Node->getOpcode(),
                                    Node->getOperand(0).getValueType());
    break;
  // Sequential reductions: the action is looked up with the type of
  // operand 1.
  case ISD::VECREDUCE_SEQ_FADD:
  case ISD::VECREDUCE_SEQ_FMUL:
    Action = TLI.getOperationAction(Node->getOpcode(),
                                    Node->getOperand(1).getValueType());
    break;
  case ISD::SETCC: {
    // Check the condition code (operand 2) on the type of operand 0 first;
    // the operation itself is only queried if the condition code is legal.
    MVT OpVT = Node->getOperand(0).getSimpleValueType();
    ISD::CondCode CCCode = cast<CondCodeSDNode>(Node->getOperand(2))->get();
    Action = TLI.getCondCodeAction(CCCode, OpVT);
    if (Action == TargetLowering::Legal)
      Action = TLI.getOperationAction(Node->getOpcode(), OpVT);
    break;
  }
  // Partial reductions are queried with both the result type and the type of
  // operand 1.
  case ISD::PARTIAL_REDUCE_UMLA:
  case ISD::PARTIAL_REDUCE_SMLA:
  case ISD::PARTIAL_REDUCE_SUMLA:
    Action =
        TLI.getPartialReduceMLAAction(Op.getOpcode(), Node->getValueType(0),
                                      Node->getOperand(1).getValueType());
    break;

  // The macro below produces one case per VP opcode registered in
  // VPIntrinsics.def. LEGALPOS selects the type used for the query: a negative
  // value picks result number -(1 + LEGALPOS), any other value picks the type
  // of operand LEGALPOS. VP_SETCC additionally checks its condition code
  // first and stops if that is not legal.
#define BEGIN_REGISTER_VP_SDNODE(VPID, LEGALPOS, ...)                          \
  case ISD::VPID: {                                                            \
    EVT LegalizeVT = LEGALPOS < 0 ? Node->getValueType(-(1 + LEGALPOS))        \
                                  : Node->getOperand(LEGALPOS).getValueType(); \
    if (ISD::VPID == ISD::VP_SETCC) {                                          \
      ISD::CondCode CCCode = cast<CondCodeSDNode>(Node->getOperand(2))->get(); \
      Action = TLI.getCondCodeAction(CCCode, LegalizeVT.getSimpleVT());        \
      if (Action != TargetLowering::Legal)                                     \
        break;                                                                 \
    }                                                                          \
    /* Defer non-vector results to LegalizeDAG. */                             \
    if (!Node->getValueType(0).isVector() &&                                   \
        Node->getValueType(0) != MVT::Other) {                                 \
      Action = TargetLowering::Legal;                                          \
      break;                                                                   \
    }                                                                          \
    Action = TLI.getOperationAction(Node->getOpcode(), LegalizeVT);            \
  } break;
#include "llvm/IR/VPIntrinsics.def"
  }

  LLVM_DEBUG(dbgs() << "\nLegalizing vector op: "; Node->dump(&DAG));

  // Carry out the action. Replacement values, if any, end up in ResultVals.
  SmallVector<SDValue, 8> ResultVals;
  switch (Action) {
  default: llvm_unreachable("This action is not supported yet!");
  case TargetLowering::Promote:
    assert((Op.getOpcode() != ISD::LOAD && Op.getOpcode() != ISD::STORE) &&
           "This action is not supported yet!");
    LLVM_DEBUG(dbgs() << "Promoting\n");
    Promote(Node, ResultVals);
    assert(!ResultVals.empty() && "No results for promotion?");
    break;
  case TargetLowering::Legal:
    LLVM_DEBUG(dbgs() << "Legal node: nothing to do\n");
    break;
  case TargetLowering::Custom:
    LLVM_DEBUG(dbgs() << "Trying custom legalization\n");
    if (LowerOperationWrapper(Node, ResultVals))
      break;
    // The target declined; continue with the default expansion.
    LLVM_DEBUG(dbgs() << "Could not custom legalize node\n");
    [[fallthrough]];
  case TargetLowering::Expand:
    LLVM_DEBUG(dbgs() << "Expanding\n");
    Expand(Node, ResultVals);
    break;
  }

  // No replacement values were produced: the node is kept as is.
  if (ResultVals.empty())
    return TranslateLegalizeResults(Op, Node);

  // The node was replaced; the replacement has to be legalized in turn.
  Changed = true;
  return RecursivelyLegalizeResults(Op, ResultVals);
}


// FIXME: This is very similar to TargetLowering::LowerOperationWrapper. Can we

// merge them somehow?

/// Run the target's LowerOperation on \p Node and collect the replacement
/// values in \p Results.
///
/// Returns false if LowerOperation returned a null value, true otherwise.
/// \p Results is left empty when LowerOperation returned the node itself.
bool VectorLegalizer::LowerOperationWrapper(SDNode *Node,
                                            SmallVectorImpl<SDValue> &Results) {
  const SDValue Input(Node, 0);
  SDValue Lowered = TLI.LowerOperation(Input, DAG);

  // A null value means the target did not lower the node.
  if (!Lowered.getNode())
    return false;

  // The input came back unchanged: success, but nothing to replace.
  if (Lowered == Input)
    return true;

  const unsigned NumVals = Node->getNumValues();

  // For a single-result node the value returned by LowerOperation is taken
  // as is. It might not be result number 0.
  if (NumVals == 1) {
    Results.push_back(Lowered);
    return true;
  }

  // For a multi-result node the returned node has to provide the same number
  // of results.
  assert((NumVals == Lowered->getNumValues()) &&
         "Lowering returned the wrong number of results!");

  // Hand back the new values ordered by the result number of the original.
  for (unsigned ResNo = 0; ResNo != NumVals; ++ResNo)
    Results.push_back(Lowered.getValue(ResNo));

  return true;
}


/// Promote a SETCC / VP_SETCC by extending the two compared operands to the
/// type the target asks for and re-emitting the comparison on that type with
/// the original result type.
void VectorLegalizer::PromoteSETCC(SDNode *Node,
                                   SmallVectorImpl<SDValue> &Results) {
  const unsigned Opcode = Node->getOpcode();
  MVT SrcVT = Node->getOperand(0).getSimpleValueType();
  MVT WideVT = TLI.getTypeToPromoteTo(Opcode, SrcVT);

  // Floating-point operands are FP-extended, everything else any-extended.
  unsigned WidenOpc = ISD::ANY_EXTEND;
  if (SrcVT.isFloatingPoint())
    WidenOpc = ISD::FP_EXTEND;

  SDLoc DL(Node);
  SmallVector<SDValue, 5> NewOps(Node->getNumOperands());

  // Operands 0 and 1 are the values being compared.
  for (unsigned Idx = 0; Idx != 2; ++Idx)
    NewOps[Idx] = DAG.getNode(WidenOpc, DL, WideVT, Node->getOperand(Idx));
  // Operand 2 is carried over as is.
  NewOps[2] = Node->getOperand(2);

  if (Opcode == ISD::VP_SETCC) {
    NewOps[3] = Node->getOperand(3); // mask
    NewOps[4] = Node->getOperand(4); // evl
  }

  Results.push_back(DAG.getNode(Opcode, DL, Node->getSimpleValueType(0),
                                NewOps, Node->getFlags()));
}


/// Promote a strict floating-point operation: every vector operand (other
/// than a VP mask) goes through STRICT_FP_EXTEND, the operation is redone on
/// the promoted type, and the result goes through STRICT_FP_ROUND back to the
/// original type. Pushes the rounded value and its chain onto \p Results.
void VectorLegalizer::PromoteSTRICT(SDNode *Node,
                                    SmallVectorImpl<SDValue> &Results) {
  const unsigned Opcode = Node->getOpcode();
  const unsigned NumOps = Node->getNumOperands();

  MVT SrcVT = Node->getOperand(1).getSimpleValueType();
  MVT WideVT = TLI.getTypeToPromoteTo(Opcode, SrcVT);

  assert(SrcVT.isFloatingPoint());

  SDLoc DL(Node);
  SmallVector<SDValue, 5> NewOps(NumOps);
  SmallVector<SDValue, 2> ExtChains;

  // Operand 0 is the incoming chain; it is filled in after the loop.
  for (unsigned Idx = 1; Idx != NumOps; ++Idx) {
    SDValue Orig = Node->getOperand(Idx);
    const bool NeedsExtend =
        Orig.getValueType().isVector() &&
        !(ISD::isVPOpcode(Opcode) && ISD::getVPMaskIdx(Opcode) == Idx);
    if (!NeedsExtend) {
      // Non-vector operands and the VP mask are taken over unchanged.
      NewOps[Idx] = Orig;
      continue;
    }

    // Extend the vector operand, chained to the original incoming chain.
    SDValue Ext = DAG.getNode(ISD::STRICT_FP_EXTEND, DL, {WideVT, MVT::Other},
                              {Node->getOperand(0), Orig});
    NewOps[Idx] = Ext.getValue(0);
    ExtChains.push_back(Ext.getValue(1));
  }

  SDVTList VTs = DAG.getVTList(WideVT, Node->getValueType(1));

  // The promoted operation is chained after all of the extends.
  NewOps[0] = DAG.getNode(ISD::TokenFactor, DL, MVT::Other, ExtChains);

  SDValue Wide = DAG.getNode(Opcode, DL, VTs, NewOps, Node->getFlags());

  SDValue Rounded =
      DAG.getNode(ISD::STRICT_FP_ROUND, DL, {SrcVT, MVT::Other},
                  {Wide.getValue(1), Wide.getValue(0),
                   DAG.getIntPtrConstant(0, DL, /*isTarget=*/true)});

  Results.push_back(Rounded.getValue(0));
  Results.push_back(Rounded.getValue(1));
}


/// Promote a floating-point vector reduction: FP_EXTEND the input vector to
/// the promoted type, reduce there, and FP_ROUND the scalar back to the
/// original result type. \p NonArithmetic is passed on as the constant
/// operand of the FP_ROUND.
void VectorLegalizer::PromoteFloatVECREDUCE(SDNode *Node,
                                            SmallVectorImpl<SDValue> &Results,
                                            bool NonArithmetic) {
  const unsigned Opcode = Node->getOpcode();
  SDValue Src = Node->getOperand(0);

  MVT SrcVT = Src.getSimpleValueType();
  assert(SrcVT.isFloatingPoint() && "Expected floating point reduction!");
  MVT WideVT = TLI.getTypeToPromoteTo(Opcode, SrcVT);

  SDLoc DL(Node);
  SDValue WideSrc = DAG.getNode(ISD::FP_EXTEND, DL, WideVT, Src);
  SDValue WideRdx = DAG.getNode(Opcode, DL, WideVT.getVectorElementType(),
                                WideSrc, Node->getFlags());
  SDValue RoundFlag =
      DAG.getIntPtrConstant(NonArithmetic, DL, /*isTarget=*/true);
  Results.push_back(DAG.getNode(ISD::FP_ROUND, DL, Node->getValueType(0),
                                WideRdx, RoundFlag));
}


/// Promote \p Node to the type the target asks for and push the replacement
/// onto \p Results. Opcodes with a dedicated promotion routine are forwarded
/// to it; all others are handled generically by converting the vector
/// operands, redoing the operation on the promoted type and converting the
/// result back.
void VectorLegalizer::Promote(SDNode *Node, SmallVectorImpl<SDValue> &Results) {
  const unsigned Opcode = Node->getOpcode();

  // A few operations have their own notion of promotion; dispatch those
  // first.
  switch (Opcode) {
  case ISD::SINT_TO_FP:
  case ISD::UINT_TO_FP:
  case ISD::STRICT_SINT_TO_FP:
  case ISD::STRICT_UINT_TO_FP:
    // Promoted by extending the integer operand.
    PromoteINT_TO_FP(Node, Results);
    return;
  case ISD::FP_TO_UINT:
  case ISD::FP_TO_SINT:
  case ISD::STRICT_FP_TO_UINT:
  case ISD::STRICT_FP_TO_SINT:
    // Handled by the dedicated FP_TO_INT promotion routine.
    PromoteFP_TO_INT(Node, Results);
    return;
  case ISD::VP_SETCC:
  case ISD::SETCC:
    // Promoted by extending the compared operands.
    PromoteSETCC(Node, Results);
    return;
  case ISD::STRICT_FADD:
  case ISD::STRICT_FSUB:
  case ISD::STRICT_FMUL:
  case ISD::STRICT_FDIV:
  case ISD::STRICT_FSQRT:
  case ISD::STRICT_FMA:
    PromoteSTRICT(Node, Results);
    return;
  case ISD::VECREDUCE_FADD:
    PromoteFloatVECREDUCE(Node, Results, /*NonArithmetic=*/false);
    return;
  case ISD::VECREDUCE_FMAX:
  case ISD::VECREDUCE_FMAXIMUM:
  case ISD::VECREDUCE_FMIN:
  case ISD::VECREDUCE_FMINIMUM:
    PromoteFloatVECREDUCE(Node, Results, /*NonArithmetic=*/true);
    return;
  case ISD::FP_ROUND:
  case ISD::FP_EXTEND:
    // Promotion is built out of these operations, so they cannot be promoted
    // themselves.
    llvm_unreachable("Don't know how to promote this operation!");
  case ISD::VP_FABS:
  case ISD::VP_FCOPYSIGN:
  case ISD::VP_FNEG:
    // Promoting fabs, fneg, and fcopysign changes their semantics.
    llvm_unreachable("These operations should not be promoted");
  }

  // Generic vector promotion currently comes in two flavours:
  // 1) Bitcasting a vector of integers to a different vector type of the same
  //    overall length. For example, x86 promotes ISD::AND v2i32 to v1i64.
  // 2) Extending a vector of floats to a vector with the same number of
  //    larger floats. For example, AArch64 promotes ISD::FADD on v4f16 to
  //    v4f32.
  assert(Node->getNumValues() == 1 &&
         "Can't promote a vector with multiple results!");
  MVT VT = Node->getSimpleValueType(0);
  MVT NVT = TLI.getTypeToPromoteTo(Opcode, VT);
  SDLoc DL(Node);

  const bool IsVP = ISD::isVPOpcode(Opcode);
  const unsigned NumOps = Node->getNumOperands();
  SmallVector<SDValue, 4> NewOps(NumOps);

  for (unsigned Idx = 0; Idx != NumOps; ++Idx) {
    SDValue Orig = Node->getOperand(Idx);
    EVT OrigVT = Orig.getValueType();

    // The mask operand of a VP op is never promoted; neither are non-vector
    // operands.
    const bool IsVPMask = IsVP && ISD::getVPMaskIdx(Opcode) == Idx;
    if (!OrigVT.isVector() || IsVPMask) {
      NewOps[Idx] = Orig;
      continue;
    }

    // Float-to-float promotion extends, anything else is a bitcast.
    const bool ExtendFP = OrigVT.getVectorElementType().isFloatingPoint() &&
                          NVT.isVector() &&
                          NVT.getVectorElementType().isFloatingPoint();
    if (!ExtendFP) {
      NewOps[Idx] = DAG.getNode(ISD::BITCAST, DL, NVT, Orig);
      continue;
    }

    if (IsVP) {
      unsigned EVLIdx = *ISD::getVPExplicitVectorLengthIdx(Opcode);
      unsigned MaskIdx = *ISD::getVPMaskIdx(Opcode);
      NewOps[Idx] =
          DAG.getNode(ISD::VP_FP_EXTEND, DL, NVT, Orig,
                      Node->getOperand(MaskIdx), Node->getOperand(EVLIdx));
    } else {
      NewOps[Idx] = DAG.getNode(ISD::FP_EXTEND, DL, NVT, Orig);
    }
  }

  SDValue Res = DAG.getNode(Opcode, DL, NVT, NewOps, Node->getFlags());

  // Convert the result back: round for float-to-float promotion, bitcast
  // otherwise.
  const bool RoundFP =
      (VT.isFloatingPoint() && NVT.isFloatingPoint()) ||
      (VT.isVector() && VT.getVectorElementType().isFloatingPoint() &&
       NVT.isVector() && NVT.getVectorElementType().isFloatingPoint());
  if (!RoundFP) {
    Res = DAG.getNode(ISD::BITCAST, DL, VT, Res);
  } else if (IsVP) {
    unsigned EVLIdx = *ISD::getVPExplicitVectorLengthIdx(Opcode);
    unsigned MaskIdx = *ISD::getVPMaskIdx(Opcode);
    Res = DAG.getNode(ISD::VP_FP_ROUND, DL, VT, Res,
                      Node->getOperand(MaskIdx), Node->getOperand(EVLIdx));
  } else {
    Res = DAG.getNode(ISD::FP_ROUND, DL, VT, Res,
                      DAG.getIntPtrConstant(0, DL, /*isTarget=*/true));
  }

  Results.push_back(Res);
}


void VectorLegalizer::PromoteINT_TO_FP(SDNode *Node,
                                       SmallVectorImpl<SDValue> &Results) {
  // The integer input of an INT_TO_FP may need widening even when its type is
  // otherwise legal, so promotion here extends the vector operands instead of
  // bitcasting them.
  const unsigned Opcode = Node->getOpcode();
  const bool IsStrict = Node->isStrictFPOpcode();

  // For strict opcodes the converted value is operand 1 rather than operand 0.
  MVT VT = Node->getOperand(IsStrict ? 1 : 0).getSimpleValueType();
  MVT NVT = TLI.getTypeToPromoteTo(Opcode, VT);
  assert(NVT.getVectorNumElements() == VT.getVectorNumElements() &&
         "Vectors have different number of elements!");

  // Unsigned conversions are widened with a zero extension, all others with a
  // sign extension.
  const bool IsUnsigned =
      Opcode == ISD::UINT_TO_FP || Opcode == ISD::STRICT_UINT_TO_FP;
  const unsigned ExtOpc = IsUnsigned ? ISD::ZERO_EXTEND : ISD::SIGN_EXTEND;

  SDLoc dl(Node);
  const unsigned NumOps = Node->getNumOperands();
  SmallVector<SDValue, 4> Operands;
  Operands.reserve(NumOps);
  for (unsigned Idx = 0; Idx != NumOps; ++Idx) {
    SDValue Op = Node->getOperand(Idx);
    // Only vector operands are extended; anything else is passed through.
    if (Op.getValueType().isVector())
      Op = DAG.getNode(ExtOpc, dl, NVT, Op);
    Operands.push_back(Op);
  }

  // Non-strict form: a single result of the original result type.
  if (!IsStrict) {
    Results.push_back(
        DAG.getNode(Opcode, dl, Node->getValueType(0), Operands));
    return;
  }

  // Strict form: the rebuilt node also produces an MVT::Other value, which is
  // reported as the second result.
  SDValue Strict = DAG.getNode(Opcode, dl,
                               {Node->getValueType(0), MVT::Other}, Operands);
  Results.push_back(Strict);
  Results.push_back(Strict.getValue(1));
}


// For FP_TO_INT we promote the result type to a vector type with wider

// elements and then truncate the result.  This is different from the default

// PromoteVector which uses bitcast to promote thus assuming that the

// promoted vector type has the same overall size.

void VectorLegalizer::PromoteFP_TO_INT(SDNode *Node,
                                       SmallVectorImpl<SDValue> &Results) {
  const unsigned OrigOpc = Node->getOpcode();
  MVT VT = Node->getSimpleValueType(0);
  MVT NVT = TLI.getTypeToPromoteTo(OrigOpc, VT);
  const bool IsStrict = Node->isStrictFPOpcode();
  assert(NVT.getVectorNumElements() == VT.getVectorNumElements() &&
         "Vectors have different number of elements!");

  // Switch an unsigned conversion to its signed counterpart when the target
  // reports the signed one as legal or custom on the promoted type.
  // TODO: Should we only do this if FP_TO_UINT itself isn't legal?
  unsigned ConvOpc = OrigOpc;
  if (ConvOpc == ISD::FP_TO_UINT &&
      TLI.isOperationLegalOrCustom(ISD::FP_TO_SINT, NVT))
    ConvOpc = ISD::FP_TO_SINT;
  else if (ConvOpc == ISD::STRICT_FP_TO_UINT &&
           TLI.isOperationLegalOrCustom(ISD::STRICT_FP_TO_SINT, NVT))
    ConvOpc = ISD::STRICT_FP_TO_SINT;

  // Perform the conversion in the wider type. The strict form also yields an
  // MVT::Other value that is handed back as the second result.
  SDLoc dl(Node);
  SDValue Wide, Chain;
  if (IsStrict) {
    Wide = DAG.getNode(ConvOpc, dl, {NVT, MVT::Other},
                       {Node->getOperand(0), Node->getOperand(1)});
    Chain = Wide.getValue(1);
  } else {
    Wide = DAG.getNode(ConvOpc, dl, NVT, Node->getOperand(0));
  }

  // Assert that the converted value fits in the original type.  If it doesn't
  // (eg: because the value being converted is too big), then the result of the
  // original operation was undefined anyway, so the assert is still correct.
  // The kind of assert follows the signedness of the *original* opcode.
  const bool WasUnsigned =
      OrigOpc == ISD::FP_TO_UINT || OrigOpc == ISD::STRICT_FP_TO_UINT;
  const unsigned AssertOpc = WasUnsigned ? ISD::AssertZext : ISD::AssertSext;
  Wide = DAG.getNode(AssertOpc, dl, NVT, Wide,
                     DAG.getValueType(VT.getScalarType()));

  // Narrow back to the requested result type.
  Results.push_back(DAG.getNode(ISD::TRUNCATE, dl, VT, Wide));
  if (IsStrict)
    Results.push_back(Chain);
}


std::pair<SDValue, SDValue> VectorLegalizer::ExpandLoad(SDNode *N) {
  // N must be a load node; the work is delegated to the target lowering's
  // vector-load scalarization and its pair of values is returned unchanged.
  return TLI.scalarizeVectorLoad(cast<LoadSDNode>(N), DAG);
}


SDValue VectorLegalizer::ExpandStore(SDNode *N) {
  // N must be a store node; the work is delegated to the target lowering's
  // vector-store scalarization and its result is returned unchanged.
  return TLI.scalarizeVectorStore(cast<StoreSDNode>(N), DAG);
}


// Expand a vector node by dispatching on its opcode.
//
// Each case either pushes the replacement value(s) onto Results and returns,
// or `break`s out of the switch. A case breaks when it has no dedicated
// expansion, or when its expansion helper returned a null SDValue. Everything
// that leaves the switch is unrolled with DAG.UnrollVectorOp at the bottom of
// the function.
//
// \param Node    The node to expand.
// \param Results Receives the replacement values for Node.
void VectorLegalizer::Expand(SDNode *Node, SmallVectorImpl<SDValue> &Results) {
  switch (Node->getOpcode()) {
  case ISD::LOAD: {
    // ExpandLoad yields a pair; both members are reported as results.
    std::pair<SDValue, SDValue> Tmp = ExpandLoad(Node);
    Results.push_back(Tmp.first);
    Results.push_back(Tmp.second);
    return;
  }
  case ISD::STORE:
    Results.push_back(ExpandStore(Node));
    return;
  case ISD::MERGE_VALUES:
    // Forward operand i as result i.
    for (unsigned i = 0, e = Node->getNumValues(); i != e; ++i)
      Results.push_back(Node->getOperand(i));
    return;
  case ISD::SIGN_EXTEND_INREG:
    if (SDValue Expanded = ExpandSEXTINREG(Node)) {
      Results.push_back(Expanded);
      return;
    }
    break;
  // The *_EXTEND_VECTOR_INREG helpers' results are pushed unconditionally.
  case ISD::ANY_EXTEND_VECTOR_INREG:
    Results.push_back(ExpandANY_EXTEND_VECTOR_INREG(Node));
    return;
  case ISD::SIGN_EXTEND_VECTOR_INREG:
    Results.push_back(ExpandSIGN_EXTEND_VECTOR_INREG(Node));
    return;
  case ISD::ZERO_EXTEND_VECTOR_INREG:
    Results.push_back(ExpandZERO_EXTEND_VECTOR_INREG(Node));
    return;
  case ISD::BSWAP:
    if (SDValue Expanded = ExpandBSWAP(Node)) {
      Results.push_back(Expanded);
      return;
    }
    break;
  case ISD::VP_BSWAP:
    Results.push_back(TLI.expandVPBSWAP(Node, DAG));
    return;
  case ISD::VSELECT:
    if (SDValue Expanded = ExpandVSELECT(Node)) {
      Results.push_back(Expanded);
      return;
    }
    break;
  case ISD::VP_SELECT:
    if (SDValue Expanded = ExpandVP_SELECT(Node)) {
      Results.push_back(Expanded);
      return;
    }
    break;
  case ISD::VP_SREM:
  case ISD::VP_UREM:
    if (SDValue Expanded = ExpandVP_REM(Node)) {
      Results.push_back(Expanded);
      return;
    }
    break;
  case ISD::VP_FNEG:
    if (SDValue Expanded = ExpandVP_FNEG(Node)) {
      Results.push_back(Expanded);
      return;
    }
    break;
  case ISD::VP_FABS:
    if (SDValue Expanded = ExpandVP_FABS(Node)) {
      Results.push_back(Expanded);
      return;
    }
    break;
  case ISD::VP_FCOPYSIGN:
    if (SDValue Expanded = ExpandVP_FCOPYSIGN(Node)) {
      Results.push_back(Expanded);
      return;
    }
    break;
  case ISD::SELECT:
    if (SDValue Expanded = ExpandSELECT(Node)) {
      Results.push_back(Expanded);
      return;
    }
    break;
  case ISD::SELECT_CC: {
    // For scalable result types, split SELECT_CC into a SETCC (operands 0 and
    // 1 compared with the condition code in operand 4) feeding a select
    // between operands 2 and 3. Other types break out and are unrolled.
    if (Node->getValueType(0).isScalableVector()) {
      EVT CondVT = TLI.getSetCCResultType(
          DAG.getDataLayout(), *DAG.getContext(), Node->getValueType(0));
      SDValue SetCC =
          DAG.getNode(ISD::SETCC, SDLoc(Node), CondVT, Node->getOperand(0),
                      Node->getOperand(1), Node->getOperand(4));
      Results.push_back(DAG.getSelect(SDLoc(Node), Node->getValueType(0), SetCC,
                                      Node->getOperand(2),
                                      Node->getOperand(3)));
      return;
    }
    break;
  }
  // These helpers append to Results themselves.
  case ISD::FP_TO_UINT:
    ExpandFP_TO_UINT(Node, Results);
    return;
  case ISD::UINT_TO_FP:
    ExpandUINT_TO_FLOAT(Node, Results);
    return;
  case ISD::FNEG:
    if (SDValue Expanded = ExpandFNEG(Node)) {
      Results.push_back(Expanded);
      return;
    }
    break;
  case ISD::FABS:
    if (SDValue Expanded = ExpandFABS(Node)) {
      Results.push_back(Expanded);
      return;
    }
    break;
  case ISD::FCOPYSIGN:
    if (SDValue Expanded = ExpandFCOPYSIGN(Node)) {
      Results.push_back(Expanded);
      return;
    }
    break;
  case ISD::FSUB:
    ExpandFSUB(Node, Results);
    return;
  case ISD::SETCC:
  case ISD::VP_SETCC:
    ExpandSETCC(Node, Results);
    return;
  // From here on most cases defer to a generic TargetLowering expansion and
  // fall back to unrolling when it returns a null value.
  case ISD::ABS:
    if (SDValue Expanded = TLI.expandABS(Node, DAG)) {
      Results.push_back(Expanded);
      return;
    }
    break;
  case ISD::ABDS:
  case ISD::ABDU:
    if (SDValue Expanded = TLI.expandABD(Node, DAG)) {
      Results.push_back(Expanded);
      return;
    }
    break;
  case ISD::AVGCEILS:
  case ISD::AVGCEILU:
  case ISD::AVGFLOORS:
  case ISD::AVGFLOORU:
    if (SDValue Expanded = TLI.expandAVG(Node, DAG)) {
      Results.push_back(Expanded);
      return;
    }
    break;
  case ISD::BITREVERSE:
    if (SDValue Expanded = ExpandBITREVERSE(Node)) {
      Results.push_back(Expanded);
      return;
    }
    break;
  case ISD::VP_BITREVERSE:
    if (SDValue Expanded = TLI.expandVPBITREVERSE(Node, DAG)) {
      Results.push_back(Expanded);
      return;
    }
    break;
  case ISD::CTPOP:
    if (SDValue Expanded = TLI.expandCTPOP(Node, DAG)) {
      Results.push_back(Expanded);
      return;
    }
    break;
  case ISD::VP_CTPOP:
    if (SDValue Expanded = TLI.expandVPCTPOP(Node, DAG)) {
      Results.push_back(Expanded);
      return;
    }
    break;
  case ISD::CTLZ:
  case ISD::CTLZ_ZERO_UNDEF:
    if (SDValue Expanded = TLI.expandCTLZ(Node, DAG)) {
      Results.push_back(Expanded);
      return;
    }
    break;
  case ISD::VP_CTLZ:
  case ISD::VP_CTLZ_ZERO_UNDEF:
    if (SDValue Expanded = TLI.expandVPCTLZ(Node, DAG)) {
      Results.push_back(Expanded);
      return;
    }
    break;
  case ISD::CTTZ:
  case ISD::CTTZ_ZERO_UNDEF:
    if (SDValue Expanded = TLI.expandCTTZ(Node, DAG)) {
      Results.push_back(Expanded);
      return;
    }
    break;
  case ISD::VP_CTTZ:
  case ISD::VP_CTTZ_ZERO_UNDEF:
    if (SDValue Expanded = TLI.expandVPCTTZ(Node, DAG)) {
      Results.push_back(Expanded);
      return;
    }
    break;
  case ISD::FSHL:
  case ISD::VP_FSHL:
  case ISD::FSHR:
  case ISD::VP_FSHR:
    if (SDValue Expanded = TLI.expandFunnelShift(Node, DAG)) {
      Results.push_back(Expanded);
      return;
    }
    break;
  case ISD::ROTL:
  case ISD::ROTR:
    if (SDValue Expanded = TLI.expandROT(Node, false /*AllowVectorOps*/, DAG)) {
      Results.push_back(Expanded);
      return;
    }
    break;
  case ISD::FMINNUM:
  case ISD::FMAXNUM:
    if (SDValue Expanded = TLI.expandFMINNUM_FMAXNUM(Node, DAG)) {
      Results.push_back(Expanded);
      return;
    }
    break;
  // Unlike FMINNUM/FMAXNUM above, the results of these two expansions are
  // pushed without a null check.
  case ISD::FMINIMUM:
  case ISD::FMAXIMUM:
    Results.push_back(TLI.expandFMINIMUM_FMAXIMUM(Node, DAG));
    return;
  case ISD::FMINIMUMNUM:
  case ISD::FMAXIMUMNUM:
    Results.push_back(TLI.expandFMINIMUMNUM_FMAXIMUMNUM(Node, DAG));
    return;
  case ISD::SMIN:
  case ISD::SMAX:
  case ISD::UMIN:
  case ISD::UMAX:
    if (SDValue Expanded = TLI.expandIntMINMAX(Node, DAG)) {
      Results.push_back(Expanded);
      return;
    }
    break;
  // The overflow-reporting arithmetic helpers append to Results themselves.
  case ISD::UADDO:
  case ISD::USUBO:
    ExpandUADDSUBO(Node, Results);
    return;
  case ISD::SADDO:
  case ISD::SSUBO:
    ExpandSADDSUBO(Node, Results);
    return;
  case ISD::UMULO:
  case ISD::SMULO:
    ExpandMULO(Node, Results);
    return;
  case ISD::USUBSAT:
  case ISD::SSUBSAT:
  case ISD::UADDSAT:
  case ISD::SADDSAT:
    if (SDValue Expanded = TLI.expandAddSubSat(Node, DAG)) {
      Results.push_back(Expanded);
      return;
    }
    break;
  case ISD::USHLSAT:
  case ISD::SSHLSAT:
    if (SDValue Expanded = TLI.expandShlSat(Node, DAG)) {
      Results.push_back(Expanded);
      return;
    }
    break;
  case ISD::FP_TO_SINT_SAT:
  case ISD::FP_TO_UINT_SAT:
    // Expand the saturating FP-to-int conversion if it is scalable to prevent
    // it from unrolling below. Fixed-length vectors break out and are unrolled.
    if (Node->getValueType(0).isScalableVector()) {
      if (SDValue Expanded = TLI.expandFP_TO_INT_SAT(Node, DAG)) {
        Results.push_back(Expanded);
        return;
      }
    }
    break;
  case ISD::SMULFIX:
  case ISD::UMULFIX:
    if (SDValue Expanded = TLI.expandFixedPointMul(Node, DAG)) {
      Results.push_back(Expanded);
      return;
    }
    break;
  case ISD::SMULFIXSAT:
  case ISD::UMULFIXSAT:
    // FIXME: We do not expand SMULFIXSAT/UMULFIXSAT here yet, not sure exactly
    // why. Maybe it results in worse codegen compared to the unroll for some
    // targets? This should probably be investigated. And if we still prefer to
    // unroll an explanation could be helpful.
    break;
  case ISD::SDIVFIX:
  case ISD::UDIVFIX:
    ExpandFixedPointDiv(Node, Results);
    return;
  case ISD::SDIVFIXSAT:
  case ISD::UDIVFIXSAT:
    // No dedicated expansion; unrolled below.
    break;
  // The macro below turns every DAG_INSTRUCTION entry of ConstrainedOps.def
  // into a `case ISD::STRICT_<name>:` label, so all of those opcodes share the
  // ExpandStrictFPOp handler that follows the include.
#define DAG_INSTRUCTION(NAME, NARG, ROUND_MODE, INTRINSIC, DAGN)               \
  case ISD::STRICT_##DAGN:
#include "llvm/IR/ConstrainedOps.def"
    ExpandStrictFPOp(Node, Results);
    return;
  case ISD::VECREDUCE_ADD:
  case ISD::VECREDUCE_MUL:
  case ISD::VECREDUCE_AND:
  case ISD::VECREDUCE_OR:
  case ISD::VECREDUCE_XOR:
  case ISD::VECREDUCE_SMAX:
  case ISD::VECREDUCE_SMIN:
  case ISD::VECREDUCE_UMAX:
  case ISD::VECREDUCE_UMIN:
  case ISD::VECREDUCE_FADD:
  case ISD::VECREDUCE_FMUL:
  case ISD::VECREDUCE_FMAX:
  case ISD::VECREDUCE_FMIN:
  case ISD::VECREDUCE_FMAXIMUM:
  case ISD::VECREDUCE_FMINIMUM:
    Results.push_back(TLI.expandVecReduce(Node, DAG));
    return;
  case ISD::PARTIAL_REDUCE_UMLA:
  case ISD::PARTIAL_REDUCE_SMLA:
  case ISD::PARTIAL_REDUCE_SUMLA:
    Results.push_back(TLI.expandPartialReduceMLA(Node, DAG));
    return;
  case ISD::VECREDUCE_SEQ_FADD:
  case ISD::VECREDUCE_SEQ_FMUL:
    Results.push_back(TLI.expandVecReduceSeq(Node, DAG));
    return;
  case ISD::SREM:
  case ISD::UREM:
    ExpandREM(Node, Results);
    return;
  case ISD::VP_MERGE:
    if (SDValue Expanded = ExpandVP_MERGE(Node)) {
      Results.push_back(Expanded);
      return;
    }
    break;
  case ISD::FREM:
    // Try a vector math library call first; unroll if that does not succeed.
    if (tryExpandVecMathCall(Node, RTLIB::REM_F32, RTLIB::REM_F64,
                             RTLIB::REM_F80, RTLIB::REM_F128,
                             RTLIB::REM_PPCF128, Results))
      return;

    break;
  case ISD::FSINCOS:
  case ISD::FSINCOSPI: {
    // Pick the libcall from the element type and try to expand to it; unroll
    // if the libcall expansion reports failure.
    EVT VT = Node->getValueType(0).getVectorElementType();
    RTLIB::Libcall LC = Node->getOpcode() == ISD::FSINCOS
                            ? RTLIB::getSINCOS(VT)
                            : RTLIB::getSINCOSPI(VT);
    if (DAG.expandMultipleResultFPLibCall(LC, Node, Results))
      return;
    break;
  }
  case ISD::FMODF: {
    RTLIB::Libcall LC =
        RTLIB::getMODF(Node->getValueType(0).getVectorElementType());
    if (DAG.expandMultipleResultFPLibCall(LC, Node, Results,
                                          /*CallRetResNo=*/0))
      return;
    break;
  }
  case ISD::VECTOR_COMPRESS:
    Results.push_back(TLI.expandVECTOR_COMPRESS(Node, DAG));
    return;
  case ISD::VECTOR_FIND_LAST_ACTIVE:
    Results.push_back(TLI.expandVectorFindLastActive(Node, DAG));
    return;
  case ISD::SCMP:
  case ISD::UCMP:
    Results.push_back(TLI.expandCMP(Node, DAG));
    return;

  // For these FP operations try expandVectorNaryOpBySplitting before
  // resorting to a full unroll.
  case ISD::FADD:
  case ISD::FMUL:
  case ISD::FMA:
  case ISD::FDIV:
  case ISD::FCEIL:
  case ISD::FFLOOR:
  case ISD::FNEARBYINT:
  case ISD::FRINT:
  case ISD::FROUND:
  case ISD::FROUNDEVEN:
  case ISD::FTRUNC:
  case ISD::FSQRT:
    if (SDValue Expanded = TLI.expandVectorNaryOpBySplitting(Node, DAG)) {
      Results.push_back(Expanded);
      return;
    }
    break;
  }

  // Fallback for everything that left the switch: unroll the vector op. For a
  // multi-result node every value of the unrolled node is reported, in order.
  SDValue Unrolled = DAG.UnrollVectorOp(Node);
  if (Node->getNumValues() == 1) {
    Results.push_back(Unrolled);
  } else {
    assert(Node->getNumValues() == Unrolled->getNumValues() &&
      "VectorLegalizer Expand returned wrong number of results!");
    for (unsigned I = 0, E = Unrolled->getNumValues(); I != E; ++I)
      Results.push_back(Unrolled.getValue(I));
  }
}


SDValue VectorLegalizer::ExpandSELECT(SDNode *Node) {
  // Handles a select whose condition is a scalar and whose operands are
  // vectors. The condition is turned into an all-ones / all-zero integer
  // element, broadcast across a vector, and the result is formed with
  // AND / NOT / OR on the integer-typed operands.
  SDLoc DL(Node);
  EVT VT = Node->getValueType(0);

  SDValue Mask = Node->getOperand(0);
  SDValue Op1 = Node->getOperand(1);
  SDValue Op2 = Node->getOperand(2);

  assert(VT.isVector() && !Mask.getValueType().isVector()
         && Op1.getValueType() == Op2.getValueType() && "Invalid type");

  // Returns true when the target's action for Opc on VT is Expand.
  auto MustExpand = [&](unsigned Opc) {
    return TLI.getOperationAction(Opc, VT) == TargetLowering::Expand;
  };

  // Without the basic vector AND/XOR/OR the op has to be scalarized by the
  // caller (signalled by a null result). A 'promoted' operation is acceptable
  // since that means it is bitcasted to another type which is handled. We
  // must also be able to build the splat: BUILD_VECTOR for fixed-length
  // vectors, SPLAT_VECTOR otherwise.
  // FIXME: Should we also permit fixed-length SPLAT_VECTOR as a fallback to
  // BUILD_VECTOR?
  if (MustExpand(ISD::AND) || MustExpand(ISD::XOR) || MustExpand(ISD::OR) ||
      MustExpand(VT.isFixedLengthVector() ? ISD::BUILD_VECTOR
                                          : ISD::SPLAT_VECTOR))
    return SDValue();

  // Integer vector type used for the mask, and its element type.
  EVT IntVT = VT.changeVectorElementTypeToInteger();
  EVT EltVT = IntVT.getScalarType();

  // Scalar mask element: all ones if the condition holds, zero otherwise.
  SDValue EltMask =
      DAG.getSelect(DL, EltVT, Mask, DAG.getAllOnesConstant(DL, EltVT),
                    DAG.getConstant(0, DL, EltVT));

  // Broadcast it so that the entire vector is all one or all zero.
  SDValue VecMask = DAG.getSplat(IntVT, DL, EltMask);

  // The mask is a vector of integers, so the operands are bitcast to the mask
  // type (this matters when selecting between FP vectors).
  SDValue IntOp1 = DAG.getNode(ISD::BITCAST, DL, IntVT, Op1);
  SDValue IntOp2 = DAG.getNode(ISD::BITCAST, DL, IntVT, Op2);

  SDValue InvMask = DAG.getNOT(DL, VecMask, IntVT);

  // (Op1 & Mask) | (Op2 & ~Mask), then back to the original result type.
  SDValue Kept1 = DAG.getNode(ISD::AND, DL, IntVT, IntOp1, VecMask);
  SDValue Kept2 = DAG.getNode(ISD::AND, DL, IntVT, IntOp2, InvMask);
  SDValue Blend = DAG.getNode(ISD::OR, DL, IntVT, Kept1, Kept2);
  return DAG.getNode(ISD::BITCAST, DL, Node->getValueType(0), Blend);
}


SDValue VectorLegalizer::ExpandSEXTINREG(SDNode *Node) {
  EVT VT = Node->getValueType(0);

  // The expansion is a SHL followed by an SRA; return a null value if the
  // target's action for either of them on VT is Expand.
  const bool ShiftsUsable =
      TLI.getOperationAction(ISD::SRA, VT) != TargetLowering::Expand &&
      TLI.getOperationAction(ISD::SHL, VT) != TargetLowering::Expand;
  if (!ShiftsUsable)
    return SDValue();

  SDLoc DL(Node);

  // Operand 1 carries the type being extended from; the shift amount is the
  // difference between the result and that type's scalar widths.
  EVT FromVT = cast<VTSDNode>(Node->getOperand(1))->getVT();
  unsigned WideBits = VT.getScalarSizeInBits();
  unsigned NarrowBits = FromVT.getScalarSizeInBits();
  SDValue ShiftAmt = DAG.getConstant(WideBits - NarrowBits, DL, VT);

  // Shift left, then arithmetic-shift right by the same amount.
  SDValue Shifted = DAG.getNode(ISD::SHL, DL, VT, Node->getOperand(0), ShiftAmt);
  return DAG.getNode(ISD::SRA, DL, VT, Shifted, ShiftAmt);
}


// Generic expansion of an in-register vector any-extend: shuffle the source
// lanes to the positions they occupy in the wider-element result, leave every
// other lane undef, and bitcast the shuffle to the result type.
SDValue VectorLegalizer::ExpandANY_EXTEND_VECTOR_INREG(SDNode *Node) {
  SDLoc DL(Node);
  EVT VT = Node->getValueType(0);
  SDValue Src = Node->getOperand(0);
  EVT SrcVT = Src.getValueType();

  const int NumElements = VT.getVectorNumElements();
  int NumSrcElements = SrcVT.getVectorNumElements();

  // *_EXTEND_VECTOR_INREG SrcVT can be smaller than VT - so insert the vector
  // into a larger vector type with the same element type, at index 0 of an
  // undef vector.
  if (SrcVT.bitsLE(VT)) {
    assert((VT.getSizeInBits() % SrcVT.getScalarSizeInBits()) == 0 &&
           "ANY_EXTEND_VECTOR_INREG vector size mismatch");
    NumSrcElements = VT.getSizeInBits() / SrcVT.getScalarSizeInBits();
    SrcVT = EVT::getVectorVT(*DAG.getContext(), SrcVT.getScalarType(),
                             NumSrcElements);
    Src = DAG.getInsertSubvector(DL, DAG.getUNDEF(SrcVT), Src, 0);
  }

  // Start from an all-undef (-1) mask.
  SmallVector<int, 16> ShuffleMask(NumSrcElements, -1);

  // Each result element spans ExtLaneScale source lanes; source lane i goes to
  // the first of those lanes, or the last one on big-endian targets.
  const int ExtLaneScale = NumSrcElements / NumElements;
  const int EndianOffset =
      DAG.getDataLayout().isBigEndian() ? ExtLaneScale - 1 : 0;
  for (int Lane = 0, Slot = EndianOffset; Lane < NumElements;
       ++Lane, Slot += ExtLaneScale)
    ShuffleMask[Slot] = Lane;

  SDValue Undef = DAG.getUNDEF(SrcVT);
  SDValue Shuffled = DAG.getVectorShuffle(SrcVT, DL, Src, Undef, ShuffleMask);
  return DAG.getNode(ISD::BITCAST, DL, VT, Shuffled);
}


SDValue VectorLegalizer::ExpandSIGN_EXTEND_VECTOR_INREG(SDNode *Node) {
  SDLoc DL(Node);
  EVT VT = Node->getValueType(0);
  SDValue Src = Node->getOperand(0);
  EVT SrcVT = Src.getValueType();

  // Start with an any-extend node, which can be legalized above when we
  // recurse through it.
  SDValue AnyExt = DAG.getNode(ISD::ANY_EXTEND_VECTOR_INREG, DL, VT, Src);

  // Produce the sign extension with a shift pair. Even if these shifts aren't
  // legal operations, they have a better chance of being legalized without
  // full scalarization than the sign extension does.
  const unsigned ExtraBits =
      VT.getScalarSizeInBits() - SrcVT.getScalarSizeInBits();
  SDValue ShiftAmount = DAG.getConstant(ExtraBits, DL, VT);
  SDValue ShiftedUp = DAG.getNode(ISD::SHL, DL, VT, AnyExt, ShiftAmount);
  return DAG.getNode(ISD::SRA, DL, VT, ShiftedUp, ShiftAmount);
}


// Generic expansion of an in-register vector zero-extend: shuffle the source
// lanes into the positions they occupy in the wider-element result, take all
// remaining lanes from a zero vector, and bitcast to the result type.
SDValue VectorLegalizer::ExpandZERO_EXTEND_VECTOR_INREG(SDNode *Node) {
  SDLoc DL(Node);
  EVT VT = Node->getValueType(0);
  SDValue Src = Node->getOperand(0);
  EVT SrcVT = Src.getValueType();

  const int NumElements = VT.getVectorNumElements();
  int NumSrcElements = SrcVT.getVectorNumElements();

  // *_EXTEND_VECTOR_INREG SrcVT can be smaller than VT - so insert the vector
  // into a larger vector type with the same element type, at index 0 of an
  // undef vector.
  if (SrcVT.bitsLE(VT)) {
    assert((VT.getSizeInBits() % SrcVT.getScalarSizeInBits()) == 0 &&
           "ZERO_EXTEND_VECTOR_INREG vector size mismatch");
    NumSrcElements = VT.getSizeInBits() / SrcVT.getScalarSizeInBits();
    SrcVT = EVT::getVectorVT(*DAG.getContext(), SrcVT.getScalarType(),
                             NumSrcElements);
    Src = DAG.getInsertSubvector(DL, DAG.getUNDEF(SrcVT), Src, 0);
  }

  // Zero vector that supplies every lane not taken from the source.
  SDValue Zero = DAG.getConstant(0, DL, SrcVT);

  // The shuffle's first input is Zero and its second is Src. Begin with the
  // identity mask 0..NumSrcElements-1, i.e. every lane taken from Zero.
  SmallVector<int, 16> ShuffleMask =
      llvm::to_vector<16>(llvm::seq<int>(0, NumSrcElements));

  // Each result element spans ExtLaneScale source lanes; redirect one lane per
  // result element (the first, or the last on big-endian targets) to lane i of
  // Src, which is index NumSrcElements + i in shuffle-mask numbering.
  const int ExtLaneScale = NumSrcElements / NumElements;
  const int EndianOffset =
      DAG.getDataLayout().isBigEndian() ? ExtLaneScale - 1 : 0;
  for (int Lane = 0, Slot = EndianOffset; Lane < NumElements;
       ++Lane, Slot += ExtLaneScale)
    ShuffleMask[Slot] = NumSrcElements + Lane;

  SDValue Shuffled = DAG.getVectorShuffle(SrcVT, DL, Zero, Src, ShuffleMask);
  return DAG.getNode(ISD::BITCAST, DL, VT, Shuffled);
}


// Appends to ShuffleMask the byte indices that reverse the bytes within each
// element of VT: for every element in order, its byte positions are emitted
// from the highest down to the lowest.
static void createBSWAPShuffleMask(EVT VT, SmallVectorImpl<int> &ShuffleMask) {
  const int BytesPerElt = VT.getScalarSizeInBits() / 8;
  const int NumElts = VT.getVectorNumElements();
  for (int Elt = 0; Elt != NumElts; ++Elt) {
    // Index of the first byte belonging to this element.
    const int FirstByte = Elt * BytesPerElt;
    for (int Byte = BytesPerElt; Byte-- > 0;)
      ShuffleMask.push_back(FirstByte + Byte);
  }
}


SDValue VectorLegalizer::ExpandBSWAP(SDNode *Node) {
  EVT VT = Node->getValueType(0);

  // The shuffle-based expansion is not available for scalable vectors; use
  // the generic TargetLowering expansion for them.
  if (VT.isScalableVector())
    return TLI.expandBSWAP(Node, DAG);

  // Describe the BSWAP as a shuffle over a vector of i8 with one lane per
  // byte of the original vector.
  SmallVector<int, 16> ByteMask;
  createBSWAPShuffleMask(VT, ByteMask);
  EVT ByteVT = EVT::getVectorVT(*DAG.getContext(), MVT::i8, ByteMask.size());

  // Preferred form: bitcast to bytes, shuffle, bitcast back - but only when
  // the target accepts this shuffle mask.
  if (TLI.isShuffleMaskLegal(ByteMask, ByteVT)) {
    SDLoc DL(Node);
    SDValue Bytes = DAG.getNode(ISD::BITCAST, DL, ByteVT, Node->getOperand(0));
    SDValue Undef = DAG.getUNDEF(ByteVT);
    SDValue Swapped = DAG.getVectorShuffle(ByteVT, DL, Bytes, Undef, ByteMask);
    return DAG.getNode(ISD::BITCAST, DL, VT, Swapped);
  }

  // If we have the appropriate vector bit operations, it is better to use them
  // than unrolling and expanding each component. Otherwise return a null
  // value so the caller unrolls.
  const bool HaveBitOps = TLI.isOperationLegalOrCustom(ISD::SHL, VT) &&
                          TLI.isOperationLegalOrCustom(ISD::SRL, VT) &&
                          TLI.isOperationLegalOrCustomOrPromote(ISD::AND, VT) &&
                          TLI.isOperationLegalOrCustomOrPromote(ISD::OR, VT);
  if (!HaveBitOps)
    return SDValue();

  return TLI.expandBSWAP(Node, DAG);
}


SDValue VectorLegalizer::ExpandBITREVERSE(SDNode *Node) {
  EVT VT = Node->getValueType(0);

  // We can't unroll or use shuffles for scalable vectors, so they always take
  // the generic TargetLowering expansion.
  if (VT.isScalableVector())
    return TLI.expandBITREVERSE(Node, DAG);

  // If we have the scalar operation, it's probably cheaper to unroll it; a
  // null result asks the caller to do so.
  if (TLI.isOperationLegalOrCustom(ISD::BITREVERSE, VT.getScalarType()))
    return SDValue();

  // True when VecVT has the shift and mask operations that the bitwise
  // expansion relies on.
  auto HasBitOps = [&](EVT VecVT) {
    return TLI.isOperationLegalOrCustom(ISD::SHL, VecVT) &&
           TLI.isOperationLegalOrCustom(ISD::SRL, VecVT) &&
           TLI.isOperationLegalOrCustomOrPromote(ISD::AND, VecVT) &&
           TLI.isOperationLegalOrCustomOrPromote(ISD::OR, VecVT);
  };

  // If the vector element width is a whole number of bytes (and more than one
  // byte), test if it's legal to BSWAP shuffle the bytes and then perform the
  // BITREVERSE on the byte vector. This greatly reduces the number of bit
  // shifts necessary.
  const unsigned EltBits = VT.getScalarSizeInBits();
  if (EltBits > 8 && (EltBits % 8) == 0) {
    SmallVector<int, 16> ByteSwapMask;
    createBSWAPShuffleMask(VT, ByteSwapMask);

    EVT ByteVT =
        EVT::getVectorVT(*DAG.getContext(), MVT::i8, ByteSwapMask.size());
    const bool ByteRouteOk =
        TLI.isShuffleMaskLegal(ByteSwapMask, ByteVT) &&
        (TLI.isOperationLegalOrCustom(ISD::BITREVERSE, ByteVT) ||
         HasBitOps(ByteVT));
    if (ByteRouteOk) {
      SDLoc DL(Node);
      SDValue Bytes =
          DAG.getNode(ISD::BITCAST, DL, ByteVT, Node->getOperand(0));
      SDValue Undef = DAG.getUNDEF(ByteVT);
      SDValue Swapped =
          DAG.getVectorShuffle(ByteVT, DL, Bytes, Undef, ByteSwapMask);
      SDValue Reversed = DAG.getNode(ISD::BITREVERSE, DL, ByteVT, Swapped);
      return DAG.getNode(ISD::BITCAST, DL, VT, Reversed);
    }
  }

  // If we have the appropriate vector bit operations, it is better to use them
  // than unrolling and expanding each component.
  if (HasBitOps(VT))
    return TLI.expandBITREVERSE(Node, DAG);

  // Otherwise unroll.
  return SDValue();
}


SDValue VectorLegalizer::ExpandVSELECT(SDNode *Node) {
  // Implement VSELECT in terms of XOR, AND, OR on platforms which do not
  // support blend natively. A null return means the caller must fall back.
  SDLoc DL(Node);

  SDValue Mask = Node->getOperand(0);
  SDValue TrueVal = Node->getOperand(1);
  SDValue FalseVal = Node->getOperand(2);

  // All the bitwise work is done in the mask's type.
  EVT MaskVT = Mask.getValueType();
  EVT ValVT = TrueVal.getValueType();

  // Returns true when the target's action for Opc on the mask type is Expand.
  auto MustExpand = [&](unsigned Opc) {
    return TLI.getOperationAction(Opc, MaskVT) == TargetLowering::Expand;
  };

  // If we can't even use the basic vector operations of AND,OR,XOR, we will
  // have to scalarize the op. Notice that the operation may be 'promoted'
  // which means that it is 'bitcasted' to another type which is handled.
  if (MustExpand(ISD::AND) || MustExpand(ISD::XOR) || MustExpand(ISD::OR))
    return SDValue();

  // This operation also isn't safe with AND, OR, XOR when the boolean type is
  // 0/1 and the select operands aren't also booleans, as we need an all-ones
  // vector constant to mask with.
  // FIXME: Sign extend 1 to all ones if that's legal on the target.
  auto BoolContents = TLI.getBooleanContents(ValVT);
  const bool MaskIsAllOnes =
      BoolContents == TargetLowering::ZeroOrNegativeOneBooleanContent;
  const bool BoolOperands =
      BoolContents == TargetLowering::ZeroOrOneBooleanContent &&
      ValVT.getVectorElementType() == MVT::i1;
  if (!MaskIsAllOnes && !BoolOperands)
    return SDValue();

  // If the mask and the type are different sizes, unroll the vector op. This
  // can occur when getSetCCResultType returns something that is different in
  // size from the operand types. For example, v4i8 = select v4i32, v4i8, v4i8.
  if (MaskVT.getSizeInBits() != TrueVal.getValueSizeInBits())
    return SDValue();

  // The mask is a vector of integers, so the operands are bitcast to the mask
  // type (this matters when selecting between FP vectors).
  SDValue IntTrue = DAG.getNode(ISD::BITCAST, DL, MaskVT, TrueVal);
  SDValue IntFalse = DAG.getNode(ISD::BITCAST, DL, MaskVT, FalseVal);

  SDValue InvMask = DAG.getNOT(DL, Mask, MaskVT);

  // (True & Mask) | (False & ~Mask), then back to the node's result type.
  SDValue KeptTrue = DAG.getNode(ISD::AND, DL, MaskVT, IntTrue, Mask);
  SDValue KeptFalse = DAG.getNode(ISD::AND, DL, MaskVT, IntFalse, InvMask);
  SDValue Blend = DAG.getNode(ISD::OR, DL, MaskVT, KeptTrue, KeptFalse);
  return DAG.getNode(ISD::BITCAST, DL, Node->getValueType(0), Blend);
}


SDValue VectorLegalizer::ExpandVP_SELECT(SDNode *Node) {
  // Implement VP_SELECT in terms of VP_XOR, VP_AND and VP_OR on platforms which
  // do not support it natively. A null return means the caller must fall back.
  SDLoc DL(Node);

  SDValue Mask = Node->getOperand(0);
  SDValue TrueVal = Node->getOperand(1);
  SDValue FalseVal = Node->getOperand(2);
  SDValue EVL = Node->getOperand(3);

  // All the bitwise work is done in the mask's type.
  EVT MaskVT = Mask.getValueType();

  // Returns true when the target's action for Opc on the mask type is Expand.
  auto MustExpand = [&](unsigned Opc) {
    return TLI.getOperationAction(Opc, MaskVT) == TargetLowering::Expand;
  };

  // If we can't even use the basic vector operations of
  // VP_AND,VP_OR,VP_XOR, we will have to scalarize the op.
  if (MustExpand(ISD::VP_AND) || MustExpand(ISD::VP_XOR) ||
      MustExpand(ISD::VP_OR))
    return SDValue();

  // This operation also isn't safe when the operands aren't also booleans.
  if (TrueVal.getValueType().getVectorElementType() != MVT::i1)
    return SDValue();

  // The all-ones vector doubles as the XOR operand that inverts the mask and
  // as the mask operand of every VP node built below.
  SDValue AllOnes = DAG.getAllOnesConstant(DL, MaskVT);
  SDValue InvMask =
      DAG.getNode(ISD::VP_XOR, DL, MaskVT, Mask, AllOnes, AllOnes, EVL);

  // (True & Mask) | (False & ~Mask)
  SDValue KeptTrue =
      DAG.getNode(ISD::VP_AND, DL, MaskVT, TrueVal, Mask, AllOnes, EVL);
  SDValue KeptFalse =
      DAG.getNode(ISD::VP_AND, DL, MaskVT, FalseVal, InvMask, AllOnes, EVL);
  return DAG.getNode(ISD::VP_OR, DL, MaskVT, KeptTrue, KeptFalse, AllOnes, EVL);
}


SDValue VectorLegalizer::ExpandVP_MERGE(SDNode *Node) {
  // VP_MERGE is rewritten as a full-length select: build a mask that is true
  // for vector indices below the EVL/pivot, AND it with the original mask, and
  // select between the true and false values with the combined mask.
  SDLoc DL(Node);

  SDValue Mask = Node->getOperand(0);
  SDValue TrueVal = Node->getOperand(1);
  SDValue FalseVal = Node->getOperand(2);
  SDValue EVL = Node->getOperand(3);

  EVT MaskVT = Mask.getValueType();

  // Vector of EVL-typed elements with the mask's element count; the index
  // vector and the splatted EVL both use this type.
  EVT EVLVecVT = EVT::getVectorVT(*DAG.getContext(), EVL.getValueType(),
                                  MaskVT.getVectorElementCount());

  // If we can't construct the EVL mask efficiently, it's better to unroll.
  // Fixed-length masks need BUILD_VECTOR; scalable ones need both STEP_VECTOR
  // and SPLAT_VECTOR.
  const bool CanBuildEVLMask =
      MaskVT.isFixedLengthVector()
          ? TLI.isOperationLegalOrCustom(ISD::BUILD_VECTOR, EVLVecVT)
          : (TLI.isOperationLegalOrCustom(ISD::STEP_VECTOR, EVLVecVT) &&
             TLI.isOperationLegalOrCustom(ISD::SPLAT_VECTOR, EVLVecVT));
  if (!CanBuildEVLMask)
    return SDValue();

  // If using a SETCC would result in a different type than the mask type,
  // unroll.
  EVT CmpVT = TLI.getSetCCResultType(DAG.getDataLayout(), *DAG.getContext(),
                                     EVLVecVT);
  if (CmpVT != MaskVT)
    return SDValue();

  // Lane i of the EVL mask is (i <u EVL).
  SDValue LaneIdx = DAG.getStepVector(DL, EVLVecVT);
  SDValue EVLSplat = DAG.getSplat(EVLVecVT, DL, EVL);
  SDValue BelowEVL =
      DAG.getSetCC(DL, MaskVT, LaneIdx, EVLSplat, ISD::CondCode::SETULT);

  SDValue Combined = DAG.getNode(ISD::AND, DL, MaskVT, Mask, BelowEVL);
  return DAG.getSelect(DL, Node->getValueType(0), Combined, TrueVal, FalseVal);
}


SDValue VectorLegalizer::ExpandVP_REM(SDNode *Node) {
  // Implement VP_SREM/UREM in terms of VP_SDIV/VP_UDIV, VP_MUL, VP_SUB.
  EVT VT = Node->getValueType(0);

  // Signed remainder uses the signed divide; otherwise the unsigned one.
  const bool IsSigned = Node->getOpcode() == ISD::VP_SREM;
  const unsigned DivOpc = IsSigned ? ISD::VP_SDIV : ISD::VP_UDIV;

  // All three building blocks must be legal or custom on VT; otherwise return
  // a null value.
  const bool CanExpand = TLI.isOperationLegalOrCustom(DivOpc, VT) &&
                         TLI.isOperationLegalOrCustom(ISD::VP_MUL, VT) &&
                         TLI.isOperationLegalOrCustom(ISD::VP_SUB, VT);
  if (!CanExpand)
    return SDValue();

  SDLoc DL(Node);

  SDValue X = Node->getOperand(0);
  SDValue Y = Node->getOperand(1);
  SDValue Mask = Node->getOperand(2);
  SDValue EVL = Node->getOperand(3);

  // X % Y -> X-X/Y*Y, with every step carrying the original mask and EVL.
  SDValue Quot = DAG.getNode(DivOpc, DL, VT, X, Y, Mask, EVL);
  SDValue Prod = DAG.getNode(ISD::VP_MUL, DL, VT, Y, Quot, Mask, EVL);
  return DAG.getNode(ISD::VP_SUB, DL, VT, X, Prod, Mask, EVL);
}


SDValue VectorLegalizer::ExpandVP_FNEG(SDNode *Node) {
  // Expand VP_FNEG as a VP_XOR of the integer-bitcast operand with a per-element
  // sign-mask constant. Returns a null value when VP_XOR is not legal or custom
  // on the integer type.
  EVT VT = Node->getValueType(0);
  EVT IntVT = VT.changeVectorElementTypeToInteger();

  if (!TLI.isOperationLegalOrCustom(ISD::VP_XOR, IntVT))
    return SDValue();

  SDValue Mask = Node->getOperand(1);
  SDValue EVL = Node->getOperand(2);

  SDLoc DL(Node);
  SDValue AsInt = DAG.getNode(ISD::BITCAST, DL, IntVT, Node->getOperand(0));

  // Constant with only the sign bit of each element set.
  const APInt SignBit = APInt::getSignMask(IntVT.getScalarSizeInBits());
  SDValue SignMask = DAG.getConstant(SignBit, DL, IntVT);

  SDValue Flipped =
      DAG.getNode(ISD::VP_XOR, DL, IntVT, AsInt, SignMask, Mask, EVL);
  return DAG.getNode(ISD::BITCAST, DL, VT, Flipped);
}


SDValue VectorLegalizer::ExpandVP_FABS(SDNode *Node) {
  // Expand VP_FABS as a VP_AND of the integer-bitcast operand with a constant
  // holding the signed-max value of each element (every bit but the sign bit).
  // Returns a null value when VP_AND is not legal or custom on the integer
  // type.
  EVT VT = Node->getValueType(0);
  EVT IntVT = VT.changeVectorElementTypeToInteger();

  if (!TLI.isOperationLegalOrCustom(ISD::VP_AND, IntVT))
    return SDValue();

  SDValue Mask = Node->getOperand(1);
  SDValue EVL = Node->getOperand(2);

  SDLoc DL(Node);
  SDValue AsInt = DAG.getNode(ISD::BITCAST, DL, IntVT, Node->getOperand(0));

  const APInt NonSignBits =
      APInt::getSignedMaxValue(IntVT.getScalarSizeInBits());
  SDValue ClearSignMask = DAG.getConstant(NonSignBits, DL, IntVT);

  SDValue Magnitude =
      DAG.getNode(ISD::VP_AND, DL, IntVT, AsInt, ClearSignMask, Mask, EVL);
  return DAG.getNode(ISD::BITCAST, DL, VT, Magnitude);
}


SDValue VectorLegalizer::ExpandVP_FCOPYSIGN(SDNode *Node) {
  // Expand VP_FCOPYSIGN with integer bit operations: isolate the sign bit of
  // the sign operand, clear the sign bit of the magnitude operand, and OR the
  // two together. Returns a null value when the expansion does not apply.
  EVT VT = Node->getValueType(0);

  // Only handled when the sign operand has the same type as the result.
  if (VT != Node->getOperand(1).getValueType())
    return SDValue();

  EVT IntVT = VT.changeVectorElementTypeToInteger();
  const bool HaveOps = TLI.isOperationLegalOrCustom(ISD::VP_AND, IntVT) &&
                       TLI.isOperationLegalOrCustom(ISD::VP_XOR, IntVT);
  if (!HaveOps)
    return SDValue();

  SDValue Mask = Node->getOperand(2);
  SDValue EVL = Node->getOperand(3);

  SDLoc DL(Node);
  SDValue MagInt = DAG.getNode(ISD::BITCAST, DL, IntVT, Node->getOperand(0));
  SDValue SignInt = DAG.getNode(ISD::BITCAST, DL, IntVT, Node->getOperand(1));

  const unsigned EltBits = IntVT.getScalarSizeInBits();

  // Keep only the sign bit of the sign operand.
  SDValue SignMask = DAG.getConstant(APInt::getSignMask(EltBits), DL, IntVT);
  SDValue SignOnly =
      DAG.getNode(ISD::VP_AND, DL, IntVT, SignInt, SignMask, Mask, EVL);

  // Keep everything but the sign bit of the magnitude operand.
  SDValue ClearSignMask =
      DAG.getConstant(APInt::getSignedMaxValue(EltBits), DL, IntVT);
  SDValue MagOnly =
      DAG.getNode(ISD::VP_AND, DL, IntVT, MagInt, ClearSignMask, Mask, EVL);

  // The two pieces have no set bits in common, hence the Disjoint flag.
  SDValue Combined = DAG.getNode(ISD::VP_OR, DL, IntVT, MagOnly, SignOnly,
                                 Mask, EVL, SDNodeFlags::Disjoint);

  return DAG.getNode(ISD::BITCAST, DL, VT, Combined);
}


/// Expand an FP_TO_UINT / STRICT_FP_TO_UINT node. The TargetLowering expansion
/// is tried first; if it declines, the node is unrolled. For strict nodes the
/// output chain is appended to \p Results after the value.
void VectorLegalizer::ExpandFP_TO_UINT(SDNode *Node,
                                       SmallVectorImpl<SDValue> &Results) {
  const bool IsStrict = Node->isStrictFPOpcode();

  SDValue Expanded, OutChain;
  if (!TLI.expandFP_TO_UINT(Node, Expanded, OutChain, DAG)) {
    // TargetLowering could not expand the node: fall back to unrolling.
    if (IsStrict)
      UnrollStrictFPOp(Node, Results);
    else
      Results.push_back(DAG.UnrollVectorOp(Node));
    return;
  }

  Results.push_back(Expanded);
  if (IsStrict)
    Results.push_back(OutChain);
}


/// Expand a UINT_TO_FP / STRICT_UINT_TO_FP node.
///
/// Strategies are tried in this order:
///  1. the TargetLowering expansion;
///  2. unrolling, when the signed conversion or SRL is marked Expand for the
///     source type;
///  3. converting to an f32/f64 vector and rounding, when FMUL is not
///     available for the destination type;
///  4. splitting each element into two half-words, converting each half with
///     a signed conversion and recombining as hi * 2^(BW/2) + lo.
///
/// For strict nodes the output chain is appended to \p Results after the
/// value.
void VectorLegalizer::ExpandUINT_TO_FLOAT(SDNode *Node,
                                          SmallVectorImpl<SDValue> &Results) {
  const bool IsStrict = Node->isStrictFPOpcode();
  // Strict nodes carry the chain in operand 0, so the source is operand 1.
  SDValue Src = Node->getOperand(IsStrict ? 1 : 0);
  EVT SrcVT = Src.getValueType();
  EVT DstVT = Node->getValueType(0);
  SDLoc DL(Node);

  // Attempt to expand using TargetLowering.
  {
    SDValue Expanded, OutChain;
    if (TLI.expandUINT_TO_FP(Node, Expanded, OutChain, DAG)) {
      Results.push_back(Expanded);
      if (IsStrict)
        Results.push_back(OutChain);
      return;
    }
  }

  // Make sure that the SINT_TO_FP and SRL instructions are available;
  // otherwise unroll.
  const unsigned SIToFPOpc =
      IsStrict ? ISD::STRICT_SINT_TO_FP : ISD::SINT_TO_FP;
  const bool SIToFPExpands =
      TLI.getOperationAction(SIToFPOpc, SrcVT) == TargetLowering::Expand;
  const bool SRLExpands =
      TLI.getOperationAction(ISD::SRL, SrcVT) == TargetLowering::Expand;
  if (SIToFPExpands || SRLExpands) {
    if (IsStrict)
      UnrollStrictFPOp(Node, Results);
    else
      Results.push_back(DAG.UnrollVectorOp(Node));
    return;
  }

  unsigned BW = SrcVT.getScalarSizeInBits();
  assert((BW == 64 || BW == 32) &&
         "Elements in vector-UINT_TO_FP must be 32 or 64 bits wide");

  // If STRICT_/FMUL is not supported by the target (in case of f16) replace the
  // UINT_TO_FP with a larger float and round to the smaller type.
  const unsigned FMulOpc = IsStrict ? ISD::STRICT_FMUL : ISD::FMUL;
  if (!TLI.isOperationLegalOrCustom(FMulOpc, DstVT)) {
    EVT WideEltVT = BW == 32 ? MVT::f32 : MVT::f64;
    SDValue TargetZero = DAG.getIntPtrConstant(0, DL, /*isTarget=*/true);
    EVT WideVecVT = SrcVT.changeVectorElementType(WideEltVT);

    if (!IsStrict) {
      SDValue Wide = DAG.getNode(ISD::UINT_TO_FP, DL, WideVecVT, Src);
      Results.push_back(
          DAG.getNode(ISD::FP_ROUND, DL, DstVT, Wide, TargetZero));
      return;
    }

    SDValue Wide = DAG.getNode(ISD::STRICT_UINT_TO_FP, DL,
                               {WideVecVT, MVT::Other},
                               {Node->getOperand(0), Src});
    SDValue Rounded = DAG.getNode(ISD::STRICT_FP_ROUND, DL,
                                  {DstVT, MVT::Other},
                                  {Node->getOperand(0), Wide, TargetZero});
    Results.push_back(Rounded);
    Results.push_back(Rounded.getValue(1));
    return;
  }

  SDValue ShiftAmt = DAG.getConstant(BW / 2, DL, SrcVT);

  // Constant to clear the upper part of the word.
  // Notice that we can also use SHL+SHR, but using a constant is slightly
  // faster on x86.
  uint64_t LowHalfBits = (BW == 64) ? 0x00000000FFFFFFFF : 0x0000FFFF;
  SDValue LowHalfMask = DAG.getConstant(LowHalfBits, DL, SrcVT);

  // Two to the power of half-word-size.
  SDValue TwoPowHalf = DAG.getConstantFP(1ULL << (BW / 2), DL, DstVT);

  // Upper half shifted down, and lower half with the upper bits cleared.
  SDValue HiInt = DAG.getNode(ISD::SRL, DL, SrcVT, Src, ShiftAmt);
  SDValue LoInt = DAG.getNode(ISD::AND, DL, SrcVT, Src, LowHalfMask);

  // Convert both halves to floating point, scale the high half back to its
  // original weight, and add the two halves.
  // TODO: Can any fast-math-flags be set on these nodes?
  if (!IsStrict) {
    SDValue HiFP = DAG.getNode(ISD::SINT_TO_FP, DL, DstVT, HiInt);
    HiFP = DAG.getNode(ISD::FMUL, DL, DstVT, HiFP, TwoPowHalf);
    SDValue LoFP = DAG.getNode(ISD::SINT_TO_FP, DL, DstVT, LoInt);
    Results.push_back(DAG.getNode(ISD::FADD, DL, DstVT, HiFP, LoFP));
    return;
  }

  SDValue HiFP = DAG.getNode(ISD::STRICT_SINT_TO_FP, DL, {DstVT, MVT::Other},
                             {Node->getOperand(0), HiInt});
  HiFP = DAG.getNode(ISD::STRICT_FMUL, DL, {DstVT, MVT::Other},
                     {HiFP.getValue(1), HiFP, TwoPowHalf});
  SDValue LoFP = DAG.getNode(ISD::STRICT_SINT_TO_FP, DL, {DstVT, MVT::Other},
                             {Node->getOperand(0), LoInt});

  // Join the chains of both halves before the final addition.
  SDValue JoinedChain = DAG.getNode(ISD::TokenFactor, DL, MVT::Other,
                                    HiFP.getValue(1), LoFP.getValue(1));
  SDValue Sum = DAG.getNode(ISD::STRICT_FADD, DL, {DstVT, MVT::Other},
                            {JoinedChain, HiFP, LoFP});

  Results.push_back(Sum);
  Results.push_back(Sum.getValue(1));
}


/// Expand FNEG by flipping the sign bit of every element with an integer XOR
/// on the bitcast operand.
///
/// \returns the replacement value, or an empty SDValue when XOR is neither
/// legal nor custom for the integer type, or when the FSUB check below fails.
SDValue VectorLegalizer::ExpandFNEG(SDNode *Node) {
  const EVT FloatVT = Node->getValueType(0);
  const EVT IntVT = FloatVT.changeVectorElementTypeToInteger();

  const bool HasXor = TLI.isOperationLegalOrCustom(ISD::XOR, IntVT);
  // FIXME: The FSUB check is here to force unrolling v1f64 vectors on AArch64.
  const bool PassesFSubCheck =
      TLI.isOperationLegalOrCustomOrPromote(ISD::FSUB, FloatVT) ||
      FloatVT.isScalableVector();
  if (!HasXor || !PassesFSubCheck)
    return SDValue();

  SDLoc DL(Node);
  SDValue AsInt = DAG.getNode(ISD::BITCAST, DL, IntVT, Node->getOperand(0));
  const unsigned EltBits = IntVT.getScalarSizeInBits();
  SDValue SignOnly = DAG.getConstant(APInt::getSignMask(EltBits), DL, IntVT);
  SDValue Flipped = DAG.getNode(ISD::XOR, DL, IntVT, AsInt, SignOnly);
  return DAG.getNode(ISD::BITCAST, DL, FloatVT, Flipped);
}


/// Expand FABS by clearing the sign bit of every element with an integer AND
/// on the bitcast operand.
///
/// \returns the replacement value, or an empty SDValue when AND is neither
/// legal nor custom for the integer type, or when the FSUB check below fails.
SDValue VectorLegalizer::ExpandFABS(SDNode *Node) {
  const EVT FloatVT = Node->getValueType(0);
  const EVT IntVT = FloatVT.changeVectorElementTypeToInteger();

  const bool HasAnd = TLI.isOperationLegalOrCustom(ISD::AND, IntVT);
  // FIXME: The FSUB check is here to force unrolling v1f64 vectors on AArch64.
  const bool PassesFSubCheck =
      TLI.isOperationLegalOrCustomOrPromote(ISD::FSUB, FloatVT) ||
      FloatVT.isScalableVector();
  if (!HasAnd || !PassesFSubCheck)
    return SDValue();

  SDLoc DL(Node);
  SDValue AsInt = DAG.getNode(ISD::BITCAST, DL, IntVT, Node->getOperand(0));
  const unsigned EltBits = IntVT.getScalarSizeInBits();
  SDValue AllButSign =
      DAG.getConstant(APInt::getSignedMaxValue(EltBits), DL, IntVT);
  SDValue Magnitude = DAG.getNode(ISD::AND, DL, IntVT, AsInt, AllButSign);
  return DAG.getNode(ISD::BITCAST, DL, FloatVT, Magnitude);
}


/// Expand FCOPYSIGN with integer bit operations: isolate the sign bit of
/// operand 1, clear the sign bit of operand 0, and merge the two with a
/// disjoint OR.
///
/// \returns the replacement value, or an empty SDValue when the two operands
/// have different types, when AND / OR is neither legal nor custom for the
/// integer type, or when the FSUB check below fails.
SDValue VectorLegalizer::ExpandFCOPYSIGN(SDNode *Node) {
  const EVT FloatVT = Node->getValueType(0);
  const EVT IntVT = FloatVT.changeVectorElementTypeToInteger();

  if (FloatVT != Node->getOperand(1).getValueType())
    return SDValue();
  if (!TLI.isOperationLegalOrCustom(ISD::AND, IntVT))
    return SDValue();
  if (!TLI.isOperationLegalOrCustom(ISD::OR, IntVT))
    return SDValue();

  // FIXME: The FSUB check is here to force unrolling v1f64 vectors on AArch64.
  if (!FloatVT.isScalableVector() &&
      !TLI.isOperationLegalOrCustomOrPromote(ISD::FSUB, FloatVT))
    return SDValue();

  SDLoc DL(Node);
  const unsigned EltBits = IntVT.getScalarSizeInBits();
  SDValue MagInt = DAG.getNode(ISD::BITCAST, DL, IntVT, Node->getOperand(0));
  SDValue SignInt = DAG.getNode(ISD::BITCAST, DL, IntVT, Node->getOperand(1));

  // Sign bit taken from the sign operand.
  SDValue SignOnly = DAG.getConstant(APInt::getSignMask(EltBits), DL, IntVT);
  SDValue NewSign = DAG.getNode(ISD::AND, DL, IntVT, SignInt, SignOnly);

  // Remaining bits taken from the magnitude operand.
  SDValue AllButSign =
      DAG.getConstant(APInt::getSignedMaxValue(EltBits), DL, IntVT);
  SDValue Magnitude = DAG.getNode(ISD::AND, DL, IntVT, MagInt, AllButSign);

  // The two values have no set bits in common, hence the Disjoint flag.
  SDValue Merged = DAG.getNode(ISD::OR, DL, IntVT, Magnitude, NewSign,
                               SDNodeFlags::Disjoint);
  return DAG.getNode(ISD::BITCAST, DL, FloatVT, Merged);
}


/// Expand FSUB. Nothing is pushed to \p Results when both FNEG and FADD are
/// legal or custom for the type. Otherwise the node is split via TargetLowering
/// if possible, and unrolled as a last resort.
void VectorLegalizer::ExpandFSUB(SDNode *Node,
                                 SmallVectorImpl<SDValue> &Results) {
  const EVT VT = Node->getValueType(0);

  // For floating-point values, (a-b) is the same as a+(-b). If FNEG is legal,
  // we can defer this to operation legalization where it will be lowered as
  // a+(-b).
  const bool CanLowerAsAddOfNeg =
      TLI.isOperationLegalOrCustom(ISD::FNEG, VT) &&
      TLI.isOperationLegalOrCustom(ISD::FADD, VT);
  if (CanLowerAsAddOfNeg)
    return; // Defer to LegalizeDAG

  SDValue Replacement = TLI.expandVectorNaryOpBySplitting(Node, DAG);
  if (!Replacement)
    Replacement = DAG.UnrollVectorOp(Node);
  Results.push_back(Replacement);
}


/// Expand SETCC, VP_SETCC, STRICT_FSETCC and STRICT_FSETCCS nodes.
///
/// If the condition code is not marked Expand for the operand type the node
/// is unrolled. Otherwise TargetLowering is asked to legalize the condition
/// code; when that fails the comparison is rewritten as a SELECT_CC. For
/// strict nodes the output chain is appended to \p Results after the value.
void VectorLegalizer::ExpandSETCC(SDNode *Node,
                                  SmallVectorImpl<SDValue> &Results) {
  const unsigned Opcode = Node->getOpcode();
  const bool IsSignaling = Opcode == ISD::STRICT_FSETCCS;
  const bool IsStrict = IsSignaling || Opcode == ISD::STRICT_FSETCC;
  const bool IsVP = Opcode == ISD::VP_SETCC;
  // Strict nodes carry their chain in operand 0, shifting everything by one.
  const unsigned FirstOp = IsStrict ? 1 : 0;

  SDValue Chain;
  if (IsStrict)
    Chain = Node->getOperand(0);
  SDValue LHS = Node->getOperand(FirstOp);
  SDValue RHS = Node->getOperand(FirstOp + 1);
  SDValue CC = Node->getOperand(FirstOp + 2);

  MVT OpVT = LHS.getSimpleValueType();
  ISD::CondCode CCCode = cast<CondCodeSDNode>(CC)->get();

  // Condition code is not marked Expand for this type: unroll the node.
  if (TLI.getCondCodeAction(CCCode, OpVT) != TargetLowering::Expand) {
    if (IsStrict)
      UnrollStrictFPOp(Node, Results);
    else
      Results.push_back(UnrollVSETCC(Node));
    return;
  }

  SDValue Mask, EVL;
  if (IsVP) {
    Mask = Node->getOperand(FirstOp + 3);
    EVL = Node->getOperand(FirstOp + 4);
  }

  SDLoc dl(Node);
  const EVT ResVT = Node->getValueType(0);
  bool NeedInvert = false;
  // LHS, RHS, CC, NeedInvert and Chain are passed by name here and are read
  // back afterwards to build the replacement.
  const bool Legalized =
      TLI.LegalizeSetCCCondCode(DAG, ResVT, LHS, RHS, CC, Mask, EVL,
                                NeedInvert, dl, Chain, IsSignaling);

  if (!Legalized) {
    assert(!IsStrict && "Don't know how to expand for strict nodes.");

    // Otherwise, SETCC for the given comparison type must be completely
    // illegal; expand it into a SELECT_CC.
    LHS = DAG.getNode(ISD::SELECT_CC, dl, ResVT, LHS, RHS,
                      DAG.getBoolConstant(true, dl, ResVT, LHS.getValueType()),
                      DAG.getBoolConstant(false, dl, ResVT, LHS.getValueType()),
                      CC, Node->getFlags());
  } else {
    // If we expanded the SETCC by swapping LHS and RHS, or by inverting the
    // condition code, create a new SETCC node of the same flavour as the
    // original.
    if (CC.getNode()) {
      if (IsStrict) {
        LHS = DAG.getNode(Opcode, dl, Node->getVTList(),
                          {Chain, LHS, RHS, CC}, Node->getFlags());
        Chain = LHS.getValue(1);
      } else if (IsVP) {
        LHS = DAG.getNode(ISD::VP_SETCC, dl, ResVT,
                          {LHS, RHS, CC, Mask, EVL}, Node->getFlags());
      } else {
        LHS = DAG.getNode(ISD::SETCC, dl, ResVT, LHS, RHS, CC,
                          Node->getFlags());
      }
    }

    // If we expanded the SETCC by inverting the condition code, then wrap
    // the existing SETCC in a NOT to restore the intended condition.
    if (NeedInvert) {
      if (IsVP)
        LHS = DAG.getVPLogicalNOT(dl, LHS, Mask, EVL, LHS->getValueType(0));
      else
        LHS = DAG.getLogicalNOT(dl, LHS, LHS->getValueType(0));
    }
  }

  Results.push_back(LHS);
  if (IsStrict)
    Results.push_back(Chain);
}


/// Expand an unsigned add/sub-with-overflow node through TargetLowering and
/// append the arithmetic value followed by the overflow value to \p Results.
void VectorLegalizer::ExpandUADDSUBO(SDNode *Node,
                                     SmallVectorImpl<SDValue> &Results) {
  SDValue Value;
  SDValue OverflowFlag;
  TLI.expandUADDSUBO(Node, Value, OverflowFlag, DAG);

  Results.push_back(Value);
  Results.push_back(OverflowFlag);
}


/// Expand a signed add/sub-with-overflow node through TargetLowering and
/// append the arithmetic value followed by the overflow value to \p Results.
void VectorLegalizer::ExpandSADDSUBO(SDNode *Node,
                                     SmallVectorImpl<SDValue> &Results) {
  SDValue Value;
  SDValue OverflowFlag;
  TLI.expandSADDSUBO(Node, Value, OverflowFlag, DAG);

  Results.push_back(Value);
  Results.push_back(OverflowFlag);
}


/// Expand a multiply-with-overflow node. The TargetLowering expansion is tried
/// first and the node is unrolled if that fails. The product followed by the
/// overflow value is appended to \p Results.
void VectorLegalizer::ExpandMULO(SDNode *Node,
                                 SmallVectorImpl<SDValue> &Results) {
  SDValue Product, OverflowFlag;
  const bool Expanded = TLI.expandMULO(Node, Product, OverflowFlag, DAG);
  if (!Expanded) {
    std::pair<SDValue, SDValue> Unrolled = DAG.UnrollVectorOverflowOp(Node);
    Product = Unrolled.first;
    OverflowFlag = Unrolled.second;
  }

  Results.push_back(Product);
  Results.push_back(OverflowFlag);
}


/// Expand a fixed-point division node through TargetLowering, passing the
/// node's first two operands and the constant value of operand 2. Nothing is
/// appended to \p Results when TargetLowering returns an empty value.
void VectorLegalizer::ExpandFixedPointDiv(SDNode *Node,
                                          SmallVectorImpl<SDValue> &Results) {
  SDLoc DL(Node);
  SDValue Expanded = TLI.expandFixedPointDiv(
      Node->getOpcode(), DL, Node->getOperand(0), Node->getOperand(1),
      Node->getConstantOperandVal(2), DAG);
  if (!Expanded)
    return;
  Results.push_back(Expanded);
}


/// Expand a strict FP node. STRICT_UINT_TO_FP, STRICT_FP_TO_UINT and the
/// strict compares are routed to their dedicated expanders; every other opcode
/// is unrolled.
void VectorLegalizer::ExpandStrictFPOp(SDNode *Node,
                                       SmallVectorImpl<SDValue> &Results) {
  switch (Node->getOpcode()) {
  case ISD::STRICT_UINT_TO_FP:
    ExpandUINT_TO_FLOAT(Node, Results);
    return;
  case ISD::STRICT_FP_TO_UINT:
    ExpandFP_TO_UINT(Node, Results);
    return;
  case ISD::STRICT_FSETCC:
  case ISD::STRICT_FSETCCS:
    ExpandSETCC(Node, Results);
    return;
  default:
    UnrollStrictFPOp(Node, Results);
    return;
  }
}


/// Expand an SREM / UREM node. The TargetLowering expansion is tried first and
/// the node is unrolled if that fails; the replacement is appended to
/// \p Results.
void VectorLegalizer::ExpandREM(SDNode *Node,
                                SmallVectorImpl<SDValue> &Results) {
  assert((Node->getOpcode() == ISD::SREM || Node->getOpcode() == ISD::UREM) &&
         "Expected REM node");

  SDValue Remainder;
  const bool Expanded = TLI.expandREM(Node, Remainder, DAG);
  if (Expanded) {
    Results.push_back(Remainder);
    return;
  }
  Results.push_back(DAG.UnrollVectorOp(Node));
}


// Try to replace a libm-style node with a call to a vector math routine.
// The caller supplies the libcall that corresponds to Node; its name is used
// to look up a vector mapping in TargetLibraryInfo. Only mappings where the
// result and every operand share one vector type are considered. Predicated
// nodes are not supported, but a masked routine may still be selected, in
// which case an all-true mask is passed to it.
//
// Returns true and appends the call result to Results on success; returns
// false (leaving Results untouched) when no usable routine is found.
bool VectorLegalizer::tryExpandVecMathCall(SDNode *Node, RTLIB::Libcall LC,
                                           SmallVectorImpl<SDValue> &Results) {
  // Chain must be propagated but currently strict fp operations are down
  // converted to their non-strict counterpart.
  assert(!Node->isStrictFPOpcode() && "Unexpected strict fp operation!");

  const char *ScalarName = TLI.getLibcallName(LC);
  if (!ScalarName)
    return false;
  LLVM_DEBUG(dbgs() << "Looking for vector variant of " << ScalarName << "\n");

  EVT VT = Node->getValueType(0);
  ElementCount VL = VT.getVectorElementCount();
  const unsigned NumOps = Node->getNumOperands();

  // Lookup a vector function equivalent to the specified libcall. Prefer
  // unmasked variants but we will generate a mask if need be.
  const TargetLibraryInfo &TLibInfo = DAG.getLibInfo();
  const VecDesc *VD = nullptr;
  for (bool Masked : {false, true}) {
    VD = TLibInfo.getVectorMappingInfo(ScalarName, VL, Masked);
    if (VD)
      break;
  }
  if (!VD)
    return false;

  LLVMContext *Ctx = DAG.getContext();
  Type *Ty = VT.getTypeForEVT(*Ctx);
  Type *ScalarTy = Ty->getScalarType();

  // Construct a scalar function type based on Node's operands: one scalar
  // parameter per operand, all of the result's scalar type.
  assert(llvm::all_of(Node->op_values(),
                      [&VT](SDValue Op) { return Op.getValueType() == VT; }) &&
         "Expected matching vector types!");
  SmallVector<Type *, 8> ArgTys(NumOps, ScalarTy);
  FunctionType *ScalarFTy = FunctionType::get(ScalarTy, ArgTys, false);

  // Generate call information for the vector function.
  const std::string MangledName = VD->getVectorFunctionABIVariantString();
  auto OptVFInfo = VFABI::tryDemangleForVFABI(MangledName, ScalarFTy);
  if (!OptVFInfo)
    return false;

  LLVM_DEBUG(dbgs() << "Found vector variant " << VD->getVectorFnName()
                    << "\n");

  // Sanity check just in case OptVFInfo has unexpected parameters: expect one
  // parameter per operand, plus one more for a masked variant.
  if (OptVFInfo->Shape.Parameters.size() != NumOps + VD->isMasked())
    return false;

  // Collect vector call operands.
  SDLoc DL(Node);
  TargetLowering::ArgListTy Args;
  unsigned NextOperand = 0;
  for (auto &VFParam : OptVFInfo->Shape.Parameters) {
    switch (VFParam.ParamKind) {
    case VFParamKind::GlobalPredicate: {
      // The routine takes a mask: supply an all-true one.
      EVT MaskVT = TLI.getSetCCResultType(DAG.getDataLayout(), *Ctx, VT);
      Args.emplace_back(DAG.getBoolConstant(true, DL, MaskVT, VT),
                        MaskVT.getTypeForEVT(*Ctx));
      break;
    }
    case VFParamKind::Vector:
      Args.emplace_back(Node->getOperand(NextOperand++), Ty);
      break;
    default:
      // Only vector operands are supported.
      return false;
    }
  }

  // Emit a call to the vector function.
  SDValue Callee = DAG.getExternalSymbol(VD->getVectorFnName().data(),
                                         TLI.getPointerTy(DAG.getDataLayout()));
  TargetLowering::CallLoweringInfo CLI(DAG);
  CLI.setDebugLoc(DL)
      .setChain(DAG.getEntryNode())
      .setLibCallee(CallingConv::C, Ty, Callee, std::move(Args));

  // LowerCallTo yields a pair; only its first member is used here.
  Results.push_back(TLI.LowerCallTo(CLI).first);
  return true;
}


/// Pick the libcall matching the element type of the node's result out of the
/// per-FP-type candidates and try to expand the node to the corresponding
/// vector libcall. Returns false when no libcall exists for the element type
/// or when the expansion itself fails.
bool VectorLegalizer::tryExpandVecMathCall(
    SDNode *Node, RTLIB::Libcall Call_F32, RTLIB::Libcall Call_F64,
    RTLIB::Libcall Call_F80, RTLIB::Libcall Call_F128,
    RTLIB::Libcall Call_PPCF128, SmallVectorImpl<SDValue> &Results) {
  const EVT EltVT = Node->getValueType(0).getVectorElementType();
  const RTLIB::Libcall LC = RTLIB::getFPLibCall(
      EltVT, Call_F32, Call_F64, Call_F80, Call_F128, Call_PPCF128);

  return LC != RTLIB::UNKNOWN_LIBCALL &&
         tryExpandVecMathCall(Node, LC, Results);
}


/// Unroll a strict FP vector node into one scalar strict node per element.
/// Every scalar node uses the original node's input chain; their output
/// chains are merged with a TokenFactor. The rebuilt vector followed by the
/// merged chain is appended to \p Results.
void VectorLegalizer::UnrollStrictFPOp(SDNode *Node,
                                       SmallVectorImpl<SDValue> &Results) {
  const unsigned Opcode = Node->getOpcode();
  const bool IsCompare =
      Opcode == ISD::STRICT_FSETCC || Opcode == ISD::STRICT_FSETCCS;

  EVT VT = Node->getValueType(0);
  EVT EltVT = VT.getVectorElementType();
  const unsigned NumElems = VT.getVectorNumElements();
  const unsigned NumOpers = Node->getNumOperands();

  // Strict compares produce the target's setcc result type per element; the
  // result is converted to EltVT further down.
  EVT ScalarResVT = EltVT;
  if (IsCompare)
    ScalarResVT = DAG.getTargetLoweringInfo().getSetCCResultType(
        DAG.getDataLayout(), *DAG.getContext(), EltVT);

  EVT ScalarVTs[] = {ScalarResVT, MVT::Other};
  SDValue InChain = Node->getOperand(0);
  SDLoc dl(Node);

  SmallVector<SDValue, 32> EltValues;
  SmallVector<SDValue, 32> EltChains;
  for (unsigned Lane = 0; Lane != NumElems; ++Lane) {
    SDValue LaneIdx = DAG.getVectorIdxConstant(Lane, dl);

    // The chain is the first operand; the remaining operands follow, with
    // vector operands replaced by their element for this lane.
    SmallVector<SDValue, 4> ScalarOps;
    ScalarOps.push_back(InChain);
    for (unsigned OpIdx = 1; OpIdx != NumOpers; ++OpIdx) {
      SDValue Oper = Node->getOperand(OpIdx);
      EVT OperVT = Oper.getValueType();
      if (!OperVT.isVector()) {
        ScalarOps.push_back(Oper);
        continue;
      }
      ScalarOps.push_back(DAG.getNode(ISD::EXTRACT_VECTOR_ELT, dl,
                                      OperVT.getVectorElementType(), Oper,
                                      LaneIdx));
    }

    SDValue ScalarNode = DAG.getNode(Opcode, dl, ScalarVTs, ScalarOps);
    SDValue EltValue = ScalarNode.getValue(0);

    // Turn the scalar compare result into all-ones / zero of type EltVT.
    if (IsCompare)
      EltValue = DAG.getSelect(dl, EltVT, EltValue,
                               DAG.getAllOnesConstant(dl, EltVT),
                               DAG.getConstant(0, dl, EltVT));

    EltValues.push_back(EltValue);
    EltChains.push_back(ScalarNode.getValue(1));
  }

  SDValue Vec = DAG.getBuildVector(VT, dl, EltValues);
  SDValue OutChain = DAG.getNode(ISD::TokenFactor, dl, MVT::Other, EltChains);

  Results.push_back(Vec);
  Results.push_back(OutChain);
}


/// Unroll a vector SETCC into one scalar SETCC per element. Each scalar
/// result is converted to the result element type with a select between the
/// boolean "true" constant and zero, and the elements are reassembled with a
/// BUILD_VECTOR.
SDValue VectorLegalizer::UnrollVSETCC(SDNode *Node) {
  EVT VT = Node->getValueType(0);
  EVT EltVT = VT.getVectorElementType();
  const unsigned NumElems = VT.getVectorNumElements();

  SDValue LHS = Node->getOperand(0);
  SDValue RHS = Node->getOperand(1);
  SDValue CC = Node->getOperand(2);
  EVT OpEltVT = LHS.getValueType().getVectorElementType();
  // FIXME: We should use i1 setcc + boolext here, but it causes regressions.
  EVT ScalarCmpVT = TLI.getSetCCResultType(DAG.getDataLayout(),
                                           *DAG.getContext(), OpEltVT);
  SDLoc dl(Node);

  SmallVector<SDValue, 8> Elts(NumElems);
  for (unsigned Lane = 0; Lane != NumElems; ++Lane) {
    SDValue LHSElt = DAG.getNode(ISD::EXTRACT_VECTOR_ELT, dl, OpEltVT, LHS,
                                 DAG.getVectorIdxConstant(Lane, dl));
    SDValue RHSElt = DAG.getNode(ISD::EXTRACT_VECTOR_ELT, dl, OpEltVT, RHS,
                                 DAG.getVectorIdxConstant(Lane, dl));
    SDValue Cmp = DAG.getNode(ISD::SETCC, dl, ScalarCmpVT, LHSElt, RHSElt, CC);
    Elts[Lane] = DAG.getSelect(dl, EltVT, Cmp,
                               DAG.getBoolConstant(true, dl, EltVT, VT),
                               DAG.getConstant(0, dl, EltVT));
  }
  return DAG.getBuildVector(VT, dl, Elts);
}


bool SelectionDAG::LegalizeVectors() {

  return VectorLegalizer(*this).Run();

}

assert
assert(UImm &&(UImm !=~static_cast< T >(0)) &&"Invalid immediate!")

DL
MachineBasicBlock MachineBasicBlock::iterator DebugLoc DL
Definition: ARMSLSHardening.cpp:73

Results
Function Alias Analysis Results
Definition: AliasAnalysis.cpp:722

From
BlockVerifier::State From
Definition: BlockVerifier.cpp:57

Casting.h

Compiler.h

DataLayout.h

Idx
Returns the sub type a function will return at a given Idx Should correspond to the result type of an ExtractValue instruction executed with just that one unsigned Idx
Definition: DeadArgumentElimination.cpp:347

DenseMap.h
This file defines the DenseMap class.

ISDOpcodes.h

createBSWAPShuffleMask
static void createBSWAPShuffleMask(EVT VT, SmallVectorImpl< int > &ShuffleMask)
Definition: LegalizeVectorOps.cpp:1495

I
#define I(x, y, z)
Definition: MD5.cpp:58

Operands
mir Rename Register Operands
Definition: MIRNamerPass.cpp:74

MachineValueType.h

Opc
auto Opc
Definition: RISCVRedundantCopyElimination.cpp:75

SelectionDAGNodes.h

SelectionDAG.h

SmallVector.h
This file defines the SmallVector class.

Debug.h

LLVM_DEBUG
#define LLVM_DEBUG(...)
Definition: Debug.h:119

TargetLibraryInfo.h

TargetLowering.h
This file describes how to lower LLVM code to machine code.

ValueTypes.h

VectorUtils.h

RHS
Value * RHS
Definition: X86PartialReduction.cpp:74

LHS
Value * LHS
Definition: X86PartialReduction.cpp:73

Mul
BinaryOperator * Mul
Definition: X86PartialReduction.cpp:68

FunctionType
Definition: ItaniumDemangle.h:835

Node
Definition: ItaniumDemangle.h:166

Node::dump
DEMANGLE_DUMP_METHOD void dump() const

T

llvm::APInt::getSignMask
static APInt getSignMask(unsigned BitWidth)
Get the SignMask for a specific bit width.
Definition: APInt.h:229

llvm::APInt::getSignedMaxValue
static APInt getSignedMaxValue(unsigned numBits)
Gets maximum signed value of APInt for a specific bit width.
Definition: APInt.h:209

llvm::DWARFExpression::Operation
This class represents an Operation in the Expression.
Definition: DWARFExpression.h:33

llvm::DenseMapBase::insert
std::pair< iterator, bool > insert(const std::pair< KeyT, ValueT > &KV)
Definition: DenseMap.h:230

llvm::DenseMap
Definition: DenseMap.h:730

llvm::ElementCount
Definition: TypeSize.h:301

llvm::Function::size
size_t size() const
Definition: Function.h:856

llvm::LLVMContext
This is an important class for using LLVM in a threaded context.
Definition: LLVMContext.h:68

llvm::LoadSDNode
This class is used to represent ISD::LOAD nodes.
Definition: SelectionDAGNodes.h:2533

llvm::MVT
Machine Value Type.
Definition: MachineValueType.h:36

llvm::MVT::getVectorNumElements
unsigned getVectorNumElements() const
Definition: MachineValueType.h:295

llvm::MVT::isVector
bool isVector() const
Return true if this is a vector value type.
Definition: MachineValueType.h:107

llvm::MVT::getVectorElementType
MVT getVectorElementType() const
Definition: MachineValueType.h:264

llvm::MVT::isFloatingPoint
bool isFloatingPoint() const
Return true if this is a FP or a vector FP type.
Definition: MachineValueType.h:81

llvm::MVT::getScalarType
MVT getScalarType() const
If this is a vector, return the element type, otherwise return this.
Definition: MachineValueType.h:260

llvm::MutableArrayRef
MutableArrayRef - Represent a mutable reference to an array (0 or more elements consecutively in memo...
Definition: ArrayRef.h:303

llvm::SDLoc
Wrapper class for IR location info (IR ordering and DebugLoc) to be passed into SDNode creation funct...
Definition: SelectionDAGNodes.h:1225

llvm::SDNode
Represents one node in the SelectionDAG.
Definition: SelectionDAGNodes.h:501

llvm::SDNode::getNumValues
unsigned getNumValues() const
Return the number of values defined/returned by this operator.
Definition: SelectionDAGNodes.h:1101

llvm::SDValue
Unlike LLVM values, Selection DAG nodes may return multiple values as the result of a computation.
Definition: SelectionDAGNodes.h:147

llvm::SDValue::getNode
SDNode * getNode() const
get the SDNode which holds the desired result
Definition: SelectionDAGNodes.h:161

llvm::SDValue::getValue
SDValue getValue(unsigned R) const
Definition: SelectionDAGNodes.h:181

llvm::SDValue::getValueType
EVT getValueType() const
Return the ValueType of the referenced return value.
Definition: SelectionDAGNodes.h:1260

llvm::SDValue::getValueSizeInBits
TypeSize getValueSizeInBits() const
Returns the size of the value in bits.
Definition: SelectionDAGNodes.h:201

llvm::SelectionDAG
This is used to represent a portion of an LLVM function in a low-level Data Dependence DAG representa...
Definition: SelectionDAG.h:229

llvm::SelectionDAG::LegalizeVectors
LLVM_ABI bool LegalizeVectors()
This transforms the SelectionDAG into a SelectionDAG that only uses vector math operations supported ...
Definition: LegalizeVectorOps.cpp:2358

llvm::SelectionDAG::getTargetLoweringInfo
const TargetLowering & getTargetLoweringInfo() const
Definition: SelectionDAG.h:504

llvm::SelectionDAG::allnodes_iterator
ilist< SDNode >::iterator allnodes_iterator
Definition: SelectionDAG.h:561

llvm::SmallDenseMap
Definition: DenseMap.h:889

llvm::SmallVectorBase::empty
bool empty() const
Definition: SmallVector.h:82

llvm::SmallVectorBase::size
size_t size() const
Definition: SmallVector.h:79

llvm::SmallVectorImpl
This class consists of common code factored out of the SmallVector class to reduce code duplication b...
Definition: SmallVector.h:574

llvm::SmallVectorImpl::resize
void resize(size_type N)
Definition: SmallVector.h:639

llvm::SmallVectorTemplateBase::push_back
void push_back(const T &Elt)
Definition: SmallVector.h:414

llvm::SmallVector
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
Definition: SmallVector.h:1197

llvm::StoreSDNode
This class is used to represent ISD::STORE nodes.
Definition: SelectionDAGNodes.h:2561

llvm::StringRef::data
constexpr const char * data() const
data - Get a pointer to the start of the string (which may not be null terminated).
Definition: StringRef.h:148

llvm::TargetLibraryInfo
Provides information about what library functions are available for the current target.
Definition: TargetLibraryInfo.h:285

llvm::TargetLibraryInfo::getVectorMappingInfo
const VecDesc * getVectorMappingInfo(StringRef F, const ElementCount &VF, bool Masked) const
Definition: TargetLibraryInfo.h:407

llvm::TargetLoweringBase::LegalizeAction
LegalizeAction
This enum indicates whether operations are valid for a target, and if not, what action should be used...
Definition: TargetLowering.h:202

llvm::TargetLoweringBase::getSetCCResultType
virtual EVT getSetCCResultType(const DataLayout &DL, LLVMContext &Context, EVT VT) const
Return the ValueType of the result of SETCC operations.
Definition: TargetLoweringBase.cpp:1599

llvm::TargetLoweringBase::ArgListTy
std::vector< ArgListEntry > ArgListTy
Definition: TargetLowering.h:341

llvm::TargetLowering
This class defines information used to lower LLVM code to legal SelectionDAG operators that the targe...
Definition: TargetLowering.h:3937

llvm::Type
The instances of the Type class are immutable: once they are created, they are never changed.
Definition: Type.h:45

llvm::Type::getScalarType
Type * getScalarType() const
If this is a vector type, return the element type, otherwise return 'this'.
Definition: Type.h:352

llvm::VecDesc
Provides info so a possible vectorization of a function can be computed.
Definition: TargetLibraryInfo.h:43

llvm::VecDesc::isMasked
bool isMasked() const
Definition: TargetLibraryInfo.h:63

llvm::VecDesc::getVectorFunctionABIVariantString
LLVM_ABI std::string getVectorFunctionABIVariantString() const
Returns a vector function ABI variant string on the form: ZGV<isa><mask><vlen><vparams><scalarname>(<...
Definition: TargetLibraryInfo.cpp:51

llvm::VecDesc::getVectorFnName
StringRef getVectorFnName() const
Definition: TargetLibraryInfo.h:61

uint64_t

ErrorHandling.h

llvm_unreachable
#define llvm_unreachable(msg)
Marks that the current location is not supposed to be reachable.
Definition: ErrorHandling.h:164

llvm::AArch64CC::HI
@ HI
Definition: AArch64BaseInfo.h:263

llvm::AArch64CC::LO
@ LO
Definition: AArch64BaseInfo.h:258

llvm::AMDGPU::HSAMD::Kernel::Key::Args
constexpr char Args[]
Key for Kernel::Metadata::mArgs.
Definition: AMDGPUMetadata.h:396

llvm::ARM_MB::LD
@ LD
Definition: ARMBaseInfo.h:72

llvm::ARM_MB::ST
@ ST
Definition: ARMBaseInfo.h:73

llvm::BitmaskEnumDetail::Mask
constexpr std::underlying_type_t< E > Mask()
Get a bitmask with 1s in all places up to the high-order bit of E's largest value.
Definition: BitmaskEnum.h:126

llvm::CallingConv::C
@ C
The default llvm calling convention, compatible with C.
Definition: CallingConv.h:34

llvm::ISD::SETCC
@ SETCC
SetCC operator - This evaluates to a true value iff the condition is true.
Definition: ISDOpcodes.h:801

llvm::ISD::MERGE_VALUES
@ MERGE_VALUES
MERGE_VALUES - This node takes multiple discrete operands and returns them all as its individual resu...
Definition: ISDOpcodes.h:256

llvm::ISD::CTLZ_ZERO_UNDEF
@ CTLZ_ZERO_UNDEF
Definition: ISDOpcodes.h:774

llvm::ISD::STRICT_FSETCC
@ STRICT_FSETCC
STRICT_FSETCC/STRICT_FSETCCS - Constrained versions of SETCC, used for floating-point operands only.
Definition: ISDOpcodes.h:504

llvm::ISD::STORE
@ STORE
Definition: ISDOpcodes.h:1142

llvm::ISD::LRINT
@ LRINT
Definition: ISDOpcodes.h:1042

llvm::ISD::PARTIAL_REDUCE_SMLA
@ PARTIAL_REDUCE_SMLA
Definition: ISDOpcodes.h:1510

llvm::ISD::VECREDUCE_SEQ_FADD
@ VECREDUCE_SEQ_FADD
Generic reduction nodes.
Definition: ISDOpcodes.h:1458

llvm::ISD::FLOG10
@ FLOG10
Definition: ISDOpcodes.h:1029

llvm::ISD::VECREDUCE_SMIN
@ VECREDUCE_SMIN
Definition: ISDOpcodes.h:1491

llvm::ISD::SREM
@ SREM
Definition: ISDOpcodes.h:264

llvm::ISD::SMUL_LOHI
@ SMUL_LOHI
SMUL_LOHI/UMUL_LOHI - Multiply two integers of type iN, producing a signed/unsigned value of type i[2...
Definition: ISDOpcodes.h:270

llvm::ISD::UDIV
@ UDIV
Definition: ISDOpcodes.h:263

llvm::ISD::UINT_TO_FP
@ UINT_TO_FP
Definition: ISDOpcodes.h:863

llvm::ISD::UMIN
@ UMIN
Definition: ISDOpcodes.h:720

llvm::ISD::BSWAP
@ BSWAP
Byte Swap and Counting operators.
Definition: ISDOpcodes.h:765

llvm::ISD::ROTR
@ ROTR
Definition: ISDOpcodes.h:760

llvm::ISD::FPOW
@ FPOW
Definition: ISDOpcodes.h:1015

llvm::ISD::SMULFIX
@ SMULFIX
RESULT = [US]MULFIX(LHS, RHS, SCALE) - Perform fixed point multiplication on 2 integers with the same...
Definition: ISDOpcodes.h:387

llvm::ISD::UADDO
@ UADDO
Definition: ISDOpcodes.h:344

llvm::ISD::FTRUNC
@ FTRUNC
Definition: ISDOpcodes.h:1034

llvm::ISD::SDIV
@ SDIV
Definition: ISDOpcodes.h:262

llvm::ISD::FMAXNUM_IEEE
@ FMAXNUM_IEEE
Definition: ISDOpcodes.h:1076

llvm::ISD::LLRINT
@ LLRINT
Definition: ISDOpcodes.h:1043

llvm::ISD::ADD
@ ADD
Simple integer binary arithmetic operators.
Definition: ISDOpcodes.h:259

llvm::ISD::LOAD
@ LOAD
LOAD and STORE have token chains as their first operand, then the same operands as an LLVM load/store...
Definition: ISDOpcodes.h:1141

llvm::ISD::SMULFIXSAT
@ SMULFIXSAT
Same as the corresponding unsaturated fixed point instructions, but the result is clamped between the...
Definition: ISDOpcodes.h:393

llvm::ISD::STRICT_FMA
@ STRICT_FMA
Definition: ISDOpcodes.h:425

llvm::ISD::ANY_EXTEND
@ ANY_EXTEND
ANY_EXTEND - Used for integer types. The high bits are undefined.
Definition: ISDOpcodes.h:835

llvm::ISD::FSUB
@ FSUB
Definition: ISDOpcodes.h:411

llvm::ISD::FMA
@ FMA
FMA - Perform a * b + c with no intermediate rounding step.
Definition: ISDOpcodes.h:511

llvm::ISD::UMULFIX
@ UMULFIX
Definition: ISDOpcodes.h:388

llvm::ISD::VECTOR_FIND_LAST_ACTIVE
@ VECTOR_FIND_LAST_ACTIVE
Definition: ISDOpcodes.h:1550

llvm::ISD::FMODF
@ FMODF
FMODF - Decomposes the operand into integral and fractional parts, each having the same type and sign...
Definition: ISDOpcodes.h:1098

llvm::ISD::FATAN2
@ FATAN2
FATAN2 - atan2, inspired by libm.
Definition: ISDOpcodes.h:1020

llvm::ISD::FABS
@ FABS
Definition: ISDOpcodes.h:1003

llvm::ISD::FSINCOSPI
@ FSINCOSPI
FSINCOSPI - Compute both the sine and cosine times pi more accurately than FSINCOS(pi*x),...
Definition: ISDOpcodes.h:1094

llvm::ISD::FNEARBYINT
@ FNEARBYINT
Definition: ISDOpcodes.h:1036

llvm::ISD::FCOSH
@ FCOSH
Definition: ISDOpcodes.h:1013

llvm::ISD::SINT_TO_FP
@ SINT_TO_FP
[SU]INT_TO_FP - These operators convert integers (whose interpreted sign depends on the first letter)...
Definition: ISDOpcodes.h:862

llvm::ISD::VECREDUCE_FMAX
@ VECREDUCE_FMAX
FMIN/FMAX nodes can have flags, for NaN/NoNaN variants.
Definition: ISDOpcodes.h:1476

llvm::ISD::FADD
@ FADD
Simple binary floating point operators.
Definition: ISDOpcodes.h:410

llvm::ISD::VECREDUCE_FMAXIMUM
@ VECREDUCE_FMAXIMUM
FMINIMUM/FMAXIMUM nodes propagate NaNs and signed zeroes using the llvm.minimum and llvm....
Definition: ISDOpcodes.h:1480

llvm::ISD::ABS
@ ABS
ABS - Determine the unsigned absolute value of a signed integer value of the same bitwidth.
Definition: ISDOpcodes.h:738

llvm::ISD::FEXP10
@ FEXP10
Definition: ISDOpcodes.h:1032

llvm::ISD::SIGN_EXTEND_VECTOR_INREG
@ SIGN_EXTEND_VECTOR_INREG
SIGN_EXTEND_VECTOR_INREG(Vector) - This operator represents an in-register sign-extension of the low ...
Definition: ISDOpcodes.h:892

llvm::ISD::UDIVREM
@ UDIVREM
Definition: ISDOpcodes.h:276

llvm::ISD::SDIVREM
@ SDIVREM
SDIVREM/UDIVREM - Divide two integers and produce both a quotient and remainder result.
Definition: ISDOpcodes.h:275

llvm::ISD::FACOS
@ FACOS
Definition: ISDOpcodes.h:1010

llvm::ISD::VECREDUCE_SMAX
@ VECREDUCE_SMAX
Definition: ISDOpcodes.h:1490

llvm::ISD::SRL
@ SRL
Definition: ISDOpcodes.h:758

llvm::ISD::STRICT_FSETCCS
@ STRICT_FSETCCS
Definition: ISDOpcodes.h:505

llvm::ISD::FMAXIMUM
@ FMAXIMUM
Definition: ISDOpcodes.h:1082

llvm::ISD::FATAN
@ FATAN
Definition: ISDOpcodes.h:1011

llvm::ISD::FPTRUNC_ROUND
@ FPTRUNC_ROUND
FPTRUNC_ROUND - This corresponds to the fptrunc_round intrinsic.
Definition: ISDOpcodes.h:508

llvm::ISD::BITCAST
@ BITCAST
BITCAST - This operator converts between integer, vector and FP values, as if the value was stored to...
Definition: ISDOpcodes.h:975

llvm::ISD::STRICT_FDIV
@ STRICT_FDIV
Definition: ISDOpcodes.h:423

llvm::ISD::FFLOOR
@ FFLOOR
Definition: ISDOpcodes.h:1039

llvm::ISD::FLDEXP
@ FLDEXP
FLDEXP - ldexp, inspired by libm (op0 * 2**op1).
Definition: ISDOpcodes.h:1018

llvm::ISD::SDIVFIX
@ SDIVFIX
RESULT = [US]DIVFIX(LHS, RHS, SCALE) - Perform fixed point division on 2 integers with the same width...
Definition: ISDOpcodes.h:400

llvm::ISD::STRICT_FSQRT
@ STRICT_FSQRT
Constrained versions of libm-equivalent floating point intrinsics.
Definition: ISDOpcodes.h:431

llvm::ISD::UCMP
@ UCMP
Definition: ISDOpcodes.h:727

llvm::ISD::SRA
@ SRA
Definition: ISDOpcodes.h:757

llvm::ISD::STRICT_FMUL
@ STRICT_FMUL
Definition: ISDOpcodes.h:422

llvm::ISD::LLROUND
@ LLROUND
Definition: ISDOpcodes.h:1041

llvm::ISD::USUBO
@ USUBO
Definition: ISDOpcodes.h:348

llvm::ISD::AVGFLOORU
@ AVGFLOORU
Definition: ISDOpcodes.h:702

llvm::ISD::PARTIAL_REDUCE_UMLA
@ PARTIAL_REDUCE_UMLA
Definition: ISDOpcodes.h:1511

llvm::ISD::SIGN_EXTEND
@ SIGN_EXTEND
Conversion operators.
Definition: ISDOpcodes.h:826

llvm::ISD::FLOG2
@ FLOG2
Definition: ISDOpcodes.h:1028

llvm::ISD::AVGCEILS
@ AVGCEILS
AVGCEILS/AVGCEILU - Rounding averaging add - Add two integers using an integer of type i[N+2],...
Definition: ISDOpcodes.h:706

llvm::ISD::STRICT_UINT_TO_FP
@ STRICT_UINT_TO_FP
Definition: ISDOpcodes.h:478

llvm::ISD::USHLSAT
@ USHLSAT
Definition: ISDOpcodes.h:380

llvm::ISD::UDIVFIXSAT
@ UDIVFIXSAT
Definition: ISDOpcodes.h:407

llvm::ISD::VECREDUCE_FADD
@ VECREDUCE_FADD
These reductions have relaxed evaluation order semantics, and have a single vector operand.
Definition: ISDOpcodes.h:1473

llvm::ISD::UADDSAT
@ UADDSAT
Definition: ISDOpcodes.h:361

llvm::ISD::CTTZ_ZERO_UNDEF
@ CTTZ_ZERO_UNDEF
Bit counting operators with an undefined result for zero inputs.
Definition: ISDOpcodes.h:773

llvm::ISD::FASIN
@ FASIN
Definition: ISDOpcodes.h:1009

llvm::ISD::FMAXNUM
@ FMAXNUM
Definition: ISDOpcodes.h:1060

llvm::ISD::FPOWI
@ FPOWI
Definition: ISDOpcodes.h:1016

llvm::ISD::FRINT
@ FRINT
Definition: ISDOpcodes.h:1035

llvm::ISD::VECREDUCE_FMIN
@ VECREDUCE_FMIN
Definition: ISDOpcodes.h:1477

llvm::ISD::FSINCOS
@ FSINCOS
FSINCOS - Compute both fsin and fcos as a single operation.
Definition: ISDOpcodes.h:1090

llvm::ISD::FNEG
@ FNEG
Perform various unary floating-point operations inspired by libm.
Definition: ISDOpcodes.h:1002

llvm::ISD::CTTZ
@ CTTZ
Definition: ISDOpcodes.h:766

llvm::ISD::SSUBO
@ SSUBO
Same for subtraction.
Definition: ISDOpcodes.h:347

llvm::ISD::FP_TO_UINT
@ FP_TO_UINT
Definition: ISDOpcodes.h:909

llvm::ISD::STEP_VECTOR
@ STEP_VECTOR
STEP_VECTOR(IMM) - Returns a scalable vector whose lanes are comprised of a linear sequence of unsign...
Definition: ISDOpcodes.h:682

llvm::ISD::OR
@ OR
Definition: ISDOpcodes.h:731

llvm::ISD::FCANONICALIZE
@ FCANONICALIZE
Returns platform specific canonical encoding of a floating point number.
Definition: ISDOpcodes.h:528

llvm::ISD::SSUBSAT
@ SSUBSAT
RESULT = [US]SUBSAT(LHS, RHS) - Perform saturation subtraction on 2 integers with the same bit width ...
Definition: ISDOpcodes.h:369

llvm::ISD::UMULO
@ UMULO
Definition: ISDOpcodes.h:352

llvm::ISD::SELECT
@ SELECT
Select(COND, TRUEVAL, FALSEVAL).
Definition: ISDOpcodes.h:778

llvm::ISD::UMUL_LOHI
@ UMUL_LOHI
Definition: ISDOpcodes.h:271

llvm::ISD::VECREDUCE_UMAX
@ VECREDUCE_UMAX
Definition: ISDOpcodes.h:1492

llvm::ISD::FTANH
@ FTANH
Definition: ISDOpcodes.h:1014

llvm::ISD::SPLAT_VECTOR
@ SPLAT_VECTOR
SPLAT_VECTOR(VAL) - Returns a vector with the scalar value VAL duplicated in all lanes.
Definition: ISDOpcodes.h:663

llvm::ISD::FSHL
@ FSHL
Definition: ISDOpcodes.h:761

llvm::ISD::AVGCEILU
@ AVGCEILU
Definition: ISDOpcodes.h:707

llvm::ISD::SADDO
@ SADDO
RESULT, BOOL = [SU]ADDO(LHS, RHS) - Overflow-aware nodes for addition.
Definition: ISDOpcodes.h:343

llvm::ISD::FSHR
@ FSHR
Definition: ISDOpcodes.h:762

llvm::ISD::FROUND
@ FROUND
Definition: ISDOpcodes.h:1037

llvm::ISD::USUBSAT
@ USUBSAT
Definition: ISDOpcodes.h:370

llvm::ISD::VECREDUCE_ADD
@ VECREDUCE_ADD
Integer reductions may have a result type larger than the vector element type.
Definition: ISDOpcodes.h:1485

llvm::ISD::MULHU
@ MULHU
MULHU/MULHS - Multiply high - Multiply two integers of type iN, producing an unsigned/signed value of...
Definition: ISDOpcodes.h:695

llvm::ISD::SHL
@ SHL
Shift and rotation operations.
Definition: ISDOpcodes.h:756

llvm::ISD::FMINNUM_IEEE
@ FMINNUM_IEEE
FMINNUM_IEEE/FMAXNUM_IEEE - Perform floating-point minimumNumber or maximumNumber on two values,...
Definition: ISDOpcodes.h:1075

llvm::ISD::FCOS
@ FCOS
Definition: ISDOpcodes.h:1007

llvm::ISD::XOR
@ XOR
Definition: ISDOpcodes.h:732

llvm::ISD::EXTRACT_VECTOR_ELT
@ EXTRACT_VECTOR_ELT
EXTRACT_VECTOR_ELT(VECTOR, IDX) - Returns a single element from VECTOR identified by the (potentially...
Definition: ISDOpcodes.h:563

llvm::ISD::ZERO_EXTEND
@ ZERO_EXTEND
ZERO_EXTEND - Used for integer types, zeroing the new bits.
Definition: ISDOpcodes.h:832

llvm::ISD::FP_TO_UINT_SAT
@ FP_TO_UINT_SAT
Definition: ISDOpcodes.h:928

llvm::ISD::CTPOP
@ CTPOP
Definition: ISDOpcodes.h:768

llvm::ISD::SELECT_CC
@ SELECT_CC
Select with condition operator - This selects between a true value and a false value (ops #2 and #3) ...
Definition: ISDOpcodes.h:793

llvm::ISD::FMUL
@ FMUL
Definition: ISDOpcodes.h:412

llvm::ISD::VECREDUCE_XOR
@ VECREDUCE_XOR
Definition: ISDOpcodes.h:1489

llvm::ISD::FTAN
@ FTAN
Definition: ISDOpcodes.h:1008

llvm::ISD::FMINNUM
@ FMINNUM
FMINNUM/FMAXNUM - Perform floating-point minimum or maximum on two values, following IEEE-754 definition...
Definition: ISDOpcodes.h:1059

llvm::ISD::SUB
@ SUB
Definition: ISDOpcodes.h:260

llvm::ISD::MULHS
@ MULHS
Definition: ISDOpcodes.h:696

llvm::ISD::SSHLSAT
@ SSHLSAT
RESULT = [US]SHLSAT(LHS, RHS) - Perform saturation left shift.
Definition: ISDOpcodes.h:379

llvm::ISD::SMULO
@ SMULO
Same for multiplication.
Definition: ISDOpcodes.h:351

llvm::ISD::VECREDUCE_AND
@ VECREDUCE_AND
Definition: ISDOpcodes.h:1487

llvm::ISD::ANY_EXTEND_VECTOR_INREG
@ ANY_EXTEND_VECTOR_INREG
ANY_EXTEND_VECTOR_INREG(Vector) - This operator represents an in-register any-extension of the low la...
Definition: ISDOpcodes.h:881

llvm::ISD::SIGN_EXTEND_INREG
@ SIGN_EXTEND_INREG
SIGN_EXTEND_INREG - This operator atomically performs a SHL/SRA pair to sign extend a small value in ...
Definition: ISDOpcodes.h:870

llvm::ISD::UDIVFIX
@ UDIVFIX
Definition: ISDOpcodes.h:401

llvm::ISD::UMULFIXSAT
@ UMULFIXSAT
Definition: ISDOpcodes.h:394

llvm::ISD::SMIN
@ SMIN
[US]{MIN/MAX} - Binary minimum or maximum of signed or unsigned integers.
Definition: ISDOpcodes.h:718

llvm::ISD::SDIVFIXSAT
@ SDIVFIXSAT
Same as the corresponding unsaturated fixed point instructions, but the result is clamped between the...
Definition: ISDOpcodes.h:406

llvm::ISD::FP_EXTEND
@ FP_EXTEND
X = FP_EXTEND(Y) - Extend a smaller FP type into a larger FP type.
Definition: ISDOpcodes.h:960

llvm::ISD::VECREDUCE_OR
@ VECREDUCE_OR
Definition: ISDOpcodes.h:1488

llvm::ISD::VSELECT
@ VSELECT
Select with a vector condition (op #0) and two vector operands (ops #1 and #2), returning a vector re...
Definition: ISDOpcodes.h:787

llvm::ISD::STRICT_SINT_TO_FP
@ STRICT_SINT_TO_FP
STRICT_[US]INT_TO_FP - Convert a signed or unsigned integer to a floating point value.
Definition: ISDOpcodes.h:477

llvm::ISD::FROUNDEVEN
@ FROUNDEVEN
Definition: ISDOpcodes.h:1038

llvm::ISD::VECREDUCE_MUL
@ VECREDUCE_MUL
Definition: ISDOpcodes.h:1486

llvm::ISD::MGATHER
@ MGATHER
Masked gather and scatter - load and store operations for a vector of random addresses with additiona...
Definition: ISDOpcodes.h:1413

llvm::ISD::VECREDUCE_UMIN
@ VECREDUCE_UMIN
Definition: ISDOpcodes.h:1493

llvm::ISD::FDIV
@ FDIV
Definition: ISDOpcodes.h:413

llvm::ISD::FREM
@ FREM
Definition: ISDOpcodes.h:414

llvm::ISD::STRICT_FP_TO_UINT
@ STRICT_FP_TO_UINT
Definition: ISDOpcodes.h:471

llvm::ISD::STRICT_FP_ROUND
@ STRICT_FP_ROUND
X = STRICT_FP_ROUND(Y, TRUNC) - Rounding 'Y' from a larger floating point type down to the precision ...
Definition: ISDOpcodes.h:493

llvm::ISD::STRICT_FP_TO_SINT
@ STRICT_FP_TO_SINT
STRICT_FP_TO_[US]INT - Convert a floating point value to a signed or unsigned integer.
Definition: ISDOpcodes.h:470

llvm::ISD::FMINIMUM
@ FMINIMUM
FMINIMUM/FMAXIMUM - NaN-propagating minimum/maximum that also treat -0.0 as less than 0....
Definition: ISDOpcodes.h:1081

llvm::ISD::FP_TO_SINT
@ FP_TO_SINT
FP_TO_[US]INT - Convert a floating point value to a signed or unsigned integer.
Definition: ISDOpcodes.h:908

llvm::ISD::STRICT_FP_EXTEND
@ STRICT_FP_EXTEND
X = STRICT_FP_EXTEND(Y) - Extend a smaller FP type into a larger FP type.
Definition: ISDOpcodes.h:498

llvm::ISD::AND
@ AND
Bitwise operators - logical and, logical or, logical xor.
Definition: ISDOpcodes.h:730

llvm::ISD::FLOG
@ FLOG
Definition: ISDOpcodes.h:1027

llvm::ISD::SCMP
@ SCMP
[US]CMP - 3-way comparison of signed or unsigned integers.
Definition: ISDOpcodes.h:726

llvm::ISD::AVGFLOORS
@ AVGFLOORS
AVGFLOORS/AVGFLOORU - Averaging add - Add two integers using an integer of type i[N+1],...
Definition: ISDOpcodes.h:701

llvm::ISD::VECREDUCE_FMUL
@ VECREDUCE_FMUL
Definition: ISDOpcodes.h:1474

llvm::ISD::STRICT_FADD
@ STRICT_FADD
Constrained versions of the binary floating point operators.
Definition: ISDOpcodes.h:420

llvm::ISD::UREM
@ UREM
Definition: ISDOpcodes.h:265

llvm::ISD::TokenFactor
@ TokenFactor
TokenFactor - This node takes multiple tokens as input and produces a single token result.
Definition: ISDOpcodes.h:53

llvm::ISD::FSIN
@ FSIN
Definition: ISDOpcodes.h:1006

llvm::ISD::FEXP
@ FEXP
Definition: ISDOpcodes.h:1030

llvm::ISD::FCEIL
@ FCEIL
Definition: ISDOpcodes.h:1033

llvm::ISD::STRICT_FSUB
@ STRICT_FSUB
Definition: ISDOpcodes.h:421

llvm::ISD::MUL
@ MUL
Definition: ISDOpcodes.h:261

llvm::ISD::FSINH
@ FSINH
Definition: ISDOpcodes.h:1012

llvm::ISD::FFREXP
@ FFREXP
FFREXP - frexp, extract fractional and exponent component of a floating-point value.
Definition: ISDOpcodes.h:1025

llvm::ISD::FP_ROUND
@ FP_ROUND
X = FP_ROUND(Y, TRUNC) - Rounding 'Y' from a larger floating point type down to the precision of the ...
Definition: ISDOpcodes.h:941

llvm::ISD::VECTOR_COMPRESS
@ VECTOR_COMPRESS
VECTOR_COMPRESS(Vec, Mask, Passthru) consecutively place vector elements based on mask e....
Definition: ISDOpcodes.h:690

llvm::ISD::LROUND
@ LROUND
Definition: ISDOpcodes.h:1040

llvm::ISD::CTLZ
@ CTLZ
Definition: ISDOpcodes.h:767

llvm::ISD::FMAXIMUMNUM
@ FMAXIMUMNUM
Definition: ISDOpcodes.h:1087

llvm::ISD::ZERO_EXTEND_VECTOR_INREG
@ ZERO_EXTEND_VECTOR_INREG
ZERO_EXTEND_VECTOR_INREG(Vector) - This operator represents an in-register zero-extension of the low ...
Definition: ISDOpcodes.h:903

llvm::ISD::FSQRT
@ FSQRT
Definition: ISDOpcodes.h:1004

llvm::ISD::FP_TO_SINT_SAT
@ FP_TO_SINT_SAT
FP_TO_[US]INT_SAT - Convert floating point value in operand 0 to a signed or unsigned scalar integer ...
Definition: ISDOpcodes.h:927

llvm::ISD::VECREDUCE_FMINIMUM
@ VECREDUCE_FMINIMUM
Definition: ISDOpcodes.h:1481

llvm::ISD::TRUNCATE
@ TRUNCATE
TRUNCATE - Completely drop the high bits.
Definition: ISDOpcodes.h:838

llvm::ISD::ROTL
@ ROTL
Definition: ISDOpcodes.h:759

llvm::ISD::VECREDUCE_SEQ_FMUL
@ VECREDUCE_SEQ_FMUL
Definition: ISDOpcodes.h:1459

llvm::ISD::AssertSext
@ AssertSext
AssertSext, AssertZext - These nodes record if a register contains a value that has already been zero...
Definition: ISDOpcodes.h:62

llvm::ISD::BITREVERSE
@ BITREVERSE
Definition: ISDOpcodes.h:769

llvm::ISD::FCOPYSIGN
@ FCOPYSIGN
FCOPYSIGN(X, Y) - Return the value of X with the sign of Y.
Definition: ISDOpcodes.h:521

llvm::ISD::PARTIAL_REDUCE_SUMLA
@ PARTIAL_REDUCE_SUMLA
Definition: ISDOpcodes.h:1512

llvm::ISD::SADDSAT
@ SADDSAT
RESULT = [US]ADDSAT(LHS, RHS) - Perform saturation addition on 2 integers with the same bit width (W)...
Definition: ISDOpcodes.h:360

llvm::ISD::AssertZext
@ AssertZext
Definition: ISDOpcodes.h:63

llvm::ISD::FEXP2
@ FEXP2
Definition: ISDOpcodes.h:1031

llvm::ISD::SMAX
@ SMAX
Definition: ISDOpcodes.h:719

llvm::ISD::UMAX
@ UMAX
Definition: ISDOpcodes.h:721

llvm::ISD::FMINIMUMNUM
@ FMINIMUMNUM
FMINIMUMNUM/FMAXIMUMNUM - minimumnum/maximumnum that is the same as FMINNUM_IEEE and FMAXNUM_IEEE besid...
Definition: ISDOpcodes.h:1086

llvm::ISD::ABDS
@ ABDS
ABDS/ABDU - Absolute difference - Return the absolute difference between two numbers interpreted as s...
Definition: ISDOpcodes.h:713

llvm::ISD::ABDU
@ ABDU
Definition: ISDOpcodes.h:714

llvm::ISD::BUILD_VECTOR
@ BUILD_VECTOR
BUILD_VECTOR(ELT0, ELT1, ELT2, ELT3,...) - Return a fixed-width vector with the specified,...
Definition: ISDOpcodes.h:543

llvm::ISD::getVPMaskIdx
LLVM_ABI std::optional< unsigned > getVPMaskIdx(unsigned Opcode)
The operand position of the vector mask.
Definition: SelectionDAG.cpp:542

llvm::ISD::getVPExplicitVectorLengthIdx
LLVM_ABI std::optional< unsigned > getVPExplicitVectorLengthIdx(unsigned Opcode)
The operand position of the explicit vector length parameter.
Definition: SelectionDAG.cpp:554

llvm::ISD::CondCode
CondCode
ISD::CondCode enum - These are ordered carefully to make the bitfields below work out,...
Definition: ISDOpcodes.h:1685

llvm::ISD::LoadExtType
LoadExtType
LoadExtType enum - This enum defines the three variants of LOADEXT (load with extension).
Definition: ISDOpcodes.h:1665

llvm::ISD::NON_EXTLOAD
@ NON_EXTLOAD
Definition: ISDOpcodes.h:1665

llvm::ISD::isVPOpcode
LLVM_ABI bool isVPOpcode(unsigned Opcode)
Whether this is a vector-predicated Opcode.
Definition: SelectionDAG.cpp:493

llvm::M68k::MemAddrModeKind::j
@ j

llvm::MipsISD::Ext
@ Ext
Definition: MipsISelLowering.h:157

llvm::RTLIB::getSINCOSPI
LLVM_ABI Libcall getSINCOSPI(EVT RetVT)
getSINCOSPI - Return the SINCOSPI_* value for the given types, or UNKNOWN_LIBCALL if there is none.
Definition: TargetLoweringBase.cpp:426

llvm::RTLIB::getMODF
LLVM_ABI Libcall getMODF(EVT RetVT)
getMODF - Return the MODF_* value for the given types, or UNKNOWN_LIBCALL if there is none.
Definition: TargetLoweringBase.cpp:431

llvm::RTLIB::getFPLibCall
LLVM_ABI Libcall getFPLibCall(EVT VT, Libcall Call_F32, Libcall Call_F64, Libcall Call_F80, Libcall Call_F128, Libcall Call_PPCF128)
GetFPLibCall - Helper to return the right libcall for the given floating point type,...

llvm::RTLIB::getSINCOS
LLVM_ABI Libcall getSINCOS(EVT RetVT)
getSINCOS - Return the SINCOS_* value for the given types, or UNKNOWN_LIBCALL if there is none.
Definition: TargetLoweringBase.cpp:421

llvm::VFABI::tryDemangleForVFABI
LLVM_ABI std::optional< VFInfo > tryDemangleForVFABI(StringRef MangledName, const FunctionType *FTy)
Function to construct a VFInfo out of a mangled name in the following format:
Definition: VFABIDemangler.cpp:379

llvm::logicalview::LVAttributeKind::Zero
@ Zero

llvm::ms_demangle::QualifierMangleMode::Result
@ Result

llvm::pdb::PDB_SymType::Callee
@ Callee

llvm
This is an optimization pass for GlobalISel generic memory operations.
Definition: AddressRanges.h:18

llvm::Offset
@ Offset
Definition: DWP.cpp:477

llvm::any_of
bool any_of(R &&range, UnaryPredicate P)
Provide wrappers to std::any_of which take ranges instead of having to pass begin/end explicitly.
Definition: STLExtras.h:1751

llvm::dbgs
LLVM_ABI raw_ostream & dbgs()
dbgs() - This returns a reference to a raw_ostream for debugging messages.
Definition: Debug.cpp:207

llvm::RecurKind::Xor
@ Xor
Bitwise or logical XOR of integers.

llvm::Op
DWARFExpression::Operation Op
Definition: DWARFExpressionPrinter.cpp:22

N
#define N

llvm::EVT
Extended Value Type.
Definition: ValueTypes.h:35

llvm::EVT::changeVectorElementTypeToInteger
EVT changeVectorElementTypeToInteger() const
Return a vector with the same number of elements as this vector, but with the element type converted ...
Definition: ValueTypes.h:94

llvm::EVT::getVectorVT
static EVT getVectorVT(LLVMContext &Context, EVT VT, unsigned NumElements, bool IsScalable=false)
Returns the EVT that represents a vector NumElements in length, where each element is of type VT.
Definition: ValueTypes.h:74

llvm::EVT::getVectorElementCount
ElementCount getVectorElementCount() const
Definition: ValueTypes.h:345

llvm::EVT::getSizeInBits
TypeSize getSizeInBits() const
Return the size of the specified value type in bits.
Definition: ValueTypes.h:368

llvm::EVT::getScalarSizeInBits
uint64_t getScalarSizeInBits() const
Definition: ValueTypes.h:380

llvm::EVT::isFixedLengthVector
bool isFixedLengthVector() const
Definition: ValueTypes.h:181

llvm::EVT::isVector
bool isVector() const
Return true if this is a vector value type.
Definition: ValueTypes.h:168

llvm::EVT::getScalarType
EVT getScalarType() const
If this is a vector type, return the element type, otherwise return this.
Definition: ValueTypes.h:318

llvm::EVT::getTypeForEVT
LLVM_ABI Type * getTypeForEVT(LLVMContext &Context) const
This method returns an LLVM type corresponding to the specified EVT.
Definition: ValueTypes.cpp:216

llvm::EVT::isScalableVector
bool isScalableVector() const
Return true if this is a vector type where the runtime length is machine dependent.
Definition: ValueTypes.h:174

llvm::EVT::getVectorElementType
EVT getVectorElementType() const
Given a vector type, return the type of each element.
Definition: ValueTypes.h:323

llvm::EVT::changeVectorElementType
EVT changeVectorElementType(EVT EltVT) const
Return a VT for a vector type whose attributes match ourselves with the exception of the element type...
Definition: ValueTypes.h:102

llvm::EVT::getVectorNumElements
unsigned getVectorNumElements() const
Given a vector type, return the number of elements it contains.
Definition: ValueTypes.h:331

llvm::EVT::bitsLE
bool bitsLE(EVT VT) const
Return true if this has no more bits than VT.
Definition: ValueTypes.h:303

llvm::SDNodeFlags::Disjoint
@ Disjoint
Definition: SelectionDAGNodes.h:401

llvm::SDVTList
This represents a list of ValueType's that has been intern'd by a SelectionDAG.
Definition: SelectionDAGNodes.h:80

llvm::TargetLowering::CallLoweringInfo
This structure contains all information that is necessary for lowering calls.
Definition: TargetLowering.h:4704