RISCVLegalizerInfo.cpp
1//===-- RISCVLegalizerInfo.cpp ----------------------------------*- C++ -*-===//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8/// \file
9/// This file implements the targeting of the MachineLegalizer class for RISC-V.
10/// \todo This should be generated by TableGen.
11//===----------------------------------------------------------------------===//
12
13#include "RISCVLegalizerInfo.h"
16#include "RISCVSubtarget.h"
29#include "llvm/IR/Intrinsics.h"
30#include "llvm/IR/IntrinsicsRISCV.h"
31#include "llvm/IR/Type.h"
32
33using namespace llvm;
34using namespace LegalityPredicates;
35using namespace LegalizeMutations;
36
37static LegalityPredicate
38typeIsLegalIntOrFPVec(unsigned TypeIdx,
39 std::initializer_list<LLT> IntOrFPVecTys,
40 const RISCVSubtarget &ST) {
41 LegalityPredicate P = [=, &ST](const LegalityQuery &Query) {
42 return ST.hasVInstructions() &&
43 (Query.Types[TypeIdx].getScalarSizeInBits() != 64 ||
44 ST.hasVInstructionsI64()) &&
45 (Query.Types[TypeIdx].getElementCount().getKnownMinValue() != 1 ||
46 ST.getELen() == 64);
47 };
48
49 return all(typeInSet(TypeIdx, IntOrFPVecTys), P);
50}
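// For example, nxv2s64 is only accepted when the subtarget has 64-bit vector
// arithmetic (hasVInstructionsI64), and the fractional nxv1* types are only
// accepted when ELEN is 64.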
51
52static LegalityPredicate
53typeIsLegalBoolVec(unsigned TypeIdx, std::initializer_list<LLT> BoolVecTys,
54 const RISCVSubtarget &ST) {
55 LegalityPredicate P = [=, &ST](const LegalityQuery &Query) {
56 return ST.hasVInstructions() &&
57 (Query.Types[TypeIdx].getElementCount().getKnownMinValue() != 1 ||
58 ST.getELen() == 64);
59 };
60 return all(typeInSet(TypeIdx, BoolVecTys), P);
61}
62
63static LegalityPredicate typeIsLegalPtrVec(unsigned TypeIdx,
64 std::initializer_list<LLT> PtrVecTys,
65 const RISCVSubtarget &ST) {
66 LegalityPredicate P = [=, &ST](const LegalityQuery &Query) {
67 return ST.hasVInstructions() &&
68 (Query.Types[TypeIdx].getElementCount().getKnownMinValue() != 1 ||
69 ST.getELen() == 64) &&
70 (Query.Types[TypeIdx].getElementCount().getKnownMinValue() != 16 ||
71 Query.Types[TypeIdx].getScalarSizeInBits() == 32);
72 };
73 return all(typeInSet(TypeIdx, PtrVecTys), P);
74}
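// Pointer elements are XLen bits wide, so nxv16p0 is only accepted when the
// pointer scalar size is 32 (i.e. on RV32), and nxv1p0 additionally requires
// ELEN == 64.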
75
76RISCVLegalizerInfo::RISCVLegalizerInfo(const RISCVSubtarget &ST)
77 : STI(ST), XLen(STI.getXLen()), sXLen(LLT::scalar(XLen)) {
78 const LLT sDoubleXLen = LLT::scalar(2 * XLen);
79 const LLT p0 = LLT::pointer(0, XLen);
80 const LLT s1 = LLT::scalar(1);
81 const LLT s8 = LLT::scalar(8);
82 const LLT s16 = LLT::scalar(16);
83 const LLT s32 = LLT::scalar(32);
84 const LLT s64 = LLT::scalar(64);
85 const LLT s128 = LLT::scalar(128);
86
87 const LLT nxv1s1 = LLT::scalable_vector(1, s1);
88 const LLT nxv2s1 = LLT::scalable_vector(2, s1);
89 const LLT nxv4s1 = LLT::scalable_vector(4, s1);
90 const LLT nxv8s1 = LLT::scalable_vector(8, s1);
91 const LLT nxv16s1 = LLT::scalable_vector(16, s1);
92 const LLT nxv32s1 = LLT::scalable_vector(32, s1);
93 const LLT nxv64s1 = LLT::scalable_vector(64, s1);
94
95 const LLT nxv1s8 = LLT::scalable_vector(1, s8);
96 const LLT nxv2s8 = LLT::scalable_vector(2, s8);
97 const LLT nxv4s8 = LLT::scalable_vector(4, s8);
98 const LLT nxv8s8 = LLT::scalable_vector(8, s8);
99 const LLT nxv16s8 = LLT::scalable_vector(16, s8);
100 const LLT nxv32s8 = LLT::scalable_vector(32, s8);
101 const LLT nxv64s8 = LLT::scalable_vector(64, s8);
102
103 const LLT nxv1s16 = LLT::scalable_vector(1, s16);
104 const LLT nxv2s16 = LLT::scalable_vector(2, s16);
105 const LLT nxv4s16 = LLT::scalable_vector(4, s16);
106 const LLT nxv8s16 = LLT::scalable_vector(8, s16);
107 const LLT nxv16s16 = LLT::scalable_vector(16, s16);
108 const LLT nxv32s16 = LLT::scalable_vector(32, s16);
109
110 const LLT nxv1s32 = LLT::scalable_vector(1, s32);
111 const LLT nxv2s32 = LLT::scalable_vector(2, s32);
112 const LLT nxv4s32 = LLT::scalable_vector(4, s32);
113 const LLT nxv8s32 = LLT::scalable_vector(8, s32);
114 const LLT nxv16s32 = LLT::scalable_vector(16, s32);
115
116 const LLT nxv1s64 = LLT::scalable_vector(1, s64);
117 const LLT nxv2s64 = LLT::scalable_vector(2, s64);
118 const LLT nxv4s64 = LLT::scalable_vector(4, s64);
119 const LLT nxv8s64 = LLT::scalable_vector(8, s64);
120
121 const LLT nxv1p0 = LLT::scalable_vector(1, p0);
122 const LLT nxv2p0 = LLT::scalable_vector(2, p0);
123 const LLT nxv4p0 = LLT::scalable_vector(4, p0);
124 const LLT nxv8p0 = LLT::scalable_vector(8, p0);
125 const LLT nxv16p0 = LLT::scalable_vector(16, p0);
126
127 using namespace TargetOpcode;
128
129 auto BoolVecTys = {nxv1s1, nxv2s1, nxv4s1, nxv8s1, nxv16s1, nxv32s1, nxv64s1};
130
131 auto IntOrFPVecTys = {nxv1s8, nxv2s8, nxv4s8, nxv8s8, nxv16s8, nxv32s8,
132 nxv64s8, nxv1s16, nxv2s16, nxv4s16, nxv8s16, nxv16s16,
133 nxv32s16, nxv1s32, nxv2s32, nxv4s32, nxv8s32, nxv16s32,
134 nxv1s64, nxv2s64, nxv4s64, nxv8s64};
135
136 auto PtrVecTys = {nxv1p0, nxv2p0, nxv4p0, nxv8p0, nxv16p0};
137
138 getActionDefinitionsBuilder({G_ADD, G_SUB})
139 .legalFor({sXLen})
140 .legalIf(typeIsLegalIntOrFPVec(0, IntOrFPVecTys, ST))
141 .customFor(ST.is64Bit(), {s32})
142 .widenScalarToNextPow2(0)
143 .clampScalar(0, sXLen, sXLen);
144
145 getActionDefinitionsBuilder({G_AND, G_OR, G_XOR})
146 .legalFor({sXLen})
147 .legalIf(typeIsLegalIntOrFPVec(0, IntOrFPVecTys, ST))
148 .widenScalarToNextPow2(0)
149 .clampScalar(0, sXLen, sXLen);
150
151 getActionDefinitionsBuilder(
152 {G_UADDE, G_UADDO, G_USUBE, G_USUBO}).lower();
153
154 getActionDefinitionsBuilder({G_SADDO, G_SSUBO}).minScalar(0, sXLen).lower();
155
156 // TODO: Use Vector Single-Width Saturating Instructions for vector types.
157 getActionDefinitionsBuilder(
158 {G_UADDSAT, G_SADDSAT, G_USUBSAT, G_SSUBSAT, G_SSHLSAT, G_USHLSAT})
159 .lower();
160
161 getActionDefinitionsBuilder({G_SHL, G_ASHR, G_LSHR})
162 .legalFor({{sXLen, sXLen}})
163 .customFor(ST.is64Bit(), {{s32, s32}})
164 .widenScalarToNextPow2(0)
165 .clampScalar(1, sXLen, sXLen)
166 .clampScalar(0, sXLen, sXLen);
167
168 getActionDefinitionsBuilder({G_ZEXT, G_SEXT, G_ANYEXT})
169 .legalFor({{s32, s16}})
170 .legalFor(ST.is64Bit(), {{s64, s16}, {s64, s32}})
171 .legalIf(all(typeIsLegalIntOrFPVec(0, IntOrFPVecTys, ST),
172 typeIsLegalIntOrFPVec(1, IntOrFPVecTys, ST)))
173 .customIf(typeIsLegalBoolVec(1, BoolVecTys, ST))
174 .maxScalar(0, sXLen);
175
176 getActionDefinitionsBuilder(G_SEXT_INREG)
177 .customFor({sXLen})
178 .clampScalar(0, sXLen, sXLen)
179 .lower();
180
181 // Merge/Unmerge
182 for (unsigned Op : {G_MERGE_VALUES, G_UNMERGE_VALUES}) {
183 auto &MergeUnmergeActions = getActionDefinitionsBuilder(Op);
184 unsigned BigTyIdx = Op == G_MERGE_VALUES ? 0 : 1;
185 unsigned LitTyIdx = Op == G_MERGE_VALUES ? 1 : 0;
186 if (XLen == 32 && ST.hasStdExtD()) {
187 MergeUnmergeActions.legalIf(
188 all(typeIs(BigTyIdx, s64), typeIs(LitTyIdx, s32)));
189 }
190 MergeUnmergeActions.widenScalarToNextPow2(LitTyIdx, XLen)
191 .widenScalarToNextPow2(BigTyIdx, XLen)
192 .clampScalar(LitTyIdx, sXLen, sXLen)
193 .clampScalar(BigTyIdx, sXLen, sXLen);
194 }
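  // For example, on RV32 with the D extension a G_MERGE_VALUES forming an s64
  // from two s32 halves (and the matching G_UNMERGE_VALUES) stays legal;
  // everything else is clamped to sXLen.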
195
196 getActionDefinitionsBuilder({G_FSHL, G_FSHR}).lower();
197
198 getActionDefinitionsBuilder({G_ROTR, G_ROTL})
199 .legalFor(ST.hasStdExtZbb() || ST.hasStdExtZbkb(), {{sXLen, sXLen}})
200 .customFor(ST.is64Bit() && (ST.hasStdExtZbb() || ST.hasStdExtZbkb()),
201 {{s32, s32}})
202 .lower();
203
204 getActionDefinitionsBuilder(G_BITREVERSE).maxScalar(0, sXLen).lower();
205
206 getActionDefinitionsBuilder(G_BITCAST).legalIf(
207 all(LegalityPredicates::any(typeIsLegalIntOrFPVec(0, IntOrFPVecTys, ST),
208 typeIsLegalBoolVec(0, BoolVecTys, ST)),
209 LegalityPredicates::any(typeIsLegalIntOrFPVec(1, IntOrFPVecTys, ST),
210 typeIsLegalBoolVec(1, BoolVecTys, ST))));
211
212 auto &BSWAPActions = getActionDefinitionsBuilder(G_BSWAP);
213 if (ST.hasStdExtZbb() || ST.hasStdExtZbkb())
214 BSWAPActions.legalFor({sXLen}).clampScalar(0, sXLen, sXLen);
215 else
216 BSWAPActions.maxScalar(0, sXLen).lower();
217
218 auto &CountZerosActions = getActionDefinitionsBuilder({G_CTLZ, G_CTTZ});
219 auto &CountZerosUndefActions =
220 getActionDefinitionsBuilder({G_CTLZ_ZERO_UNDEF, G_CTTZ_ZERO_UNDEF});
221 if (ST.hasStdExtZbb()) {
222 CountZerosActions.legalFor({{sXLen, sXLen}})
223 .customFor({{s32, s32}})
224 .clampScalar(0, s32, sXLen)
225 .widenScalarToNextPow2(0)
226 .scalarSameSizeAs(1, 0);
227 } else {
228 CountZerosActions.maxScalar(0, sXLen).scalarSameSizeAs(1, 0).lower();
229 CountZerosUndefActions.maxScalar(0, sXLen).scalarSameSizeAs(1, 0);
230 }
231 CountZerosUndefActions.lower();
232
233 auto &CTPOPActions = getActionDefinitionsBuilder(G_CTPOP);
234 if (ST.hasStdExtZbb()) {
235 CTPOPActions.legalFor({{sXLen, sXLen}})
236 .clampScalar(0, sXLen, sXLen)
237 .scalarSameSizeAs(1, 0);
238 } else {
239 CTPOPActions.maxScalar(0, sXLen).scalarSameSizeAs(1, 0).lower();
240 }
241
242 getActionDefinitionsBuilder(G_CONSTANT)
243 .legalFor({p0})
244 .legalFor(!ST.is64Bit(), {s32})
245 .customFor(ST.is64Bit(), {s64})
246 .widenScalarToNextPow2(0)
247 .clampScalar(0, sXLen, sXLen);
248
249 // TODO: transform illegal vector types into legal vector type
250 getActionDefinitionsBuilder(G_FREEZE)
251 .legalFor({s16, s32, p0})
252 .legalFor(ST.is64Bit(), {s64})
253 .legalIf(typeIsLegalBoolVec(0, BoolVecTys, ST))
254 .legalIf(typeIsLegalIntOrFPVec(0, IntOrFPVecTys, ST))
255 .widenScalarToNextPow2(0)
256 .clampScalar(0, s16, sXLen);
257
258 // TODO: transform illegal vector types into legal vector type
259 // TODO: Merge with G_FREEZE?
260 getActionDefinitionsBuilder(
261 {G_IMPLICIT_DEF, G_CONSTANT_FOLD_BARRIER})
262 .legalFor({s32, sXLen, p0})
263 .legalIf(typeIsLegalBoolVec(0, BoolVecTys, ST))
264 .legalIf(typeIsLegalIntOrFPVec(0, IntOrFPVecTys, ST))
265 .widenScalarToNextPow2(0)
266 .clampScalar(0, s32, sXLen);
267
268 getActionDefinitionsBuilder(G_ICMP)
269 .legalFor({{sXLen, sXLen}, {sXLen, p0}})
270 .legalIf(all(typeIsLegalBoolVec(0, BoolVecTys, ST),
271 typeIsLegalIntOrFPVec(1, IntOrFPVecTys, ST)))
272 .widenScalarOrEltToNextPow2OrMinSize(1, 8)
273 .clampScalar(1, sXLen, sXLen)
274 .clampScalar(0, sXLen, sXLen);
275
276 getActionDefinitionsBuilder(G_SELECT)
277 .legalFor({{s32, sXLen}, {p0, sXLen}})
278 .legalIf(all(typeIsLegalIntOrFPVec(0, IntOrFPVecTys, ST),
279 typeIsLegalBoolVec(1, BoolVecTys, ST)))
280 .legalFor(XLen == 64 || ST.hasStdExtD(), {{s64, sXLen}})
281 .widenScalarToNextPow2(0)
282 .clampScalar(0, s32, (XLen == 64 || ST.hasStdExtD()) ? s64 : s32)
283 .clampScalar(1, sXLen, sXLen);
284
285 auto &LoadActions = getActionDefinitionsBuilder(G_LOAD);
286 auto &StoreActions = getActionDefinitionsBuilder(G_STORE);
287 auto &ExtLoadActions = getActionDefinitionsBuilder({G_SEXTLOAD, G_ZEXTLOAD});
288
289 // Return the alignment needed for scalar memory ops. If unaligned scalar mem
290 // is supported, we only require byte alignment. Otherwise, we need the memory
291 // op to be natively aligned.
292 auto getScalarMemAlign = [&ST](unsigned Size) {
293 return ST.enableUnalignedScalarMem() ? 8 : Size;
294 };
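  // For example, getScalarMemAlign(32) is 8 (byte alignment is enough) when
  // unaligned scalar accesses are enabled, and 32 (natural alignment)
  // otherwise.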
295
296 LoadActions.legalForTypesWithMemDesc(
297 {{s16, p0, s8, getScalarMemAlign(8)},
298 {s32, p0, s8, getScalarMemAlign(8)},
299 {s16, p0, s16, getScalarMemAlign(16)},
300 {s32, p0, s16, getScalarMemAlign(16)},
301 {s32, p0, s32, getScalarMemAlign(32)},
302 {p0, p0, sXLen, getScalarMemAlign(XLen)}});
303 StoreActions.legalForTypesWithMemDesc(
304 {{s16, p0, s8, getScalarMemAlign(8)},
305 {s32, p0, s8, getScalarMemAlign(8)},
306 {s16, p0, s16, getScalarMemAlign(16)},
307 {s32, p0, s16, getScalarMemAlign(16)},
308 {s32, p0, s32, getScalarMemAlign(32)},
309 {p0, p0, sXLen, getScalarMemAlign(XLen)}});
310 ExtLoadActions.legalForTypesWithMemDesc(
311 {{sXLen, p0, s8, getScalarMemAlign(8)},
312 {sXLen, p0, s16, getScalarMemAlign(16)}});
313 if (XLen == 64) {
314 LoadActions.legalForTypesWithMemDesc(
315 {{s64, p0, s8, getScalarMemAlign(8)},
316 {s64, p0, s16, getScalarMemAlign(16)},
317 {s64, p0, s32, getScalarMemAlign(32)},
318 {s64, p0, s64, getScalarMemAlign(64)}});
319 StoreActions.legalForTypesWithMemDesc(
320 {{s64, p0, s8, getScalarMemAlign(8)},
321 {s64, p0, s16, getScalarMemAlign(16)},
322 {s64, p0, s32, getScalarMemAlign(32)},
323 {s64, p0, s64, getScalarMemAlign(64)}});
324 ExtLoadActions.legalForTypesWithMemDesc(
325 {{s64, p0, s32, getScalarMemAlign(32)}});
326 } else if (ST.hasStdExtD()) {
327 LoadActions.legalForTypesWithMemDesc(
328 {{s64, p0, s64, getScalarMemAlign(64)}});
329 StoreActions.legalForTypesWithMemDesc(
330 {{s64, p0, s64, getScalarMemAlign(64)}});
331 }
332
333 // Vector loads/stores.
334 if (ST.hasVInstructions()) {
335 LoadActions.legalForTypesWithMemDesc({{nxv2s8, p0, nxv2s8, 8},
336 {nxv4s8, p0, nxv4s8, 8},
337 {nxv8s8, p0, nxv8s8, 8},
338 {nxv16s8, p0, nxv16s8, 8},
339 {nxv32s8, p0, nxv32s8, 8},
340 {nxv64s8, p0, nxv64s8, 8},
341 {nxv2s16, p0, nxv2s16, 16},
342 {nxv4s16, p0, nxv4s16, 16},
343 {nxv8s16, p0, nxv8s16, 16},
344 {nxv16s16, p0, nxv16s16, 16},
345 {nxv32s16, p0, nxv32s16, 16},
346 {nxv2s32, p0, nxv2s32, 32},
347 {nxv4s32, p0, nxv4s32, 32},
348 {nxv8s32, p0, nxv8s32, 32},
349 {nxv16s32, p0, nxv16s32, 32}});
350 StoreActions.legalForTypesWithMemDesc({{nxv2s8, p0, nxv2s8, 8},
351 {nxv4s8, p0, nxv4s8, 8},
352 {nxv8s8, p0, nxv8s8, 8},
353 {nxv16s8, p0, nxv16s8, 8},
354 {nxv32s8, p0, nxv32s8, 8},
355 {nxv64s8, p0, nxv64s8, 8},
356 {nxv2s16, p0, nxv2s16, 16},
357 {nxv4s16, p0, nxv4s16, 16},
358 {nxv8s16, p0, nxv8s16, 16},
359 {nxv16s16, p0, nxv16s16, 16},
360 {nxv32s16, p0, nxv32s16, 16},
361 {nxv2s32, p0, nxv2s32, 32},
362 {nxv4s32, p0, nxv4s32, 32},
363 {nxv8s32, p0, nxv8s32, 32},
364 {nxv16s32, p0, nxv16s32, 32}});
365
366 if (ST.getELen() == 64) {
367 LoadActions.legalForTypesWithMemDesc({{nxv1s8, p0, nxv1s8, 8},
368 {nxv1s16, p0, nxv1s16, 16},
369 {nxv1s32, p0, nxv1s32, 32}});
370 StoreActions.legalForTypesWithMemDesc({{nxv1s8, p0, nxv1s8, 8},
371 {nxv1s16, p0, nxv1s16, 16},
372 {nxv1s32, p0, nxv1s32, 32}});
373 }
374
375 if (ST.hasVInstructionsI64()) {
376 LoadActions.legalForTypesWithMemDesc({{nxv1s64, p0, nxv1s64, 64},
377 {nxv2s64, p0, nxv2s64, 64},
378 {nxv4s64, p0, nxv4s64, 64},
379 {nxv8s64, p0, nxv8s64, 64}});
380 StoreActions.legalForTypesWithMemDesc({{nxv1s64, p0, nxv1s64, 64},
381 {nxv2s64, p0, nxv2s64, 64},
382 {nxv4s64, p0, nxv4s64, 64},
383 {nxv8s64, p0, nxv8s64, 64}});
384 }
385
386 // We will take the custom lowering path if we have scalable vector types
387 // with non-standard alignments.
388 LoadActions.customIf(typeIsLegalIntOrFPVec(0, IntOrFPVecTys, ST));
389 StoreActions.customIf(typeIsLegalIntOrFPVec(0, IntOrFPVecTys, ST));
390
391 // Pointers require that XLen sized elements are legal.
392 if (XLen <= ST.getELen()) {
393 LoadActions.customIf(typeIsLegalPtrVec(0, PtrVecTys, ST));
394 StoreActions.customIf(typeIsLegalPtrVec(0, PtrVecTys, ST));
395 }
396 }
397
398 LoadActions.widenScalarToNextPow2(0, /* MinSize = */ 8)
399 .lowerIfMemSizeNotByteSizePow2()
400 .clampScalar(0, s16, sXLen)
401 .lower();
402 StoreActions
403 .clampScalar(0, s16, sXLen)
404 .lowerIfMemSizeNotByteSizePow2()
405 .lower();
406
407 ExtLoadActions.widenScalarToNextPow2(0).clampScalar(0, sXLen, sXLen).lower();
408
409 getActionDefinitionsBuilder({G_PTR_ADD, G_PTRMASK}).legalFor({{p0, sXLen}});
410
411 getActionDefinitionsBuilder(G_PTRTOINT)
412 .legalFor({{sXLen, p0}})
413 .clampScalar(0, sXLen, sXLen);
414
415 getActionDefinitionsBuilder(G_INTTOPTR)
416 .legalFor({{p0, sXLen}})
417 .clampScalar(1, sXLen, sXLen);
418
419 getActionDefinitionsBuilder(G_BRCOND).legalFor({sXLen}).minScalar(0, sXLen);
420
421 getActionDefinitionsBuilder(G_BRJT).customFor({{p0, sXLen}});
422
423 getActionDefinitionsBuilder(G_BRINDIRECT).legalFor({p0});
424
425 getActionDefinitionsBuilder(G_PHI)
426 .legalFor({p0, s32, sXLen})
427 .widenScalarToNextPow2(0)
428 .clampScalar(0, s32, sXLen);
429
430 getActionDefinitionsBuilder({G_GLOBAL_VALUE, G_JUMP_TABLE, G_CONSTANT_POOL})
431 .legalFor({p0});
432
433 if (ST.hasStdExtZmmul()) {
434 getActionDefinitionsBuilder(G_MUL)
435 .legalFor({sXLen})
436 .widenScalarToNextPow2(0)
437 .clampScalar(0, sXLen, sXLen);
438
439 // clang-format off
440 getActionDefinitionsBuilder({G_SMULH, G_UMULH})
441 .legalFor({sXLen})
442 .lower();
443 // clang-format on
444
445 getActionDefinitionsBuilder({G_SMULO, G_UMULO}).minScalar(0, sXLen).lower();
446 } else {
447 getActionDefinitionsBuilder(G_MUL)
448 .libcallFor({sXLen, sDoubleXLen})
449 .widenScalarToNextPow2(0)
450 .clampScalar(0, sXLen, sDoubleXLen);
451
452 getActionDefinitionsBuilder({G_SMULH, G_UMULH}).lowerFor({sXLen});
453
454 getActionDefinitionsBuilder({G_SMULO, G_UMULO})
455 .minScalar(0, sXLen)
456 // Widen sXLen to sDoubleXLen so we can use a single libcall to get
457 // the low bits for the mul result and high bits to do the overflow
458 // check.
459 .widenScalarIf(typeIs(0, sXLen),
460 LegalizeMutations::changeTo(0, sDoubleXLen))
461 .lower();
462 }
463
464 if (ST.hasStdExtM()) {
465 getActionDefinitionsBuilder({G_SDIV, G_UDIV, G_UREM})
466 .legalFor({sXLen})
467 .customFor({s32})
468 .libcallFor({sDoubleXLen})
469 .clampScalar(0, s32, sDoubleXLen)
470 .widenScalarToNextPow2(0);
471 getActionDefinitionsBuilder(G_SREM)
472 .legalFor({sXLen})
473 .libcallFor({sDoubleXLen})
474 .clampScalar(0, sXLen, sDoubleXLen)
475 .widenScalarToNextPow2(0);
476 } else {
477 getActionDefinitionsBuilder({G_UDIV, G_SDIV, G_UREM, G_SREM})
478 .libcallFor({sXLen, sDoubleXLen})
479 .clampScalar(0, sXLen, sDoubleXLen)
480 .widenScalarToNextPow2(0);
481 }
482
483 // TODO: Use libcall for sDoubleXLen.
484 getActionDefinitionsBuilder({G_SDIVREM, G_UDIVREM}).lower();
485
486 getActionDefinitionsBuilder(G_ABS)
487 .customFor(ST.hasStdExtZbb(), {sXLen})
488 .minScalar(ST.hasStdExtZbb(), 0, sXLen)
489 .lower();
490
491 getActionDefinitionsBuilder({G_UMAX, G_UMIN, G_SMAX, G_SMIN})
492 .legalFor(ST.hasStdExtZbb(), {sXLen})
493 .minScalar(ST.hasStdExtZbb(), 0, sXLen)
494 .lower();
495
496 getActionDefinitionsBuilder({G_SCMP, G_UCMP}).lower();
497
498 getActionDefinitionsBuilder(G_FRAME_INDEX).legalFor({p0});
499
500 getActionDefinitionsBuilder({G_MEMCPY, G_MEMMOVE, G_MEMSET}).libcall();
501
502 getActionDefinitionsBuilder({G_DYN_STACKALLOC, G_STACKSAVE, G_STACKRESTORE})
503 .lower();
504
505 // FP Operations
506
507 // FIXME: Support s128 for rv32 when libcall handling is able to use sret.
508 getActionDefinitionsBuilder(
509 {G_FADD, G_FSUB, G_FMUL, G_FDIV, G_FMA, G_FSQRT, G_FMAXNUM, G_FMINNUM})
510 .legalFor(ST.hasStdExtF(), {s32})
511 .legalFor(ST.hasStdExtD(), {s64})
512 .legalFor(ST.hasStdExtZfh(), {s16})
513 .libcallFor({s32, s64})
514 .libcallFor(ST.is64Bit(), {s128});
515
516 getActionDefinitionsBuilder({G_FNEG, G_FABS})
517 .legalFor(ST.hasStdExtF(), {s32})
518 .legalFor(ST.hasStdExtD(), {s64})
519 .legalFor(ST.hasStdExtZfh(), {s16})
520 .lowerFor({s32, s64, s128});
521
522 getActionDefinitionsBuilder(G_FREM)
523 .libcallFor({s32, s64})
524 .libcallFor(ST.is64Bit(), {s128})
525 .minScalar(0, s32)
526 .scalarize(0);
527
528 getActionDefinitionsBuilder(G_FCOPYSIGN)
529 .legalFor(ST.hasStdExtF(), {{s32, s32}})
530 .legalFor(ST.hasStdExtD(), {{s64, s64}, {s32, s64}, {s64, s32}})
531 .legalFor(ST.hasStdExtZfh(), {{s16, s16}, {s16, s32}, {s32, s16}})
532 .legalFor(ST.hasStdExtZfh() && ST.hasStdExtD(), {{s16, s64}, {s64, s16}})
533 .lower();
534
535 // FIXME: Use Zfhmin.
536 getActionDefinitionsBuilder(G_FPTRUNC)
537 .legalFor(ST.hasStdExtD(), {{s32, s64}})
538 .legalFor(ST.hasStdExtZfh(), {{s16, s32}})
539 .legalFor(ST.hasStdExtZfh() && ST.hasStdExtD(), {{s16, s64}})
540 .libcallFor({{s32, s64}})
541 .libcallFor(ST.is64Bit(), {{s32, s128}, {s64, s128}});
542 getActionDefinitionsBuilder(G_FPEXT)
543 .legalFor(ST.hasStdExtD(), {{s64, s32}})
544 .legalFor(ST.hasStdExtZfh(), {{s32, s16}})
545 .legalFor(ST.hasStdExtZfh() && ST.hasStdExtD(), {{s64, s16}})
546 .libcallFor({{s64, s32}})
547 .libcallFor(ST.is64Bit(), {{s128, s32}, {s128, s64}});
548
549 getActionDefinitionsBuilder(G_FCMP)
550 .legalFor(ST.hasStdExtF(), {{sXLen, s32}})
551 .legalFor(ST.hasStdExtD(), {{sXLen, s64}})
552 .legalFor(ST.hasStdExtZfh(), {{sXLen, s16}})
553 .clampScalar(0, sXLen, sXLen)
554 .libcallFor({{sXLen, s32}, {sXLen, s64}})
555 .libcallFor(ST.is64Bit(), {{sXLen, s128}});
556
557 // TODO: Support vector version of G_IS_FPCLASS.
558 getActionDefinitionsBuilder(G_IS_FPCLASS)
559 .customFor(ST.hasStdExtF(), {{s1, s32}})
560 .customFor(ST.hasStdExtD(), {{s1, s64}})
561 .customFor(ST.hasStdExtZfh(), {{s1, s16}})
562 .lowerFor({{s1, s32}, {s1, s64}});
563
564 getActionDefinitionsBuilder(G_FCONSTANT)
565 .legalFor(ST.hasStdExtF(), {s32})
566 .legalFor(ST.hasStdExtD(), {s64})
567 .legalFor(ST.hasStdExtZfh(), {s16})
568 .lowerFor({s32, s64, s128});
569
570 getActionDefinitionsBuilder({G_FPTOSI, G_FPTOUI})
571 .legalFor(ST.hasStdExtF(), {{sXLen, s32}})
572 .legalFor(ST.hasStdExtD(), {{sXLen, s64}})
573 .legalFor(ST.hasStdExtZfh(), {{sXLen, s16}})
574 .customFor(ST.is64Bit() && ST.hasStdExtF(), {{s32, s32}})
575 .customFor(ST.is64Bit() && ST.hasStdExtD(), {{s32, s64}})
576 .customFor(ST.is64Bit() && ST.hasStdExtZfh(), {{s32, s16}})
577 .widenScalarToNextPow2(0)
578 .minScalar(0, s32)
579 .libcallFor({{s32, s32}, {s64, s32}, {s32, s64}, {s64, s64}})
580 .libcallFor(ST.is64Bit(), {{s32, s128}, {s64, s128}}) // FIXME RV32.
581 .libcallFor(ST.is64Bit(), {{s128, s32}, {s128, s64}, {s128, s128}});
582
583 getActionDefinitionsBuilder({G_SITOFP, G_UITOFP})
584 .legalFor(ST.hasStdExtF(), {{s32, sXLen}})
585 .legalFor(ST.hasStdExtD(), {{s64, sXLen}})
586 .legalFor(ST.hasStdExtZfh(), {{s16, sXLen}})
587 .widenScalarToNextPow2(1)
588 // Promote to XLen if the operation is legal.
589 .widenScalarIf(
590 [=, &ST](const LegalityQuery &Query) {
591 return Query.Types[0].isScalar() && Query.Types[1].isScalar() &&
592 (Query.Types[1].getSizeInBits() < ST.getXLen()) &&
593 ((ST.hasStdExtF() && Query.Types[0].getSizeInBits() == 32) ||
594 (ST.hasStdExtD() && Query.Types[0].getSizeInBits() == 64) ||
595 (ST.hasStdExtZfh() &&
596 Query.Types[0].getSizeInBits() == 16));
597 },
598 LegalizeMutations::changeTo(1, sXLen))
599 // Otherwise only promote to s32 since we have si libcalls.
600 .minScalar(1, s32)
601 .libcallFor({{s32, s32}, {s64, s32}, {s32, s64}, {s64, s64}})
602 .libcallFor(ST.is64Bit(), {{s128, s32}, {s128, s64}}) // FIXME RV32.
603 .libcallFor(ST.is64Bit(), {{s32, s128}, {s64, s128}, {s128, s128}});
604
605 // FIXME: We can do custom inline expansion like SelectionDAG.
606 getActionDefinitionsBuilder({G_FCEIL, G_FFLOOR, G_FRINT, G_FNEARBYINT,
607 G_INTRINSIC_TRUNC, G_INTRINSIC_ROUND,
608 G_INTRINSIC_ROUNDEVEN})
609 .legalFor(ST.hasStdExtZfa(), {s32})
610 .legalFor(ST.hasStdExtZfa() && ST.hasStdExtD(), {s64})
611 .legalFor(ST.hasStdExtZfa() && ST.hasStdExtZfh(), {s16})
612 .libcallFor({s32, s64})
613 .libcallFor(ST.is64Bit(), {s128});
614
615 getActionDefinitionsBuilder({G_FMAXIMUM, G_FMINIMUM})
616 .legalFor(ST.hasStdExtZfa(), {s32})
617 .legalFor(ST.hasStdExtZfa() && ST.hasStdExtD(), {s64})
618 .legalFor(ST.hasStdExtZfa() && ST.hasStdExtZfh(), {s16});
619
620 getActionDefinitionsBuilder({G_FCOS, G_FSIN, G_FTAN, G_FPOW, G_FLOG, G_FLOG2,
621 G_FLOG10, G_FEXP, G_FEXP2, G_FEXP10, G_FACOS,
622 G_FASIN, G_FATAN, G_FATAN2, G_FCOSH, G_FSINH,
623 G_FTANH})
624 .libcallFor({s32, s64})
625 .libcallFor(ST.is64Bit(), {s128});
626 getActionDefinitionsBuilder({G_FPOWI, G_FLDEXP})
627 .libcallFor({{s32, s32}, {s64, s32}})
628 .libcallFor(ST.is64Bit(), {{s128, s32}});
629
630 getActionDefinitionsBuilder(G_VASTART).customFor({p0});
631
632 // va_list must be a pointer, but most sized types are pretty easy to handle
633 // as the destination.
634 getActionDefinitionsBuilder(G_VAARG)
635 // TODO: Implement narrowScalar and widenScalar for G_VAARG for types
636 // other than sXLen.
637 .clampScalar(0, sXLen, sXLen)
638 .lowerForCartesianProduct({sXLen, p0}, {p0});
639
640 getActionDefinitionsBuilder(G_VSCALE)
641 .clampScalar(0, sXLen, sXLen)
642 .customFor({sXLen});
643
644 auto &SplatActions =
645 getActionDefinitionsBuilder(G_SPLAT_VECTOR)
646 .legalIf(all(typeIsLegalIntOrFPVec(0, IntOrFPVecTys, ST),
647 typeIs(1, sXLen)))
648 .customIf(all(typeIsLegalBoolVec(0, BoolVecTys, ST), typeIs(1, s1)));
649 // Handle case of s64 element vectors on RV32. If the subtarget does not have
650 // f64, then try to lower it to G_SPLAT_VECTOR_SPLIT_64_VL. If the subtarget
651 // does have f64, then we don't know whether the type is an f64 or an i64,
652 // so mark the G_SPLAT_VECTOR as legal and decide later what to do with it,
653 // depending on how the instructions it consumes are legalized. They are not
654 // legalized yet since legalization is in reverse postorder, so we cannot
655 // make the decision at this moment.
656 if (XLen == 32) {
657 if (ST.hasVInstructionsF64() && ST.hasStdExtD())
658 SplatActions.legalIf(all(
659 typeInSet(0, {nxv1s64, nxv2s64, nxv4s64, nxv8s64}), typeIs(1, s64)));
660 else if (ST.hasVInstructionsI64())
661 SplatActions.customIf(all(
662 typeInSet(0, {nxv1s64, nxv2s64, nxv4s64, nxv8s64}), typeIs(1, s64)));
663 }
664
665 SplatActions.clampScalar(1, sXLen, sXLen);
666
667 LegalityPredicate ExtractSubvecBitcastPred = [=](const LegalityQuery &Query) {
668 LLT DstTy = Query.Types[0];
669 LLT SrcTy = Query.Types[1];
670 return DstTy.getElementType() == LLT::scalar(1) &&
671 DstTy.getElementCount().getKnownMinValue() >= 8 &&
672 SrcTy.getElementCount().getKnownMinValue() >= 8;
673 };
674 getActionDefinitionsBuilder(G_EXTRACT_SUBVECTOR)
675 // We don't have the ability to slide mask vectors down indexed by their
676 // i1 elements; the smallest we can do is i8. Often we are able to bitcast
677 // to equivalent i8 vectors.
678 .bitcastIf(
679 all(typeIsLegalBoolVec(0, BoolVecTys, ST),
680 typeIsLegalBoolVec(1, BoolVecTys, ST), ExtractSubvecBitcastPred),
681 [=](const LegalityQuery &Query) {
682 LLT CastTy = LLT::vector(
683 Query.Types[0].getElementCount().divideCoefficientBy(8), 8);
684 return std::pair(0, CastTy);
685 })
686 .customIf(LegalityPredicates::any(
687 all(typeIsLegalBoolVec(0, BoolVecTys, ST),
688 typeIsLegalBoolVec(1, BoolVecTys, ST)),
689 all(typeIsLegalIntOrFPVec(0, IntOrFPVecTys, ST),
690 typeIsLegalIntOrFPVec(1, IntOrFPVecTys, ST))));
691
692 getActionDefinitionsBuilder(G_INSERT_SUBVECTOR)
693 .customIf(all(typeIsLegalBoolVec(0, BoolVecTys, ST),
694 typeIsLegalBoolVec(1, BoolVecTys, ST)))
695 .customIf(all(typeIsLegalIntOrFPVec(0, IntOrFPVecTys, ST),
696 typeIsLegalIntOrFPVec(1, IntOrFPVecTys, ST)));
697
698 getActionDefinitionsBuilder(G_ATOMICRMW_ADD)
699 .legalFor(ST.hasStdExtA(), {{sXLen, p0}})
700 .libcallFor(!ST.hasStdExtA(), {{s8, p0}, {s16, p0}, {s32, p0}, {s64, p0}})
701 .clampScalar(0, sXLen, sXLen);
702
703 getLegacyLegalizerInfo().computeTables();
704 verify(*ST.getInstrInfo());
705}
706
707bool RISCVLegalizerInfo::legalizeIntrinsic(LegalizerHelper &Helper,
708 MachineInstr &MI) const {
709 Intrinsic::ID IntrinsicID = cast<GIntrinsic>(MI).getIntrinsicID();
710 switch (IntrinsicID) {
711 default:
712 return false;
713 case Intrinsic::vacopy: {
714 // vacopy arguments must be legal because of the intrinsic signature.
715 // No need to check here.
716
717 MachineIRBuilder &MIRBuilder = Helper.MIRBuilder;
718 MachineRegisterInfo &MRI = *MIRBuilder.getMRI();
719 MachineFunction &MF = *MI.getMF();
720 const DataLayout &DL = MIRBuilder.getDataLayout();
721 LLVMContext &Ctx = MF.getFunction().getContext();
722
723 Register DstLst = MI.getOperand(1).getReg();
724 LLT PtrTy = MRI.getType(DstLst);
725
726 // Load the source va_list
727 Align Alignment = DL.getABITypeAlign(getTypeForLLT(PtrTy, Ctx));
728 MachineMemOperand *LoadMMO = MF.getMachineMemOperand(
729 MachinePointerInfo(), MachineMemOperand::MOLoad, PtrTy, Alignment);
730 auto Tmp = MIRBuilder.buildLoad(PtrTy, MI.getOperand(2), *LoadMMO);
731
732 // Store the result in the destination va_list
733 MachineMemOperand *StoreMMO = MF.getMachineMemOperand(
734 MachinePointerInfo(), MachineMemOperand::MOStore, PtrTy, Alignment);
735 MIRBuilder.buildStore(Tmp, DstLst, *StoreMMO);
736
737 MI.eraseFromParent();
738 return true;
739 }
740 case Intrinsic::riscv_masked_atomicrmw_add:
741 return true;
742 }
743}
744
745bool RISCVLegalizerInfo::legalizeVAStart(MachineInstr &MI,
746 MachineIRBuilder &MIRBuilder) const {
747 // Stores the address of the VarArgsFrameIndex slot into the memory location
748 assert(MI.getOpcode() == TargetOpcode::G_VASTART);
749 MachineFunction *MF = MI.getParent()->getParent();
750 RISCVMachineFunctionInfo *FuncInfo = MF->getInfo<RISCVMachineFunctionInfo>();
751 int FI = FuncInfo->getVarArgsFrameIndex();
752 LLT AddrTy = MIRBuilder.getMRI()->getType(MI.getOperand(0).getReg());
753 auto FINAddr = MIRBuilder.buildFrameIndex(AddrTy, FI);
754 assert(MI.hasOneMemOperand());
755 MIRBuilder.buildStore(FINAddr, MI.getOperand(0).getReg(),
756 *MI.memoperands()[0]);
757 MI.eraseFromParent();
758 return true;
759}
760
761bool RISCVLegalizerInfo::legalizeBRJT(MachineInstr &MI,
762 MachineIRBuilder &MIRBuilder) const {
763 MachineRegisterInfo &MRI = *MIRBuilder.getMRI();
764 auto &MF = *MI.getParent()->getParent();
765 const MachineJumpTableInfo *MJTI = MF.getJumpTableInfo();
766 unsigned EntrySize = MJTI->getEntrySize(MF.getDataLayout());
767
768 Register PtrReg = MI.getOperand(0).getReg();
769 LLT PtrTy = MRI.getType(PtrReg);
770 Register IndexReg = MI.getOperand(2).getReg();
771 LLT IndexTy = MRI.getType(IndexReg);
772
773 if (!isPowerOf2_32(EntrySize))
774 return false;
775
776 auto ShiftAmt = MIRBuilder.buildConstant(IndexTy, Log2_32(EntrySize));
777 IndexReg = MIRBuilder.buildShl(IndexTy, IndexReg, ShiftAmt).getReg(0);
778
779 auto Addr = MIRBuilder.buildPtrAdd(PtrTy, PtrReg, IndexReg);
780
781 MachineMemOperand *MMO = MF.getMachineMemOperand(
782 MachinePointerInfo::getJumpTable(MF), MachineMemOperand::MOLoad,
783 EntrySize, Align(MJTI->getEntryAlignment(MF.getDataLayout())));
784
785 Register TargetReg;
786 switch (MJTI->getEntryKind()) {
787 default:
788 return false;
789 case MachineJumpTableInfo::EK_LabelDifference32: {
790 // For PIC, the sequence is:
791 // BRIND(load(Jumptable + index) + RelocBase)
792 // RelocBase can be JumpTable, GOT or some sort of global base.
793 unsigned LoadOpc =
794 STI.is64Bit() ? TargetOpcode::G_SEXTLOAD : TargetOpcode::G_LOAD;
795 auto Load = MIRBuilder.buildLoadInstr(LoadOpc, IndexTy, Addr, *MMO);
796 TargetReg = MIRBuilder.buildPtrAdd(PtrTy, PtrReg, Load).getReg(0);
797 break;
798 }
799 case MachineJumpTableInfo::EK_Custom32: {
800 auto Load = MIRBuilder.buildLoadInstr(TargetOpcode::G_SEXTLOAD, IndexTy,
801 Addr, *MMO);
802 TargetReg = MIRBuilder.buildIntToPtr(PtrTy, Load).getReg(0);
803 break;
804 }
805 case MachineJumpTableInfo::EK_BlockAddress:
806 TargetReg = MIRBuilder.buildLoad(PtrTy, Addr, *MMO).getReg(0);
807 break;
808 }
809
810 MIRBuilder.buildBrIndirect(TargetReg);
811
812 MI.eraseFromParent();
813 return true;
814}
815
816bool RISCVLegalizerInfo::shouldBeInConstantPool(const APInt &APImm,
817 bool ShouldOptForSize) const {
818 assert(APImm.getBitWidth() == 32 || APImm.getBitWidth() == 64);
819 int64_t Imm = APImm.getSExtValue();
820 // All simm32 constants should be handled by isel.
821 // NOTE: The getMaxBuildIntsCost call below should return a value >= 2 making
822 // this check redundant, but small immediates are common so this check
823 // should have better compile time.
824 if (isInt<32>(Imm))
825 return false;
826
827 // We only need to cost the immediate, if constant pool lowering is enabled.
828 if (!STI.useConstantPoolForLargeInts())
829 return false;
830
831 RISCVMatInt::InstSeq Seq = RISCVMatInt::generateInstSeq(Imm, STI);
832 if (Seq.size() <= STI.getMaxBuildIntsCost())
833 return false;
834
835 // Optimizations below are disabled for opt size. If we're optimizing for
836 // size, use a constant pool.
837 if (ShouldOptForSize)
838 return true;
839 //
840 // Special case. See if we can build the constant as (ADD (SLLI X, C), X);
841 // do that if it will avoid a constant pool.
842 // It will require an extra temporary register though.
843 // If we have Zba we can use (ADD_UW X, (SLLI X, 32)) to handle cases where
844 // the low and high 32 bits are the same and bits 31 and 63 are set.
845 unsigned ShiftAmt, AddOpc;
846 RISCVMatInt::InstSeq SeqLo =
847 RISCVMatInt::generateTwoRegInstSeq(Imm, STI, ShiftAmt, AddOpc);
848 return !(!SeqLo.empty() && (SeqLo.size() + 2) <= STI.getMaxBuildIntsCost());
849}
850
851bool RISCVLegalizerInfo::legalizeVScale(MachineInstr &MI,
852 MachineIRBuilder &MIB) const {
853 const LLT XLenTy(STI.getXLenVT());
854 Register Dst = MI.getOperand(0).getReg();
855
856 // We define our scalable vector types for lmul=1 to use a 64 bit known
857 // minimum size. e.g. <vscale x 2 x i32>. VLENB is in bytes so we calculate
858 // vscale as VLENB / 8.
859 static_assert(RISCV::RVVBitsPerBlock == 64, "Unexpected bits per block!");
860 if (STI.getRealMinVLen() < RISCV::RVVBitsPerBlock)
861 // Support for VLEN==32 is incomplete.
862 return false;
863
864 // We assume VLENB is a multiple of 8. We manually choose the best shift
865 // here because SimplifyDemandedBits isn't always able to simplify it.
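  // For example, a multiplier of 4 becomes (VLENB >> 1), 8 becomes VLENB
  // itself, 16 becomes (VLENB << 1), 24 becomes (VLENB * 3), and 5 becomes
  // ((VLENB >> 3) * 5).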
866 uint64_t Val = MI.getOperand(1).getCImm()->getZExtValue();
867 if (isPowerOf2_64(Val)) {
868 uint64_t Log2 = Log2_64(Val);
869 if (Log2 < 3) {
870 auto VLENB = MIB.buildInstr(RISCV::G_READ_VLENB, {XLenTy}, {});
871 MIB.buildLShr(Dst, VLENB, MIB.buildConstant(XLenTy, 3 - Log2));
872 } else if (Log2 > 3) {
873 auto VLENB = MIB.buildInstr(RISCV::G_READ_VLENB, {XLenTy}, {});
874 MIB.buildShl(Dst, VLENB, MIB.buildConstant(XLenTy, Log2 - 3));
875 } else {
876 MIB.buildInstr(RISCV::G_READ_VLENB, {Dst}, {});
877 }
878 } else if ((Val % 8) == 0) {
879 // If the multiplier is a multiple of 8, scale it down to avoid needing
880 // to shift the VLENB value.
881 auto VLENB = MIB.buildInstr(RISCV::G_READ_VLENB, {XLenTy}, {});
882 MIB.buildMul(Dst, VLENB, MIB.buildConstant(XLenTy, Val / 8));
883 } else {
884 auto VLENB = MIB.buildInstr(RISCV::G_READ_VLENB, {XLenTy}, {});
885 auto VScale = MIB.buildLShr(XLenTy, VLENB, MIB.buildConstant(XLenTy, 3));
886 MIB.buildMul(Dst, VScale, MIB.buildConstant(XLenTy, Val));
887 }
888 MI.eraseFromParent();
889 return true;
890}
891
892// Custom-lower extensions from mask vectors by using a vselect either with 1
893// for zero/any-extension or -1 for sign-extension:
894// (vXiN = (s|z)ext vXi1:vmask) -> (vXiN = vselect vmask, (-1 or 1), 0)
895// Note that any-extension is lowered identically to zero-extension.
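// For example (illustrative G-MIR, assuming a legal nxv4s1 mask type):
//   %e:_(<vscale x 4 x s16>) = G_SEXT %m:_(<vscale x 4 x s1>)
// is rewritten to roughly:
//   %ones:_(<vscale x 4 x s16>) = G_SPLAT_VECTOR -1
//   %zero:_(<vscale x 4 x s16>) = G_SPLAT_VECTOR 0
//   %e:_(<vscale x 4 x s16>)    = G_SELECT %m, %ones, %zero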
896bool RISCVLegalizerInfo::legalizeExt(MachineInstr &MI,
897 MachineIRBuilder &MIB) const {
898
899 unsigned Opc = MI.getOpcode();
900 assert(Opc == TargetOpcode::G_ZEXT || Opc == TargetOpcode::G_SEXT ||
901 Opc == TargetOpcode::G_ANYEXT);
902
903 MachineRegisterInfo &MRI = *MIB.getMRI();
904 Register Dst = MI.getOperand(0).getReg();
905 Register Src = MI.getOperand(1).getReg();
906
907 LLT DstTy = MRI.getType(Dst);
908 int64_t ExtTrueVal = Opc == TargetOpcode::G_SEXT ? -1 : 1;
909 LLT DstEltTy = DstTy.getElementType();
910 auto SplatZero = MIB.buildSplatVector(DstTy, MIB.buildConstant(DstEltTy, 0));
911 auto SplatTrue =
912 MIB.buildSplatVector(DstTy, MIB.buildConstant(DstEltTy, ExtTrueVal));
913 MIB.buildSelect(Dst, Src, SplatTrue, SplatZero);
914
915 MI.eraseFromParent();
916 return true;
917}
918
919bool RISCVLegalizerInfo::legalizeLoadStore(MachineInstr &MI,
920 LegalizerHelper &Helper,
921 MachineIRBuilder &MIB) const {
922 assert((isa<GLoad>(MI) || isa<GStore>(MI)) &&
923 "Machine instructions must be Load/Store.");
924 MachineRegisterInfo &MRI = *MIB.getMRI();
925 MachineFunction *MF = MI.getMF();
926 const DataLayout &DL = MIB.getDataLayout();
927 LLVMContext &Ctx = MF->getFunction().getContext();
928
929 Register DstReg = MI.getOperand(0).getReg();
930 LLT DataTy = MRI.getType(DstReg);
931 if (!DataTy.isVector())
932 return false;
933
934 if (!MI.hasOneMemOperand())
935 return false;
936
937 MachineMemOperand *MMO = *MI.memoperands_begin();
938
939 const auto *TLI = STI.getTargetLowering();
940 EVT VT = EVT::getEVT(getTypeForLLT(DataTy, Ctx));
941
942 if (TLI->allowsMemoryAccessForAlignment(Ctx, DL, VT, *MMO))
943 return true;
944
945 unsigned EltSizeBits = DataTy.getScalarSizeInBits();
946 assert((EltSizeBits == 16 || EltSizeBits == 32 || EltSizeBits == 64) &&
947 "Unexpected unaligned RVV load type");
948
949 // Calculate the new vector type with i8 elements
950 unsigned NumElements =
951 DataTy.getElementCount().getKnownMinValue() * (EltSizeBits / 8);
952 LLT NewDataTy = LLT::scalable_vector(NumElements, 8);
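  // For example (illustrative), an under-aligned nxv2s32 access is rewritten
  // as an nxv8s8 access covering the same bytes, which only needs byte
  // alignment.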
953
954 Helper.bitcast(MI, 0, NewDataTy);
955
956 return true;
957}
958
959/// Return the mask type suitable for masking the provided
960/// vector type. This is simply an i1 element type vector of the same
961/// (possibly scalable) length.
962static LLT getMaskTypeFor(LLT VecTy) {
963 assert(VecTy.isVector());
964 ElementCount EC = VecTy.getElementCount();
965 return LLT::vector(EC, LLT::scalar(1));
966}
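// For example, getMaskTypeFor(nxv4s32) is nxv4s1.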
967
968/// Creates an all ones mask suitable for masking a vector of type VecTy with
969/// vector length VL.
970static MachineInstrBuilder buildAllOnesMask(LLT VecTy, const SrcOp &VL,
971 MachineIRBuilder &MIB,
972 MachineRegisterInfo &MRI) {
973 LLT MaskTy = getMaskTypeFor(VecTy);
974 return MIB.buildInstr(RISCV::G_VMSET_VL, {MaskTy}, {VL});
975}
976
977/// Gets the two common "VL" operands: an all-ones mask and the vector length.
978/// VecTy is a scalable vector type.
979static std::pair<MachineInstrBuilder, MachineInstrBuilder>
980buildDefaultVLOps(LLT VecTy, MachineIRBuilder &MIB, MachineRegisterInfo &MRI) {
981 assert(VecTy.isScalableVector() && "Expecting scalable container type");
982 const RISCVSubtarget &STI = MIB.getMF().getSubtarget<RISCVSubtarget>();
983 LLT XLenTy(STI.getXLenVT());
984 auto VL = MIB.buildConstant(XLenTy, -1);
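  // A VL of -1 (all ones in XLen) acts as the VLMAX sentinel here, i.e. the
  // whole register group is operated on.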
985 auto Mask = buildAllOnesMask(VecTy, VL, MIB, MRI);
986 return {Mask, VL};
987}
988
989static MachineInstrBuilder
990buildSplatPartsS64WithVL(const DstOp &Dst, const SrcOp &Passthru, Register Lo,
991 Register Hi, const SrcOp &VL, MachineIRBuilder &MIB,
992 MachineRegisterInfo &MRI) {
993 // TODO: If the Hi bits of the splat are undefined, then it's fine to just
994 // splat Lo even if it might be sign extended. I don't think we have
995 // introduced a case where we build an s64 whose upper bits are undef
996 // yet.
997
998 // Fall back to a stack store and stride x0 vector load.
999 // TODO: need to lower G_SPLAT_VECTOR_SPLIT_I64. This is done in
1000 // preprocessDAG in SDAG.
1001 return MIB.buildInstr(RISCV::G_SPLAT_VECTOR_SPLIT_I64_VL, {Dst},
1002 {Passthru, Lo, Hi, VL});
1003}
1004
1005static MachineInstrBuilder
1006buildSplatSplitS64WithVL(const DstOp &Dst, const SrcOp &Passthru,
1007 const SrcOp &Scalar, const SrcOp &VL,
1008 MachineIRBuilder &MIB, MachineRegisterInfo &MRI) {
1009 assert(Scalar.getLLTTy(MRI) == LLT::scalar(64) && "Unexpected VecTy!");
1010 auto Unmerge = MIB.buildUnmerge(LLT::scalar(32), Scalar);
1011 return buildSplatPartsS64WithVL(Dst, Passthru, Unmerge.getReg(0),
1012 Unmerge.getReg(1), VL, MIB, MRI);
1013}
1014
1015// Lower splats of s1 types to G_ICMP. For each mask vector type, we have a
1016// legal equivalently-sized i8 type, so we can use that as a go-between.
1017// Splats of s1 types that have constant value can be legalized as VMSET_VL or
1018// VMCLR_VL.
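// For a non-constant s1 splat the code below ends up building, roughly
// (illustrative):
//   %b:_(s8)                  = G_AND (G_ZEXT %val), 1
//   %lhs:_(<vscale x N x s8>) = G_SPLAT_VECTOR %b
//   %dst:_(<vscale x N x s1>) = G_ICMP intpred(ne), %lhs, (splat 0)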
1019bool RISCVLegalizerInfo::legalizeSplatVector(MachineInstr &MI,
1020 MachineIRBuilder &MIB) const {
1021 assert(MI.getOpcode() == TargetOpcode::G_SPLAT_VECTOR);
1022
1023 MachineRegisterInfo &MRI = *MIB.getMRI();
1024
1025 Register Dst = MI.getOperand(0).getReg();
1026 Register SplatVal = MI.getOperand(1).getReg();
1027
1028 LLT VecTy = MRI.getType(Dst);
1029 LLT XLenTy(STI.getXLenVT());
1030
1031 // Handle case of s64 element vectors on rv32
1032 if (XLenTy.getSizeInBits() == 32 &&
1033 VecTy.getElementType().getSizeInBits() == 64) {
1034 auto [_, VL] = buildDefaultVLOps(MRI.getType(Dst), MIB, MRI);
1035 buildSplatSplitS64WithVL(Dst, MIB.buildUndef(VecTy), SplatVal, VL, MIB,
1036 MRI);
1037 MI.eraseFromParent();
1038 return true;
1039 }
1040
1041 // All-zeros or all-ones splats are handled specially.
1042 MachineInstr &SplatValMI = *MRI.getVRegDef(SplatVal);
1043 if (isAllOnesOrAllOnesSplat(SplatValMI, MRI)) {
1044 auto VL = buildDefaultVLOps(VecTy, MIB, MRI).second;
1045 MIB.buildInstr(RISCV::G_VMSET_VL, {Dst}, {VL});
1046 MI.eraseFromParent();
1047 return true;
1048 }
1049 if (isNullOrNullSplat(SplatValMI, MRI)) {
1050 auto VL = buildDefaultVLOps(VecTy, MIB, MRI).second;
1051 MIB.buildInstr(RISCV::G_VMCLR_VL, {Dst}, {VL});
1052 MI.eraseFromParent();
1053 return true;
1054 }
1055
1056 // Handle non-constant mask splat (i.e. not sure if it's all zeros or all
1057 // ones) by promoting it to an s8 splat.
1058 LLT InterEltTy = LLT::scalar(8);
1059 LLT InterTy = VecTy.changeElementType(InterEltTy);
1060 auto ZExtSplatVal = MIB.buildZExt(InterEltTy, SplatVal);
1061 auto And =
1062 MIB.buildAnd(InterEltTy, ZExtSplatVal, MIB.buildConstant(InterEltTy, 1));
1063 auto LHS = MIB.buildSplatVector(InterTy, And);
1064 auto ZeroSplat =
1065 MIB.buildSplatVector(InterTy, MIB.buildConstant(InterEltTy, 0));
1066 MIB.buildICmp(CmpInst::Predicate::ICMP_NE, Dst, LHS, ZeroSplat);
1067 MI.eraseFromParent();
1068 return true;
1069}
1070
1071static LLT getLMUL1Ty(LLT VecTy) {
1072 assert(VecTy.getElementType().getSizeInBits() <= 64 &&
1073 "Unexpected vector LLT");
1074 return LLT::scalable_vector(RISCV::RVVBitsPerBlock /
1075 VecTy.getElementType().getSizeInBits(),
1076 VecTy.getElementType());
1077}
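// For example, getLMUL1Ty(nxv8s32) is nxv2s32: with RVVBitsPerBlock == 64, an
// LMUL=1 register holds 64 / 32 == 2 elements per vscale.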
1078
1079bool RISCVLegalizerInfo::legalizeExtractSubvector(MachineInstr &MI,
1080 MachineIRBuilder &MIB) const {
1081 GExtractSubvector &ES = cast<GExtractSubvector>(MI);
1082
1083 MachineRegisterInfo &MRI = *MIB.getMRI();
1084
1085 Register Dst = ES.getReg(0);
1086 Register Src = ES.getSrcVec();
1087 uint64_t Idx = ES.getIndexImm();
1088
1089 // With an index of 0 this is a cast-like subvector, which can be performed
1090 // with subregister operations.
1091 if (Idx == 0)
1092 return true;
1093
1094 LLT LitTy = MRI.getType(Dst);
1095 LLT BigTy = MRI.getType(Src);
1096
1097 if (LitTy.getElementType() == LLT::scalar(1)) {
1098 // We can't slide this mask vector up indexed by its i1 elements.
1099 // This poses a problem when we wish to insert a scalable vector which
1100 // can't be re-expressed as a larger type. Just choose the slow path and
1101 // extend to a larger type, then truncate back down.
1102 LLT ExtBigTy = BigTy.changeElementType(LLT::scalar(8));
1103 LLT ExtLitTy = LitTy.changeElementType(LLT::scalar(8));
1104 auto BigZExt = MIB.buildZExt(ExtBigTy, Src);
1105 auto ExtractZExt = MIB.buildExtractSubvector(ExtLitTy, BigZExt, Idx);
1106 auto SplatZero = MIB.buildSplatVector(
1107 ExtLitTy, MIB.buildConstant(ExtLitTy.getElementType(), 0));
1108 MIB.buildICmp(CmpInst::Predicate::ICMP_NE, Dst, ExtractZExt, SplatZero);
1109 MI.eraseFromParent();
1110 return true;
1111 }
1112
1113 // extract_subvector scales the index by vscale if the subvector is scalable,
1114 // and decomposeSubvectorInsertExtractToSubRegs takes this into account.
1115 const RISCVRegisterInfo *TRI = STI.getRegisterInfo();
1116 MVT LitTyMVT = getMVTForLLT(LitTy);
1117 auto Decompose =
1118 RISCVTargetLowering::decomposeSubvectorInsertExtractToSubRegs(
1119 getMVTForLLT(BigTy), LitTyMVT, Idx, TRI);
1120 unsigned RemIdx = Decompose.second;
1121
1122 // If the Idx has been completely eliminated then this is a subvector extract
1123 // which naturally aligns to a vector register. These can easily be handled
1124 // using subregister manipulation.
1125 if (RemIdx == 0)
1126 return true;
1127
1128 // Else LitTy is M1 or smaller and may need to be slid down: if LitTy
1129 // was > M1 then the index would need to be a multiple of VLMAX, and so would
1130 // divide exactly.
1131 assert(
1134
1135 // If the vector type is an LMUL-group type, extract a subvector equal to the
1136 // nearest full vector register type.
1137 LLT InterLitTy = BigTy;
1138 Register Vec = Src;
1139 if (TypeSize::isKnownGT(BigTy.getSizeInBits(),
1140 getLMUL1Ty(BigTy).getSizeInBits())) {
1141 // If BigTy has an LMUL > 1, then LitTy should have a smaller LMUL, and
1142 // we should have successfully decomposed the extract into a subregister.
1143 assert(Decompose.first != RISCV::NoSubRegister);
1144 InterLitTy = getLMUL1Ty(BigTy);
1145 // SDAG builds a TargetExtractSubreg. We cannot create a Copy with SubReg
1146 // specified on the source Register (the equivalent) since generic virtual
1147 // register does not allow subregister index.
1148 Vec = MIB.buildExtractSubvector(InterLitTy, Src, Idx - RemIdx).getReg(0);
1149 }
1150
1151 // Slide this vector register down by the desired number of elements in order
1152 // to place the desired subvector starting at element 0.
1153 const LLT XLenTy(STI.getXLenVT());
1154 auto SlidedownAmt = MIB.buildVScale(XLenTy, RemIdx);
1155 auto [Mask, VL] = buildDefaultVLOps(LitTy, MIB, MRI);
1157 auto Slidedown = MIB.buildInstr(
1158 RISCV::G_VSLIDEDOWN_VL, {InterLitTy},
1159 {MIB.buildUndef(InterLitTy), Vec, SlidedownAmt, Mask, VL, Policy});
1160
1161 // Now the vector is in the right position, extract our final subvector. This
1162 // should resolve to a COPY.
1163 MIB.buildExtractSubvector(Dst, Slidedown, 0);
1164
1165 MI.eraseFromParent();
1166 return true;
1167}
1168
1169bool RISCVLegalizerInfo::legalizeInsertSubvector(MachineInstr &MI,
1170 LegalizerHelper &Helper,
1171 MachineIRBuilder &MIB) const {
1172 GInsertSubvector &IS = cast<GInsertSubvector>(MI);
1173
1174 MachineRegisterInfo &MRI = *MIB.getMRI();
1175
1176 Register Dst = IS.getReg(0);
1177 Register BigVec = IS.getBigVec();
1178 Register LitVec = IS.getSubVec();
1179 uint64_t Idx = IS.getIndexImm();
1180
1181 LLT BigTy = MRI.getType(BigVec);
1182 LLT LitTy = MRI.getType(LitVec);
1183
1184 if (Idx == 0 ||
1185 MRI.getVRegDef(BigVec)->getOpcode() == TargetOpcode::G_IMPLICIT_DEF)
1186 return true;
1187
1188 // We don't have the ability to slide mask vectors up indexed by their i1
1189 // elements; the smallest we can do is i8. Often we are able to bitcast to
1190 // equivalent i8 vectors. Otherwise, we must zero-extend to equivalent i8
1191 // vectors and truncate down after the insert.
1192 if (LitTy.getElementType() == LLT::scalar(1)) {
1193 auto BigTyMinElts = BigTy.getElementCount().getKnownMinValue();
1194 auto LitTyMinElts = LitTy.getElementCount().getKnownMinValue();
1195 if (BigTyMinElts >= 8 && LitTyMinElts >= 8)
1196 return Helper.bitcast(
1197 IS, 0,
1198 LLT::vector(BigTy.getElementCount().divideCoefficientBy(8), 8));
1199
1200 // We can't slide this mask vector up indexed by its i1 elements.
1201 // This poses a problem when we wish to insert a scalable vector which
1202 // can't be re-expressed as a larger type. Just choose the slow path and
1203 // extend to a larger type, then truncate back down.
1204 LLT ExtBigTy = BigTy.changeElementType(LLT::scalar(8));
1205 return Helper.widenScalar(IS, 0, ExtBigTy);
1206 }
1207
1208 const RISCVRegisterInfo *TRI = STI.getRegisterInfo();
1209 unsigned SubRegIdx, RemIdx;
1210 std::tie(SubRegIdx, RemIdx) =
1211 RISCVTargetLowering::decomposeSubvectorInsertExtractToSubRegs(
1212 getMVTForLLT(BigTy), getMVTForLLT(LitTy), Idx, TRI);
1213
1214 TypeSize VecRegSize = TypeSize::getScalable(RISCV::RVVBitsPerBlock);
1215 assert(isPowerOf2_64(
1216 STI.expandVScale(LitTy.getSizeInBits()).getKnownMinValue()));
1217 bool ExactlyVecRegSized =
1218 STI.expandVScale(LitTy.getSizeInBits())
1219 .isKnownMultipleOf(STI.expandVScale(VecRegSize));
1220
1221 // If the Idx has been completely eliminated and this subvector's size is a
1222 // vector register or a multiple thereof, or the surrounding elements are
1223 // undef, then this is a subvector insert which naturally aligns to a vector
1224 // register. These can easily be handled using subregister manipulation.
1225 if (RemIdx == 0 && ExactlyVecRegSized)
1226 return true;
1227
1228 // If the subvector is smaller than a vector register, then the insertion
1229 // must preserve the undisturbed elements of the register. We do this by
1230 // lowering to an EXTRACT_SUBVECTOR grabbing the nearest LMUL=1 vector type
1231 // (which resolves to a subregister copy), performing a VSLIDEUP to place the
1232 // subvector within the vector register, and an INSERT_SUBVECTOR of that
1233 // LMUL=1 type back into the larger vector (resolving to another subregister
1234 // operation). See below for how our VSLIDEUP works. We go via a LMUL=1 type
1235 // to avoid allocating a large register group to hold our subvector.
1236
1237 // VSLIDEUP works by leaving elements 0<i<OFFSET undisturbed, elements
1238 // OFFSET<=i<VL set to the "subvector" and vl<=i<VLMAX set to the tail policy
1239 // (in our case undisturbed). This means we can set up a subvector insertion
1240 // where OFFSET is the insertion offset, and the VL is the OFFSET plus the
1241 // size of the subvector.
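  // For example (illustrative): inserting an nxv1s32 subvector into an
  // nxv2s32 vector at index 1 gives OFFSET = vscale x 1 and VL = vscale x 2;
  // since that VL covers the whole LMUL=1 container, the tail-agnostic policy
  // can be used.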
1242 const LLT XLenTy(STI.getXLenVT());
1243 LLT InterLitTy = BigTy;
1244 Register AlignedExtract = BigVec;
1245 unsigned AlignedIdx = Idx - RemIdx;
1246 if (TypeSize::isKnownGT(BigTy.getSizeInBits(),
1247 getLMUL1Ty(BigTy).getSizeInBits())) {
1248 InterLitTy = getLMUL1Ty(BigTy);
1249 // Extract a subvector equal to the nearest full vector register type. This
1250 // should resolve to a G_EXTRACT on a subreg.
1251 AlignedExtract =
1252 MIB.buildExtractSubvector(InterLitTy, BigVec, AlignedIdx).getReg(0);
1253 }
1254
1255 auto Insert = MIB.buildInsertSubvector(InterLitTy, MIB.buildUndef(InterLitTy),
1256 LitVec, 0);
1257
1258 auto [Mask, _] = buildDefaultVLOps(BigTy, MIB, MRI);
1259 auto VL = MIB.buildVScale(XLenTy, LitTy.getElementCount().getKnownMinValue());
1260
1261 // If we're inserting into the lowest elements, use a tail undisturbed
1262 // vmv.v.v.
1263 MachineInstrBuilder Inserted;
1264 bool NeedInsertSubvec =
1265 TypeSize::isKnownGT(BigTy.getSizeInBits(), InterLitTy.getSizeInBits());
1266 Register InsertedDst =
1267 NeedInsertSubvec ? MRI.createGenericVirtualRegister(InterLitTy) : Dst;
1268 if (RemIdx == 0) {
1269 Inserted = MIB.buildInstr(RISCV::G_VMV_V_V_VL, {InsertedDst},
1270 {AlignedExtract, Insert, VL});
1271 } else {
1272 auto SlideupAmt = MIB.buildVScale(XLenTy, RemIdx);
1273 // Construct the vector length corresponding to RemIdx + length(LitTy).
1274 VL = MIB.buildAdd(XLenTy, SlideupAmt, VL);
1275 // Use tail agnostic policy if we're inserting over InterLitTy's tail.
1276 ElementCount EndIndex =
1279 if (STI.expandVScale(EndIndex) ==
1280 STI.expandVScale(InterLitTy.getElementCount()))
1282
1283 Inserted =
1284 MIB.buildInstr(RISCV::G_VSLIDEUP_VL, {InsertedDst},
1285 {AlignedExtract, Insert, SlideupAmt, Mask, VL, Policy});
1286 }
1287
1288 // If required, insert this subvector back into the correct vector register.
1289 // This should resolve to an INSERT_SUBREG instruction.
1290 if (NeedInsertSubvec)
1291 MIB.buildInsertSubvector(Dst, BigVec, Inserted, AlignedIdx);
1292
1293 MI.eraseFromParent();
1294 return true;
1295}
1296
1297static unsigned getRISCVWOpcode(unsigned Opcode) {
1298 switch (Opcode) {
1299 default:
1300 llvm_unreachable("Unexpected opcode");
1301 case TargetOpcode::G_ASHR:
1302 return RISCV::G_SRAW;
1303 case TargetOpcode::G_LSHR:
1304 return RISCV::G_SRLW;
1305 case TargetOpcode::G_SHL:
1306 return RISCV::G_SLLW;
1307 case TargetOpcode::G_SDIV:
1308 return RISCV::G_DIVW;
1309 case TargetOpcode::G_UDIV:
1310 return RISCV::G_DIVUW;
1311 case TargetOpcode::G_UREM:
1312 return RISCV::G_REMUW;
1313 case TargetOpcode::G_ROTL:
1314 return RISCV::G_ROLW;
1315 case TargetOpcode::G_ROTR:
1316 return RISCV::G_RORW;
1317 case TargetOpcode::G_CTLZ:
1318 return RISCV::G_CLZW;
1319 case TargetOpcode::G_CTTZ:
1320 return RISCV::G_CTZW;
1321 case TargetOpcode::G_FPTOSI:
1322 return RISCV::G_FCVT_W_RV64;
1323 case TargetOpcode::G_FPTOUI:
1324 return RISCV::G_FCVT_WU_RV64;
1325 }
1326}
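// These are the RV64 *W forms: they operate on the low 32 bits and sign-extend
// the 32-bit result to 64 bits, which is why the custom legalization below
// widens s32 operations to sXLen before swapping in the W opcode.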
1327
1328bool RISCVLegalizerInfo::legalizeCustom(
1329 LegalizerHelper &Helper, MachineInstr &MI,
1330 LostDebugLocObserver &LocObserver) const {
1331 MachineIRBuilder &MIRBuilder = Helper.MIRBuilder;
1332 MachineRegisterInfo &MRI = *MIRBuilder.getMRI();
1333 MachineFunction &MF = *MI.getParent()->getParent();
1334 switch (MI.getOpcode()) {
1335 default:
1336 // No idea what to do.
1337 return false;
1338 case TargetOpcode::G_ABS:
1339 return Helper.lowerAbsToMaxNeg(MI);
1340 // TODO: G_FCONSTANT
1341 case TargetOpcode::G_CONSTANT: {
1342 const Function &F = MF.getFunction();
1343 // TODO: if PSI and BFI are present, add " ||
1344 // llvm::shouldOptForSize(*CurMBB, PSI, BFI)".
1345 bool ShouldOptForSize = F.hasOptSize();
1346 const ConstantInt *ConstVal = MI.getOperand(1).getCImm();
1347 if (!shouldBeInConstantPool(ConstVal->getValue(), ShouldOptForSize))
1348 return true;
1349 return Helper.lowerConstant(MI);
1350 }
1351 case TargetOpcode::G_SUB:
1352 case TargetOpcode::G_ADD: {
1353 Helper.Observer.changingInstr(MI);
1354 Helper.widenScalarSrc(MI, sXLen, 1, TargetOpcode::G_ANYEXT);
1355 Helper.widenScalarSrc(MI, sXLen, 2, TargetOpcode::G_ANYEXT);
1356
1357 Register DstALU = MRI.createGenericVirtualRegister(sXLen);
1358
1359 MachineOperand &MO = MI.getOperand(0);
1360 MIRBuilder.setInsertPt(MIRBuilder.getMBB(), ++MIRBuilder.getInsertPt());
1361 auto DstSext = MIRBuilder.buildSExtInReg(sXLen, DstALU, 32);
1362
1363 MIRBuilder.buildInstr(TargetOpcode::G_TRUNC, {MO}, {DstSext});
1364 MO.setReg(DstALU);
1365
1366 Helper.Observer.changedInstr(MI);
1367 return true;
1368 }
1369 case TargetOpcode::G_SEXT_INREG: {
1370 LLT DstTy = MRI.getType(MI.getOperand(0).getReg());
1371 int64_t SizeInBits = MI.getOperand(2).getImm();
1372 // Source size of 32 is sext.w.
1373 if (DstTy.getSizeInBits() == 64 && SizeInBits == 32)
1374 return true;
1375
1376 if (STI.hasStdExtZbb() && (SizeInBits == 8 || SizeInBits == 16))
1377 return true;
1378
1379 return Helper.lower(MI, 0, /* Unused hint type */ LLT()) ==
1380 LegalizerHelper::Legalized;
1381 }
1382 case TargetOpcode::G_ASHR:
1383 case TargetOpcode::G_LSHR:
1384 case TargetOpcode::G_SHL: {
1385 if (getIConstantVRegValWithLookThrough(MI.getOperand(2).getReg(), MRI)) {
1386 // We don't need a custom node for shift by constant. Just widen the
1387 // source and the shift amount.
1388 unsigned ExtOpc = TargetOpcode::G_ANYEXT;
1389 if (MI.getOpcode() == TargetOpcode::G_ASHR)
1390 ExtOpc = TargetOpcode::G_SEXT;
1391 else if (MI.getOpcode() == TargetOpcode::G_LSHR)
1392 ExtOpc = TargetOpcode::G_ZEXT;
1393
1394 Helper.Observer.changingInstr(MI);
1395 Helper.widenScalarSrc(MI, sXLen, 1, ExtOpc);
1396 Helper.widenScalarSrc(MI, sXLen, 2, TargetOpcode::G_ZEXT);
1397 Helper.widenScalarDst(MI, sXLen);
1398 Helper.Observer.changedInstr(MI);
1399 return true;
1400 }
1401
1402 Helper.Observer.changingInstr(MI);
1403 Helper.widenScalarSrc(MI, sXLen, 1, TargetOpcode::G_ANYEXT);
1404 Helper.widenScalarSrc(MI, sXLen, 2, TargetOpcode::G_ANYEXT);
1405 Helper.widenScalarDst(MI, sXLen);
1406 MI.setDesc(MIRBuilder.getTII().get(getRISCVWOpcode(MI.getOpcode())));
1407 Helper.Observer.changedInstr(MI);
1408 return true;
1409 }
1410 case TargetOpcode::G_SDIV:
1411 case TargetOpcode::G_UDIV:
1412 case TargetOpcode::G_UREM:
1413 case TargetOpcode::G_ROTL:
1414 case TargetOpcode::G_ROTR: {
1415 Helper.Observer.changingInstr(MI);
1416 Helper.widenScalarSrc(MI, sXLen, 1, TargetOpcode::G_ANYEXT);
1417 Helper.widenScalarSrc(MI, sXLen, 2, TargetOpcode::G_ANYEXT);
1418 Helper.widenScalarDst(MI, sXLen);
1419 MI.setDesc(MIRBuilder.getTII().get(getRISCVWOpcode(MI.getOpcode())));
1420 Helper.Observer.changedInstr(MI);
1421 return true;
1422 }
1423 case TargetOpcode::G_CTLZ:
1424 case TargetOpcode::G_CTTZ: {
1425 Helper.Observer.changingInstr(MI);
1426 Helper.widenScalarSrc(MI, sXLen, 1, TargetOpcode::G_ANYEXT);
1427 Helper.widenScalarDst(MI, sXLen);
1428 MI.setDesc(MIRBuilder.getTII().get(getRISCVWOpcode(MI.getOpcode())));
1429 Helper.Observer.changedInstr(MI);
1430 return true;
1431 }
1432 case TargetOpcode::G_FPTOSI:
1433 case TargetOpcode::G_FPTOUI: {
1434 Helper.Observer.changingInstr(MI);
1435 Helper.widenScalarDst(MI, sXLen);
1436 MI.setDesc(MIRBuilder.getTII().get(getRISCVWOpcode(MI.getOpcode())));
1437 MI.addOperand(MachineOperand::CreateImm(RISCVFPRndMode::RTZ));
1438 Helper.Observer.changedInstr(MI);
1439 return true;
1440 }
1441 case TargetOpcode::G_IS_FPCLASS: {
1442 Register GISFPCLASS = MI.getOperand(0).getReg();
1443 Register Src = MI.getOperand(1).getReg();
1444 const MachineOperand &ImmOp = MI.getOperand(2);
1445 MachineIRBuilder MIB(MI);
1446
1447 // Turn LLVM IR's floating-point class mask into the RISC-V fclass encoding
1448 // by simply rotating the 10-bit immediate right by two bits.
1449 APInt GFpClassImm(10, static_cast<uint64_t>(ImmOp.getImm()));
1450 auto FClassMask = MIB.buildConstant(sXLen, GFpClassImm.rotr(2).zext(XLen));
1451 auto ConstZero = MIB.buildConstant(sXLen, 0);
1452
1453 auto GFClass = MIB.buildInstr(RISCV::G_FCLASS, {sXLen}, {Src});
1454 auto And = MIB.buildAnd(sXLen, GFClass, FClassMask);
1455 MIB.buildICmp(CmpInst::ICMP_NE, GISFPCLASS, And, ConstZero);
1456
1457 MI.eraseFromParent();
1458 return true;
1459 }
1460 case TargetOpcode::G_BRJT:
1461 return legalizeBRJT(MI, MIRBuilder);
1462 case TargetOpcode::G_VASTART:
1463 return legalizeVAStart(MI, MIRBuilder);
1464 case TargetOpcode::G_VSCALE:
1465 return legalizeVScale(MI, MIRBuilder);
1466 case TargetOpcode::G_ZEXT:
1467 case TargetOpcode::G_SEXT:
1468 case TargetOpcode::G_ANYEXT:
1469 return legalizeExt(MI, MIRBuilder);
1470 case TargetOpcode::G_SPLAT_VECTOR:
1471 return legalizeSplatVector(MI, MIRBuilder);
1472 case TargetOpcode::G_EXTRACT_SUBVECTOR:
1473 return legalizeExtractSubvector(MI, MIRBuilder);
1474 case TargetOpcode::G_INSERT_SUBVECTOR:
1475 return legalizeInsertSubvector(MI, Helper, MIRBuilder);
1476 case TargetOpcode::G_LOAD:
1477 case TargetOpcode::G_STORE:
1478 return legalizeLoadStore(MI, Helper, MIRBuilder);
1479 }
1480
1481 llvm_unreachable("expected switch to return");
1482}
Returns the total size of the type. Must only be called on sized types.
Definition: LowLevelType.h:191
constexpr LLT getElementType() const
Returns the vector's element type. Only valid for vector types.
Definition: LowLevelType.h:278
constexpr ElementCount getElementCount() const
Definition: LowLevelType.h:184
This is an important class for using LLVM in a threaded context.
Definition: LLVMContext.h:68
LegalizeRuleSet & maxScalar(unsigned TypeIdx, const LLT Ty)
Ensure the scalar is at most as wide as Ty.
LegalizeRuleSet & lower()
The instruction is lowered.
LegalizeRuleSet & clampScalar(unsigned TypeIdx, const LLT MinTy, const LLT MaxTy)
Limit the range of scalar sizes to MinTy and MaxTy.
LegalizeRuleSet & customIf(LegalityPredicate Predicate)
LegalizeRuleSet & widenScalarToNextPow2(unsigned TypeIdx, unsigned MinSize=0)
Widen the scalar to the next power of two that is at least MinSize.
LegalizeRuleSet & customFor(std::initializer_list< LLT > Types)
LLVM_ABI void widenScalarSrc(MachineInstr &MI, LLT WideTy, unsigned OpIdx, unsigned ExtOpcode)
Legalize a single operand OpIdx of the machine instruction MI as a Use by extending the operand's typ...
LLVM_ABI LegalizeResult lowerAbsToMaxNeg(MachineInstr &MI)
LLVM_ABI LegalizeResult bitcast(MachineInstr &MI, unsigned TypeIdx, LLT Ty)
Legalize an instruction by replacing the value type.
@ Legalized
Instruction has been legalized and the MachineFunction changed.
LLVM_ABI LegalizeResult lower(MachineInstr &MI, unsigned TypeIdx, LLT Ty)
Legalize an instruction by splitting it into simpler parts, hopefully understood by the target.
GISelChangeObserver & Observer
To keep track of changes made by the LegalizerHelper.
LLVM_ABI LegalizeResult widenScalar(MachineInstr &MI, unsigned TypeIdx, LLT WideTy)
Legalize an instruction by performing the operation on a wider scalar type (for example a 16-bit addi...
MachineIRBuilder & MIRBuilder
Expose MIRBuilder so clients can set their own RecordInsertInstruction functions.
LLVM_ABI LegalizeResult lowerConstant(MachineInstr &MI)
LLVM_ABI void widenScalarDst(MachineInstr &MI, LLT WideTy, unsigned OpIdx=0, unsigned TruncOpcode=TargetOpcode::G_TRUNC)
Legalize a single operand OpIdx of the machine instruction MI as a Def by extending the operand's typ...
LegalizeRuleSet & getActionDefinitionsBuilder(unsigned Opcode)
Get the action definition builder for the given opcode.
const MCInstrDesc & get(unsigned Opcode) const
Return the machine instruction descriptor that corresponds to the specified instruction opcode.
Definition: MCInstrInfo.h:64
Machine Value Type.
const TargetSubtargetInfo & getSubtarget() const
getSubtarget - Return the subtarget for which this machine code is being compiled.
MachineMemOperand * getMachineMemOperand(MachinePointerInfo PtrInfo, MachineMemOperand::Flags f, LLT MemTy, Align base_alignment, const AAMDNodes &AAInfo=AAMDNodes(), const MDNode *Ranges=nullptr, SyncScope::ID SSID=SyncScope::System, AtomicOrdering Ordering=AtomicOrdering::NotAtomic, AtomicOrdering FailureOrdering=AtomicOrdering::NotAtomic)
getMachineMemOperand - Allocate a new MachineMemOperand.
const DataLayout & getDataLayout() const
Return the DataLayout attached to the Module associated to this MF.
Function & getFunction()
Return the LLVM function that this machine code represents.
Ty * getInfo()
getInfo - Keep track of various per-function pieces of information for backends that would like to do...
const MachineJumpTableInfo * getJumpTableInfo() const
getJumpTableInfo - Return the jump table info object for the current function.
Helper class to build MachineInstr.
void setInsertPt(MachineBasicBlock &MBB, MachineBasicBlock::iterator II)
Set the insertion point before the specified position.
MachineInstrBuilder buildAdd(const DstOp &Dst, const SrcOp &Src0, const SrcOp &Src1, std::optional< unsigned > Flags=std::nullopt)
Build and insert Res = G_ADD Op0, Op1.
MachineInstrBuilder buildUndef(const DstOp &Res)
Build and insert Res = IMPLICIT_DEF.
MachineInstrBuilder buildUnmerge(ArrayRef< LLT > Res, const SrcOp &Op)
Build and insert Res0, ... = G_UNMERGE_VALUES Op.
MachineInstrBuilder buildSelect(const DstOp &Res, const SrcOp &Tst, const SrcOp &Op0, const SrcOp &Op1, std::optional< unsigned > Flags=std::nullopt)
Build and insert a Res = G_SELECT Tst, Op0, Op1.
MachineInstrBuilder buildMul(const DstOp &Dst, const SrcOp &Src0, const SrcOp &Src1, std::optional< unsigned > Flags=std::nullopt)
Build and insert Res = G_MUL Op0, Op1.
MachineInstrBuilder buildInsertSubvector(const DstOp &Res, const SrcOp &Src0, const SrcOp &Src1, unsigned Index)
Build and insert Res = G_INSERT_SUBVECTOR Src0, Src1, Idx.
MachineInstrBuilder buildAnd(const DstOp &Dst, const SrcOp &Src0, const SrcOp &Src1)
Build and insert Res = G_AND Op0, Op1.
const TargetInstrInfo & getTII()
MachineInstrBuilder buildICmp(CmpInst::Predicate Pred, const DstOp &Res, const SrcOp &Op0, const SrcOp &Op1, std::optional< unsigned > Flags=std::nullopt)
Build and insert a Res = G_ICMP Pred, Op0, Op1.
MachineInstrBuilder buildLShr(const DstOp &Dst, const SrcOp &Src0, const SrcOp &Src1, std::optional< unsigned > Flags=std::nullopt)
MachineBasicBlock::iterator getInsertPt()
Current insertion point for new instructions.
MachineInstrBuilder buildZExt(const DstOp &Res, const SrcOp &Op, std::optional< unsigned > Flags=std::nullopt)
Build and insert Res = G_ZEXT Op.
MachineInstrBuilder buildVScale(const DstOp &Res, unsigned MinElts)
Build and insert Res = G_VSCALE MinElts.
MachineInstrBuilder buildIntToPtr(const DstOp &Dst, const SrcOp &Src)
Build and insert a G_INTTOPTR instruction.
MachineInstrBuilder buildLoad(const DstOp &Res, const SrcOp &Addr, MachineMemOperand &MMO)
Build and insert Res = G_LOAD Addr, MMO.
MachineInstrBuilder buildPtrAdd(const DstOp &Res, const SrcOp &Op0, const SrcOp &Op1, std::optional< unsigned > Flags=std::nullopt)
Build and insert Res = G_PTR_ADD Op0, Op1.
MachineInstrBuilder buildShl(const DstOp &Dst, const SrcOp &Src0, const SrcOp &Src1, std::optional< unsigned > Flags=std::nullopt)
MachineInstrBuilder buildStore(const SrcOp &Val, const SrcOp &Addr, MachineMemOperand &MMO)
Build and insert G_STORE Val, Addr, MMO.
MachineInstrBuilder buildInstr(unsigned Opcode)
Build and insert <empty> = Opcode <empty>.
MachineInstrBuilder buildFrameIndex(const DstOp &Res, int Idx)
Build and insert Res = G_FRAME_INDEX Idx.
MachineFunction & getMF()
Getter for the function we currently build.
const MachineBasicBlock & getMBB() const
Getter for the basic block we currently build.
MachineRegisterInfo * getMRI()
Getter for MRI.
MachineInstrBuilder buildExtractSubvector(const DstOp &Res, const SrcOp &Src, unsigned Index)
Build and insert Res = G_EXTRACT_SUBVECTOR Src, Idx0.
const DataLayout & getDataLayout() const
MachineInstrBuilder buildBrIndirect(Register Tgt)
Build and insert G_BRINDIRECT Tgt.
MachineInstrBuilder buildSplatVector(const DstOp &Res, const SrcOp &Val)
Build and insert Res = G_SPLAT_VECTOR Val.
MachineInstrBuilder buildLoadInstr(unsigned Opcode, const DstOp &Res, const SrcOp &Addr, MachineMemOperand &MMO)
Build and insert Res = <opcode> Addr, MMO.
virtual MachineInstrBuilder buildConstant(const DstOp &Res, const ConstantInt &Val)
Build and insert Res = G_CONSTANT Val.
MachineInstrBuilder buildSExtInReg(const DstOp &Res, const SrcOp &Op, int64_t ImmOp)
Build and insert Res = G_SEXT_INREG Op, ImmOp.
Register getReg(unsigned Idx) const
Get the register for the operand index.
Representation of each machine instruction.
Definition: MachineInstr.h:72
LLVM_ABI unsigned getEntrySize(const DataLayout &TD) const
getEntrySize - Return the size of each entry in the jump table.
@ EK_LabelDifference32
EK_LabelDifference32 - Each entry is the address of the block minus the address of the jump table.
@ EK_Custom32
EK_Custom32 - Each entry is a 32-bit value that is custom lowered by the TargetLowering::LowerCustomJ...
@ EK_BlockAddress
EK_BlockAddress - Each entry is a plain address of block, e.g.: .word LBB123.
LLVM_ABI unsigned getEntryAlignment(const DataLayout &TD) const
getEntryAlignment - Return the alignment of each entry in the jump table.
JTEntryKind getEntryKind() const
A description of a memory reference used in the backend.
@ MOLoad
The memory access reads data.
@ MOStore
The memory access writes data.
MachineOperand class - Representation of each machine instruction operand.
int64_t getImm() const
LLVM_ABI void setReg(Register Reg)
Change the register this operand corresponds to.
static MachineOperand CreateImm(int64_t Val)
MachineRegisterInfo - Keep track of information for virtual and physical registers,...
LLT getType(Register Reg) const
Get the low-level type of Reg or LLT{} if Reg is not a generic (target independent) virtual register.
bool legalizeCustom(LegalizerHelper &Helper, MachineInstr &MI, LostDebugLocObserver &LocObserver) const override
Called for instructions with the Custom LegalizationAction.
bool legalizeIntrinsic(LegalizerHelper &Helper, MachineInstr &MI) const override
RISCVLegalizerInfo(const RISCVSubtarget &ST)
RISCVMachineFunctionInfo - This class is derived from MachineFunctionInfo and contains private RISCV-...
unsigned getRealMinVLen() const
Quantity expandVScale(Quantity X) const
If the ElementCount or TypeSize X is scalable and VScale (VLEN) is exactly known, returns X converted...
unsigned getMaxBuildIntsCost() const
bool useConstantPoolForLargeInts() const
const RISCVRegisterInfo * getRegisterInfo() const override
const RISCVTargetLowering * getTargetLowering() const override
static std::pair< unsigned, unsigned > decomposeSubvectorInsertExtractToSubRegs(MVT VecVT, MVT SubVecVT, unsigned InsertExtractIdx, const RISCVRegisterInfo *TRI)
static RISCVVType::VLMUL getLMUL(MVT VT)
Wrapper class representing virtual and physical registers.
Definition: Register.h:19
bool empty() const
Definition: SmallVector.h:82
size_t size() const
Definition: SmallVector.h:79
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
Definition: SmallVector.h:1197
Register getReg() const
static constexpr TypeSize getScalable(ScalarTy MinimumSize)
Definition: TypeSize.h:349
constexpr ScalarTy getKnownMinValue() const
Returns the minimum value this quantity can represent.
Definition: TypeSize.h:169
static constexpr bool isKnownGT(const FixedOrScalableQuantity &LHS, const FixedOrScalableQuantity &RHS)
Definition: TypeSize.h:226
constexpr LeafTy divideCoefficientBy(ScalarTy RHS) const
We do not provide the '/' operator here because division for polynomial types does not work in the sa...
Definition: TypeSize.h:255
#define llvm_unreachable(msg)
Marks that the current location is not supposed to be reachable.
constexpr std::underlying_type_t< E > Mask()
Get a bitmask with 1s in all places up to the high-order bit of E's largest value.
Definition: BitmaskEnum.h:126
LLVM_ABI LegalityPredicate typeInSet(unsigned TypeIdx, std::initializer_list< LLT > TypesInit)
True iff the given type index is one of the specified types.
Predicate any(Predicate P0, Predicate P1)
True iff P0 or P1 are true.
Predicate all(Predicate P0, Predicate P1)
True iff P0 and P1 are true.
LLVM_ABI LegalityPredicate typeIs(unsigned TypeIdx, LLT TypesInit)
True iff the given type index is the specified type.
LLVM_ABI LegalizeMutation changeTo(unsigned TypeIdx, LLT Ty)
Select this specific type for the given type index.
InstSeq generateInstSeq(int64_t Val, const MCSubtargetInfo &STI)
InstSeq generateTwoRegInstSeq(int64_t Val, const MCSubtargetInfo &STI, unsigned &ShiftAmt, unsigned &AddOpc)
LLVM_ABI std::pair< unsigned, bool > decodeVLMUL(VLMUL VLMul)
static constexpr unsigned RVVBitsPerBlock
This is an optimization pass for GlobalISel generic memory operations.
Definition: AddressRanges.h:18
LLVM_ABI Type * getTypeForLLT(LLT Ty, LLVMContext &C)
Get the type back from LLT.
Definition: Utils.cpp:2029
LLVM_ABI bool isAllOnesOrAllOnesSplat(const MachineInstr &MI, const MachineRegisterInfo &MRI, bool AllowUndefs=false)
Return true if the value is a constant -1 integer or a splatted vector of a constant -1 integer (with...
Definition: Utils.cpp:1605
LLVM_ABI MVT getMVTForLLT(LLT Ty)
Get a rough equivalent of an MVT for a given LLT.
constexpr bool isPowerOf2_64(uint64_t Value)
Return true if the argument is a power of two > 0 (64 bit edition.)
Definition: MathExtras.h:293
LLVM_ABI bool isNullOrNullSplat(const MachineInstr &MI, const MachineRegisterInfo &MRI, bool AllowUndefs=false)
Return true if the value is a constant 0 integer or a splatted vector of a constant 0 integer (with n...
Definition: Utils.cpp:1587
unsigned Log2_64(uint64_t Value)
Return the floor log base 2 of the specified value, -1 if the value is zero.
Definition: MathExtras.h:342
unsigned Log2_32(uint32_t Value)
Return the floor log base 2 of the specified value, -1 if the value is zero.
Definition: MathExtras.h:336
constexpr bool isPowerOf2_32(uint32_t Value)
Return true if the argument is a power of two > 0.
Definition: MathExtras.h:288
LLVM_ABI std::optional< ValueAndVReg > getIConstantVRegValWithLookThrough(Register VReg, const MachineRegisterInfo &MRI, bool LookThroughInstrs=true)
If VReg is defined by a statically evaluable chain of instructions rooted on a G_CONSTANT returns its...
Definition: Utils.cpp:433
unsigned Log2(Align A)
Returns the log2 of the alignment.
Definition: Alignment.h:208
std::function< bool(const LegalityQuery &)> LegalityPredicate
This struct is a compact representation of a valid (non-zero power of two) alignment.
Definition: Alignment.h:39
Extended Value Type.
Definition: ValueTypes.h:35
static LLVM_ABI EVT getEVT(Type *Ty, bool HandleUnknown=false)
Return the value type corresponding to the specified type.
Definition: ValueTypes.cpp:299
The LegalityQuery object bundles together all the information that's needed to decide whether a given...
ArrayRef< LLT > Types
Matching combinators.
This class contains a discriminated union of information about pointers in memory operands,...
static LLVM_ABI MachinePointerInfo getJumpTable(MachineFunction &MF)
Return a MachinePointerInfo record that refers to a jump table entry.