LLVM: include/llvm/Analysis/TargetTransformInfoImpl.h Source File

//===- TargetTransformInfoImpl.h --------------------------------*- C++ -*-===//

//

// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.

// See https://llvm.org/LICENSE.txt for license information.

// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception

//

//===----------------------------------------------------------------------===//

/// \file

/// This file provides helpers for the implementation of

/// a TargetTransformInfo-conforming class.

///

//===----------------------------------------------------------------------===//


#ifndef LLVM_ANALYSIS_TARGETTRANSFORMINFOIMPL_H

#define LLVM_ANALYSIS_TARGETTRANSFORMINFOIMPL_H


#include "llvm/Analysis/ScalarEvolutionExpressions.h"

#include "llvm/Analysis/TargetTransformInfo.h"

#include "llvm/Analysis/VectorUtils.h"

#include "llvm/IR/DataLayout.h"

#include "llvm/IR/GetElementPtrTypeIterator.h"

#include "llvm/IR/IntrinsicInst.h"

#include "llvm/IR/Operator.h"

#include "llvm/IR/PatternMatch.h"

#include <optional>

#include <utility>


namespace llvm {


class Function;


/// Base class for use as a mix-in that aids implementing

/// a TargetTransformInfo-compatible class.


class TargetTransformInfoImplBase {


protected:

  typedef TargetTransformInfo TTI;


  const DataLayout &DL;


  explicit TargetTransformInfoImplBase(const DataLayout &DL) : DL(DL) {}


public:

  virtual ~TargetTransformInfoImplBase();


  // Provide value semantics. MSVC requires that we spell all of these out.

  TargetTransformInfoImplBase(const TargetTransformInfoImplBase &Arg) = default;

  TargetTransformInfoImplBase(TargetTransformInfoImplBase &&Arg) : DL(Arg.DL) {}


  virtual const DataLayout &getDataLayout() const { return DL; }


  // FIXME: It looks like this implementation is dead. All clients appear to

  //  use the (non-const) version from `TargetTransformInfoImplCRTPBase`.


  virtual InstructionCost getGEPCost(Type *PointeeType, const Value *Ptr,

                                     ArrayRef<const Value *> Operands,

                                     Type *AccessType,

                                     TTI::TargetCostKind CostKind) const {

    // In the basic model, we just assume that all-constant GEPs will be folded

    // into their uses via addressing modes.

    for (const Value *Operand : Operands)

      if (!isa<Constant>(Operand))

        return TTI::TCC_Basic;


    return TTI::TCC_Free;

  }


  virtual InstructionCost


  getPointersChainCost(ArrayRef<const Value *> Ptrs, const Value *Base,

                       const TTI::PointersChainInfo &Info, Type *AccessTy,

                       TTI::TargetCostKind CostKind) const {

    llvm_unreachable("Not implemented");

  }


  virtual unsigned


  getEstimatedNumberOfCaseClusters(const SwitchInst &SI, unsigned &JTSize,

                                   ProfileSummaryInfo *PSI,

                                   BlockFrequencyInfo *BFI) const {

    (void)PSI;

    (void)BFI;

    JTSize = 0;

    return SI.getNumCases();

  }


  virtual InstructionCost


  getInstructionCost(const User *U, ArrayRef<const Value *> Operands,

                     TTI::TargetCostKind CostKind) const {

    llvm_unreachable("Not implemented");

  }


  virtual unsigned getInliningThresholdMultiplier() const { return 1; }


  virtual unsigned getInliningCostBenefitAnalysisSavingsMultiplier() const {

    return 8;

  }


  virtual unsigned getInliningCostBenefitAnalysisProfitableMultiplier() const {

    return 8;

  }


  virtual int getInliningLastCallToStaticBonus() const {

    // This is the value of InlineConstants::LastCallToStaticBonus before it was

    // removed along with the introduction of this function.

    return 15000;

  }


  virtual unsigned adjustInliningThreshold(const CallBase *CB) const {

    return 0;

  }


  virtual unsigned getCallerAllocaCost(const CallBase *CB,

                                       const AllocaInst *AI) const {

    return 0;

  };


  virtual int getInlinerVectorBonusPercent() const { return 150; }


  virtual InstructionCost getMemcpyCost(const Instruction *I) const {

    return TTI::TCC_Expensive;

  }


  virtual uint64_t getMaxMemIntrinsicInlineSizeThreshold() const { return 64; }


  // Although this default value is arbitrary, it is not random. It is assumed

  // that a condition that evaluates the same way by a higher percentage than

  // this is best represented as control flow. Therefore, the default value N

  // should be set such that the win from N% correct executions is greater than

  // the loss from (100 - N)% mispredicted executions for the majority of

  //  intended targets.


  virtual BranchProbability getPredictableBranchThreshold() const {

    return BranchProbability(99, 100);

  }


  virtual InstructionCost getBranchMispredictPenalty() const { return 0; }


  virtual bool hasBranchDivergence(const Function *F = nullptr) const {

    return false;

  }


  virtual bool isSourceOfDivergence(const Value *V) const { return false; }


  virtual bool isAlwaysUniform(const Value *V) const { return false; }


  virtual bool isValidAddrSpaceCast(unsigned FromAS, unsigned ToAS) const {

    return false;

  }


  virtual bool addrspacesMayAlias(unsigned AS0, unsigned AS1) const {

    return true;

  }


  virtual unsigned getFlatAddressSpace() const { return -1; }


  virtual bool collectFlatAddressOperands(SmallVectorImpl<int> &OpIndexes,

                                          Intrinsic::ID IID) const {

    return false;

  }


  virtual bool isNoopAddrSpaceCast(unsigned, unsigned) const { return false; }

  virtual bool


  canHaveNonUndefGlobalInitializerInAddressSpace(unsigned AS) const {

    return AS == 0;

  };


  virtual unsigned getAssumedAddrSpace(const Value *V) const { return -1; }


  virtual bool isSingleThreaded() const { return false; }


  virtual std::pair<const Value *, unsigned>


  getPredicatedAddrSpace(const Value *V) const {

    return std::make_pair(nullptr, -1);

  }


  virtual Value *rewriteIntrinsicWithAddressSpace(IntrinsicInst *II,

                                                  Value *OldV,

                                                  Value *NewV) const {

    return nullptr;

  }


  virtual bool isLoweredToCall(const Function *F) const {

    assert(F && "A concrete function must be provided to this routine.");


    // FIXME: These should almost certainly not be handled here, and instead

    // handled with the help of TLI or the target itself. This was largely

    // ported from existing analysis heuristics here so that such refactorings

    // can take place in the future.


    if (F->isIntrinsic())

      return false;


    if (F->hasLocalLinkage() || !F->hasName())

      return true;


    StringRef Name = F->getName();


    // These will all likely lower to a single selection DAG node.

    // clang-format off

    if (Name == "copysign" || Name == "copysignf" || Name == "copysignl" ||

        Name == "fabs"  || Name == "fabsf"  || Name == "fabsl" ||

        Name == "fmin"  || Name == "fminf"  || Name == "fminl" ||

        Name == "fmax"  || Name == "fmaxf"  || Name == "fmaxl" ||

        Name == "sin"   || Name == "sinf"   || Name == "sinl"  ||

        Name == "cos"   || Name == "cosf"   || Name == "cosl"  ||

        Name == "tan"   || Name == "tanf"   || Name == "tanl"  ||

        Name == "asin"  || Name == "asinf"  || Name == "asinl" ||

        Name == "acos"  || Name == "acosf"  || Name == "acosl" ||

        Name == "atan"  || Name == "atanf"  || Name == "atanl" ||

        Name == "atan2" || Name == "atan2f" || Name == "atan2l"||

        Name == "sinh"  || Name == "sinhf"  || Name == "sinhl" ||

        Name == "cosh"  || Name == "coshf"  || Name == "coshl" ||

        Name == "tanh"  || Name == "tanhf"  || Name == "tanhl" ||

        Name == "sqrt"  || Name == "sqrtf"  || Name == "sqrtl" ||

        Name == "exp10"  || Name == "exp10l"  || Name == "exp10f")

      return false;

    // clang-format on

    // These are all likely to be optimized into something smaller.

    if (Name == "pow" || Name == "powf" || Name == "powl" || Name == "exp2" ||

        Name == "exp2l" || Name == "exp2f" || Name == "floor" ||

        Name == "floorf" || Name == "ceil" || Name == "round" ||

        Name == "ffs" || Name == "ffsl" || Name == "abs" || Name == "labs" ||

        Name == "llabs")

      return false;


    return true;

  }


  virtual bool isHardwareLoopProfitable(Loop *L, ScalarEvolution &SE,

                                        AssumptionCache &AC,

                                        TargetLibraryInfo *LibInfo,

                                        HardwareLoopInfo &HWLoopInfo) const {

    return false;

  }


  virtual unsigned getEpilogueVectorizationMinVF() const { return 16; }


  virtual bool preferPredicateOverEpilogue(TailFoldingInfo *TFI) const {

    return false;

  }


  virtual TailFoldingStyle


  getPreferredTailFoldingStyle(bool IVUpdateMayOverflow = true) const {

    return TailFoldingStyle::DataWithoutLaneMask;

  }


  virtual std::optional<Instruction *>


  instCombineIntrinsic(InstCombiner &IC, IntrinsicInst &II) const {

    return std::nullopt;

  }


  virtual std::optional<Value *>


  simplifyDemandedUseBitsIntrinsic(InstCombiner &IC, IntrinsicInst &II,

                                   APInt DemandedMask, KnownBits &Known,

                                   bool &KnownBitsComputed) const {

    return std::nullopt;

  }


  virtual std::optional<Value *> simplifyDemandedVectorEltsIntrinsic(

      InstCombiner &IC, IntrinsicInst &II, APInt DemandedElts, APInt &UndefElts,

      APInt &UndefElts2, APInt &UndefElts3,

      std::function<void(Instruction *, unsigned, APInt, APInt &)>

          SimplifyAndSetOp) const {

    return std::nullopt;

  }


  virtual void getUnrollingPreferences(Loop *, ScalarEvolution &,

                                       TTI::UnrollingPreferences &,

                                       OptimizationRemarkEmitter *) const {}


  virtual void getPeelingPreferences(Loop *, ScalarEvolution &,

                                     TTI::PeelingPreferences &) const {}


  virtual bool isLegalAddImmediate(int64_t Imm) const { return false; }


  virtual bool isLegalAddScalableImmediate(int64_t Imm) const { return false; }


  virtual bool isLegalICmpImmediate(int64_t Imm) const { return false; }


  virtual bool isLegalAddressingMode(Type *Ty, GlobalValue *BaseGV,

                                     int64_t BaseOffset, bool HasBaseReg,

                                     int64_t Scale, unsigned AddrSpace,

                                     Instruction *I = nullptr,

                                     int64_t ScalableOffset = 0) const {

    // Guess that only reg and reg+reg addressing is allowed. This heuristic is

    // taken from the implementation of LSR.

    return !BaseGV && BaseOffset == 0 && (Scale == 0 || Scale == 1);

  }


  virtual bool isLSRCostLess(const TTI::LSRCost &C1,

                             const TTI::LSRCost &C2) const {

    return std::tie(C1.NumRegs, C1.AddRecCost, C1.NumIVMuls, C1.NumBaseAdds,

                    C1.ScaleCost, C1.ImmCost, C1.SetupCost) <

           std::tie(C2.NumRegs, C2.AddRecCost, C2.NumIVMuls, C2.NumBaseAdds,

                    C2.ScaleCost, C2.ImmCost, C2.SetupCost);

  }


  virtual bool isNumRegsMajorCostOfLSR() const { return true; }


  virtual bool shouldDropLSRSolutionIfLessProfitable() const { return false; }


  virtual bool isProfitableLSRChainElement(Instruction *I) const {

    return false;

  }


  virtual bool canMacroFuseCmp() const { return false; }


  virtual bool canSaveCmp(Loop *L, BranchInst **BI, ScalarEvolution *SE,

                          LoopInfo *LI, DominatorTree *DT, AssumptionCache *AC,

                          TargetLibraryInfo *LibInfo) const {

    return false;

  }


  virtual TTI::AddressingModeKind


  getPreferredAddressingMode(const Loop *L, ScalarEvolution *SE) const {

    return TTI::AMK_None;

  }


  virtual bool isLegalMaskedStore(Type *DataType, Align Alignment,

                                  unsigned AddressSpace) const {

    return false;

  }


  virtual bool isLegalMaskedLoad(Type *DataType, Align Alignment,

                                 unsigned AddressSpace) const {

    return false;

  }


  virtual bool isLegalNTStore(Type *DataType, Align Alignment) const {

    // By default, assume nontemporal memory stores are available for stores

    // that are aligned and have a size that is a power of 2.

    unsigned DataSize = DL.getTypeStoreSize(DataType);

    return Alignment >= DataSize && isPowerOf2_32(DataSize);

  }


  virtual bool isLegalNTLoad(Type *DataType, Align Alignment) const {

    // By default, assume nontemporal memory loads are available for loads that

    // are aligned and have a size that is a power of 2.

    unsigned DataSize = DL.getTypeStoreSize(DataType);

    return Alignment >= DataSize && isPowerOf2_32(DataSize);

  }


  virtual bool isLegalBroadcastLoad(Type *ElementTy,

                                    ElementCount NumElements) const {

    return false;

  }


  virtual bool isLegalMaskedScatter(Type *DataType, Align Alignment) const {

    return false;

  }


  virtual bool isLegalMaskedGather(Type *DataType, Align Alignment) const {

    return false;

  }


  virtual bool forceScalarizeMaskedGather(VectorType *DataType,

                                          Align Alignment) const {

    return false;

  }


  virtual bool forceScalarizeMaskedScatter(VectorType *DataType,

                                           Align Alignment) const {

    return false;

  }


  virtual bool isLegalMaskedCompressStore(Type *DataType,

                                          Align Alignment) const {

    return false;

  }


  virtual bool isLegalAltInstr(VectorType *VecTy, unsigned Opcode0,

                               unsigned Opcode1,

                               const SmallBitVector &OpcodeMask) const {

    return false;

  }


  virtual bool isLegalMaskedExpandLoad(Type *DataType, Align Alignment) const {

    return false;

  }


  virtual bool isLegalStridedLoadStore(Type *DataType, Align Alignment) const {

    return false;

  }


  virtual bool isLegalInterleavedAccessType(VectorType *VTy, unsigned Factor,

                                            Align Alignment,

                                            unsigned AddrSpace) const {

    return false;

  }


  virtual bool isLegalMaskedVectorHistogram(Type *AddrType,

                                            Type *DataType) const {

    return false;

  }


  virtual bool enableOrderedReductions() const { return false; }


  virtual bool hasDivRemOp(Type *DataType, bool IsSigned) const {

    return false;

  }


  virtual bool hasVolatileVariant(Instruction *I, unsigned AddrSpace) const {

    return false;

  }


  virtual bool prefersVectorizedAddressing() const { return true; }


  virtual InstructionCost getScalingFactorCost(Type *Ty, GlobalValue *BaseGV,

                                               StackOffset BaseOffset,

                                               bool HasBaseReg, int64_t Scale,

                                               unsigned AddrSpace) const {

    // Guess that all legal addressing mode are free.

    if (isLegalAddressingMode(Ty, BaseGV, BaseOffset.getFixed(), HasBaseReg,

                              Scale, AddrSpace, /*I=*/nullptr,

                              BaseOffset.getScalable()))

      return 0;

    return InstructionCost::getInvalid();

  }


  virtual bool LSRWithInstrQueries() const { return false; }


  virtual bool isTruncateFree(Type *Ty1, Type *Ty2) const { return false; }


  virtual bool isProfitableToHoist(Instruction *I) const { return true; }


  virtual bool useAA() const { return false; }


  virtual bool isTypeLegal(Type *Ty) const { return false; }


  virtual unsigned getRegUsageForType(Type *Ty) const { return 1; }


  virtual bool shouldBuildLookupTables() const { return true; }


  virtual bool shouldBuildLookupTablesForConstant(Constant *C) const {

    return true;

  }


  virtual bool shouldBuildRelLookupTables() const { return false; }


  virtual bool useColdCCForColdCall(Function &F) const { return false; }


  virtual bool isTargetIntrinsicTriviallyScalarizable(Intrinsic::ID ID) const {

    return false;

  }


  virtual bool isTargetIntrinsicWithScalarOpAtArg(Intrinsic::ID ID,

                                                  unsigned ScalarOpdIdx) const {

    return false;

  }


  virtual bool isTargetIntrinsicWithOverloadTypeAtArg(Intrinsic::ID ID,

                                                      int OpdIdx) const {

    return OpdIdx == -1;

  }


  virtual bool


  isTargetIntrinsicWithStructReturnOverloadAtField(Intrinsic::ID ID,

                                                   int RetIdx) const {

    return RetIdx == 0;

  }


  virtual InstructionCost getScalarizationOverhead(

      VectorType *Ty, const APInt &DemandedElts, bool Insert, bool Extract,

      TTI::TargetCostKind CostKind, bool ForPoisonSrc = true,

      ArrayRef<Value *> VL = {}) const {

    return 0;

  }


  virtual InstructionCost


  getOperandsScalarizationOverhead(ArrayRef<Type *> Tys,

                                   TTI::TargetCostKind CostKind) const {

    return 0;

  }


  virtual bool supportsEfficientVectorElementLoadStore() const { return false; }


  virtual bool supportsTailCalls() const { return true; }


  virtual bool supportsTailCallFor(const CallBase *CB) const {

    llvm_unreachable("Not implemented");

  }


  virtual bool enableAggressiveInterleaving(bool LoopHasReductions) const {

    return false;

  }


  virtual TTI::MemCmpExpansionOptions


  enableMemCmpExpansion(bool OptSize, bool IsZeroCmp) const {

    return {};

  }


  virtual bool enableSelectOptimize() const { return true; }


  virtual bool shouldTreatInstructionLikeSelect(const Instruction *I) const {

    // A select with two constant operands will usually be better left as a

    // select.

    using namespace llvm::PatternMatch;

    if (match(I, m_Select(m_Value(), m_Constant(), m_Constant())))

      return false;

    // If the select is a logical-and/logical-or then it is better treated as a

    // and/or by the backend.

    return isa<SelectInst>(I) &&

           !match(I, m_CombineOr(m_LogicalAnd(m_Value(), m_Value()),

                                 m_LogicalOr(m_Value(), m_Value())));

  }


  virtual bool enableInterleavedAccessVectorization() const { return false; }


  virtual bool enableMaskedInterleavedAccessVectorization() const {

    return false;

  }


  virtual bool isFPVectorizationPotentiallyUnsafe() const { return false; }


  virtual bool allowsMisalignedMemoryAccesses(LLVMContext &Context,

                                              unsigned BitWidth,

                                              unsigned AddressSpace,

                                              Align Alignment,

                                              unsigned *Fast) const {

    return false;

  }


  virtual TTI::PopcntSupportKind


  getPopcntSupport(unsigned IntTyWidthInBit) const {

    return TTI::PSK_Software;

  }


  virtual bool haveFastSqrt(Type *Ty) const { return false; }


  virtual bool isExpensiveToSpeculativelyExecute(const Instruction *I) const {

    return true;

  }


  virtual bool isFCmpOrdCheaperThanFCmpZero(Type *Ty) const { return true; }


  virtual InstructionCost getFPOpCost(Type *Ty) const {

    return TargetTransformInfo::TCC_Basic;

  }


  virtual InstructionCost getIntImmCodeSizeCost(unsigned Opcode, unsigned Idx,

                                                const APInt &Imm,

                                                Type *Ty) const {

    return 0;

  }


  virtual InstructionCost getIntImmCost(const APInt &Imm, Type *Ty,

                                        TTI::TargetCostKind CostKind) const {

    return TTI::TCC_Basic;

  }


  virtual InstructionCost getIntImmCostInst(unsigned Opcode, unsigned Idx,

                                            const APInt &Imm, Type *Ty,

                                            TTI::TargetCostKind CostKind,

                                            Instruction *Inst = nullptr) const {

    return TTI::TCC_Free;

  }


  virtual InstructionCost


  getIntImmCostIntrin(Intrinsic::ID IID, unsigned Idx, const APInt &Imm,

                      Type *Ty, TTI::TargetCostKind CostKind) const {

    return TTI::TCC_Free;

  }


  virtual bool preferToKeepConstantsAttached(const Instruction &Inst,

                                             const Function &Fn) const {

    return false;

  }


  virtual unsigned getNumberOfRegisters(unsigned ClassID) const { return 8; }


  virtual bool hasConditionalLoadStoreForType(Type *Ty, bool IsStore) const {

    return false;

  }


  virtual unsigned getRegisterClassForType(bool Vector,

                                           Type *Ty = nullptr) const {

    return Vector ? 1 : 0;

  }


  virtual const char *getRegisterClassName(unsigned ClassID) const {

    switch (ClassID) {

    default:

      return "Generic::Unknown Register Class";

    case 0:

      return "Generic::ScalarRC";

    case 1:

      return "Generic::VectorRC";

    }

  }


  virtual TypeSize


  getRegisterBitWidth(TargetTransformInfo::RegisterKind K) const {

    return TypeSize::getFixed(32);

  }


  virtual unsigned getMinVectorRegisterBitWidth() const { return 128; }


  virtual std::optional<unsigned> getMaxVScale() const { return std::nullopt; }


  virtual std::optional<unsigned> getVScaleForTuning() const {

    return std::nullopt;

  }


  virtual bool isVScaleKnownToBeAPowerOfTwo() const { return false; }


  virtual bool


  shouldMaximizeVectorBandwidth(TargetTransformInfo::RegisterKind K) const {

    return false;

  }


  virtual ElementCount getMinimumVF(unsigned ElemWidth, bool IsScalable) const {

    return ElementCount::get(0, IsScalable);

  }


  virtual unsigned getMaximumVF(unsigned ElemWidth, unsigned Opcode) const {

    return 0;

  }


  virtual unsigned getStoreMinimumVF(unsigned VF, Type *, Type *) const {

    return VF;

  }


  virtual bool shouldConsiderAddressTypePromotion(

      const Instruction &I, bool &AllowPromotionWithoutCommonHeader) const {

    AllowPromotionWithoutCommonHeader = false;

    return false;

  }


  virtual unsigned getCacheLineSize() const { return 0; }

  virtual std::optional<unsigned>


  getCacheSize(TargetTransformInfo::CacheLevel Level) const {

    switch (Level) {

    case TargetTransformInfo::CacheLevel::L1D:

      [[fallthrough]];

    case TargetTransformInfo::CacheLevel::L2D:

      return std::nullopt;

    }

    llvm_unreachable("Unknown TargetTransformInfo::CacheLevel");

  }


  virtual std::optional<unsigned>


  getCacheAssociativity(TargetTransformInfo::CacheLevel Level) const {

    switch (Level) {

    case TargetTransformInfo::CacheLevel::L1D:

      [[fallthrough]];

    case TargetTransformInfo::CacheLevel::L2D:

      return std::nullopt;

    }


    llvm_unreachable("Unknown TargetTransformInfo::CacheLevel");

  }


  virtual std::optional<unsigned> getMinPageSize() const { return {}; }


  virtual unsigned getPrefetchDistance() const { return 0; }


  virtual unsigned getMinPrefetchStride(unsigned NumMemAccesses,

                                        unsigned NumStridedMemAccesses,

                                        unsigned NumPrefetches,

                                        bool HasCall) const {

    return 1;

  }


  virtual unsigned getMaxPrefetchIterationsAhead() const { return UINT_MAX; }

  virtual bool enableWritePrefetching() const { return false; }

  virtual bool shouldPrefetchAddressSpace(unsigned AS) const { return !AS; }


  virtual InstructionCost getPartialReductionCost(

      unsigned Opcode, Type *InputTypeA, Type *InputTypeB, Type *AccumType,

      ElementCount VF, TTI::PartialReductionExtendKind OpAExtend,

      TTI::PartialReductionExtendKind OpBExtend, std::optional<unsigned> BinOp,

      TTI::TargetCostKind CostKind) const {

    return InstructionCost::getInvalid();

  }


  virtual unsigned getMaxInterleaveFactor(ElementCount VF) const { return 1; }


  virtual InstructionCost getArithmeticInstrCost(

      unsigned Opcode, Type *Ty, TTI::TargetCostKind CostKind,

      TTI::OperandValueInfo Opd1Info, TTI::OperandValueInfo Opd2Info,

      ArrayRef<const Value *> Args, const Instruction *CxtI = nullptr) const {

    // Widenable conditions will eventually lower into constants, so some

    // operations with them will be trivially optimized away.

    auto IsWidenableCondition = [](const Value *V) {

      if (auto *II = dyn_cast<IntrinsicInst>(V))

        if (II->getIntrinsicID() == Intrinsic::experimental_widenable_condition)

          return true;

      return false;

    };

    // FIXME: A number of transformation tests seem to require these values

    // which seems a little odd for how arbitary there are.

    switch (Opcode) {

    default:

      break;

    case Instruction::FDiv:

    case Instruction::FRem:

    case Instruction::SDiv:

    case Instruction::SRem:

    case Instruction::UDiv:

    case Instruction::URem:

      // FIXME: Unlikely to be true for CodeSize.

      return TTI::TCC_Expensive;

    case Instruction::And:

    case Instruction::Or:

      if (any_of(Args, IsWidenableCondition))

        return TTI::TCC_Free;

      break;

    }


    // Assume a 3cy latency for fp arithmetic ops.

    if (CostKind == TTI::TCK_Latency)

      if (Ty->getScalarType()->isFloatingPointTy())

        return 3;


    return 1;

  }


  virtual InstructionCost getAltInstrCost(VectorType *VecTy, unsigned Opcode0,

                                          unsigned Opcode1,

                                          const SmallBitVector &OpcodeMask,

                                          TTI::TargetCostKind CostKind) const {

    return InstructionCost::getInvalid();

  }


  virtual InstructionCost


  getShuffleCost(TTI::ShuffleKind Kind, VectorType *DstTy, VectorType *SrcTy,

                 ArrayRef<int> Mask, TTI::TargetCostKind CostKind, int Index,

                 VectorType *SubTp, ArrayRef<const Value *> Args = {},

                 const Instruction *CxtI = nullptr) const {

    return 1;

  }


  virtual InstructionCost getCastInstrCost(unsigned Opcode, Type *Dst,

                                           Type *Src, TTI::CastContextHint CCH,

                                           TTI::TargetCostKind CostKind,

                                           const Instruction *I) const {

    switch (Opcode) {

    default:

      break;

    case Instruction::IntToPtr: {

      unsigned SrcSize = Src->getScalarSizeInBits();

      if (DL.isLegalInteger(SrcSize) &&

          SrcSize <= DL.getPointerTypeSizeInBits(Dst))

        return 0;

      break;

    }

    case Instruction::PtrToAddr: {

      unsigned DstSize = Dst->getScalarSizeInBits();

      assert(DstSize == DL.getAddressSizeInBits(Src));

      if (DL.isLegalInteger(DstSize))

        return 0;

      break;

    }

    case Instruction::PtrToInt: {

      unsigned DstSize = Dst->getScalarSizeInBits();

      if (DL.isLegalInteger(DstSize) &&

          DstSize >= DL.getPointerTypeSizeInBits(Src))

        return 0;

      break;

    }

    case Instruction::BitCast:

      if (Dst == Src || (Dst->isPointerTy() && Src->isPointerTy()))

        // Identity and pointer-to-pointer casts are free.

        return 0;

      break;

    case Instruction::Trunc: {

      // trunc to a native type is free (assuming the target has compare and

      // shift-right of the same width).

      TypeSize DstSize = DL.getTypeSizeInBits(Dst);

      if (!DstSize.isScalable() && DL.isLegalInteger(DstSize.getFixedValue()))

        return 0;

      break;

    }

    }

    return 1;

  }


  virtual InstructionCost


  getExtractWithExtendCost(unsigned Opcode, Type *Dst, VectorType *VecTy,

                           unsigned Index, TTI::TargetCostKind CostKind) const {

    return 1;

  }


  virtual InstructionCost getCFInstrCost(unsigned Opcode,

                                         TTI::TargetCostKind CostKind,

                                         const Instruction *I = nullptr) const {

    // A phi would be free, unless we're costing the throughput because it

    // will require a register.

    if (Opcode == Instruction::PHI && CostKind != TTI::TCK_RecipThroughput)

      return 0;

    return 1;

  }


  virtual InstructionCost getCmpSelInstrCost(

      unsigned Opcode, Type *ValTy, Type *CondTy, CmpInst::Predicate VecPred,

      TTI::TargetCostKind CostKind, TTI::OperandValueInfo Op1Info,

      TTI::OperandValueInfo Op2Info, const Instruction *I) const {

    return 1;

  }


  virtual InstructionCost getVectorInstrCost(unsigned Opcode, Type *Val,

                                             TTI::TargetCostKind CostKind,

                                             unsigned Index, const Value *Op0,

                                             const Value *Op1) const {

    return 1;

  }


  /// \param ScalarUserAndIdx encodes the information about extracts from a

  /// vector with 'Scalar' being the value being extracted,'User' being the user

  /// of the extract(nullptr if user is not known before vectorization) and

  /// 'Idx' being the extract lane.


  virtual InstructionCost getVectorInstrCost(

      unsigned Opcode, Type *Val, TTI::TargetCostKind CostKind, unsigned Index,

      Value *Scalar,

      ArrayRef<std::tuple<Value *, User *, int>> ScalarUserAndIdx) const {

    return 1;

  }


  virtual InstructionCost getVectorInstrCost(const Instruction &I, Type *Val,

                                             TTI::TargetCostKind CostKind,

                                             unsigned Index) const {

    return 1;

  }


  virtual InstructionCost


  getIndexedVectorInstrCostFromEnd(unsigned Opcode, Type *Val,

                                   TTI::TargetCostKind CostKind,

                                   unsigned Index) const {

    return 1;

  }


  virtual InstructionCost


  getReplicationShuffleCost(Type *EltTy, int ReplicationFactor, int VF,

                            const APInt &DemandedDstElts,

                            TTI::TargetCostKind CostKind) const {

    return 1;

  }


  virtual InstructionCost


  getInsertExtractValueCost(unsigned Opcode,

                            TTI::TargetCostKind CostKind) const {

    // Note: The `insertvalue` cost here is chosen to match the default case of

    // getInstructionCost() -- as prior to adding this helper `insertvalue` was

    // not handled.

    if (Opcode == Instruction::InsertValue &&

        CostKind != TTI::TCK_RecipThroughput)

      return TTI::TCC_Basic;

    return TTI::TCC_Free;

  }


  virtual InstructionCost


  getMemoryOpCost(unsigned Opcode, Type *Src, Align Alignment,

                  unsigned AddressSpace, TTI::TargetCostKind CostKind,

                  TTI::OperandValueInfo OpInfo, const Instruction *I) const {

    return 1;

  }


  virtual InstructionCost


  getMaskedMemoryOpCost(unsigned Opcode, Type *Src, Align Alignment,

                        unsigned AddressSpace,

                        TTI::TargetCostKind CostKind) const {

    return 1;

  }


  virtual InstructionCost


  getGatherScatterOpCost(unsigned Opcode, Type *DataTy, const Value *Ptr,

                         bool VariableMask, Align Alignment,

                         TTI::TargetCostKind CostKind,

                         const Instruction *I = nullptr) const {

    return 1;

  }


  virtual InstructionCost getExpandCompressMemoryOpCost(

      unsigned Opcode, Type *DataTy, bool VariableMask, Align Alignment,

      TTI::TargetCostKind CostKind, const Instruction *I = nullptr) const {

    return 1;

  }


  virtual InstructionCost


  getStridedMemoryOpCost(unsigned Opcode, Type *DataTy, const Value *Ptr,

                         bool VariableMask, Align Alignment,

                         TTI::TargetCostKind CostKind,

                         const Instruction *I = nullptr) const {

    return InstructionCost::getInvalid();

  }


  virtual InstructionCost getInterleavedMemoryOpCost(

      unsigned Opcode, Type *VecTy, unsigned Factor, ArrayRef<unsigned> Indices,

      Align Alignment, unsigned AddressSpace, TTI::TargetCostKind CostKind,

      bool UseMaskForCond, bool UseMaskForGaps) const {

    return 1;

  }


  virtual InstructionCost


  getIntrinsicInstrCost(const IntrinsicCostAttributes &ICA,

                        TTI::TargetCostKind CostKind) const {

    switch (ICA.getID()) {

    default:

      break;

    case Intrinsic::allow_runtime_check:

    case Intrinsic::allow_ubsan_check:

    case Intrinsic::annotation:

    case Intrinsic::assume:

    case Intrinsic::sideeffect:

    case Intrinsic::pseudoprobe:

    case Intrinsic::arithmetic_fence:

    case Intrinsic::dbg_assign:

    case Intrinsic::dbg_declare:

    case Intrinsic::dbg_value:

    case Intrinsic::dbg_label:

    case Intrinsic::invariant_start:

    case Intrinsic::invariant_end:

    case Intrinsic::launder_invariant_group:

    case Intrinsic::strip_invariant_group:

    case Intrinsic::is_constant:

    case Intrinsic::lifetime_start:

    case Intrinsic::lifetime_end:

    case Intrinsic::experimental_noalias_scope_decl:

    case Intrinsic::objectsize:

    case Intrinsic::ptr_annotation:

    case Intrinsic::var_annotation:

    case Intrinsic::experimental_gc_result:

    case Intrinsic::experimental_gc_relocate:

    case Intrinsic::coro_alloc:

    case Intrinsic::coro_begin:

    case Intrinsic::coro_begin_custom_abi:

    case Intrinsic::coro_free:

    case Intrinsic::coro_end:

    case Intrinsic::coro_frame:

    case Intrinsic::coro_size:

    case Intrinsic::coro_align:

    case Intrinsic::coro_suspend:

    case Intrinsic::coro_subfn_addr:

    case Intrinsic::threadlocal_address:

    case Intrinsic::experimental_widenable_condition:

    case Intrinsic::ssa_copy:

      // These intrinsics don't actually represent code after lowering.

      return 0;

    }

    return 1;

  }


  virtual InstructionCost getCallInstrCost(Function *F, Type *RetTy,

                                           ArrayRef<Type *> Tys,

                                           TTI::TargetCostKind CostKind) const {

    return 1;

  }


  // Assume that we have a register of the right size for the type.

  virtual unsigned getNumberOfParts(Type *Tp) const { return 1; }


  virtual InstructionCost getAddressComputationCost(Type *PtrTy,

                                                    ScalarEvolution *,

                                                    const SCEV *,

                                                    TTI::TargetCostKind) const {

    return 0;

  }


  virtual InstructionCost


  getArithmeticReductionCost(unsigned, VectorType *,

                             std::optional<FastMathFlags> FMF,

                             TTI::TargetCostKind) const {

    return 1;

  }


  virtual InstructionCost getMinMaxReductionCost(Intrinsic::ID IID,

                                                 VectorType *, FastMathFlags,

                                                 TTI::TargetCostKind) const {

    return 1;

  }


  virtual InstructionCost


  getExtendedReductionCost(unsigned Opcode, bool IsUnsigned, Type *ResTy,

                           VectorType *Ty, std::optional<FastMathFlags> FMF,

                           TTI::TargetCostKind CostKind) const {

    return 1;

  }


  virtual InstructionCost


  getMulAccReductionCost(bool IsUnsigned, unsigned RedOpcode, Type *ResTy,

                         VectorType *Ty, TTI::TargetCostKind CostKind) const {

    return 1;

  }


  virtual InstructionCost


  getCostOfKeepingLiveOverCall(ArrayRef<Type *> Tys) const {

    return 0;

  }


  virtual bool getTgtMemIntrinsic(IntrinsicInst *Inst,

                                  MemIntrinsicInfo &Info) const {

    return false;

  }


  virtual unsigned getAtomicMemIntrinsicMaxElementSize() const {

    // Note for overrides: You must ensure for all element unordered-atomic

    // memory intrinsics that all power-of-2 element sizes up to, and

    // including, the return value of this method have a corresponding

    // runtime lib call. These runtime lib call definitions can be found

    // in RuntimeLibcalls.h

    return 0;

  }


  virtual Value *


  getOrCreateResultFromMemIntrinsic(IntrinsicInst *Inst, Type *ExpectedType,

                                    bool CanCreate = true) const {

    return nullptr;

  }


  virtual Type *


  getMemcpyLoopLoweringType(LLVMContext &Context, Value *Length,

                            unsigned SrcAddrSpace, unsigned DestAddrSpace,

                            Align SrcAlign, Align DestAlign,

                            std::optional<uint32_t> AtomicElementSize) const {

    return AtomicElementSize ? Type::getIntNTy(Context, *AtomicElementSize * 8)

                             : Type::getInt8Ty(Context);

  }


  virtual void getMemcpyLoopResidualLoweringType(

      SmallVectorImpl<Type *> &OpsOut, LLVMContext &Context,

      unsigned RemainingBytes, unsigned SrcAddrSpace, unsigned DestAddrSpace,

      Align SrcAlign, Align DestAlign,

      std::optional<uint32_t> AtomicCpySize) const {

    unsigned OpSizeInBytes = AtomicCpySize.value_or(1);

    Type *OpType = Type::getIntNTy(Context, OpSizeInBytes * 8);

    for (unsigned i = 0; i != RemainingBytes; i += OpSizeInBytes)

      OpsOut.push_back(OpType);

  }


  virtual bool areInlineCompatible(const Function *Caller,

                                   const Function *Callee) const {

    return (Caller->getFnAttribute("target-cpu") ==

            Callee->getFnAttribute("target-cpu")) &&

           (Caller->getFnAttribute("target-features") ==

            Callee->getFnAttribute("target-features"));

  }


  virtual unsigned getInlineCallPenalty(const Function *F, const CallBase &Call,

                                        unsigned DefaultCallPenalty) const {

    return DefaultCallPenalty;

  }


  virtual bool areTypesABICompatible(const Function *Caller,

                                     const Function *Callee,

                                     const ArrayRef<Type *> &Types) const {

    return (Caller->getFnAttribute("target-cpu") ==

            Callee->getFnAttribute("target-cpu")) &&

           (Caller->getFnAttribute("target-features") ==

            Callee->getFnAttribute("target-features"));

  }


  virtual bool isIndexedLoadLegal(TTI::MemIndexedMode Mode, Type *Ty) const {

    return false;

  }


  virtual bool isIndexedStoreLegal(TTI::MemIndexedMode Mode, Type *Ty) const {

    return false;

  }


  virtual unsigned getLoadStoreVecRegBitWidth(unsigned AddrSpace) const {

    return 128;

  }


  virtual bool isLegalToVectorizeLoad(LoadInst *LI) const { return true; }


  virtual bool isLegalToVectorizeStore(StoreInst *SI) const { return true; }


  virtual bool isLegalToVectorizeLoadChain(unsigned ChainSizeInBytes,

                                           Align Alignment,

                                           unsigned AddrSpace) const {

    return true;

  }


  virtual bool isLegalToVectorizeStoreChain(unsigned ChainSizeInBytes,

                                            Align Alignment,

                                            unsigned AddrSpace) const {

    return true;

  }


  virtual bool isLegalToVectorizeReduction(const RecurrenceDescriptor &RdxDesc,

                                           ElementCount VF) const {

    return true;

  }


  virtual bool isElementTypeLegalForScalableVector(Type *Ty) const {

    return true;

  }


  virtual unsigned getLoadVectorFactor(unsigned VF, unsigned LoadSize,

                                       unsigned ChainSizeInBytes,

                                       VectorType *VecTy) const {

    return VF;

  }


  virtual unsigned getStoreVectorFactor(unsigned VF, unsigned StoreSize,

                                        unsigned ChainSizeInBytes,

                                        VectorType *VecTy) const {

    return VF;

  }


  virtual bool preferFixedOverScalableIfEqualCost(bool IsEpilogue) const {

    return false;

  }


  virtual bool preferInLoopReduction(RecurKind Kind, Type *Ty) const {

    return false;

  }


  virtual bool preferAlternateOpcodeVectorization() const { return true; }


  virtual bool preferPredicatedReductionSelect() const { return false; }


  virtual bool preferEpilogueVectorization() const { return true; }


  virtual bool shouldConsiderVectorizationRegPressure() const { return false; }


  virtual bool shouldExpandReduction(const IntrinsicInst *II) const {

    return true;

  }


  virtual TTI::ReductionShuffle


  getPreferredExpandedReductionShuffle(const IntrinsicInst *II) const {

    return TTI::ReductionShuffle::SplitHalf;

  }


  virtual unsigned getGISelRematGlobalCost() const { return 1; }


  virtual unsigned getMinTripCountTailFoldingThreshold() const { return 0; }


  virtual bool supportsScalableVectors() const { return false; }


  virtual bool enableScalableVectorization() const { return false; }


  virtual bool hasActiveVectorLength() const { return false; }


  virtual bool isProfitableToSinkOperands(Instruction *I,

                                          SmallVectorImpl<Use *> &Ops) const {

    return false;

  }


  virtual bool isVectorShiftByScalarCheap(Type *Ty) const { return false; }


  virtual TargetTransformInfo::VPLegalization


  getVPLegalizationStrategy(const VPIntrinsic &PI) const {

    return TargetTransformInfo::VPLegalization(

        /* EVLParamStrategy */ TargetTransformInfo::VPLegalization::Discard,

        /* OperatorStrategy */ TargetTransformInfo::VPLegalization::Convert);

  }


  virtual bool hasArmWideBranch(bool) const { return false; }


  virtual APInt getFeatureMask(const Function &F) const {

    return APInt::getZero(32);

  }


  virtual bool isMultiversionedFunction(const Function &F) const {

    return false;

  }


  virtual unsigned getMaxNumArgs() const { return UINT_MAX; }


  virtual unsigned getNumBytesToPadGlobalArray(unsigned Size,

                                               Type *ArrayType) const {

    return 0;

  }


  virtual void collectKernelLaunchBounds(

      const Function &F,

      SmallVectorImpl<std::pair<StringRef, int64_t>> &LB) const {}


  virtual bool allowVectorElementIndexingUsingGEP() const { return true; }


protected:

  // Obtain the minimum required size to hold the value (without the sign)

  // In case of a vector it returns the min required size for one element.


  unsigned minRequiredElementSize(const Value *Val, bool &isSigned) const {

    if (isa<ConstantDataVector>(Val) || isa<ConstantVector>(Val)) {

      const auto *VectorValue = cast<Constant>(Val);


      // In case of a vector need to pick the max between the min

      // required size for each element

      auto *VT = cast<FixedVectorType>(Val->getType());


      // Assume unsigned elements

      isSigned = false;


      // The max required size is the size of the vector element type

      unsigned MaxRequiredSize =

          VT->getElementType()->getPrimitiveSizeInBits().getFixedValue();


      unsigned MinRequiredSize = 0;

      for (unsigned i = 0, e = VT->getNumElements(); i < e; ++i) {

        if (auto *IntElement =

                dyn_cast<ConstantInt>(VectorValue->getAggregateElement(i))) {

          bool signedElement = IntElement->getValue().isNegative();

          // Get the element min required size.

          unsigned ElementMinRequiredSize =

              IntElement->getValue().getSignificantBits() - 1;

          // In case one element is signed then all the vector is signed.

          isSigned |= signedElement;

          // Save the max required bit size between all the elements.

          MinRequiredSize = std::max(MinRequiredSize, ElementMinRequiredSize);

        } else {

          // not an int constant element

          return MaxRequiredSize;

        }

      }

      return MinRequiredSize;

    }


    if (const auto *CI = dyn_cast<ConstantInt>(Val)) {

      isSigned = CI->getValue().isNegative();

      return CI->getValue().getSignificantBits() - 1;

    }


    if (const auto *Cast = dyn_cast<SExtInst>(Val)) {

      isSigned = true;

      return Cast->getSrcTy()->getScalarSizeInBits() - 1;

    }


    if (const auto *Cast = dyn_cast<ZExtInst>(Val)) {

      isSigned = false;

      return Cast->getSrcTy()->getScalarSizeInBits();

    }


    isSigned = false;

    return Val->getType()->getScalarSizeInBits();

  }


  bool isStridedAccess(const SCEV *Ptr) const {

    return Ptr && isa<SCEVAddRecExpr>(Ptr);

  }


  const SCEVConstant *getConstantStrideStep(ScalarEvolution *SE,

                                            const SCEV *Ptr) const {

    if (!isStridedAccess(Ptr))

      return nullptr;

    const SCEVAddRecExpr *AddRec = cast<SCEVAddRecExpr>(Ptr);

    return dyn_cast<SCEVConstant>(AddRec->getStepRecurrence(*SE));

  }


  bool isConstantStridedAccessLessThan(ScalarEvolution *SE, const SCEV *Ptr,

                                       int64_t MergeDistance) const {

    const SCEVConstant *Step = getConstantStrideStep(SE, Ptr);

    if (!Step)

      return false;

    APInt StrideVal = Step->getAPInt();

    if (StrideVal.getBitWidth() > 64)

      return false;

    // FIXME: Need to take absolute value for negative stride case.

    return StrideVal.getSExtValue() < MergeDistance;

  }


};


/// CRTP base class for use as a mix-in that aids implementing

/// a TargetTransformInfo-compatible class.

template <typename T>


class TargetTransformInfoImplCRTPBase : public TargetTransformInfoImplBase {

private:

  typedef TargetTransformInfoImplBase BaseT;


protected:

  explicit TargetTransformInfoImplCRTPBase(const DataLayout &DL) : BaseT(DL) {}


public:


  InstructionCost getGEPCost(Type *PointeeType, const Value *Ptr,

                             ArrayRef<const Value *> Operands, Type *AccessType,

                             TTI::TargetCostKind CostKind) const override {

    assert(PointeeType && Ptr && "can't get GEPCost of nullptr");

    auto *BaseGV = dyn_cast<GlobalValue>(Ptr->stripPointerCasts());

    bool HasBaseReg = (BaseGV == nullptr);


    auto PtrSizeBits = DL.getPointerTypeSizeInBits(Ptr->getType());

    APInt BaseOffset(PtrSizeBits, 0);

    int64_t Scale = 0;


    auto GTI = gep_type_begin(PointeeType, Operands);

    Type *TargetType = nullptr;


    // Handle the case where the GEP instruction has a single operand,

    // the basis, therefore TargetType is a nullptr.

    if (Operands.empty())

      return !BaseGV ? TTI::TCC_Free : TTI::TCC_Basic;


    for (auto I = Operands.begin(); I != Operands.end(); ++I, ++GTI) {

      TargetType = GTI.getIndexedType();

      // We assume that the cost of Scalar GEP with constant index and the

      // cost of Vector GEP with splat constant index are the same.

      const ConstantInt *ConstIdx = dyn_cast<ConstantInt>(*I);

      if (!ConstIdx)

        if (auto Splat = getSplatValue(*I))

          ConstIdx = dyn_cast<ConstantInt>(Splat);

      if (StructType *STy = GTI.getStructTypeOrNull()) {

        // For structures the index is always splat or scalar constant

        assert(ConstIdx && "Unexpected GEP index");

        uint64_t Field = ConstIdx->getZExtValue();

        BaseOffset += DL.getStructLayout(STy)->getElementOffset(Field);

      } else {

        // If this operand is a scalable type, bail out early.

        // TODO: Make isLegalAddressingMode TypeSize aware.

        if (TargetType->isScalableTy())

          return TTI::TCC_Basic;

        int64_t ElementSize =

            GTI.getSequentialElementStride(DL).getFixedValue();

        if (ConstIdx) {

          BaseOffset +=

              ConstIdx->getValue().sextOrTrunc(PtrSizeBits) * ElementSize;

        } else {

          // Needs scale register.

          if (Scale != 0)

            // No addressing mode takes two scale registers.

            return TTI::TCC_Basic;

          Scale = ElementSize;

        }

      }

    }


    // If we haven't been provided a hint, use the target type for now.

    //

    // TODO: Take a look at potentially removing this: This is *slightly* wrong

    // as it's possible to have a GEP with a foldable target type but a memory

    // access that isn't foldable. For example, this load isn't foldable on

    // RISC-V:

    //

    // %p = getelementptr i32, ptr %base, i32 42

    // %x = load <2 x i32>, ptr %p

    if (!AccessType)

      AccessType = TargetType;


    // If the final address of the GEP is a legal addressing mode for the given

    // access type, then we can fold it into its users.

    if (static_cast<const T *>(this)->isLegalAddressingMode(

            AccessType, const_cast<GlobalValue *>(BaseGV),

            BaseOffset.sextOrTrunc(64).getSExtValue(), HasBaseReg, Scale,

            Ptr->getType()->getPointerAddressSpace()))

      return TTI::TCC_Free;


    // TODO: Instead of returning TCC_Basic here, we should use

    // getArithmeticInstrCost. Or better yet, provide a hook to let the target

    // model it.

    return TTI::TCC_Basic;

  }


  InstructionCost


  getPointersChainCost(ArrayRef<const Value *> Ptrs, const Value *Base,

                       const TTI::PointersChainInfo &Info, Type *AccessTy,

                       TTI::TargetCostKind CostKind) const override {

    InstructionCost Cost = TTI::TCC_Free;

    // In the basic model we take into account GEP instructions only

    // (although here can come alloca instruction, a value, constants and/or

    // constant expressions, PHIs, bitcasts ... whatever allowed to be used as a

    // pointer). Typically, if Base is a not a GEP-instruction and all the

    // pointers are relative to the same base address, all the rest are

    // either GEP instructions, PHIs, bitcasts or constants. When we have same

    // base, we just calculate cost of each non-Base GEP as an ADD operation if

    // any their index is a non-const.

    // If no known dependecies between the pointers cost is calculated as a sum

    // of costs of GEP instructions.

    for (const Value *V : Ptrs) {

      const auto *GEP = dyn_cast<GetElementPtrInst>(V);

      if (!GEP)

        continue;

      if (Info.isSameBase() && V != Base) {

        if (GEP->hasAllConstantIndices())

          continue;

        Cost += static_cast<const T *>(this)->getArithmeticInstrCost(

            Instruction::Add, GEP->getType(), CostKind,

            {TTI::OK_AnyValue, TTI::OP_None}, {TTI::OK_AnyValue, TTI::OP_None},

            {});

      } else {

        SmallVector<const Value *> Indices(GEP->indices());

        Cost += static_cast<const T *>(this)->getGEPCost(

            GEP->getSourceElementType(), GEP->getPointerOperand(), Indices,

            AccessTy, CostKind);

      }

    }

    return Cost;

  }


  InstructionCost


  getInstructionCost(const User *U, ArrayRef<const Value *> Operands,

                     TTI::TargetCostKind CostKind) const override {

    using namespace llvm::PatternMatch;


    auto *TargetTTI = static_cast<const T *>(this);

    // Handle non-intrinsic calls, invokes, and callbr.

    // FIXME: Unlikely to be true for anything but CodeSize.

    auto *CB = dyn_cast<CallBase>(U);

    if (CB && !isa<IntrinsicInst>(U)) {

      if (const Function *F = CB->getCalledFunction()) {

        if (!TargetTTI->isLoweredToCall(F))

          return TTI::TCC_Basic; // Give a basic cost if it will be lowered


        return TTI::TCC_Basic * (F->getFunctionType()->getNumParams() + 1);

      }

      // For indirect or other calls, scale cost by number of arguments.

      return TTI::TCC_Basic * (CB->arg_size() + 1);

    }


    Type *Ty = U->getType();

    unsigned Opcode = Operator::getOpcode(U);

    auto *I = dyn_cast<Instruction>(U);

    switch (Opcode) {

    default:

      break;

    case Instruction::Call: {

      assert(isa<IntrinsicInst>(U) && "Unexpected non-intrinsic call");

      auto *Intrinsic = cast<IntrinsicInst>(U);

      IntrinsicCostAttributes CostAttrs(Intrinsic->getIntrinsicID(), *CB);

      return TargetTTI->getIntrinsicInstrCost(CostAttrs, CostKind);

    }

    case Instruction::Br:

    case Instruction::Ret:

    case Instruction::PHI:

    case Instruction::Switch:

      return TargetTTI->getCFInstrCost(Opcode, CostKind, I);

    case Instruction::Freeze:

      return TTI::TCC_Free;

    case Instruction::ExtractValue:

    case Instruction::InsertValue:

      return TargetTTI->getInsertExtractValueCost(Opcode, CostKind);

    case Instruction::Alloca:

      if (cast<AllocaInst>(U)->isStaticAlloca())

        return TTI::TCC_Free;

      break;

    case Instruction::GetElementPtr: {

      const auto *GEP = cast<GEPOperator>(U);

      Type *AccessType = nullptr;

      // For now, only provide the AccessType in the simple case where the GEP

      // only has one user.

      if (GEP->hasOneUser() && I)

        AccessType = I->user_back()->getAccessType();


      return TargetTTI->getGEPCost(GEP->getSourceElementType(),

                                   Operands.front(), Operands.drop_front(),

                                   AccessType, CostKind);

    }

    case Instruction::Add:

    case Instruction::FAdd:

    case Instruction::Sub:

    case Instruction::FSub:

    case Instruction::Mul:

    case Instruction::FMul:

    case Instruction::UDiv:

    case Instruction::SDiv:

    case Instruction::FDiv:

    case Instruction::URem:

    case Instruction::SRem:

    case Instruction::FRem:

    case Instruction::Shl:

    case Instruction::LShr:

    case Instruction::AShr:

    case Instruction::And:

    case Instruction::Or:

    case Instruction::Xor:

    case Instruction::FNeg: {

      const TTI::OperandValueInfo Op1Info = TTI::getOperandInfo(Operands[0]);

      TTI::OperandValueInfo Op2Info;

      if (Opcode != Instruction::FNeg)

        Op2Info = TTI::getOperandInfo(Operands[1]);

      return TargetTTI->getArithmeticInstrCost(Opcode, Ty, CostKind, Op1Info,

                                               Op2Info, Operands, I);

    }

    case Instruction::IntToPtr:

    case Instruction::PtrToAddr:

    case Instruction::PtrToInt:

    case Instruction::SIToFP:

    case Instruction::UIToFP:

    case Instruction::FPToUI:

    case Instruction::FPToSI:

    case Instruction::Trunc:

    case Instruction::FPTrunc:

    case Instruction::BitCast:

    case Instruction::FPExt:

    case Instruction::SExt:

    case Instruction::ZExt:

    case Instruction::AddrSpaceCast: {

      Type *OpTy = Operands[0]->getType();

      return TargetTTI->getCastInstrCost(

          Opcode, Ty, OpTy, TTI::getCastContextHint(I), CostKind, I);

    }

    case Instruction::Store: {

      auto *SI = cast<StoreInst>(U);

      Type *ValTy = Operands[0]->getType();

      TTI::OperandValueInfo OpInfo = TTI::getOperandInfo(Operands[0]);

      return TargetTTI->getMemoryOpCost(Opcode, ValTy, SI->getAlign(),

                                        SI->getPointerAddressSpace(), CostKind,

                                        OpInfo, I);

    }

    case Instruction::Load: {

      // FIXME: Arbitary cost which could come from the backend.

      if (CostKind == TTI::TCK_Latency)

        return 4;

      auto *LI = cast<LoadInst>(U);

      Type *LoadType = U->getType();

      // If there is a non-register sized type, the cost estimation may expand

      // it to be several instructions to load into multiple registers on the

      // target.  But, if the only use of the load is a trunc instruction to a

      // register sized type, the instruction selector can combine these

      // instructions to be a single load.  So, in this case, we use the

      // destination type of the trunc instruction rather than the load to

      // accurately estimate the cost of this load instruction.

      if (CostKind == TTI::TCK_CodeSize && LI->hasOneUse() &&

          !LoadType->isVectorTy()) {

        if (const TruncInst *TI = dyn_cast<TruncInst>(*LI->user_begin()))

          LoadType = TI->getDestTy();

      }

      return TargetTTI->getMemoryOpCost(Opcode, LoadType, LI->getAlign(),

                                        LI->getPointerAddressSpace(), CostKind,

                                        {TTI::OK_AnyValue, TTI::OP_None}, I);

    }

    case Instruction::Select: {

      const Value *Op0, *Op1;

      if (match(U, m_LogicalAnd(m_Value(Op0), m_Value(Op1))) ||

          match(U, m_LogicalOr(m_Value(Op0), m_Value(Op1)))) {

        // select x, y, false --> x & y

        // select x, true, y --> x | y

        const auto Op1Info = TTI::getOperandInfo(Op0);

        const auto Op2Info = TTI::getOperandInfo(Op1);

        assert(Op0->getType()->getScalarSizeInBits() == 1 &&

               Op1->getType()->getScalarSizeInBits() == 1);


        SmallVector<const Value *, 2> Operands{Op0, Op1};

        return TargetTTI->getArithmeticInstrCost(

            match(U, m_LogicalOr()) ? Instruction::Or : Instruction::And, Ty,

            CostKind, Op1Info, Op2Info, Operands, I);

      }

      const auto Op1Info = TTI::getOperandInfo(Operands[1]);

      const auto Op2Info = TTI::getOperandInfo(Operands[2]);

      Type *CondTy = Operands[0]->getType();

      return TargetTTI->getCmpSelInstrCost(Opcode, U->getType(), CondTy,

                                           CmpInst::BAD_ICMP_PREDICATE,

                                           CostKind, Op1Info, Op2Info, I);

    }

    case Instruction::ICmp:

    case Instruction::FCmp: {

      const auto Op1Info = TTI::getOperandInfo(Operands[0]);

      const auto Op2Info = TTI::getOperandInfo(Operands[1]);

      Type *ValTy = Operands[0]->getType();

      // TODO: Also handle ICmp/FCmp constant expressions.

      return TargetTTI->getCmpSelInstrCost(Opcode, ValTy, U->getType(),

                                           I ? cast<CmpInst>(I)->getPredicate()

                                             : CmpInst::BAD_ICMP_PREDICATE,

                                           CostKind, Op1Info, Op2Info, I);

    }

    case Instruction::InsertElement: {

      auto *IE = dyn_cast<InsertElementInst>(U);

      if (!IE)

        return TTI::TCC_Basic; // FIXME

      unsigned Idx = -1;

      if (auto *CI = dyn_cast<ConstantInt>(Operands[2]))

        if (CI->getValue().getActiveBits() <= 32)

          Idx = CI->getZExtValue();

      return TargetTTI->getVectorInstrCost(*IE, Ty, CostKind, Idx);

    }

    case Instruction::ShuffleVector: {

      auto *Shuffle = dyn_cast<ShuffleVectorInst>(U);

      if (!Shuffle)

        return TTI::TCC_Basic; // FIXME


      auto *VecTy = cast<VectorType>(U->getType());

      auto *VecSrcTy = cast<VectorType>(Operands[0]->getType());

      ArrayRef<int> Mask = Shuffle->getShuffleMask();

      int NumSubElts, SubIndex;


      // Treat undef/poison mask as free (no matter the length).

      if (all_of(Mask, [](int M) { return M < 0; }))

        return TTI::TCC_Free;


      // TODO: move more of this inside improveShuffleKindFromMask.

      if (Shuffle->changesLength()) {

        // Treat a 'subvector widening' as a free shuffle.

        if (Shuffle->increasesLength() && Shuffle->isIdentityWithPadding())

          return TTI::TCC_Free;


        if (Shuffle->isExtractSubvectorMask(SubIndex))

          return TargetTTI->getShuffleCost(TTI::SK_ExtractSubvector, VecTy,

                                           VecSrcTy, Mask, CostKind, SubIndex,

                                           VecTy, Operands, Shuffle);


        if (Shuffle->isInsertSubvectorMask(NumSubElts, SubIndex))

          return TargetTTI->getShuffleCost(

              TTI::SK_InsertSubvector, VecTy, VecSrcTy, Mask, CostKind,

              SubIndex,

              FixedVectorType::get(VecTy->getScalarType(), NumSubElts),

              Operands, Shuffle);


        int ReplicationFactor, VF;

        if (Shuffle->isReplicationMask(ReplicationFactor, VF)) {

          APInt DemandedDstElts = APInt::getZero(Mask.size());

          for (auto I : enumerate(Mask)) {

            if (I.value() != PoisonMaskElem)

              DemandedDstElts.setBit(I.index());

          }

          return TargetTTI->getReplicationShuffleCost(

              VecSrcTy->getElementType(), ReplicationFactor, VF,

              DemandedDstElts, CostKind);

        }


        bool IsUnary = isa<UndefValue>(Operands[1]);

        NumSubElts = VecSrcTy->getElementCount().getKnownMinValue();

        SmallVector<int, 16> AdjustMask(Mask);


        // Widening shuffle - widening the source(s) to the new length

        // (treated as free - see above), and then perform the adjusted

        // shuffle at that width.

        if (Shuffle->increasesLength()) {

          for (int &M : AdjustMask)

            M = M >= NumSubElts ? (M + (Mask.size() - NumSubElts)) : M;


          return TargetTTI->getShuffleCost(

              IsUnary ? TTI::SK_PermuteSingleSrc : TTI::SK_PermuteTwoSrc, VecTy,

              VecTy, AdjustMask, CostKind, 0, nullptr, Operands, Shuffle);

        }


        // Narrowing shuffle - perform shuffle at original wider width and

        // then extract the lower elements.

        // FIXME: This can assume widening, which is not true of all vector

        // architectures (and is not even the default).

        AdjustMask.append(NumSubElts - Mask.size(), PoisonMaskElem);


        InstructionCost ShuffleCost = TargetTTI->getShuffleCost(

            IsUnary ? TTI::SK_PermuteSingleSrc : TTI::SK_PermuteTwoSrc,

            VecSrcTy, VecSrcTy, AdjustMask, CostKind, 0, nullptr, Operands,

            Shuffle);


        SmallVector<int, 16> ExtractMask(Mask.size());

        std::iota(ExtractMask.begin(), ExtractMask.end(), 0);

        return ShuffleCost + TargetTTI->getShuffleCost(

                                 TTI::SK_ExtractSubvector, VecTy, VecSrcTy,

                                 ExtractMask, CostKind, 0, VecTy, {}, Shuffle);

      }


      if (Shuffle->isIdentity())

        return TTI::TCC_Free;


      if (Shuffle->isReverse())

        return TargetTTI->getShuffleCost(TTI::SK_Reverse, VecTy, VecSrcTy, Mask,

                                         CostKind, 0, nullptr, Operands,

                                         Shuffle);


      if (Shuffle->isTranspose())

        return TargetTTI->getShuffleCost(TTI::SK_Transpose, VecTy, VecSrcTy,

                                         Mask, CostKind, 0, nullptr, Operands,

                                         Shuffle);


      if (Shuffle->isZeroEltSplat())

        return TargetTTI->getShuffleCost(TTI::SK_Broadcast, VecTy, VecSrcTy,

                                         Mask, CostKind, 0, nullptr, Operands,

                                         Shuffle);


      if (Shuffle->isSingleSource())

        return TargetTTI->getShuffleCost(TTI::SK_PermuteSingleSrc, VecTy,

                                         VecSrcTy, Mask, CostKind, 0, nullptr,

                                         Operands, Shuffle);


      if (Shuffle->isInsertSubvectorMask(NumSubElts, SubIndex))

        return TargetTTI->getShuffleCost(

            TTI::SK_InsertSubvector, VecTy, VecSrcTy, Mask, CostKind, SubIndex,

            FixedVectorType::get(VecTy->getScalarType(), NumSubElts), Operands,

            Shuffle);


      if (Shuffle->isSelect())

        return TargetTTI->getShuffleCost(TTI::SK_Select, VecTy, VecSrcTy, Mask,

                                         CostKind, 0, nullptr, Operands,

                                         Shuffle);


      if (Shuffle->isSplice(SubIndex))

        return TargetTTI->getShuffleCost(TTI::SK_Splice, VecTy, VecSrcTy, Mask,

                                         CostKind, SubIndex, nullptr, Operands,

                                         Shuffle);


      return TargetTTI->getShuffleCost(TTI::SK_PermuteTwoSrc, VecTy, VecSrcTy,

                                       Mask, CostKind, 0, nullptr, Operands,

                                       Shuffle);

    }

    case Instruction::ExtractElement: {

      auto *EEI = dyn_cast<ExtractElementInst>(U);

      if (!EEI)

        return TTI::TCC_Basic; // FIXME

      unsigned Idx = -1;

      if (auto *CI = dyn_cast<ConstantInt>(Operands[1]))

        if (CI->getValue().getActiveBits() <= 32)

          Idx = CI->getZExtValue();

      Type *DstTy = Operands[0]->getType();

      return TargetTTI->getVectorInstrCost(*EEI, DstTy, CostKind, Idx);

    }

    }


    // By default, just classify everything remaining as 'basic'.

    return TTI::TCC_Basic;

  }


  bool isExpensiveToSpeculativelyExecute(const Instruction *I) const override {

    auto *TargetTTI = static_cast<const T *>(this);

    SmallVector<const Value *, 4> Ops(I->operand_values());

    InstructionCost Cost = TargetTTI->getInstructionCost(

        I, Ops, TargetTransformInfo::TCK_SizeAndLatency);

    return Cost >= TargetTransformInfo::TCC_Expensive;

  }


  bool supportsTailCallFor(const CallBase *CB) const override {

    return static_cast<const T *>(this)->supportsTailCalls();

  }


};


} // namespace llvm


#endif

assert
assert(UImm &&(UImm !=~static_cast< T >(0)) &&"Invalid immediate!")

Info
Analysis containing CSE Info
Definition CSEInfo.cpp:27

CostKind
static cl::opt< OutputCostKind > CostKind("cost-kind", cl::desc("Target cost kind"), cl::init(OutputCostKind::RecipThroughput), cl::values(clEnumValN(OutputCostKind::RecipThroughput, "throughput", "Reciprocal throughput"), clEnumValN(OutputCostKind::Latency, "latency", "Instruction latency"), clEnumValN(OutputCostKind::CodeSize, "code-size", "Code size"), clEnumValN(OutputCostKind::SizeAndLatency, "size-latency", "Code size and latency"), clEnumValN(OutputCostKind::All, "all", "Print all cost kinds")))

IntrinsicCostStrategy::InstructionCost
@ InstructionCost
Definition CostModel.cpp:52

DataLayout.h

isSigned
static bool isSigned(unsigned int Opcode)
Definition ExpandLargeDivRem.cpp:52

GetElementPtrTypeIterator.h

GEP
Hexagon Common GEP
Definition HexagonCommonGEP.cpp:164

IntrinsicInst.h

Operator.h

InlinePriorityMode::Size
@ Size
Definition InlineOrder.cpp:25

Ops
const AbstractManglingParser< Derived, Alloc >::OperatorInfo AbstractManglingParser< Derived, Alloc >::Ops[]
Definition ItaniumDemangle.h:3368

F
#define F(x, y, z)
Definition MD5.cpp:55

I
#define I(x, y, z)
Definition MD5.cpp:58

Operands
mir Rename Register Operands
Definition MIRNamerPass.cpp:74

T
#define T
Definition Mips16ISelLowering.cpp:353

II
uint64_t IntrinsicInst * II
Definition NVVMIntrRange.cpp:46

Field
OptimizedStructLayoutField Field
Definition OptimizedStructLayout.cpp:18

PatternMatch.h

Mode
static cl::opt< RegAllocEvictionAdvisorAnalysisLegacy::AdvisorMode > Mode("regalloc-enable-advisor", cl::Hidden, cl::init(RegAllocEvictionAdvisorAnalysisLegacy::AdvisorMode::Default), cl::desc("Enable regalloc advisor mode"), cl::values(clEnumValN(RegAllocEvictionAdvisorAnalysisLegacy::AdvisorMode::Default, "default", "Default"), clEnumValN(RegAllocEvictionAdvisorAnalysisLegacy::AdvisorMode::Release, "release", "precompiled"), clEnumValN(RegAllocEvictionAdvisorAnalysisLegacy::AdvisorMode::Development, "development", "for training")))

ScalarEvolutionExpressions.h

getType
static SymbolRef::Type getType(const Symbol *Sym)
Definition TapiFile.cpp:39

Ptr
@ Ptr
Definition TargetLibraryInfo.cpp:77

TargetTransformInfo.h
This pass exposes codegen information to IR-level passes.

VectorUtils.h

llvm::APInt
Class for arbitrary precision integers.
Definition APInt.h:78

llvm::APInt::setBit
void setBit(unsigned BitPosition)
Set the given bit to 1 whose position is given as "bitPosition".
Definition APInt.h:1330

llvm::APInt::getBitWidth
unsigned getBitWidth() const
Return the number of bits in the APInt.
Definition APInt.h:1488

llvm::APInt::sextOrTrunc
LLVM_ABI APInt sextOrTrunc(unsigned width) const
Sign extend or truncate to width.
Definition APInt.cpp:1041

llvm::APInt::getZero
static APInt getZero(unsigned numBits)
Get the '0' value for the specified bit-width.
Definition APInt.h:200

llvm::APInt::getSExtValue
int64_t getSExtValue() const
Get sign extended value.
Definition APInt.h:1562

llvm::AllocaInst
an instruction to allocate memory on the stack
Definition Instructions.h:65

llvm::ArrayRef
ArrayRef - Represent a constant reference to an array (0 or more elements consecutively in memory),...
Definition ArrayRef.h:41

llvm::ArrayType
Class to represent array types.
Definition DerivedTypes.h:398

llvm::AssumptionCache
A cache of @llvm.assume calls within a function.
Definition AssumptionCache.h:44

llvm::BlockFrequencyInfo
BlockFrequencyInfo pass uses BlockFrequencyInfoImpl implementation to estimate IR basic block frequen...
Definition BlockFrequencyInfo.h:38

llvm::BranchInst
Conditional or Unconditional Branch instruction.
Definition Instructions.h:3058

llvm::BranchProbability
Definition BranchProbability.h:32

llvm::CallBase
Base class for all callable instructions (InvokeInst and CallInst) Holds everything related to callin...
Definition InstrTypes.h:1116

llvm::CmpInst::Predicate
Predicate
This enumeration lists the possible predicates for CmpInst subclasses.
Definition InstrTypes.h:678

llvm::CmpInst::BAD_ICMP_PREDICATE
@ BAD_ICMP_PREDICATE
Definition InstrTypes.h:711

llvm::ConstantInt
This is the shared class of boolean and integer constants.
Definition Constants.h:87

llvm::ConstantInt::getZExtValue
uint64_t getZExtValue() const
Return the constant as a 64-bit unsigned integer value after it has been zero extended as appropriate...
Definition Constants.h:163

llvm::ConstantInt::getValue
const APInt & getValue() const
Return the constant as an APInt value reference.
Definition Constants.h:154

llvm::Constant
This is an important base class in LLVM.
Definition Constant.h:43

llvm::DataLayout
A parsed version of the target data layout string in and methods for querying it.
Definition DataLayout.h:63

llvm::DominatorTree
Concrete subclass of DominatorTreeBase that is used to compute a normal dominator tree.
Definition Dominators.h:165

llvm::ElementCount
Definition TypeSize.h:299

llvm::ElementCount::get
static constexpr ElementCount get(ScalarTy MinVal, bool Scalable)
Definition TypeSize.h:316

llvm::FastMathFlags
Convenience struct for specifying and reasoning about fast-math flags.
Definition FMF.h:22

llvm::FixedVectorType::get
static LLVM_ABI FixedVectorType * get(Type *ElementType, unsigned NumElts)
Definition Type.cpp:803

llvm::Function
Definition Function.h:64

llvm::GlobalValue
Definition GlobalValue.h:49

llvm::InstCombiner
The core instruction combiner logic.
Definition InstCombiner.h:48

llvm::InstructionCost
Definition InstructionCost.h:30

llvm::InstructionCost::getInvalid
static InstructionCost getInvalid(CostType Val=0)
Definition InstructionCost.h:74

llvm::Instruction
Definition Instruction.h:69

llvm::IntrinsicCostAttributes
Definition TargetTransformInfo.h:126

llvm::IntrinsicCostAttributes::getID
Intrinsic::ID getID() const
Definition TargetTransformInfo.h:159

llvm::IntrinsicInst
A wrapper class for inspecting calls to intrinsic functions.
Definition IntrinsicInst.h:49

llvm::LLVMContext
This is an important class for using LLVM in a threaded context.
Definition LLVMContext.h:68

llvm::LoadInst
An instruction for reading from memory.
Definition Instructions.h:181

llvm::LoopInfo
Definition LoopInfo.h:408

llvm::Loop
Represents a single loop in the control flow graph.
Definition LoopInfo.h:40

llvm::Operator::getOpcode
unsigned getOpcode() const
Return the opcode for this Instruction or ConstantExpr.
Definition Operator.h:43

llvm::OptimizationRemarkEmitter
The optimization diagnostic interface.
Definition OptimizationRemarkEmitter.h:33

llvm::ProfileSummaryInfo
Analysis providing profile information.
Definition ProfileSummaryInfo.h:42

llvm::RecurrenceDescriptor
The RecurrenceDescriptor is used to identify recurrences variables in a loop.
Definition IVDescriptors.h:90

llvm::SCEVAddRecExpr
This node represents a polynomial recurrence on the trip count of the specified loop.
Definition ScalarEvolutionExpressions.h:348

llvm::SCEVAddRecExpr::getStepRecurrence
const SCEV * getStepRecurrence(ScalarEvolution &SE) const
Constructs and returns the recurrence indicating how much this expression steps by.
Definition ScalarEvolutionExpressions.h:366

llvm::SCEVConstant
This class represents a constant integer value.
Definition ScalarEvolutionExpressions.h:61

llvm::SCEVConstant::getAPInt
const APInt & getAPInt() const
Definition ScalarEvolutionExpressions.h:71

llvm::SCEV
This class represents an analyzed expression in the program.
Definition ScalarEvolution.h:72

llvm::ScalarEvolution
The main scalar evolution driver.
Definition ScalarEvolution.h:448

llvm::SmallBitVector
This is a 'bitvector' (really, a variable-sized bit array), optimized for the case when the array is ...
Definition SmallBitVector.h:35

llvm::SmallVectorImpl
This class consists of common code factored out of the SmallVector class to reduce code duplication b...
Definition SmallVector.h:573

llvm::SmallVectorImpl::append
void append(ItTy in_start, ItTy in_end)
Add the specified range to the end of the SmallVector.
Definition SmallVector.h:683

llvm::SmallVectorTemplateBase::push_back
void push_back(const T &Elt)
Definition SmallVector.h:416

llvm::SmallVectorTemplateCommon::end
iterator end()
Definition SmallVector.h:272

llvm::SmallVectorTemplateCommon::begin
iterator begin()
Definition SmallVector.h:270

llvm::SmallVector
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
Definition SmallVector.h:1196

llvm::StackOffset
StackOffset holds a fixed and a scalable offset in bytes.
Definition TypeSize.h:31

llvm::StackOffset::getScalable
static StackOffset getScalable(int64_t Scalable)
Definition TypeSize.h:41

llvm::StackOffset::getFixed
static StackOffset getFixed(int64_t Fixed)
Definition TypeSize.h:40

llvm::StoreInst
An instruction for storing to memory.
Definition Instructions.h:297

llvm::StringRef
StringRef - Represent a constant reference to a string, i.e.
Definition StringRef.h:55

llvm::StructType
Class to represent struct types.
Definition DerivedTypes.h:218

llvm::SwitchInst
Multiway switch.
Definition Instructions.h:3196

llvm::TargetLibraryInfo
Provides information about what library functions are available for the current target.
Definition TargetLibraryInfo.h:285

llvm::TargetTransformInfoImplBase::getPointersChainCost
virtual InstructionCost getPointersChainCost(ArrayRef< const Value * > Ptrs, const Value *Base, const TTI::PointersChainInfo &Info, Type *AccessTy, TTI::TargetCostKind CostKind) const
Definition TargetTransformInfoImpl.h:68

llvm::TargetTransformInfoImplBase::preferAlternateOpcodeVectorization
virtual bool preferAlternateOpcodeVectorization() const
Definition TargetTransformInfoImpl.h:1094

llvm::TargetTransformInfoImplBase::isProfitableLSRChainElement
virtual bool isProfitableLSRChainElement(Instruction *I) const
Definition TargetTransformInfoImpl.h:294

llvm::TargetTransformInfoImplBase::getCallerAllocaCost
virtual unsigned getCallerAllocaCost(const CallBase *CB, const AllocaInst *AI) const
Definition TargetTransformInfoImpl.h:105

llvm::TargetTransformInfoImplBase::shouldBuildLookupTables
virtual bool shouldBuildLookupTables() const
Definition TargetTransformInfoImpl.h:424

llvm::TargetTransformInfoImplBase::getInliningLastCallToStaticBonus
virtual int getInliningLastCallToStaticBonus() const
Definition TargetTransformInfoImpl.h:97

llvm::TargetTransformInfoImplBase::getTgtMemIntrinsic
virtual bool getTgtMemIntrinsic(IntrinsicInst *Inst, MemIntrinsicInfo &Info) const
Definition TargetTransformInfoImpl.h:976

llvm::TargetTransformInfoImplBase::getCostOfKeepingLiveOverCall
virtual InstructionCost getCostOfKeepingLiveOverCall(ArrayRef< Type * > Tys) const
Definition TargetTransformInfoImpl.h:972

llvm::TargetTransformInfoImplBase::getMaximumVF
virtual unsigned getMaximumVF(unsigned ElemWidth, unsigned Opcode) const
Definition TargetTransformInfoImpl.h:604

llvm::TargetTransformInfoImplBase::getMulAccReductionCost
virtual InstructionCost getMulAccReductionCost(bool IsUnsigned, unsigned RedOpcode, Type *ResTy, VectorType *Ty, TTI::TargetCostKind CostKind) const
Definition TargetTransformInfoImpl.h:966

llvm::TargetTransformInfoImplBase::getDataLayout
virtual const DataLayout & getDataLayout() const
Definition TargetTransformInfoImpl.h:50

llvm::TargetTransformInfoImplBase::preferFixedOverScalableIfEqualCost
virtual bool preferFixedOverScalableIfEqualCost(bool IsEpilogue) const
Definition TargetTransformInfoImpl.h:1087

llvm::TargetTransformInfoImplBase::getCacheAssociativity
virtual std::optional< unsigned > getCacheAssociativity(TargetTransformInfo::CacheLevel Level) const
Definition TargetTransformInfoImpl.h:630

llvm::TargetTransformInfoImplBase::getCallInstrCost
virtual InstructionCost getCallInstrCost(Function *F, Type *RetTy, ArrayRef< Type * > Tys, TTI::TargetCostKind CostKind) const
Definition TargetTransformInfoImpl.h:929

llvm::TargetTransformInfoImplBase::enableInterleavedAccessVectorization
virtual bool enableInterleavedAccessVectorization() const
Definition TargetTransformInfoImpl.h:499

llvm::TargetTransformInfoImplBase::getGatherScatterOpCost
virtual InstructionCost getGatherScatterOpCost(unsigned Opcode, Type *DataTy, const Value *Ptr, bool VariableMask, Align Alignment, TTI::TargetCostKind CostKind, const Instruction *I=nullptr) const
Definition TargetTransformInfoImpl.h:852

llvm::TargetTransformInfoImplBase::getFPOpCost
virtual InstructionCost getFPOpCost(Type *Ty) const
Definition TargetTransformInfoImpl.h:528

llvm::TargetTransformInfoImplBase::getMaxInterleaveFactor
virtual unsigned getMaxInterleaveFactor(ElementCount VF) const
Definition TargetTransformInfoImpl.h:662

llvm::TargetTransformInfoImplBase::isLegalMaskedExpandLoad
virtual bool isLegalMaskedExpandLoad(Type *DataType, Align Alignment) const
Definition TargetTransformInfoImpl.h:369

llvm::TargetTransformInfoImplBase::enableMemCmpExpansion
virtual TTI::MemCmpExpansionOptions enableMemCmpExpansion(bool OptSize, bool IsZeroCmp) const
Definition TargetTransformInfoImpl.h:480

llvm::TargetTransformInfoImplBase::supportsTailCalls
virtual bool supportsTailCalls() const
Definition TargetTransformInfoImpl.h:469

llvm::TargetTransformInfoImplBase::isLegalToVectorizeLoadChain
virtual bool isLegalToVectorizeLoadChain(unsigned ChainSizeInBytes, Align Alignment, unsigned AddrSpace) const
Definition TargetTransformInfoImpl.h:1054

llvm::TargetTransformInfoImplBase::isStridedAccess
bool isStridedAccess(const SCEV *Ptr) const
Definition TargetTransformInfoImpl.h:1215

llvm::TargetTransformInfoImplBase::~TargetTransformInfoImplBase
virtual ~TargetTransformInfoImplBase()

llvm::TargetTransformInfoImplBase::getAtomicMemIntrinsicMaxElementSize
virtual unsigned getAtomicMemIntrinsicMaxElementSize() const
Definition TargetTransformInfoImpl.h:981

llvm::TargetTransformInfoImplBase::rewriteIntrinsicWithAddressSpace
virtual Value * rewriteIntrinsicWithAddressSpace(IntrinsicInst *II, Value *OldV, Value *NewV) const
Definition TargetTransformInfoImpl.h:168

llvm::TargetTransformInfoImplBase::isLegalMaskedLoad
virtual bool isLegalMaskedLoad(Type *DataType, Align Alignment, unsigned AddressSpace) const
Definition TargetTransformInfoImpl.h:316

llvm::TargetTransformInfoImplBase::supportsScalableVectors
virtual bool supportsScalableVectors() const
Definition TargetTransformInfoImpl.h:1115

llvm::TargetTransformInfoImplBase::getVPLegalizationStrategy
virtual TargetTransformInfo::VPLegalization getVPLegalizationStrategy(const VPIntrinsic &PI) const
Definition TargetTransformInfoImpl.h:1129

llvm::TargetTransformInfoImplBase::enableAggressiveInterleaving
virtual bool enableAggressiveInterleaving(bool LoopHasReductions) const
Definition TargetTransformInfoImpl.h:475

llvm::TargetTransformInfoImplBase::simplifyDemandedVectorEltsIntrinsic
virtual std::optional< Value * > simplifyDemandedVectorEltsIntrinsic(InstCombiner &IC, IntrinsicInst &II, APInt DemandedElts, APInt &UndefElts, APInt &UndefElts2, APInt &UndefElts3, std::function< void(Instruction *, unsigned, APInt, APInt &)> SimplifyAndSetOp) const
Definition TargetTransformInfoImpl.h:251

llvm::TargetTransformInfoImplBase::getAddressComputationCost
virtual InstructionCost getAddressComputationCost(Type *PtrTy, ScalarEvolution *, const SCEV *, TTI::TargetCostKind) const
Definition TargetTransformInfoImpl.h:938

llvm::TargetTransformInfoImplBase::getVectorInstrCost
virtual InstructionCost getVectorInstrCost(unsigned Opcode, Type *Val, TTI::TargetCostKind CostKind, unsigned Index, const Value *Op0, const Value *Op1) const
Definition TargetTransformInfoImpl.h:787

llvm::TargetTransformInfoImplBase::isLegalBroadcastLoad
virtual bool isLegalBroadcastLoad(Type *ElementTy, ElementCount NumElements) const
Definition TargetTransformInfoImpl.h:335

llvm::TargetTransformInfoImplBase::isSingleThreaded
virtual bool isSingleThreaded() const
Definition TargetTransformInfoImpl.h:161

llvm::TargetTransformInfoImplBase::isIndexedLoadLegal
virtual bool isIndexedLoadLegal(TTI::MemIndexedMode Mode, Type *Ty) const
Definition TargetTransformInfoImpl.h:1038

llvm::TargetTransformInfoImplBase::adjustInliningThreshold
virtual unsigned adjustInliningThreshold(const CallBase *CB) const
Definition TargetTransformInfoImpl.h:102

llvm::TargetTransformInfoImplBase::getPartialReductionCost
virtual InstructionCost getPartialReductionCost(unsigned Opcode, Type *InputTypeA, Type *InputTypeB, Type *AccumType, ElementCount VF, TTI::PartialReductionExtendKind OpAExtend, TTI::PartialReductionExtendKind OpBExtend, std::optional< unsigned > BinOp, TTI::TargetCostKind CostKind) const
Definition TargetTransformInfoImpl.h:654

llvm::TargetTransformInfoImplBase::getLoadVectorFactor
virtual unsigned getLoadVectorFactor(unsigned VF, unsigned LoadSize, unsigned ChainSizeInBytes, VectorType *VecTy) const
Definition TargetTransformInfoImpl.h:1075

llvm::TargetTransformInfoImplBase::shouldDropLSRSolutionIfLessProfitable
virtual bool shouldDropLSRSolutionIfLessProfitable() const
Definition TargetTransformInfoImpl.h:292

llvm::TargetTransformInfoImplBase::hasVolatileVariant
virtual bool hasVolatileVariant(Instruction *I, unsigned AddrSpace) const
Definition TargetTransformInfoImpl.h:394

llvm::TargetTransformInfoImplBase::canMacroFuseCmp
virtual bool canMacroFuseCmp() const
Definition TargetTransformInfoImpl.h:298

llvm::TargetTransformInfoImplBase::getInlinerVectorBonusPercent
virtual int getInlinerVectorBonusPercent() const
Definition TargetTransformInfoImpl.h:110

llvm::TargetTransformInfoImplBase::prefersVectorizedAddressing
virtual bool prefersVectorizedAddressing() const
Definition TargetTransformInfoImpl.h:398

llvm::TargetTransformInfoImplBase::hasDivRemOp
virtual bool hasDivRemOp(Type *DataType, bool IsSigned) const
Definition TargetTransformInfoImpl.h:390

llvm::TargetTransformInfoImplBase::isLegalStridedLoadStore
virtual bool isLegalStridedLoadStore(Type *DataType, Align Alignment) const
Definition TargetTransformInfoImpl.h:373

llvm::TargetTransformInfoImplBase::getStoreMinimumVF
virtual unsigned getStoreMinimumVF(unsigned VF, Type *, Type *) const
Definition TargetTransformInfoImpl.h:607

llvm::TargetTransformInfoImplBase::isLegalICmpImmediate
virtual bool isLegalICmpImmediate(int64_t Imm) const
Definition TargetTransformInfoImpl.h:270

llvm::TargetTransformInfoImplBase::LSRWithInstrQueries
virtual bool LSRWithInstrQueries() const
Definition TargetTransformInfoImpl.h:412

llvm::TargetTransformInfoImplBase::preferPredicatedReductionSelect
virtual bool preferPredicatedReductionSelect() const
Definition TargetTransformInfoImpl.h:1096

llvm::TargetTransformInfoImplBase::getMemoryOpCost
virtual InstructionCost getMemoryOpCost(unsigned Opcode, Type *Src, Align Alignment, unsigned AddressSpace, TTI::TargetCostKind CostKind, TTI::OperandValueInfo OpInfo, const Instruction *I) const
Definition TargetTransformInfoImpl.h:838

llvm::TargetTransformInfoImplBase::useAA
virtual bool useAA() const
Definition TargetTransformInfoImpl.h:418

llvm::TargetTransformInfoImplBase::preferPredicateOverEpilogue
virtual bool preferPredicateOverEpilogue(TailFoldingInfo *TFI) const
Definition TargetTransformInfoImpl.h:230

llvm::TargetTransformInfoImplBase::haveFastSqrt
virtual bool haveFastSqrt(Type *Ty) const
Definition TargetTransformInfoImpl.h:520

llvm::TargetTransformInfoImplBase::getMinimumVF
virtual ElementCount getMinimumVF(unsigned ElemWidth, bool IsScalable) const
Definition TargetTransformInfoImpl.h:600

llvm::TargetTransformInfoImplBase::collectFlatAddressOperands
virtual bool collectFlatAddressOperands(SmallVectorImpl< int > &OpIndexes, Intrinsic::ID IID) const
Definition TargetTransformInfoImpl.h:148

llvm::TargetTransformInfoImplBase::addrspacesMayAlias
virtual bool addrspacesMayAlias(unsigned AS0, unsigned AS1) const
Definition TargetTransformInfoImpl.h:142

llvm::TargetTransformInfoImplBase::canSaveCmp
virtual bool canSaveCmp(Loop *L, BranchInst **BI, ScalarEvolution *SE, LoopInfo *LI, DominatorTree *DT, AssumptionCache *AC, TargetLibraryInfo *LibInfo) const
Definition TargetTransformInfoImpl.h:300

llvm::TargetTransformInfoImplBase::getVectorInstrCost
virtual InstructionCost getVectorInstrCost(const Instruction &I, Type *Val, TTI::TargetCostKind CostKind, unsigned Index) const
Definition TargetTransformInfoImpl.h:805

llvm::TargetTransformInfoImplBase::getRegisterClassForType
virtual unsigned getRegisterClassForType(bool Vector, Type *Ty=nullptr) const
Definition TargetTransformInfoImpl.h:566

llvm::TargetTransformInfoImplBase::getVScaleForTuning
virtual std::optional< unsigned > getVScaleForTuning() const
Definition TargetTransformInfoImpl.h:590

llvm::TargetTransformInfoImplBase::getIntImmCost
virtual InstructionCost getIntImmCost(const APInt &Imm, Type *Ty, TTI::TargetCostKind CostKind) const
Definition TargetTransformInfoImpl.h:538

llvm::TargetTransformInfoImplBase::getScalingFactorCost
virtual InstructionCost getScalingFactorCost(Type *Ty, GlobalValue *BaseGV, StackOffset BaseOffset, bool HasBaseReg, int64_t Scale, unsigned AddrSpace) const
Definition TargetTransformInfoImpl.h:400

llvm::TargetTransformInfoImplBase::getNumberOfParts
virtual unsigned getNumberOfParts(Type *Tp) const
Definition TargetTransformInfoImpl.h:936

llvm::TargetTransformInfoImplBase::isLegalMaskedCompressStore
virtual bool isLegalMaskedCompressStore(Type *DataType, Align Alignment) const
Definition TargetTransformInfoImpl.h:358

llvm::TargetTransformInfoImplBase::isHardwareLoopProfitable
virtual bool isHardwareLoopProfitable(Loop *L, ScalarEvolution &SE, AssumptionCache &AC, TargetLibraryInfo *LibInfo, HardwareLoopInfo &HWLoopInfo) const
Definition TargetTransformInfoImpl.h:221

llvm::TargetTransformInfoImplBase::getPeelingPreferences
virtual void getPeelingPreferences(Loop *, ScalarEvolution &, TTI::PeelingPreferences &) const
Definition TargetTransformInfoImpl.h:263

llvm::TargetTransformInfoImplBase::simplifyDemandedUseBitsIntrinsic
virtual std::optional< Value * > simplifyDemandedUseBitsIntrinsic(InstCombiner &IC, IntrinsicInst &II, APInt DemandedMask, KnownBits &Known, bool &KnownBitsComputed) const
Definition TargetTransformInfoImpl.h:245

llvm::TargetTransformInfoImplBase::useColdCCForColdCall
virtual bool useColdCCForColdCall(Function &F) const
Definition TargetTransformInfoImpl.h:432

llvm::TargetTransformInfoImplBase::getStridedMemoryOpCost
virtual InstructionCost getStridedMemoryOpCost(unsigned Opcode, Type *DataTy, const Value *Ptr, bool VariableMask, Align Alignment, TTI::TargetCostKind CostKind, const Instruction *I=nullptr) const
Definition TargetTransformInfoImpl.h:866

llvm::TargetTransformInfoImplBase::getNumberOfRegisters
virtual unsigned getNumberOfRegisters(unsigned ClassID) const
Definition TargetTransformInfoImpl.h:561

llvm::TargetTransformInfoImplBase::getPrefetchDistance
virtual unsigned getPrefetchDistance() const
Definition TargetTransformInfoImpl.h:643

llvm::TargetTransformInfoImplBase::canHaveNonUndefGlobalInitializerInAddressSpace
virtual bool canHaveNonUndefGlobalInitializerInAddressSpace(unsigned AS) const
Definition TargetTransformInfoImpl.h:155

llvm::TargetTransformInfoImplBase::isLegalAddScalableImmediate
virtual bool isLegalAddScalableImmediate(int64_t Imm) const
Definition TargetTransformInfoImpl.h:268

llvm::TargetTransformInfoImplBase::isLegalInterleavedAccessType
virtual bool isLegalInterleavedAccessType(VectorType *VTy, unsigned Factor, Align Alignment, unsigned AddrSpace) const
Definition TargetTransformInfoImpl.h:377

llvm::TargetTransformInfoImplBase::TargetTransformInfoImplBase
TargetTransformInfoImplBase(TargetTransformInfoImplBase &&Arg)
Definition TargetTransformInfoImpl.h:48

llvm::TargetTransformInfoImplBase::shouldPrefetchAddressSpace
virtual bool shouldPrefetchAddressSpace(unsigned AS) const
Definition TargetTransformInfoImpl.h:652

llvm::TargetTransformInfoImplBase::forceScalarizeMaskedScatter
virtual bool forceScalarizeMaskedScatter(VectorType *DataType, Align Alignment) const
Definition TargetTransformInfoImpl.h:353

llvm::TargetTransformInfoImplBase::getMaxMemIntrinsicInlineSizeThreshold
virtual uint64_t getMaxMemIntrinsicInlineSizeThreshold() const
Definition TargetTransformInfoImpl.h:116

llvm::TargetTransformInfoImplBase::getMinVectorRegisterBitWidth
virtual unsigned getMinVectorRegisterBitWidth() const
Definition TargetTransformInfoImpl.h:587

llvm::TargetTransformInfoImplBase::minRequiredElementSize
unsigned minRequiredElementSize(const Value *Val, bool &isSigned) const
Definition TargetTransformInfoImpl.h:1161

llvm::TargetTransformInfoImplBase::shouldBuildLookupTablesForConstant
virtual bool shouldBuildLookupTablesForConstant(Constant *C) const
Definition TargetTransformInfoImpl.h:426

llvm::TargetTransformInfoImplBase::isFPVectorizationPotentiallyUnsafe
virtual bool isFPVectorizationPotentiallyUnsafe() const
Definition TargetTransformInfoImpl.h:505

llvm::TargetTransformInfoImplBase::isLegalToVectorizeReduction
virtual bool isLegalToVectorizeReduction(const RecurrenceDescriptor &RdxDesc, ElementCount VF) const
Definition TargetTransformInfoImpl.h:1066

llvm::TargetTransformInfoImplBase::getIntImmCostInst
virtual InstructionCost getIntImmCostInst(unsigned Opcode, unsigned Idx, const APInt &Imm, Type *Ty, TTI::TargetCostKind CostKind, Instruction *Inst=nullptr) const
Definition TargetTransformInfoImpl.h:543

llvm::TargetTransformInfoImplBase::areTypesABICompatible
virtual bool areTypesABICompatible(const Function *Caller, const Function *Callee, const ArrayRef< Type * > &Types) const
Definition TargetTransformInfoImpl.h:1029

llvm::TargetTransformInfoImplBase::isLegalAltInstr
virtual bool isLegalAltInstr(VectorType *VecTy, unsigned Opcode0, unsigned Opcode1, const SmallBitVector &OpcodeMask) const
Definition TargetTransformInfoImpl.h:363

llvm::TargetTransformInfoImplBase::getMaskedMemoryOpCost
virtual InstructionCost getMaskedMemoryOpCost(unsigned Opcode, Type *Src, Align Alignment, unsigned AddressSpace, TTI::TargetCostKind CostKind) const
Definition TargetTransformInfoImpl.h:845

llvm::TargetTransformInfoImplBase::getIndexedVectorInstrCostFromEnd
virtual InstructionCost getIndexedVectorInstrCostFromEnd(unsigned Opcode, Type *Val, TTI::TargetCostKind CostKind, unsigned Index) const
Definition TargetTransformInfoImpl.h:812

llvm::TargetTransformInfoImplBase::getCacheSize
virtual std::optional< unsigned > getCacheSize(TargetTransformInfo::CacheLevel Level) const
Definition TargetTransformInfoImpl.h:619

llvm::TargetTransformInfoImplBase::getExtractWithExtendCost
virtual InstructionCost getExtractWithExtendCost(unsigned Opcode, Type *Dst, VectorType *VecTy, unsigned Index, TTI::TargetCostKind CostKind) const
Definition TargetTransformInfoImpl.h:765

llvm::TargetTransformInfoImplBase::shouldTreatInstructionLikeSelect
virtual bool shouldTreatInstructionLikeSelect(const Instruction *I) const
Definition TargetTransformInfoImpl.h:486

llvm::TargetTransformInfoImplBase::instCombineIntrinsic
virtual std::optional< Instruction * > instCombineIntrinsic(InstCombiner &IC, IntrinsicInst &II) const
Definition TargetTransformInfoImpl.h:240

llvm::TargetTransformInfoImplBase::getEpilogueVectorizationMinVF
virtual unsigned getEpilogueVectorizationMinVF() const
Definition TargetTransformInfoImpl.h:228

llvm::TargetTransformInfoImplBase::getPredicatedAddrSpace
virtual std::pair< const Value *, unsigned > getPredicatedAddrSpace(const Value *V) const
Definition TargetTransformInfoImpl.h:164

llvm::TargetTransformInfoImplBase::shouldMaximizeVectorBandwidth
virtual bool shouldMaximizeVectorBandwidth(TargetTransformInfo::RegisterKind K) const
Definition TargetTransformInfoImpl.h:596

llvm::TargetTransformInfoImplBase::getMemcpyLoopResidualLoweringType
virtual void getMemcpyLoopResidualLoweringType(SmallVectorImpl< Type * > &OpsOut, LLVMContext &Context, unsigned RemainingBytes, unsigned SrcAddrSpace, unsigned DestAddrSpace, Align SrcAlign, Align DestAlign, std::optional< uint32_t > AtomicCpySize) const
Definition TargetTransformInfoImpl.h:1005

llvm::TargetTransformInfoImplBase::getPopcntSupport
virtual TTI::PopcntSupportKind getPopcntSupport(unsigned IntTyWidthInBit) const
Definition TargetTransformInfoImpl.h:516

llvm::TargetTransformInfoImplBase::getPreferredAddressingMode
virtual TTI::AddressingModeKind getPreferredAddressingMode(const Loop *L, ScalarEvolution *SE) const
Definition TargetTransformInfoImpl.h:307

llvm::TargetTransformInfoImplBase::forceScalarizeMaskedGather
virtual bool forceScalarizeMaskedGather(VectorType *DataType, Align Alignment) const
Definition TargetTransformInfoImpl.h:348

llvm::TargetTransformInfoImplBase::getMaxPrefetchIterationsAhead
virtual unsigned getMaxPrefetchIterationsAhead() const
Definition TargetTransformInfoImpl.h:650

llvm::TargetTransformInfoImplBase::allowVectorElementIndexingUsingGEP
virtual bool allowVectorElementIndexingUsingGEP() const
Definition TargetTransformInfoImpl.h:1156

llvm::TargetTransformInfoImplBase::getInstructionCost
virtual InstructionCost getInstructionCost(const User *U, ArrayRef< const Value * > Operands, TTI::TargetCostKind CostKind) const
Definition TargetTransformInfoImpl.h:85

llvm::TargetTransformInfoImplBase::getPreferredExpandedReductionShuffle
virtual TTI::ReductionShuffle getPreferredExpandedReductionShuffle(const IntrinsicInst *II) const
Definition TargetTransformInfoImpl.h:1107

llvm::TargetTransformInfoImplBase::getConstantStrideStep
const SCEVConstant * getConstantStrideStep(ScalarEvolution *SE, const SCEV *Ptr) const
Definition TargetTransformInfoImpl.h:1219

llvm::TargetTransformInfoImplBase::hasBranchDivergence
virtual bool hasBranchDivergence(const Function *F=nullptr) const
Definition TargetTransformInfoImpl.h:130

llvm::TargetTransformInfoImplBase::getArithmeticReductionCost
virtual InstructionCost getArithmeticReductionCost(unsigned, VectorType *, std::optional< FastMathFlags > FMF, TTI::TargetCostKind) const
Definition TargetTransformInfoImpl.h:946

llvm::TargetTransformInfoImplBase::isProfitableToHoist
virtual bool isProfitableToHoist(Instruction *I) const
Definition TargetTransformInfoImpl.h:416

llvm::TargetTransformInfoImplBase::getRegisterClassName
virtual const char * getRegisterClassName(unsigned ClassID) const
Definition TargetTransformInfoImpl.h:571

llvm::TargetTransformInfoImplBase::getMinMaxReductionCost
virtual InstructionCost getMinMaxReductionCost(Intrinsic::ID IID, VectorType *, FastMathFlags, TTI::TargetCostKind) const
Definition TargetTransformInfoImpl.h:952

llvm::TargetTransformInfoImplBase::getCacheLineSize
virtual unsigned getCacheLineSize() const
Definition TargetTransformInfoImpl.h:617

llvm::TargetTransformInfoImplBase::isLegalToVectorizeLoad
virtual bool isLegalToVectorizeLoad(LoadInst *LI) const
Definition TargetTransformInfoImpl.h:1050

llvm::TargetTransformInfoImplBase::isTargetIntrinsicTriviallyScalarizable
virtual bool isTargetIntrinsicTriviallyScalarizable(Intrinsic::ID ID) const
Definition TargetTransformInfoImpl.h:434

llvm::TargetTransformInfoImplBase::getLoadStoreVecRegBitWidth
virtual unsigned getLoadStoreVecRegBitWidth(unsigned AddrSpace) const
Definition TargetTransformInfoImpl.h:1046

llvm::TargetTransformInfoImplBase::getAltInstrCost
virtual InstructionCost getAltInstrCost(VectorType *VecTy, unsigned Opcode0, unsigned Opcode1, const SmallBitVector &OpcodeMask, TTI::TargetCostKind CostKind) const
Definition TargetTransformInfoImpl.h:704

llvm::TargetTransformInfoImplBase::getInlineCallPenalty
virtual unsigned getInlineCallPenalty(const Function *F, const CallBase &Call, unsigned DefaultCallPenalty) const
Definition TargetTransformInfoImpl.h:1024

llvm::TargetTransformInfoImplBase::hasArmWideBranch
virtual bool hasArmWideBranch(bool) const
Definition TargetTransformInfoImpl.h:1135

llvm::TargetTransformInfoImplBase::isVectorShiftByScalarCheap
virtual bool isVectorShiftByScalarCheap(Type *Ty) const
Definition TargetTransformInfoImpl.h:1126

llvm::TargetTransformInfoImplBase::isLegalNTStore
virtual bool isLegalNTStore(Type *DataType, Align Alignment) const
Definition TargetTransformInfoImpl.h:321

llvm::TargetTransformInfoImplBase::getExpandCompressMemoryOpCost
virtual InstructionCost getExpandCompressMemoryOpCost(unsigned Opcode, Type *DataTy, bool VariableMask, Align Alignment, TTI::TargetCostKind CostKind, const Instruction *I=nullptr) const
Definition TargetTransformInfoImpl.h:859

llvm::TargetTransformInfoImplBase::getFeatureMask
virtual APInt getFeatureMask(const Function &F) const
Definition TargetTransformInfoImpl.h:1137

llvm::TargetTransformInfoImplBase::getMinPageSize
virtual std::optional< unsigned > getMinPageSize() const
Definition TargetTransformInfoImpl.h:641

llvm::TargetTransformInfoImplBase::getRegUsageForType
virtual unsigned getRegUsageForType(Type *Ty) const
Definition TargetTransformInfoImpl.h:422

llvm::TargetTransformInfoImplBase::isLegalAddressingMode
virtual bool isLegalAddressingMode(Type *Ty, GlobalValue *BaseGV, int64_t BaseOffset, bool HasBaseReg, int64_t Scale, unsigned AddrSpace, Instruction *I=nullptr, int64_t ScalableOffset=0) const
Definition TargetTransformInfoImpl.h:272

llvm::TargetTransformInfoImplBase::isElementTypeLegalForScalableVector
virtual bool isElementTypeLegalForScalableVector(Type *Ty) const
Definition TargetTransformInfoImpl.h:1071

llvm::TargetTransformInfoImplBase::isLoweredToCall
virtual bool isLoweredToCall(const Function *F) const
Definition TargetTransformInfoImpl.h:174

llvm::TargetTransformInfoImplBase::isLegalMaskedScatter
virtual bool isLegalMaskedScatter(Type *DataType, Align Alignment) const
Definition TargetTransformInfoImpl.h:340

llvm::TargetTransformInfoImplBase::isTruncateFree
virtual bool isTruncateFree(Type *Ty1, Type *Ty2) const
Definition TargetTransformInfoImpl.h:414

llvm::TargetTransformInfoImplBase::getArithmeticInstrCost
virtual InstructionCost getArithmeticInstrCost(unsigned Opcode, Type *Ty, TTI::TargetCostKind CostKind, TTI::OperandValueInfo Opd1Info, TTI::OperandValueInfo Opd2Info, ArrayRef< const Value * > Args, const Instruction *CxtI=nullptr) const
Definition TargetTransformInfoImpl.h:664

llvm::TargetTransformInfoImplBase::isIndexedStoreLegal
virtual bool isIndexedStoreLegal(TTI::MemIndexedMode Mode, Type *Ty) const
Definition TargetTransformInfoImpl.h:1042

llvm::TargetTransformInfoImplBase::getGEPCost
virtual InstructionCost getGEPCost(Type *PointeeType, const Value *Ptr, ArrayRef< const Value * > Operands, Type *AccessType, TTI::TargetCostKind CostKind) const
Definition TargetTransformInfoImpl.h:54

llvm::TargetTransformInfoImplBase::getPredictableBranchThreshold
virtual BranchProbability getPredictableBranchThreshold() const
Definition TargetTransformInfoImpl.h:124

llvm::TargetTransformInfoImplBase::isValidAddrSpaceCast
virtual bool isValidAddrSpaceCast(unsigned FromAS, unsigned ToAS) const
Definition TargetTransformInfoImpl.h:138

llvm::TargetTransformInfoImplBase::getReplicationShuffleCost
virtual InstructionCost getReplicationShuffleCost(Type *EltTy, int ReplicationFactor, int VF, const APInt &DemandedDstElts, TTI::TargetCostKind CostKind) const
Definition TargetTransformInfoImpl.h:819

llvm::TargetTransformInfoImplBase::enableScalableVectorization
virtual bool enableScalableVectorization() const
Definition TargetTransformInfoImpl.h:1117

llvm::TargetTransformInfoImplBase::isLegalToVectorizeStore
virtual bool isLegalToVectorizeStore(StoreInst *SI) const
Definition TargetTransformInfoImpl.h:1052

llvm::TargetTransformInfoImplBase::areInlineCompatible
virtual bool areInlineCompatible(const Function *Caller, const Function *Callee) const
Definition TargetTransformInfoImpl.h:1016

llvm::TargetTransformInfoImplBase::isTargetIntrinsicWithStructReturnOverloadAtField
virtual bool isTargetIntrinsicWithStructReturnOverloadAtField(Intrinsic::ID ID, int RetIdx) const
Definition TargetTransformInfoImpl.h:449

llvm::TargetTransformInfoImplBase::hasConditionalLoadStoreForType
virtual bool hasConditionalLoadStoreForType(Type *Ty, bool IsStore) const
Definition TargetTransformInfoImpl.h:562

llvm::TargetTransformInfoImplBase::preferInLoopReduction
virtual bool preferInLoopReduction(RecurKind Kind, Type *Ty) const
Definition TargetTransformInfoImpl.h:1091

llvm::TargetTransformInfoImplBase::isMultiversionedFunction
virtual bool isMultiversionedFunction(const Function &F) const
Definition TargetTransformInfoImpl.h:1141

llvm::TargetTransformInfoImplBase::getCFInstrCost
virtual InstructionCost getCFInstrCost(unsigned Opcode, TTI::TargetCostKind CostKind, const Instruction *I=nullptr) const
Definition TargetTransformInfoImpl.h:770

llvm::TargetTransformInfoImplBase::isNoopAddrSpaceCast
virtual bool isNoopAddrSpaceCast(unsigned, unsigned) const
Definition TargetTransformInfoImpl.h:153

llvm::TargetTransformInfoImplBase::isVScaleKnownToBeAPowerOfTwo
virtual bool isVScaleKnownToBeAPowerOfTwo() const
Definition TargetTransformInfoImpl.h:593

llvm::TargetTransformInfoImplBase::isExpensiveToSpeculativelyExecute
virtual bool isExpensiveToSpeculativelyExecute(const Instruction *I) const
Definition TargetTransformInfoImpl.h:522

llvm::TargetTransformInfoImplBase::isLSRCostLess
virtual bool isLSRCostLess(const TTI::LSRCost &C1, const TTI::LSRCost &C2) const
Definition TargetTransformInfoImpl.h:282

llvm::TargetTransformInfoImplBase::isLegalMaskedVectorHistogram
virtual bool isLegalMaskedVectorHistogram(Type *AddrType, Type *DataType) const
Definition TargetTransformInfoImpl.h:383

llvm::TargetTransformInfoImplBase::isLegalMaskedGather
virtual bool isLegalMaskedGather(Type *DataType, Align Alignment) const
Definition TargetTransformInfoImpl.h:344

llvm::TargetTransformInfoImplBase::getEstimatedNumberOfCaseClusters
virtual unsigned getEstimatedNumberOfCaseClusters(const SwitchInst &SI, unsigned &JTSize, ProfileSummaryInfo *PSI, BlockFrequencyInfo *BFI) const
Definition TargetTransformInfoImpl.h:75

llvm::TargetTransformInfoImplBase::hasActiveVectorLength
virtual bool hasActiveVectorLength() const
Definition TargetTransformInfoImpl.h:1119

llvm::TargetTransformInfoImplBase::isLegalAddImmediate
virtual bool isLegalAddImmediate(int64_t Imm) const
Definition TargetTransformInfoImpl.h:266

llvm::TargetTransformInfoImplBase::getInsertExtractValueCost
virtual InstructionCost getInsertExtractValueCost(unsigned Opcode, TTI::TargetCostKind CostKind) const
Definition TargetTransformInfoImpl.h:826

llvm::TargetTransformInfoImplBase::getCastInstrCost
virtual InstructionCost getCastInstrCost(unsigned Opcode, Type *Dst, Type *Src, TTI::CastContextHint CCH, TTI::TargetCostKind CostKind, const Instruction *I) const
Definition TargetTransformInfoImpl.h:719

llvm::TargetTransformInfoImplBase::isLegalNTLoad
virtual bool isLegalNTLoad(Type *DataType, Align Alignment) const
Definition TargetTransformInfoImpl.h:328

llvm::TargetTransformInfoImplBase::getBranchMispredictPenalty
virtual InstructionCost getBranchMispredictPenalty() const
Definition TargetTransformInfoImpl.h:128

llvm::TargetTransformInfoImplBase::isTargetIntrinsicWithOverloadTypeAtArg
virtual bool isTargetIntrinsicWithOverloadTypeAtArg(Intrinsic::ID ID, int OpdIdx) const
Definition TargetTransformInfoImpl.h:443

llvm::TargetTransformInfoImplBase::getIntImmCostIntrin
virtual InstructionCost getIntImmCostIntrin(Intrinsic::ID IID, unsigned Idx, const APInt &Imm, Type *Ty, TTI::TargetCostKind CostKind) const
Definition TargetTransformInfoImpl.h:551

llvm::TargetTransformInfoImplBase::TTI
TargetTransformInfo TTI
Definition TargetTransformInfoImpl.h:37

llvm::TargetTransformInfoImplBase::getIntImmCodeSizeCost
virtual InstructionCost getIntImmCodeSizeCost(unsigned Opcode, unsigned Idx, const APInt &Imm, Type *Ty) const
Definition TargetTransformInfoImpl.h:532

llvm::TargetTransformInfoImplBase::isConstantStridedAccessLessThan
bool isConstantStridedAccessLessThan(ScalarEvolution *SE, const SCEV *Ptr, int64_t MergeDistance) const
Definition TargetTransformInfoImpl.h:1227

llvm::TargetTransformInfoImplBase::enableOrderedReductions
virtual bool enableOrderedReductions() const
Definition TargetTransformInfoImpl.h:388

llvm::TargetTransformInfoImplBase::getOrCreateResultFromMemIntrinsic
virtual Value * getOrCreateResultFromMemIntrinsic(IntrinsicInst *Inst, Type *ExpectedType, bool CanCreate=true) const
Definition TargetTransformInfoImpl.h:991

llvm::TargetTransformInfoImplBase::enableMaskedInterleavedAccessVectorization
virtual bool enableMaskedInterleavedAccessVectorization() const
Definition TargetTransformInfoImpl.h:501

llvm::TargetTransformInfoImplBase::getMemcpyLoopLoweringType
virtual Type * getMemcpyLoopLoweringType(LLVMContext &Context, Value *Length, unsigned SrcAddrSpace, unsigned DestAddrSpace, Align SrcAlign, Align DestAlign, std::optional< uint32_t > AtomicElementSize) const
Definition TargetTransformInfoImpl.h:997

llvm::TargetTransformInfoImplBase::getInliningThresholdMultiplier
virtual unsigned getInliningThresholdMultiplier() const
Definition TargetTransformInfoImpl.h:90

llvm::TargetTransformInfoImplBase::TargetTransformInfoImplBase
TargetTransformInfoImplBase(const DataLayout &DL)
Definition TargetTransformInfoImpl.h:41

llvm::TargetTransformInfoImplBase::getIntrinsicInstrCost
virtual InstructionCost getIntrinsicInstrCost(const IntrinsicCostAttributes &ICA, TTI::TargetCostKind CostKind) const
Definition TargetTransformInfoImpl.h:881

llvm::TargetTransformInfoImplBase::isAlwaysUniform
virtual bool isAlwaysUniform(const Value *V) const
Definition TargetTransformInfoImpl.h:136

llvm::TargetTransformInfoImplBase::getCmpSelInstrCost
virtual InstructionCost getCmpSelInstrCost(unsigned Opcode, Type *ValTy, Type *CondTy, CmpInst::Predicate VecPred, TTI::TargetCostKind CostKind, TTI::OperandValueInfo Op1Info, TTI::OperandValueInfo Op2Info, const Instruction *I) const
Definition TargetTransformInfoImpl.h:780

llvm::TargetTransformInfoImplBase::shouldExpandReduction
virtual bool shouldExpandReduction(const IntrinsicInst *II) const
Definition TargetTransformInfoImpl.h:1102

llvm::TargetTransformInfoImplBase::isLegalToVectorizeStoreChain
virtual bool isLegalToVectorizeStoreChain(unsigned ChainSizeInBytes, Align Alignment, unsigned AddrSpace) const
Definition TargetTransformInfoImpl.h:1060

llvm::TargetTransformInfoImplBase::getGISelRematGlobalCost
virtual unsigned getGISelRematGlobalCost() const
Definition TargetTransformInfoImpl.h:1111

llvm::TargetTransformInfoImplBase::getInterleavedMemoryOpCost
virtual InstructionCost getInterleavedMemoryOpCost(unsigned Opcode, Type *VecTy, unsigned Factor, ArrayRef< unsigned > Indices, Align Alignment, unsigned AddressSpace, TTI::TargetCostKind CostKind, bool UseMaskForCond, bool UseMaskForGaps) const
Definition TargetTransformInfoImpl.h:873

llvm::TargetTransformInfoImplBase::isTypeLegal
virtual bool isTypeLegal(Type *Ty) const
Definition TargetTransformInfoImpl.h:420

llvm::TargetTransformInfoImplBase::enableSelectOptimize
virtual bool enableSelectOptimize() const
Definition TargetTransformInfoImpl.h:484

llvm::TargetTransformInfoImplBase::getAssumedAddrSpace
virtual unsigned getAssumedAddrSpace(const Value *V) const
Definition TargetTransformInfoImpl.h:159

llvm::TargetTransformInfoImplBase::allowsMisalignedMemoryAccesses
virtual bool allowsMisalignedMemoryAccesses(LLVMContext &Context, unsigned BitWidth, unsigned AddressSpace, Align Alignment, unsigned *Fast) const
Definition TargetTransformInfoImpl.h:507

llvm::TargetTransformInfoImplBase::enableWritePrefetching
virtual bool enableWritePrefetching() const
Definition TargetTransformInfoImpl.h:651

llvm::TargetTransformInfoImplBase::getStoreVectorFactor
virtual unsigned getStoreVectorFactor(unsigned VF, unsigned StoreSize, unsigned ChainSizeInBytes, VectorType *VecTy) const
Definition TargetTransformInfoImpl.h:1081

llvm::TargetTransformInfoImplBase::getExtendedReductionCost
virtual InstructionCost getExtendedReductionCost(unsigned Opcode, bool IsUnsigned, Type *ResTy, VectorType *Ty, std::optional< FastMathFlags > FMF, TTI::TargetCostKind CostKind) const
Definition TargetTransformInfoImpl.h:959

llvm::TargetTransformInfoImplBase::getInliningCostBenefitAnalysisSavingsMultiplier
virtual unsigned getInliningCostBenefitAnalysisSavingsMultiplier() const
Definition TargetTransformInfoImpl.h:91

llvm::TargetTransformInfoImplBase::getVectorInstrCost
virtual InstructionCost getVectorInstrCost(unsigned Opcode, Type *Val, TTI::TargetCostKind CostKind, unsigned Index, Value *Scalar, ArrayRef< std::tuple< Value *, User *, int > > ScalarUserAndIdx) const
Definition TargetTransformInfoImpl.h:798

llvm::TargetTransformInfoImplBase::getMaxNumArgs
virtual unsigned getMaxNumArgs() const
Definition TargetTransformInfoImpl.h:1145

llvm::TargetTransformInfoImplBase::getNumBytesToPadGlobalArray
virtual unsigned getNumBytesToPadGlobalArray(unsigned Size, Type *ArrayType) const
Definition TargetTransformInfoImpl.h:1147

llvm::TargetTransformInfoImplBase::preferToKeepConstantsAttached
virtual bool preferToKeepConstantsAttached(const Instruction &Inst, const Function &Fn) const
Definition TargetTransformInfoImpl.h:556

llvm::TargetTransformInfoImplBase::getShuffleCost
virtual InstructionCost getShuffleCost(TTI::ShuffleKind Kind, VectorType *DstTy, VectorType *SrcTy, ArrayRef< int > Mask, TTI::TargetCostKind CostKind, int Index, VectorType *SubTp, ArrayRef< const Value * > Args={}, const Instruction *CxtI=nullptr) const
Definition TargetTransformInfoImpl.h:712

llvm::TargetTransformInfoImplBase::isLegalMaskedStore
virtual bool isLegalMaskedStore(Type *DataType, Align Alignment, unsigned AddressSpace) const
Definition TargetTransformInfoImpl.h:311

llvm::TargetTransformInfoImplBase::isFCmpOrdCheaperThanFCmpZero
virtual bool isFCmpOrdCheaperThanFCmpZero(Type *Ty) const
Definition TargetTransformInfoImpl.h:526

llvm::TargetTransformInfoImplBase::supportsTailCallFor
virtual bool supportsTailCallFor(const CallBase *CB) const
Definition TargetTransformInfoImpl.h:471

llvm::TargetTransformInfoImplBase::getMaxVScale
virtual std::optional< unsigned > getMaxVScale() const
Definition TargetTransformInfoImpl.h:589

llvm::TargetTransformInfoImplBase::shouldBuildRelLookupTables
virtual bool shouldBuildRelLookupTables() const
Definition TargetTransformInfoImpl.h:430

llvm::TargetTransformInfoImplBase::shouldConsiderAddressTypePromotion
virtual bool shouldConsiderAddressTypePromotion(const Instruction &I, bool &AllowPromotionWithoutCommonHeader) const
Definition TargetTransformInfoImpl.h:611

llvm::TargetTransformInfoImplBase::getScalarizationOverhead
virtual InstructionCost getScalarizationOverhead(VectorType *Ty, const APInt &DemandedElts, bool Insert, bool Extract, TTI::TargetCostKind CostKind, bool ForPoisonSrc=true, ArrayRef< Value * > VL={}) const
Definition TargetTransformInfoImpl.h:454

llvm::TargetTransformInfoImplBase::getFlatAddressSpace
virtual unsigned getFlatAddressSpace() const
Definition TargetTransformInfoImpl.h:146

llvm::TargetTransformInfoImplBase::isTargetIntrinsicWithScalarOpAtArg
virtual bool isTargetIntrinsicWithScalarOpAtArg(Intrinsic::ID ID, unsigned ScalarOpdIdx) const
Definition TargetTransformInfoImpl.h:438

llvm::TargetTransformInfoImplBase::shouldConsiderVectorizationRegPressure
virtual bool shouldConsiderVectorizationRegPressure() const
Definition TargetTransformInfoImpl.h:1100

llvm::TargetTransformInfoImplBase::DL
const DataLayout & DL
Definition TargetTransformInfoImpl.h:39

llvm::TargetTransformInfoImplBase::getMemcpyCost
virtual InstructionCost getMemcpyCost(const Instruction *I) const
Definition TargetTransformInfoImpl.h:112

llvm::TargetTransformInfoImplBase::getInliningCostBenefitAnalysisProfitableMultiplier
virtual unsigned getInliningCostBenefitAnalysisProfitableMultiplier() const
Definition TargetTransformInfoImpl.h:94

llvm::TargetTransformInfoImplBase::isSourceOfDivergence
virtual bool isSourceOfDivergence(const Value *V) const
Definition TargetTransformInfoImpl.h:134

llvm::TargetTransformInfoImplBase::isNumRegsMajorCostOfLSR
virtual bool isNumRegsMajorCostOfLSR() const
Definition TargetTransformInfoImpl.h:290

llvm::TargetTransformInfoImplBase::getOperandsScalarizationOverhead
virtual InstructionCost getOperandsScalarizationOverhead(ArrayRef< Type * > Tys, TTI::TargetCostKind CostKind) const
Definition TargetTransformInfoImpl.h:462

llvm::TargetTransformInfoImplBase::getPreferredTailFoldingStyle
virtual TailFoldingStyle getPreferredTailFoldingStyle(bool IVUpdateMayOverflow=true) const
Definition TargetTransformInfoImpl.h:235

llvm::TargetTransformInfoImplBase::getUnrollingPreferences
virtual void getUnrollingPreferences(Loop *, ScalarEvolution &, TTI::UnrollingPreferences &, OptimizationRemarkEmitter *) const
Definition TargetTransformInfoImpl.h:259

llvm::TargetTransformInfoImplBase::TargetTransformInfoImplBase
TargetTransformInfoImplBase(const TargetTransformInfoImplBase &Arg)=default

llvm::TargetTransformInfoImplBase::isProfitableToSinkOperands
virtual bool isProfitableToSinkOperands(Instruction *I, SmallVectorImpl< Use * > &Ops) const
Definition TargetTransformInfoImpl.h:1121

llvm::TargetTransformInfoImplBase::supportsEfficientVectorElementLoadStore
virtual bool supportsEfficientVectorElementLoadStore() const
Definition TargetTransformInfoImpl.h:467

llvm::TargetTransformInfoImplBase::getMinPrefetchStride
virtual unsigned getMinPrefetchStride(unsigned NumMemAccesses, unsigned NumStridedMemAccesses, unsigned NumPrefetches, bool HasCall) const
Definition TargetTransformInfoImpl.h:644

llvm::TargetTransformInfoImplBase::getMinTripCountTailFoldingThreshold
virtual unsigned getMinTripCountTailFoldingThreshold() const
Definition TargetTransformInfoImpl.h:1113

llvm::TargetTransformInfoImplBase::getRegisterBitWidth
virtual TypeSize getRegisterBitWidth(TargetTransformInfo::RegisterKind K) const
Definition TargetTransformInfoImpl.h:583

llvm::TargetTransformInfoImplBase::collectKernelLaunchBounds
virtual void collectKernelLaunchBounds(const Function &F, SmallVectorImpl< std::pair< StringRef, int64_t > > &LB) const
Definition TargetTransformInfoImpl.h:1152

llvm::TargetTransformInfoImplBase::preferEpilogueVectorization
virtual bool preferEpilogueVectorization() const
Definition TargetTransformInfoImpl.h:1098

llvm::TargetTransformInfoImplCRTPBase::supportsTailCallFor
bool supportsTailCallFor(const CallBase *CB) const override
Definition TargetTransformInfoImpl.h:1687

llvm::TargetTransformInfoImplCRTPBase::TargetTransformInfoImplCRTPBase
TargetTransformInfoImplCRTPBase(const DataLayout &DL)
Definition TargetTransformInfoImpl.h:1248

llvm::TargetTransformInfoImplCRTPBase::isExpensiveToSpeculativelyExecute
bool isExpensiveToSpeculativelyExecute(const Instruction *I) const override
Definition TargetTransformInfoImpl.h:1679

llvm::TargetTransformInfoImplCRTPBase::getInstructionCost
InstructionCost getInstructionCost(const User *U, ArrayRef< const Value * > Operands, TTI::TargetCostKind CostKind) const override
Definition TargetTransformInfoImpl.h:1366

llvm::TargetTransformInfoImplCRTPBase::getPointersChainCost
InstructionCost getPointersChainCost(ArrayRef< const Value * > Ptrs, const Value *Base, const TTI::PointersChainInfo &Info, Type *AccessTy, TTI::TargetCostKind CostKind) const override
Definition TargetTransformInfoImpl.h:1330

llvm::TargetTransformInfoImplCRTPBase::getGEPCost
InstructionCost getGEPCost(Type *PointeeType, const Value *Ptr, ArrayRef< const Value * > Operands, Type *AccessType, TTI::TargetCostKind CostKind) const override
Definition TargetTransformInfoImpl.h:1251

llvm::TargetTransformInfo
This pass provides access to the codegen interfaces that are needed for IR-level transformations.
Definition TargetTransformInfo.h:223

llvm::TargetTransformInfo::ReductionShuffle
ReductionShuffle
Definition TargetTransformInfo.h:1859

llvm::TargetTransformInfo::ReductionShuffle::SplitHalf
@ SplitHalf
Definition TargetTransformInfo.h:1859

llvm::TargetTransformInfo::getCastContextHint
static LLVM_ABI CastContextHint getCastContextHint(const Instruction *I)
Calculates a CastContextHint from I.
Definition TargetTransformInfo.cpp:1012

llvm::TargetTransformInfo::getOperandInfo
static LLVM_ABI OperandValueInfo getOperandInfo(const Value *V)
Collect properties of V used in cost analysis, e.g. OP_PowerOf2.
Definition TargetTransformInfo.cpp:886

llvm::TargetTransformInfo::TargetCostKind
TargetCostKind
The kind of cost model.
Definition TargetTransformInfo.h:275

llvm::TargetTransformInfo::TCK_RecipThroughput
@ TCK_RecipThroughput
Reciprocal throughput.
Definition TargetTransformInfo.h:276

llvm::TargetTransformInfo::TCK_CodeSize
@ TCK_CodeSize
Instruction code size.
Definition TargetTransformInfo.h:278

llvm::TargetTransformInfo::TCK_SizeAndLatency
@ TCK_SizeAndLatency
The weighted sum of size and latency.
Definition TargetTransformInfo.h:279

llvm::TargetTransformInfo::TCK_Latency
@ TCK_Latency
The latency of instruction.
Definition TargetTransformInfo.h:277

llvm::TargetTransformInfo::RegisterKind
RegisterKind
Definition TargetTransformInfo.h:1215

llvm::TargetTransformInfo::PopcntSupportKind
PopcntSupportKind
Flags indicating the kind of support for population count.
Definition TargetTransformInfo.h:741

llvm::TargetTransformInfo::PSK_Software
@ PSK_Software
Definition TargetTransformInfo.h:741

llvm::TargetTransformInfo::PartialReductionExtendKind
PartialReductionExtendKind
Definition TargetTransformInfo.h:225

llvm::TargetTransformInfo::TCC_Expensive
@ TCC_Expensive
The cost of a 'div' instruction on x86.
Definition TargetTransformInfo.h:303

llvm::TargetTransformInfo::TCC_Free
@ TCC_Free
Expected to fold away in lowering.
Definition TargetTransformInfo.h:301

llvm::TargetTransformInfo::TCC_Basic
@ TCC_Basic
The cost of a typical 'add' instruction.
Definition TargetTransformInfo.h:302

llvm::TargetTransformInfo::MemIndexedMode
MemIndexedMode
The type of load/store indexing.
Definition TargetTransformInfo.h:1767

llvm::TargetTransformInfo::AddressingModeKind
AddressingModeKind
Which addressing mode Loop Strength Reduction will try to generate.
Definition TargetTransformInfo.h:804

llvm::TargetTransformInfo::AMK_None
@ AMK_None
Don't prefer any addressing mode.
Definition TargetTransformInfo.h:805

llvm::TargetTransformInfo::ShuffleKind
ShuffleKind
The various kinds of shuffle patterns for vector queries.
Definition TargetTransformInfo.h:1132

llvm::TargetTransformInfo::SK_InsertSubvector
@ SK_InsertSubvector
InsertSubvector. Index indicates start offset.
Definition TargetTransformInfo.h:1139

llvm::TargetTransformInfo::SK_Select
@ SK_Select
Selects elements from the corresponding lane of either source operand.
Definition TargetTransformInfo.h:1135

llvm::TargetTransformInfo::SK_PermuteSingleSrc
@ SK_PermuteSingleSrc
Shuffle elements of single source vector with any shuffle mask.
Definition TargetTransformInfo.h:1143

llvm::TargetTransformInfo::SK_Transpose
@ SK_Transpose
Transpose two vectors.
Definition TargetTransformInfo.h:1138

llvm::TargetTransformInfo::SK_Splice
@ SK_Splice
Concatenates elements from the first input vector with elements of the second input vector.
Definition TargetTransformInfo.h:1145

llvm::TargetTransformInfo::SK_Broadcast
@ SK_Broadcast
Broadcast element 0 to all other elements.
Definition TargetTransformInfo.h:1133

llvm::TargetTransformInfo::SK_PermuteTwoSrc
@ SK_PermuteTwoSrc
Merge elements from two source vectors into one with any shuffle mask.
Definition TargetTransformInfo.h:1141

llvm::TargetTransformInfo::SK_Reverse
@ SK_Reverse
Reverse the order of the vector.
Definition TargetTransformInfo.h:1134

llvm::TargetTransformInfo::SK_ExtractSubvector
@ SK_ExtractSubvector
ExtractSubvector Index indicates start offset.
Definition TargetTransformInfo.h:1140

llvm::TargetTransformInfo::CastContextHint
CastContextHint
Represents a hint about the context in which a cast is used.
Definition TargetTransformInfo.h:1437

llvm::TargetTransformInfo::CacheLevel
CacheLevel
The possible cache levels.
Definition TargetTransformInfo.h:1275

llvm::TargetTransformInfo::CacheLevel::L1D
@ L1D
Definition TargetTransformInfo.h:1276

llvm::TargetTransformInfo::CacheLevel::L2D
@ L2D
Definition TargetTransformInfo.h:1277

llvm::TruncInst
This class represents a truncation of integer types.
Definition Instructions.h:4554

llvm::TypeSize
Definition TypeSize.h:333

llvm::TypeSize::getFixed
static constexpr TypeSize getFixed(ScalarTy ExactSize)
Definition TypeSize.h:344

llvm::Type
The instances of the Type class are immutable: once they are created, they are never changed.
Definition Type.h:45

llvm::Type::isVectorTy
bool isVectorTy() const
True if this is an instance of VectorType.
Definition Type.h:273

llvm::Type::isScalableTy
LLVM_ABI bool isScalableTy(SmallPtrSetImpl< const Type * > &Visited) const
Return true if this is a type whose size is a known multiple of vscale.
Definition Type.cpp:62

llvm::Type::getPointerAddressSpace
LLVM_ABI unsigned getPointerAddressSpace() const
Get the address space of this pointer or pointer vector type.
Definition DerivedTypes.h:773

llvm::Type::getInt8Ty
static LLVM_ABI IntegerType * getInt8Ty(LLVMContext &C)
Definition Type.cpp:295

llvm::Type::getScalarSizeInBits
LLVM_ABI unsigned getScalarSizeInBits() const LLVM_READONLY
If this is a vector type, return the getPrimitiveSizeInBits value for the element type.
Definition Type.cpp:231

llvm::Type::getIntNTy
static LLVM_ABI IntegerType * getIntNTy(LLVMContext &C, unsigned N)
Definition Type.cpp:301

llvm::User
Definition User.h:44

llvm::VPIntrinsic
This is the common base class for vector predication intrinsics.
Definition IntrinsicInst.h:566

llvm::Value
LLVM Value Representation.
Definition Value.h:75

llvm::Value::getType
Type * getType() const
All values are typed, get the type of this value.
Definition Value.h:256

llvm::VectorType
Base class of all SIMD vector types.
Definition DerivedTypes.h:430

llvm::details::FixedOrScalableQuantity::getFixedValue
constexpr ScalarTy getFixedValue() const
Definition TypeSize.h:201

llvm::details::FixedOrScalableQuantity::isScalable
constexpr bool isScalable() const
Returns whether the quantity is scaled by a runtime quantity (vscale).
Definition TypeSize.h:169

uint64_t

Call
CallInst * Call
Definition ObjCARCOpts.cpp:2360

llvm_unreachable
#define llvm_unreachable(msg)
Marks that the current location is not supposed to be reachable.
Definition ErrorHandling.h:164

llvm::CallingConv::ID
unsigned ID
LLVM IR allows to use arbitrary numbers as calling convention identifiers.
Definition CallingConv.h:24

llvm::CallingConv::Fast
@ Fast
Attempts to make calls as fast as possible (e.g.
Definition CallingConv.h:41

llvm::CallingConv::C
@ C
The default llvm calling convention, compatible with C.
Definition CallingConv.h:34

llvm::Intrinsic
This namespace contains an enum with a value for every intrinsic/builtin function known by LLVM.
Definition GenericSSAContext.h:27

llvm::Intrinsic::ID
unsigned ID
Definition GenericSSAContext.h:28

llvm::NVPTXAS::AddressSpace
AddressSpace
Definition NVPTXAddrSpace.h:21

llvm::PatternMatch
Definition PatternMatch.h:47

llvm::PatternMatch::m_Constant
class_match< Constant > m_Constant()
Match an arbitrary Constant and ignore it.
Definition PatternMatch.h:178

llvm::PatternMatch::match
bool match(Val *V, const Pattern &P)
Definition PatternMatch.h:49

llvm::PatternMatch::m_Select
ThreeOps_match< Cond, LHS, RHS, Instruction::Select > m_Select(const Cond &C, const LHS &L, const RHS &R)
Matches SelectInst.
Definition PatternMatch.h:1920

llvm::PatternMatch::m_LogicalOr
auto m_LogicalOr()
Matches L || R where L and R are arbitrary values.
Definition PatternMatch.h:3240

llvm::PatternMatch::m_Value
class_match< Value > m_Value()
Match an arbitrary value and ignore it.
Definition PatternMatch.h:105

llvm::PatternMatch::m_LogicalAnd
auto m_LogicalAnd()
Matches L && R where L and R are arbitrary values.
Definition PatternMatch.h:3222

llvm::PatternMatch::m_CombineOr
match_combine_or< LTy, RTy > m_CombineOr(const LTy &L, const RTy &R)
Combine two pattern matchers matching L || R.
Definition PatternMatch.h:252

llvm::SI
Definition SIInstrInfo.h:1745

llvm::sampleprof::Base
@ Base
Definition Discriminator.h:58

llvm
This is an optimization pass for GlobalISel generic memory operations.
Definition AddressRanges.h:18

llvm::Length
@ Length
Definition DWP.cpp:477

llvm::all_of
bool all_of(R &&range, UnaryPredicate P)
Provide wrappers to std::all_of which take ranges instead of having to pass begin/end explicitly.
Definition STLExtras.h:1705

llvm::Cost
InstructionCost Cost
Definition FunctionSpecialization.h:103

llvm::enumerate
auto enumerate(FirstRange &&First, RestRanges &&...Rest)
Given two or more input ranges, returns a new range whose values are tuples (A, B,...
Definition STLExtras.h:2452

llvm::dyn_cast
decltype(auto) dyn_cast(const From &Val)
dyn_cast<X> - Return the argument parameter cast to the specified type.
Definition Casting.h:644

llvm::DataSize
FunctionAddr VTableAddr uintptr_t uintptr_t DataSize
Definition InstrProf.h:267

llvm::getSplatValue
LLVM_ABI Value * getSplatValue(const Value *V)
Get splat value if the input is a splat vector or return nullptr.
Definition VectorUtils.cpp:391

llvm::any_of
bool any_of(R &&range, UnaryPredicate P)
Provide wrappers to std::any_of which take ranges instead of having to pass begin/end explicitly.
Definition STLExtras.h:1712

llvm::isPowerOf2_32
constexpr bool isPowerOf2_32(uint32_t Value)
Return true if the argument is a power of two > 0.
Definition MathExtras.h:288

llvm::ComplexDeinterleavingOperation::Splat
@ Splat
Definition ComplexDeinterleavingPass.h:42

llvm::isa
bool isa(const From &Val)
isa<X> - Return true if the parameter to the template is an instance of one of the template type argu...
Definition Casting.h:548

llvm::PoisonMaskElem
constexpr int PoisonMaskElem
Definition Instructions.h:1923

llvm::RecurKind
RecurKind
These are the kinds of recurrences that we support.
Definition IVDescriptors.h:34

llvm::BitWidth
constexpr unsigned BitWidth
Definition BitmaskEnum.h:220

llvm::cast
decltype(auto) cast(const From &Val)
cast<X> - Return the argument parameter cast to the specified type.
Definition Casting.h:560

llvm::gep_type_begin
gep_type_iterator gep_type_begin(const User *GEP)
Definition GetElementPtrTypeIterator.h:173

llvm::TailFoldingStyle
TailFoldingStyle
Definition TargetTransformInfo.h:175

llvm::TailFoldingStyle::DataWithoutLaneMask
@ DataWithoutLaneMask
Same as Data, but avoids using the get.active.lane.mask intrinsic to calculate the mask and instead i...
Definition TargetTransformInfo.h:192

llvm::VFParamKind::Vector
@ Vector
Definition VFABIDemangler.h:27

llvm::Align
This struct is a compact representation of a valid (non-zero power of two) alignment.
Definition Alignment.h:39

llvm::HardwareLoopInfo
Attributes of a target dependent hardware loop.
Definition TargetTransformInfo.h:102

llvm::KnownBits
Definition KnownBits.h:24

llvm::MemIntrinsicInfo
Information about a load/store intrinsic defined by the target.
Definition TargetTransformInfo.h:75

llvm::TailFoldingInfo
Definition TargetTransformInfo.h:208

llvm::TargetTransformInfo::LSRCost
Definition TargetTransformInfo.h:537

llvm::TargetTransformInfo::LSRCost::NumIVMuls
unsigned NumIVMuls
Definition TargetTransformInfo.h:543

llvm::TargetTransformInfo::LSRCost::ScaleCost
unsigned ScaleCost
Definition TargetTransformInfo.h:547

llvm::TargetTransformInfo::LSRCost::ImmCost
unsigned ImmCost
Definition TargetTransformInfo.h:545

llvm::TargetTransformInfo::LSRCost::AddRecCost
unsigned AddRecCost
Definition TargetTransformInfo.h:542

llvm::TargetTransformInfo::LSRCost::NumRegs
unsigned NumRegs
Definition TargetTransformInfo.h:541

llvm::TargetTransformInfo::LSRCost::NumBaseAdds
unsigned NumBaseAdds
Definition TargetTransformInfo.h:544

llvm::TargetTransformInfo::LSRCost::SetupCost
unsigned SetupCost
Definition TargetTransformInfo.h:546

llvm::TargetTransformInfo::MemCmpExpansionOptions
Returns options for expansion of memcmp. IsZeroCmp is.
Definition TargetTransformInfo.h:994

llvm::TargetTransformInfo::OperandValueInfo
Definition TargetTransformInfo.h:1169

llvm::TargetTransformInfo::PeelingPreferences
Definition TargetTransformInfo.h:681

llvm::TargetTransformInfo::PointersChainInfo
Describe known properties for a set of pointers.
Definition TargetTransformInfo.h:323

llvm::TargetTransformInfo::UnrollingPreferences
Parameters that control the generic loop unrolling transformation.
Definition TargetTransformInfo.h:551

llvm::TargetTransformInfo::VPLegalization
Definition TargetTransformInfo.h:1902

llvm::TargetTransformInfo::VPLegalization::Convert
@ Convert
Definition TargetTransformInfo.h:1909

llvm::TargetTransformInfo::VPLegalization::Discard
@ Discard
Definition TargetTransformInfo.h:1907