LLVM: lib/Transforms/Vectorize/LoopVectorizationPlanner.h Source File

//===- LoopVectorizationPlanner.h - Planner for LoopVectorization ---------===//

//

// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.

// See https://llvm.org/LICENSE.txt for license information.

// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception

//

//===----------------------------------------------------------------------===//

///

/// \file

/// This file provides a LoopVectorizationPlanner class.

/// InnerLoopVectorizer vectorizes loops which contain only one basic block.

/// LoopVectorizationPlanner - drives the vectorization process after having

/// passed Legality checks.

/// The planner builds and optimizes the Vectorization Plans which record the

/// decisions how to vectorize the given loop. In particular, represent the

/// control-flow of the vectorized version, the replication of instructions that

/// are to be scalarized, and interleave access groups.

///

/// Also provides a VPlan-based builder utility analogous to IRBuilder.

/// It provides an instruction-level API for generating VPInstructions while

/// abstracting away the Recipe manipulation details.

//===----------------------------------------------------------------------===//


#ifndef LLVM_TRANSFORMS_VECTORIZE_LOOPVECTORIZATIONPLANNER_H

#define LLVM_TRANSFORMS_VECTORIZE_LOOPVECTORIZATIONPLANNER_H


#include "VPlan.h"

#include "llvm/ADT/SmallSet.h"

#include "llvm/Support/InstructionCost.h"


// NOTE(review): this forward declaration sits in an anonymous namespace inside
// a header, so every translation unit that includes the header declares its
// own distinct GeneratedRTChecks type. Presumably the class is defined in the
// single source file that implements the members using it (see
// attachRuntimeChecks further down in this header) -- confirm before reusing
// this header elsewhere.
namespace {

class GeneratedRTChecks;

}


namespace llvm {


class LoopInfo;

class DominatorTree;

class LoopVectorizationLegality;

class LoopVectorizationCostModel;

class PredicatedScalarEvolution;

class LoopVectorizeHints;

class LoopVersioning;

class OptimizationRemarkEmitter;

class TargetTransformInfo;

class TargetLibraryInfo;

class VPRecipeBuilder;

struct VFRange;


extern cl::opt<bool> EnableVPlanNativePath;

extern cl::opt<unsigned> ForceTargetInstructionCost;


/// VPlan-based builder utility analogous to IRBuilder.
///
/// The builder keeps an optional insertion point, made of a VPBasicBlock and
/// an iterator into it. The create* helpers allocate a new recipe and, when a
/// block is set, insert it at that point; when no block is set the recipe is
/// returned without being inserted anywhere.
class VPBuilder {
  /// Block new recipes are inserted into; nullptr if no insertion point is
  /// set.
  VPBasicBlock *BB = nullptr;
  /// Position handed to VPBasicBlock::insert when a recipe is inserted in BB.
  VPBasicBlock::iterator InsertPt = VPBasicBlock::iterator();

  /// Insert \p R in BB at InsertPt if BB is set. \return \p R in either case.
  template <typename T> T *tryInsertInstruction(T *R) {
    if (BB)
      BB->insert(R, InsertPt);
    return R;
  }

  /// Create a VPInstruction from \p Opcode, \p Operands, \p DL and \p Name and
  /// insert it at the current insertion point, if one is set.
  VPInstruction *createInstruction(unsigned Opcode,
                                   ArrayRef<VPValue *> Operands, DebugLoc DL,
                                   const Twine &Name = "") {
    return tryInsertInstruction(new VPInstruction(Opcode, Operands, DL, Name));
  }

public:
  /// Create a builder without an insertion point.
  VPBuilder() = default;
  /// Create a builder that appends to the end of \p InsertBB.
  VPBuilder(VPBasicBlock *InsertBB) { setInsertPoint(InsertBB); }
  /// Create a builder whose insertion point is the recipe \p InsertPt.
  VPBuilder(VPRecipeBase *InsertPt) { setInsertPoint(InsertPt); }
  /// Create a builder inserting into \p TheBB at position \p IP.
  VPBuilder(VPBasicBlock *TheBB, VPBasicBlock::iterator IP) {
    setInsertPoint(TheBB, IP);
  }

  /// Clear the insertion point: created instructions will not be inserted into
  /// a block.
  void clearInsertionPoint() {
    BB = nullptr;
    InsertPt = VPBasicBlock::iterator();
  }

  /// \return the current insertion block, or nullptr if none is set.
  VPBasicBlock *getInsertBlock() const { return BB; }
  /// \return the current insertion position.
  VPBasicBlock::iterator getInsertPoint() const { return InsertPt; }

  /// Create a VPBuilder to insert after \p R.
  static VPBuilder getToInsertAfter(VPRecipeBase *R) {
    assert(R && "Cannot create an insert point after a null recipe");
    VPBuilder B;
    B.setInsertPoint(R->getParent(), std::next(R->getIterator()));
    return B;
  }

  /// VPInsertPoint - A saved insertion point.
  class VPInsertPoint {
    VPBasicBlock *Block = nullptr;
    VPBasicBlock::iterator Point;

  public:
    /// Creates a new insertion point which doesn't point to anything.
    VPInsertPoint() = default;

    /// Creates a new insertion point at the given location.
    VPInsertPoint(VPBasicBlock *InsertBlock, VPBasicBlock::iterator InsertPoint)
        : Block(InsertBlock), Point(InsertPoint) {}

    /// Returns true if this insert point is set.
    bool isSet() const { return Block != nullptr; }

    VPBasicBlock *getBlock() const { return Block; }
    VPBasicBlock::iterator getPoint() const { return Point; }
  };

  /// Sets the current insert point to a previously-saved location. An unset
  /// \p IP clears the insertion point instead.
  void restoreIP(VPInsertPoint IP) {
    if (IP.isSet())
      setInsertPoint(IP.getBlock(), IP.getPoint());
    else
      clearInsertionPoint();
  }

  /// This specifies that created VPInstructions should be appended to the end
  /// of the specified block.
  void setInsertPoint(VPBasicBlock *TheBB) {
    assert(TheBB && "Attempting to set a null insert point");
    BB = TheBB;
    InsertPt = BB->end();
  }

  /// This specifies that created instructions should be inserted at the
  /// specified point. \p TheBB is stored as given, without a null check.
  void setInsertPoint(VPBasicBlock *TheBB, VPBasicBlock::iterator IP) {
    BB = TheBB;
    InsertPt = IP;
  }

  /// This specifies that created instructions should be inserted at the
  /// position of the recipe \p IP, in the block containing \p IP.
  void setInsertPoint(VPRecipeBase *IP) {
    // Mirror the null check of the VPBasicBlock overload; IP is dereferenced
    // right below.
    assert(IP && "Attempting to set a null insert point");
    BB = IP->getParent();
    InsertPt = IP->getIterator();
  }

  /// Insert \p R at the current insertion point. Unlike the create* helpers,
  /// this requires an insertion block to be set.
  void insert(VPRecipeBase *R) {
    assert(BB && "Insertion point must be set before inserting a recipe");
    BB->insert(R, InsertPt);
  }

  /// Create an N-ary operation with \p Opcode, \p Operands and set \p Inst as
  /// its underlying Instruction. The debug location is taken from \p Inst when
  /// it is non-null and is unknown otherwise.
  VPInstruction *createNaryOp(unsigned Opcode, ArrayRef<VPValue *> Operands,
                              Instruction *Inst = nullptr,
                              const Twine &Name = "") {
    DebugLoc DL = DebugLoc::getUnknown();
    if (Inst)
      DL = Inst->getDebugLoc();
    VPInstruction *NewVPInst = createInstruction(Opcode, Operands, DL, Name);
    NewVPInst->setUnderlyingValue(Inst);
    return NewVPInst;
  }
  /// Create an N-ary operation with \p Opcode and \p Operands, using the
  /// explicit debug location \p DL.
  VPInstruction *createNaryOp(unsigned Opcode, ArrayRef<VPValue *> Operands,
                              DebugLoc DL, const Twine &Name = "") {
    return createInstruction(Opcode, Operands, DL, Name);
  }
  /// Create an N-ary operation with \p Opcode and \p Operands, carrying the IR
  /// flags \p Flags.
  VPInstruction *createNaryOp(unsigned Opcode, ArrayRef<VPValue *> Operands,
                              const VPIRFlags &Flags,
                              DebugLoc DL = DebugLoc::getUnknown(),
                              const Twine &Name = "") {
    return tryInsertInstruction(
        new VPInstruction(Opcode, Operands, Flags, DL, Name));
  }

  /// Create an N-ary operation with \p Opcode and \p Operands as a
  /// VPInstructionWithType with result type \p ResultTy.
  VPInstruction *createNaryOp(unsigned Opcode, ArrayRef<VPValue *> Operands,
                              Type *ResultTy, const VPIRFlags &Flags = {},
                              DebugLoc DL = DebugLoc::getUnknown(),
                              const Twine &Name = "") {
    return tryInsertInstruction(
        new VPInstructionWithType(Opcode, Operands, ResultTy, Flags, DL, Name));
  }

  /// Create an operation with \p Opcode and \p Operands, carrying the wrap
  /// flags \p WrapFlags.
  VPInstruction *createOverflowingOp(unsigned Opcode,
                                     ArrayRef<VPValue *> Operands,
                                     VPRecipeWithIRFlags::WrapFlagsTy WrapFlags,
                                     DebugLoc DL = DebugLoc::getUnknown(),
                                     const Twine &Name = "") {
    return tryInsertInstruction(
        new VPInstruction(Opcode, Operands, WrapFlags, DL, Name));
  }

  /// Create a VPInstruction::Not of \p Operand.
  VPInstruction *createNot(VPValue *Operand,
                           DebugLoc DL = DebugLoc::getUnknown(),
                           const Twine &Name = "") {
    return createInstruction(VPInstruction::Not, {Operand}, DL, Name);
  }

  /// Create a binary And of \p LHS and \p RHS.
  VPInstruction *createAnd(VPValue *LHS, VPValue *RHS,
                           DebugLoc DL = DebugLoc::getUnknown(),
                           const Twine &Name = "") {
    return createInstruction(Instruction::BinaryOps::And, {LHS, RHS}, DL, Name);
  }

  /// Create a binary Or of \p LHS and \p RHS, constructed with
  /// DisjointFlagsTy(false).
  VPInstruction *createOr(VPValue *LHS, VPValue *RHS,
                          DebugLoc DL = DebugLoc::getUnknown(),
                          const Twine &Name = "") {

    return tryInsertInstruction(new VPInstruction(
        Instruction::BinaryOps::Or, {LHS, RHS},
        VPRecipeWithIRFlags::DisjointFlagsTy(false), DL, Name));
  }

  /// Create a VPInstruction::LogicalAnd of \p LHS and \p RHS.
  VPInstruction *createLogicalAnd(VPValue *LHS, VPValue *RHS,
                                  DebugLoc DL = DebugLoc::getUnknown(),
                                  const Twine &Name = "") {
    return tryInsertInstruction(
        new VPInstruction(VPInstruction::LogicalAnd, {LHS, RHS}, DL, Name));
  }

  /// Create a select of \p TrueVal and \p FalseVal on \p Cond. The fast-math
  /// flags \p FMFs are attached only when provided.
  VPInstruction *
  createSelect(VPValue *Cond, VPValue *TrueVal, VPValue *FalseVal,
               DebugLoc DL = DebugLoc::getUnknown(), const Twine &Name = "",
               std::optional<FastMathFlags> FMFs = std::nullopt) {
    auto *Select =
        FMFs ? new VPInstruction(Instruction::Select, {Cond, TrueVal, FalseVal},
                                 *FMFs, DL, Name)
             : new VPInstruction(Instruction::Select, {Cond, TrueVal, FalseVal},
                                 DL, Name);
    return tryInsertInstruction(Select);
  }

  /// Create a new ICmp VPInstruction with predicate \p Pred and operands \p A
  /// and \p B.
  VPInstruction *createICmp(CmpInst::Predicate Pred, VPValue *A, VPValue *B,
                            DebugLoc DL = DebugLoc::getUnknown(),
                            const Twine &Name = "") {
    assert(Pred >= CmpInst::FIRST_ICMP_PREDICATE &&
           Pred <= CmpInst::LAST_ICMP_PREDICATE && "invalid predicate");
    return tryInsertInstruction(
        new VPInstruction(Instruction::ICmp, {A, B}, Pred, DL, Name));
  }

  /// Create a new FCmp VPInstruction with predicate \p Pred and operands \p A
  /// and \p B.
  VPInstruction *createFCmp(CmpInst::Predicate Pred, VPValue *A, VPValue *B,
                            DebugLoc DL = DebugLoc::getUnknown(),
                            const Twine &Name = "") {
    assert(Pred >= CmpInst::FIRST_FCMP_PREDICATE &&
           Pred <= CmpInst::LAST_FCMP_PREDICATE && "invalid predicate");
    return tryInsertInstruction(
        new VPInstruction(Instruction::FCmp, {A, B}, Pred, DL, Name));
  }

  /// Create a VPInstruction::PtrAdd of \p Ptr and \p Offset with
  /// GEPNoWrapFlags::none().
  VPInstruction *createPtrAdd(VPValue *Ptr, VPValue *Offset,
                              DebugLoc DL = DebugLoc::getUnknown(),
                              const Twine &Name = "") {
    return tryInsertInstruction(
        new VPInstruction(VPInstruction::PtrAdd, {Ptr, Offset},
                          GEPNoWrapFlags::none(), DL, Name));
  }

  /// Create a VPInstruction::PtrAdd of \p Ptr and \p Offset carrying the
  /// no-wrap flags \p GEPFlags.
  VPInstruction *createNoWrapPtrAdd(VPValue *Ptr, VPValue *Offset,
                                    GEPNoWrapFlags GEPFlags,
                                    DebugLoc DL = DebugLoc::getUnknown(),
                                    const Twine &Name = "") {
    return tryInsertInstruction(new VPInstruction(
        VPInstruction::PtrAdd, {Ptr, Offset}, GEPFlags, DL, Name));
  }

  /// Create a VPInstruction::WidePtrAdd of \p Ptr and \p Offset with
  /// GEPNoWrapFlags::none().
  VPInstruction *createWidePtrAdd(VPValue *Ptr, VPValue *Offset,
                                  DebugLoc DL = DebugLoc::getUnknown(),
                                  const Twine &Name = "") {
    return tryInsertInstruction(
        new VPInstruction(VPInstruction::WidePtrAdd, {Ptr, Offset},
                          GEPNoWrapFlags::none(), DL, Name));
  }

  /// Create a VPPhi with the incoming values \p IncomingValues.
  VPPhi *createScalarPhi(ArrayRef<VPValue *> IncomingValues, DebugLoc DL,
                         const Twine &Name = "") {
    return tryInsertInstruction(new VPPhi(IncomingValues, DL, Name));
  }

  /// Return a VPValue of type \p Ty holding the element count \p EC. For a
  /// fixed \p EC this is a live-in constant with the known minimum value. For
  /// a scalable \p EC it is a VScale instruction, multiplied by the known
  /// minimum value unless that value is 1. Requires an insertion block, since
  /// the VPlan is reached through it.
  VPValue *createElementCount(Type *Ty, ElementCount EC) {
    VPBasicBlock *InsertBB = getInsertBlock();
    assert(InsertBB && "Insertion point must be set to access the VPlan");
    VPlan &Plan = *InsertBB->getPlan();
    VPValue *RuntimeEC =
        Plan.getOrAddLiveIn(ConstantInt::get(Ty, EC.getKnownMinValue()));
    if (EC.isScalable()) {
      VPValue *VScale = createNaryOp(VPInstruction::VScale, {}, Ty);
      // NOTE(review): {true, false} are the wrap flags of the multiply;
      // presumably NUW set and NSW clear -- confirm against WrapFlagsTy.
      RuntimeEC = EC.getKnownMinValue() == 1
                      ? VScale
                      : createOverflowingOp(Instruction::Mul,
                                            {VScale, RuntimeEC}, {true, false});
    }
    return RuntimeEC;
  }

  /// Convert the input value \p Current to the corresponding value of an
  /// induction with \p Start and \p Step values, using \p Start + \p Current *
  /// \p Step.
  VPDerivedIVRecipe *createDerivedIV(InductionDescriptor::InductionKind Kind,
                                     FPMathOperator *FPBinOp, VPValue *Start,
                                     VPValue *Current, VPValue *Step,
                                     const Twine &Name = "") {
    return tryInsertInstruction(
        new VPDerivedIVRecipe(Kind, FPBinOp, Start, Current, Step, Name));
  }

  /// Create a cast of \p Op to \p ResultTy using \p Opcode, as a
  /// VPInstructionWithType with default flags.
  VPInstruction *createScalarCast(Instruction::CastOps Opcode, VPValue *Op,
                                  Type *ResultTy, DebugLoc DL) {
    return tryInsertInstruction(
        new VPInstructionWithType(Opcode, Op, ResultTy, {}, DL));
  }

  /// Return \p Op unchanged if \p ResultTy equals \p SrcTy. Otherwise create a
  /// Trunc when \p ResultTy has fewer scalar bits than \p SrcTy, and a ZExt in
  /// every other case.
  VPValue *createScalarZExtOrTrunc(VPValue *Op, Type *ResultTy, Type *SrcTy,
                                   DebugLoc DL) {
    if (ResultTy == SrcTy)
      return Op;
    Instruction::CastOps CastOp =
        ResultTy->getScalarSizeInBits() < SrcTy->getScalarSizeInBits()
            ? Instruction::Trunc
            : Instruction::ZExt;
    return createScalarCast(CastOp, Op, ResultTy, DL);
  }

  /// Create a VPWidenCastRecipe casting \p Op to \p ResultTy with \p Opcode.
  VPWidenCastRecipe *createWidenCast(Instruction::CastOps Opcode, VPValue *Op,
                                     Type *ResultTy) {
    return tryInsertInstruction(new VPWidenCastRecipe(Opcode, Op, ResultTy));
  }

  /// Create a VPScalarIVStepsRecipe for \p IV, \p Step and \p VF with
  /// \p InductionOpcode. The fast-math flags come from \p FPBinOp when it is
  /// non-null and are default-constructed otherwise.
  VPScalarIVStepsRecipe *
  createScalarIVSteps(Instruction::BinaryOps InductionOpcode,
                      FPMathOperator *FPBinOp, VPValue *IV, VPValue *Step,
                      VPValue *VF, DebugLoc DL) {
    return tryInsertInstruction(new VPScalarIVStepsRecipe(
        IV, Step, VF, InductionOpcode,
        FPBinOp ? FPBinOp->getFastMathFlags() : FastMathFlags(), DL));
  }

  /// Create a VPExpandSCEVRecipe for \p Expr.
  VPExpandSCEVRecipe *createExpandSCEV(const SCEV *Expr) {
    return tryInsertInstruction(new VPExpandSCEVRecipe(Expr));
  }

  //===--------------------------------------------------------------------===//
  // RAII helpers.
  //===--------------------------------------------------------------------===//

  /// RAII object that stores the current insertion point and restores it when
  /// the object is destroyed.
  class InsertPointGuard {
    VPBuilder &Builder;
    VPBasicBlock *Block;
    VPBasicBlock::iterator Point;

  public:
    /// Capture the insertion block and position of \p B at construction time.
    InsertPointGuard(VPBuilder &B)
        : Builder(B), Block(B.getInsertBlock()), Point(B.getInsertPoint()) {}

    InsertPointGuard(const InsertPointGuard &) = delete;
    InsertPointGuard &operator=(const InsertPointGuard &) = delete;

    /// Restore the captured insertion point; a captured null block clears the
    /// builder's insertion point (see restoreIP).
    ~InsertPointGuard() { Builder.restoreIP(VPInsertPoint(Block, Point)); }
  };
};


/// TODO: The following VectorizationFactor was pulled out of

/// LoopVectorizationCostModel class. LV also deals with

/// VectorizerParams::VectorizationFactor.

/// We need to streamline them.


/// Information about vectorization costs.

struct VectorizationFactor {

  /// Vector width with best cost.

  ElementCount Width;


  /// Cost of the loop with that width.

  InstructionCost Cost;


  /// Cost of the scalar loop.

  InstructionCost ScalarCost;


  /// The minimum trip count required to make vectorization profitable, e.g. due

  /// to runtime checks.

  ElementCount MinProfitableTripCount;


  VectorizationFactor(ElementCount Width, InstructionCost Cost,

                      InstructionCost ScalarCost)

      : Width(Width), Cost(Cost), ScalarCost(ScalarCost) {}


  /// Width 1 means no vectorization, cost 0 means uncomputed cost.

  static VectorizationFactor Disabled() {

    return {ElementCount::getFixed(1), 0, 0};

  }


  bool operator==(const VectorizationFactor &rhs) const {

    return Width == rhs.Width && Cost == rhs.Cost;

  }


  bool operator!=(const VectorizationFactor &rhs) const {

    return !(*this == rhs);

  }

};


/// Holds a pair of vectorization factors, one fixed-width and one scalable,
/// both of which default to 0. The vectorizer can use it to pick the most
/// cost-effective VF out of a range of fixed and/or scalable candidates.
struct FixedScalableVFPair {
  ElementCount FixedVF;
  ElementCount ScalableVF;

  /// Both factors start out as zero.
  FixedScalableVFPair()
      : FixedVF(ElementCount::getFixed(0)),
        ScalableVF(ElementCount::getScalable(0)) {}

  /// Store \p Max in whichever slot matches its kind; the other slot keeps
  /// its zero default.
  FixedScalableVFPair(const ElementCount &Max) : FixedScalableVFPair() {
    if (Max.isScalable())
      ScalableVF = Max;
    else
      FixedVF = Max;
  }

  /// Set both factors explicitly. \p FixedVF must be fixed-width and
  /// \p ScalableVF must be scalable.
  FixedScalableVFPair(const ElementCount &FixedVF,
                      const ElementCount &ScalableVF)
      : FixedVF(FixedVF), ScalableVF(ScalableVF) {
    assert(!FixedVF.isScalable() && ScalableVF.isScalable() &&
           "Invalid scalable properties");
  }

  /// \return a pair in which both factors are zero.
  static FixedScalableVFPair getNone() { return {}; }

  /// \return true if either fixed- or scalable VF is non-zero.
  explicit operator bool() const {
    if (FixedVF)
      return true;
    return static_cast<bool>(ScalableVF);
  }

  /// \return true if either fixed- or scalable VF is a valid vector VF.
  bool hasVector() const {
    if (FixedVF.isVector())
      return true;
    return ScalableVF.isVector();
  }
};


/// Planner drives the vectorization process after having passed
/// Legality checks.
///
/// Apart from the constructor and hasPlanWithVF, the member functions are only
/// declared here and are defined out of line.
class LoopVectorizationPlanner {
  /// The loop that we evaluate.
  Loop *OrigLoop;

  /// Loop Info analysis.
  LoopInfo *LI;

  /// The dominator tree.
  DominatorTree *DT;

  /// Target Library Info.
  const TargetLibraryInfo *TLI;

  /// Target Transform Info.
  const TargetTransformInfo &TTI;

  /// The legality analysis.
  LoopVectorizationLegality *Legal;

  /// The profitability analysis.
  LoopVectorizationCostModel &CM;

  /// The interleaved access analysis.
  InterleavedAccessInfo &IAI;

  /// The predicated scalar evolution object handed to the constructor.
  PredicatedScalarEvolution &PSE;

  /// The loop vectorization hints handed to the constructor.
  const LoopVectorizeHints &Hints;

  /// The optimization remark emitter handed to the constructor.
  OptimizationRemarkEmitter *ORE;

  /// The VPlans held by this planner; hasPlanWithVF searches this list.
  SmallVector<VPlanPtr, 4> VPlans;

  /// Profitable vector factors.
  SmallVector<VectorizationFactor, 8> ProfitableVFs;

  /// A builder used to construct the current plan.
  VPBuilder Builder;

  /// Computes the cost of \p Plan for vectorization factor \p VF.
  ///
  /// The current implementation requires access to the
  /// LoopVectorizationLegality to handle inductions and reductions, which is
  /// why it is kept separate from the VPlan-only cost infrastructure.
  ///
  /// TODO: Move to VPlan::cost once the use of LoopVectorizationLegality has
  /// been retired.
  InstructionCost cost(VPlan &Plan, ElementCount VF) const;

  /// Precompute costs for certain instructions using the legacy cost model. The
  /// function is used to bring up the VPlan-based cost model to initially avoid
  /// taking different decisions due to inaccuracies in the legacy cost model.
  InstructionCost precomputeCosts(VPlan &Plan, ElementCount VF,
                                  VPCostContext &CostCtx) const;

public:
  /// Store the loop \p L together with the analyses and helper objects the
  /// planner works with. VPlans, ProfitableVFs and Builder start out
  /// default-constructed.
  LoopVectorizationPlanner(
      Loop *L, LoopInfo *LI, DominatorTree *DT, const TargetLibraryInfo *TLI,
      const TargetTransformInfo &TTI, LoopVectorizationLegality *Legal,
      LoopVectorizationCostModel &CM, InterleavedAccessInfo &IAI,
      PredicatedScalarEvolution &PSE, const LoopVectorizeHints &Hints,
      OptimizationRemarkEmitter *ORE)
      : OrigLoop(L), LI(LI), DT(DT), TLI(TLI), TTI(TTI), Legal(Legal), CM(CM),
        IAI(IAI), PSE(PSE), Hints(Hints), ORE(ORE) {}

  /// Build VPlans for the specified \p UserVF and \p UserIC if they are
  /// non-zero or all applicable candidate VFs otherwise. If vectorization and
  /// interleaving should be avoided up-front, no plans are generated.
  void plan(ElementCount UserVF, unsigned UserIC);

  /// Use the VPlan-native path to plan how to best vectorize, return the best
  /// VF and its cost.
  VectorizationFactor planInVPlanNativePath(ElementCount UserVF);

  /// Return the VPlan for \p VF. At the moment, there is always a single VPlan
  /// for each VF.
  VPlan &getPlanFor(ElementCount VF) const;

  /// Compute and return the most profitable vectorization factor. Also collect
  /// all profitable VFs in ProfitableVFs.
  VectorizationFactor computeBestVF();

  /// \return The desired interleave count.
  /// If interleave count has been specified by metadata it will be returned.
  /// Otherwise, the interleave count is computed and returned. \p VF and
  /// \p LoopCost are the selected vectorization factor and the cost of the
  /// selected VF.
  unsigned selectInterleaveCount(VPlan &Plan, ElementCount VF,
                                 InstructionCost LoopCost);

  /// Generate the IR code for the vectorized loop captured in VPlan \p BestPlan
  /// according to the best selected \p VF and \p UF.
  ///
  /// TODO: \p VectorizingEpilogue indicates if the executed VPlan is for the
  /// epilogue vector loop. It should be removed once the re-use issue has been
  /// fixed.
  ///
  /// Returns a mapping of SCEVs to their expanded IR values.
  /// Note that this is a temporary workaround needed due to the current
  /// epilogue handling.
  DenseMap<const SCEV *, Value *> executePlan(ElementCount VF, unsigned UF,
                                              VPlan &BestPlan,
                                              InnerLoopVectorizer &LB,
                                              DominatorTree *DT,
                                              bool VectorizingEpilogue);

#if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)
  /// Printing helper taking the output stream \p O. Only declared when
  /// assertions are enabled or LLVM_ENABLE_DUMP is defined.
  void printPlans(raw_ostream &O);
#endif

  /// Look through the existing plans and return true if we have one with
  /// vectorization factor \p VF.
  bool hasPlanWithVF(ElementCount VF) const {
    return any_of(VPlans,
                  [&](const VPlanPtr &Plan) { return Plan->hasVF(VF); });
  }

  /// Test a \p Predicate on a \p Range of VF's. Return the value of applying
  /// \p Predicate on Range.Start, possibly decreasing Range.End such that the
  /// returned value holds for the entire \p Range.
  static bool
  getDecisionAndClampRange(const std::function<bool(ElementCount)> &Predicate,
                           VFRange &Range);

  /// \return The most profitable vectorization factor and the cost of that VF
  /// for vectorizing the epilogue. Returns VectorizationFactor::Disabled if
  /// epilogue vectorization is not supported for the loop.
  VectorizationFactor
  selectEpilogueVectorizationFactor(const ElementCount MaxVF, unsigned IC);

  /// Emit remarks for recipes with invalid costs in the available VPlans.
  void emitInvalidCostRemarks(OptimizationRemarkEmitter *ORE);

  /// Create a check to \p Plan to see if the vector loop should be executed
  /// based on its trip count.
  void addMinimumIterationCheck(VPlan &Plan, ElementCount VF, unsigned UF,
                                ElementCount MinProfitableTripCount) const;

protected:
  /// Build VPlans for power-of-2 VF's between \p MinVF and \p MaxVF inclusive,
  /// according to the information gathered by Legal when it checked if it is
  /// legal to vectorize the loop.
  void buildVPlans(ElementCount MinVF, ElementCount MaxVF);

private:
  /// Build a VPlan according to the information gathered by Legal. \return a
  /// VPlan for vectorization factors \p Range.Start and up to \p Range.End
  /// exclusive, possibly decreasing \p Range.End. If no VPlan can be built for
  /// the input range, set the largest included VF to the maximum VF for which
  /// no plan could be built.
  VPlanPtr tryToBuildVPlan(VFRange &Range);

  /// Build a VPlan using VPRecipes according to the information gathered by
  /// Legal. This method is only used for the legacy inner loop vectorizer.
  /// \p Range's largest included VF is restricted to the maximum VF the
  /// returned VPlan is valid for. If no VPlan can be built for the input range,
  /// set the largest included VF to the maximum VF for which no plan could be
  /// built. Each VPlan is built starting from a copy of \p InitialPlan, which
  /// is a plain CFG VPlan wrapping the original scalar loop.
  VPlanPtr tryToBuildVPlanWithVPRecipes(VPlanPtr InitialPlan, VFRange &Range,
                                        LoopVersioning *LVer);

  /// Build VPlans for power-of-2 VF's between \p MinVF and \p MaxVF inclusive,
  /// according to the information gathered by Legal when it checked if it is
  /// legal to vectorize the loop. This method creates VPlans using VPRecipes.
  void buildVPlansWithVPRecipes(ElementCount MinVF, ElementCount MaxVF);

  /// Adjust the recipes for reductions. For in-loop reductions the chain of
  /// instructions leading from the loop exit instr to the phi needs to be
  /// converted to reductions, with one operand being vector and the other being
  /// the scalar reduction chain. For other reductions, a select is introduced
  /// between the phi and users outside the vector region when folding the tail.
  void adjustRecipesForReductions(VPlanPtr &Plan,
                                  VPRecipeBuilder &RecipeBuilder,
                                  ElementCount MinVF);

  /// Attach the runtime checks of \p RTChecks to \p Plan.
  void attachRuntimeChecks(VPlan &Plan, GeneratedRTChecks &RTChecks,
                           bool HasBranchWeights) const;

#ifndef NDEBUG
  /// \return The most profitable vectorization factor for the available VPlans
  /// and the cost of that VF.
  /// This is now only used to verify the decisions by the new VPlan-based
  /// cost-model and will be retired once the VPlan-based cost-model is
  /// stabilized.
  VectorizationFactor selectVectorizationFactor();
#endif

  /// Returns true if the per-lane cost of VectorizationFactor A is lower than
  /// that of B.
  bool isMoreProfitable(const VectorizationFactor &A,
                        const VectorizationFactor &B, bool HasTail) const;

  /// Returns true if the per-lane cost of VectorizationFactor A is lower than
  /// that of B in the context of vectorizing a loop with known \p MaxTripCount.
  bool isMoreProfitable(const VectorizationFactor &A,
                        const VectorizationFactor &B,
                        const unsigned MaxTripCount, bool HasTail) const;

  /// Determines if we have the infrastructure to vectorize the loop and its
  /// epilogue, assuming the main loop is vectorized by \p VF.
  bool isCandidateForEpilogueVectorization(const ElementCount VF) const;
};


} // namespace llvm


#endif // LLVM_TRANSFORMS_VECTORIZE_LOOPVECTORIZATIONPLANNER_H

assert
assert(UImm &&(UImm !=~static_cast< T >(0)) &&"Invalid immediate!")

Select
AMDGPU Register Bank Select
Definition: AMDGPURegBankSelect.cpp:68

DL
MachineBasicBlock MachineBasicBlock::iterator DebugLoc DL
Definition: ARMSLSHardening.cpp:73

B
static GCRegistry::Add< OcamlGC > B("ocaml", "ocaml 3.10-compatible GC")

A
static GCRegistry::Add< ErlangGC > A("erlang", "erlang-compatible garbage collector")

Name
std::string Name
Definition: ELFObjHandler.cpp:77

InstructionCost.h
This file defines an InstructionCost class that is used when calculating the cost of an instruction,...

Operands
mir Rename Register Operands
Definition: MIRNamerPass.cpp:74

Range
ConstantRange Range(APInt(BitWidth, Low), APInt(BitWidth, High))

Cond
const SmallVectorImpl< MachineOperand > & Cond
Definition: RISCVRedundantCopyElimination.cpp:71

SmallSet.h
This file defines the SmallSet class.

Ptr
@ Ptr
Definition: TargetLibraryInfo.cpp:77

VPlan.h
This file contains the declarations of the Vectorization Plan base classes:

RHS
Value * RHS
Definition: X86PartialReduction.cpp:74

LHS
Value * LHS
Definition: X86PartialReduction.cpp:73

IV
static const uint32_t IV[8]
Definition: blake3_impl.h:83

Predicate
Definition: AMDGPURegBankLegalizeRules.cpp:376

T

bool

llvm::ArrayRef
ArrayRef - Represent a constant reference to an array (0 or more elements consecutively in memory),...
Definition: ArrayRef.h:41

llvm::CmpInst::Predicate
Predicate
This enumeration lists the possible predicates for CmpInst subclasses.
Definition: InstrTypes.h:678

llvm::CmpInst::FIRST_ICMP_PREDICATE
@ FIRST_ICMP_PREDICATE
Definition: InstrTypes.h:709

llvm::CmpInst::FIRST_FCMP_PREDICATE
@ FIRST_FCMP_PREDICATE
Definition: InstrTypes.h:696

llvm::CmpInst::LAST_ICMP_PREDICATE
@ LAST_ICMP_PREDICATE
Definition: InstrTypes.h:710

llvm::CmpInst::LAST_FCMP_PREDICATE
@ LAST_FCMP_PREDICATE
Definition: InstrTypes.h:697

llvm::DWARFExpression::Operation
This class represents an Operation in the Expression.
Definition: DWARFExpression.h:33

llvm::DebugLoc
A debug info location.
Definition: DebugLoc.h:124

llvm::DebugLoc::getUnknown
static DebugLoc getUnknown()
Definition: DebugLoc.h:162

llvm::DenseMap
Definition: DenseMap.h:730

llvm::DominatorTree
Concrete subclass of DominatorTreeBase that is used to compute a normal dominator tree.
Definition: Dominators.h:165

llvm::ElementCount
Definition: TypeSize.h:301

llvm::ElementCount::isVector
constexpr bool isVector() const
One or more elements.
Definition: TypeSize.h:327

llvm::ElementCount::getFixed
static constexpr ElementCount getFixed(ScalarTy MinVal)
Definition: TypeSize.h:312

llvm::FPMathOperator
Utility class for floating point operations which can have information about relaxed accuracy require...
Definition: Operator.h:200

llvm::FPMathOperator::getFastMathFlags
FastMathFlags getFastMathFlags() const
Convenience function for getting all the fast-math flags.
Definition: Operator.h:333

llvm::FastMathFlags
Convenience struct for specifying and reasoning about fast-math flags.
Definition: FMF.h:22

llvm::GEPNoWrapFlags
Represents flags for the getelementptr instruction/expression.
Definition: GEPNoWrapFlags.h:26

llvm::GEPNoWrapFlags::none
static GEPNoWrapFlags none()
Definition: GEPNoWrapFlags.h:46

llvm::InductionDescriptor::InductionKind
InductionKind
This enum represents the kinds of inductions that we support.
Definition: IVDescriptors.h:383

llvm::InnerLoopVectorizer
InnerLoopVectorizer vectorizes loops which contain only one basic block to a specified vectorization ...
Definition: LoopVectorize.cpp:498

llvm::InstructionCost
Definition: InstructionCost.h:30

llvm::Instruction
Definition: Instruction.h:69

llvm::Instruction::BinaryOps
BinaryOps
Definition: Instruction.h:998

llvm::Instruction::CastOps
CastOps
Definition: Instruction.h:1012

llvm::InterleavedAccessInfo
Drive the analysis of interleaved memory accesses in the loop.
Definition: VectorUtils.h:669

llvm::LoopInfo
Definition: LoopInfo.h:409

llvm::LoopVectorizationCostModel
LoopVectorizationCostModel - estimates the expected speedups due to vectorization.
Definition: LoopVectorize.cpp:894

llvm::LoopVectorizationLegality
LoopVectorizationLegality checks if it is legal to vectorize a loop, and to what vectorization factor...
Definition: LoopVectorizationLegality.h:252

llvm::LoopVectorizationPlanner
Planner drives the vectorization process after having passed Legality checks.
Definition: LoopVectorizationPlanner.h:434

llvm::LoopVectorizationPlanner::selectEpilogueVectorizationFactor
VectorizationFactor selectEpilogueVectorizationFactor(const ElementCount MaxVF, unsigned IC)
Definition: LoopVectorize.cpp:4344

llvm::LoopVectorizationPlanner::getPlanFor
VPlan & getPlanFor(ElementCount VF) const
Return the VPlan for VF.
Definition: VPlan.cpp:1602

llvm::LoopVectorizationPlanner::LoopVectorizationPlanner
LoopVectorizationPlanner(Loop *L, LoopInfo *LI, DominatorTree *DT, const TargetLibraryInfo *TLI, const TargetTransformInfo &TTI, LoopVectorizationLegality *Legal, LoopVectorizationCostModel &CM, InterleavedAccessInfo &IAI, PredicatedScalarEvolution &PSE, const LoopVectorizeHints &Hints, OptimizationRemarkEmitter *ORE)
Definition: LoopVectorizationPlanner.h:490

llvm::LoopVectorizationPlanner::planInVPlanNativePath
VectorizationFactor planInVPlanNativePath(ElementCount UserVF)
Use the VPlan-native path to plan how to best vectorize, return the best VF and its cost.
Definition: LoopVectorize.cpp:6572

llvm::LoopVectorizationPlanner::buildVPlans
void buildVPlans(ElementCount MinVF, ElementCount MaxVF)
Build VPlans for power-of-2 VFs between MinVF and MaxVF inclusive, according to the information gath...
Definition: VPlan.cpp:1586

llvm::LoopVectorizationPlanner::computeBestVF
VectorizationFactor computeBestVF()
Compute and return the most profitable vectorization factor.
Definition: LoopVectorize.cpp:6965

llvm::LoopVectorizationPlanner::executePlan
DenseMap< const SCEV *, Value * > executePlan(ElementCount VF, unsigned UF, VPlan &BestPlan, InnerLoopVectorizer &LB, DominatorTree *DT, bool VectorizingEpilogue)
Generate the IR code for the vectorized loop captured in VPlan BestPlan according to the best selecte...
Definition: LoopVectorize.cpp:7188

llvm::LoopVectorizationPlanner::selectInterleaveCount
unsigned selectInterleaveCount(VPlan &Plan, ElementCount VF, InstructionCost LoopCost)
Definition: LoopVectorize.cpp:4529

llvm::LoopVectorizationPlanner::emitInvalidCostRemarks
void emitInvalidCostRemarks(OptimizationRemarkEmitter *ORE)
Emit remarks for recipes with invalid costs in the available VPlans.
Definition: LoopVectorize.cpp:3922

llvm::LoopVectorizationPlanner::getDecisionAndClampRange
static bool getDecisionAndClampRange(const std::function< bool(ElementCount)> &Predicate, VFRange &Range)
Test a Predicate on a Range of VFs.
Definition: VPlan.cpp:1567

llvm::LoopVectorizationPlanner::printPlans
void printPlans(raw_ostream &O)
Definition: VPlan.cpp:1616

llvm::LoopVectorizationPlanner::plan
void plan(ElementCount UserVF, unsigned UserIC)
Build VPlans for the specified UserVF and UserIC if they are non-zero or all applicable candidate VFs...
Definition: LoopVectorize.cpp:6626

llvm::LoopVectorizationPlanner::addMinimumIterationCheck
void addMinimumIterationCheck(VPlan &Plan, ElementCount VF, unsigned UF, ElementCount MinProfitableTripCount) const
Create a check in Plan to see if the vector loop should be executed based on its trip count.
Definition: LoopVectorize.cpp:9280

llvm::LoopVectorizationPlanner::hasPlanWithVF
bool hasPlanWithVF(ElementCount VF) const
Look through the existing plans and return true if we have one with vectorization factor VF.
Definition: LoopVectorizationPlanner.h:545

llvm::LoopVectorizeHints
Utility class for getting and setting loop vectorizer hints in the form of loop metadata.
Definition: LoopVectorizationLegality.h:60

llvm::LoopVersioning
This class emits a version of the loop where run-time checks ensure that may-alias pointers can't ove...
Definition: LoopVersioning.h:41

llvm::Loop
Represents a single loop in the control flow graph.
Definition: LoopInfo.h:40

llvm::OptimizationRemarkEmitter
The optimization diagnostic interface.
Definition: OptimizationRemarkEmitter.h:33

llvm::PredicatedScalarEvolution
An interface layer with SCEV used to manage how we see SCEV expressions for values in the context of ...
Definition: ScalarEvolution.h:2423

llvm::SCEV
This class represents an analyzed expression in the program.
Definition: ScalarEvolution.h:72

llvm::SmallVector
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
Definition: SmallVector.h:1197

llvm::TargetLibraryInfo
Provides information about what library functions are available for the current target.
Definition: TargetLibraryInfo.h:285

llvm::TargetTransformInfo
This pass provides access to the codegen interfaces that are needed for IR-level transformations.
Definition: TargetTransformInfo.h:219

llvm::Twine
Twine - A lightweight data structure for efficiently representing the concatenation of temporary valu...
Definition: Twine.h:82

llvm::Type
The instances of the Type class are immutable: once they are created, they are never changed.
Definition: Type.h:45

llvm::Type::getScalarSizeInBits
LLVM_ABI unsigned getScalarSizeInBits() const LLVM_READONLY
If this is a vector type, return the getPrimitiveSizeInBits value for the element type.

llvm::VPBasicBlock
VPBasicBlock serves as the leaf of the Hierarchical Control-Flow Graph.
Definition: VPlan.h:3639

llvm::VPBasicBlock::iterator
RecipeListTy::iterator iterator
Instruction iterators...
Definition: VPlan.h:3666

llvm::VPBasicBlock::end
iterator end()
Definition: VPlan.h:3676

llvm::VPBasicBlock::insert
void insert(VPRecipeBase *Recipe, iterator InsertPt)
Definition: VPlan.h:3705

llvm::VPBlockBase::getPlan
VPlan * getPlan()
Definition: VPlan.cpp:155

llvm::VPBuilder::InsertPointGuard
RAII object that stores the current insertion point and restores it when the object is destroyed.
Definition: LoopVectorizationPlanner.h:347

llvm::VPBuilder::InsertPointGuard::InsertPointGuard
InsertPointGuard(const InsertPointGuard &)=delete

llvm::VPBuilder::InsertPointGuard::InsertPointGuard
InsertPointGuard(VPBuilder &B)
Definition: LoopVectorizationPlanner.h:353

llvm::VPBuilder::InsertPointGuard::operator=
InsertPointGuard & operator=(const InsertPointGuard &)=delete

llvm::VPBuilder::InsertPointGuard::~InsertPointGuard
~InsertPointGuard()
Definition: LoopVectorizationPlanner.h:359

llvm::VPBuilder::VPInsertPoint
InsertPoint - A saved insertion point.
Definition: LoopVectorizationPlanner.h:97

llvm::VPBuilder::VPInsertPoint::VPInsertPoint
VPInsertPoint(VPBasicBlock *InsertBlock, VPBasicBlock::iterator InsertPoint)
Creates a new insertion point at the given location.
Definition: LoopVectorizationPlanner.h:106

llvm::VPBuilder::VPInsertPoint::getBlock
VPBasicBlock * getBlock() const
Definition: LoopVectorizationPlanner.h:112

llvm::VPBuilder::VPInsertPoint::getPoint
VPBasicBlock::iterator getPoint() const
Definition: LoopVectorizationPlanner.h:113

llvm::VPBuilder::VPInsertPoint::VPInsertPoint
VPInsertPoint()=default
Creates a new insertion point which doesn't point to anything.

llvm::VPBuilder::VPInsertPoint::isSet
bool isSet() const
Returns true if this insert point is set.
Definition: LoopVectorizationPlanner.h:110

llvm::VPBuilder
VPlan-based builder utility analogous to IRBuilder.
Definition: LoopVectorizationPlanner.h:54

llvm::VPBuilder::createOr
VPInstruction * createOr(VPValue *LHS, VPValue *RHS, DebugLoc DL=DebugLoc::getUnknown(), const Twine &Name="")
Definition: LoopVectorizationPlanner.h:202

llvm::VPBuilder::createScalarZExtOrTrunc
VPValue * createScalarZExtOrTrunc(VPValue *Op, Type *ResultTy, Type *SrcTy, DebugLoc DL)
Definition: LoopVectorizationPlanner.h:312

llvm::VPBuilder::setInsertPoint
void setInsertPoint(VPBasicBlock *TheBB, VPBasicBlock::iterator IP)
This specifies that created instructions should be inserted at the specified point.
Definition: LoopVectorizationPlanner.h:134

llvm::VPBuilder::setInsertPoint
void setInsertPoint(VPRecipeBase *IP)
This specifies that created instructions should be inserted at the specified point.
Definition: LoopVectorizationPlanner.h:141

llvm::VPBuilder::createElementCount
VPValue * createElementCount(Type *Ty, ElementCount EC)
Definition: LoopVectorizationPlanner.h:281

llvm::VPBuilder::restoreIP
void restoreIP(VPInsertPoint IP)
Sets the current insert point to a previously-saved location.
Definition: LoopVectorizationPlanner.h:117

llvm::VPBuilder::createNot
VPInstruction * createNot(VPValue *Operand, DebugLoc DL=DebugLoc::getUnknown(), const Twine &Name="")
Definition: LoopVectorizationPlanner.h:190

llvm::VPBuilder::createLogicalAnd
VPInstruction * createLogicalAnd(VPValue *LHS, VPValue *RHS, DebugLoc DL=DebugLoc::getUnknown(), const Twine &Name="")
Definition: LoopVectorizationPlanner.h:211

llvm::VPBuilder::getInsertBlock
VPBasicBlock * getInsertBlock() const
Definition: LoopVectorizationPlanner.h:86

llvm::VPBuilder::createDerivedIV
VPDerivedIVRecipe * createDerivedIV(InductionDescriptor::InductionKind Kind, FPMathOperator *FPBinOp, VPValue *Start, VPValue *Current, VPValue *Step, const Twine &Name="")
Convert the input value Current to the corresponding value of an induction with Start and Step values...
Definition: LoopVectorizationPlanner.h:298

llvm::VPBuilder::insert
void insert(VPRecipeBase *R)
Insert R at the current insertion point.
Definition: LoopVectorizationPlanner.h:147

llvm::VPBuilder::createSelect
VPInstruction * createSelect(VPValue *Cond, VPValue *TrueVal, VPValue *FalseVal, DebugLoc DL=DebugLoc::getUnknown(), const Twine &Name="", std::optional< FastMathFlags > FMFs=std::nullopt)
Definition: LoopVectorizationPlanner.h:219

llvm::VPBuilder::getInsertPoint
VPBasicBlock::iterator getInsertPoint() const
Definition: LoopVectorizationPlanner.h:87

llvm::VPBuilder::createScalarIVSteps
VPScalarIVStepsRecipe * createScalarIVSteps(Instruction::BinaryOps InductionOpcode, FPMathOperator *FPBinOp, VPValue *IV, VPValue *Step, VPValue *VF, DebugLoc DL)
Definition: LoopVectorizationPlanner.h:329

llvm::VPBuilder::VPBuilder
VPBuilder(VPBasicBlock *InsertBB)
Definition: LoopVectorizationPlanner.h:73

llvm::VPBuilder::createNoWrapPtrAdd
VPInstruction * createNoWrapPtrAdd(VPValue *Ptr, VPValue *Offset, GEPNoWrapFlags GEPFlags, DebugLoc DL=DebugLoc::getUnknown(), const Twine &Name="")
Definition: LoopVectorizationPlanner.h:260

llvm::VPBuilder::createFCmp
VPInstruction * createFCmp(CmpInst::Predicate Pred, VPValue *A, VPValue *B, DebugLoc DL=DebugLoc::getUnknown(), const Twine &Name="")
Create a new FCmp VPInstruction with predicate Pred and operands A and B.
Definition: LoopVectorizationPlanner.h:243

llvm::VPBuilder::createPtrAdd
VPInstruction * createPtrAdd(VPValue *Ptr, VPValue *Offset, DebugLoc DL=DebugLoc::getUnknown(), const Twine &Name="")
Definition: LoopVectorizationPlanner.h:252

llvm::VPBuilder::createOverflowingOp
VPInstruction * createOverflowingOp(unsigned Opcode, ArrayRef< VPValue * > Operands, VPRecipeWithIRFlags::WrapFlagsTy WrapFlags, DebugLoc DL=DebugLoc::getUnknown(), const Twine &Name="")
Definition: LoopVectorizationPlanner.h:181

llvm::VPBuilder::getToInsertAfter
static VPBuilder getToInsertAfter(VPRecipeBase *R)
Create a VPBuilder to insert after R.
Definition: LoopVectorizationPlanner.h:90

llvm::VPBuilder::createNaryOp
VPInstruction * createNaryOp(unsigned Opcode, ArrayRef< VPValue * > Operands, DebugLoc DL, const Twine &Name="")
Definition: LoopVectorizationPlanner.h:161

llvm::VPBuilder::VPBuilder
VPBuilder(VPRecipeBase *InsertPt)
Definition: LoopVectorizationPlanner.h:74

llvm::VPBuilder::createScalarPhi
VPPhi * createScalarPhi(ArrayRef< VPValue * > IncomingValues, DebugLoc DL, const Twine &Name="")
Definition: LoopVectorizationPlanner.h:276

llvm::VPBuilder::createWidenCast
VPWidenCastRecipe * createWidenCast(Instruction::CastOps Opcode, VPValue *Op, Type *ResultTy)
Definition: LoopVectorizationPlanner.h:323

llvm::VPBuilder::createICmp
VPInstruction * createICmp(CmpInst::Predicate Pred, VPValue *A, VPValue *B, DebugLoc DL=DebugLoc::getUnknown(), const Twine &Name="")
Create a new ICmp VPInstruction with predicate Pred and operands A and B.
Definition: LoopVectorizationPlanner.h:232

llvm::VPBuilder::clearInsertionPoint
void clearInsertionPoint()
Clear the insertion point: created instructions will not be inserted into a block.
Definition: LoopVectorizationPlanner.h:81

llvm::VPBuilder::createAnd
VPInstruction * createAnd(VPValue *LHS, VPValue *RHS, DebugLoc DL=DebugLoc::getUnknown(), const Twine &Name="")
Definition: LoopVectorizationPlanner.h:196

llvm::VPBuilder::createNaryOp
VPInstruction * createNaryOp(unsigned Opcode, ArrayRef< VPValue * > Operands, Instruction *Inst=nullptr, const Twine &Name="")
Create an N-ary operation with Opcode, Operands and set Inst as its underlying Instruction.
Definition: LoopVectorizationPlanner.h:151

llvm::VPBuilder::createNaryOp
VPInstruction * createNaryOp(unsigned Opcode, ArrayRef< VPValue * > Operands, Type *ResultTy, const VPIRFlags &Flags={}, DebugLoc DL=DebugLoc::getUnknown(), const Twine &Name="")
Definition: LoopVectorizationPlanner.h:173

llvm::VPBuilder::VPBuilder
VPBuilder()=default

llvm::VPBuilder::createNaryOp
VPInstruction * createNaryOp(unsigned Opcode, ArrayRef< VPValue * > Operands, const VPIRFlags &Flags, DebugLoc DL=DebugLoc::getUnknown(), const Twine &Name="")
Definition: LoopVectorizationPlanner.h:165

llvm::VPBuilder::createScalarCast
VPInstruction * createScalarCast(Instruction::CastOps Opcode, VPValue *Op, Type *ResultTy, DebugLoc DL)
Definition: LoopVectorizationPlanner.h:306

llvm::VPBuilder::createExpandSCEV
VPExpandSCEVRecipe * createExpandSCEV(const SCEV *Expr)
Definition: LoopVectorizationPlanner.h:337

llvm::VPBuilder::VPBuilder
VPBuilder(VPBasicBlock *TheBB, VPBasicBlock::iterator IP)
Definition: LoopVectorizationPlanner.h:75

llvm::VPBuilder::createWidePtrAdd
VPInstruction * createWidePtrAdd(VPValue *Ptr, VPValue *Offset, DebugLoc DL=DebugLoc::getUnknown(), const Twine &Name="")
Definition: LoopVectorizationPlanner.h:268

llvm::VPBuilder::setInsertPoint
void setInsertPoint(VPBasicBlock *TheBB)
This specifies that created VPInstructions should be appended to the end of the specified block.
Definition: LoopVectorizationPlanner.h:126

llvm::VPDerivedIVRecipe
A recipe for converting the input IV value to the corresponding value of an IV with different s...
Definition: VPlan.h:3460

llvm::VPExpandSCEVRecipe
Recipe to expand a SCEV expression.
Definition: VPlan.h:3258

llvm::VPIRFlags
Class to record and manage LLVM IR flags.
Definition: VPlan.h:596

llvm::VPInstructionWithType
A specialization of VPInstruction augmenting it with a dedicated result type, to be used when the opc...
Definition: VPlan.h:1172

llvm::VPInstruction
This is a concrete Recipe that models a single VPlan-level instruction.
Definition: VPlan.h:967

llvm::VPInstruction::PtrAdd
@ PtrAdd
Definition: VPlan.h:1011

llvm::VPInstruction::WidePtrAdd
@ WidePtrAdd
Definition: VPlan.h:1014

llvm::VPInstruction::LogicalAnd
@ LogicalAnd
Definition: VPlan.h:1007

llvm::VPInstruction::VScale
@ VScale
Returns the value for vscale.
Definition: VPlan.h:1045

llvm::VPInstruction::Not
@ Not
Definition: VPlan.h:976

llvm::VPRecipeBase
VPRecipeBase is a base class modeling a sequence of one or more output IR instructions.
Definition: VPlan.h:391

llvm::VPRecipeBase::getParent
VPBasicBlock * getParent()
Definition: VPlan.h:412

llvm::VPRecipeBuilder
Helper class to create VPRecipes from IR instructions.
Definition: VPRecipeBuilder.h:47

llvm::VPScalarIVStepsRecipe
A recipe for handling phi nodes of integer and floating-point inductions, producing their scalar valu...
Definition: VPlan.h:3529

llvm::VPValue
Definition: VPlanValue.h:48

llvm::VPValue::setUnderlyingValue
void setUnderlyingValue(Value *Val)
Definition: VPlanValue.h:184

llvm::VPWidenCastRecipe
VPWidenCastRecipe is a recipe to create vector cast instructions.
Definition: VPlan.h:1467

llvm::VPlan
VPlan models a candidate for vectorization, encoding various decisions taken to produce efficient outp...
Definition: VPlan.h:3930

llvm::VPlan::getOrAddLiveIn
VPValue * getOrAddLiveIn(Value *V)
Gets the live-in VPValue for V or adds a new live-in (if none exists yet) for V.
Definition: VPlan.h:4181

llvm::details::FixedOrScalableQuantity::isScalable
constexpr bool isScalable() const
Returns whether the quantity is scaled by a runtime quantity (vscale).
Definition: TypeSize.h:172

llvm::ilist_node_impl::getIterator
self_iterator getIterator()
Definition: ilist_node.h:134

llvm::raw_ostream
This class implements an extremely fast bulk output stream that can only output to a stream.
Definition: raw_ostream.h:53

llvm::IRSimilarity::Legal
@ Legal
Definition: IRSimilarityIdentifier.h:77

llvm::cl::opt< bool >
template class LLVM_TEMPLATE_ABI opt< bool >
Definition: CommandLine.cpp:79

llvm::cl::opt< unsigned >
template class LLVM_TEMPLATE_ABI opt< unsigned >
Definition: CommandLine.cpp:82

llvm
This is an optimization pass for GlobalISel generic memory operations.
Definition: AddressRanges.h:18

llvm::Offset
@ Offset
Definition: DWP.cpp:477

llvm::any_of
bool any_of(R &&range, UnaryPredicate P)
Provide wrappers to std::any_of which take ranges instead of having to pass begin/end explicitly.
Definition: STLExtras.h:1751

llvm::VPlanPtr
std::unique_ptr< VPlan > VPlanPtr
Definition: VPlan.h:77

llvm::ForceTargetInstructionCost
cl::opt< unsigned > ForceTargetInstructionCost

llvm::Op
DWARFExpression::Operation Op
Definition: DWARFExpressionPrinter.cpp:22

llvm::EnableVPlanNativePath
cl::opt< bool > EnableVPlanNativePath
Definition: VPlan.cpp:55

llvm::FixedScalableVFPair
A class that represents two vectorization factors (initialized with 0 by default).
Definition: LoopVectorizationPlanner.h:406

llvm::FixedScalableVFPair::FixedVF
ElementCount FixedVF
Definition: LoopVectorizationPlanner.h:407

llvm::FixedScalableVFPair::ScalableVF
ElementCount ScalableVF
Definition: LoopVectorizationPlanner.h:408

llvm::FixedScalableVFPair::FixedScalableVFPair
FixedScalableVFPair(const ElementCount &FixedVF, const ElementCount &ScalableVF)
Definition: LoopVectorizationPlanner.h:416

llvm::FixedScalableVFPair::FixedScalableVFPair
FixedScalableVFPair(const ElementCount &Max)
Definition: LoopVectorizationPlanner.h:413

llvm::FixedScalableVFPair::hasVector
bool hasVector() const
Definition: LoopVectorizationPlanner.h:429

llvm::FixedScalableVFPair::getNone
static FixedScalableVFPair getNone()
Definition: LoopVectorizationPlanner.h:423

llvm::FixedScalableVFPair::FixedScalableVFPair
FixedScalableVFPair()
Definition: LoopVectorizationPlanner.h:410

llvm::VFRange
A range of powers-of-2 vectorization factors with fixed start and adjustable end.
Definition: VPlanHelpers.h:71

llvm::VPCostContext
Struct to hold various analysis needed for cost computations.
Definition: VPlanHelpers.h:344

llvm::VPIRFlags::DisjointFlagsTy
Definition: VPlan.h:624

llvm::VPIRFlags::WrapFlagsTy
Definition: VPlan.h:610

llvm::VPPhi
Definition: VPlan.h:1289

llvm::VectorizationFactor
TODO: The following VectorizationFactor was pulled out of LoopVectorizationCostModel class.
Definition: LoopVectorizationPlanner.h:369

llvm::VectorizationFactor::Cost
InstructionCost Cost
Cost of the loop with that width.
Definition: LoopVectorizationPlanner.h:374

llvm::VectorizationFactor::MinProfitableTripCount
ElementCount MinProfitableTripCount
The minimum trip count required to make vectorization profitable, e.g.
Definition: LoopVectorizationPlanner.h:381

llvm::VectorizationFactor::operator==
bool operator==(const VectorizationFactor &rhs) const
Definition: LoopVectorizationPlanner.h:392

llvm::VectorizationFactor::Width
ElementCount Width
Vector width with best cost.
Definition: LoopVectorizationPlanner.h:371

llvm::VectorizationFactor::ScalarCost
InstructionCost ScalarCost
Cost of the scalar loop.
Definition: LoopVectorizationPlanner.h:377

llvm::VectorizationFactor::operator!=
bool operator!=(const VectorizationFactor &rhs) const
Definition: LoopVectorizationPlanner.h:396

llvm::VectorizationFactor::Disabled
static VectorizationFactor Disabled()
Width 1 means no vectorization, cost 0 means uncomputed cost.
Definition: LoopVectorizationPlanner.h:388

llvm::VectorizationFactor::VectorizationFactor
VectorizationFactor(ElementCount Width, InstructionCost Cost, InstructionCost ScalarCost)
Definition: LoopVectorizationPlanner.h:383