LLVM: lib/Analysis/Delinearization.cpp Source File

//===---- Delinearization.cpp - MultiDimensional Index Delinearization ----===//

//

// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.

// See https://llvm.org/LICENSE.txt for license information.

// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception

//

//===----------------------------------------------------------------------===//

//

// This implements an analysis pass that tries to delinearize all GEP

// instructions in all loops using the SCEV analysis functionality. This pass is

// only used for testing purposes: if your pass needs delinearization, please

// use the on-demand SCEVAddRecExpr::delinearize() function.

//

//===----------------------------------------------------------------------===//


#include "llvm/Analysis/Delinearization.h"

#include "llvm/Analysis/LoopInfo.h"

#include "llvm/Analysis/ScalarEvolution.h"

#include "llvm/Analysis/ScalarEvolutionDivision.h"

#include "llvm/Analysis/ScalarEvolutionExpressions.h"

#include "llvm/IR/Constants.h"

#include "llvm/IR/DerivedTypes.h"

#include "llvm/IR/Function.h"

#include "llvm/IR/InstIterator.h"

#include "llvm/IR/Instructions.h"

#include "llvm/IR/PassManager.h"

#include "llvm/Support/CommandLine.h"

#include "llvm/Support/Debug.h"

#include "llvm/Support/raw_ostream.h"


using namespace llvm;


#define DL_NAME "delinearize"

#define DEBUG_TYPE DL_NAME


static cl::opt<bool> UseFixedSizeArrayHeuristic(

    "delinearize-use-fixed-size-array-heuristic", cl::init(false), cl::Hidden,

    cl::desc("When printing analysis, use the heuristic for fixed-size arrays "

             "if the default delinearizetion fails."));


// Return true when S contains at least an undef value.

static inline bool containsUndefs(const SCEV *S) {

  return SCEVExprContains(S, [](const SCEV *S) {

    if (const auto *SU = dyn_cast<SCEVUnknown>(S))

      return isa<UndefValue>(SU->getValue());

    return false;

  });

}


namespace {


// Collect all steps of SCEV expressions.

struct SCEVCollectStrides {

  ScalarEvolution &SE;

  SmallVectorImpl<const SCEV *> &Strides;


  SCEVCollectStrides(ScalarEvolution &SE, SmallVectorImpl<const SCEV *> &S)

      : SE(SE), Strides(S) {}


  bool follow(const SCEV *S) {

    if (const SCEVAddRecExpr *AR = dyn_cast<SCEVAddRecExpr>(S))

      Strides.push_back(AR->getStepRecurrence(SE));

    return true;

  }


  bool isDone() const { return false; }

};


// Collect all SCEVUnknown and SCEVMulExpr expressions.

struct SCEVCollectTerms {

  SmallVectorImpl<const SCEV *> &Terms;


  SCEVCollectTerms(SmallVectorImpl<const SCEV *> &T) : Terms(T) {}


  bool follow(const SCEV *S) {

    if (isa<SCEVUnknown>(S) || isa<SCEVMulExpr>(S) ||

        isa<SCEVSignExtendExpr>(S)) {

      if (!containsUndefs(S))

        Terms.push_back(S);


      // Stop recursion: once we collected a term, do not walk its operands.

      return false;

    }


    // Keep looking.

    return true;

  }


  bool isDone() const { return false; }

};


// Check if a SCEV contains an AddRecExpr.

struct SCEVHasAddRec {

  bool &ContainsAddRec;


  SCEVHasAddRec(bool &ContainsAddRec) : ContainsAddRec(ContainsAddRec) {

    ContainsAddRec = false;

  }


  bool follow(const SCEV *S) {

    if (isa<SCEVAddRecExpr>(S)) {

      ContainsAddRec = true;


      // Stop recursion: once we collected a term, do not walk its operands.

      return false;

    }


    // Keep looking.

    return true;

  }


  bool isDone() const { return false; }

};


// Find factors that are multiplied with an expression that (possibly as a

// subexpression) contains an AddRecExpr. In the expression:

//

//  8 * (100 +  %p * %q * (%a + {0, +, 1}_loop))

//

// "%p * %q" are factors multiplied by the expression "(%a + {0, +, 1}_loop)"

// that contains the AddRec {0, +, 1}_loop. %p * %q are likely to be array size

// parameters as they form a product with an induction variable.

//

// This collector expects all array size parameters to be in the same MulExpr.

// It might be necessary to later add support for collecting parameters that are

// spread over different nested MulExpr.

struct SCEVCollectAddRecMultiplies {

  SmallVectorImpl<const SCEV *> &Terms;

  ScalarEvolution &SE;


  SCEVCollectAddRecMultiplies(SmallVectorImpl<const SCEV *> &T,

                              ScalarEvolution &SE)

      : Terms(T), SE(SE) {}


  bool follow(const SCEV *S) {

    if (auto *Mul = dyn_cast<SCEVMulExpr>(S)) {

      bool HasAddRec = false;

      SmallVector<const SCEV *, 0> Operands;

      for (const SCEV *Op : Mul->operands()) {

        const SCEVUnknown *Unknown = dyn_cast<SCEVUnknown>(Op);

        if (Unknown && !isa<CallInst>(Unknown->getValue())) {

          Operands.push_back(Op);

        } else if (Unknown) {

          HasAddRec = true;

        } else {

          bool ContainsAddRec = false;

          SCEVHasAddRec ContiansAddRec(ContainsAddRec);

          visitAll(Op, ContiansAddRec);

          HasAddRec |= ContainsAddRec;

        }

      }

      if (Operands.size() == 0)

        return true;


      if (!HasAddRec)

        return false;


      Terms.push_back(SE.getMulExpr(Operands));

      // Stop recursion: once we collected a term, do not walk its operands.

      return false;

    }


    // Keep looking.

    return true;

  }


  bool isDone() const { return false; }

};


} // end anonymous namespace


/// Find parametric terms in this SCEVAddRecExpr. We first for parameters in

/// two places:

///   1) The strides of AddRec expressions.

///   2) Unknowns that are multiplied with AddRec expressions.

void llvm::collectParametricTerms(ScalarEvolution &SE, const SCEV *Expr,

                                  SmallVectorImpl<const SCEV *> &Terms) {

  SmallVector<const SCEV *, 4> Strides;

  SCEVCollectStrides StrideCollector(SE, Strides);

  visitAll(Expr, StrideCollector);


  LLVM_DEBUG({

    dbgs() << "Strides:\n";

    for (const SCEV *S : Strides)

      dbgs() << *S << "\n";

  });


  for (const SCEV *S : Strides) {

    SCEVCollectTerms TermCollector(Terms);

    visitAll(S, TermCollector);

  }


  LLVM_DEBUG({

    dbgs() << "Terms:\n";

    for (const SCEV *T : Terms)

      dbgs() << *T << "\n";

  });


  SCEVCollectAddRecMultiplies MulCollector(Terms, SE);

  visitAll(Expr, MulCollector);

}


static bool findArrayDimensionsRec(ScalarEvolution &SE,

                                   SmallVectorImpl<const SCEV *> &Terms,

                                   SmallVectorImpl<const SCEV *> &Sizes) {

  int Last = Terms.size() - 1;

  const SCEV *Step = Terms[Last];


  // End of recursion.

  if (Last == 0) {

    if (const SCEVMulExpr *M = dyn_cast<SCEVMulExpr>(Step)) {

      SmallVector<const SCEV *, 2> Qs;

      for (const SCEV *Op : M->operands())

        if (!isa<SCEVConstant>(Op))

          Qs.push_back(Op);


      Step = SE.getMulExpr(Qs);

    }


    Sizes.push_back(Step);

    return true;

  }


  for (const SCEV *&Term : Terms) {

    // Normalize the terms before the next call to findArrayDimensionsRec.

    const SCEV *Q, *R;

    SCEVDivision::divide(SE, Term, Step, &Q, &R);


    // Bail out when GCD does not evenly divide one of the terms.

    if (!R->isZero())

      return false;


    Term = Q;

  }


  // Remove all SCEVConstants.

  erase_if(Terms, [](const SCEV *E) { return isa<SCEVConstant>(E); });


  if (Terms.size() > 0)

    if (!findArrayDimensionsRec(SE, Terms, Sizes))

      return false;


  Sizes.push_back(Step);

  return true;

}


// Returns true when one of the SCEVs of Terms contains a SCEVUnknown parameter.

static inline bool containsParameters(SmallVectorImpl<const SCEV *> &Terms) {

  for (const SCEV *T : Terms)

    if (SCEVExprContains(T, [](const SCEV *S) { return isa<SCEVUnknown>(S); }))

      return true;


  return false;

}


// Return the number of product terms in S.

static inline int numberOfTerms(const SCEV *S) {

  if (const SCEVMulExpr *Expr = dyn_cast<SCEVMulExpr>(S))

    return Expr->getNumOperands();

  return 1;

}


static const SCEV *removeConstantFactors(ScalarEvolution &SE, const SCEV *T) {

  if (isa<SCEVConstant>(T))

    return nullptr;


  if (isa<SCEVUnknown>(T))

    return T;


  if (const SCEVMulExpr *M = dyn_cast<SCEVMulExpr>(T)) {

    SmallVector<const SCEV *, 2> Factors;

    for (const SCEV *Op : M->operands())

      if (!isa<SCEVConstant>(Op))

        Factors.push_back(Op);


    return SE.getMulExpr(Factors);

  }


  return T;

}


void llvm::findArrayDimensions(ScalarEvolution &SE,

                               SmallVectorImpl<const SCEV *> &Terms,

                               SmallVectorImpl<const SCEV *> &Sizes,

                               const SCEV *ElementSize) {

  if (Terms.size() < 1 || !ElementSize)

    return;


  // Early return when Terms do not contain parameters: we do not delinearize

  // non parametric SCEVs.

  if (!containsParameters(Terms))

    return;


  LLVM_DEBUG({

    dbgs() << "Terms:\n";

    for (const SCEV *T : Terms)

      dbgs() << *T << "\n";

  });


  // Remove duplicates.

  array_pod_sort(Terms.begin(), Terms.end());

  Terms.erase(llvm::unique(Terms), Terms.end());


  // Put larger terms first.

  llvm::sort(Terms, [](const SCEV *LHS, const SCEV *RHS) {

    return numberOfTerms(LHS) > numberOfTerms(RHS);

  });


  // Try to divide all terms by the element size. If term is not divisible by

  // element size, proceed with the original term.

  for (const SCEV *&Term : Terms) {

    const SCEV *Q, *R;

    SCEVDivision::divide(SE, Term, ElementSize, &Q, &R);

    if (!Q->isZero())

      Term = Q;

  }


  SmallVector<const SCEV *, 4> NewTerms;


  // Remove constant factors.

  for (const SCEV *T : Terms)

    if (const SCEV *NewT = removeConstantFactors(SE, T))

      NewTerms.push_back(NewT);


  LLVM_DEBUG({

    dbgs() << "Terms after sorting:\n";

    for (const SCEV *T : NewTerms)

      dbgs() << *T << "\n";

  });


  if (NewTerms.empty() || !findArrayDimensionsRec(SE, NewTerms, Sizes)) {

    Sizes.clear();

    return;

  }


  // The last element to be pushed into Sizes is the size of an element.

  Sizes.push_back(ElementSize);


  LLVM_DEBUG({

    dbgs() << "Sizes:\n";

    for (const SCEV *S : Sizes)

      dbgs() << *S << "\n";

  });

}


void llvm::computeAccessFunctions(ScalarEvolution &SE, const SCEV *Expr,

                                  SmallVectorImpl<const SCEV *> &Subscripts,

                                  SmallVectorImpl<const SCEV *> &Sizes) {

  // Early exit in case this SCEV is not an affine multivariate function.

  if (Sizes.empty())

    return;


  if (auto *AR = dyn_cast<SCEVAddRecExpr>(Expr))

    if (!AR->isAffine())

      return;


  const SCEV *Res = Expr;

  int Last = Sizes.size() - 1;

  for (int i = Last; i >= 0; i--) {

    const SCEV *Q, *R;

    SCEVDivision::divide(SE, Res, Sizes[i], &Q, &R);


    LLVM_DEBUG({

      dbgs() << "Res: " << *Res << "\n";

      dbgs() << "Sizes[i]: " << *Sizes[i] << "\n";

      dbgs() << "Res divided by Sizes[i]:\n";

      dbgs() << "Quotient: " << *Q << "\n";

      dbgs() << "Remainder: " << *R << "\n";

    });


    Res = Q;


    // Do not record the last subscript corresponding to the size of elements in

    // the array.

    if (i == Last) {


      // Bail out if the byte offset is non-zero.

      if (!R->isZero()) {

        Subscripts.clear();

        Sizes.clear();

        return;

      }


      continue;

    }


    // Record the access function for the current subscript.

    Subscripts.push_back(R);

  }


  // Also push in last position the remainder of the last division: it will be

  // the access function of the innermost dimension.

  Subscripts.push_back(Res);


  std::reverse(Subscripts.begin(), Subscripts.end());


  LLVM_DEBUG({

    dbgs() << "Subscripts:\n";

    for (const SCEV *S : Subscripts)

      dbgs() << *S << "\n";

  });

}


/// Splits the SCEV into two vectors of SCEVs representing the subscripts and

/// sizes of an array access. Returns the remainder of the delinearization that

/// is the offset start of the array.  The SCEV->delinearize algorithm computes

/// the multiples of SCEV coefficients: that is a pattern matching of sub

/// expressions in the stride and base of a SCEV corresponding to the

/// computation of a GCD (greatest common divisor) of base and stride.  When

/// SCEV->delinearize fails, it returns the SCEV unchanged.

///

/// For example: when analyzing the memory access A[i][j][k] in this loop nest

///

///  void foo(long n, long m, long o, double A[n][m][o]) {

///

///    for (long i = 0; i < n; i++)

///      for (long j = 0; j < m; j++)

///        for (long k = 0; k < o; k++)

///          A[i][j][k] = 1.0;

///  }

///

/// the delinearization input is the following AddRec SCEV:

///

///  AddRec: {{{%A,+,(8 * %m * %o)}<%for.i>,+,(8 * %o)}<%for.j>,+,8}<%for.k>

///

/// From this SCEV, we are able to say that the base offset of the access is %A

/// because it appears as an offset that does not divide any of the strides in

/// the loops:

///

///  CHECK: Base offset: %A

///

/// and then SCEV->delinearize determines the size of some of the dimensions of

/// the array as these are the multiples by which the strides are happening:

///

///  CHECK: ArrayDecl[UnknownSize][%m][%o] with elements of sizeof(double)

///  bytes.

///

/// Note that the outermost dimension remains of UnknownSize because there are

/// no strides that would help identifying the size of the last dimension: when

/// the array has been statically allocated, one could compute the size of that

/// dimension by dividing the overall size of the array by the size of the known

/// dimensions: %m * %o * 8.

///

/// Finally delinearize provides the access functions for the array reference

/// that does correspond to A[i][j][k] of the above C testcase:

///

///  CHECK: ArrayRef[{0,+,1}<%for.i>][{0,+,1}<%for.j>][{0,+,1}<%for.k>]

///

/// The testcases are checking the output of a function pass:

/// DelinearizationPass that walks through all loads and stores of a function

/// asking for the SCEV of the memory access with respect to all enclosing

/// loops, calling SCEV->delinearize on that and printing the results.

void llvm::delinearize(ScalarEvolution &SE, const SCEV *Expr,

                       SmallVectorImpl<const SCEV *> &Subscripts,

                       SmallVectorImpl<const SCEV *> &Sizes,

                       const SCEV *ElementSize) {

  // First step: collect parametric terms.

  SmallVector<const SCEV *, 4> Terms;

  collectParametricTerms(SE, Expr, Terms);


  if (Terms.empty())

    return;


  // Second step: find subscript sizes.

  findArrayDimensions(SE, Terms, Sizes, ElementSize);


  if (Sizes.empty())

    return;


  // Third step: compute the access functions for each subscript.

  computeAccessFunctions(SE, Expr, Subscripts, Sizes);


  if (Subscripts.empty())

    return;


  LLVM_DEBUG({

    dbgs() << "succeeded to delinearize " << *Expr << "\n";

    dbgs() << "ArrayDecl[UnknownSize]";

    for (const SCEV *S : Sizes)

      dbgs() << "[" << *S << "]";


    dbgs() << "\nArrayRef";

    for (const SCEV *S : Subscripts)

      dbgs() << "[" << *S << "]";

    dbgs() << "\n";

  });

}


static std::optional<APInt> tryIntoAPInt(const SCEV *S) {

  if (const auto *Const = dyn_cast<SCEVConstant>(S))

    return Const->getAPInt();

  return std::nullopt;

}


/// Collects the absolute values of constant steps for all induction variables.

/// Returns true if we can prove that all step recurrences are constants and \p

/// Expr is divisible by \p ElementSize. Each step recurrence is stored in \p

/// Steps after divided by \p ElementSize.

static bool collectConstantAbsSteps(ScalarEvolution &SE, const SCEV *Expr,

                                    SmallVectorImpl<uint64_t> &Steps,

                                    uint64_t ElementSize) {

  // End of recursion. The constant value also must be a multiple of

  // ElementSize.

  if (const auto *Const = dyn_cast<SCEVConstant>(Expr)) {

    const uint64_t Mod = Const->getAPInt().urem(ElementSize);

    return Mod == 0;

  }


  const SCEVAddRecExpr *AR = dyn_cast<SCEVAddRecExpr>(Expr);

  if (!AR || !AR->isAffine())

    return false;


  const SCEV *Step = AR->getStepRecurrence(SE);

  std::optional<APInt> StepAPInt = tryIntoAPInt(Step);

  if (!StepAPInt)

    return false;


  APInt Q;

  uint64_t R;

  APInt::udivrem(StepAPInt->abs(), ElementSize, Q, R);

  if (R != 0)

    return false;


  // Bail out when the step is too large.

  std::optional<uint64_t> StepVal = Q.tryZExtValue();

  if (!StepVal)

    return false;


  Steps.push_back(*StepVal);

  return collectConstantAbsSteps(SE, AR->getStart(), Steps, ElementSize);

}


bool llvm::findFixedSizeArrayDimensions(ScalarEvolution &SE, const SCEV *Expr,

                                        SmallVectorImpl<uint64_t> &Sizes,

                                        const SCEV *ElementSize) {

  if (!ElementSize)

    return false;


  std::optional<APInt> ElementSizeAPInt = tryIntoAPInt(ElementSize);

  if (!ElementSizeAPInt || *ElementSizeAPInt == 0)

    return false;


  std::optional<uint64_t> ElementSizeConst = ElementSizeAPInt->tryZExtValue();


  // Early exit when ElementSize is not a positive constant.

  if (!ElementSizeConst)

    return false;


  if (!collectConstantAbsSteps(SE, Expr, Sizes, *ElementSizeConst) ||

      Sizes.empty()) {

    Sizes.clear();

    return false;

  }


  // At this point, Sizes contains the absolute step recurrences for all

  // induction variables. Each step recurrence must be a multiple of the size of

  // the array element. Assuming that the each value represents the size of an

  // array for each dimension, attempts to restore the length of each dimension

  // by dividing the step recurrence by the next smaller value. For example, if

  // we have the following AddRec SCEV:

  //

  //   AddRec: {{{0,+,2048}<%for.i>,+,256}<%for.j>,+,8}<%for.k> (ElementSize=8)

  //

  // Then Sizes will become [256, 32, 1] after sorted. We don't know the size of

  // the outermost dimension, the next dimension will be computed as 256 / 32 =

  // 8, and the last dimension will be computed as 32 / 1 = 32. Thus it results

  // in like Arr[UnknownSize][8][32] with elements of size 8 bytes, where Arr is

  // a base pointer.

  //

  // TODO: Catch more cases, e.g., when a step recurrence is not divisible by

  // the next smaller one, like A[i][3*j].

  llvm::sort(Sizes.rbegin(), Sizes.rend());

  Sizes.erase(llvm::unique(Sizes), Sizes.end());


  // The last element in Sizes should be ElementSize. At this point, all values

  // in Sizes are assumed to be divided by ElementSize, so replace it with 1.

  assert(Sizes.back() != 0 && "Unexpected zero size in Sizes.");

  Sizes.back() = 1;


  for (unsigned I = 0; I + 1 < Sizes.size(); I++) {

    uint64_t PrevSize = Sizes[I + 1];

    if (Sizes[I] % PrevSize) {

      Sizes.clear();

      return false;

    }

    Sizes[I] /= PrevSize;

  }


  // Finally, the last element in Sizes should be ElementSize.

  Sizes.back() = *ElementSizeConst;

  return true;

}


/// Splits the SCEV into two vectors of SCEVs representing the subscripts and

/// sizes of an array access, assuming that the array is a fixed size array.

///

/// E.g., if we have the code like as follows:

///

///  double A[42][8][32];

///  for i

///    for j

///      for k

///        use A[i][j][k]

///

/// The access function will be represented as an AddRec SCEV like:

///

///  AddRec: {{{0,+,2048}<%for.i>,+,256}<%for.j>,+,8}<%for.k> (ElementSize=8)

///

/// Then findFixedSizeArrayDimensions infers the size of each dimension of the

/// array based on the fact that the value of the step recurrence is a multiple

/// of the size of the corresponding array element. In the above example, it

/// results in the following:

///

///  CHECK: ArrayDecl[UnknownSize][8][32] with elements of 8 bytes.

///

/// Finally each subscript will be computed as follows:

///

///  CHECK: ArrayRef[{0,+,1}<%for.i>][{0,+,1}<%for.j>][{0,+,1}<%for.k>]

///

/// Note that this function doesn't check the range of possible values for each

/// subscript, so the caller should perform additional boundary checks if

/// necessary.

///

/// Also note that this function doesn't guarantee that the original array size

/// is restored "correctly". For example, in the following case:

///

///  double A[42][4][64];

///  double B[42][8][32];

///  for i

///    for j

///      for k

///        use A[i][j][k]

///        use B[i][2*j][k]

///

/// The access function for both accesses will be the same:

///

///  AddRec: {{{0,+,2048}<%for.i>,+,512}<%for.j>,+,8}<%for.k> (ElementSize=8)

///

/// The array sizes for both A and B will be computed as

/// ArrayDecl[UnknownSize][4][64], which matches for A, but not for B.

///

/// TODO: At the moment, this function can handle only simple cases. For

/// example, we cannot handle a case where a step recurrence is not divisible

/// by the next smaller step recurrence, e.g., A[i][3*j].

bool llvm::delinearizeFixedSizeArray(ScalarEvolution &SE, const SCEV *Expr,

                                     SmallVectorImpl<const SCEV *> &Subscripts,

                                     SmallVectorImpl<const SCEV *> &Sizes,

                                     const SCEV *ElementSize) {


  // First step: find the fixed array size.

  SmallVector<uint64_t, 4> ConstSizes;

  if (!findFixedSizeArrayDimensions(SE, Expr, ConstSizes, ElementSize)) {

    Sizes.clear();

    return false;

  }


  // Convert the constant size to SCEV.

  for (uint64_t Size : ConstSizes)

    Sizes.push_back(SE.getConstant(Expr->getType(), Size));


  // Second step: compute the access functions for each subscript.

  computeAccessFunctions(SE, Expr, Subscripts, Sizes);


  return !Subscripts.empty();

}


bool llvm::getIndexExpressionsFromGEP(ScalarEvolution &SE,

                                      const GetElementPtrInst *GEP,

                                      SmallVectorImpl<const SCEV *> &Subscripts,

                                      SmallVectorImpl<int> &Sizes) {

  assert(Subscripts.empty() && Sizes.empty() &&

         "Expected output lists to be empty on entry to this function.");

  assert(GEP && "getIndexExpressionsFromGEP called with a null GEP");

  Type *Ty = nullptr;

  bool DroppedFirstDim = false;

  for (unsigned i = 1; i < GEP->getNumOperands(); i++) {

    const SCEV *Expr = SE.getSCEV(GEP->getOperand(i));

    if (i == 1) {

      Ty = GEP->getSourceElementType();

      if (auto *Const = dyn_cast<SCEVConstant>(Expr))

        if (Const->getValue()->isZero()) {

          DroppedFirstDim = true;

          continue;

        }

      Subscripts.push_back(Expr);

      continue;

    }


    auto *ArrayTy = dyn_cast<ArrayType>(Ty);

    if (!ArrayTy) {

      Subscripts.clear();

      Sizes.clear();

      return false;

    }


    Subscripts.push_back(Expr);

    if (!(DroppedFirstDim && i == 2))

      Sizes.push_back(ArrayTy->getNumElements());


    Ty = ArrayTy->getElementType();

  }

  return !Subscripts.empty();

}


bool llvm::tryDelinearizeFixedSizeImpl(

    ScalarEvolution *SE, Instruction *Inst, const SCEV *AccessFn,

    SmallVectorImpl<const SCEV *> &Subscripts, SmallVectorImpl<int> &Sizes) {

  Value *SrcPtr = getLoadStorePointerOperand(Inst);


  // Check the simple case where the array dimensions are fixed size.

  auto *SrcGEP = dyn_cast<GetElementPtrInst>(SrcPtr);

  if (!SrcGEP)

    return false;


  getIndexExpressionsFromGEP(*SE, SrcGEP, Subscripts, Sizes);


  // Check that the two size arrays are non-empty and equal in length and

  // value.

  // TODO: it would be better to let the caller to clear Subscripts, similar

  // to how we handle Sizes.

  if (Sizes.empty() || Subscripts.size() <= 1) {

    Subscripts.clear();

    return false;

  }


  // Check that for identical base pointers we do not miss index offsets

  // that have been added before this GEP is applied.

  Value *SrcBasePtr = SrcGEP->getOperand(0)->stripPointerCasts();

  const SCEVUnknown *SrcBase =

      dyn_cast<SCEVUnknown>(SE->getPointerBase(AccessFn));

  if (!SrcBase || SrcBasePtr != SrcBase->getValue()) {

    Subscripts.clear();

    return false;

  }


  assert(Subscripts.size() == Sizes.size() + 1 &&

         "Expected equal number of entries in the list of size and "

         "subscript.");


  return true;

}


namespace {


void printDelinearization(raw_ostream &O, Function *F, LoopInfo *LI,

                          ScalarEvolution *SE) {

  O << "Printing analysis 'Delinearization' for function '" << F->getName()

    << "':";

  for (Instruction &Inst : instructions(F)) {

    // Only analyze loads and stores.

    if (!isa<StoreInst>(&Inst) && !isa<LoadInst>(&Inst))

      continue;


    const BasicBlock *BB = Inst.getParent();

    Loop *L = LI->getLoopFor(BB);

    // Only delinearize the memory access in the innermost loop.

    // Do not analyze memory accesses outside loops.

    if (!L)

      continue;


    const SCEV *AccessFn = SE->getSCEVAtScope(getPointerOperand(&Inst), L);


    const SCEVUnknown *BasePointer =

        dyn_cast<SCEVUnknown>(SE->getPointerBase(AccessFn));

    // Do not delinearize if we cannot find the base pointer.

    if (!BasePointer)

      break;

    AccessFn = SE->getMinusSCEV(AccessFn, BasePointer);


    O << "\n";

    O << "Inst:" << Inst << "\n";

    O << "In Loop with Header: " << L->getHeader()->getName() << "\n";

    O << "AccessFunction: " << *AccessFn << "\n";


    SmallVector<const SCEV *, 3> Subscripts, Sizes;


    auto IsDelinearizationFailed = [&]() {

      return Subscripts.size() == 0 || Sizes.size() == 0 ||

             Subscripts.size() != Sizes.size();

    };


    delinearize(*SE, AccessFn, Subscripts, Sizes, SE->getElementSize(&Inst));

    if (UseFixedSizeArrayHeuristic && IsDelinearizationFailed()) {

      Subscripts.clear();

      Sizes.clear();

      delinearizeFixedSizeArray(*SE, AccessFn, Subscripts, Sizes,

                                SE->getElementSize(&Inst));

    }


      if (IsDelinearizationFailed()) {

        O << "failed to delinearize\n";

        continue;

      }


      O << "Base offset: " << *BasePointer << "\n";

      O << "ArrayDecl[UnknownSize]";

      int Size = Subscripts.size();

      for (int i = 0; i < Size - 1; i++)

        O << "[" << *Sizes[i] << "]";

      O << " with elements of " << *Sizes[Size - 1] << " bytes.\n";


      O << "ArrayRef";

      for (int i = 0; i < Size; i++)

        O << "[" << *Subscripts[i] << "]";

      O << "\n";

  }

}


} // end anonymous namespace


DelinearizationPrinterPass::DelinearizationPrinterPass(raw_ostream &OS)

    : OS(OS) {}

PreservedAnalyses DelinearizationPrinterPass::run(Function &F,

                                                  FunctionAnalysisManager &AM) {

  printDelinearization(OS, &F, &AM.getResult<LoopAnalysis>(F),

                       &AM.getResult<ScalarEvolutionAnalysis>(F));

  return PreservedAnalyses::all();

}

assert
assert(UImm &&(UImm !=~static_cast< T >(0)) &&"Invalid immediate!")

instructions
Expand Atomic instructions
Definition: AtomicExpandPass.cpp:183

CommandLine.h

Constants.h
This file contains the declarations for the subclasses of Constant, which represent the different fla...

removeConstantFactors
static const SCEV * removeConstantFactors(ScalarEvolution &SE, const SCEV *T)
Definition: Delinearization.cpp:263

collectConstantAbsSteps
static bool collectConstantAbsSteps(ScalarEvolution &SE, const SCEV *Expr, SmallVectorImpl< uint64_t > &Steps, uint64_t ElementSize)
Collects the absolute values of constant steps for all induction variables.
Definition: Delinearization.cpp:499

UseFixedSizeArrayHeuristic
static cl::opt< bool > UseFixedSizeArrayHeuristic("delinearize-use-fixed-size-array-heuristic", cl::init(false), cl::Hidden, cl::desc("When printing analysis, use the heuristic for fixed-size arrays " "if the default delinearizetion fails."))

findArrayDimensionsRec
static bool findArrayDimensionsRec(ScalarEvolution &SE, SmallVectorImpl< const SCEV * > &Terms, SmallVectorImpl< const SCEV * > &Sizes)
Definition: Delinearization.cpp:203

containsUndefs
static bool containsUndefs(const SCEV *S)
Definition: Delinearization.cpp:42

tryIntoAPInt
static std::optional< APInt > tryIntoAPInt(const SCEV *S)
Definition: Delinearization.cpp:489

containsParameters
static bool containsParameters(SmallVectorImpl< const SCEV * > &Terms)
Definition: Delinearization.cpp:248

numberOfTerms
static int numberOfTerms(const SCEV *S)
Definition: Delinearization.cpp:257

Delinearization.h

DerivedTypes.h

Size
uint64_t Size
Definition: ELFObjHandler.cpp:81

GEP
Hexagon Common GEP
Definition: HexagonCommonGEP.cpp:164

Function.h

PassManager.h
This header defines various interfaces for pass management in LLVM.

InstIterator.h

Instructions.h

LoopInfo.h

F
#define F(x, y, z)
Definition: MD5.cpp:55

I
#define I(x, y, z)
Definition: MD5.cpp:58

Operands
mir Rename Register Operands
Definition: MIRNamerPass.cpp:74

Unknown
@ Unknown
Definition: NVPTXISelLowering.cpp:5389

Mod
if(auto Err=PB.parsePassPipeline(MPM, Passes)) return wrap(std MPM run * Mod
Definition: PassBuilderBindings.cpp:95

OS
raw_pwrite_stream & OS
Definition: SampleProfWriter.cpp:51

ScalarEvolutionDivision.h

ScalarEvolutionExpressions.h

ScalarEvolution.h

Debug.h

LLVM_DEBUG
#define LLVM_DEBUG(...)
Definition: Debug.h:119

RHS
Value * RHS
Definition: X86PartialReduction.cpp:74

LHS
Value * LHS
Definition: X86PartialReduction.cpp:73

Mul
BinaryOperator * Mul
Definition: X86PartialReduction.cpp:68

T

llvm::APInt
Class for arbitrary precision integers.
Definition: APInt.h:78

llvm::APInt::tryZExtValue
std::optional< uint64_t > tryZExtValue() const
Get zero extended value if possible.
Definition: APInt.h:1552

llvm::APInt::udivrem
static LLVM_ABI void udivrem(const APInt &LHS, const APInt &RHS, APInt &Quotient, APInt &Remainder)
Dual division/remainder interface.
Definition: APInt.cpp:1758

llvm::AnalysisManager
A container for analyses that lazily runs them and caches their results.
Definition: PassManager.h:255

llvm::AnalysisManager::getResult
PassT::Result & getResult(IRUnitT &IR, ExtraArgTs... ExtraArgs)
Get the result of an analysis pass for a given IR unit.
Definition: PassManager.h:412

llvm::BasicBlock
LLVM Basic Block Representation.
Definition: BasicBlock.h:62

llvm::BasicBlock::getParent
const Function * getParent() const
Return the enclosing method, or null if none.
Definition: BasicBlock.h:213

llvm::DWARFExpression::Operation
This class represents an Operation in the Expression.
Definition: DWARFExpression.h:33

llvm::Function
Definition: Function.h:64

llvm::GetElementPtrInst
an instruction for type-safe pointer arithmetic to access elements of arrays and structs
Definition: Instructions.h:949

llvm::Instruction
Definition: Instruction.h:69

llvm::LoopAnalysis
Analysis pass that exposes the LoopInfo for a function.
Definition: LoopInfo.h:570

llvm::LoopInfoBase::getLoopFor
LoopT * getLoopFor(const BlockT *BB) const
Return the inner most loop that BB lives in.
Definition: GenericLoopInfo.h:606

llvm::LoopInfo
Definition: LoopInfo.h:409

llvm::Loop
Represents a single loop in the control flow graph.
Definition: LoopInfo.h:40

llvm::PreservedAnalyses
A set of analyses that are preserved following a run of a transformation pass.
Definition: Analysis.h:112

llvm::PreservedAnalyses::all
static PreservedAnalyses all()
Construct a special preserved set that preserves all passes.
Definition: Analysis.h:118

llvm::SCEVAddRecExpr
This node represents a polynomial recurrence on the trip count of the specified loop.
Definition: ScalarEvolutionExpressions.h:348

llvm::SCEVAddRecExpr::getStart
const SCEV * getStart() const
Definition: ScalarEvolutionExpressions.h:359

llvm::SCEVAddRecExpr::getStepRecurrence
const SCEV * getStepRecurrence(ScalarEvolution &SE) const
Constructs and returns the recurrence indicating how much this expression steps by.
Definition: ScalarEvolutionExpressions.h:366

llvm::SCEVAddRecExpr::isAffine
bool isAffine() const
Return true if this represents an expression A + B*x where A and B are loop invariant values.
Definition: ScalarEvolutionExpressions.h:376

llvm::SCEVMulExpr
This node represents multiplication of some number of SCEVs.
Definition: ScalarEvolutionExpressions.h:291

llvm::SCEVUnknown
This means that we are dealing with an entirely unknown SCEV value, and only represent it as its LLVM...
Definition: ScalarEvolutionExpressions.h:580

llvm::SCEVUnknown::getValue
Value * getValue() const
Definition: ScalarEvolutionExpressions.h:601

llvm::SCEV
This class represents an analyzed expression in the program.
Definition: ScalarEvolution.h:72

llvm::SCEV::isZero
LLVM_ABI bool isZero() const
Return true if the expression is a constant zero.
Definition: ScalarEvolution.cpp:445

llvm::SCEV::getType
LLVM_ABI Type * getType() const
Return the LLVM type of this SCEV expression.
Definition: ScalarEvolution.cpp:383

llvm::ScalarEvolutionAnalysis
Analysis pass that exposes the ScalarEvolution for a function.
Definition: ScalarEvolution.h:2360

llvm::ScalarEvolution
The main scalar evolution driver.
Definition: ScalarEvolution.h:448

llvm::ScalarEvolution::getSCEVAtScope
LLVM_ABI const SCEV * getSCEVAtScope(const SCEV *S, const Loop *L)
Return a SCEV expression for the specified value at the specified scope in the program.
Definition: ScalarEvolution.cpp:9877

llvm::ScalarEvolution::getConstant
LLVM_ABI const SCEV * getConstant(ConstantInt *V)
Definition: ScalarEvolution.cpp:470

llvm::ScalarEvolution::getSCEV
LLVM_ABI const SCEV * getSCEV(Value *V)
Return a SCEV expression for the full generality of the specified expression.
Definition: ScalarEvolution.cpp:4572

llvm::ScalarEvolution::getMinusSCEV
LLVM_ABI const SCEV * getMinusSCEV(const SCEV *LHS, const SCEV *RHS, SCEV::NoWrapFlags Flags=SCEV::FlagAnyWrap, unsigned Depth=0)
Return LHS-RHS.
Definition: ScalarEvolution.cpp:4680

llvm::ScalarEvolution::getPointerBase
LLVM_ABI const SCEV * getPointerBase(const SCEV *V)
Transitively follow the chain of pointer-type operands until reaching a SCEV that does not have a sin...
Definition: ScalarEvolution.cpp:4848

llvm::ScalarEvolution::getMulExpr
LLVM_ABI const SCEV * getMulExpr(SmallVectorImpl< const SCEV * > &Ops, SCEV::NoWrapFlags Flags=SCEV::FlagAnyWrap, unsigned Depth=0)
Get a canonical multiply expression, or something simpler if possible.
Definition: ScalarEvolution.cpp:3117

llvm::ScalarEvolution::getElementSize
LLVM_ABI const SCEV * getElementSize(Instruction *Inst)
Return the size of an element read or written by Inst.
Definition: ScalarEvolution.cpp:13663

llvm::SmallVectorBase::empty
bool empty() const
Definition: SmallVector.h:82

llvm::SmallVectorBase::size
size_t size() const
Definition: SmallVector.h:79

llvm::SmallVectorImpl
This class consists of common code factored out of the SmallVector class to reduce code duplication b...
Definition: SmallVector.h:574

llvm::SmallVectorImpl::erase
iterator erase(const_iterator CI)
Definition: SmallVector.h:738

llvm::SmallVectorImpl::clear
void clear()
Definition: SmallVector.h:611

llvm::SmallVectorTemplateBase::push_back
void push_back(const T &Elt)
Definition: SmallVector.h:414

llvm::SmallVectorTemplateCommon::end
iterator end()
Definition: SmallVector.h:270

llvm::SmallVectorTemplateCommon::begin
iterator begin()
Definition: SmallVector.h:268

llvm::SmallVector
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
Definition: SmallVector.h:1197

llvm::Type
The instances of the Type class are immutable: once they are created, they are never changed.
Definition: Type.h:45

llvm::User::operands
op_range operands()
Definition: User.h:292

llvm::Value
LLVM Value Representation.
Definition: Value.h:75

llvm::Value::stripPointerCasts
LLVM_ABI const Value * stripPointerCasts() const
Strip off pointer casts, all-zero GEPs and address space casts.
Definition: Value.cpp:701

llvm::cl::opt
Definition: CommandLine.h:1429

llvm::raw_ostream
This class implements an extremely fast bulk output stream that can only output to a stream.
Definition: raw_ostream.h:53

uint64_t

llvm::RISCVFenceField::O
@ O
Definition: RISCVBaseInfo.h:399

llvm::cl::Hidden
@ Hidden
Definition: CommandLine.h:138

llvm::cl::init
initializer< Ty > init(const Ty &Val)
Definition: CommandLine.h:444

llvm::logicalview::LVPrintKind::Sizes
@ Sizes

llvm
This is an optimization pass for GlobalISel generic memory operations.
Definition: AddressRanges.h:18

llvm::visitAll
void visitAll(const SCEV *Root, SV &Visitor)
Use SCEVTraversal to visit all nodes in the given expression tree.
Definition: ScalarEvolutionExpressions.h:716

llvm::collectParametricTerms
void collectParametricTerms(ScalarEvolution &SE, const SCEV *Expr, SmallVectorImpl< const SCEV * > &Terms)
Collect parametric terms occurring in step expressions (first step of delinearization).
Definition: Delinearization.cpp:176

llvm::findArrayDimensions
void findArrayDimensions(ScalarEvolution &SE, SmallVectorImpl< const SCEV * > &Terms, SmallVectorImpl< const SCEV * > &Sizes, const SCEV *ElementSize)
Compute the array dimensions Sizes from the set of Terms extracted from the memory access function of...
Definition: Delinearization.cpp:282

llvm::getLoadStorePointerOperand
const Value * getLoadStorePointerOperand(const Value *V)
A helper function that returns the pointer operand of a load or store instruction.
Definition: Instructions.h:5088

llvm::unique
auto unique(Range &&R, Predicate P)
Definition: STLExtras.h:2095

llvm::getPointerOperand
const Value * getPointerOperand(const Value *V)
A helper function that returns the pointer operand of a load, store or GEP instruction.
Definition: Instructions.h:5102

llvm::computeAccessFunctions
void computeAccessFunctions(ScalarEvolution &SE, const SCEV *Expr, SmallVectorImpl< const SCEV * > &Subscripts, SmallVectorImpl< const SCEV * > &Sizes)
Return in Subscripts the access functions for each dimension in Sizes (third step of delinearization)...
Definition: Delinearization.cpp:346

llvm::delinearizeFixedSizeArray
bool delinearizeFixedSizeArray(ScalarEvolution &SE, const SCEV *Expr, SmallVectorImpl< const SCEV * > &Subscripts, SmallVectorImpl< const SCEV * > &Sizes, const SCEV *ElementSize)
Split this SCEVAddRecExpr into two vectors of SCEVs representing the subscripts and sizes of an acces...
Definition: Delinearization.cpp:645

llvm::sort
void sort(IteratorTy Start, IteratorTy End)
Definition: STLExtras.h:1669

llvm::dbgs
LLVM_ABI raw_ostream & dbgs()
dbgs() - This returns a reference to a raw_ostream for debugging messages.
Definition: Debug.cpp:207

llvm::getIndexExpressionsFromGEP
bool getIndexExpressionsFromGEP(ScalarEvolution &SE, const GetElementPtrInst *GEP, SmallVectorImpl< const SCEV * > &Subscripts, SmallVectorImpl< int > &Sizes)
Gathers the individual index expressions from a GEP instruction.
Definition: Delinearization.cpp:667

llvm::tryDelinearizeFixedSizeImpl
bool tryDelinearizeFixedSizeImpl(ScalarEvolution *SE, Instruction *Inst, const SCEV *AccessFn, SmallVectorImpl< const SCEV * > &Subscripts, SmallVectorImpl< int > &Sizes)
Implementation of fixed size array delinearization.
Definition: Delinearization.cpp:705

llvm::delinearize
void delinearize(ScalarEvolution &SE, const SCEV *Expr, SmallVectorImpl< const SCEV * > &Subscripts, SmallVectorImpl< const SCEV * > &Sizes, const SCEV *ElementSize)
Split this SCEVAddRecExpr into two vectors of SCEVs representing the subscripts and sizes of an array...
Definition: Delinearization.cpp:453

llvm::findFixedSizeArrayDimensions
bool findFixedSizeArrayDimensions(ScalarEvolution &SE, const SCEV *Expr, SmallVectorImpl< uint64_t > &Sizes, const SCEV *ElementSize)
Compute the dimensions of fixed size array from \Expr and save the results in Sizes.
Definition: Delinearization.cpp:533

llvm::PseudoProbeReservedId::Last
@ Last

llvm::erase_if
void erase_if(Container &C, UnaryPredicate P)
Provide a container algorithm similar to C++ Library Fundamentals v2's erase_if which is equivalent t...
Definition: STLExtras.h:2139

llvm::array_pod_sort
void array_pod_sort(IteratorTy Start, IteratorTy End)
array_pod_sort - This sorts an array with the specified start and end extent.
Definition: STLExtras.h:1629

llvm::SCEVExprContains
bool SCEVExprContains(const SCEV *Root, PredTy Pred)
Return true if any node in Root satisfies the predicate Pred.
Definition: ScalarEvolutionExpressions.h:723

raw_ostream.h

llvm::DelinearizationPrinterPass::run
PreservedAnalyses run(Function &F, FunctionAnalysisManager &AM)
Definition: Delinearization.cpp:813

llvm::DelinearizationPrinterPass::DelinearizationPrinterPass
DelinearizationPrinterPass(raw_ostream &OS)
Definition: Delinearization.cpp:811

llvm::SCEVDivision::divide
static void divide(ScalarEvolution &SE, const SCEV *Numerator, const SCEV *Denominator, const SCEV **Quotient, const SCEV **Remainder)
Computes the Quotient and Remainder of the division of Numerator by Denominator.
Definition: ScalarEvolutionDivision.cpp:59

llvm::cl::desc
Definition: CommandLine.h:410