//===- VectorUtils.cpp - MLIR Utilities for VectorOps ------------------===//
//
// Part of the MLIR Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//
//===----------------------------------------------------------------------===//
//
// This file implements utility methods for working with the Vector dialect.
//
//===----------------------------------------------------------------------===//

#include "mlir/Dialect/Vector/Utils/VectorUtils.h"

#include "mlir/Dialect/Affine/Analysis/LoopAnalysis.h"
#include "mlir/Dialect/Affine/IR/AffineOps.h"
#include "mlir/Dialect/Arith/IR/Arith.h"
#include "mlir/Dialect/Func/IR/FuncOps.h"
#include "mlir/Dialect/MemRef/IR/MemRef.h"
#include "mlir/Dialect/Tensor/IR/Tensor.h"
#include "mlir/Dialect/Utils/IndexingUtils.h"
#include "mlir/Dialect/Vector/IR/VectorOps.h"
#include "mlir/IR/Builders.h"
#include "mlir/IR/IntegerSet.h"
#include "mlir/IR/Operation.h"
#include "mlir/IR/TypeUtilities.h"
#include "mlir/Support/LLVM.h"

#include "llvm/ADT/DenseSet.h"
#include "llvm/ADT/SetVector.h"

#define DEBUG_TYPE "vector-utils"

#define DBGS() (llvm::dbgs() << '[' << DEBUG_TYPE << "] ")
#define LDBG(X) LLVM_DEBUG(DBGS() << X << "\n")

using namespace mlir;

/// Helper function that creates a memref::DimOp or tensor::DimOp depending on
/// the type of `source`.
Value mlir::vector::createOrFoldDimOp(OpBuilder &b, Location loc, Value source,
                                      int64_t dim) {
  if (isa<UnrankedMemRefType, MemRefType>(source.getType()))
    return b.createOrFold<memref::DimOp>(loc, source, dim);
  if (isa<UnrankedTensorType, RankedTensorType>(source.getType()))
    return b.createOrFold<tensor::DimOp>(loc, source, dim);
  llvm_unreachable("Expected MemRefType or TensorType");
}
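
// Usage sketch for the helper above (illustrative only; `builder`, `loc` and
// `src` are hypothetical values, not taken from this file):
//
//   // For `src : tensor<?x4xf32>`, query the dynamic leading dimension.
//   Value d0 = vector::createOrFoldDimOp(builder, loc, src, /*dim=*/0);
//   // For the static trailing dimension, the result may fold away to a
//   // constant index instead of materializing a tensor.dim/memref.dim op.
//   Value d1 = vector::createOrFoldDimOp(builder, loc, src, /*dim=*/1);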

/// Given the n-D transpose pattern 'transp', return true if 'dim0' and 'dim1'
/// should be transposed with each other within the context of their 2D
/// transposition slice.
///
/// Example 1: dim0 = 0, dim1 = 2, transp = [2, 1, 0]
/// Return true: dim0 and dim1 are transposed within the context of their 2D
/// transposition slice ([1, 0]).
///
/// Example 2: dim0 = 0, dim1 = 1, transp = [2, 1, 0]
/// Return true: dim0 and dim1 are transposed within the context of their 2D
/// transposition slice ([1, 0]). Paradoxically, note how dim1 (1) is *not*
/// transposed within the full context of the transposition.
///
/// Example 3: dim0 = 0, dim1 = 1, transp = [2, 0, 1]
/// Return false: dim0 and dim1 are *not* transposed within the context of
/// their 2D transposition slice ([0, 1]). Paradoxically, note how dim0 (0)
/// and dim1 (1) are transposed within the full context of the transposition.
static bool areDimsTransposedIn2DSlice(int64_t dim0, int64_t dim1,
                                       ArrayRef<int64_t> transp) {
  // Perform a linear scan along the dimensions of the transpose pattern. If
  // dim0 is found first, dim0 and dim1 are not transposed within the context
  // of their 2D slice. Otherwise, 'dim1' is found first and they are
  // transposed.
  for (int64_t permDim : transp) {
    if (permDim == dim0)
      return false;
    if (permDim == dim1)
      return true;
  }

  llvm_unreachable("Ill-formed transpose pattern");
}

FailureOr<std::pair<int, int>>
mlir::vector::isTranspose2DSlice(vector::TransposeOp op) {
  VectorType srcType = op.getSourceVectorType();
  SmallVector<int64_t> srcGtOneDims;
  for (auto [index, size] : llvm::enumerate(srcType.getShape()))
    if (size > 1)
      srcGtOneDims.push_back(index);

  if (srcGtOneDims.size() != 2)
    return failure();

  // Check whether the two source vector dimensions that are greater than one
  // must be transposed with each other so that we can apply one of the 2-D
  // transpose patterns. Otherwise, these patterns are not applicable.
  if (!areDimsTransposedIn2DSlice(srcGtOneDims[0], srcGtOneDims[1],
                                  op.getPermutation()))
    return failure();

  return std::pair<int, int>(srcGtOneDims[0], srcGtOneDims[1]);
}
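
// Illustrative query for the function above (the IR below is a sketch, not
// taken from an existing test):
//
//   %t = vector.transpose %v, [0, 2, 1]
//       : vector<1x4x8xf32> to vector<1x8x4xf32>
//
// The only two source dimensions greater than one are 1 and 2, and the
// permutation swaps them within their 2-D slice, so `isTranspose2DSlice`
// returns the pair (1, 2). If the permutation left those two dimensions in
// their original relative order, the function would return failure().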

/// Constructs a permutation map from memref indices to vector dimensions.
///
/// The implementation uses the knowledge of the mapping of enclosing loops to
/// vector dimensions. `enclosingLoopToVectorDim` carries this information as a
/// map with:
///   - keys representing "vectorized enclosing loops";
///   - values representing the corresponding vector dimension.
/// The algorithm traverses "vectorized enclosing loops" and extracts the
/// at-most-one MemRef index that varies along said loop. This index is
/// guaranteed to be at most one by construction: otherwise the MemRef is not
/// vectorizable.
/// If such a varying index is found, it is added to the permutation_map at the
/// proper vector dimension.
/// If no index is found to vary, 0 is added to the permutation_map and
/// corresponds to a vector broadcast along that dimension.
///
/// Returns an empty AffineMap if `enclosingLoopToVectorDim` is empty,
/// signalling that no permutation map can be constructed given
/// `enclosingLoopToVectorDim`.
///
/// Examples can be found in the documentation of `makePermutationMap`, in the
/// header file.
static AffineMap makePermutationMap(
    ArrayRef<Value> indices,
    const DenseMap<Operation *, unsigned> &enclosingLoopToVectorDim) {
  if (enclosingLoopToVectorDim.empty())
    return AffineMap();
  MLIRContext *context =
      enclosingLoopToVectorDim.begin()->getFirst()->getContext();
  SmallVector<AffineExpr> perm(enclosingLoopToVectorDim.size(),
                               getAffineConstantExpr(0, context));

  for (auto kvp : enclosingLoopToVectorDim) {
    assert(kvp.second < perm.size());
    auto invariants = affine::getInvariantAccesses(
        cast<affine::AffineForOp>(kvp.first).getInductionVar(), indices);
    unsigned numIndices = indices.size();
    unsigned countInvariantIndices = 0;
    for (unsigned dim = 0; dim < numIndices; ++dim) {
      if (!invariants.count(indices[dim])) {
        assert(perm[kvp.second] == getAffineConstantExpr(0, context) &&
               "permutationMap already has an entry along dim");
        perm[kvp.second] = getAffineDimExpr(dim, context);
      } else {
        ++countInvariantIndices;
      }
    }
    assert((countInvariantIndices == numIndices ||
            countInvariantIndices == numIndices - 1) &&
           "Vectorization prerequisite violated: at most 1 index may vary "
           "wrt a vectorized loop");
    (void)countInvariantIndices;
  }
  return AffineMap::get(indices.size(), 0, perm, context);
}
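
// Sketch of the construction above on a hypothetical access (not from a
// test): for memref indices (%i0, %c0, %i1) with
// enclosingLoopToVectorDim = {forOp(%i0) -> 0, forOp(%i1) -> 1}, the index
// varying with %i0 is d0 and the index varying with %i1 is d2, so the
// resulting permutation map is (d0, d1, d2) -> (d0, d2). If every index were
// invariant w.r.t. the loop mapped to vector dimension 1, that result would
// instead be the constant 0, i.e. a broadcast.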

/// Implementation detail that walks up the parents and records the ones with
/// the specified type.
/// TODO: could also be implemented as a collect parents followed by a
/// filter and made available outside this file.
template <typename T>
static SetVector<Operation *> getParentsOfType(Block *block) {
  SetVector<Operation *> res;
  auto *current = block->getParentOp();
  while (current) {
    if ([[maybe_unused]] auto typedParent = dyn_cast<T>(current)) {
      assert(res.count(current) == 0 && "Already inserted");
      res.insert(current);
    }
    current = current->getParentOp();
  }
  return res;
}

/// Returns the enclosing AffineForOps, from closest to farthest.
static SetVector<Operation *> getEnclosingforOps(Block *block) {
  return getParentsOfType<affine::AffineForOp>(block);
}

AffineMap mlir::makePermutationMap(
    Block *insertPoint, ArrayRef<Value> indices,
    const DenseMap<Operation *, unsigned> &loopToVectorDim) {
  DenseMap<Operation *, unsigned> enclosingLoopToVectorDim;
  auto enclosingLoops = getEnclosingforOps(insertPoint);
  for (auto *forInst : enclosingLoops) {
    auto it = loopToVectorDim.find(forInst);
    if (it != loopToVectorDim.end()) {
      enclosingLoopToVectorDim.insert(*it);
    }
  }
  return ::makePermutationMap(indices, enclosingLoopToVectorDim);
}

AffineMap mlir::makePermutationMap(
    Operation *op, ArrayRef<Value> indices,
    const DenseMap<Operation *, unsigned> &loopToVectorDim) {
  return makePermutationMap(op->getBlock(), indices, loopToVectorDim);
}
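
// Usage sketch for the public overloads above (variable names are
// hypothetical):
//
//   DenseMap<Operation *, unsigned> loopToVectorDim = ...; // from vectorizer
//   SmallVector<Value> indices = ...; // memref indices of the access
//   AffineMap permMap = makePermutationMap(accessOp, indices, loopToVectorDim);
//   if (!permMap)
//     return; // none of the enclosing loops is vectorized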

bool matcher::operatesOnSuperVectorsOf(Operation &op,
                                       VectorType subVectorType) {
  // First, extract the vector type and distinguish between:
  //   a. ops that *must* lower a super-vector (i.e. vector.transfer_read,
  //      vector.transfer_write); and
  //   b. ops that *may* lower a super-vector (all other ops).
  // The ops that *may* lower a super-vector only do so if the super-vector to
  // sub-vector ratio exists. The ops that *must* lower a super-vector are
  // explicitly checked for this property.
  /// TODO: there should be a single function for all ops to do this so we
  /// do not have to special case. Maybe a trait, or just a method, unclear atm.
  bool mustDivide = false;
  (void)mustDivide;
  VectorType superVectorType;
  if (auto transfer = dyn_cast<VectorTransferOpInterface>(op)) {
    superVectorType = transfer.getVectorType();
    mustDivide = true;
  } else if (op.getNumResults() == 0) {
    if (!isa<func::ReturnOp>(op)) {
      op.emitError("NYI: assuming only return operations can have 0 "
                   "results at this point");
    }
    return false;
  } else if (op.getNumResults() == 1) {
    if (auto v = dyn_cast<VectorType>(op.getResult(0).getType())) {
      superVectorType = v;
    } else {
      // Not a vector type.
      return false;
    }
  } else {
    // Not a vector.transfer and has more than 1 result: fail hard for now so
    // we notice when something changes.
    op.emitError("NYI: operation has more than 1 result");
    return false;
  }

  // Get the ratio.
  auto ratio =
      computeShapeRatio(superVectorType.getShape(), subVectorType.getShape());

  // Sanity check.
  assert((ratio || !mustDivide) &&
         "vector.transfer operation in which super-vector size is not an"
         " integer multiple of sub-vector size");

  // This also catches the cases where divisibility is not strictly required
  // but the shape still is not divisible by the sub-vector shape.
  // This could be useful information if we wanted to reshape at the level of
  // the vector type (but we would have to look at the compute and distinguish
  // between parallel, reduction and possibly other cases).
  return ratio.has_value();
}
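
// Illustrative shape-ratio check for the matcher above (types are
// hypothetical): an op producing a vector<4x8x16xf32> operates on
// super-vectors of vector<8x16xf32>, since
// computeShapeRatio({4, 8, 16}, {8, 16}) yields {4, 1, 1}. Against a
// vector<8x12xf32> sub-vector the ratio does not exist, so the matcher
// returns false.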

bool vector::isContiguousSlice(MemRefType memrefType, VectorType vectorType) {
  if (vectorType.isScalable())
    return false;

  ArrayRef<int64_t> vectorShape = vectorType.getShape();
  auto vecRank = vectorType.getRank();

  if (!memrefType.areTrailingDimsContiguous(vecRank))
    return false;

  // Extract the trailing dims of the input memref.
  auto memrefShape = memrefType.getShape().take_back(vecRank);

  // Compare the dims of `vectorType` against `memrefType` (in reverse).
  // In the most basic case, all dims will match.
  auto firstNonMatchingDim =
      std::mismatch(vectorShape.rbegin(), vectorShape.rend(),
                    memrefShape.rbegin(), memrefShape.rend());
  if (firstNonMatchingDim.first == vectorShape.rend())
    return true;

  // One non-matching dim is still fine, however the remaining leading dims of
  // `vectorType` need to be 1.
  SmallVector<int64_t> leadingDims(++firstNonMatchingDim.first,
                                   vectorShape.rend());

  return llvm::all_of(leadingDims, [](auto x) { return x == 1; });
}
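
// Worked example for the contiguity check above (hypothetical types): reading
// a vector<1x4x8xf32> from a memref<2x4x8xf32> with the default row-major
// layout is a contiguous slice: the trailing memref dims (4, 8) match the
// trailing vector dims and the remaining leading vector dim is 1. Reading a
// vector<2x2x8xf32> from the same memref is not contiguous: after the first
// mismatch (2 vs. 4), a leading vector dim of 2 remains, which is not 1.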

std::optional<StaticTileOffsetRange>
vector::createUnrollIterator(VectorType vType, int64_t targetRank) {
  if (vType.getRank() <= targetRank)
    return {};
  // Attempt to unroll until targetRank or the first scalable dimension (which
  // cannot be unrolled).
  auto shapeToUnroll = vType.getShape().drop_back(targetRank);
  auto scalableDimsToUnroll = vType.getScalableDims().drop_back(targetRank);
  auto it =
      std::find(scalableDimsToUnroll.begin(), scalableDimsToUnroll.end(), true);
  auto firstScalableDim = it - scalableDimsToUnroll.begin();
  if (firstScalableDim == 0)
    return {};
  // All scalable dimensions should be removed now.
  scalableDimsToUnroll = scalableDimsToUnroll.slice(0, firstScalableDim);
  assert(!llvm::is_contained(scalableDimsToUnroll, true) &&
         "unexpected leading scalable dimension");
  // Create an unroll iterator for leading dimensions.
  shapeToUnroll = shapeToUnroll.slice(0, firstScalableDim);
  return StaticTileOffsetRange(shapeToUnroll, /*unrollStep=*/1);
}
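
// Behavior sketch for the unroll iterator above (hypothetical types): for
// vType = vector<3x2x[4]x5xf32> and targetRank = 2, the leading fixed dims
// (3, 2) are unrolled and the returned range enumerates the offsets
// (0, 0), (0, 1), (1, 0), (1, 1), (2, 0), (2, 1), while the scalable [4] and
// the trailing 5 stay inside the target shape. For vector<[4]x5xf32> with
// targetRank = 1, the leading dim is scalable and std::nullopt is returned.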

SmallVector<OpFoldResult> vector::getMixedSizesXfer(bool hasTensorSemantics,
                                                    Operation *xfer,
                                                    RewriterBase &rewriter) {
  auto loc = xfer->getLoc();

  Value base = TypeSwitch<Operation *, Value>(xfer)
                   .Case<vector::TransferReadOp>(
                       [&](auto readOp) { return readOp.getSource(); })
                   .Case<vector::TransferWriteOp>(
                       [&](auto writeOp) { return writeOp.getOperand(1); });

  SmallVector<OpFoldResult> mixedSourceDims =
      hasTensorSemantics ? tensor::getMixedSizes(rewriter, loc, base)
                         : memref::getMixedSizes(rewriter, loc, base);
  return mixedSourceDims;
}

bool vector::isLinearizableVector(VectorType type) {
  return (type.getRank() > 1) && (type.getNumScalableDims() <= 1);
}

Value vector::createReadOrMaskedRead(OpBuilder &builder, Location loc,
                                     Value source, ArrayRef<int64_t> readShape,
                                     Value padValue,
                                     bool useInBoundsInsteadOfMasking) {
  assert(llvm::none_of(readShape,
                       [](int64_t s) { return s == ShapedType::kDynamic; }) &&
         "expected static shape");
  auto sourceShapedType = cast<ShapedType>(source.getType());
  auto sourceShape = sourceShapedType.getShape();
  assert(sourceShape.size() == readShape.size() && "expected same ranks.");
  auto maskType = VectorType::get(readShape, builder.getI1Type());
  auto vectorType = VectorType::get(readShape, padValue.getType());
  assert(padValue.getType() == sourceShapedType.getElementType() &&
         "expected same pad element type to match source element type");
  int64_t readRank = readShape.size();
  auto zero = builder.create<arith::ConstantIndexOp>(loc, 0);
  SmallVector<bool> inBoundsVal(readRank, true);
  if (useInBoundsInsteadOfMasking) {
    // Update the inBounds attribute.
    for (unsigned i = 0; i < readRank; i++)
      inBoundsVal[i] = (sourceShape[i] == readShape[i]) &&
                       !ShapedType::isDynamic(sourceShape[i]);
  }
  auto transferReadOp = builder.create<vector::TransferReadOp>(
      loc,
      /*vectorType=*/vectorType,
      /*source=*/source,
      /*indices=*/SmallVector<Value>(readRank, zero),
      /*padding=*/padValue,
      /*inBounds=*/inBoundsVal);

  if (llvm::equal(readShape, sourceShape) || useInBoundsInsteadOfMasking)
    return transferReadOp;
  SmallVector<OpFoldResult> mixedSourceDims =
      tensor::getMixedSizes(builder, loc, source);
  Value mask =
      builder.create<vector::CreateMaskOp>(loc, maskType, mixedSourceDims);
  return mlir::vector::maskOperation(builder, transferReadOp, mask)
      ->getResult(0);
}

LogicalResult
vector::isValidMaskedInputVector(ArrayRef<int64_t> shape,
                                 ArrayRef<int64_t> inputVectorSizes) {
  LDBG("Iteration space static sizes:");
  LLVM_DEBUG(llvm::interleaveComma(shape, llvm::dbgs()));
  LLVM_DEBUG(llvm::dbgs() << "\n");

  if (inputVectorSizes.size() != shape.size()) {
    LDBG("Input vector sizes don't match the number of loops");
    return failure();
  }
  if (ShapedType::isDynamicShape(inputVectorSizes)) {
    LDBG("Input vector sizes can't have dynamic dimensions");
    return failure();
  }
  if (!llvm::all_of(llvm::zip(shape, inputVectorSizes),
                    [](std::tuple<int64_t, int64_t> sizePair) {
                      int64_t staticSize = std::get<0>(sizePair);
                      int64_t inputSize = std::get<1>(sizePair);
                      return ShapedType::isDynamic(staticSize) ||
                             staticSize <= inputSize;
                    })) {
    LDBG("Input vector sizes must be greater than or equal to iteration space "
         "static sizes");
    return failure();
  }
  return success();
}
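
// Illustrative check for the validation above (sizes are hypothetical): for an
// iteration space (8, ?) and inputVectorSizes = (8, 16), validation succeeds:
// the ranks match, the vector sizes are static, and each static
// iteration-space size fits in the corresponding vector size. With
// inputVectorSizes = (4, 16), the static size 8 exceeds 4 and failure() is
// returned.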