Vector/Transforms/VectorLinearize.cpp

35ef3994SIvan Butygin//===- VectorLinearize.cpp - vector linearization transforms --------------===//
35ef3994SIvan Butygin//
35ef3994SIvan Butygin// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
35ef3994SIvan Butygin// See https://llvm.org/LICENSE.txt for license information.
35ef3994SIvan Butygin// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
35ef3994SIvan Butygin//
35ef3994SIvan Butygin//===----------------------------------------------------------------------===//
35ef3994SIvan Butygin//
35ef3994SIvan Butygin// This file implements patterns and pass for linearizing ND vectors into 1D.
35ef3994SIvan Butygin//
35ef3994SIvan Butygin//===----------------------------------------------------------------------===//
35ef3994SIvan Butygin
35ef3994SIvan Butygin#include "mlir/Dialect/Arith/IR/Arith.h"
35ef3994SIvan Butygin#include "mlir/Dialect/Vector/IR/VectorOps.h"
35ef3994SIvan Butygin#include "mlir/Dialect/Vector/Transforms/VectorRewritePatterns.h"
c577f91dSCharitha Saumya#include "mlir/IR/Attributes.h"
c577f91dSCharitha Saumya#include "mlir/IR/BuiltinAttributes.h"
c577f91dSCharitha Saumya#include "mlir/IR/Operation.h"
35ef3994SIvan Butygin#include "mlir/IR/PatternMatch.h"
35ef3994SIvan Butygin#include "mlir/IR/TypeUtilities.h"
35ef3994SIvan Butygin#include "mlir/Transforms/DialectConversion.h"
c577f91dSCharitha Saumya#include "llvm/ADT/ArrayRef.h"
c577f91dSCharitha Saumya#include <cstdint>
c577f91dSCharitha Saumya#include <numeric>
35ef3994SIvan Butygin
35ef3994SIvan Butyginusing namespace mlir;
35ef3994SIvan Butygin
6f5c4f2eSBalaji V. Iyerstatic bool isLessThanTargetBitWidth(Operation *op, unsigned targetBitWidth) {
6f5c4f2eSBalaji V. Iyer  auto resultTypes = op->getResultTypes();
6f5c4f2eSBalaji V. Iyer  for (auto resType : resultTypes) {
5f1f9cfaSBalaji V. Iyer    VectorType vecType = dyn_cast<VectorType>(resType);
6f5c4f2eSBalaji V. Iyer    // Reject index since getElementTypeBitWidth will abort for Index types.
5f1f9cfaSBalaji V. Iyer    if (!vecType || vecType.getElementType().isIndex())
6f5c4f2eSBalaji V. Iyer      return false;
ef5a7109SHan-Chung Wang    // There are no dimension to fold if it is a 0-D vector.
ef5a7109SHan-Chung Wang    if (vecType.getRank() == 0)
ef5a7109SHan-Chung Wang      return false;
6f5c4f2eSBalaji V. Iyer    unsigned trailingVecDimBitWidth =
6f5c4f2eSBalaji V. Iyer        vecType.getShape().back() * vecType.getElementTypeBitWidth();
6f5c4f2eSBalaji V. Iyer    if (trailingVecDimBitWidth >= targetBitWidth)
6f5c4f2eSBalaji V. Iyer      return false;
6f5c4f2eSBalaji V. Iyer  }
6f5c4f2eSBalaji V. Iyer  return true;
6f5c4f2eSBalaji V. Iyer}
6f5c4f2eSBalaji V. Iyer
01fbc565SArtem Kroviakovstatic bool isLessThanOrEqualTargetBitWidth(Type t, unsigned targetBitWidth) {
01fbc565SArtem Kroviakov  VectorType vecType = dyn_cast<VectorType>(t);
01fbc565SArtem Kroviakov  // Reject index since getElementTypeBitWidth will abort for Index types.
01fbc565SArtem Kroviakov  if (!vecType || vecType.getElementType().isIndex())
01fbc565SArtem Kroviakov    return false;
01fbc565SArtem Kroviakov  // There are no dimension to fold if it is a 0-D vector.
01fbc565SArtem Kroviakov  if (vecType.getRank() == 0)
01fbc565SArtem Kroviakov    return false;
01fbc565SArtem Kroviakov  unsigned trailingVecDimBitWidth =
01fbc565SArtem Kroviakov      vecType.getShape().back() * vecType.getElementTypeBitWidth();
01fbc565SArtem Kroviakov  return trailingVecDimBitWidth <= targetBitWidth;
01fbc565SArtem Kroviakov}
01fbc565SArtem Kroviakov
35ef3994SIvan Butyginnamespace {
35ef3994SIvan Butyginstruct LinearizeConstant final : OpConversionPattern<arith::ConstantOp> {
35ef3994SIvan Butygin  using OpConversionPattern::OpConversionPattern;
6f5c4f2eSBalaji V. Iyer  LinearizeConstant(
6f5c4f2eSBalaji V. Iyer      const TypeConverter &typeConverter, MLIRContext *context,
6f5c4f2eSBalaji V. Iyer      unsigned targetVectBitWidth = std::numeric_limits<unsigned>::max(),
6f5c4f2eSBalaji V. Iyer      PatternBenefit benefit = 1)
6f5c4f2eSBalaji V. Iyer      : OpConversionPattern(typeConverter, context, benefit),
6f5c4f2eSBalaji V. Iyer        targetVectorBitWidth(targetVectBitWidth) {}
35ef3994SIvan Butygin  LogicalResult
35ef3994SIvan Butygin  matchAndRewrite(arith::ConstantOp constOp, OpAdaptor adaptor,
35ef3994SIvan Butygin                  ConversionPatternRewriter &rewriter) const override {
35ef3994SIvan Butygin    Location loc = constOp.getLoc();
35ef3994SIvan Butygin    auto resType =
35ef3994SIvan Butygin        getTypeConverter()->convertType<VectorType>(constOp.getType());
d3aa92edSAndrzej Warzyński
*bd5d361cSChao Chen    if (!resType)
*bd5d361cSChao Chen      return rewriter.notifyMatchFailure(loc, "can't convert return type");
*bd5d361cSChao Chen
d3aa92edSAndrzej Warzyński    if (resType.isScalable() && !isa<SplatElementsAttr>(constOp.getValue()))
d3aa92edSAndrzej Warzyński      return rewriter.notifyMatchFailure(
d3aa92edSAndrzej Warzyński          loc,
d3aa92edSAndrzej Warzyński          "Cannot linearize a constant scalable vector that's not a splat");
d3aa92edSAndrzej Warzyński
6f5c4f2eSBalaji V. Iyer    if (!isLessThanTargetBitWidth(constOp, targetVectorBitWidth))
6f5c4f2eSBalaji V. Iyer      return rewriter.notifyMatchFailure(
6f5c4f2eSBalaji V. Iyer          loc, "Can't flatten since targetBitWidth <= OpSize");
35ef3994SIvan Butygin    auto dstElementsAttr = dyn_cast<DenseElementsAttr>(constOp.getValue());
35ef3994SIvan Butygin    if (!dstElementsAttr)
35ef3994SIvan Butygin      return rewriter.notifyMatchFailure(loc, "unsupported attr type");
35ef3994SIvan Butygin
35ef3994SIvan Butygin    dstElementsAttr = dstElementsAttr.reshape(resType);
35ef3994SIvan Butygin    rewriter.replaceOpWithNewOp<arith::ConstantOp>(constOp, resType,
35ef3994SIvan Butygin                                                   dstElementsAttr);
35ef3994SIvan Butygin    return success();
35ef3994SIvan Butygin  }
6f5c4f2eSBalaji V. Iyer
6f5c4f2eSBalaji V. Iyerprivate:
6f5c4f2eSBalaji V. Iyer  unsigned targetVectorBitWidth;
35ef3994SIvan Butygin};
35ef3994SIvan Butygin
35ef3994SIvan Butyginstruct LinearizeVectorizable final
35ef3994SIvan Butygin    : OpTraitConversionPattern<OpTrait::Vectorizable> {
35ef3994SIvan Butygin  using OpTraitConversionPattern::OpTraitConversionPattern;
35ef3994SIvan Butygin
6f5c4f2eSBalaji V. Iyerpublic:
6f5c4f2eSBalaji V. Iyer  LinearizeVectorizable(
6f5c4f2eSBalaji V. Iyer      const TypeConverter &typeConverter, MLIRContext *context,
6f5c4f2eSBalaji V. Iyer      unsigned targetVectBitWidth = std::numeric_limits<unsigned>::max(),
6f5c4f2eSBalaji V. Iyer      PatternBenefit benefit = 1)
6f5c4f2eSBalaji V. Iyer      : OpTraitConversionPattern(typeConverter, context, benefit),
6f5c4f2eSBalaji V. Iyer        targetVectorBitWidth(targetVectBitWidth) {}
35ef3994SIvan Butygin  LogicalResult
35ef3994SIvan Butygin  matchAndRewrite(Operation *op, ArrayRef<Value> operands,
35ef3994SIvan Butygin                  ConversionPatternRewriter &rewriter) const override {
6f5c4f2eSBalaji V. Iyer    if (!isLessThanTargetBitWidth(op, targetVectorBitWidth))
6f5c4f2eSBalaji V. Iyer      return rewriter.notifyMatchFailure(
6f5c4f2eSBalaji V. Iyer          op->getLoc(), "Can't flatten since targetBitWidth <= OpSize");
35ef3994SIvan Butygin    FailureOr<Operation *> newOp =
35ef3994SIvan Butygin        convertOpResultTypes(op, operands, *getTypeConverter(), rewriter);
35ef3994SIvan Butygin    if (failed(newOp))
35ef3994SIvan Butygin      return failure();
35ef3994SIvan Butygin
35ef3994SIvan Butygin    rewriter.replaceOp(op, (*newOp)->getResults());
35ef3994SIvan Butygin    return success();
35ef3994SIvan Butygin  }
6f5c4f2eSBalaji V. Iyer
6f5c4f2eSBalaji V. Iyerprivate:
6f5c4f2eSBalaji V. Iyer  unsigned targetVectorBitWidth;
35ef3994SIvan Butygin};
c577f91dSCharitha Saumya
c577f91dSCharitha Saumya/// This pattern converts the ExtractStridedSliceOp into a ShuffleOp that works
c577f91dSCharitha Saumya/// on a linearized vector.
c577f91dSCharitha Saumya/// Following,
c577f91dSCharitha Saumya///   vector.extract_strided_slice %source
c577f91dSCharitha Saumya///         { offsets = [..], strides = [..], sizes = [..] }
c577f91dSCharitha Saumya/// is converted to :
c577f91dSCharitha Saumya///   %source_1d = vector.shape_cast %source
c577f91dSCharitha Saumya///   %out_1d = vector.shuffle %source_1d, %source_1d [ shuffle_indices_1d ]
c577f91dSCharitha Saumya///   %out_nd = vector.shape_cast %out_1d
c577f91dSCharitha Saumya/// `shuffle_indices_1d` is computed using the offsets and sizes of the
c577f91dSCharitha Saumya/// extraction.
c577f91dSCharitha Saumyastruct LinearizeVectorExtractStridedSlice final
c577f91dSCharitha Saumya    : public mlir::OpConversionPattern<mlir::vector::ExtractStridedSliceOp> {
c577f91dSCharitha Saumya  using OpConversionPattern::OpConversionPattern;
c577f91dSCharitha Saumya  LinearizeVectorExtractStridedSlice(
c577f91dSCharitha Saumya      const TypeConverter &typeConverter, MLIRContext *context,
c577f91dSCharitha Saumya      unsigned targetVectBitWidth = std::numeric_limits<unsigned>::max(),
c577f91dSCharitha Saumya      PatternBenefit benefit = 1)
c577f91dSCharitha Saumya      : OpConversionPattern(typeConverter, context, benefit),
c577f91dSCharitha Saumya        targetVectorBitWidth(targetVectBitWidth) {}
c577f91dSCharitha Saumya
c577f91dSCharitha Saumya  LogicalResult
c577f91dSCharitha Saumya  matchAndRewrite(vector::ExtractStridedSliceOp extractOp, OpAdaptor adaptor,
c577f91dSCharitha Saumya                  ConversionPatternRewriter &rewriter) const override {
74a105adSArtem Kroviakov    VectorType dstType =
74a105adSArtem Kroviakov        getTypeConverter()->convertType<VectorType>(extractOp.getType());
74a105adSArtem Kroviakov    assert(dstType && "vector type destination expected.");
74a105adSArtem Kroviakov    if (extractOp.getVector().getType().isScalable() || dstType.isScalable())
74a105adSArtem Kroviakov      return rewriter.notifyMatchFailure(extractOp,
c577f91dSCharitha Saumya                                         "scalable vectors are not supported.");
c577f91dSCharitha Saumya    if (!isLessThanTargetBitWidth(extractOp, targetVectorBitWidth))
c577f91dSCharitha Saumya      return rewriter.notifyMatchFailure(
c577f91dSCharitha Saumya          extractOp, "Can't flatten since targetBitWidth <= OpSize");
c577f91dSCharitha Saumya
c577f91dSCharitha Saumya    ArrayAttr offsets = extractOp.getOffsets();
c577f91dSCharitha Saumya    ArrayAttr sizes = extractOp.getSizes();
c577f91dSCharitha Saumya    ArrayAttr strides = extractOp.getStrides();
c577f91dSCharitha Saumya    if (!isConstantIntValue(strides[0], 1))
c577f91dSCharitha Saumya      return rewriter.notifyMatchFailure(
c577f91dSCharitha Saumya          extractOp, "Strided slice with stride != 1 is not supported.");
c577f91dSCharitha Saumya    Value srcVector = adaptor.getVector();
c577f91dSCharitha Saumya    // If kD offsets are specified for nD source vector (n > k), the granularity
c577f91dSCharitha Saumya    // of the extraction is greater than 1. In this case last (n-k) dimensions
c577f91dSCharitha Saumya    // form the extraction granularity.
c577f91dSCharitha Saumya    // Example :
c577f91dSCharitha Saumya    //  vector.extract_strided_slice %src {
c577f91dSCharitha Saumya    //      offsets = [0, 0], sizes = [2, 2], strides = [1, 1]} :
c577f91dSCharitha Saumya    //      vector<4x8x8xf32> to vector<2x2x8xf32>
c577f91dSCharitha Saumya    // Here, extraction granularity is 8.
c577f91dSCharitha Saumya    int64_t extractGranularitySize = 1;
c577f91dSCharitha Saumya    int64_t nD = extractOp.getSourceVectorType().getRank();
c577f91dSCharitha Saumya    int64_t kD = (int64_t)offsets.size();
c577f91dSCharitha Saumya    int64_t k = kD;
c577f91dSCharitha Saumya    while (k < nD) {
c577f91dSCharitha Saumya      extractGranularitySize *= extractOp.getSourceVectorType().getShape()[k];
c577f91dSCharitha Saumya      ++k;
c577f91dSCharitha Saumya    }
c577f91dSCharitha Saumya    // Get total number of extracted slices.
c577f91dSCharitha Saumya    int64_t nExtractedSlices = 1;
c577f91dSCharitha Saumya    for (Attribute size : sizes) {
fac349a1SChristian Sigg      nExtractedSlices *= cast<IntegerAttr>(size).getInt();
c577f91dSCharitha Saumya    }
c577f91dSCharitha Saumya    // Compute the strides of the source vector considering first k dimensions.
c577f91dSCharitha Saumya    llvm::SmallVector<int64_t, 4> sourceStrides(kD, extractGranularitySize);
c577f91dSCharitha Saumya    for (int i = kD - 2; i >= 0; --i) {
c577f91dSCharitha Saumya      sourceStrides[i] = sourceStrides[i + 1] *
c577f91dSCharitha Saumya                         extractOp.getSourceVectorType().getShape()[i + 1];
c577f91dSCharitha Saumya    }
c577f91dSCharitha Saumya    // Final shuffle indices has nExtractedSlices * extractGranularitySize
c577f91dSCharitha Saumya    // elements.
c577f91dSCharitha Saumya    llvm::SmallVector<int64_t, 4> indices(nExtractedSlices *
c577f91dSCharitha Saumya                                          extractGranularitySize);
c577f91dSCharitha Saumya    // Compute the strides of the extracted kD vector.
c577f91dSCharitha Saumya    llvm::SmallVector<int64_t, 4> extractedStrides(kD, 1);
c577f91dSCharitha Saumya    // Compute extractedStrides.
c577f91dSCharitha Saumya    for (int i = kD - 2; i >= 0; --i) {
c577f91dSCharitha Saumya      extractedStrides[i] =
fac349a1SChristian Sigg          extractedStrides[i + 1] * cast<IntegerAttr>(sizes[i + 1]).getInt();
c577f91dSCharitha Saumya    }
c577f91dSCharitha Saumya    // Iterate over all extracted slices from 0 to nExtractedSlices - 1
c577f91dSCharitha Saumya    // and compute the multi-dimensional index and the corresponding linearized
c577f91dSCharitha Saumya    // index within the source vector.
c577f91dSCharitha Saumya    for (int64_t i = 0; i < nExtractedSlices; ++i) {
c577f91dSCharitha Saumya      int64_t index = i;
c577f91dSCharitha Saumya      // Compute the corresponding multi-dimensional index.
c577f91dSCharitha Saumya      llvm::SmallVector<int64_t, 4> multiDimIndex(kD, 0);
c577f91dSCharitha Saumya      for (int64_t j = 0; j < kD; ++j) {
c577f91dSCharitha Saumya        multiDimIndex[j] = (index / extractedStrides[j]);
c577f91dSCharitha Saumya        index -= multiDimIndex[j] * extractedStrides[j];
c577f91dSCharitha Saumya      }
c577f91dSCharitha Saumya      // Compute the corresponding linearized index in the source vector
c577f91dSCharitha Saumya      // i.e. shift the multiDimIndex by the offsets.
c577f91dSCharitha Saumya      int64_t linearizedIndex = 0;
c577f91dSCharitha Saumya      for (int64_t j = 0; j < kD; ++j) {
c577f91dSCharitha Saumya        linearizedIndex +=
fac349a1SChristian Sigg            (cast<IntegerAttr>(offsets[j]).getInt() + multiDimIndex[j]) *
c577f91dSCharitha Saumya            sourceStrides[j];
c577f91dSCharitha Saumya      }
c577f91dSCharitha Saumya      // Fill the indices array form linearizedIndex to linearizedIndex +
c577f91dSCharitha Saumya      // extractGranularitySize.
c577f91dSCharitha Saumya      for (int64_t j = 0; j < extractGranularitySize; ++j) {
c577f91dSCharitha Saumya        indices[i * extractGranularitySize + j] = linearizedIndex + j;
c577f91dSCharitha Saumya      }
c577f91dSCharitha Saumya    }
c577f91dSCharitha Saumya    // Perform a shuffle to extract the kD vector.
c577f91dSCharitha Saumya    rewriter.replaceOpWithNewOp<vector::ShuffleOp>(
b4444dcaSBenjamin Maxwell        extractOp, dstType, srcVector, srcVector, indices);
c577f91dSCharitha Saumya    return success();
c577f91dSCharitha Saumya  }
c577f91dSCharitha Saumya
c577f91dSCharitha Saumyaprivate:
c577f91dSCharitha Saumya  unsigned targetVectorBitWidth;
c577f91dSCharitha Saumya};
c577f91dSCharitha Saumya
c577f91dSCharitha Saumya/// This pattern converts the ShuffleOp that works on nD (n > 1)
c577f91dSCharitha Saumya/// vectors to a ShuffleOp that works on linearized vectors.
c577f91dSCharitha Saumya/// Following,
c577f91dSCharitha Saumya///   vector.shuffle %v1, %v2 [ shuffle_indices ]
c577f91dSCharitha Saumya/// is converted to :
c577f91dSCharitha Saumya///   %v1_1d = vector.shape_cast %v1
c577f91dSCharitha Saumya///   %v2_1d = vector.shape_cast %v2
c577f91dSCharitha Saumya///   %out_1d = vector.shuffle %v1_1d, %v2_1d [ shuffle_indices_1d ]
c577f91dSCharitha Saumya///   %out_nd = vector.shape_cast %out_1d
c577f91dSCharitha Saumya// `shuffle_indices_1d` is computed using the sizes and `shuffle_indices`
c577f91dSCharitha Saumya/// of the original shuffle operation.
c577f91dSCharitha Saumyastruct LinearizeVectorShuffle final
c577f91dSCharitha Saumya    : public OpConversionPattern<vector::ShuffleOp> {
c577f91dSCharitha Saumya  using OpConversionPattern::OpConversionPattern;
c577f91dSCharitha Saumya  LinearizeVectorShuffle(
c577f91dSCharitha Saumya      const TypeConverter &typeConverter, MLIRContext *context,
c577f91dSCharitha Saumya      unsigned targetVectBitWidth = std::numeric_limits<unsigned>::max(),
c577f91dSCharitha Saumya      PatternBenefit benefit = 1)
c577f91dSCharitha Saumya      : OpConversionPattern(typeConverter, context, benefit),
c577f91dSCharitha Saumya        targetVectorBitWidth(targetVectBitWidth) {}
c577f91dSCharitha Saumya
c577f91dSCharitha Saumya  LogicalResult
c577f91dSCharitha Saumya  matchAndRewrite(vector::ShuffleOp shuffleOp, OpAdaptor adaptor,
c577f91dSCharitha Saumya                  ConversionPatternRewriter &rewriter) const override {
74a105adSArtem Kroviakov    VectorType dstType =
74a105adSArtem Kroviakov        getTypeConverter()->convertType<VectorType>(shuffleOp.getType());
74a105adSArtem Kroviakov    assert(dstType && "vector type destination expected.");
74a105adSArtem Kroviakov    // The assert is used because vector.shuffle does not support scalable
74a105adSArtem Kroviakov    // vectors.
c577f91dSCharitha Saumya    assert(!(shuffleOp.getV1VectorType().isScalable() ||
c577f91dSCharitha Saumya             shuffleOp.getV2VectorType().isScalable() ||
74a105adSArtem Kroviakov             dstType.isScalable()) &&
c577f91dSCharitha Saumya           "scalable vectors are not supported.");
c577f91dSCharitha Saumya    if (!isLessThanTargetBitWidth(shuffleOp, targetVectorBitWidth))
c577f91dSCharitha Saumya      return rewriter.notifyMatchFailure(
c577f91dSCharitha Saumya          shuffleOp, "Can't flatten since targetBitWidth <= OpSize");
c577f91dSCharitha Saumya
c577f91dSCharitha Saumya    Value vec1 = adaptor.getV1();
c577f91dSCharitha Saumya    Value vec2 = adaptor.getV2();
c577f91dSCharitha Saumya    int shuffleSliceLen = 1;
c577f91dSCharitha Saumya    int rank = shuffleOp.getV1().getType().getRank();
c577f91dSCharitha Saumya
c577f91dSCharitha Saumya    // If rank > 1, we need to do the shuffle in the granularity of slices
c577f91dSCharitha Saumya    // instead of scalars. Size of the slice is equal to the rank-1 innermost
c577f91dSCharitha Saumya    // dims. Mask of the shuffle op specifies which slice to take from the
c577f91dSCharitha Saumya    // outermost dim.
c577f91dSCharitha Saumya    if (rank > 1) {
c577f91dSCharitha Saumya      llvm::ArrayRef<int64_t> shape = shuffleOp.getV1().getType().getShape();
c577f91dSCharitha Saumya      for (unsigned i = 1; i < shape.size(); ++i) {
c577f91dSCharitha Saumya        shuffleSliceLen *= shape[i];
c577f91dSCharitha Saumya      }
c577f91dSCharitha Saumya    }
c577f91dSCharitha Saumya
c577f91dSCharitha Saumya    // For each value in the mask, we generate the indices of the source vectors
c577f91dSCharitha Saumya    // that needs to be shuffled to the destination vector. If shuffleSliceLen >
c577f91dSCharitha Saumya    // 1 we need to shuffle the slices (consecutive shuffleSliceLen number of
c577f91dSCharitha Saumya    // elements) instead of scalars.
b4444dcaSBenjamin Maxwell    ArrayRef<int64_t> mask = shuffleOp.getMask();
c577f91dSCharitha Saumya    int64_t totalSizeOfShuffledElmnts = mask.size() * shuffleSliceLen;
c577f91dSCharitha Saumya    llvm::SmallVector<int64_t, 2> indices(totalSizeOfShuffledElmnts);
b4444dcaSBenjamin Maxwell    for (auto [i, value] : llvm::enumerate(mask)) {
c577f91dSCharitha Saumya      std::iota(indices.begin() + shuffleSliceLen * i,
c577f91dSCharitha Saumya                indices.begin() + shuffleSliceLen * (i + 1),
b4444dcaSBenjamin Maxwell                shuffleSliceLen * value);
c577f91dSCharitha Saumya    }
c577f91dSCharitha Saumya
b4444dcaSBenjamin Maxwell    rewriter.replaceOpWithNewOp<vector::ShuffleOp>(shuffleOp, dstType, vec1,
b4444dcaSBenjamin Maxwell                                                   vec2, indices);
c577f91dSCharitha Saumya    return success();
c577f91dSCharitha Saumya  }
c577f91dSCharitha Saumya
c577f91dSCharitha Saumyaprivate:
c577f91dSCharitha Saumya  unsigned targetVectorBitWidth;
c577f91dSCharitha Saumya};
c577f91dSCharitha Saumya
c577f91dSCharitha Saumya/// This pattern converts the ExtractOp to a ShuffleOp that works on a
c577f91dSCharitha Saumya/// linearized vector.
c577f91dSCharitha Saumya/// Following,
c577f91dSCharitha Saumya///   vector.extract %source [ position ]
c577f91dSCharitha Saumya/// is converted to :
c577f91dSCharitha Saumya///   %source_1d = vector.shape_cast %source
c577f91dSCharitha Saumya///   %out_1d = vector.shuffle %source_1d, %source_1d [ shuffle_indices_1d ]
c577f91dSCharitha Saumya///   %out_nd = vector.shape_cast %out_1d
c577f91dSCharitha Saumya/// `shuffle_indices_1d` is computed using the position of the original extract.
c577f91dSCharitha Saumyastruct LinearizeVectorExtract final
c577f91dSCharitha Saumya    : public OpConversionPattern<vector::ExtractOp> {
c577f91dSCharitha Saumya  using OpConversionPattern::OpConversionPattern;
c577f91dSCharitha Saumya  LinearizeVectorExtract(
c577f91dSCharitha Saumya      const TypeConverter &typeConverter, MLIRContext *context,
c577f91dSCharitha Saumya      unsigned targetVectBitWidth = std::numeric_limits<unsigned>::max(),
c577f91dSCharitha Saumya      PatternBenefit benefit = 1)
c577f91dSCharitha Saumya      : OpConversionPattern(typeConverter, context, benefit),
c577f91dSCharitha Saumya        targetVectorBitWidth(targetVectBitWidth) {}
c577f91dSCharitha Saumya  LogicalResult
c577f91dSCharitha Saumya  matchAndRewrite(vector::ExtractOp extractOp, OpAdaptor adaptor,
c577f91dSCharitha Saumya                  ConversionPatternRewriter &rewriter) const override {
c577f91dSCharitha Saumya    Type dstTy = getTypeConverter()->convertType(extractOp.getType());
50febdebSLongsheng Mou    if (!dstTy)
50febdebSLongsheng Mou      return rewriter.notifyMatchFailure(extractOp,
50febdebSLongsheng Mou                                         "expected n-D vector type.");
50febdebSLongsheng Mou
74a105adSArtem Kroviakov    if (extractOp.getVector().getType().isScalable() ||
74a105adSArtem Kroviakov        cast<VectorType>(dstTy).isScalable())
74a105adSArtem Kroviakov      return rewriter.notifyMatchFailure(extractOp,
c577f91dSCharitha Saumya                                         "scalable vectors are not supported.");
c577f91dSCharitha Saumya    if (!isLessThanTargetBitWidth(extractOp, targetVectorBitWidth))
c577f91dSCharitha Saumya      return rewriter.notifyMatchFailure(
c577f91dSCharitha Saumya          extractOp, "Can't flatten since targetBitWidth <= OpSize");
c577f91dSCharitha Saumya
c577f91dSCharitha Saumya    // Dynamic position is not supported.
c577f91dSCharitha Saumya    if (extractOp.hasDynamicPosition())
c577f91dSCharitha Saumya      return rewriter.notifyMatchFailure(extractOp,
c577f91dSCharitha Saumya                                         "dynamic position is not supported.");
c577f91dSCharitha Saumya
c577f91dSCharitha Saumya    llvm::ArrayRef<int64_t> shape = extractOp.getVector().getType().getShape();
c577f91dSCharitha Saumya    int64_t size = extractOp.getVector().getType().getNumElements();
c577f91dSCharitha Saumya
c577f91dSCharitha Saumya    // Compute linearized offset.
c577f91dSCharitha Saumya    int64_t linearizedOffset = 0;
c577f91dSCharitha Saumya    llvm::ArrayRef<int64_t> offsets = extractOp.getStaticPosition();
c577f91dSCharitha Saumya    for (auto [i, off] : llvm::enumerate(offsets)) {
c577f91dSCharitha Saumya      size /= shape[i];
c577f91dSCharitha Saumya      linearizedOffset += offsets[i] * size;
c577f91dSCharitha Saumya    }
c577f91dSCharitha Saumya
c577f91dSCharitha Saumya    llvm::SmallVector<int64_t, 2> indices(size);
c577f91dSCharitha Saumya    std::iota(indices.begin(), indices.end(), linearizedOffset);
c577f91dSCharitha Saumya    rewriter.replaceOpWithNewOp<vector::ShuffleOp>(
b4444dcaSBenjamin Maxwell        extractOp, dstTy, adaptor.getVector(), adaptor.getVector(), indices);
c577f91dSCharitha Saumya
c577f91dSCharitha Saumya    return success();
c577f91dSCharitha Saumya  }
c577f91dSCharitha Saumya
c577f91dSCharitha Saumyaprivate:
c577f91dSCharitha Saumya  unsigned targetVectorBitWidth;
c577f91dSCharitha Saumya};
01fbc565SArtem Kroviakov
01fbc565SArtem Kroviakov/// This pattern converts the InsertOp to a ShuffleOp that works on a
01fbc565SArtem Kroviakov/// linearized vector.
01fbc565SArtem Kroviakov/// Following,
01fbc565SArtem Kroviakov///   vector.insert %source %destination [ position ]
01fbc565SArtem Kroviakov/// is converted to :
01fbc565SArtem Kroviakov///   %source_1d = vector.shape_cast %source
01fbc565SArtem Kroviakov///   %destination_1d = vector.shape_cast %destination
01fbc565SArtem Kroviakov///   %out_1d = vector.shuffle %destination_1d, %source_1d [ shuffle_indices_1d
01fbc565SArtem Kroviakov///   ] %out_nd = vector.shape_cast %out_1d
01fbc565SArtem Kroviakov/// `shuffle_indices_1d` is computed using the position of the original insert.
01fbc565SArtem Kroviakovstruct LinearizeVectorInsert final
01fbc565SArtem Kroviakov    : public OpConversionPattern<vector::InsertOp> {
01fbc565SArtem Kroviakov  using OpConversionPattern::OpConversionPattern;
01fbc565SArtem Kroviakov  LinearizeVectorInsert(
01fbc565SArtem Kroviakov      const TypeConverter &typeConverter, MLIRContext *context,
01fbc565SArtem Kroviakov      unsigned targetVectBitWidth = std::numeric_limits<unsigned>::max(),
01fbc565SArtem Kroviakov      PatternBenefit benefit = 1)
01fbc565SArtem Kroviakov      : OpConversionPattern(typeConverter, context, benefit),
01fbc565SArtem Kroviakov        targetVectorBitWidth(targetVectBitWidth) {}
01fbc565SArtem Kroviakov  LogicalResult
01fbc565SArtem Kroviakov  matchAndRewrite(vector::InsertOp insertOp, OpAdaptor adaptor,
01fbc565SArtem Kroviakov                  ConversionPatternRewriter &rewriter) const override {
74a105adSArtem Kroviakov    VectorType dstTy = getTypeConverter()->convertType<VectorType>(
74a105adSArtem Kroviakov        insertOp.getDestVectorType());
74a105adSArtem Kroviakov    assert(dstTy && "vector type destination expected.");
74a105adSArtem Kroviakov    if (insertOp.getDestVectorType().isScalable() || dstTy.isScalable())
74a105adSArtem Kroviakov      return rewriter.notifyMatchFailure(insertOp,
01fbc565SArtem Kroviakov                                         "scalable vectors are not supported.");
01fbc565SArtem Kroviakov
01fbc565SArtem Kroviakov    if (!isLessThanOrEqualTargetBitWidth(insertOp.getSourceType(),
01fbc565SArtem Kroviakov                                         targetVectorBitWidth))
01fbc565SArtem Kroviakov      return rewriter.notifyMatchFailure(
01fbc565SArtem Kroviakov          insertOp, "Can't flatten since targetBitWidth < OpSize");
01fbc565SArtem Kroviakov
01fbc565SArtem Kroviakov    // dynamic position is not supported
01fbc565SArtem Kroviakov    if (insertOp.hasDynamicPosition())
01fbc565SArtem Kroviakov      return rewriter.notifyMatchFailure(insertOp,
01fbc565SArtem Kroviakov                                         "dynamic position is not supported.");
01fbc565SArtem Kroviakov    auto srcTy = insertOp.getSourceType();
01fbc565SArtem Kroviakov    auto srcAsVec = dyn_cast<VectorType>(srcTy);
01fbc565SArtem Kroviakov    uint64_t srcSize = 0;
01fbc565SArtem Kroviakov    if (srcAsVec) {
01fbc565SArtem Kroviakov      srcSize = srcAsVec.getNumElements();
01fbc565SArtem Kroviakov    } else {
01fbc565SArtem Kroviakov      return rewriter.notifyMatchFailure(insertOp,
01fbc565SArtem Kroviakov                                         "scalars are not supported.");
01fbc565SArtem Kroviakov    }
01fbc565SArtem Kroviakov
01fbc565SArtem Kroviakov    auto dstShape = insertOp.getDestVectorType().getShape();
01fbc565SArtem Kroviakov    const auto dstSize = insertOp.getDestVectorType().getNumElements();
01fbc565SArtem Kroviakov    auto dstSizeForOffsets = dstSize;
01fbc565SArtem Kroviakov
01fbc565SArtem Kroviakov    // compute linearized offset
01fbc565SArtem Kroviakov    int64_t linearizedOffset = 0;
01fbc565SArtem Kroviakov    auto offsetsNd = insertOp.getStaticPosition();
01fbc565SArtem Kroviakov    for (auto [dim, offset] : llvm::enumerate(offsetsNd)) {
01fbc565SArtem Kroviakov      dstSizeForOffsets /= dstShape[dim];
01fbc565SArtem Kroviakov      linearizedOffset += offset * dstSizeForOffsets;
01fbc565SArtem Kroviakov    }
01fbc565SArtem Kroviakov
01fbc565SArtem Kroviakov    llvm::SmallVector<int64_t, 2> indices(dstSize);
01fbc565SArtem Kroviakov    auto origValsUntil = indices.begin();
01fbc565SArtem Kroviakov    std::advance(origValsUntil, linearizedOffset);
01fbc565SArtem Kroviakov    std::iota(indices.begin(), origValsUntil,
01fbc565SArtem Kroviakov              0); // original values that remain [0, offset)
01fbc565SArtem Kroviakov    auto newValsUntil = origValsUntil;
01fbc565SArtem Kroviakov    std::advance(newValsUntil, srcSize);
01fbc565SArtem Kroviakov    std::iota(origValsUntil, newValsUntil,
01fbc565SArtem Kroviakov              dstSize); // new values [offset, offset+srcNumElements)
01fbc565SArtem Kroviakov    std::iota(newValsUntil, indices.end(),
01fbc565SArtem Kroviakov              linearizedOffset + srcSize); // the rest of original values
01fbc565SArtem Kroviakov                                           // [offset+srcNumElements, end)
01fbc565SArtem Kroviakov
01fbc565SArtem Kroviakov    rewriter.replaceOpWithNewOp<vector::ShuffleOp>(
b4444dcaSBenjamin Maxwell        insertOp, dstTy, adaptor.getDest(), adaptor.getSource(), indices);
01fbc565SArtem Kroviakov
01fbc565SArtem Kroviakov    return success();
01fbc565SArtem Kroviakov  }
01fbc565SArtem Kroviakov
01fbc565SArtem Kroviakovprivate:
01fbc565SArtem Kroviakov  unsigned targetVectorBitWidth;
01fbc565SArtem Kroviakov};
*bd5d361cSChao Chen
*bd5d361cSChao Chen/// This pattern converts the BitCastOp that works on nD (n > 1)
*bd5d361cSChao Chen/// vectors to a BitCastOp that works on linearized vectors.
*bd5d361cSChao Chen/// Following,
*bd5d361cSChao Chen///   vector.bitcast %v1: vector<4x2xf32> to vector<4x4xf16>
*bd5d361cSChao Chen/// is converted to :
*bd5d361cSChao Chen///   %v1_1d = vector.shape_cast %v1: vector<4x2xf32> to vector<8xf32>
*bd5d361cSChao Chen///   %out_1d = vector.bitcast %v1_1d: vector<8xf32> to vector<16xf16>
*bd5d361cSChao Chen///   %out_nd = vector.shape_cast %out_1d: vector<16xf16> to vector<4x4xf16>
*bd5d361cSChao Chenstruct LinearizeVectorBitCast final
*bd5d361cSChao Chen    : public OpConversionPattern<vector::BitCastOp> {
*bd5d361cSChao Chen  using OpConversionPattern::OpConversionPattern;
*bd5d361cSChao Chen  LinearizeVectorBitCast(
*bd5d361cSChao Chen      const TypeConverter &typeConverter, MLIRContext *context,
*bd5d361cSChao Chen      unsigned targetVectBitWidth = std::numeric_limits<unsigned>::max(),
*bd5d361cSChao Chen      PatternBenefit benefit = 1)
*bd5d361cSChao Chen      : OpConversionPattern(typeConverter, context, benefit),
*bd5d361cSChao Chen        targetVectorBitWidth(targetVectBitWidth) {}
*bd5d361cSChao Chen  LogicalResult
*bd5d361cSChao Chen  matchAndRewrite(vector::BitCastOp castOp, OpAdaptor adaptor,
*bd5d361cSChao Chen                  ConversionPatternRewriter &rewriter) const override {
*bd5d361cSChao Chen    Location loc = castOp.getLoc();
*bd5d361cSChao Chen    auto resType = getTypeConverter()->convertType(castOp.getType());
*bd5d361cSChao Chen    if (!resType)
*bd5d361cSChao Chen      return rewriter.notifyMatchFailure(loc, "can't convert return type.");
*bd5d361cSChao Chen
*bd5d361cSChao Chen    if (!isLessThanTargetBitWidth(castOp, targetVectorBitWidth))
*bd5d361cSChao Chen      return rewriter.notifyMatchFailure(
*bd5d361cSChao Chen          loc, "Can't flatten since targetBitWidth <= OpSize");
*bd5d361cSChao Chen
*bd5d361cSChao Chen    rewriter.replaceOpWithNewOp<vector::BitCastOp>(castOp, resType,
*bd5d361cSChao Chen                                                   adaptor.getSource());
*bd5d361cSChao Chen    return mlir::success();
*bd5d361cSChao Chen  }
*bd5d361cSChao Chen
*bd5d361cSChao Chenprivate:
*bd5d361cSChao Chen  unsigned targetVectorBitWidth;
*bd5d361cSChao Chen};
*bd5d361cSChao Chen
35ef3994SIvan Butygin} // namespace
35ef3994SIvan Butygin
35ef3994SIvan Butyginvoid mlir::vector::populateVectorLinearizeTypeConversionsAndLegality(
35ef3994SIvan Butygin    TypeConverter &typeConverter, RewritePatternSet &patterns,
6f5c4f2eSBalaji V. Iyer    ConversionTarget &target, unsigned targetBitWidth) {
6f5c4f2eSBalaji V. Iyer
35ef3994SIvan Butygin  typeConverter.addConversion([](VectorType type) -> std::optional<Type> {
d3aa92edSAndrzej Warzyński    if (!isLinearizableVector(type))
35ef3994SIvan Butygin      return type;
35ef3994SIvan Butygin
d3aa92edSAndrzej Warzyński    return VectorType::get(type.getNumElements(), type.getElementType(),
d3aa92edSAndrzej Warzyński                           type.isScalable());
35ef3994SIvan Butygin  });
35ef3994SIvan Butygin
35ef3994SIvan Butygin  auto materializeCast = [](OpBuilder &builder, Type type, ValueRange inputs,
35ef3994SIvan Butygin                            Location loc) -> Value {
35ef3994SIvan Butygin    if (inputs.size() != 1 || !isa<VectorType>(inputs.front().getType()) ||
35ef3994SIvan Butygin        !isa<VectorType>(type))
35ef3994SIvan Butygin      return nullptr;
35ef3994SIvan Butygin
35ef3994SIvan Butygin    return builder.create<vector::ShapeCastOp>(loc, type, inputs.front());
35ef3994SIvan Butygin  };
35ef3994SIvan Butygin  typeConverter.addSourceMaterialization(materializeCast);
35ef3994SIvan Butygin  typeConverter.addTargetMaterialization(materializeCast);
35ef3994SIvan Butygin  target.markUnknownOpDynamicallyLegal(
6f5c4f2eSBalaji V. Iyer      [=](Operation *op) -> std::optional<bool> {
*bd5d361cSChao Chen        if ((isa<arith::ConstantOp>(op) || isa<vector::BitCastOp>(op) ||
6f5c4f2eSBalaji V. Iyer             op->hasTrait<OpTrait::Vectorizable>())) {
6f5c4f2eSBalaji V. Iyer          return (isLessThanTargetBitWidth(op, targetBitWidth)
6f5c4f2eSBalaji V. Iyer                      ? typeConverter.isLegal(op)
6f5c4f2eSBalaji V. Iyer                      : true);
6f5c4f2eSBalaji V. Iyer        }
35ef3994SIvan Butygin        return std::nullopt;
35ef3994SIvan Butygin      });
35ef3994SIvan Butygin
*bd5d361cSChao Chen  patterns
*bd5d361cSChao Chen      .add<LinearizeConstant, LinearizeVectorizable, LinearizeVectorBitCast>(
6f5c4f2eSBalaji V. Iyer          typeConverter, patterns.getContext(), targetBitWidth);
35ef3994SIvan Butygin}
c577f91dSCharitha Saumya
c577f91dSCharitha Saumyavoid mlir::vector::populateVectorLinearizeShuffleLikeOpsPatterns(
206fad0eSMatthias Springer    const TypeConverter &typeConverter, RewritePatternSet &patterns,
c577f91dSCharitha Saumya    ConversionTarget &target, unsigned int targetBitWidth) {
c577f91dSCharitha Saumya  target.addDynamicallyLegalOp<vector::ShuffleOp>(
c577f91dSCharitha Saumya      [=](vector::ShuffleOp shuffleOp) -> bool {
c577f91dSCharitha Saumya        return isLessThanTargetBitWidth(shuffleOp, targetBitWidth)
c577f91dSCharitha Saumya                   ? (typeConverter.isLegal(shuffleOp) &&
fac349a1SChristian Sigg                      cast<mlir::VectorType>(shuffleOp.getResult().getType())
c577f91dSCharitha Saumya                              .getRank() == 1)
c577f91dSCharitha Saumya                   : true;
c577f91dSCharitha Saumya      });
c577f91dSCharitha Saumya  patterns.add<LinearizeVectorShuffle, LinearizeVectorExtract,
01fbc565SArtem Kroviakov               LinearizeVectorInsert, LinearizeVectorExtractStridedSlice>(
c577f91dSCharitha Saumya      typeConverter, patterns.getContext(), targetBitWidth);
c577f91dSCharitha Saumya}