1a1a68603SBenjamin Maxwell //===- LowerVectorInterleave.cpp - Lower 'vector.interleave' operation ----===//
2a1a68603SBenjamin Maxwell //
3a1a68603SBenjamin Maxwell // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4a1a68603SBenjamin Maxwell // See https://llvm.org/LICENSE.txt for license information.
5a1a68603SBenjamin Maxwell // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6a1a68603SBenjamin Maxwell //
7a1a68603SBenjamin Maxwell //===----------------------------------------------------------------------===//
8a1a68603SBenjamin Maxwell //
9a1a68603SBenjamin Maxwell // This file implements target-independent rewrites and utilities to lower the
10a1a68603SBenjamin Maxwell // 'vector.interleave' operation.
11a1a68603SBenjamin Maxwell //
12a1a68603SBenjamin Maxwell //===----------------------------------------------------------------------===//
13a1a68603SBenjamin Maxwell
14a1a68603SBenjamin Maxwell #include "mlir/Dialect/Vector/IR/VectorOps.h"
15a1a68603SBenjamin Maxwell #include "mlir/Dialect/Vector/Transforms/LoweringPatterns.h"
16a1a68603SBenjamin Maxwell #include "mlir/Dialect/Vector/Utils/VectorUtils.h"
17a1a68603SBenjamin Maxwell #include "mlir/IR/BuiltinTypes.h"
18a1a68603SBenjamin Maxwell #include "mlir/IR/PatternMatch.h"
19a1a68603SBenjamin Maxwell
20a1a68603SBenjamin Maxwell #define DEBUG_TYPE "vector-interleave-lowering"
21a1a68603SBenjamin Maxwell
22a1a68603SBenjamin Maxwell using namespace mlir;
23a1a68603SBenjamin Maxwell using namespace mlir::vector;
24a1a68603SBenjamin Maxwell
25a1a68603SBenjamin Maxwell namespace {
26a1a68603SBenjamin Maxwell
27a1a68603SBenjamin Maxwell /// A one-shot unrolling of vector.interleave to the `targetRank`.
28a1a68603SBenjamin Maxwell ///
29a1a68603SBenjamin Maxwell /// Example:
30a1a68603SBenjamin Maxwell ///
31a1a68603SBenjamin Maxwell /// ```mlir
32714aee31SJakub Kuderski /// vector.interleave %a, %b : vector<1x2x3x4xi64> -> vector<1x2x3x8xi64>
33a1a68603SBenjamin Maxwell /// ```
34a1a68603SBenjamin Maxwell /// Would be unrolled to:
35a1a68603SBenjamin Maxwell /// ```mlir
36a1a68603SBenjamin Maxwell /// %result = arith.constant dense<0> : vector<1x2x3x8xi64>
37a1a68603SBenjamin Maxwell /// %0 = vector.extract %a[0, 0, 0] ─┐
38a1a68603SBenjamin Maxwell /// : vector<4xi64> from vector<1x2x3x4xi64> |
39a1a68603SBenjamin Maxwell /// %1 = vector.extract %b[0, 0, 0] |
40a1a68603SBenjamin Maxwell /// : vector<4xi64> from vector<1x2x3x4xi64> | - Repeated 6x for
41714aee31SJakub Kuderski /// %2 = vector.interleave %0, %1 : | all leading positions
42714aee31SJakub Kuderski /// : vector<4xi64> -> vector<8xi64> |
43a1a68603SBenjamin Maxwell /// %3 = vector.insert %2, %result [0, 0, 0] |
44a1a68603SBenjamin Maxwell /// : vector<8xi64> into vector<1x2x3x8xi64> ┘
45a1a68603SBenjamin Maxwell /// ```
46a1a68603SBenjamin Maxwell ///
47a1a68603SBenjamin Maxwell /// Note: If any leading dimension before the `targetRank` is scalable the
48a1a68603SBenjamin Maxwell /// unrolling will stop before the scalable dimension.
49714aee31SJakub Kuderski class UnrollInterleaveOp final : public OpRewritePattern<vector::InterleaveOp> {
50a1a68603SBenjamin Maxwell public:
UnrollInterleaveOp(int64_t targetRank,MLIRContext * context,PatternBenefit benefit=1)51a1a68603SBenjamin Maxwell UnrollInterleaveOp(int64_t targetRank, MLIRContext *context,
52a1a68603SBenjamin Maxwell PatternBenefit benefit = 1)
53a1a68603SBenjamin Maxwell : OpRewritePattern(context, benefit), targetRank(targetRank){};
54a1a68603SBenjamin Maxwell
matchAndRewrite(vector::InterleaveOp op,PatternRewriter & rewriter) const55a1a68603SBenjamin Maxwell LogicalResult matchAndRewrite(vector::InterleaveOp op,
56a1a68603SBenjamin Maxwell PatternRewriter &rewriter) const override {
57a1a68603SBenjamin Maxwell VectorType resultType = op.getResultVectorType();
58a1a68603SBenjamin Maxwell auto unrollIterator = vector::createUnrollIterator(resultType, targetRank);
59a1a68603SBenjamin Maxwell if (!unrollIterator)
60a1a68603SBenjamin Maxwell return failure();
61a1a68603SBenjamin Maxwell
62a1a68603SBenjamin Maxwell auto loc = op.getLoc();
63a1a68603SBenjamin Maxwell Value result = rewriter.create<arith::ConstantOp>(
64a1a68603SBenjamin Maxwell loc, resultType, rewriter.getZeroAttr(resultType));
65a1a68603SBenjamin Maxwell for (auto position : *unrollIterator) {
66a1a68603SBenjamin Maxwell Value extractLhs = rewriter.create<ExtractOp>(loc, op.getLhs(), position);
67a1a68603SBenjamin Maxwell Value extractRhs = rewriter.create<ExtractOp>(loc, op.getRhs(), position);
68a1a68603SBenjamin Maxwell Value interleave =
69a1a68603SBenjamin Maxwell rewriter.create<InterleaveOp>(loc, extractLhs, extractRhs);
70a1a68603SBenjamin Maxwell result = rewriter.create<InsertOp>(loc, interleave, result, position);
71a1a68603SBenjamin Maxwell }
72a1a68603SBenjamin Maxwell
73a1a68603SBenjamin Maxwell rewriter.replaceOp(op, result);
74a1a68603SBenjamin Maxwell return success();
75a1a68603SBenjamin Maxwell }
76a1a68603SBenjamin Maxwell
77a1a68603SBenjamin Maxwell private:
78a1a68603SBenjamin Maxwell int64_t targetRank = 1;
79a1a68603SBenjamin Maxwell };
80a1a68603SBenjamin Maxwell
81*b87a80d4SMubashar Ahmad /// A one-shot unrolling of vector.deinterleave to the `targetRank`.
82*b87a80d4SMubashar Ahmad ///
83*b87a80d4SMubashar Ahmad /// Example:
84*b87a80d4SMubashar Ahmad ///
85*b87a80d4SMubashar Ahmad /// ```mlir
86*b87a80d4SMubashar Ahmad /// %0, %1 = vector.deinterleave %a : vector<1x2x3x8xi64> -> vector<1x2x3x4xi64>
87*b87a80d4SMubashar Ahmad /// ```
88*b87a80d4SMubashar Ahmad /// Would be unrolled to:
89*b87a80d4SMubashar Ahmad /// ```mlir
90*b87a80d4SMubashar Ahmad /// %result = arith.constant dense<0> : vector<1x2x3x4xi64>
91*b87a80d4SMubashar Ahmad /// %0 = vector.extract %a[0, 0, 0] ─┐
92*b87a80d4SMubashar Ahmad /// : vector<8xi64> from vector<1x2x3x8xi64> |
93*b87a80d4SMubashar Ahmad /// %1, %2 = vector.deinterleave %0 |
94*b87a80d4SMubashar Ahmad /// : vector<8xi64> -> vector<4xi64> | -- Initial deinterleave
95*b87a80d4SMubashar Ahmad /// %3 = vector.insert %1, %result [0, 0, 0] | operation unrolled.
96*b87a80d4SMubashar Ahmad /// : vector<4xi64> into vector<1x2x3x4xi64> |
97*b87a80d4SMubashar Ahmad /// %4 = vector.insert %2, %result [0, 0, 0] |
98*b87a80d4SMubashar Ahmad /// : vector<4xi64> into vector<1x2x3x4xi64> ┘
99*b87a80d4SMubashar Ahmad /// %5 = vector.extract %a[0, 0, 1] ─┐
100*b87a80d4SMubashar Ahmad /// : vector<8xi64> from vector<1x2x3x8xi64> |
101*b87a80d4SMubashar Ahmad /// %6, %7 = vector.deinterleave %5 |
102*b87a80d4SMubashar Ahmad /// : vector<8xi64> -> vector<4xi64> | -- Recursive pattern for
103*b87a80d4SMubashar Ahmad /// %8 = vector.insert %6, %3 [0, 0, 1] | subsequent unrolled
104*b87a80d4SMubashar Ahmad /// : vector<4xi64> into vector<1x2x3x4xi64> | deinterleave
105*b87a80d4SMubashar Ahmad /// %9 = vector.insert %7, %4 [0, 0, 1] | operations. Repeated
106*b87a80d4SMubashar Ahmad /// : vector<4xi64> into vector<1x2x3x4xi64> ┘ 5x in this case.
107*b87a80d4SMubashar Ahmad /// ```
108*b87a80d4SMubashar Ahmad ///
109*b87a80d4SMubashar Ahmad /// Note: If any leading dimension before the `targetRank` is scalable the
110*b87a80d4SMubashar Ahmad /// unrolling will stop before the scalable dimension.
111*b87a80d4SMubashar Ahmad class UnrollDeinterleaveOp final
112*b87a80d4SMubashar Ahmad : public OpRewritePattern<vector::DeinterleaveOp> {
113*b87a80d4SMubashar Ahmad public:
UnrollDeinterleaveOp(int64_t targetRank,MLIRContext * context,PatternBenefit benefit=1)114*b87a80d4SMubashar Ahmad UnrollDeinterleaveOp(int64_t targetRank, MLIRContext *context,
115*b87a80d4SMubashar Ahmad PatternBenefit benefit = 1)
116*b87a80d4SMubashar Ahmad : OpRewritePattern(context, benefit), targetRank(targetRank) {};
117*b87a80d4SMubashar Ahmad
matchAndRewrite(vector::DeinterleaveOp op,PatternRewriter & rewriter) const118*b87a80d4SMubashar Ahmad LogicalResult matchAndRewrite(vector::DeinterleaveOp op,
119*b87a80d4SMubashar Ahmad PatternRewriter &rewriter) const override {
120*b87a80d4SMubashar Ahmad VectorType resultType = op.getResultVectorType();
121*b87a80d4SMubashar Ahmad auto unrollIterator = vector::createUnrollIterator(resultType, targetRank);
122*b87a80d4SMubashar Ahmad if (!unrollIterator)
123*b87a80d4SMubashar Ahmad return failure();
124*b87a80d4SMubashar Ahmad
125*b87a80d4SMubashar Ahmad auto loc = op.getLoc();
126*b87a80d4SMubashar Ahmad Value emptyResult = rewriter.create<arith::ConstantOp>(
127*b87a80d4SMubashar Ahmad loc, resultType, rewriter.getZeroAttr(resultType));
128*b87a80d4SMubashar Ahmad Value evenResult = emptyResult;
129*b87a80d4SMubashar Ahmad Value oddResult = emptyResult;
130*b87a80d4SMubashar Ahmad
131*b87a80d4SMubashar Ahmad for (auto position : *unrollIterator) {
132*b87a80d4SMubashar Ahmad auto extractSrc =
133*b87a80d4SMubashar Ahmad rewriter.create<vector::ExtractOp>(loc, op.getSource(), position);
134*b87a80d4SMubashar Ahmad auto deinterleave =
135*b87a80d4SMubashar Ahmad rewriter.create<vector::DeinterleaveOp>(loc, extractSrc);
136*b87a80d4SMubashar Ahmad evenResult = rewriter.create<vector::InsertOp>(
137*b87a80d4SMubashar Ahmad loc, deinterleave.getRes1(), evenResult, position);
138*b87a80d4SMubashar Ahmad oddResult = rewriter.create<vector::InsertOp>(loc, deinterleave.getRes2(),
139*b87a80d4SMubashar Ahmad oddResult, position);
140*b87a80d4SMubashar Ahmad }
141*b87a80d4SMubashar Ahmad rewriter.replaceOp(op, ValueRange{evenResult, oddResult});
142*b87a80d4SMubashar Ahmad return success();
143*b87a80d4SMubashar Ahmad }
144*b87a80d4SMubashar Ahmad
145*b87a80d4SMubashar Ahmad private:
146*b87a80d4SMubashar Ahmad int64_t targetRank = 1;
147*b87a80d4SMubashar Ahmad };
148a1d43c14SBenoit Jacob /// Rewrite vector.interleave op into an equivalent vector.shuffle op, when
149a1d43c14SBenoit Jacob /// applicable: `sourceType` must be 1D and non-scalable.
150a1d43c14SBenoit Jacob ///
151a1d43c14SBenoit Jacob /// Example:
152a1d43c14SBenoit Jacob ///
153a1d43c14SBenoit Jacob /// ```mlir
154714aee31SJakub Kuderski /// vector.interleave %a, %b : vector<7xi16> -> vector<14xi16>
155a1d43c14SBenoit Jacob /// ```
156a1d43c14SBenoit Jacob ///
157a1d43c14SBenoit Jacob /// Is rewritten into:
158a1d43c14SBenoit Jacob ///
159a1d43c14SBenoit Jacob /// ```mlir
160a1d43c14SBenoit Jacob /// vector.shuffle %arg0, %arg1 [0, 7, 1, 8, 2, 9, 3, 10, 4, 11, 5, 12, 6, 13]
161a1d43c14SBenoit Jacob /// : vector<7xi16>, vector<7xi16>
162a1d43c14SBenoit Jacob /// ```
163714aee31SJakub Kuderski struct InterleaveToShuffle final : OpRewritePattern<vector::InterleaveOp> {
164714aee31SJakub Kuderski using OpRewritePattern::OpRewritePattern;
165a1d43c14SBenoit Jacob
matchAndRewrite__anon4ebd91ac0111::InterleaveToShuffle166a1d43c14SBenoit Jacob LogicalResult matchAndRewrite(vector::InterleaveOp op,
167a1d43c14SBenoit Jacob PatternRewriter &rewriter) const override {
168a1d43c14SBenoit Jacob VectorType sourceType = op.getSourceVectorType();
169a1d43c14SBenoit Jacob if (sourceType.getRank() != 1 || sourceType.isScalable()) {
170a1d43c14SBenoit Jacob return failure();
171a1d43c14SBenoit Jacob }
172a1d43c14SBenoit Jacob int64_t n = sourceType.getNumElements();
173a1d43c14SBenoit Jacob auto seq = llvm::seq<int64_t>(2 * n);
174a1d43c14SBenoit Jacob auto zip = llvm::to_vector(llvm::map_range(
175a1d43c14SBenoit Jacob seq, [n](int64_t i) { return (i % 2 ? n : 0) + i / 2; }));
176a1d43c14SBenoit Jacob rewriter.replaceOpWithNewOp<ShuffleOp>(op, op.getLhs(), op.getRhs(), zip);
177a1d43c14SBenoit Jacob return success();
178a1d43c14SBenoit Jacob }
179a1d43c14SBenoit Jacob };
180a1d43c14SBenoit Jacob
181a1a68603SBenjamin Maxwell } // namespace
182a1a68603SBenjamin Maxwell
populateVectorInterleaveLoweringPatterns(RewritePatternSet & patterns,int64_t targetRank,PatternBenefit benefit)183a1a68603SBenjamin Maxwell void mlir::vector::populateVectorInterleaveLoweringPatterns(
184a1a68603SBenjamin Maxwell RewritePatternSet &patterns, int64_t targetRank, PatternBenefit benefit) {
185*b87a80d4SMubashar Ahmad patterns.add<UnrollInterleaveOp, UnrollDeinterleaveOp>(
186*b87a80d4SMubashar Ahmad targetRank, patterns.getContext(), benefit);
187a1a68603SBenjamin Maxwell }
188a1d43c14SBenoit Jacob
populateVectorInterleaveToShufflePatterns(RewritePatternSet & patterns,PatternBenefit benefit)189a1d43c14SBenoit Jacob void mlir::vector::populateVectorInterleaveToShufflePatterns(
190a1d43c14SBenoit Jacob RewritePatternSet &patterns, PatternBenefit benefit) {
191a1d43c14SBenoit Jacob patterns.add<InterleaveToShuffle>(patterns.getContext(), benefit);
192a1d43c14SBenoit Jacob }
193