xref: /llvm-project/mlir/lib/Dialect/Vector/Transforms/LowerVectorInterleave.cpp (revision db791b278a414fb6df1acc1799adcf11d8fb9169)
//===- LowerVectorInterleave.cpp - Lower 'vector.interleave' operation ----===//
//
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//
//===----------------------------------------------------------------------===//
//
// This file implements target-independent rewrites and utilities to lower the
// 'vector.interleave' operation.
//
//===----------------------------------------------------------------------===//
13a1a68603SBenjamin Maxwell 
14a1a68603SBenjamin Maxwell #include "mlir/Dialect/Vector/IR/VectorOps.h"
15a1a68603SBenjamin Maxwell #include "mlir/Dialect/Vector/Transforms/LoweringPatterns.h"
16a1a68603SBenjamin Maxwell #include "mlir/Dialect/Vector/Utils/VectorUtils.h"
17a1a68603SBenjamin Maxwell #include "mlir/IR/BuiltinTypes.h"
18a1a68603SBenjamin Maxwell #include "mlir/IR/PatternMatch.h"
19a1a68603SBenjamin Maxwell 
20a1a68603SBenjamin Maxwell #define DEBUG_TYPE "vector-interleave-lowering"
21a1a68603SBenjamin Maxwell 
22a1a68603SBenjamin Maxwell using namespace mlir;
23a1a68603SBenjamin Maxwell using namespace mlir::vector;
24a1a68603SBenjamin Maxwell 
25a1a68603SBenjamin Maxwell namespace {
26a1a68603SBenjamin Maxwell 
27a1a68603SBenjamin Maxwell /// A one-shot unrolling of vector.interleave to the `targetRank`.
28a1a68603SBenjamin Maxwell ///
29a1a68603SBenjamin Maxwell /// Example:
30a1a68603SBenjamin Maxwell ///
31a1a68603SBenjamin Maxwell /// ```mlir
32714aee31SJakub Kuderski /// vector.interleave %a, %b : vector<1x2x3x4xi64> -> vector<1x2x3x8xi64>
33a1a68603SBenjamin Maxwell /// ```
34a1a68603SBenjamin Maxwell /// Would be unrolled to:
35a1a68603SBenjamin Maxwell /// ```mlir
36a1a68603SBenjamin Maxwell /// %result = arith.constant dense<0> : vector<1x2x3x8xi64>
37a1a68603SBenjamin Maxwell /// %0 = vector.extract %a[0, 0, 0]                 ─┐
38a1a68603SBenjamin Maxwell ///        : vector<4xi64> from vector<1x2x3x4xi64>  |
39a1a68603SBenjamin Maxwell /// %1 = vector.extract %b[0, 0, 0]                  |
40a1a68603SBenjamin Maxwell ///        : vector<4xi64> from vector<1x2x3x4xi64>  | - Repeated 6x for
41714aee31SJakub Kuderski /// %2 = vector.interleave %0, %1 :                  |   all leading positions
42714aee31SJakub Kuderski ///        : vector<4xi64> -> vector<8xi64>          |
43a1a68603SBenjamin Maxwell /// %3 = vector.insert %2, %result [0, 0, 0]         |
44a1a68603SBenjamin Maxwell ///        : vector<8xi64> into vector<1x2x3x8xi64>  ┘
45a1a68603SBenjamin Maxwell /// ```
46a1a68603SBenjamin Maxwell ///
47a1a68603SBenjamin Maxwell /// Note: If any leading dimension before the `targetRank` is scalable the
48a1a68603SBenjamin Maxwell /// unrolling will stop before the scalable dimension.
49714aee31SJakub Kuderski class UnrollInterleaveOp final : public OpRewritePattern<vector::InterleaveOp> {
50a1a68603SBenjamin Maxwell public:
UnrollInterleaveOp(int64_t targetRank,MLIRContext * context,PatternBenefit benefit=1)51a1a68603SBenjamin Maxwell   UnrollInterleaveOp(int64_t targetRank, MLIRContext *context,
52a1a68603SBenjamin Maxwell                      PatternBenefit benefit = 1)
53a1a68603SBenjamin Maxwell       : OpRewritePattern(context, benefit), targetRank(targetRank){};
54a1a68603SBenjamin Maxwell 
matchAndRewrite(vector::InterleaveOp op,PatternRewriter & rewriter) const55a1a68603SBenjamin Maxwell   LogicalResult matchAndRewrite(vector::InterleaveOp op,
56a1a68603SBenjamin Maxwell                                 PatternRewriter &rewriter) const override {
57a1a68603SBenjamin Maxwell     VectorType resultType = op.getResultVectorType();
58a1a68603SBenjamin Maxwell     auto unrollIterator = vector::createUnrollIterator(resultType, targetRank);
59a1a68603SBenjamin Maxwell     if (!unrollIterator)
60a1a68603SBenjamin Maxwell       return failure();
61a1a68603SBenjamin Maxwell 
62a1a68603SBenjamin Maxwell     auto loc = op.getLoc();
63a1a68603SBenjamin Maxwell     Value result = rewriter.create<arith::ConstantOp>(
64a1a68603SBenjamin Maxwell         loc, resultType, rewriter.getZeroAttr(resultType));
65a1a68603SBenjamin Maxwell     for (auto position : *unrollIterator) {
66a1a68603SBenjamin Maxwell       Value extractLhs = rewriter.create<ExtractOp>(loc, op.getLhs(), position);
67a1a68603SBenjamin Maxwell       Value extractRhs = rewriter.create<ExtractOp>(loc, op.getRhs(), position);
68a1a68603SBenjamin Maxwell       Value interleave =
69a1a68603SBenjamin Maxwell           rewriter.create<InterleaveOp>(loc, extractLhs, extractRhs);
70a1a68603SBenjamin Maxwell       result = rewriter.create<InsertOp>(loc, interleave, result, position);
71a1a68603SBenjamin Maxwell     }
72a1a68603SBenjamin Maxwell 
73a1a68603SBenjamin Maxwell     rewriter.replaceOp(op, result);
74a1a68603SBenjamin Maxwell     return success();
75a1a68603SBenjamin Maxwell   }
76a1a68603SBenjamin Maxwell 
77a1a68603SBenjamin Maxwell private:
78a1a68603SBenjamin Maxwell   int64_t targetRank = 1;
79a1a68603SBenjamin Maxwell };
80a1a68603SBenjamin Maxwell 
81*b87a80d4SMubashar Ahmad /// A one-shot unrolling of vector.deinterleave to the `targetRank`.
82*b87a80d4SMubashar Ahmad ///
83*b87a80d4SMubashar Ahmad /// Example:
84*b87a80d4SMubashar Ahmad ///
85*b87a80d4SMubashar Ahmad /// ```mlir
86*b87a80d4SMubashar Ahmad /// %0, %1 = vector.deinterleave %a : vector<1x2x3x8xi64> -> vector<1x2x3x4xi64>
87*b87a80d4SMubashar Ahmad /// ```
88*b87a80d4SMubashar Ahmad /// Would be unrolled to:
89*b87a80d4SMubashar Ahmad /// ```mlir
90*b87a80d4SMubashar Ahmad /// %result = arith.constant dense<0> : vector<1x2x3x4xi64>
91*b87a80d4SMubashar Ahmad /// %0 = vector.extract %a[0, 0, 0]                  ─┐
92*b87a80d4SMubashar Ahmad ///        : vector<8xi64> from vector<1x2x3x8xi64>   |
93*b87a80d4SMubashar Ahmad /// %1, %2 = vector.deinterleave %0                   |
94*b87a80d4SMubashar Ahmad ///        : vector<8xi64> -> vector<4xi64>           | -- Initial deinterleave
95*b87a80d4SMubashar Ahmad /// %3 = vector.insert %1, %result [0, 0, 0]          |    operation unrolled.
96*b87a80d4SMubashar Ahmad ///        : vector<4xi64> into vector<1x2x3x4xi64>   |
97*b87a80d4SMubashar Ahmad /// %4 = vector.insert %2, %result [0, 0, 0]          |
98*b87a80d4SMubashar Ahmad ///        : vector<4xi64> into vector<1x2x3x4xi64>   ┘
99*b87a80d4SMubashar Ahmad /// %5 = vector.extract %a[0, 0, 1]                  ─┐
100*b87a80d4SMubashar Ahmad ///        : vector<8xi64> from vector<1x2x3x8xi64>   |
101*b87a80d4SMubashar Ahmad /// %6, %7 = vector.deinterleave %5                   |
102*b87a80d4SMubashar Ahmad ///        : vector<8xi64> -> vector<4xi64>           | -- Recursive pattern for
103*b87a80d4SMubashar Ahmad /// %8 = vector.insert %6, %3 [0, 0, 1]               |    subsequent unrolled
104*b87a80d4SMubashar Ahmad ///        : vector<4xi64> into vector<1x2x3x4xi64>   |    deinterleave
105*b87a80d4SMubashar Ahmad /// %9 = vector.insert %7, %4 [0, 0, 1]               |    operations. Repeated
106*b87a80d4SMubashar Ahmad ///        : vector<4xi64> into vector<1x2x3x4xi64>   ┘    5x in this case.
107*b87a80d4SMubashar Ahmad /// ```
108*b87a80d4SMubashar Ahmad ///
109*b87a80d4SMubashar Ahmad /// Note: If any leading dimension before the `targetRank` is scalable the
110*b87a80d4SMubashar Ahmad /// unrolling will stop before the scalable dimension.
111*b87a80d4SMubashar Ahmad class UnrollDeinterleaveOp final
112*b87a80d4SMubashar Ahmad     : public OpRewritePattern<vector::DeinterleaveOp> {
113*b87a80d4SMubashar Ahmad public:
UnrollDeinterleaveOp(int64_t targetRank,MLIRContext * context,PatternBenefit benefit=1)114*b87a80d4SMubashar Ahmad   UnrollDeinterleaveOp(int64_t targetRank, MLIRContext *context,
115*b87a80d4SMubashar Ahmad                        PatternBenefit benefit = 1)
116*b87a80d4SMubashar Ahmad       : OpRewritePattern(context, benefit), targetRank(targetRank) {};
117*b87a80d4SMubashar Ahmad 
matchAndRewrite(vector::DeinterleaveOp op,PatternRewriter & rewriter) const118*b87a80d4SMubashar Ahmad   LogicalResult matchAndRewrite(vector::DeinterleaveOp op,
119*b87a80d4SMubashar Ahmad                                 PatternRewriter &rewriter) const override {
120*b87a80d4SMubashar Ahmad     VectorType resultType = op.getResultVectorType();
121*b87a80d4SMubashar Ahmad     auto unrollIterator = vector::createUnrollIterator(resultType, targetRank);
122*b87a80d4SMubashar Ahmad     if (!unrollIterator)
123*b87a80d4SMubashar Ahmad       return failure();
124*b87a80d4SMubashar Ahmad 
125*b87a80d4SMubashar Ahmad     auto loc = op.getLoc();
126*b87a80d4SMubashar Ahmad     Value emptyResult = rewriter.create<arith::ConstantOp>(
127*b87a80d4SMubashar Ahmad         loc, resultType, rewriter.getZeroAttr(resultType));
128*b87a80d4SMubashar Ahmad     Value evenResult = emptyResult;
129*b87a80d4SMubashar Ahmad     Value oddResult = emptyResult;
130*b87a80d4SMubashar Ahmad 
131*b87a80d4SMubashar Ahmad     for (auto position : *unrollIterator) {
132*b87a80d4SMubashar Ahmad       auto extractSrc =
133*b87a80d4SMubashar Ahmad           rewriter.create<vector::ExtractOp>(loc, op.getSource(), position);
134*b87a80d4SMubashar Ahmad       auto deinterleave =
135*b87a80d4SMubashar Ahmad           rewriter.create<vector::DeinterleaveOp>(loc, extractSrc);
136*b87a80d4SMubashar Ahmad       evenResult = rewriter.create<vector::InsertOp>(
137*b87a80d4SMubashar Ahmad           loc, deinterleave.getRes1(), evenResult, position);
138*b87a80d4SMubashar Ahmad       oddResult = rewriter.create<vector::InsertOp>(loc, deinterleave.getRes2(),
139*b87a80d4SMubashar Ahmad                                                     oddResult, position);
140*b87a80d4SMubashar Ahmad     }
141*b87a80d4SMubashar Ahmad     rewriter.replaceOp(op, ValueRange{evenResult, oddResult});
142*b87a80d4SMubashar Ahmad     return success();
143*b87a80d4SMubashar Ahmad   }
144*b87a80d4SMubashar Ahmad 
145*b87a80d4SMubashar Ahmad private:
146*b87a80d4SMubashar Ahmad   int64_t targetRank = 1;
147*b87a80d4SMubashar Ahmad };
148a1d43c14SBenoit Jacob /// Rewrite vector.interleave op into an equivalent vector.shuffle op, when
149a1d43c14SBenoit Jacob /// applicable: `sourceType` must be 1D and non-scalable.
150a1d43c14SBenoit Jacob ///
151a1d43c14SBenoit Jacob /// Example:
152a1d43c14SBenoit Jacob ///
153a1d43c14SBenoit Jacob /// ```mlir
154714aee31SJakub Kuderski /// vector.interleave %a, %b : vector<7xi16> -> vector<14xi16>
155a1d43c14SBenoit Jacob /// ```
156a1d43c14SBenoit Jacob ///
157a1d43c14SBenoit Jacob /// Is rewritten into:
158a1d43c14SBenoit Jacob ///
159a1d43c14SBenoit Jacob /// ```mlir
160a1d43c14SBenoit Jacob /// vector.shuffle %arg0, %arg1 [0, 7, 1, 8, 2, 9, 3, 10, 4, 11, 5, 12, 6, 13]
161a1d43c14SBenoit Jacob ///   : vector<7xi16>, vector<7xi16>
162a1d43c14SBenoit Jacob /// ```
163714aee31SJakub Kuderski struct InterleaveToShuffle final : OpRewritePattern<vector::InterleaveOp> {
164714aee31SJakub Kuderski   using OpRewritePattern::OpRewritePattern;
165a1d43c14SBenoit Jacob 
matchAndRewrite__anon4ebd91ac0111::InterleaveToShuffle166a1d43c14SBenoit Jacob   LogicalResult matchAndRewrite(vector::InterleaveOp op,
167a1d43c14SBenoit Jacob                                 PatternRewriter &rewriter) const override {
168a1d43c14SBenoit Jacob     VectorType sourceType = op.getSourceVectorType();
169a1d43c14SBenoit Jacob     if (sourceType.getRank() != 1 || sourceType.isScalable()) {
170a1d43c14SBenoit Jacob       return failure();
171a1d43c14SBenoit Jacob     }
172a1d43c14SBenoit Jacob     int64_t n = sourceType.getNumElements();
173a1d43c14SBenoit Jacob     auto seq = llvm::seq<int64_t>(2 * n);
174a1d43c14SBenoit Jacob     auto zip = llvm::to_vector(llvm::map_range(
175a1d43c14SBenoit Jacob         seq, [n](int64_t i) { return (i % 2 ? n : 0) + i / 2; }));
176a1d43c14SBenoit Jacob     rewriter.replaceOpWithNewOp<ShuffleOp>(op, op.getLhs(), op.getRhs(), zip);
177a1d43c14SBenoit Jacob     return success();
178a1d43c14SBenoit Jacob   }
179a1d43c14SBenoit Jacob };
180a1d43c14SBenoit Jacob 
181a1a68603SBenjamin Maxwell } // namespace
182a1a68603SBenjamin Maxwell 
populateVectorInterleaveLoweringPatterns(RewritePatternSet & patterns,int64_t targetRank,PatternBenefit benefit)183a1a68603SBenjamin Maxwell void mlir::vector::populateVectorInterleaveLoweringPatterns(
184a1a68603SBenjamin Maxwell     RewritePatternSet &patterns, int64_t targetRank, PatternBenefit benefit) {
185*b87a80d4SMubashar Ahmad   patterns.add<UnrollInterleaveOp, UnrollDeinterleaveOp>(
186*b87a80d4SMubashar Ahmad       targetRank, patterns.getContext(), benefit);
187a1a68603SBenjamin Maxwell }
188a1d43c14SBenoit Jacob 
populateVectorInterleaveToShufflePatterns(RewritePatternSet & patterns,PatternBenefit benefit)189a1d43c14SBenoit Jacob void mlir::vector::populateVectorInterleaveToShufflePatterns(
190a1d43c14SBenoit Jacob     RewritePatternSet &patterns, PatternBenefit benefit) {
191a1d43c14SBenoit Jacob   patterns.add<InterleaveToShuffle>(patterns.getContext(), benefit);
192a1d43c14SBenoit Jacob }
193