xref: /llvm-project/mlir/test/Conversion/GPUCommon/transfer_write.mlir (revision 099fd018d1b04013ef46c0e26ed008585ab8bcbb)
1// RUN: mlir-opt %s --gpu-to-llvm | FileCheck %s
2
3// CHECK-LABEL: @warp_extract
4// CHECK-SAME: %[[VEC:[a-zA-Z0-9_]+]]: vector<1xf32>
5// CHECK:%[[BASE:[0-9]+]] = llvm.extractvalue
6// CHECK:%[[PTR:[0-9]+]] = llvm.getelementptr %[[BASE]]
7// CHECK:llvm.store %[[VEC]], %[[PTR]] {alignment = 4 : i64} : vector<1xf32>, !llvm.ptr
8
// Test input: writes the one-element vector %arg2 to position [0, 0] of the
// 1024x1024 memref %arg1 from inside a gpu.warp_execute_on_lane_0 region that
// is driven by %arg0. The FileCheck patterns at the top of this file describe
// the LLVM-dialect output expected once --gpu-to-llvm has run.
func.func @warp_extract(
    %arg0: index,
    %arg1: memref<1024x1024xf32>,
    %arg2: vector<1xf32>) {
  // A single zero index is reused for both memref dimensions.
  %zero = arith.constant 0 : index
  gpu.warp_execute_on_lane_0(%arg0)[32] {
    // The write itself is the operation under test; the patterns expect it to
    // become an address computation followed by one llvm.store of the vector.
    vector.transfer_write %arg2, %arg1[%zero, %zero] {in_bounds = [true]}
        : vector<1xf32>, memref<1024x1024xf32>
  }
  return
}
16