xref: /llvm-project/llvm/test/CodeGen/SPIRV/transcoding/OpenCL/barrier.ll (revision 0a443f13b49b3f392461a0bb60b0146cfc4607c7)
113453c98SAndrey Tretyakov; RUN: llc -O0 -mtriple=spirv32-unknown-unknown %s -o - | FileCheck %s --check-prefix=CHECK-SPIRV
2*0a443f13SVyacheslav Levytskyy; RUN: %if spirv-tools %{ llc -O0 -mtriple=spirv32-unknown-unknown %s -o - -filetype=obj | spirv-val %}
313453c98SAndrey Tretyakov
413453c98SAndrey Tretyakov;; This test checks that the backend is capable to correctly translate
513453c98SAndrey Tretyakov;; barrier OpenCL C 1.2 built-in function [1] into corresponding SPIR-V
613453c98SAndrey Tretyakov;; instruction.
713453c98SAndrey Tretyakov
813453c98SAndrey Tretyakov;; FIXME: Strictly speaking, this flag is not supported by barrier in OpenCL 1.2
913453c98SAndrey Tretyakov;; #define CLK_IMAGE_MEM_FENCE 0x04
1013453c98SAndrey Tretyakov;;
1113453c98SAndrey Tretyakov;; void __attribute__((overloadable)) __attribute__((convergent)) barrier(cl_mem_fence_flags);
1213453c98SAndrey Tretyakov;;
1313453c98SAndrey Tretyakov;; __kernel void test_barrier_const_flags() {
1413453c98SAndrey Tretyakov;;   barrier(CLK_LOCAL_MEM_FENCE);
1513453c98SAndrey Tretyakov;;   barrier(CLK_GLOBAL_MEM_FENCE);
1613453c98SAndrey Tretyakov;;   barrier(CLK_IMAGE_MEM_FENCE);
1713453c98SAndrey Tretyakov;;
1813453c98SAndrey Tretyakov;;   barrier(CLK_LOCAL_MEM_FENCE | CLK_GLOBAL_MEM_FENCE);
1913453c98SAndrey Tretyakov;;   barrier(CLK_LOCAL_MEM_FENCE | CLK_IMAGE_MEM_FENCE);
2013453c98SAndrey Tretyakov;;   barrier(CLK_GLOBAL_MEM_FENCE | CLK_LOCAL_MEM_FENCE | CLK_IMAGE_MEM_FENCE);
2113453c98SAndrey Tretyakov;; }
2213453c98SAndrey Tretyakov;;
2313453c98SAndrey Tretyakov;; __kernel void test_barrier_non_const_flags(cl_mem_fence_flags flags) {
2413453c98SAndrey Tretyakov  ;; FIXME: OpenCL spec doesn't require flags to be compile-time known
2513453c98SAndrey Tretyakov  ;; barrier(flags);
2613453c98SAndrey Tretyakov;; }
2713453c98SAndrey Tretyakov
2813453c98SAndrey Tretyakov; CHECK-SPIRV: OpName %[[#TEST_CONST_FLAGS:]] "test_barrier_const_flags"
2913453c98SAndrey Tretyakov; CHECK-SPIRV: %[[#UINT:]] = OpTypeInt 32 0
3013453c98SAndrey Tretyakov
3113453c98SAndrey Tretyakov;; In SPIR-V, barrier is represented as OpControlBarrier [3] and OpenCL
3213453c98SAndrey Tretyakov;; cl_mem_fence_flags are represented as part of Memory Semantics [2], which
3313453c98SAndrey Tretyakov;; also includes memory order constraints. The backend applies some default
3413453c98SAndrey Tretyakov;; memory order for OpControlBarrier and therefore, constants below include a
3513453c98SAndrey Tretyakov;; bit more information than original source
3613453c98SAndrey Tretyakov
3713453c98SAndrey Tretyakov;; 0x10 SequentiallyConsistent + 0x100 WorkgroupMemory
3813453c98SAndrey Tretyakov; CHECK-SPIRV:     %[[#LOCAL:]] = OpConstant %[[#UINT]] 272
3913453c98SAndrey Tretyakov;; 0x2 Workgroup
4013453c98SAndrey Tretyakov; CHECK-SPIRV:     %[[#WG:]] = OpConstant %[[#UINT]] 2
4113453c98SAndrey Tretyakov;; 0x10 SequentiallyConsistent + 0x200 CrossWorkgroupMemory
4213453c98SAndrey Tretyakov; CHECK-SPIRV-DAG: %[[#GLOBAL:]] = OpConstant %[[#UINT]] 528
4313453c98SAndrey Tretyakov;; 0x10 SequentiallyConsistent + 0x800 ImageMemory
4413453c98SAndrey Tretyakov; CHECK-SPIRV-DAG: %[[#IMAGE:]] = OpConstant %[[#UINT]] 2064
4513453c98SAndrey Tretyakov;; 0x10 SequentiallyConsistent + 0x100 WorkgroupMemory + 0x200 CrossWorkgroupMemory
4613453c98SAndrey Tretyakov; CHECK-SPIRV-DAG: %[[#LOCAL_GLOBAL:]] = OpConstant %[[#UINT]] 784
4713453c98SAndrey Tretyakov;; 0x10 SequentiallyConsistent + 0x100 WorkgroupMemory + 0x800 ImageMemory
4813453c98SAndrey Tretyakov; CHECK-SPIRV-DAG: %[[#LOCAL_IMAGE:]] = OpConstant %[[#UINT]] 2320
4913453c98SAndrey Tretyakov;; 0x10 SequentiallyConsistent + 0x100 WorkgroupMemory + 0x200 CrossWorkgroupMemory + 0x800 ImageMemory
5013453c98SAndrey Tretyakov; CHECK-SPIRV-DAG: %[[#LOCAL_GLOBAL_IMAGE:]] = OpConstant %[[#UINT]] 2832
5113453c98SAndrey Tretyakov
5213453c98SAndrey Tretyakov; CHECK-SPIRV: %[[#TEST_CONST_FLAGS]] = OpFunction %[[#]]
5313453c98SAndrey Tretyakov; CHECK-SPIRV: OpControlBarrier %[[#WG]] %[[#WG]] %[[#LOCAL]]
5413453c98SAndrey Tretyakov; CHECK-SPIRV: OpControlBarrier %[[#WG]] %[[#WG]] %[[#GLOBAL]]
5513453c98SAndrey Tretyakov; CHECK-SPIRV: OpControlBarrier %[[#WG]] %[[#WG]] %[[#IMAGE]]
5613453c98SAndrey Tretyakov; CHECK-SPIRV: OpControlBarrier %[[#WG]] %[[#WG]] %[[#LOCAL_GLOBAL]]
5713453c98SAndrey Tretyakov; CHECK-SPIRV: OpControlBarrier %[[#WG]] %[[#WG]] %[[#LOCAL_IMAGE]]
5813453c98SAndrey Tretyakov; CHECK-SPIRV: OpControlBarrier %[[#WG]] %[[#WG]] %[[#LOCAL_GLOBAL_IMAGE]]
5913453c98SAndrey Tretyakov
6013453c98SAndrey Tretyakovdefine dso_local spir_kernel void @test_barrier_const_flags() local_unnamed_addr {
6113453c98SAndrey Tretyakoventry:
6213453c98SAndrey Tretyakov  tail call spir_func void @_Z7barrierj(i32 noundef 1)
6313453c98SAndrey Tretyakov  tail call spir_func void @_Z7barrierj(i32 noundef 2)
6413453c98SAndrey Tretyakov  tail call spir_func void @_Z7barrierj(i32 noundef 4)
6513453c98SAndrey Tretyakov  tail call spir_func void @_Z7barrierj(i32 noundef 3)
6613453c98SAndrey Tretyakov  tail call spir_func void @_Z7barrierj(i32 noundef 5)
6713453c98SAndrey Tretyakov  tail call spir_func void @_Z7barrierj(i32 noundef 7)
6813453c98SAndrey Tretyakov  ret void
6913453c98SAndrey Tretyakov}
7013453c98SAndrey Tretyakov
7113453c98SAndrey Tretyakovdeclare spir_func void @_Z7barrierj(i32 noundef) local_unnamed_addr
7213453c98SAndrey Tretyakov
7313453c98SAndrey Tretyakovdefine dso_local spir_kernel void @test_barrier_non_const_flags(i32 noundef %flags) local_unnamed_addr {
7413453c98SAndrey Tretyakoventry:
7513453c98SAndrey Tretyakov  ret void
7613453c98SAndrey Tretyakov}
7713453c98SAndrey Tretyakov
7813453c98SAndrey Tretyakov;; References:
7913453c98SAndrey Tretyakov;; [1]: https://www.khronos.org/registry/OpenCL/sdk/1.2/docs/man/xhtml/barrier.html
8013453c98SAndrey Tretyakov;; [2]: https://www.khronos.org/registry/spir-v/specs/unified1/SPIRV.html#_a_id_memory_semantics__id_a_memory_semantics_lt_id_gt
8113453c98SAndrey Tretyakov;; [3]: https://www.khronos.org/registry/spir-v/specs/unified1/SPIRV.html#OpControlBarrier
82