; xref: /llvm-project/llvm/test/CodeGen/AMDGPU/lds-size-hsa-gfx950.ll (revision 5a556d55fb753d7e6e7a310a3fc0f7e83f8f9144)
; RUN: llc -mtriple=amdgcn-amd-amdhsa -mcpu=gfx950 -verify-machineinstrs < %s | FileCheck -check-prefix=GCN %s
; RUN: llc -mtriple=amdgcn-mesa-mesa3d -mcpu=gfx950 -verify-machineinstrs < %s | FileCheck -check-prefix=MESA %s

; gfx950 supports up to 160 KiB of configurable LDS memory.
; This test checks two LDS allocations: one just above the old 128 KiB limit
; (131076 bytes) and one at the new 160 KiB maximum (163840 bytes).

; LDS (addrspace(3)) globals shared by the kernels below. The array names
; encode the total LDS size expected for the kernel that uses them, i.e. the
; array itself plus the 4-byte @lds.i32 that each kernel also stores to.

; 4-byte scalar written by both kernels.
@lds.i32 = addrspace(3) global i32 poison
; 32768 x i32 = 131072 bytes; 131072 + 4 = 131076 bytes in total.
@lds.array.size.131076 = addrspace(3) global [32768 x i32] poison
; 40959 x i32 = 163836 bytes; 163836 + 4 = 163840 bytes in total.
@lds.array.size.163840 = addrspace(3) global [40959 x i32] poison

; Kernel using 131076 bytes of LDS: 4 bytes more than 128 KiB (131072).
; NOTE(review): the MESA value 65 is consistent with 131076 bytes rounded up
; to 2048-byte granules (65 * 2048 = 133120); the granule size is inferred
; from the expected values - confirm against the backend.

; GCN-LABEL: test_lds_array_size_131076:
; GCN: .amdhsa_group_segment_fixed_size 131076
; GCN: ; LDSByteSize: 131076 bytes/workgroup

; MESA-LABEL: test_lds_array_size_131076:
; MESA: granulated_lds_size = 65
define amdgpu_kernel void @test_lds_array_size_131076() {
  ; Read element 20 of the large array and write it to @lds.i32, so the
  ; kernel references both LDS globals.
  %gep = getelementptr inbounds [32768 x i32], ptr addrspace(3) @lds.array.size.131076, i32 0, i32 20
  %val = load i32, ptr addrspace(3) %gep
  store i32 %val, ptr addrspace(3) @lds.i32
  ret void
}

; Kernel using 163840 bytes of LDS, i.e. exactly 160 KiB.
; NOTE(review): the MESA value 80 is consistent with 163840 bytes in
; 2048-byte granules (80 * 2048 = 163840); the granule size is inferred
; from the expected values - confirm against the backend.

; GCN-LABEL: test_lds_array_size_163840:
; GCN: .amdhsa_group_segment_fixed_size 163840
; GCN: ; LDSByteSize: 163840 bytes/workgroup

; MESA-LABEL: test_lds_array_size_163840:
; MESA: granulated_lds_size = 80
define amdgpu_kernel void @test_lds_array_size_163840() {
  ; Read element 20 of the large array and write it to @lds.i32, so the
  ; kernel references both LDS globals.
  %gep = getelementptr inbounds [40959 x i32], ptr addrspace(3) @lds.array.size.163840, i32 0, i32 20
  %val = load i32, ptr addrspace(3) %gep
  store i32 %val, ptr addrspace(3) @lds.i32
  ret void
}