xref: /llvm-project/llvm/test/CodeGen/AMDGPU/s_code_end.ll (revision d7762a3b369ec2be8ccb5f585aa6a96026caaa33)
1; RUN: llc -mtriple=amdgcn-amd-amdhsa -mcpu=gfx1010 -asm-verbose=0 < %s | FileCheck -check-prefixes=GCN,GCN-ASM,GFX10END-ASM %s
2; RUN: llc -mtriple=amdgcn-amd-amdhsa -mcpu=gfx1010 -filetype=obj < %s | llvm-objdump --arch=amdgcn --mcpu=gfx1010 -d - | FileCheck --check-prefixes=GCN,GCN-OBJ,GFX10END-OBJ %s
3; RUN: llc -mtriple=amdgcn-amd-amdpal -mcpu=gfx1010 -asm-verbose=0 < %s | FileCheck -check-prefixes=GCN,GCN-ASM,GFX10END-ASM %s
4; RUN: llc -mtriple=amdgcn-mesa-mesa3d -mcpu=gfx1010 -asm-verbose=0 < %s | FileCheck -check-prefixes=GCN,GCN-ASM,GFX10NOEND %s
5; RUN: llc -mtriple=amdgcn-- -mcpu=gfx1010 -filetype=obj < %s | llvm-objdump --arch=amdgcn --mcpu=gfx1010 -d - | FileCheck --check-prefixes=GCN,GCN-OBJ,GFX10NOEND,GFX10NOEND-OBJ %s
6
7; RUN: llc -mtriple=amdgcn-amd-amdhsa -mcpu=gfx1100 -asm-verbose=0 < %s | FileCheck -check-prefixes=GCN,GCN-ASM,GFX11END-ASM %s
8; RUN: llc -mtriple=amdgcn-amd-amdhsa -mcpu=gfx1100 -filetype=obj < %s | llvm-objdump --arch=amdgcn --mcpu=gfx1100 -d - | FileCheck --check-prefixes=GCN,GCN-OBJ,GFX11END-OBJ %s
9
10; RUN: llc -mtriple=amdgcn-amd-amdhsa -mcpu=gfx90a -asm-verbose=0 < %s | FileCheck -check-prefixes=GCN,GCN-ASM,GFX90AEND-ASM %s
11; RUN: llc -mtriple=amdgcn-amd-amdhsa -mcpu=gfx90a -filetype=obj < %s | llvm-objdump --arch=amdgcn --mcpu=gfx90a --disassemble - | FileCheck -check-prefixes=GCN,GCN-OBJ,GFX90AEND-OBJ %s
12
13; GCN:            a_kernel1{{>?}}:
14; GCN:                    s_endpgm
15; GCN-ASM:        [[END_LABEL1:\.Lfunc_end.*]]:
16; GCN-ASM-NEXT:           .size   a_kernel1, [[END_LABEL1]]-a_kernel1
17
18; GCN-OBJ-NEXT:           s_nop 0
19
; First of two empty kernels: uses the amdgpu_kernel calling convention, takes
; no arguments and returns immediately. The checks placed before it expect an
; s_endpgm after the a_kernel1 label; in the assembly runs a .Lfunc_end label
; followed by the .size directive, and in the object-file runs an s_nop 0 on
; the line directly after s_endpgm.
20define amdgpu_kernel void @a_kernel1() #0 {
21  ret void
22}
23
24; GCN:            a_kernel2{{>?}}:
25; GCN:                    s_endpgm
26; GCN-ASM:        [[END_LABEL2:\.Lfunc_end.*]]:
27; GCN-ASM-NEXT:           .size   a_kernel2, [[END_LABEL2]]-a_kernel2
28
29; GCN-OBJ:   {{^$}}
30
; Second empty kernel, identical in shape to a_kernel1 (amdgpu_kernel calling
; convention, no arguments, immediate return). The checks placed before it
; expect an s_endpgm after the a_kernel2 label; the assembly runs then expect
; the .Lfunc_end label and .size directive, and the object-file runs expect an
; empty line somewhere after the s_endpgm.
31define amdgpu_kernel void @a_kernel2() #0 {
32  ret void
33}
34
35; GCN-ASM:                .globl  a_function
36; GCN-ASM-NEXT:           .p2align        2
37; GCN-ASM-NEXT:           .type   a_function,@function
38
39; GCN-NEXT:       a_function{{>?}}:
40; GCN:                    s_setpc_b64
41; GCN-ASM-NEXT:   [[END_LABEL3:\.Lfunc_end.*]]:
42; GCN-ASM-NEXT:           .size   a_function, [[END_LABEL3]]-a_function
43; GFX10END-ASM:           .p2alignl 6, 3214868480
44; GFX11END-ASM:           .p2alignl 7, 3214868480
45; GFX90AEND-ASM:          .p2alignl 6, 3212836864
46; GFX10END-ASM-NEXT:      .fill 48, 4, 3214868480
47; GFX11END-ASM-NEXT:      .fill 96, 4, 3214868480
48; GFX90AEND-ASM-NEXT:     .fill 256, 4, 3212836864
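49; GFX10NOEND-NOT:         .fill
; NOTE(review): no llc/FileCheck invocation visible at the top of this file
; passes a GFX11NOEND check prefix, so the GFX11NOEND directives in this file
; are never evaluated - confirm whether a gfx1100 invocation for a target
; without end-of-code padding is missing.
50; GFX11NOEND-NOT:         .fill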
51
52; GFX10NOEND-OBJ-NOT:     s_code_end
53; GFX10END-OBJ-NEXT:      s_code_end
54; GFX11NOEND-OBJ-NOT:     s_code_end
55; GFX11END-OBJ-NEXT:      s_code_end
56; GFX90AEND-OBJ-NEXT:     s_nop 0
57
58; GFX10END-OBJ:           s_code_end // 000000000140:
59; GFX10END-OBJ-COUNT-47:  s_code_end
60; GFX11END-OBJ:           s_code_end // 000000000140:
61; GFX11END-OBJ-COUNT-47:  s_code_end
62; GFX90AEND-OBJ:           s_nop 0 // 000000000140:
63; GFX90AEND-OBJ-COUNT-255: s_nop 0
64
; Empty non-kernel function (no amdgpu_kernel calling convention; it is also
; checked for .globl/.p2align/.type in the assembly runs). The checks placed
; before it expect an s_setpc_b64 in its body and, since it is the last
; definition in this file, they then look at what follows its end:
;   - assembly runs with padding enabled expect a .p2alignl and a .fill whose
;     alignment, count and fill word depend on the -mcpu value;
;   - object-file runs with padding enabled expect repeated s_code_end
;     (gfx1010, gfx1100) or s_nop 0 (gfx90a) in the disassembly;
;   - runs using the gfx1010 "no end" prefixes expect no .fill / s_code_end.
65define void @a_function() #0 {
66  ret void
67}
68
; Attribute group #0 is attached to all three definitions above and sets the
; "amdgpu-flat-work-group-size" string attribute to "1,512".
69attributes #0 = { "amdgpu-flat-work-group-size"="1,512" }
70