; RUN: llc -mtriple=amdgcn-amd-amdhsa -mcpu=gfx1010 -asm-verbose=0 < %s | FileCheck --check-prefixes=GCN,GCN-ASM,GFX10END-ASM %s
; RUN: llc -mtriple=amdgcn-amd-amdhsa -mcpu=gfx1010 -filetype=obj < %s | llvm-objdump --arch=amdgcn --mcpu=gfx1010 -d - | FileCheck --check-prefixes=GCN,GCN-OBJ,GFX10END-OBJ %s
; RUN: llc -mtriple=amdgcn-amd-amdpal -mcpu=gfx1010 -asm-verbose=0 < %s | FileCheck --check-prefixes=GCN,GCN-ASM,GFX10END-ASM %s
; RUN: llc -mtriple=amdgcn-mesa-mesa3d -mcpu=gfx1010 -asm-verbose=0 < %s | FileCheck --check-prefixes=GCN,GCN-ASM,GFX10NOEND %s
; RUN: llc -mtriple=amdgcn-- -mcpu=gfx1010 -filetype=obj < %s | llvm-objdump --arch=amdgcn --mcpu=gfx1010 -d - | FileCheck --check-prefixes=GCN,GCN-OBJ,GFX10NOEND,GFX10NOEND-OBJ %s

; RUN: llc -mtriple=amdgcn-amd-amdhsa -mcpu=gfx1100 -asm-verbose=0 < %s | FileCheck --check-prefixes=GCN,GCN-ASM,GFX11END-ASM %s
; RUN: llc -mtriple=amdgcn-amd-amdhsa -mcpu=gfx1100 -filetype=obj < %s | llvm-objdump --arch=amdgcn --mcpu=gfx1100 -d - | FileCheck --check-prefixes=GCN,GCN-OBJ,GFX11END-OBJ %s

; RUN: llc -mtriple=amdgcn-amd-amdhsa -mcpu=gfx90a -asm-verbose=0 < %s | FileCheck --check-prefixes=GCN,GCN-ASM,GFX90AEND-ASM %s
; RUN: llc -mtriple=amdgcn-amd-amdhsa -mcpu=gfx90a -filetype=obj < %s | llvm-objdump --arch=amdgcn --mcpu=gfx90a -d - | FileCheck --check-prefixes=GCN,GCN-OBJ,GFX90AEND-OBJ %s

; Checks the padding expected after a_function, the last function in this
; file, for each triple / subtarget combination exercised above:
;   * amdhsa (gfx1010, gfx1100) and amdpal (gfx1010): the assembly runs expect
;     a .p2alignl / .fill pair using the word 3214868480 (0xBF9F0000), and the
;     object-file runs expect the disassembly to show s_code_end instructions.
;   * amdhsa gfx90a: same shape, but the fill word is 3212836864 (0xBF800000)
;     and the disassembly is expected to show s_nop 0 instead.
;   * mesa3d and the OS-less triple (gfx1010): neither a .fill directive nor an
;     s_code_end instruction may appear.
; Each invocation is paired with either an assembly-text or an object-file
; prefix set, so every directive below applies to only one output form unless
; it uses the shared GCN prefix.

; First kernel: it must end in s_endpgm. The assembly runs then expect the
; function-end label and the .size directive; the object runs expect s_nop 0
; immediately after s_endpgm.
; GCN: a_kernel1{{>?}}:
; GCN: s_endpgm
; GCN-ASM: [[END_LABEL1:\.Lfunc_end.*]]:
; GCN-ASM-NEXT: .size a_kernel1, [[END_LABEL1]]-a_kernel1

; GCN-OBJ-NEXT: s_nop 0

define amdgpu_kernel void @a_kernel1() #0 {
  ret void
}

; Second kernel: same expectations in assembly; in the disassembly an empty
; line is expected somewhere after its s_endpgm.
; GCN: a_kernel2{{>?}}:
; GCN: s_endpgm
; GCN-ASM: [[END_LABEL2:\.Lfunc_end.*]]:
; GCN-ASM-NEXT: .size a_kernel2, [[END_LABEL2]]-a_kernel2

; GCN-OBJ: {{^$}}

; Non-kernel function: it returns through s_setpc_b64, and the end-of-code
; padding (or its absence) is checked right after it.
; GCN-ASM: .globl a_function
; GCN-ASM-NEXT: .p2align 2
; GCN-ASM-NEXT: .type a_function,@function

; GCN-NEXT: a_function{{>?}}:
; GCN: s_setpc_b64
; GCN-ASM-NEXT: [[END_LABEL3:\.Lfunc_end.*]]:
; GCN-ASM-NEXT: .size a_function, [[END_LABEL3]]-a_function
; GFX10END-ASM: .p2alignl 6, 3214868480
; GFX11END-ASM: .p2alignl 7, 3214868480
; GFX90AEND-ASM: .p2alignl 6, 3212836864
; GFX10END-ASM-NEXT: .fill 48, 4, 3214868480
; GFX11END-ASM-NEXT: .fill 96, 4, 3214868480
; GFX90AEND-ASM-NEXT: .fill 256, 4, 3212836864
; NOTE(review): no llc invocation at the top of this file enables the
; GFX11NOEND or GFX11NOEND-OBJ prefixes, so the two directives below that use
; them are never evaluated. Either add matching gfx1100 invocations or drop
; those directives - confirm which was intended.
; GFX10NOEND-NOT: .fill
; GFX11NOEND-NOT: .fill

; GFX10NOEND-OBJ-NOT: s_code_end
; GFX10END-OBJ-NEXT: s_code_end
; GFX11NOEND-OBJ-NOT: s_code_end
; GFX11END-OBJ-NEXT: s_code_end
; GFX90AEND-OBJ-NEXT: s_nop 0

; The padding instruction is expected at offset 0x140, followed by a run of
; further padding instructions.
; GFX10END-OBJ: s_code_end // 000000000140:
; GFX10END-OBJ-COUNT-47: s_code_end
; GFX11END-OBJ: s_code_end // 000000000140:
; GFX11END-OBJ-COUNT-47: s_code_end
; GFX90AEND-OBJ: s_nop 0 // 000000000140:
; GFX90AEND-OBJ-COUNT-255: s_nop 0

define void @a_function() #0 {
  ret void
}

attributes #0 = { "amdgpu-flat-work-group-size"="1,512" }