; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py UTC_ARGS: --version 4
; RUN: llc -mtriple=amdgcn--amdhsa -mcpu=fiji -verify-machineinstrs < %s | FileCheck --check-prefix=CHECK-SDAG -enable-var-scope %s
; xref: /llvm-project/llvm/test/CodeGen/AMDGPU/llvm.amdgcn.readlane.ptr.ll (revision 5feb32ba929f9e517c530217cabb09d1d734a763)

; Calls llvm.amdgcn.readlane.p0 on a default-address-space pointer (`ptr`) with
; a lane index in %src1, then passes the result to inline asm through an "s"
; constraint. The autogenerated assertions expect the lane index to be moved
; into s4 with v_readfirstlane_b32, followed by two v_readlane_b32 instructions
; whose results form s[4:5]. %out is never referenced in the body.
define void @test_readlane_p0(ptr addrspace(1) %out, ptr %src, i32 %src1) {
; CHECK-SDAG-LABEL: test_readlane_p0:
; CHECK-SDAG:       ; %bb.0:
; CHECK-SDAG-NEXT:    s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
; CHECK-SDAG-NEXT:    v_readfirstlane_b32 s4, v4
; CHECK-SDAG-NEXT:    s_nop 3
; CHECK-SDAG-NEXT:    v_readlane_b32 s5, v3, s4
; CHECK-SDAG-NEXT:    v_readlane_b32 s4, v2, s4
; CHECK-SDAG-NEXT:    ;;#ASMSTART
; CHECK-SDAG-NEXT:    ; use s[4:5]
; CHECK-SDAG-NEXT:    ;;#ASMEND
; CHECK-SDAG-NEXT:    s_setpc_b64 s[30:31]
  %x = call ptr @llvm.amdgcn.readlane.p0(ptr %src, i32 %src1)
  call void asm sideeffect "; use $0", "s"(ptr %x)
  ret void
}

; Calls llvm.amdgcn.readlane.v3p0 on a <3 x ptr> vector with a lane index in
; %src1, then passes the result to inline asm through an "s" constraint. The
; autogenerated assertions expect the lane index to be moved into s4 with
; v_readfirstlane_b32, followed by six v_readlane_b32 instructions whose
; results form s[4:9]. %out is never referenced in the body.
define void @test_readlane_v3p0(ptr addrspace(1) %out, <3 x ptr> %src, i32 %src1) {
; CHECK-SDAG-LABEL: test_readlane_v3p0:
; CHECK-SDAG:       ; %bb.0:
; CHECK-SDAG-NEXT:    s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
; CHECK-SDAG-NEXT:    v_readfirstlane_b32 s4, v8
; CHECK-SDAG-NEXT:    s_nop 3
; CHECK-SDAG-NEXT:    v_readlane_b32 s9, v7, s4
; CHECK-SDAG-NEXT:    v_readlane_b32 s8, v6, s4
; CHECK-SDAG-NEXT:    v_readlane_b32 s7, v5, s4
; CHECK-SDAG-NEXT:    v_readlane_b32 s6, v4, s4
; CHECK-SDAG-NEXT:    v_readlane_b32 s5, v3, s4
; CHECK-SDAG-NEXT:    v_readlane_b32 s4, v2, s4
; CHECK-SDAG-NEXT:    ;;#ASMSTART
; CHECK-SDAG-NEXT:    ; use s[4:9]
; CHECK-SDAG-NEXT:    ;;#ASMEND
; CHECK-SDAG-NEXT:    s_setpc_b64 s[30:31]
  %x = call <3 x ptr> @llvm.amdgcn.readlane.v3p0(<3 x ptr> %src, i32 %src1)
  call void asm sideeffect "; use $0", "s"(<3 x ptr> %x)
  ret void
}

; Calls llvm.amdgcn.readlane.p3 on a `ptr addrspace(3)` value with a lane index
; in %src1, then passes the result to inline asm through an "s" constraint. The
; autogenerated assertions expect the lane index to be moved into s4 with
; v_readfirstlane_b32, followed by a single v_readlane_b32 that writes s4.
; %out is never referenced in the body.
define void @test_readlane_p3(ptr addrspace(1) %out, ptr addrspace(3) %src, i32 %src1) {
; CHECK-SDAG-LABEL: test_readlane_p3:
; CHECK-SDAG:       ; %bb.0:
; CHECK-SDAG-NEXT:    s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
; CHECK-SDAG-NEXT:    v_readfirstlane_b32 s4, v3
; CHECK-SDAG-NEXT:    s_nop 3
; CHECK-SDAG-NEXT:    v_readlane_b32 s4, v2, s4
; CHECK-SDAG-NEXT:    ;;#ASMSTART
; CHECK-SDAG-NEXT:    ; use s4
; CHECK-SDAG-NEXT:    ;;#ASMEND
; CHECK-SDAG-NEXT:    s_setpc_b64 s[30:31]
  %x = call ptr addrspace(3) @llvm.amdgcn.readlane.p3(ptr addrspace(3) %src, i32 %src1)
  call void asm sideeffect "; use $0", "s"(ptr addrspace(3) %x)
  ret void
}

; Calls llvm.amdgcn.readlane.v3p3 on a <3 x ptr addrspace(3)> vector with a
; lane index in %src1, then passes the result to inline asm through an "s"
; constraint. The autogenerated assertions expect the lane index to be moved
; into s4 with v_readfirstlane_b32, followed by three v_readlane_b32
; instructions whose results form s[4:6]. %out is never referenced in the body.
define void @test_readlane_v3p3(ptr addrspace(1) %out, <3 x ptr addrspace(3)> %src, i32 %src1) {
; CHECK-SDAG-LABEL: test_readlane_v3p3:
; CHECK-SDAG:       ; %bb.0:
; CHECK-SDAG-NEXT:    s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
; CHECK-SDAG-NEXT:    v_readfirstlane_b32 s4, v5
; CHECK-SDAG-NEXT:    s_nop 3
; CHECK-SDAG-NEXT:    v_readlane_b32 s6, v4, s4
; CHECK-SDAG-NEXT:    v_readlane_b32 s5, v3, s4
; CHECK-SDAG-NEXT:    v_readlane_b32 s4, v2, s4
; CHECK-SDAG-NEXT:    ;;#ASMSTART
; CHECK-SDAG-NEXT:    ; use s[4:6]
; CHECK-SDAG-NEXT:    ;;#ASMEND
; CHECK-SDAG-NEXT:    s_setpc_b64 s[30:31]
  %x = call <3 x ptr addrspace(3)> @llvm.amdgcn.readlane.v3p3(<3 x ptr addrspace(3)> %src, i32 %src1)
  call void asm sideeffect "; use $0", "s"(<3 x ptr addrspace(3)> %x)
  ret void
}

; Calls llvm.amdgcn.readlane.p5 on a `ptr addrspace(5)` value with a lane index
; in %src1, then passes the result to inline asm through an "s" constraint. The
; autogenerated assertions expect the lane index to be moved into s4 with
; v_readfirstlane_b32, followed by a single v_readlane_b32 that writes s4.
; %out is never referenced in the body.
define void @test_readlane_p5(ptr addrspace(1) %out, ptr addrspace(5) %src, i32 %src1) {
; CHECK-SDAG-LABEL: test_readlane_p5:
; CHECK-SDAG:       ; %bb.0:
; CHECK-SDAG-NEXT:    s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
; CHECK-SDAG-NEXT:    v_readfirstlane_b32 s4, v3
; CHECK-SDAG-NEXT:    s_nop 3
; CHECK-SDAG-NEXT:    v_readlane_b32 s4, v2, s4
; CHECK-SDAG-NEXT:    ;;#ASMSTART
; CHECK-SDAG-NEXT:    ; use s4
; CHECK-SDAG-NEXT:    ;;#ASMEND
; CHECK-SDAG-NEXT:    s_setpc_b64 s[30:31]
  %x = call ptr addrspace(5) @llvm.amdgcn.readlane.p5(ptr addrspace(5) %src, i32 %src1)
  call void asm sideeffect "; use $0", "s"(ptr addrspace(5) %x)
  ret void
}

; Calls llvm.amdgcn.readlane.v3p5 on a <3 x ptr addrspace(5)> vector with a
; lane index in %src1, then passes the result to inline asm through an "s"
; constraint. The autogenerated assertions expect the lane index to be moved
; into s4 with v_readfirstlane_b32, followed by three v_readlane_b32
; instructions whose results form s[4:6]. %out is never referenced in the body.
define void @test_readlane_v3p5(ptr addrspace(1) %out, <3 x ptr addrspace(5)> %src, i32 %src1) {
; CHECK-SDAG-LABEL: test_readlane_v3p5:
; CHECK-SDAG:       ; %bb.0:
; CHECK-SDAG-NEXT:    s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
; CHECK-SDAG-NEXT:    v_readfirstlane_b32 s4, v5
; CHECK-SDAG-NEXT:    s_nop 3
; CHECK-SDAG-NEXT:    v_readlane_b32 s6, v4, s4
; CHECK-SDAG-NEXT:    v_readlane_b32 s5, v3, s4
; CHECK-SDAG-NEXT:    v_readlane_b32 s4, v2, s4
; CHECK-SDAG-NEXT:    ;;#ASMSTART
; CHECK-SDAG-NEXT:    ; use s[4:6]
; CHECK-SDAG-NEXT:    ;;#ASMEND
; CHECK-SDAG-NEXT:    s_setpc_b64 s[30:31]
  %x = call <3 x ptr addrspace(5)> @llvm.amdgcn.readlane.v3p5(<3 x ptr addrspace(5)> %src, i32 %src1)
  call void asm sideeffect "; use $0", "s"(<3 x ptr addrspace(5)> %x)
  ret void
}

; Calls llvm.amdgcn.readlane.p6 on a `ptr addrspace(6)` value with a lane index
; in %src1, then passes the result to inline asm through an "s" constraint. The
; autogenerated assertions expect the lane index to be moved into s4 with
; v_readfirstlane_b32, followed by a single v_readlane_b32 that writes s4.
; %out is never referenced in the body.
define void @test_readlane_p6(ptr addrspace(1) %out, ptr addrspace(6) %src, i32 %src1) {
; CHECK-SDAG-LABEL: test_readlane_p6:
; CHECK-SDAG:       ; %bb.0:
; CHECK-SDAG-NEXT:    s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
; CHECK-SDAG-NEXT:    v_readfirstlane_b32 s4, v3
; CHECK-SDAG-NEXT:    s_nop 3
; CHECK-SDAG-NEXT:    v_readlane_b32 s4, v2, s4
; CHECK-SDAG-NEXT:    ;;#ASMSTART
; CHECK-SDAG-NEXT:    ; use s4
; CHECK-SDAG-NEXT:    ;;#ASMEND
; CHECK-SDAG-NEXT:    s_setpc_b64 s[30:31]
  %x = call ptr addrspace(6) @llvm.amdgcn.readlane.p6(ptr addrspace(6) %src, i32 %src1)
  call void asm sideeffect "; use $0", "s"(ptr addrspace(6) %x)
  ret void
}

; Calls llvm.amdgcn.readlane.v3p6 on a <3 x ptr addrspace(6)> vector with a
; lane index in %src1, then passes the result to inline asm through an "s"
; constraint. The autogenerated assertions expect the lane index to be moved
; into s4 with v_readfirstlane_b32, followed by three v_readlane_b32
; instructions whose results form s[4:6]. %out is never referenced in the body.
define void @test_readlane_v3p6(ptr addrspace(1) %out, <3 x ptr addrspace(6)> %src, i32 %src1) {
; CHECK-SDAG-LABEL: test_readlane_v3p6:
; CHECK-SDAG:       ; %bb.0:
; CHECK-SDAG-NEXT:    s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
; CHECK-SDAG-NEXT:    v_readfirstlane_b32 s4, v5
; CHECK-SDAG-NEXT:    s_nop 3
; CHECK-SDAG-NEXT:    v_readlane_b32 s6, v4, s4
; CHECK-SDAG-NEXT:    v_readlane_b32 s5, v3, s4
; CHECK-SDAG-NEXT:    v_readlane_b32 s4, v2, s4
; CHECK-SDAG-NEXT:    ;;#ASMSTART
; CHECK-SDAG-NEXT:    ; use s[4:6]
; CHECK-SDAG-NEXT:    ;;#ASMEND
; CHECK-SDAG-NEXT:    s_setpc_b64 s[30:31]
  %x = call <3 x ptr addrspace(6)> @llvm.amdgcn.readlane.v3p6(<3 x ptr addrspace(6)> %src, i32 %src1)
  call void asm sideeffect "; use $0", "s"(<3 x ptr addrspace(6)> %x)
  ret void
}