xref: /llvm-project/llvm/test/CodeGen/AMDGPU/exec-mask-opt-cannot-create-empty-or-backward-segment.ll (revision eeac0ffaf46cf9f9b0f680b9940cc4b68a0286d8)
1; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
2; RUN: llc -mtriple=amdgcn-amd-amdhsa -mcpu=gfx908 < %s | FileCheck %s
3
4define amdgpu_kernel void @cannot_create_empty_or_backwards_segment(i1 %arg, i1 %arg1, i1 %arg2, i1 %arg3, i1 %arg4, i1 %arg5) {
5; CHECK-LABEL: cannot_create_empty_or_backwards_segment:
6; CHECK:       ; %bb.0: ; %bb
7; CHECK-NEXT:    s_mov_b64 s[26:27], s[2:3]
8; CHECK-NEXT:    s_mov_b64 s[24:25], s[0:1]
9; CHECK-NEXT:    s_load_dword s2, s[8:9], 0x0
10; CHECK-NEXT:    s_load_dwordx2 s[0:1], s[8:9], 0x0
11; CHECK-NEXT:    s_load_dword s6, s[8:9], 0x4
12; CHECK-NEXT:    s_add_u32 s24, s24, s15
13; CHECK-NEXT:    s_addc_u32 s25, s25, 0
14; CHECK-NEXT:    s_waitcnt lgkmcnt(0)
15; CHECK-NEXT:    s_bitcmp1_b32 s2, 0
16; CHECK-NEXT:    s_cselect_b64 s[16:17], -1, 0
17; CHECK-NEXT:    s_bitcmp1_b32 s2, 8
18; CHECK-NEXT:    s_cselect_b64 s[10:11], -1, 0
19; CHECK-NEXT:    s_bitcmp1_b32 s2, 16
20; CHECK-NEXT:    s_cselect_b64 s[2:3], -1, 0
21; CHECK-NEXT:    s_bitcmp1_b32 s0, 24
22; CHECK-NEXT:    s_cselect_b64 s[8:9], -1, 0
23; CHECK-NEXT:    s_xor_b64 s[4:5], s[8:9], -1
24; CHECK-NEXT:    s_bitcmp1_b32 s1, 0
25; CHECK-NEXT:    v_cndmask_b32_e64 v0, 0, 1, s[2:3]
26; CHECK-NEXT:    s_cselect_b64 s[12:13], -1, 0
27; CHECK-NEXT:    s_bitcmp1_b32 s6, 8
28; CHECK-NEXT:    v_cmp_ne_u32_e64 s[2:3], 1, v0
29; CHECK-NEXT:    v_cndmask_b32_e64 v0, 0, 1, s[16:17]
30; CHECK-NEXT:    s_cselect_b64 s[14:15], -1, 0
31; CHECK-NEXT:    s_and_b64 s[4:5], exec, s[4:5]
32; CHECK-NEXT:    s_and_b64 s[6:7], exec, s[10:11]
33; CHECK-NEXT:    v_cmp_ne_u32_e64 s[0:1], 1, v0
34; CHECK-NEXT:    v_mov_b32_e32 v0, 0
35; CHECK-NEXT:    s_branch .LBB0_3
36; CHECK-NEXT:  .LBB0_1: ; in Loop: Header=BB0_3 Depth=1
37; CHECK-NEXT:    s_mov_b64 s[18:19], 0
38; CHECK-NEXT:    s_mov_b64 s[20:21], -1
39; CHECK-NEXT:    s_mov_b64 s[16:17], -1
40; CHECK-NEXT:    s_mov_b64 s[22:23], -1
41; CHECK-NEXT:  .LBB0_2: ; %Flow7
42; CHECK-NEXT:    ; in Loop: Header=BB0_3 Depth=1
43; CHECK-NEXT:    s_and_b64 vcc, exec, s[22:23]
44; CHECK-NEXT:    s_cbranch_vccnz .LBB0_12
45; CHECK-NEXT:  .LBB0_3: ; %bb7
46; CHECK-NEXT:    ; =>This Inner Loop Header: Depth=1
47; CHECK-NEXT:    s_and_b64 vcc, exec, s[2:3]
48; CHECK-NEXT:    s_cbranch_vccnz .LBB0_1
49; CHECK-NEXT:  ; %bb.4: ; %bb8
50; CHECK-NEXT:    ; in Loop: Header=BB0_3 Depth=1
51; CHECK-NEXT:    s_mov_b64 vcc, s[4:5]
52; CHECK-NEXT:    s_cbranch_vccz .LBB0_6
53; CHECK-NEXT:  ; %bb.5: ; %bb9
54; CHECK-NEXT:    ; in Loop: Header=BB0_3 Depth=1
55; CHECK-NEXT:    s_mov_b64 s[16:17], 0
56; CHECK-NEXT:    s_mov_b64 s[18:19], -1
57; CHECK-NEXT:    s_mov_b64 s[22:23], s[10:11]
58; CHECK-NEXT:    s_cbranch_execz .LBB0_7
59; CHECK-NEXT:    s_branch .LBB0_8
60; CHECK-NEXT:  .LBB0_6: ; in Loop: Header=BB0_3 Depth=1
61; CHECK-NEXT:    s_mov_b64 s[16:17], -1
62; CHECK-NEXT:    s_mov_b64 s[18:19], 0
63; CHECK-NEXT:    s_mov_b64 s[22:23], 0
64; CHECK-NEXT:  .LBB0_7: ; %bb10
65; CHECK-NEXT:    ; in Loop: Header=BB0_3 Depth=1
66; CHECK-NEXT:    s_mov_b64 s[18:19], -1
67; CHECK-NEXT:    s_mov_b64 s[16:17], 0
68; CHECK-NEXT:    s_mov_b64 s[22:23], s[14:15]
69; CHECK-NEXT:  .LBB0_8: ; %Flow9
70; CHECK-NEXT:    ; in Loop: Header=BB0_3 Depth=1
71; CHECK-NEXT:    s_mov_b64 s[20:21], -1
72; CHECK-NEXT:    s_andn2_b64 vcc, exec, s[22:23]
73; CHECK-NEXT:    s_mov_b64 s[22:23], -1
74; CHECK-NEXT:    s_cbranch_vccnz .LBB0_2
75; CHECK-NEXT:  ; %bb.9: ; %bb13
76; CHECK-NEXT:    ; in Loop: Header=BB0_3 Depth=1
77; CHECK-NEXT:    s_mov_b64 s[16:17], 0
78; CHECK-NEXT:    s_mov_b64 s[20:21], 0
79; CHECK-NEXT:    s_mov_b64 vcc, s[6:7]
80; CHECK-NEXT:    s_cbranch_vccz .LBB0_11
81; CHECK-NEXT:  ; %bb.10: ; %bb16
82; CHECK-NEXT:    ; in Loop: Header=BB0_3 Depth=1
83; CHECK-NEXT:    s_mov_b64 s[20:21], -1
84; CHECK-NEXT:    s_mov_b64 s[22:23], s[12:13]
85; CHECK-NEXT:  .LBB0_11: ; %Flow11
86; CHECK-NEXT:    ; in Loop: Header=BB0_3 Depth=1
87; CHECK-NEXT:    s_mov_b64 s[18:19], 0
88; CHECK-NEXT:    s_branch .LBB0_2
89; CHECK-NEXT:  .LBB0_12: ; %loop.exit.guard6
90; CHECK-NEXT:    ; in Loop: Header=BB0_3 Depth=1
91; CHECK-NEXT:    s_xor_b64 s[22:23], s[20:21], -1
92; CHECK-NEXT:    s_mov_b64 s[20:21], -1
93; CHECK-NEXT:    s_and_b64 vcc, exec, s[22:23]
94; CHECK-NEXT:    s_cbranch_vccz .LBB0_16
95; CHECK-NEXT:  ; %bb.13: ; %bb14
96; CHECK-NEXT:    ; in Loop: Header=BB0_3 Depth=1
97; CHECK-NEXT:    s_and_b64 vcc, exec, s[0:1]
98; CHECK-NEXT:    s_cbranch_vccnz .LBB0_15
99; CHECK-NEXT:  ; %bb.14: ; %bb15
100; CHECK-NEXT:    ; in Loop: Header=BB0_3 Depth=1
101; CHECK-NEXT:    buffer_store_dword v0, off, s[24:27], 0 offset:4
102; CHECK-NEXT:    buffer_store_dword v0, off, s[24:27], 0
103; CHECK-NEXT:  .LBB0_15: ; %Flow
104; CHECK-NEXT:    ; in Loop: Header=BB0_3 Depth=1
105; CHECK-NEXT:    s_mov_b64 s[20:21], 0
106; CHECK-NEXT:  .LBB0_16: ; %Flow13
107; CHECK-NEXT:    ; in Loop: Header=BB0_3 Depth=1
108; CHECK-NEXT:    s_andn2_b64 vcc, exec, s[20:21]
109; CHECK-NEXT:    s_cbranch_vccnz .LBB0_3
110; CHECK-NEXT:  ; %bb.17: ; %loop.exit.guard
111; CHECK-NEXT:    s_and_b64 vcc, exec, s[16:17]
112; CHECK-NEXT:    s_cbranch_vccnz .LBB0_22
113; CHECK-NEXT:  ; %bb.18: ; %loop.exit.guard5
114; CHECK-NEXT:    s_and_b64 vcc, exec, s[18:19]
115; CHECK-NEXT:    s_cbranch_vccnz .LBB0_23
116; CHECK-NEXT:  ; %bb.19: ; %bb17
117; CHECK-NEXT:    s_and_b64 vcc, exec, s[8:9]
118; CHECK-NEXT:    s_cbranch_vccz .LBB0_21
119; CHECK-NEXT:  ; %bb.20: ; %bb19
120; CHECK-NEXT:    s_and_b64 vcc, exec, s[0:1]
121; CHECK-NEXT:    s_cbranch_vccz .LBB0_22
122; CHECK-NEXT:  .LBB0_21: ; %bb18
123; CHECK-NEXT:    s_endpgm
124; CHECK-NEXT:  .LBB0_22: ; %bb20
125; CHECK-NEXT:  .LBB0_23: ; %bb12
126bb:
127  br label %bb6
128
129bb6:                                              ; preds = %bb15, %bb14, %bb
130  br label %bb7
131
132bb7:                                              ; preds = %bb16, %bb6
133  br i1 %arg2, label %bb8, label %bb20
134
135bb8:                                              ; preds = %bb7
136  br i1 %arg3, label %bb10, label %bb9
137
138bb9:                                              ; preds = %bb8
139  br i1 %arg1, label %bb13, label %bb12
140
141bb10:                                             ; preds = %bb8
142  br i1 %arg5, label %bb11, label %bb12
143
144bb11:                                             ; preds = %bb10
145  br label %bb13
146
147bb12:                                             ; preds = %bb10, %bb9
148  unreachable
149
150bb13:                                             ; preds = %bb11, %bb9
151  br i1 %arg1, label %bb16, label %bb14
152
153bb14:                                             ; preds = %bb13
154  br i1 %arg, label %bb15, label %bb6
155
156bb15:                                             ; preds = %bb14
157  store double 0.000000e+00, ptr addrspace(5) null, align 2147483648
158  br label %bb6
159
160bb16:                                             ; preds = %bb13
161  br i1 %arg4, label %bb17, label %bb7
162
163bb17:                                             ; preds = %bb16
164  br i1 %arg3, label %bb19, label %bb18
165
166bb18:                                             ; preds = %bb17
167  ret void
168
169bb19:                                             ; preds = %bb17
170  br i1 %arg, label %bb20, label %bb21
171
172bb20:                                             ; preds = %bb19, %bb7
173  unreachable
174
175bb21:                                             ; preds = %bb19
176  ret void
177}
178