xref: /llvm-project/llvm/test/CodeGen/AMDGPU/exec-mask-opt-cannot-create-empty-or-backward-segment.ll (revision b4e17d4a314ed87ff6b40b4b05397d4b25b6636a)
1; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
2; RUN: llc -mtriple=amdgcn-amd-amdhsa -mcpu=gfx908 < %s | FileCheck %s
3
; Kernel whose body is almost entirely control flow. Six i1 kernel arguments
; steer a CFG that has back edges into %bb6 (from %bb14 and %bb15) and into
; %bb7 (from %bb16), two `unreachable` exits (%bb12, %bb20) and two `ret void`
; exits (%bb18, %bb21). The store in %bb15 is the only memory operation.
;
; The function name suggests this input guards against a "cannot create empty
; or backwards segment" failure while compiling this CFG - presumably an
; assertion hit in an exec-mask optimization; confirm against the originating
; commit before relying on that.
;
; The assertion block that follows the define line is produced by
; utils/update_llc_test_checks.py; regenerate it instead of editing it by hand.
4define amdgpu_kernel void @cannot_create_empty_or_backwards_segment(i1 %arg, i1 %arg1, i1 %arg2, i1 %arg3, i1 %arg4, i1 %arg5) {
5; CHECK-LABEL: cannot_create_empty_or_backwards_segment:
6; CHECK:       ; %bb.0: ; %bb
7; CHECK-NEXT:    s_mov_b64 s[26:27], s[2:3]
8; CHECK-NEXT:    s_mov_b64 s[24:25], s[0:1]
9; CHECK-NEXT:    s_load_dword s4, s[8:9], 0x0
10; CHECK-NEXT:    s_load_dwordx2 s[0:1], s[8:9], 0x0
11; CHECK-NEXT:    s_load_dword s12, s[8:9], 0x4
12; CHECK-NEXT:    s_add_u32 s24, s24, s15
13; CHECK-NEXT:    s_addc_u32 s25, s25, 0
14; CHECK-NEXT:    s_waitcnt lgkmcnt(0)
15; CHECK-NEXT:    s_bitcmp1_b32 s4, 0
16; CHECK-NEXT:    s_cselect_b64 s[2:3], -1, 0
17; CHECK-NEXT:    s_bitcmp1_b32 s4, 8
18; CHECK-NEXT:    s_cselect_b64 s[6:7], -1, 0
19; CHECK-NEXT:    s_bitcmp1_b32 s4, 16
20; CHECK-NEXT:    s_cselect_b64 s[8:9], -1, 0
21; CHECK-NEXT:    s_bitcmp1_b32 s0, 24
22; CHECK-NEXT:    s_cselect_b64 s[4:5], -1, 0
23; CHECK-NEXT:    s_xor_b64 s[14:15], s[4:5], -1
24; CHECK-NEXT:    s_bitcmp1_b32 s1, 0
25; CHECK-NEXT:    s_cselect_b64 s[10:11], -1, 0
26; CHECK-NEXT:    s_bitcmp1_b32 s12, 8
27; CHECK-NEXT:    s_cselect_b64 s[12:13], -1, 0
28; CHECK-NEXT:    s_and_b64 s[0:1], exec, s[14:15]
29; CHECK-NEXT:    v_mov_b32_e32 v0, 0
30; CHECK-NEXT:    s_branch .LBB0_3
31; CHECK-NEXT:  .LBB0_1: ; in Loop: Header=BB0_3 Depth=1
32; CHECK-NEXT:    s_mov_b64 s[16:17], 0
33; CHECK-NEXT:    s_mov_b64 s[18:19], -1
34; CHECK-NEXT:    s_mov_b64 s[14:15], -1
35; CHECK-NEXT:    s_mov_b64 s[20:21], -1
36; CHECK-NEXT:  .LBB0_2: ; %Flow7
37; CHECK-NEXT:    ; in Loop: Header=BB0_3 Depth=1
38; CHECK-NEXT:    s_and_b64 vcc, exec, s[20:21]
39; CHECK-NEXT:    s_cbranch_vccnz .LBB0_12
40; CHECK-NEXT:  .LBB0_3: ; %bb7
41; CHECK-NEXT:    ; =>This Inner Loop Header: Depth=1
42; CHECK-NEXT:    s_andn2_b64 vcc, exec, s[8:9]
43; CHECK-NEXT:    s_cbranch_vccnz .LBB0_1
44; CHECK-NEXT:  ; %bb.4: ; %bb8
45; CHECK-NEXT:    ; in Loop: Header=BB0_3 Depth=1
46; CHECK-NEXT:    s_mov_b64 vcc, s[0:1]
47; CHECK-NEXT:    s_cbranch_vccz .LBB0_6
48; CHECK-NEXT:  ; %bb.5: ; %bb9
49; CHECK-NEXT:    ; in Loop: Header=BB0_3 Depth=1
50; CHECK-NEXT:    s_mov_b64 s[14:15], 0
51; CHECK-NEXT:    s_mov_b64 s[16:17], -1
52; CHECK-NEXT:    s_mov_b64 s[20:21], s[6:7]
53; CHECK-NEXT:    s_cbranch_execz .LBB0_7
54; CHECK-NEXT:    s_branch .LBB0_8
55; CHECK-NEXT:  .LBB0_6: ; in Loop: Header=BB0_3 Depth=1
56; CHECK-NEXT:    s_mov_b64 s[14:15], -1
57; CHECK-NEXT:    s_mov_b64 s[16:17], 0
58; CHECK-NEXT:    s_mov_b64 s[20:21], 0
59; CHECK-NEXT:  .LBB0_7: ; %bb10
60; CHECK-NEXT:    ; in Loop: Header=BB0_3 Depth=1
61; CHECK-NEXT:    s_mov_b64 s[16:17], -1
62; CHECK-NEXT:    s_mov_b64 s[14:15], 0
63; CHECK-NEXT:    s_mov_b64 s[20:21], s[12:13]
64; CHECK-NEXT:  .LBB0_8: ; %Flow9
65; CHECK-NEXT:    ; in Loop: Header=BB0_3 Depth=1
66; CHECK-NEXT:    s_mov_b64 s[18:19], -1
67; CHECK-NEXT:    s_andn2_b64 vcc, exec, s[20:21]
68; CHECK-NEXT:    s_mov_b64 s[20:21], -1
69; CHECK-NEXT:    s_cbranch_vccnz .LBB0_2
70; CHECK-NEXT:  ; %bb.9: ; %bb13
71; CHECK-NEXT:    ; in Loop: Header=BB0_3 Depth=1
72; CHECK-NEXT:    s_mov_b64 s[14:15], 0
73; CHECK-NEXT:    s_and_b64 vcc, exec, s[6:7]
74; CHECK-NEXT:    s_mov_b64 s[18:19], 0
75; CHECK-NEXT:    s_cbranch_vccz .LBB0_11
76; CHECK-NEXT:  ; %bb.10: ; %bb16
77; CHECK-NEXT:    ; in Loop: Header=BB0_3 Depth=1
78; CHECK-NEXT:    s_mov_b64 s[18:19], -1
79; CHECK-NEXT:    s_mov_b64 s[20:21], s[10:11]
80; CHECK-NEXT:  .LBB0_11: ; %Flow11
81; CHECK-NEXT:    ; in Loop: Header=BB0_3 Depth=1
82; CHECK-NEXT:    s_mov_b64 s[16:17], 0
83; CHECK-NEXT:    s_branch .LBB0_2
84; CHECK-NEXT:  .LBB0_12: ; %loop.exit.guard6
85; CHECK-NEXT:    ; in Loop: Header=BB0_3 Depth=1
86; CHECK-NEXT:    s_xor_b64 s[20:21], s[18:19], -1
87; CHECK-NEXT:    s_mov_b64 s[18:19], -1
88; CHECK-NEXT:    s_and_b64 vcc, exec, s[20:21]
89; CHECK-NEXT:    s_cbranch_vccz .LBB0_16
90; CHECK-NEXT:  ; %bb.13: ; %bb14
91; CHECK-NEXT:    ; in Loop: Header=BB0_3 Depth=1
92; CHECK-NEXT:    s_andn2_b64 vcc, exec, s[2:3]
93; CHECK-NEXT:    s_cbranch_vccnz .LBB0_15
94; CHECK-NEXT:  ; %bb.14: ; %bb15
95; CHECK-NEXT:    ; in Loop: Header=BB0_3 Depth=1
96; CHECK-NEXT:    buffer_store_dword v0, off, s[24:27], 0 offset:4
97; CHECK-NEXT:    buffer_store_dword v0, off, s[24:27], 0
98; CHECK-NEXT:  .LBB0_15: ; %Flow
99; CHECK-NEXT:    ; in Loop: Header=BB0_3 Depth=1
100; CHECK-NEXT:    s_mov_b64 s[18:19], 0
101; CHECK-NEXT:  .LBB0_16: ; %Flow13
102; CHECK-NEXT:    ; in Loop: Header=BB0_3 Depth=1
103; CHECK-NEXT:    s_andn2_b64 vcc, exec, s[18:19]
104; CHECK-NEXT:    s_cbranch_vccnz .LBB0_3
105; CHECK-NEXT:  ; %bb.17: ; %loop.exit.guard
106; CHECK-NEXT:    s_and_b64 vcc, exec, s[14:15]
107; CHECK-NEXT:    s_cbranch_vccnz .LBB0_22
108; CHECK-NEXT:  ; %bb.18: ; %loop.exit.guard5
109; CHECK-NEXT:    s_and_b64 vcc, exec, s[16:17]
110; CHECK-NEXT:    s_cbranch_vccnz .LBB0_23
111; CHECK-NEXT:  ; %bb.19: ; %bb17
112; CHECK-NEXT:    s_and_b64 vcc, exec, s[4:5]
113; CHECK-NEXT:    s_cbranch_vccz .LBB0_21
114; CHECK-NEXT:  ; %bb.20: ; %bb19
115; CHECK-NEXT:    s_andn2_b64 vcc, exec, s[2:3]
116; CHECK-NEXT:    s_cbranch_vccz .LBB0_22
117; CHECK-NEXT:  .LBB0_21: ; %bb18
118; CHECK-NEXT:    s_endpgm
119; CHECK-NEXT:  .LBB0_22: ; %bb20
120; CHECK-NEXT:  .LBB0_23: ; %bb12
; Entry block: jumps straight to %bb6.
121bb:
122  br label %bb6
123
; Reached from the entry block and re-entered from %bb14 / %bb15; forwards
; to %bb7.
124bb6:                                              ; preds = %bb15, %bb14, %bb
125  br label %bb7
126
; Re-entered from %bb16. A false %arg2 leaves for the unreachable %bb20.
127bb7:                                              ; preds = %bb16, %bb6
128  br i1 %arg2, label %bb8, label %bb20
129
; %arg3 selects %bb10 (true) or %bb9 (false).
130bb8:                                              ; preds = %bb7
131  br i1 %arg3, label %bb10, label %bb9
132
; Continues to %bb13 only when %arg1 is true; otherwise ends in the
; unreachable %bb12.
133bb9:                                              ; preds = %bb8
134  br i1 %arg1, label %bb13, label %bb12
135
; Continues via %bb11 only when %arg5 is true; otherwise ends in the
; unreachable %bb12.
136bb10:                                             ; preds = %bb8
137  br i1 %arg5, label %bb11, label %bb12
138
; Forwarding block between %bb10 and %bb13.
139bb11:                                             ; preds = %bb10
140  br label %bb13
141
; Shared dead end for the false edges of %bb9 and %bb10.
142bb12:                                             ; preds = %bb10, %bb9
143  unreachable
144
; Tests %arg1 again (the same value %bb9 branched on): true -> %bb16,
; false -> %bb14.
145bb13:                                             ; preds = %bb11, %bb9
146  br i1 %arg1, label %bb16, label %bb14
147
; Both successors lead back to %bb6; %arg only decides whether the store in
; %bb15 executes first.
148bb14:                                             ; preds = %bb13
149  br i1 %arg, label %bb15, label %bb6
150
; The only memory operation: a double zero stored to the null pointer in
; addrspace(5). The autogenerated assertions above expect it to be emitted as
; two buffer_store_dword instructions (offset:4 and offset 0).
151bb15:                                             ; preds = %bb14
152  store double 0.000000e+00, ptr addrspace(5) null, align 2147483648
153  br label %bb6
154
; A true %arg4 exits to %bb17; a false %arg4 branches back to %bb7.
155bb16:                                             ; preds = %bb13
156  br i1 %arg4, label %bb17, label %bb7
157
; Tests %arg3 again: true -> %bb19, false -> return in %bb18.
158bb17:                                             ; preds = %bb16
159  br i1 %arg3, label %bb19, label %bb18
160
161bb18:                                             ; preds = %bb17
162  ret void
163
; A true %arg ends in the unreachable %bb20; a false %arg returns in %bb21.
164bb19:                                             ; preds = %bb17
165  br i1 %arg, label %bb20, label %bb21
166
; Dead end shared by %bb7 (false %arg2) and %bb19 (true %arg).
167bb20:                                             ; preds = %bb19, %bb7
168  unreachable
169
170bb21:                                             ; preds = %bb19
171  ret void
172}
173