xref: /llvm-project/llvm/test/CodeGen/RISCV/select-optimize-multiple.ll (revision 2967e5f8007d873a3e9d97870d2461d0827a3976)
1; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
2; RUN: llc -mtriple=riscv32 -mattr=+d -target-abi=ilp32 -verify-machineinstrs < %s \
3; RUN:   | FileCheck %s -check-prefix=RV32I
4; RUN: llc -mtriple=riscv64 -mattr=+d -target-abi=lp64 -verify-machineinstrs < %s \
5; RUN:   | FileCheck %s -check-prefix=RV64I
6
7; Selects of wide values are split into two selects, which can easily cause
8; unnecessary control flow. Here we check some cases where we can currently
9; emit a sequence of selects with shared control flow.
10
11define i64 @cmovcc64(i32 signext %a, i64 %b, i64 %c) nounwind {
12; RV32I-LABEL: cmovcc64:
13; RV32I:       # %bb.0: # %entry
14; RV32I-NEXT:    li a5, 123
15; RV32I-NEXT:    beq a0, a5, .LBB0_2
16; RV32I-NEXT:  # %bb.1: # %entry
17; RV32I-NEXT:    mv a1, a3
18; RV32I-NEXT:    mv a2, a4
19; RV32I-NEXT:  .LBB0_2: # %entry
20; RV32I-NEXT:    mv a0, a1
21; RV32I-NEXT:    mv a1, a2
22; RV32I-NEXT:    ret
23;
24; RV64I-LABEL: cmovcc64:
25; RV64I:       # %bb.0: # %entry
26; RV64I-NEXT:    li a3, 123
27; RV64I-NEXT:    beq a0, a3, .LBB0_2
28; RV64I-NEXT:  # %bb.1: # %entry
29; RV64I-NEXT:    mv a1, a2
30; RV64I-NEXT:  .LBB0_2: # %entry
31; RV64I-NEXT:    mv a0, a1
32; RV64I-NEXT:    ret
33entry:
34  %cmp = icmp eq i32 %a, 123
35  %cond = select i1 %cmp, i64 %b, i64 %c
36  ret i64 %cond
37}
38
39define i128 @cmovcc128(i64 signext %a, i128 %b, i128 %c) nounwind {
40; RV32I-LABEL: cmovcc128:
41; RV32I:       # %bb.0: # %entry
42; RV32I-NEXT:    xori a1, a1, 123
43; RV32I-NEXT:    or a1, a1, a2
44; RV32I-NEXT:    mv a2, a3
45; RV32I-NEXT:    beqz a1, .LBB1_2
46; RV32I-NEXT:  # %bb.1: # %entry
47; RV32I-NEXT:    mv a2, a4
48; RV32I-NEXT:  .LBB1_2: # %entry
49; RV32I-NEXT:    beqz a1, .LBB1_5
50; RV32I-NEXT:  # %bb.3: # %entry
51; RV32I-NEXT:    addi a5, a4, 4
52; RV32I-NEXT:    bnez a1, .LBB1_6
53; RV32I-NEXT:  .LBB1_4:
54; RV32I-NEXT:    addi a6, a3, 8
55; RV32I-NEXT:    j .LBB1_7
56; RV32I-NEXT:  .LBB1_5:
57; RV32I-NEXT:    addi a5, a3, 4
58; RV32I-NEXT:    beqz a1, .LBB1_4
59; RV32I-NEXT:  .LBB1_6: # %entry
60; RV32I-NEXT:    addi a6, a4, 8
61; RV32I-NEXT:  .LBB1_7: # %entry
62; RV32I-NEXT:    lw a2, 0(a2)
63; RV32I-NEXT:    lw a5, 0(a5)
64; RV32I-NEXT:    lw a6, 0(a6)
65; RV32I-NEXT:    beqz a1, .LBB1_9
66; RV32I-NEXT:  # %bb.8: # %entry
67; RV32I-NEXT:    addi a3, a4, 12
68; RV32I-NEXT:    j .LBB1_10
69; RV32I-NEXT:  .LBB1_9:
70; RV32I-NEXT:    addi a3, a3, 12
71; RV32I-NEXT:  .LBB1_10: # %entry
72; RV32I-NEXT:    lw a1, 0(a3)
73; RV32I-NEXT:    sw a2, 0(a0)
74; RV32I-NEXT:    sw a5, 4(a0)
75; RV32I-NEXT:    sw a6, 8(a0)
76; RV32I-NEXT:    sw a1, 12(a0)
77; RV32I-NEXT:    ret
78;
79; RV64I-LABEL: cmovcc128:
80; RV64I:       # %bb.0: # %entry
81; RV64I-NEXT:    li a5, 123
82; RV64I-NEXT:    beq a0, a5, .LBB1_2
83; RV64I-NEXT:  # %bb.1: # %entry
84; RV64I-NEXT:    mv a1, a3
85; RV64I-NEXT:    mv a2, a4
86; RV64I-NEXT:  .LBB1_2: # %entry
87; RV64I-NEXT:    mv a0, a1
88; RV64I-NEXT:    mv a1, a2
89; RV64I-NEXT:    ret
90entry:
91  %cmp = icmp eq i64 %a, 123
92  %cond = select i1 %cmp, i128 %b, i128 %c
93  ret i128 %cond
94}
95
96define i64 @cmov64(i1 %a, i64 %b, i64 %c) nounwind {
97; RV32I-LABEL: cmov64:
98; RV32I:       # %bb.0: # %entry
99; RV32I-NEXT:    andi a5, a0, 1
100; RV32I-NEXT:    mv a0, a1
101; RV32I-NEXT:    bnez a5, .LBB2_2
102; RV32I-NEXT:  # %bb.1: # %entry
103; RV32I-NEXT:    mv a0, a3
104; RV32I-NEXT:    mv a2, a4
105; RV32I-NEXT:  .LBB2_2: # %entry
106; RV32I-NEXT:    mv a1, a2
107; RV32I-NEXT:    ret
108;
109; RV64I-LABEL: cmov64:
110; RV64I:       # %bb.0: # %entry
111; RV64I-NEXT:    andi a3, a0, 1
112; RV64I-NEXT:    mv a0, a1
113; RV64I-NEXT:    bnez a3, .LBB2_2
114; RV64I-NEXT:  # %bb.1: # %entry
115; RV64I-NEXT:    mv a0, a2
116; RV64I-NEXT:  .LBB2_2: # %entry
117; RV64I-NEXT:    ret
118entry:
119  %cond = select i1 %a, i64 %b, i64 %c
120  ret i64 %cond
121}
122
123define i128 @cmov128(i1 %a, i128 %b, i128 %c) nounwind {
124; RV32I-LABEL: cmov128:
125; RV32I:       # %bb.0: # %entry
126; RV32I-NEXT:    andi a1, a1, 1
127; RV32I-NEXT:    mv a4, a2
128; RV32I-NEXT:    bnez a1, .LBB3_2
129; RV32I-NEXT:  # %bb.1: # %entry
130; RV32I-NEXT:    mv a4, a3
131; RV32I-NEXT:  .LBB3_2: # %entry
132; RV32I-NEXT:    bnez a1, .LBB3_5
133; RV32I-NEXT:  # %bb.3: # %entry
134; RV32I-NEXT:    addi a5, a3, 4
135; RV32I-NEXT:    beqz a1, .LBB3_6
136; RV32I-NEXT:  .LBB3_4:
137; RV32I-NEXT:    addi a6, a2, 8
138; RV32I-NEXT:    j .LBB3_7
139; RV32I-NEXT:  .LBB3_5:
140; RV32I-NEXT:    addi a5, a2, 4
141; RV32I-NEXT:    bnez a1, .LBB3_4
142; RV32I-NEXT:  .LBB3_6: # %entry
143; RV32I-NEXT:    addi a6, a3, 8
144; RV32I-NEXT:  .LBB3_7: # %entry
145; RV32I-NEXT:    lw a4, 0(a4)
146; RV32I-NEXT:    lw a5, 0(a5)
147; RV32I-NEXT:    lw a6, 0(a6)
148; RV32I-NEXT:    bnez a1, .LBB3_9
149; RV32I-NEXT:  # %bb.8: # %entry
150; RV32I-NEXT:    addi a2, a3, 12
151; RV32I-NEXT:    j .LBB3_10
152; RV32I-NEXT:  .LBB3_9:
153; RV32I-NEXT:    addi a2, a2, 12
154; RV32I-NEXT:  .LBB3_10: # %entry
155; RV32I-NEXT:    lw a1, 0(a2)
156; RV32I-NEXT:    sw a4, 0(a0)
157; RV32I-NEXT:    sw a5, 4(a0)
158; RV32I-NEXT:    sw a6, 8(a0)
159; RV32I-NEXT:    sw a1, 12(a0)
160; RV32I-NEXT:    ret
161;
162; RV64I-LABEL: cmov128:
163; RV64I:       # %bb.0: # %entry
164; RV64I-NEXT:    andi a5, a0, 1
165; RV64I-NEXT:    mv a0, a1
166; RV64I-NEXT:    bnez a5, .LBB3_2
167; RV64I-NEXT:  # %bb.1: # %entry
168; RV64I-NEXT:    mv a0, a3
169; RV64I-NEXT:    mv a2, a4
170; RV64I-NEXT:  .LBB3_2: # %entry
171; RV64I-NEXT:    mv a1, a2
172; RV64I-NEXT:    ret
173entry:
174  %cond = select i1 %a, i128 %b, i128 %c
175  ret i128 %cond
176}
177
178define float @cmovfloat(i1 %a, float %b, float %c, float %d, float %e) nounwind {
179; RV32I-LABEL: cmovfloat:
180; RV32I:       # %bb.0: # %entry
181; RV32I-NEXT:    andi a0, a0, 1
182; RV32I-NEXT:    bnez a0, .LBB4_2
183; RV32I-NEXT:  # %bb.1: # %entry
184; RV32I-NEXT:    fmv.w.x fa5, a4
185; RV32I-NEXT:    fmv.w.x fa4, a2
186; RV32I-NEXT:    j .LBB4_3
187; RV32I-NEXT:  .LBB4_2:
188; RV32I-NEXT:    fmv.w.x fa5, a3
189; RV32I-NEXT:    fmv.w.x fa4, a1
190; RV32I-NEXT:  .LBB4_3: # %entry
191; RV32I-NEXT:    fadd.s fa5, fa4, fa5
192; RV32I-NEXT:    fmv.x.w a0, fa5
193; RV32I-NEXT:    ret
194;
195; RV64I-LABEL: cmovfloat:
196; RV64I:       # %bb.0: # %entry
197; RV64I-NEXT:    andi a0, a0, 1
198; RV64I-NEXT:    bnez a0, .LBB4_2
199; RV64I-NEXT:  # %bb.1: # %entry
200; RV64I-NEXT:    fmv.w.x fa5, a4
201; RV64I-NEXT:    fmv.w.x fa4, a2
202; RV64I-NEXT:    j .LBB4_3
203; RV64I-NEXT:  .LBB4_2:
204; RV64I-NEXT:    fmv.w.x fa5, a3
205; RV64I-NEXT:    fmv.w.x fa4, a1
206; RV64I-NEXT:  .LBB4_3: # %entry
207; RV64I-NEXT:    fadd.s fa5, fa4, fa5
208; RV64I-NEXT:    fmv.x.w a0, fa5
209; RV64I-NEXT:    ret
210entry:
211  %cond1 = select i1 %a, float %b, float %c
212  %cond2 = select i1 %a, float %d, float %e
213  %ret = fadd float %cond1, %cond2
214  ret float %ret
215}
216
217define double @cmovdouble(i1 %a, double %b, double %c) nounwind {
218; RV32I-LABEL: cmovdouble:
219; RV32I:       # %bb.0: # %entry
220; RV32I-NEXT:    addi sp, sp, -16
221; RV32I-NEXT:    sw a3, 8(sp)
222; RV32I-NEXT:    sw a4, 12(sp)
223; RV32I-NEXT:    fld fa5, 8(sp)
224; RV32I-NEXT:    andi a0, a0, 1
225; RV32I-NEXT:    sw a1, 8(sp)
226; RV32I-NEXT:    sw a2, 12(sp)
227; RV32I-NEXT:    beqz a0, .LBB5_2
228; RV32I-NEXT:  # %bb.1:
229; RV32I-NEXT:    fld fa5, 8(sp)
230; RV32I-NEXT:  .LBB5_2: # %entry
231; RV32I-NEXT:    fsd fa5, 8(sp)
232; RV32I-NEXT:    lw a0, 8(sp)
233; RV32I-NEXT:    lw a1, 12(sp)
234; RV32I-NEXT:    addi sp, sp, 16
235; RV32I-NEXT:    ret
236;
237; RV64I-LABEL: cmovdouble:
238; RV64I:       # %bb.0: # %entry
239; RV64I-NEXT:    andi a0, a0, 1
240; RV64I-NEXT:    bnez a0, .LBB5_2
241; RV64I-NEXT:  # %bb.1: # %entry
242; RV64I-NEXT:    fmv.d.x fa5, a2
243; RV64I-NEXT:    fmv.x.d a0, fa5
244; RV64I-NEXT:    ret
245; RV64I-NEXT:  .LBB5_2:
246; RV64I-NEXT:    fmv.d.x fa5, a1
247; RV64I-NEXT:    fmv.x.d a0, fa5
248; RV64I-NEXT:    ret
249entry:
250  %cond = select i1 %a, double %b, double %c
251  ret double %cond
252}
253
254; Check that selects with dependencies on previous ones aren't incorrectly
255; optimized.
256
257define i32 @cmovccdep(i32 signext %a, i32 %b, i32 %c, i32 %d) nounwind {
258; RV32I-LABEL: cmovccdep:
259; RV32I:       # %bb.0: # %entry
260; RV32I-NEXT:    li a4, 123
261; RV32I-NEXT:    bne a0, a4, .LBB6_3
262; RV32I-NEXT:  # %bb.1: # %entry
263; RV32I-NEXT:    mv a2, a1
264; RV32I-NEXT:    bne a0, a4, .LBB6_4
265; RV32I-NEXT:  .LBB6_2: # %entry
266; RV32I-NEXT:    add a0, a1, a2
267; RV32I-NEXT:    ret
268; RV32I-NEXT:  .LBB6_3: # %entry
269; RV32I-NEXT:    mv a1, a2
270; RV32I-NEXT:    beq a0, a4, .LBB6_2
271; RV32I-NEXT:  .LBB6_4: # %entry
272; RV32I-NEXT:    add a0, a1, a3
273; RV32I-NEXT:    ret
274;
275; RV64I-LABEL: cmovccdep:
276; RV64I:       # %bb.0: # %entry
277; RV64I-NEXT:    li a4, 123
278; RV64I-NEXT:    bne a0, a4, .LBB6_3
279; RV64I-NEXT:  # %bb.1: # %entry
280; RV64I-NEXT:    mv a2, a1
281; RV64I-NEXT:    bne a0, a4, .LBB6_4
282; RV64I-NEXT:  .LBB6_2: # %entry
283; RV64I-NEXT:    addw a0, a1, a2
284; RV64I-NEXT:    ret
285; RV64I-NEXT:  .LBB6_3: # %entry
286; RV64I-NEXT:    mv a1, a2
287; RV64I-NEXT:    beq a0, a4, .LBB6_2
288; RV64I-NEXT:  .LBB6_4: # %entry
289; RV64I-NEXT:    addw a0, a1, a3
290; RV64I-NEXT:    ret
291entry:
292  %cmp = icmp eq i32 %a, 123
293  %cond1 = select i1 %cmp, i32 %b, i32 %c
294  %cond2 = select i1 %cmp, i32 %cond1, i32 %d
295  %ret = add i32 %cond1, %cond2
296  ret i32 %ret
297}
298
299; Check that selects with different conditions aren't incorrectly optimized.
300
301define i32 @cmovdiffcc(i1 %a, i1 %b, i32 %c, i32 %d, i32 %e, i32 %f) nounwind {
302; RV32I-LABEL: cmovdiffcc:
303; RV32I:       # %bb.0: # %entry
304; RV32I-NEXT:    andi a0, a0, 1
305; RV32I-NEXT:    andi a1, a1, 1
306; RV32I-NEXT:    beqz a0, .LBB7_3
307; RV32I-NEXT:  # %bb.1: # %entry
308; RV32I-NEXT:    beqz a1, .LBB7_4
309; RV32I-NEXT:  .LBB7_2: # %entry
310; RV32I-NEXT:    add a0, a2, a4
311; RV32I-NEXT:    ret
312; RV32I-NEXT:  .LBB7_3: # %entry
313; RV32I-NEXT:    mv a2, a3
314; RV32I-NEXT:    bnez a1, .LBB7_2
315; RV32I-NEXT:  .LBB7_4: # %entry
316; RV32I-NEXT:    add a0, a2, a5
317; RV32I-NEXT:    ret
318;
319; RV64I-LABEL: cmovdiffcc:
320; RV64I:       # %bb.0: # %entry
321; RV64I-NEXT:    andi a0, a0, 1
322; RV64I-NEXT:    andi a1, a1, 1
323; RV64I-NEXT:    beqz a0, .LBB7_3
324; RV64I-NEXT:  # %bb.1: # %entry
325; RV64I-NEXT:    beqz a1, .LBB7_4
326; RV64I-NEXT:  .LBB7_2: # %entry
327; RV64I-NEXT:    addw a0, a2, a4
328; RV64I-NEXT:    ret
329; RV64I-NEXT:  .LBB7_3: # %entry
330; RV64I-NEXT:    mv a2, a3
331; RV64I-NEXT:    bnez a1, .LBB7_2
332; RV64I-NEXT:  .LBB7_4: # %entry
333; RV64I-NEXT:    addw a0, a2, a5
334; RV64I-NEXT:    ret
335entry:
336  %cond1 = select i1 %a, i32 %c, i32 %d
337  %cond2 = select i1 %b, i32 %e, i32 %f
338  %ret = add i32 %cond1, %cond2
339  ret i32 %ret
340}
341
342define float @CascadedSelect(float noundef %a) {
343; RV32I-LABEL: CascadedSelect:
344; RV32I:       # %bb.0: # %entry
345; RV32I-NEXT:    fmv.w.x fa5, a0
346; RV32I-NEXT:    lui a0, 260096
347; RV32I-NEXT:    fmv.w.x fa4, a0
348; RV32I-NEXT:    flt.s a0, fa4, fa5
349; RV32I-NEXT:    bnez a0, .LBB8_3
350; RV32I-NEXT:  # %bb.1: # %entry
351; RV32I-NEXT:    fmv.w.x fa4, zero
352; RV32I-NEXT:    flt.s a0, fa5, fa4
353; RV32I-NEXT:    bnez a0, .LBB8_3
354; RV32I-NEXT:  # %bb.2: # %entry
355; RV32I-NEXT:    fmv.s fa4, fa5
356; RV32I-NEXT:  .LBB8_3: # %entry
357; RV32I-NEXT:    fmv.x.w a0, fa4
358; RV32I-NEXT:    ret
359;
360; RV64I-LABEL: CascadedSelect:
361; RV64I:       # %bb.0: # %entry
362; RV64I-NEXT:    fmv.w.x fa5, a0
363; RV64I-NEXT:    lui a0, 260096
364; RV64I-NEXT:    fmv.w.x fa4, a0
365; RV64I-NEXT:    flt.s a0, fa4, fa5
366; RV64I-NEXT:    bnez a0, .LBB8_3
367; RV64I-NEXT:  # %bb.1: # %entry
368; RV64I-NEXT:    fmv.w.x fa4, zero
369; RV64I-NEXT:    flt.s a0, fa5, fa4
370; RV64I-NEXT:    bnez a0, .LBB8_3
371; RV64I-NEXT:  # %bb.2: # %entry
372; RV64I-NEXT:    fmv.s fa4, fa5
373; RV64I-NEXT:  .LBB8_3: # %entry
374; RV64I-NEXT:    fmv.x.w a0, fa4
375; RV64I-NEXT:    ret
376entry:
377  %cmp = fcmp ogt float %a, 1.000000e+00
378  %cmp1 = fcmp olt float %a, 0.000000e+00
379  %.a = select i1 %cmp1, float 0.000000e+00, float %a
380  %retval.0 = select i1 %cmp, float 1.000000e+00, float %.a
381  ret float %retval.0
382}
383