1; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py 2; RUN: llc -mtriple=riscv32 -mattr=+d -verify-machineinstrs < %s \ 3; RUN: | FileCheck %s -check-prefix=RV32I 4; RUN: llc -mtriple=riscv64 -mattr=+d -verify-machineinstrs < %s \ 5; RUN: | FileCheck %s -check-prefix=RV64I 6 7; Selects of wide values are split into two selects, which can easily cause 8; unnecessary control flow. Here we check some cases where we can currently 9; emit a sequence of selects with shared control flow. 10 11define i64 @cmovcc64(i32 signext %a, i64 %b, i64 %c) nounwind { 12; RV32I-LABEL: cmovcc64: 13; RV32I: # %bb.0: # %entry 14; RV32I-NEXT: addi a5, zero, 123 15; RV32I-NEXT: beq a0, a5, .LBB0_2 16; RV32I-NEXT: # %bb.1: # %entry 17; RV32I-NEXT: mv a1, a3 18; RV32I-NEXT: mv a2, a4 19; RV32I-NEXT: .LBB0_2: # %entry 20; RV32I-NEXT: mv a0, a1 21; RV32I-NEXT: mv a1, a2 22; RV32I-NEXT: ret 23; 24; RV64I-LABEL: cmovcc64: 25; RV64I: # %bb.0: # %entry 26; RV64I-NEXT: addi a3, zero, 123 27; RV64I-NEXT: beq a0, a3, .LBB0_2 28; RV64I-NEXT: # %bb.1: # %entry 29; RV64I-NEXT: mv a1, a2 30; RV64I-NEXT: .LBB0_2: # %entry 31; RV64I-NEXT: mv a0, a1 32; RV64I-NEXT: ret 33entry: 34 %cmp = icmp eq i32 %a, 123 35 %cond = select i1 %cmp, i64 %b, i64 %c 36 ret i64 %cond 37} 38 39define i128 @cmovcc128(i64 signext %a, i128 %b, i128 %c) nounwind { 40; RV32I-LABEL: cmovcc128: 41; RV32I: # %bb.0: # %entry 42; RV32I-NEXT: xori a1, a1, 123 43; RV32I-NEXT: or a2, a1, a2 44; RV32I-NEXT: mv a1, a3 45; RV32I-NEXT: beqz a2, .LBB1_2 46; RV32I-NEXT: # %bb.1: # %entry 47; RV32I-NEXT: mv a1, a4 48; RV32I-NEXT: .LBB1_2: # %entry 49; RV32I-NEXT: lw a6, 0(a1) 50; RV32I-NEXT: beqz a2, .LBB1_6 51; RV32I-NEXT: # %bb.3: # %entry 52; RV32I-NEXT: addi a1, a4, 4 53; RV32I-NEXT: lw a5, 0(a1) 54; RV32I-NEXT: bnez a2, .LBB1_7 55; RV32I-NEXT: .LBB1_4: 56; RV32I-NEXT: addi a1, a3, 8 57; RV32I-NEXT: lw a1, 0(a1) 58; RV32I-NEXT: bnez a2, .LBB1_8 59; RV32I-NEXT: .LBB1_5: 60; RV32I-NEXT: addi a2, a3, 12 61; RV32I-NEXT: j .LBB1_9 62; RV32I-NEXT: .LBB1_6: 63; RV32I-NEXT: addi a1, a3, 4 64; RV32I-NEXT: lw a5, 0(a1) 65; RV32I-NEXT: beqz a2, .LBB1_4 66; RV32I-NEXT: .LBB1_7: # %entry 67; RV32I-NEXT: addi a1, a4, 8 68; RV32I-NEXT: lw a1, 0(a1) 69; RV32I-NEXT: beqz a2, .LBB1_5 70; RV32I-NEXT: .LBB1_8: # %entry 71; RV32I-NEXT: addi a2, a4, 12 72; RV32I-NEXT: .LBB1_9: # %entry 73; RV32I-NEXT: lw a2, 0(a2) 74; RV32I-NEXT: sw a2, 12(a0) 75; RV32I-NEXT: sw a1, 8(a0) 76; RV32I-NEXT: sw a5, 4(a0) 77; RV32I-NEXT: sw a6, 0(a0) 78; RV32I-NEXT: ret 79; 80; RV64I-LABEL: cmovcc128: 81; RV64I: # %bb.0: # %entry 82; RV64I-NEXT: addi a5, zero, 123 83; RV64I-NEXT: beq a0, a5, .LBB1_2 84; RV64I-NEXT: # %bb.1: # %entry 85; RV64I-NEXT: mv a1, a3 86; RV64I-NEXT: mv a2, a4 87; RV64I-NEXT: .LBB1_2: # %entry 88; RV64I-NEXT: mv a0, a1 89; RV64I-NEXT: mv a1, a2 90; RV64I-NEXT: ret 91entry: 92 %cmp = icmp eq i64 %a, 123 93 %cond = select i1 %cmp, i128 %b, i128 %c 94 ret i128 %cond 95} 96 97define i64 @cmov64(i1 %a, i64 %b, i64 %c) nounwind { 98; RV32I-LABEL: cmov64: 99; RV32I: # %bb.0: # %entry 100; RV32I-NEXT: andi a5, a0, 1 101; RV32I-NEXT: mv a0, a1 102; RV32I-NEXT: bnez a5, .LBB2_2 103; RV32I-NEXT: # %bb.1: # %entry 104; RV32I-NEXT: mv a0, a3 105; RV32I-NEXT: mv a2, a4 106; RV32I-NEXT: .LBB2_2: # %entry 107; RV32I-NEXT: mv a1, a2 108; RV32I-NEXT: ret 109; 110; RV64I-LABEL: cmov64: 111; RV64I: # %bb.0: # %entry 112; RV64I-NEXT: andi a3, a0, 1 113; RV64I-NEXT: mv a0, a1 114; RV64I-NEXT: bnez a3, .LBB2_2 115; RV64I-NEXT: # %bb.1: # %entry 116; RV64I-NEXT: mv a0, a2 117; RV64I-NEXT: .LBB2_2: # %entry 118; RV64I-NEXT: ret 119entry: 120 %cond = select i1 %a, i64 %b, i64 %c 121 ret i64 %cond 122} 123 124define i128 @cmov128(i1 %a, i128 %b, i128 %c) nounwind { 125; RV32I-LABEL: cmov128: 126; RV32I: # %bb.0: # %entry 127; RV32I-NEXT: andi a4, a1, 1 128; RV32I-NEXT: mv a1, a2 129; RV32I-NEXT: bnez a4, .LBB3_2 130; RV32I-NEXT: # %bb.1: # %entry 131; RV32I-NEXT: mv a1, a3 132; RV32I-NEXT: .LBB3_2: # %entry 133; RV32I-NEXT: lw a6, 0(a1) 134; RV32I-NEXT: bnez a4, .LBB3_6 135; RV32I-NEXT: # %bb.3: # %entry 136; RV32I-NEXT: addi a1, a3, 4 137; RV32I-NEXT: lw a5, 0(a1) 138; RV32I-NEXT: beqz a4, .LBB3_7 139; RV32I-NEXT: .LBB3_4: 140; RV32I-NEXT: addi a1, a2, 8 141; RV32I-NEXT: lw a1, 0(a1) 142; RV32I-NEXT: beqz a4, .LBB3_8 143; RV32I-NEXT: .LBB3_5: 144; RV32I-NEXT: addi a2, a2, 12 145; RV32I-NEXT: j .LBB3_9 146; RV32I-NEXT: .LBB3_6: 147; RV32I-NEXT: addi a1, a2, 4 148; RV32I-NEXT: lw a5, 0(a1) 149; RV32I-NEXT: bnez a4, .LBB3_4 150; RV32I-NEXT: .LBB3_7: # %entry 151; RV32I-NEXT: addi a1, a3, 8 152; RV32I-NEXT: lw a1, 0(a1) 153; RV32I-NEXT: bnez a4, .LBB3_5 154; RV32I-NEXT: .LBB3_8: # %entry 155; RV32I-NEXT: addi a2, a3, 12 156; RV32I-NEXT: .LBB3_9: # %entry 157; RV32I-NEXT: lw a2, 0(a2) 158; RV32I-NEXT: sw a2, 12(a0) 159; RV32I-NEXT: sw a1, 8(a0) 160; RV32I-NEXT: sw a5, 4(a0) 161; RV32I-NEXT: sw a6, 0(a0) 162; RV32I-NEXT: ret 163; 164; RV64I-LABEL: cmov128: 165; RV64I: # %bb.0: # %entry 166; RV64I-NEXT: andi a5, a0, 1 167; RV64I-NEXT: mv a0, a1 168; RV64I-NEXT: bnez a5, .LBB3_2 169; RV64I-NEXT: # %bb.1: # %entry 170; RV64I-NEXT: mv a0, a3 171; RV64I-NEXT: mv a2, a4 172; RV64I-NEXT: .LBB3_2: # %entry 173; RV64I-NEXT: mv a1, a2 174; RV64I-NEXT: ret 175entry: 176 %cond = select i1 %a, i128 %b, i128 %c 177 ret i128 %cond 178} 179 180define float @cmovfloat(i1 %a, float %b, float %c, float %d, float %e) nounwind { 181; RV32I-LABEL: cmovfloat: 182; RV32I: # %bb.0: # %entry 183; RV32I-NEXT: andi a0, a0, 1 184; RV32I-NEXT: bnez a0, .LBB4_2 185; RV32I-NEXT: # %bb.1: # %entry 186; RV32I-NEXT: fmv.w.x ft0, a4 187; RV32I-NEXT: fmv.w.x ft1, a2 188; RV32I-NEXT: j .LBB4_3 189; RV32I-NEXT: .LBB4_2: 190; RV32I-NEXT: fmv.w.x ft0, a3 191; RV32I-NEXT: fmv.w.x ft1, a1 192; RV32I-NEXT: .LBB4_3: # %entry 193; RV32I-NEXT: fadd.s ft0, ft1, ft0 194; RV32I-NEXT: fmv.x.w a0, ft0 195; RV32I-NEXT: ret 196; 197; RV64I-LABEL: cmovfloat: 198; RV64I: # %bb.0: # %entry 199; RV64I-NEXT: andi a0, a0, 1 200; RV64I-NEXT: bnez a0, .LBB4_2 201; RV64I-NEXT: # %bb.1: # %entry 202; RV64I-NEXT: fmv.w.x ft0, a4 203; RV64I-NEXT: fmv.w.x ft1, a2 204; RV64I-NEXT: j .LBB4_3 205; RV64I-NEXT: .LBB4_2: 206; RV64I-NEXT: fmv.w.x ft0, a3 207; RV64I-NEXT: fmv.w.x ft1, a1 208; RV64I-NEXT: .LBB4_3: # %entry 209; RV64I-NEXT: fadd.s ft0, ft1, ft0 210; RV64I-NEXT: fmv.x.w a0, ft0 211; RV64I-NEXT: ret 212entry: 213 %cond1 = select i1 %a, float %b, float %c 214 %cond2 = select i1 %a, float %d, float %e 215 %ret = fadd float %cond1, %cond2 216 ret float %ret 217} 218 219define double @cmovdouble(i1 %a, double %b, double %c) nounwind { 220; RV32I-LABEL: cmovdouble: 221; RV32I: # %bb.0: # %entry 222; RV32I-NEXT: addi sp, sp, -16 223; RV32I-NEXT: sw a3, 8(sp) 224; RV32I-NEXT: sw a4, 12(sp) 225; RV32I-NEXT: fld ft0, 8(sp) 226; RV32I-NEXT: sw a1, 8(sp) 227; RV32I-NEXT: sw a2, 12(sp) 228; RV32I-NEXT: fld ft1, 8(sp) 229; RV32I-NEXT: andi a0, a0, 1 230; RV32I-NEXT: bnez a0, .LBB5_2 231; RV32I-NEXT: # %bb.1: # %entry 232; RV32I-NEXT: fmv.d ft1, ft0 233; RV32I-NEXT: .LBB5_2: # %entry 234; RV32I-NEXT: fsd ft1, 8(sp) 235; RV32I-NEXT: lw a0, 8(sp) 236; RV32I-NEXT: lw a1, 12(sp) 237; RV32I-NEXT: addi sp, sp, 16 238; RV32I-NEXT: ret 239; 240; RV64I-LABEL: cmovdouble: 241; RV64I: # %bb.0: # %entry 242; RV64I-NEXT: andi a0, a0, 1 243; RV64I-NEXT: bnez a0, .LBB5_2 244; RV64I-NEXT: # %bb.1: # %entry 245; RV64I-NEXT: fmv.d.x ft0, a2 246; RV64I-NEXT: fmv.x.d a0, ft0 247; RV64I-NEXT: ret 248; RV64I-NEXT: .LBB5_2: 249; RV64I-NEXT: fmv.d.x ft0, a1 250; RV64I-NEXT: fmv.x.d a0, ft0 251; RV64I-NEXT: ret 252entry: 253 %cond = select i1 %a, double %b, double %c 254 ret double %cond 255} 256 257; Check that selects with dependencies on previous ones aren't incorrectly 258; optimized. 259 260define i32 @cmovccdep(i32 signext %a, i32 %b, i32 %c, i32 %d) nounwind { 261; RV32I-LABEL: cmovccdep: 262; RV32I: # %bb.0: # %entry 263; RV32I-NEXT: addi a4, zero, 123 264; RV32I-NEXT: bne a0, a4, .LBB6_3 265; RV32I-NEXT: # %bb.1: # %entry 266; RV32I-NEXT: mv a2, a1 267; RV32I-NEXT: bne a0, a4, .LBB6_4 268; RV32I-NEXT: .LBB6_2: # %entry 269; RV32I-NEXT: add a0, a1, a2 270; RV32I-NEXT: ret 271; RV32I-NEXT: .LBB6_3: # %entry 272; RV32I-NEXT: mv a1, a2 273; RV32I-NEXT: mv a2, a1 274; RV32I-NEXT: beq a0, a4, .LBB6_2 275; RV32I-NEXT: .LBB6_4: # %entry 276; RV32I-NEXT: mv a2, a3 277; RV32I-NEXT: add a0, a1, a2 278; RV32I-NEXT: ret 279; 280; RV64I-LABEL: cmovccdep: 281; RV64I: # %bb.0: # %entry 282; RV64I-NEXT: addi a4, zero, 123 283; RV64I-NEXT: bne a0, a4, .LBB6_3 284; RV64I-NEXT: # %bb.1: # %entry 285; RV64I-NEXT: mv a2, a1 286; RV64I-NEXT: bne a0, a4, .LBB6_4 287; RV64I-NEXT: .LBB6_2: # %entry 288; RV64I-NEXT: addw a0, a1, a2 289; RV64I-NEXT: ret 290; RV64I-NEXT: .LBB6_3: # %entry 291; RV64I-NEXT: mv a1, a2 292; RV64I-NEXT: mv a2, a1 293; RV64I-NEXT: beq a0, a4, .LBB6_2 294; RV64I-NEXT: .LBB6_4: # %entry 295; RV64I-NEXT: mv a2, a3 296; RV64I-NEXT: addw a0, a1, a2 297; RV64I-NEXT: ret 298entry: 299 %cmp = icmp eq i32 %a, 123 300 %cond1 = select i1 %cmp, i32 %b, i32 %c 301 %cond2 = select i1 %cmp, i32 %cond1, i32 %d 302 %ret = add i32 %cond1, %cond2 303 ret i32 %ret 304} 305 306; Check that selects with different conditions aren't incorrectly optimized. 307 308define i32 @cmovdiffcc(i1 %a, i1 %b, i32 %c, i32 %d, i32 %e, i32 %f) nounwind { 309; RV32I-LABEL: cmovdiffcc: 310; RV32I: # %bb.0: # %entry 311; RV32I-NEXT: andi a0, a0, 1 312; RV32I-NEXT: andi a1, a1, 1 313; RV32I-NEXT: beqz a0, .LBB7_3 314; RV32I-NEXT: # %bb.1: # %entry 315; RV32I-NEXT: beqz a1, .LBB7_4 316; RV32I-NEXT: .LBB7_2: # %entry 317; RV32I-NEXT: add a0, a2, a4 318; RV32I-NEXT: ret 319; RV32I-NEXT: .LBB7_3: # %entry 320; RV32I-NEXT: mv a2, a3 321; RV32I-NEXT: bnez a1, .LBB7_2 322; RV32I-NEXT: .LBB7_4: # %entry 323; RV32I-NEXT: mv a4, a5 324; RV32I-NEXT: add a0, a2, a4 325; RV32I-NEXT: ret 326; 327; RV64I-LABEL: cmovdiffcc: 328; RV64I: # %bb.0: # %entry 329; RV64I-NEXT: andi a0, a0, 1 330; RV64I-NEXT: andi a1, a1, 1 331; RV64I-NEXT: beqz a0, .LBB7_3 332; RV64I-NEXT: # %bb.1: # %entry 333; RV64I-NEXT: beqz a1, .LBB7_4 334; RV64I-NEXT: .LBB7_2: # %entry 335; RV64I-NEXT: addw a0, a2, a4 336; RV64I-NEXT: ret 337; RV64I-NEXT: .LBB7_3: # %entry 338; RV64I-NEXT: mv a2, a3 339; RV64I-NEXT: bnez a1, .LBB7_2 340; RV64I-NEXT: .LBB7_4: # %entry 341; RV64I-NEXT: mv a4, a5 342; RV64I-NEXT: addw a0, a2, a4 343; RV64I-NEXT: ret 344entry: 345 %cond1 = select i1 %a, i32 %c, i32 %d 346 %cond2 = select i1 %b, i32 %e, i32 %f 347 %ret = add i32 %cond1, %cond2 348 ret i32 %ret 349} 350