; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
; RUN: llc -mtriple=riscv64 -mattr=+v,+d -O0 < %s \
; RUN:    | FileCheck --check-prefix=SPILL-O0 %s
; RUN: llc -mtriple=riscv64 -mattr=+v,+d -O2 < %s \
; RUN:    | FileCheck --check-prefix=SPILL-O2 %s
; RUN: llc -mtriple=riscv64 -mattr=+v,+d -riscv-v-vector-bits-max=128 -O2 < %s \
; RUN:    | FileCheck --check-prefix=SPILL-O2-VLEN128 %s
; RUN: llc -mtriple=riscv64 -mattr=+v,+d,+zcmp -O2 < %s \
; RUN:    | FileCheck --check-prefix=SPILL-O2-ZCMP %s

; Checks how scalable-vector values that are live across a call get spilled
; and reloaded on riscv64. @foo computes one vfadd, calls puts, and then
; computes a second vfadd that uses both %a and the first result, so two
; vector values and the %gvl operand must survive the call.
;
; Four llc configurations are covered by the invocations at the top:
;   * -O0: %gvl is stored to and reloaded from the stack around the call.
;   * -O2: %gvl is kept in s0 instead; the vector spill area is still sized
;     from vlenb at run time.
;   * -O2 with -riscv-v-vector-bits-max=128: the vector spill area is
;     reserved with a constant stack adjustment rather than a vlenb read.
;   * -O2 with +zcmp: ra/s0 are saved and restored with cm.push / cm.popret.
;
; The assertion lines between the define line and the opening brace are
; generated; regenerate them with utils/update_llc_test_checks.py instead of
; editing them by hand.

@.str = private unnamed_addr constant [6 x i8] c"hello\00", align 1

define <vscale x 1 x double> @foo(<vscale x 1 x double> %a, <vscale x 1 x double> %b, <vscale x 1 x double> %c, i64 %gvl) nounwind
; SPILL-O0-LABEL: foo:
; SPILL-O0:       # %bb.0:
; SPILL-O0-NEXT:    addi sp, sp, -48
; SPILL-O0-NEXT:    sd ra, 40(sp) # 8-byte Folded Spill
; SPILL-O0-NEXT:    csrr a1, vlenb
; SPILL-O0-NEXT:    slli a1, a1, 1
; SPILL-O0-NEXT:    sub sp, sp, a1
; SPILL-O0-NEXT:    sd a0, 16(sp) # 8-byte Folded Spill
; SPILL-O0-NEXT:    vsetivli zero, 1, e8, m1, ta, ma
; SPILL-O0-NEXT:    vmv1r.v v10, v9
; SPILL-O0-NEXT:    vmv1r.v v9, v8
; SPILL-O0-NEXT:    csrr a1, vlenb
; SPILL-O0-NEXT:    add a1, sp, a1
; SPILL-O0-NEXT:    addi a1, a1, 32
; SPILL-O0-NEXT:    vs1r.v v9, (a1) # Unknown-size Folded Spill
; SPILL-O0-NEXT:    # implicit-def: $v8
; SPILL-O0-NEXT:    vsetvli zero, a0, e64, m1, tu, ma
; SPILL-O0-NEXT:    vfadd.vv v8, v9, v10
; SPILL-O0-NEXT:    addi a0, sp, 32
; SPILL-O0-NEXT:    vs1r.v v8, (a0) # Unknown-size Folded Spill
; SPILL-O0-NEXT:    lui a0, %hi(.L.str)
; SPILL-O0-NEXT:    addi a0, a0, %lo(.L.str)
; SPILL-O0-NEXT:    call puts
; SPILL-O0-NEXT:    addi a1, sp, 32
; SPILL-O0-NEXT:    vl1r.v v10, (a1) # Unknown-size Folded Reload
; SPILL-O0-NEXT:    csrr a1, vlenb
; SPILL-O0-NEXT:    add a1, sp, a1
; SPILL-O0-NEXT:    addi a1, a1, 32
; SPILL-O0-NEXT:    vl1r.v v9, (a1) # Unknown-size Folded Reload
; SPILL-O0-NEXT:    # kill: def $x11 killed $x10
; SPILL-O0-NEXT:    ld a0, 16(sp) # 8-byte Folded Reload
; SPILL-O0-NEXT:    # implicit-def: $v8
; SPILL-O0-NEXT:    vsetvli zero, a0, e64, m1, tu, ma
; SPILL-O0-NEXT:    vfadd.vv v8, v9, v10
; SPILL-O0-NEXT:    csrr a0, vlenb
; SPILL-O0-NEXT:    slli a0, a0, 1
; SPILL-O0-NEXT:    add sp, sp, a0
; SPILL-O0-NEXT:    ld ra, 40(sp) # 8-byte Folded Reload
; SPILL-O0-NEXT:    addi sp, sp, 48
; SPILL-O0-NEXT:    ret
;
; SPILL-O2-LABEL: foo:
; SPILL-O2:       # %bb.0:
; SPILL-O2-NEXT:    addi sp, sp, -32
; SPILL-O2-NEXT:    sd ra, 24(sp) # 8-byte Folded Spill
; SPILL-O2-NEXT:    sd s0, 16(sp) # 8-byte Folded Spill
; SPILL-O2-NEXT:    csrr a1, vlenb
; SPILL-O2-NEXT:    slli a1, a1, 1
; SPILL-O2-NEXT:    sub sp, sp, a1
; SPILL-O2-NEXT:    mv s0, a0
; SPILL-O2-NEXT:    addi a1, sp, 16
; SPILL-O2-NEXT:    vs1r.v v8, (a1) # Unknown-size Folded Spill
; SPILL-O2-NEXT:    vsetvli zero, a0, e64, m1, ta, ma
; SPILL-O2-NEXT:    vfadd.vv v9, v8, v9
; SPILL-O2-NEXT:    csrr a0, vlenb
; SPILL-O2-NEXT:    add a0, sp, a0
; SPILL-O2-NEXT:    addi a0, a0, 16
; SPILL-O2-NEXT:    vs1r.v v9, (a0) # Unknown-size Folded Spill
; SPILL-O2-NEXT:    lui a0, %hi(.L.str)
; SPILL-O2-NEXT:    addi a0, a0, %lo(.L.str)
; SPILL-O2-NEXT:    call puts
; SPILL-O2-NEXT:    csrr a0, vlenb
; SPILL-O2-NEXT:    add a0, sp, a0
; SPILL-O2-NEXT:    addi a0, a0, 16
; SPILL-O2-NEXT:    vl1r.v v8, (a0) # Unknown-size Folded Reload
; SPILL-O2-NEXT:    addi a0, sp, 16
; SPILL-O2-NEXT:    vl1r.v v9, (a0) # Unknown-size Folded Reload
; SPILL-O2-NEXT:    vsetvli zero, s0, e64, m1, ta, ma
; SPILL-O2-NEXT:    vfadd.vv v8, v9, v8
; SPILL-O2-NEXT:    csrr a0, vlenb
; SPILL-O2-NEXT:    slli a0, a0, 1
; SPILL-O2-NEXT:    add sp, sp, a0
; SPILL-O2-NEXT:    ld ra, 24(sp) # 8-byte Folded Reload
; SPILL-O2-NEXT:    ld s0, 16(sp) # 8-byte Folded Reload
; SPILL-O2-NEXT:    addi sp, sp, 32
; SPILL-O2-NEXT:    ret
;
; SPILL-O2-VLEN128-LABEL: foo:
; SPILL-O2-VLEN128:       # %bb.0:
; SPILL-O2-VLEN128-NEXT:    addi sp, sp, -32
; SPILL-O2-VLEN128-NEXT:    sd ra, 24(sp) # 8-byte Folded Spill
; SPILL-O2-VLEN128-NEXT:    sd s0, 16(sp) # 8-byte Folded Spill
; SPILL-O2-VLEN128-NEXT:    addi sp, sp, -32
; SPILL-O2-VLEN128-NEXT:    mv s0, a0
; SPILL-O2-VLEN128-NEXT:    addi a1, sp, 16
; SPILL-O2-VLEN128-NEXT:    vs1r.v v8, (a1) # Unknown-size Folded Spill
; SPILL-O2-VLEN128-NEXT:    vsetvli zero, a0, e64, m1, ta, ma
; SPILL-O2-VLEN128-NEXT:    vfadd.vv v9, v8, v9
; SPILL-O2-VLEN128-NEXT:    addi a0, sp, 32
; SPILL-O2-VLEN128-NEXT:    vs1r.v v9, (a0) # Unknown-size Folded Spill
; SPILL-O2-VLEN128-NEXT:    lui a0, %hi(.L.str)
; SPILL-O2-VLEN128-NEXT:    addi a0, a0, %lo(.L.str)
; SPILL-O2-VLEN128-NEXT:    call puts
; SPILL-O2-VLEN128-NEXT:    addi a0, sp, 32
; SPILL-O2-VLEN128-NEXT:    vl1r.v v8, (a0) # Unknown-size Folded Reload
; SPILL-O2-VLEN128-NEXT:    addi a0, sp, 16
; SPILL-O2-VLEN128-NEXT:    vl1r.v v9, (a0) # Unknown-size Folded Reload
; SPILL-O2-VLEN128-NEXT:    vsetvli zero, s0, e64, m1, ta, ma
; SPILL-O2-VLEN128-NEXT:    vfadd.vv v8, v9, v8
; SPILL-O2-VLEN128-NEXT:    addi sp, sp, 32
; SPILL-O2-VLEN128-NEXT:    ld ra, 24(sp) # 8-byte Folded Reload
; SPILL-O2-VLEN128-NEXT:    ld s0, 16(sp) # 8-byte Folded Reload
; SPILL-O2-VLEN128-NEXT:    addi sp, sp, 32
; SPILL-O2-VLEN128-NEXT:    ret
;
; SPILL-O2-ZCMP-LABEL: foo:
; SPILL-O2-ZCMP:       # %bb.0:
; SPILL-O2-ZCMP-NEXT:    cm.push {ra, s0}, -32
; SPILL-O2-ZCMP-NEXT:    csrr a1, vlenb
; SPILL-O2-ZCMP-NEXT:    slli a1, a1, 1
; SPILL-O2-ZCMP-NEXT:    sub sp, sp, a1
; SPILL-O2-ZCMP-NEXT:    mv s0, a0
; SPILL-O2-ZCMP-NEXT:    addi a1, sp, 16
; SPILL-O2-ZCMP-NEXT:    vs1r.v v8, (a1) # Unknown-size Folded Spill
; SPILL-O2-ZCMP-NEXT:    vsetvli zero, a0, e64, m1, ta, ma
; SPILL-O2-ZCMP-NEXT:    vfadd.vv v9, v8, v9
; SPILL-O2-ZCMP-NEXT:    csrr a0, vlenb
; SPILL-O2-ZCMP-NEXT:    add a0, a0, sp
; SPILL-O2-ZCMP-NEXT:    addi a0, a0, 16
; SPILL-O2-ZCMP-NEXT:    vs1r.v v9, (a0) # Unknown-size Folded Spill
; SPILL-O2-ZCMP-NEXT:    lui a0, %hi(.L.str)
; SPILL-O2-ZCMP-NEXT:    addi a0, a0, %lo(.L.str)
; SPILL-O2-ZCMP-NEXT:    call puts
; SPILL-O2-ZCMP-NEXT:    csrr a0, vlenb
; SPILL-O2-ZCMP-NEXT:    add a0, a0, sp
; SPILL-O2-ZCMP-NEXT:    addi a0, a0, 16
; SPILL-O2-ZCMP-NEXT:    vl1r.v v8, (a0) # Unknown-size Folded Reload
; SPILL-O2-ZCMP-NEXT:    addi a0, sp, 16
; SPILL-O2-ZCMP-NEXT:    vl1r.v v9, (a0) # Unknown-size Folded Reload
; SPILL-O2-ZCMP-NEXT:    vsetvli zero, s0, e64, m1, ta, ma
; SPILL-O2-ZCMP-NEXT:    vfadd.vv v8, v9, v8
; SPILL-O2-ZCMP-NEXT:    csrr a0, vlenb
; SPILL-O2-ZCMP-NEXT:    slli a0, a0, 1
; SPILL-O2-ZCMP-NEXT:    add sp, sp, a0
; SPILL-O2-ZCMP-NEXT:    cm.popret {ra, s0}, 32
{
  ; First add, computed before the call. Its result %x is consumed after the
  ; call, so it has to be preserved across it. The constant i64 7 is passed
  ; in the unnamed i64 slot of the intrinsic declaration (presumably the
  ; rounding-mode operand -- confirm against the intrinsic definition).
  %x = call <vscale x 1 x double> @llvm.riscv.vfadd.nxv1f64.nxv1f64(<vscale x 1 x double> undef, <vscale x 1 x double> %a, <vscale x 1 x double> %b, i64 7, i64 %gvl)
  ; The call that sits between the two adds; %a, %x and %gvl are all used
  ; again afterwards. Its result %call is unused.
  %call = call signext i32 @puts(ptr @.str)
  ; Second add, combining the original %a with the pre-call result %x.
  ; Note that %c is never referenced in this function.
  %z = call <vscale x 1 x double> @llvm.riscv.vfadd.nxv1f64.nxv1f64(<vscale x 1 x double> undef, <vscale x 1 x double> %a, <vscale x 1 x double> %x, i64 7, i64 %gvl)
  ret <vscale x 1 x double> %z
}

declare <vscale x 1 x double> @llvm.riscv.vfadd.nxv1f64.nxv1f64(<vscale x 1 x double> %passthru, <vscale x 1 x double> %a, <vscale x 1 x double> %b, i64, i64 %gvl)
declare i32 @puts(ptr)