; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
; RUN: llc -mtriple=riscv32 -mattr=+d,+zvfh,+v -target-abi=ilp32d \
; RUN:   -verify-machineinstrs < %s | FileCheck %s
; RUN: llc -mtriple=riscv64 -mattr=+d,+zvfh,+v -target-abi=lp64d \
; RUN:   -verify-machineinstrs < %s | FileCheck %s

; This file tests the code generation for `llvm.experimental.constrained.round.*`
; on fixed-length vector types (<N x half>, <N x float>, <N x double>).
;
; Every function below is strictfp and calls the intrinsic with
; "fpexcept.strict". Both RUN lines (riscv32 and riscv64) share the single
; default check prefix, so the expected assembly is identical for both targets.
;
; Expected instruction sequence, as pinned by the assertions:
;   vmfne.vv  v0, v8, v8        - mask of lanes that compare unequal to themselves
;   vfadd.vv  v8, v8, v8, v0.t  - masked self-add on those lanes
;                                 (presumably quiets signaling NaNs - confirm)
;   vfabs.v / vmflt.vf          - mask of lanes whose magnitude is below fa5
;   fsrmi a0, 4 ... fsrm a0     - write 4 to frm around the float->int convert,
;                                 then write a0 back
;   vfcvt.x.f.v / vfcvt.f.x.v   - masked round trip through integer
;   vfsgnj.vv                   - masked sign injection from the original value

; <1 x half>: the compare threshold is loaded with flh from constant pool
; entry .LCPI0_0.
define <1 x half> @round_v1f16(<1 x half> %x) strictfp {
; CHECK-LABEL: round_v1f16:
; CHECK:       # %bb.0:
; CHECK-NEXT:    vsetivli zero, 1, e16, mf4, ta, mu
; CHECK-NEXT:    vmfne.vv v0, v8, v8
; CHECK-NEXT:    lui a0, %hi(.LCPI0_0)
; CHECK-NEXT:    flh fa5, %lo(.LCPI0_0)(a0)
; CHECK-NEXT:    vfadd.vv v8, v8, v8, v0.t
; CHECK-NEXT:    vfabs.v v9, v8
; CHECK-NEXT:    vmflt.vf v0, v9, fa5
; CHECK-NEXT:    fsrmi a0, 4
; CHECK-NEXT:    vsetvli zero, zero, e16, mf4, ta, ma
; CHECK-NEXT:    vfcvt.x.f.v v9, v8, v0.t
; CHECK-NEXT:    fsrm a0
; CHECK-NEXT:    vfcvt.f.x.v v9, v9, v0.t
; CHECK-NEXT:    vsetvli zero, zero, e16, mf4, ta, mu
; CHECK-NEXT:    vfsgnj.vv v8, v9, v8, v0.t
; CHECK-NEXT:    ret
  %a = call <1 x half> @llvm.experimental.constrained.round.v1f16(<1 x half> %x, metadata !"fpexcept.strict")
  ret <1 x half> %a
}
declare <1 x half> @llvm.experimental.constrained.round.v1f16(<1 x half>, metadata)

; Half-precision tests: the compare threshold is loaded with flh from a
; per-function constant pool entry (.LCPIn_0).
define <2 x half> @round_v2f16(<2 x half> %x) strictfp {
; CHECK-LABEL: round_v2f16:
; CHECK:       # %bb.0:
; CHECK-NEXT:    vsetivli zero, 2, e16, mf4, ta, mu
; CHECK-NEXT:    vmfne.vv v0, v8, v8
; CHECK-NEXT:    lui a0, %hi(.LCPI1_0)
; CHECK-NEXT:    flh fa5, %lo(.LCPI1_0)(a0)
; CHECK-NEXT:    vfadd.vv v8, v8, v8, v0.t
; CHECK-NEXT:    vfabs.v v9, v8
; CHECK-NEXT:    vmflt.vf v0, v9, fa5
; CHECK-NEXT:    fsrmi a0, 4
; CHECK-NEXT:    vsetvli zero, zero, e16, mf4, ta, ma
; CHECK-NEXT:    vfcvt.x.f.v v9, v8, v0.t
; CHECK-NEXT:    fsrm a0
; CHECK-NEXT:    vfcvt.f.x.v v9, v9, v0.t
; CHECK-NEXT:    vsetvli zero, zero, e16, mf4, ta, mu
; CHECK-NEXT:    vfsgnj.vv v8, v9, v8, v0.t
; CHECK-NEXT:    ret
  %a = call <2 x half> @llvm.experimental.constrained.round.v2f16(<2 x half> %x, metadata !"fpexcept.strict")
  ret <2 x half> %a
}
declare <2 x half> @llvm.experimental.constrained.round.v2f16(<2 x half>, metadata)

define <4 x half> @round_v4f16(<4 x half> %x) strictfp {
; CHECK-LABEL: round_v4f16:
; CHECK:       # %bb.0:
; CHECK-NEXT:    vsetivli zero, 4, e16, mf2, ta, mu
; CHECK-NEXT:    vmfne.vv v0, v8, v8
; CHECK-NEXT:    lui a0, %hi(.LCPI2_0)
; CHECK-NEXT:    flh fa5, %lo(.LCPI2_0)(a0)
; CHECK-NEXT:    vfadd.vv v8, v8, v8, v0.t
; CHECK-NEXT:    vfabs.v v9, v8
; CHECK-NEXT:    vmflt.vf v0, v9, fa5
; CHECK-NEXT:    fsrmi a0, 4
; CHECK-NEXT:    vsetvli zero, zero, e16, mf2, ta, ma
; CHECK-NEXT:    vfcvt.x.f.v v9, v8, v0.t
; CHECK-NEXT:    fsrm a0
; CHECK-NEXT:    vfcvt.f.x.v v9, v9, v0.t
; CHECK-NEXT:    vsetvli zero, zero, e16, mf2, ta, mu
; CHECK-NEXT:    vfsgnj.vv v8, v9, v8, v0.t
; CHECK-NEXT:    ret
  %a = call <4 x half> @llvm.experimental.constrained.round.v4f16(<4 x half> %x, metadata !"fpexcept.strict")
  ret <4 x half> %a
}
declare <4 x half> @llvm.experimental.constrained.round.v4f16(<4 x half>, metadata)

define <8 x half> @round_v8f16(<8 x half> %x) strictfp {
; CHECK-LABEL: round_v8f16:
; CHECK:       # %bb.0:
; CHECK-NEXT:    vsetivli zero, 8, e16, m1, ta, mu
; CHECK-NEXT:    vmfne.vv v0, v8, v8
; CHECK-NEXT:    lui a0, %hi(.LCPI3_0)
; CHECK-NEXT:    flh fa5, %lo(.LCPI3_0)(a0)
; CHECK-NEXT:    vfadd.vv v8, v8, v8, v0.t
; CHECK-NEXT:    vfabs.v v9, v8
; CHECK-NEXT:    vmflt.vf v0, v9, fa5
; CHECK-NEXT:    fsrmi a0, 4
; CHECK-NEXT:    vsetvli zero, zero, e16, m1, ta, ma
; CHECK-NEXT:    vfcvt.x.f.v v9, v8, v0.t
; CHECK-NEXT:    fsrm a0
; CHECK-NEXT:    vfcvt.f.x.v v9, v9, v0.t
; CHECK-NEXT:    vsetvli zero, zero, e16, m1, ta, mu
; CHECK-NEXT:    vfsgnj.vv v8, v9, v8, v0.t
; CHECK-NEXT:    ret
  %a = call <8 x half> @llvm.experimental.constrained.round.v8f16(<8 x half> %x, metadata !"fpexcept.strict")
  ret <8 x half> %a
}
declare <8 x half> @llvm.experimental.constrained.round.v8f16(<8 x half>, metadata)

define <16 x half> @round_v16f16(<16 x half> %x) strictfp {
; CHECK-LABEL: round_v16f16:
; CHECK:       # %bb.0:
; CHECK-NEXT:    vsetivli zero, 16, e16, m2, ta, mu
; CHECK-NEXT:    vmfne.vv v0, v8, v8
; CHECK-NEXT:    lui a0, %hi(.LCPI4_0)
; CHECK-NEXT:    flh fa5, %lo(.LCPI4_0)(a0)
; CHECK-NEXT:    vfadd.vv v8, v8, v8, v0.t
; CHECK-NEXT:    vfabs.v v10, v8
; CHECK-NEXT:    vmflt.vf v0, v10, fa5
; CHECK-NEXT:    fsrmi a0, 4
; CHECK-NEXT:    vsetvli zero, zero, e16, m2, ta, ma
; CHECK-NEXT:    vfcvt.x.f.v v10, v8, v0.t
; CHECK-NEXT:    fsrm a0
; CHECK-NEXT:    vfcvt.f.x.v v10, v10, v0.t
; CHECK-NEXT:    vsetvli zero, zero, e16, m2, ta, mu
; CHECK-NEXT:    vfsgnj.vv v8, v10, v8, v0.t
; CHECK-NEXT:    ret
  %a = call <16 x half> @llvm.experimental.constrained.round.v16f16(<16 x half> %x, metadata !"fpexcept.strict")
  ret <16 x half> %a
}
declare <16 x half> @llvm.experimental.constrained.round.v16f16(<16 x half>, metadata)

; For 32 elements the vector length is materialized with li and passed to
; vsetvli in a register, instead of the vsetivli immediate form used by the
; smaller tests.
define <32 x half> @round_v32f16(<32 x half> %x) strictfp {
; CHECK-LABEL: round_v32f16:
; CHECK:       # %bb.0:
; CHECK-NEXT:    li a0, 32
; CHECK-NEXT:    lui a1, %hi(.LCPI5_0)
; CHECK-NEXT:    vsetvli zero, a0, e16, m4, ta, mu
; CHECK-NEXT:    vmfne.vv v0, v8, v8
; CHECK-NEXT:    flh fa5, %lo(.LCPI5_0)(a1)
; CHECK-NEXT:    vfadd.vv v8, v8, v8, v0.t
; CHECK-NEXT:    vfabs.v v12, v8
; CHECK-NEXT:    vmflt.vf v0, v12, fa5
; CHECK-NEXT:    fsrmi a0, 4
; CHECK-NEXT:    vsetvli zero, zero, e16, m4, ta, ma
; CHECK-NEXT:    vfcvt.x.f.v v12, v8, v0.t
; CHECK-NEXT:    fsrm a0
; CHECK-NEXT:    vfcvt.f.x.v v12, v12, v0.t
; CHECK-NEXT:    vsetvli zero, zero, e16, m4, ta, mu
; CHECK-NEXT:    vfsgnj.vv v8, v12, v8, v0.t
; CHECK-NEXT:    ret
  %a = call <32 x half> @llvm.experimental.constrained.round.v32f16(<32 x half> %x, metadata !"fpexcept.strict")
  ret <32 x half> %a
}
declare <32 x half> @llvm.experimental.constrained.round.v32f16(<32 x half>, metadata)

; Single-precision tests: the compare threshold is built in a GPR with
; lui a0, 307200 and moved to fa5 with fmv.w.x; no constant pool load is used.
define <1 x float> @round_v1f32(<1 x float> %x) strictfp {
; CHECK-LABEL: round_v1f32:
; CHECK:       # %bb.0:
; CHECK-NEXT:    vsetivli zero, 1, e32, mf2, ta, mu
; CHECK-NEXT:    vmfne.vv v0, v8, v8
; CHECK-NEXT:    lui a0, 307200
; CHECK-NEXT:    vfadd.vv v8, v8, v8, v0.t
; CHECK-NEXT:    fmv.w.x fa5, a0
; CHECK-NEXT:    vfabs.v v9, v8
; CHECK-NEXT:    vmflt.vf v0, v9, fa5
; CHECK-NEXT:    fsrmi a0, 4
; CHECK-NEXT:    vsetvli zero, zero, e32, mf2, ta, ma
; CHECK-NEXT:    vfcvt.x.f.v v9, v8, v0.t
; CHECK-NEXT:    fsrm a0
; CHECK-NEXT:    vfcvt.f.x.v v9, v9, v0.t
; CHECK-NEXT:    vsetvli zero, zero, e32, mf2, ta, mu
; CHECK-NEXT:    vfsgnj.vv v8, v9, v8, v0.t
; CHECK-NEXT:    ret
  %a = call <1 x float> @llvm.experimental.constrained.round.v1f32(<1 x float> %x, metadata !"fpexcept.strict")
  ret <1 x float> %a
}
declare <1 x float> @llvm.experimental.constrained.round.v1f32(<1 x float>, metadata)

define <2 x float> @round_v2f32(<2 x float> %x) strictfp {
; CHECK-LABEL: round_v2f32:
; CHECK:       # %bb.0:
; CHECK-NEXT:    vsetivli zero, 2, e32, mf2, ta, mu
; CHECK-NEXT:    vmfne.vv v0, v8, v8
; CHECK-NEXT:    lui a0, 307200
; CHECK-NEXT:    vfadd.vv v8, v8, v8, v0.t
; CHECK-NEXT:    fmv.w.x fa5, a0
; CHECK-NEXT:    vfabs.v v9, v8
; CHECK-NEXT:    vmflt.vf v0, v9, fa5
; CHECK-NEXT:    fsrmi a0, 4
; CHECK-NEXT:    vsetvli zero, zero, e32, mf2, ta, ma
; CHECK-NEXT:    vfcvt.x.f.v v9, v8, v0.t
; CHECK-NEXT:    fsrm a0
; CHECK-NEXT:    vfcvt.f.x.v v9, v9, v0.t
; CHECK-NEXT:    vsetvli zero, zero, e32, mf2, ta, mu
; CHECK-NEXT:    vfsgnj.vv v8, v9, v8, v0.t
; CHECK-NEXT:    ret
  %a = call <2 x float> @llvm.experimental.constrained.round.v2f32(<2 x float> %x, metadata !"fpexcept.strict")
  ret <2 x float> %a
}
declare <2 x float> @llvm.experimental.constrained.round.v2f32(<2 x float>, metadata)

define <4 x float> @round_v4f32(<4 x float> %x) strictfp {
; CHECK-LABEL: round_v4f32:
; CHECK:       # %bb.0:
; CHECK-NEXT:    vsetivli zero, 4, e32, m1, ta, mu
; CHECK-NEXT:    vmfne.vv v0, v8, v8
; CHECK-NEXT:    lui a0, 307200
; CHECK-NEXT:    vfadd.vv v8, v8, v8, v0.t
; CHECK-NEXT:    fmv.w.x fa5, a0
; CHECK-NEXT:    vfabs.v v9, v8
; CHECK-NEXT:    vmflt.vf v0, v9, fa5
; CHECK-NEXT:    fsrmi a0, 4
; CHECK-NEXT:    vsetvli zero, zero, e32, m1, ta, ma
; CHECK-NEXT:    vfcvt.x.f.v v9, v8, v0.t
; CHECK-NEXT:    fsrm a0
; CHECK-NEXT:    vfcvt.f.x.v v9, v9, v0.t
; CHECK-NEXT:    vsetvli zero, zero, e32, m1, ta, mu
; CHECK-NEXT:    vfsgnj.vv v8, v9, v8, v0.t
; CHECK-NEXT:    ret
  %a = call <4 x float> @llvm.experimental.constrained.round.v4f32(<4 x float> %x, metadata !"fpexcept.strict")
  ret <4 x float> %a
}
declare <4 x float> @llvm.experimental.constrained.round.v4f32(<4 x float>, metadata)

define <8 x float> @round_v8f32(<8 x float> %x) strictfp {
; CHECK-LABEL: round_v8f32:
; CHECK:       # %bb.0:
; CHECK-NEXT:    vsetivli zero, 8, e32, m2, ta, mu
; CHECK-NEXT:    vmfne.vv v0, v8, v8
; CHECK-NEXT:    lui a0, 307200
; CHECK-NEXT:    vfadd.vv v8, v8, v8, v0.t
; CHECK-NEXT:    fmv.w.x fa5, a0
; CHECK-NEXT:    vfabs.v v10, v8
; CHECK-NEXT:    vmflt.vf v0, v10, fa5
; CHECK-NEXT:    fsrmi a0, 4
; CHECK-NEXT:    vsetvli zero, zero, e32, m2, ta, ma
; CHECK-NEXT:    vfcvt.x.f.v v10, v8, v0.t
; CHECK-NEXT:    fsrm a0
; CHECK-NEXT:    vfcvt.f.x.v v10, v10, v0.t
; CHECK-NEXT:    vsetvli zero, zero, e32, m2, ta, mu
; CHECK-NEXT:    vfsgnj.vv v8, v10, v8, v0.t
; CHECK-NEXT:    ret
  %a = call <8 x float> @llvm.experimental.constrained.round.v8f32(<8 x float> %x, metadata !"fpexcept.strict")
  ret <8 x float> %a
}
declare <8 x float> @llvm.experimental.constrained.round.v8f32(<8 x float>, metadata)

define <16 x float> @round_v16f32(<16 x float> %x) strictfp {
; CHECK-LABEL: round_v16f32:
; CHECK:       # %bb.0:
; CHECK-NEXT:    vsetivli zero, 16, e32, m4, ta, mu
; CHECK-NEXT:    vmfne.vv v0, v8, v8
; CHECK-NEXT:    lui a0, 307200
; CHECK-NEXT:    vfadd.vv v8, v8, v8, v0.t
; CHECK-NEXT:    fmv.w.x fa5, a0
; CHECK-NEXT:    vfabs.v v12, v8
; CHECK-NEXT:    vmflt.vf v0, v12, fa5
; CHECK-NEXT:    fsrmi a0, 4
; CHECK-NEXT:    vsetvli zero, zero, e32, m4, ta, ma
; CHECK-NEXT:    vfcvt.x.f.v v12, v8, v0.t
; CHECK-NEXT:    fsrm a0
; CHECK-NEXT:    vfcvt.f.x.v v12, v12, v0.t
; CHECK-NEXT:    vsetvli zero, zero, e32, m4, ta, mu
; CHECK-NEXT:    vfsgnj.vv v8, v12, v8, v0.t
; CHECK-NEXT:    ret
  %a = call <16 x float> @llvm.experimental.constrained.round.v16f32(<16 x float> %x, metadata !"fpexcept.strict")
  ret <16 x float> %a
}
declare <16 x float> @llvm.experimental.constrained.round.v16f32(<16 x float>, metadata)

; Double-precision tests: the compare threshold is loaded with fld from a
; per-function constant pool entry (.LCPIn_0).
define <1 x double> @round_v1f64(<1 x double> %x) strictfp {
; CHECK-LABEL: round_v1f64:
; CHECK:       # %bb.0:
; CHECK-NEXT:    vsetivli zero, 1, e64, m1, ta, mu
; CHECK-NEXT:    vmfne.vv v0, v8, v8
; CHECK-NEXT:    lui a0, %hi(.LCPI11_0)
; CHECK-NEXT:    fld fa5, %lo(.LCPI11_0)(a0)
; CHECK-NEXT:    vfadd.vv v8, v8, v8, v0.t
; CHECK-NEXT:    vfabs.v v9, v8
; CHECK-NEXT:    vmflt.vf v0, v9, fa5
; CHECK-NEXT:    fsrmi a0, 4
; CHECK-NEXT:    vsetvli zero, zero, e64, m1, ta, ma
; CHECK-NEXT:    vfcvt.x.f.v v9, v8, v0.t
; CHECK-NEXT:    fsrm a0
; CHECK-NEXT:    vfcvt.f.x.v v9, v9, v0.t
; CHECK-NEXT:    vsetvli zero, zero, e64, m1, ta, mu
; CHECK-NEXT:    vfsgnj.vv v8, v9, v8, v0.t
; CHECK-NEXT:    ret
  %a = call <1 x double> @llvm.experimental.constrained.round.v1f64(<1 x double> %x, metadata !"fpexcept.strict")
  ret <1 x double> %a
}
declare <1 x double> @llvm.experimental.constrained.round.v1f64(<1 x double>, metadata)

define <2 x double> @round_v2f64(<2 x double> %x) strictfp {
; CHECK-LABEL: round_v2f64:
; CHECK:       # %bb.0:
; CHECK-NEXT:    vsetivli zero, 2, e64, m1, ta, mu
; CHECK-NEXT:    vmfne.vv v0, v8, v8
; CHECK-NEXT:    lui a0, %hi(.LCPI12_0)
; CHECK-NEXT:    fld fa5, %lo(.LCPI12_0)(a0)
; CHECK-NEXT:    vfadd.vv v8, v8, v8, v0.t
; CHECK-NEXT:    vfabs.v v9, v8
; CHECK-NEXT:    vmflt.vf v0, v9, fa5
; CHECK-NEXT:    fsrmi a0, 4
; CHECK-NEXT:    vsetvli zero, zero, e64, m1, ta, ma
; CHECK-NEXT:    vfcvt.x.f.v v9, v8, v0.t
; CHECK-NEXT:    fsrm a0
; CHECK-NEXT:    vfcvt.f.x.v v9, v9, v0.t
; CHECK-NEXT:    vsetvli zero, zero, e64, m1, ta, mu
; CHECK-NEXT:    vfsgnj.vv v8, v9, v8, v0.t
; CHECK-NEXT:    ret
  %a = call <2 x double> @llvm.experimental.constrained.round.v2f64(<2 x double> %x, metadata !"fpexcept.strict")
  ret <2 x double> %a
}
declare <2 x double> @llvm.experimental.constrained.round.v2f64(<2 x double>, metadata)

define <4 x double> @round_v4f64(<4 x double> %x) strictfp {
; CHECK-LABEL: round_v4f64:
; CHECK:       # %bb.0:
; CHECK-NEXT:    vsetivli zero, 4, e64, m2, ta, mu
; CHECK-NEXT:    vmfne.vv v0, v8, v8
; CHECK-NEXT:    lui a0, %hi(.LCPI13_0)
; CHECK-NEXT:    fld fa5, %lo(.LCPI13_0)(a0)
; CHECK-NEXT:    vfadd.vv v8, v8, v8, v0.t
; CHECK-NEXT:    vfabs.v v10, v8
; CHECK-NEXT:    vmflt.vf v0, v10, fa5
; CHECK-NEXT:    fsrmi a0, 4
; CHECK-NEXT:    vsetvli zero, zero, e64, m2, ta, ma
; CHECK-NEXT:    vfcvt.x.f.v v10, v8, v0.t
; CHECK-NEXT:    fsrm a0
; CHECK-NEXT:    vfcvt.f.x.v v10, v10, v0.t
; CHECK-NEXT:    vsetvli zero, zero, e64, m2, ta, mu
; CHECK-NEXT:    vfsgnj.vv v8, v10, v8, v0.t
; CHECK-NEXT:    ret
  %a = call <4 x double> @llvm.experimental.constrained.round.v4f64(<4 x double> %x, metadata !"fpexcept.strict")
  ret <4 x double> %a
}
declare <4 x double> @llvm.experimental.constrained.round.v4f64(<4 x double>, metadata)

define <8 x double> @round_v8f64(<8 x double> %x) strictfp {
; CHECK-LABEL: round_v8f64:
; CHECK:       # %bb.0:
; CHECK-NEXT:    vsetivli zero, 8, e64, m4, ta, mu
; CHECK-NEXT:    vmfne.vv v0, v8, v8
; CHECK-NEXT:    lui a0, %hi(.LCPI14_0)
; CHECK-NEXT:    fld fa5, %lo(.LCPI14_0)(a0)
; CHECK-NEXT:    vfadd.vv v8, v8, v8, v0.t
; CHECK-NEXT:    vfabs.v v12, v8
; CHECK-NEXT:    vmflt.vf v0, v12, fa5
; CHECK-NEXT:    fsrmi a0, 4
; CHECK-NEXT:    vsetvli zero, zero, e64, m4, ta, ma
; CHECK-NEXT:    vfcvt.x.f.v v12, v8, v0.t
; CHECK-NEXT:    fsrm a0
; CHECK-NEXT:    vfcvt.f.x.v v12, v12, v0.t
; CHECK-NEXT:    vsetvli zero, zero, e64, m4, ta, mu
; CHECK-NEXT:    vfsgnj.vv v8, v12, v8, v0.t
; CHECK-NEXT:    ret
  %a = call <8 x double> @llvm.experimental.constrained.round.v8f64(<8 x double> %x, metadata !"fpexcept.strict")
  ret <8 x double> %a
}
declare <8 x double> @llvm.experimental.constrained.round.v8f64(<8 x double>, metadata)