; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
; RUN: llc -O3 < %s -mtriple=riscv64 -mattr=+v | FileCheck %s

; Codegen test for a single-block loop that loads a scalable vector, reduces
; it with llvm.vector.reduce.add, and carries a scalar derived from that
; reduction around the loop through a phi.
;
; In the expected assembly below, the vsetvli and the `vmv.s.x v8, zero` that
; materializes the zero start value consumed by vredsum.vs are emitted in the
; entry block, ahead of the loop label, and v8 is reused on every iteration.
; NOTE(review): presumably that placement is what this test guards; confirm
; against the change that introduced it.

declare i32 @llvm.vector.reduce.add.nxv2i32(<vscale x 2 x i32>)

; Returns the value %sum holds on the final iteration, i.e. the %sum.inc
; computed by the previous iteration (0 when the loop body runs only once).
define i32 @test(ptr %a, i64 %n) {
; CHECK-LABEL: test:
; CHECK:       # %bb.0: # %entry
; CHECK-NEXT:    li a3, 0
; CHECK-NEXT:    vsetvli a2, zero, e32, m1, ta, ma
; CHECK-NEXT:    vmv.s.x v8, zero
; CHECK-NEXT:  .LBB0_1: # %loop
; CHECK-NEXT:    # =>This Inner Loop Header: Depth=1
; CHECK-NEXT:    vl1re32.v v9, (a0)
; CHECK-NEXT:    mv a2, a3
; CHECK-NEXT:    addi a1, a1, -1
; CHECK-NEXT:    vredsum.vs v9, v9, v8
; CHECK-NEXT:    vmv.x.s a3, v9
; CHECK-NEXT:    addw a3, a3, a3
; CHECK-NEXT:    addi a0, a0, 8
; CHECK-NEXT:    bnez a1, .LBB0_1
; CHECK-NEXT:  # %bb.2: # %exit
; CHECK-NEXT:    mv a0, a2
; CHECK-NEXT:    ret
entry:
  br label %loop

loop:
  %indvar = phi i64 [ 0, %entry ], [ %indvar.inc, %loop ]
  ; Holds the previous iteration's %sum.inc; this is the value returned.
  %sum = phi i32 [ 0, %entry ], [ %sum.inc, %loop ]
  ; The GEP element type is `ptr`, so the address advances by one pointer
  ; width per iteration (the `addi a0, a0, 8` in the expected output).
  %idx = getelementptr inbounds ptr, ptr %a, i64 %indvar
  %data = load <vscale x 2 x i32>, ptr %idx
  %reduce = tail call i32 @llvm.vector.reduce.add.nxv2i32(<vscale x 2 x i32> %data)
  ; Twice the reduction result. %sum is not an operand, so each iteration
  ; replaces the carried value instead of accumulating into it.
  %sum.inc = add i32 %reduce, %reduce
  %indvar.inc = add i64 %indvar, 1
  %cmp = icmp eq i64 %indvar.inc, %n
  br i1 %cmp, label %exit, label %loop

exit:
  ret i32 %sum
}