xref: /llvm-project/llvm/test/Transforms/SLPVectorizer/RISCV/partial-vec-invalid-cost.ll (revision 947d8ebbf33724245bd419d7b5f750d6aef1057e)
1; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 4
2; RUN: opt < %s -passes=slp-vectorizer -S | FileCheck %s
3
4target triple = "riscv64-unknown-linux-gnu"
5
6define void @partial_vec_invalid_cost() #0 {
7; CHECK-LABEL: define void @partial_vec_invalid_cost(
8; CHECK-SAME: ) #[[ATTR0:[0-9]+]] {
9; CHECK-NEXT:  entry:
10; CHECK-NEXT:    [[LSHR_1:%.*]] = lshr i96 0, 0
11; CHECK-NEXT:    [[LSHR_2:%.*]] = lshr i96 0, 0
12; CHECK-NEXT:    [[TRUNC_I96_1:%.*]] = trunc i96 [[LSHR_1]] to i32
13; CHECK-NEXT:    [[TRUNC_I96_2:%.*]] = trunc i96 [[LSHR_2]] to i32
14; CHECK-NEXT:    [[TRUNC_I96_3:%.*]] = trunc i96 0 to i32
15; CHECK-NEXT:    [[TRUNC_I96_4:%.*]] = trunc i96 0 to i32
16; CHECK-NEXT:    [[TMP1:%.*]] = call i32 @llvm.vector.reduce.or.v4i32(<4 x i32> zeroinitializer)
17; CHECK-NEXT:    [[OP_RDX:%.*]] = or i32 [[TMP1]], [[TRUNC_I96_1]]
18; CHECK-NEXT:    [[OP_RDX1:%.*]] = or i32 [[TRUNC_I96_2]], [[TRUNC_I96_3]]
19; CHECK-NEXT:    [[OP_RDX2:%.*]] = or i32 [[OP_RDX]], [[OP_RDX1]]
20; CHECK-NEXT:    [[OP_RDX3:%.*]] = or i32 [[OP_RDX2]], [[TRUNC_I96_4]]
21; CHECK-NEXT:    [[STORE_THIS:%.*]] = zext i32 [[OP_RDX3]] to i96
22; CHECK-NEXT:    store i96 [[STORE_THIS]], ptr null, align 16
23; CHECK-NEXT:    ret void
24;
25entry:
26
27  %lshr.1 = lshr i96 0, 0 ; These ops
28  %lshr.2 = lshr i96 0, 0 ; return an
29  %add.0 = add i96 0, 0   ; invalid
30  %add.1 = add i96 0, 0   ; vector cost.
31
32  %trunc.i96.1 = trunc i96 %lshr.1 to i32 ; These ops
33  %trunc.i96.2 = trunc i96 %lshr.2 to i32 ; return an
34  %trunc.i96.3 = trunc i96 %add.0 to i32  ; invalid
35  %trunc.i96.4 = trunc i96 %add.1 to i32  ; vector cost.
36
37  %or.0 = or i32 %trunc.i96.1, %trunc.i96.2
38  %or.1 = or i32 %or.0, %trunc.i96.3
39  %or.2 = or i32 %or.1, %trunc.i96.4
40
41  %zext.0 = zext i1 0 to i32 ; These
42  %zext.1 = zext i1 0 to i32 ; ops
43  %zext.2 = zext i1 0 to i32 ; are
44  %zext.3 = zext i1 0 to i32 ; vectorized
45
46  %or.3 = or i32 %or.2, %zext.0 ; users
47  %or.4 = or i32 %or.3, %zext.1 ; of
48  %or.5 = or i32 %or.4, %zext.2 ; vectorized
49  %or.6 = or i32 %or.5, %zext.3 ; ops
50
51  %store.this = zext i32 %or.6 to i96
52
53  store i96 %store.this, ptr null, align 16
54  ret void
55}
56
57attributes #0 = { "target-features"="+v" }
58