xref: /llvm-project/llvm/test/Transforms/LoopVectorize/iv-select-cmp-non-const-iv-start.ll (revision f4081711f0884ec7afe93577e118ecc89cb7b1cf)
1*f4081711SMel Chen; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 5
2*f4081711SMel Chen; RUN: opt -passes=loop-vectorize -force-vector-interleave=1 -force-vector-width=4 -S < %s | FileCheck %s --check-prefix=CHECK
3*f4081711SMel Chen; RUN: opt -passes=loop-vectorize -force-vector-interleave=4 -force-vector-width=4 -S < %s | FileCheck %s --check-prefix=CHECK
4*f4081711SMel Chen; RUN: opt -passes=loop-vectorize -force-vector-interleave=4 -force-vector-width=1 -S < %s | FileCheck %s --check-prefix=CHECK
5*f4081711SMel Chen
6*f4081711SMel Chendefine i64 @select_non_const_iv_start_signed_guard(ptr %a, i64 %rdx_start, i64 %iv_start ,i64 %n) {
7*f4081711SMel Chen; CHECK-LABEL: define i64 @select_non_const_iv_start_signed_guard(
8*f4081711SMel Chen; CHECK-SAME: ptr [[A:%.*]], i64 [[RDX_START:%.*]], i64 [[IV_START:%.*]], i64 [[N:%.*]]) {
9*f4081711SMel Chen; CHECK-NEXT:  [[ENTRY:.*]]:
10*f4081711SMel Chen; CHECK-NEXT:    [[GUARD:%.*]] = icmp slt i64 [[IV_START]], [[N]]
11*f4081711SMel Chen; CHECK-NEXT:    br i1 [[GUARD]], label %[[FOR_BODY_PREHEADER:.*]], label %[[EXIT:.*]]
12*f4081711SMel Chen; CHECK:       [[FOR_BODY_PREHEADER]]:
13*f4081711SMel Chen; CHECK-NEXT:    br label %[[FOR_BODY:.*]]
14*f4081711SMel Chen; CHECK:       [[FOR_BODY]]:
15*f4081711SMel Chen; CHECK-NEXT:    [[IV:%.*]] = phi i64 [ [[IV_NEXT:%.*]], %[[FOR_BODY]] ], [ [[IV_START]], %[[FOR_BODY_PREHEADER]] ]
16*f4081711SMel Chen; CHECK-NEXT:    [[RDX_07:%.*]] = phi i64 [ [[COND:%.*]], %[[FOR_BODY]] ], [ [[RDX_START]], %[[FOR_BODY_PREHEADER]] ]
17*f4081711SMel Chen; CHECK-NEXT:    [[ARRAYIDX:%.*]] = getelementptr inbounds i64, ptr [[A]], i64 [[IV]]
18*f4081711SMel Chen; CHECK-NEXT:    [[TMP0:%.*]] = load i64, ptr [[ARRAYIDX]], align 4
19*f4081711SMel Chen; CHECK-NEXT:    [[CMP1:%.*]] = icmp sgt i64 [[TMP0]], 3
20*f4081711SMel Chen; CHECK-NEXT:    [[COND]] = select i1 [[CMP1]], i64 [[IV]], i64 [[RDX_07]]
21*f4081711SMel Chen; CHECK-NEXT:    [[IV_NEXT]] = add nsw i64 [[IV]], 1
22*f4081711SMel Chen; CHECK-NEXT:    [[EXITCOND_NOT:%.*]] = icmp eq i64 [[IV_NEXT]], [[N]]
23*f4081711SMel Chen; CHECK-NEXT:    br i1 [[EXITCOND_NOT]], label %[[EXIT_LOOPEXIT:.*]], label %[[FOR_BODY]]
24*f4081711SMel Chen; CHECK:       [[EXIT_LOOPEXIT]]:
25*f4081711SMel Chen; CHECK-NEXT:    [[COND_LCSSA:%.*]] = phi i64 [ [[COND]], %[[FOR_BODY]] ]
26*f4081711SMel Chen; CHECK-NEXT:    br label %[[EXIT]]
27*f4081711SMel Chen; CHECK:       [[EXIT]]:
28*f4081711SMel Chen; CHECK-NEXT:    [[IDX_0_LCSSA:%.*]] = phi i64 [ [[RDX_START]], %[[ENTRY]] ], [ [[COND_LCSSA]], %[[EXIT_LOOPEXIT]] ]
29*f4081711SMel Chen; CHECK-NEXT:    ret i64 [[IDX_0_LCSSA]]
30*f4081711SMel Chen;
31*f4081711SMel Chenentry:
32*f4081711SMel Chen  %guard = icmp slt i64 %iv_start, %n
33*f4081711SMel Chen  br i1 %guard, label %for.body, label %exit
34*f4081711SMel Chen
35*f4081711SMel Chenfor.body:
36*f4081711SMel Chen  %iv = phi i64 [ %iv_start, %entry ], [ %iv.next, %for.body ]
37*f4081711SMel Chen  %rdx.07 = phi i64 [ %rdx_start, %entry ], [ %cond, %for.body ]
38*f4081711SMel Chen  %arrayidx = getelementptr inbounds i64, ptr %a, i64 %iv
39*f4081711SMel Chen  %1 = load i64, ptr %arrayidx, align 4
40*f4081711SMel Chen  %cmp1 = icmp sgt i64 %1, 3
41*f4081711SMel Chen  %cond = select i1 %cmp1, i64 %iv, i64 %rdx.07
42*f4081711SMel Chen  %iv.next = add nsw i64 %iv, 1
43*f4081711SMel Chen  %exitcond.not = icmp eq i64 %iv.next, %n
44*f4081711SMel Chen  br i1 %exitcond.not, label %exit, label %for.body
45*f4081711SMel Chen
46*f4081711SMel Chenexit:
47*f4081711SMel Chen  %idx.0.lcssa = phi i64 [ %rdx_start, %entry ], [ %cond, %for.body ]
48*f4081711SMel Chen  ret i64 %idx.0.lcssa
49*f4081711SMel Chen}
50*f4081711SMel Chen
51*f4081711SMel Chendefine i32 @select_trunc_non_const_iv_start_signed_guard(ptr %a, i32 %rdx_start, i32 %iv_start ,i32 %n) {
52*f4081711SMel Chen; CHECK-LABEL: define i32 @select_trunc_non_const_iv_start_signed_guard(
53*f4081711SMel Chen; CHECK-SAME: ptr [[A:%.*]], i32 [[RDX_START:%.*]], i32 [[IV_START:%.*]], i32 [[N:%.*]]) {
54*f4081711SMel Chen; CHECK-NEXT:  [[ENTRY:.*]]:
55*f4081711SMel Chen; CHECK-NEXT:    [[GUARD:%.*]] = icmp slt i32 [[IV_START]], [[N]]
56*f4081711SMel Chen; CHECK-NEXT:    br i1 [[GUARD]], label %[[FOR_BODY_PREHEADER:.*]], label %[[EXIT:.*]]
57*f4081711SMel Chen; CHECK:       [[FOR_BODY_PREHEADER]]:
58*f4081711SMel Chen; CHECK-NEXT:    [[TMP0:%.*]] = sext i32 [[IV_START]] to i64
59*f4081711SMel Chen; CHECK-NEXT:    [[WIDE_TRIP_COUNT:%.*]] = sext i32 [[N]] to i64
60*f4081711SMel Chen; CHECK-NEXT:    br label %[[FOR_BODY:.*]]
61*f4081711SMel Chen; CHECK:       [[FOR_BODY]]:
62*f4081711SMel Chen; CHECK-NEXT:    [[IV:%.*]] = phi i64 [ [[TMP0]], %[[FOR_BODY_PREHEADER]] ], [ [[IV_NEXT:%.*]], %[[FOR_BODY]] ]
63*f4081711SMel Chen; CHECK-NEXT:    [[RDX_07:%.*]] = phi i32 [ [[RDX_START]], %[[FOR_BODY_PREHEADER]] ], [ [[COND:%.*]], %[[FOR_BODY]] ]
64*f4081711SMel Chen; CHECK-NEXT:    [[ARRAYIDX:%.*]] = getelementptr inbounds i32, ptr [[A]], i64 [[IV]]
65*f4081711SMel Chen; CHECK-NEXT:    [[TMP1:%.*]] = load i32, ptr [[ARRAYIDX]], align 4
66*f4081711SMel Chen; CHECK-NEXT:    [[CMP1:%.*]] = icmp sgt i32 [[TMP1]], 3
67*f4081711SMel Chen; CHECK-NEXT:    [[TMP2:%.*]] = trunc i64 [[IV]] to i32
68*f4081711SMel Chen; CHECK-NEXT:    [[COND]] = select i1 [[CMP1]], i32 [[TMP2]], i32 [[RDX_07]]
69*f4081711SMel Chen; CHECK-NEXT:    [[IV_NEXT]] = add nsw i64 [[IV]], 1
70*f4081711SMel Chen; CHECK-NEXT:    [[EXITCOND_NOT:%.*]] = icmp eq i64 [[IV_NEXT]], [[WIDE_TRIP_COUNT]]
71*f4081711SMel Chen; CHECK-NEXT:    br i1 [[EXITCOND_NOT]], label %[[EXIT_LOOPEXIT:.*]], label %[[FOR_BODY]]
72*f4081711SMel Chen; CHECK:       [[EXIT_LOOPEXIT]]:
73*f4081711SMel Chen; CHECK-NEXT:    [[COND_LCSSA:%.*]] = phi i32 [ [[COND]], %[[FOR_BODY]] ]
74*f4081711SMel Chen; CHECK-NEXT:    br label %[[EXIT]]
75*f4081711SMel Chen; CHECK:       [[EXIT]]:
76*f4081711SMel Chen; CHECK-NEXT:    [[IDX_0_LCSSA:%.*]] = phi i32 [ [[RDX_START]], %[[ENTRY]] ], [ [[COND_LCSSA]], %[[EXIT_LOOPEXIT]] ]
77*f4081711SMel Chen; CHECK-NEXT:    ret i32 [[IDX_0_LCSSA]]
78*f4081711SMel Chen;
79*f4081711SMel Chenentry:
80*f4081711SMel Chen  %guard = icmp slt i32 %iv_start, %n
81*f4081711SMel Chen  br i1 %guard, label %for.body.preheader, label %exit
82*f4081711SMel Chen
83*f4081711SMel Chenfor.body.preheader:
84*f4081711SMel Chen  %0 = sext i32 %iv_start to i64
85*f4081711SMel Chen  %wide.trip.count = sext i32 %n to i64
86*f4081711SMel Chen  br label %for.body
87*f4081711SMel Chen
88*f4081711SMel Chenfor.body:
89*f4081711SMel Chen  %iv = phi i64 [ %0, %for.body.preheader ], [ %iv.next, %for.body ]
90*f4081711SMel Chen  %rdx.07 = phi i32 [ %rdx_start, %for.body.preheader ], [ %cond, %for.body ]
91*f4081711SMel Chen  %arrayidx = getelementptr inbounds i32, ptr %a, i64 %iv
92*f4081711SMel Chen  %1 = load i32, ptr %arrayidx, align 4
93*f4081711SMel Chen  %cmp1 = icmp sgt i32 %1, 3
94*f4081711SMel Chen  %2 = trunc i64 %iv to i32
95*f4081711SMel Chen  %cond = select i1 %cmp1, i32 %2, i32 %rdx.07
96*f4081711SMel Chen  %iv.next = add nsw i64 %iv, 1
97*f4081711SMel Chen  %exitcond.not = icmp eq i64 %iv.next, %wide.trip.count
98*f4081711SMel Chen  br i1 %exitcond.not, label %exit, label %for.body
99*f4081711SMel Chen
100*f4081711SMel Chenexit:
101*f4081711SMel Chen  %idx.0.lcssa = phi i32 [ %rdx_start, %entry ], [ %cond, %for.body ]
102*f4081711SMel Chen  ret i32 %idx.0.lcssa
103*f4081711SMel Chen}
104