xref: /llvm-project/llvm/test/Transforms/LoopVectorize/pointer-induction-unroll.ll (revision 06bb8c9f202e37f215b26ca0dd9b2d8adaf5a83d)
1; NOTE: Assertions have been autogenerated by utils/update_test_checks.py
2; RUN: opt < %s -passes=loop-vectorize -force-vector-interleave=4 -force-vector-width=1 -S | FileCheck --check-prefixes=CHECK,DEFAULT %s
3; RUN: opt < %s -passes=loop-vectorize -force-vector-interleave=4 -force-vector-width=1 -lv-strided-pointer-ivs=true -S | FileCheck --check-prefixes=CHECK,STRIDED %s
; The layout string gives explicit pointer sizes only for address spaces 270
; and 271 (32-bit) and 272 (64-bit); address space 0 has no entry of its own.
; NOTE(review): the strided-pointer-IV output below sign-extends the i32 stride
; to i64 before using it as a GEP offset, which suggests default pointers are
; 64 bits wide under this layout - confirm against the LangRef defaults.
4target datalayout = "e-m:e-p270:32:32-p271:32:32-p272:64:64-i64:64-f80:128-n8:16:32:64-S128"
5
6; Test scalar expansion of a pointer induction variable whose stride is loop-invariant but not a compile-time constant.
7define void @non_constant_scalar_expansion(i32 %0, ptr %call) {
8; DEFAULT-LABEL: @non_constant_scalar_expansion(
9; DEFAULT-NEXT:  entry:
10; DEFAULT-NEXT:    [[MUL:%.*]] = shl i32 [[TMP0:%.*]], 1
11; DEFAULT-NEXT:    br label [[FOR_COND:%.*]]
12; DEFAULT:       for.cond:
13; DEFAULT-NEXT:    [[TMP1:%.*]] = phi i32 [ 30, [[ENTRY:%.*]] ], [ [[INC:%.*]], [[FOR_COND]] ]
14; DEFAULT-NEXT:    [[P_0:%.*]] = phi ptr [ null, [[ENTRY]] ], [ [[ADD_PTR:%.*]], [[FOR_COND]] ]
15; DEFAULT-NEXT:    [[ADD_PTR]] = getelementptr i8, ptr [[P_0]], i32 [[MUL]]
16; DEFAULT-NEXT:    [[ARRAYIDX:%.*]] = getelementptr ptr, ptr [[CALL:%.*]], i32 [[TMP1]]
17; DEFAULT-NEXT:    store ptr [[P_0]], ptr [[ARRAYIDX]], align 4
18; DEFAULT-NEXT:    [[INC]] = add i32 [[TMP1]], 1
19; DEFAULT-NEXT:    [[TOBOOL_NOT:%.*]] = icmp eq i32 [[TMP1]], 0
20; DEFAULT-NEXT:    br i1 [[TOBOOL_NOT]], label [[FOR_END:%.*]], label [[FOR_COND]]
21; DEFAULT:       for.end:
22; DEFAULT-NEXT:    ret void
23;
24; STRIDED-LABEL: @non_constant_scalar_expansion(
25; STRIDED-NEXT:  entry:
26; STRIDED-NEXT:    [[MUL:%.*]] = shl i32 [[TMP0:%.*]], 1
27; STRIDED-NEXT:    [[TMP1:%.*]] = sext i32 [[MUL]] to i64
28; STRIDED-NEXT:    br i1 false, label [[SCALAR_PH:%.*]], label [[VECTOR_PH:%.*]]
29; STRIDED:       vector.ph:
30; STRIDED-NEXT:    [[TMP2:%.*]] = mul i64 4294967264, [[TMP1]]
31; STRIDED-NEXT:    [[IND_END:%.*]] = getelementptr i8, ptr null, i64 [[TMP2]]
32; STRIDED-NEXT:    br label [[VECTOR_BODY:%.*]]
33; STRIDED:       vector.body:
34; STRIDED-NEXT:    [[INDEX:%.*]] = phi i64 [ 0, [[VECTOR_PH]] ], [ [[INDEX_NEXT:%.*]], [[VECTOR_BODY]] ]
35; STRIDED-NEXT:    [[DOTCAST:%.*]] = trunc i64 [[INDEX]] to i32
36; STRIDED-NEXT:    [[OFFSET_IDX:%.*]] = add i32 30, [[DOTCAST]]
37; STRIDED-NEXT:    [[TMP3:%.*]] = add i32 [[OFFSET_IDX]], 0
38; STRIDED-NEXT:    [[TMP4:%.*]] = add i32 [[OFFSET_IDX]], 1
39; STRIDED-NEXT:    [[TMP5:%.*]] = add i32 [[OFFSET_IDX]], 2
40; STRIDED-NEXT:    [[TMP6:%.*]] = add i32 [[OFFSET_IDX]], 3
41; STRIDED-NEXT:    [[OFFSET_IDX2:%.*]] = mul i64 [[INDEX]], [[TMP1]]
42; STRIDED-NEXT:    [[TMP7:%.*]] = mul i64 0, [[TMP1]]
43; STRIDED-NEXT:    [[TMP8:%.*]] = add i64 [[OFFSET_IDX2]], [[TMP7]]
44; STRIDED-NEXT:    [[TMP9:%.*]] = mul i64 1, [[TMP1]]
45; STRIDED-NEXT:    [[TMP10:%.*]] = add i64 [[OFFSET_IDX2]], [[TMP9]]
46; STRIDED-NEXT:    [[TMP11:%.*]] = mul i64 2, [[TMP1]]
47; STRIDED-NEXT:    [[TMP12:%.*]] = add i64 [[OFFSET_IDX2]], [[TMP11]]
48; STRIDED-NEXT:    [[TMP13:%.*]] = mul i64 3, [[TMP1]]
49; STRIDED-NEXT:    [[TMP14:%.*]] = add i64 [[OFFSET_IDX2]], [[TMP13]]
50; STRIDED-NEXT:    [[TMP15:%.*]] = getelementptr i8, ptr null, i64 [[TMP8]]
51; STRIDED-NEXT:    [[TMP16:%.*]] = getelementptr i8, ptr null, i64 [[TMP10]]
52; STRIDED-NEXT:    [[TMP17:%.*]] = getelementptr i8, ptr null, i64 [[TMP12]]
53; STRIDED-NEXT:    [[TMP18:%.*]] = getelementptr i8, ptr null, i64 [[TMP14]]
54; STRIDED-NEXT:    [[TMP19:%.*]] = getelementptr ptr, ptr [[CALL:%.*]], i32 [[TMP3]]
55; STRIDED-NEXT:    [[TMP20:%.*]] = getelementptr ptr, ptr [[CALL]], i32 [[TMP4]]
56; STRIDED-NEXT:    [[TMP21:%.*]] = getelementptr ptr, ptr [[CALL]], i32 [[TMP5]]
57; STRIDED-NEXT:    [[TMP22:%.*]] = getelementptr ptr, ptr [[CALL]], i32 [[TMP6]]
58; STRIDED-NEXT:    store ptr [[TMP15]], ptr [[TMP19]], align 4
59; STRIDED-NEXT:    store ptr [[TMP16]], ptr [[TMP20]], align 4
60; STRIDED-NEXT:    store ptr [[TMP17]], ptr [[TMP21]], align 4
61; STRIDED-NEXT:    store ptr [[TMP18]], ptr [[TMP22]], align 4
62; STRIDED-NEXT:    [[INDEX_NEXT]] = add nuw i64 [[INDEX]], 4
63; STRIDED-NEXT:    [[TMP23:%.*]] = icmp eq i64 [[INDEX_NEXT]], 4294967264
64; STRIDED-NEXT:    br i1 [[TMP23]], label [[MIDDLE_BLOCK:%.*]], label [[VECTOR_BODY]], !llvm.loop [[LOOP0:![0-9]+]]
65; STRIDED:       middle.block:
66; STRIDED-NEXT:    br i1 false, label [[FOR_END:%.*]], label [[SCALAR_PH]]
67; STRIDED:       scalar.ph:
68; STRIDED-NEXT:    [[BC_RESUME_VAL:%.*]] = phi i32 [ -2, [[MIDDLE_BLOCK]] ], [ 30, [[ENTRY:%.*]] ]
69; STRIDED-NEXT:    [[BC_RESUME_VAL1:%.*]] = phi ptr [ [[IND_END]], [[MIDDLE_BLOCK]] ], [ null, [[ENTRY]] ]
70; STRIDED-NEXT:    br label [[FOR_COND:%.*]]
71; STRIDED:       for.cond:
72; STRIDED-NEXT:    [[TMP24:%.*]] = phi i32 [ [[BC_RESUME_VAL]], [[SCALAR_PH]] ], [ [[INC:%.*]], [[FOR_COND]] ]
73; STRIDED-NEXT:    [[P_0:%.*]] = phi ptr [ [[BC_RESUME_VAL1]], [[SCALAR_PH]] ], [ [[ADD_PTR:%.*]], [[FOR_COND]] ]
74; STRIDED-NEXT:    [[ADD_PTR]] = getelementptr i8, ptr [[P_0]], i32 [[MUL]]
75; STRIDED-NEXT:    [[ARRAYIDX:%.*]] = getelementptr ptr, ptr [[CALL]], i32 [[TMP24]]
76; STRIDED-NEXT:    store ptr [[P_0]], ptr [[ARRAYIDX]], align 4
77; STRIDED-NEXT:    [[INC]] = add i32 [[TMP24]], 1
78; STRIDED-NEXT:    [[TOBOOL_NOT:%.*]] = icmp eq i32 [[TMP24]], 0
79; STRIDED-NEXT:    br i1 [[TOBOOL_NOT]], label [[FOR_END]], label [[FOR_COND]], !llvm.loop [[LOOP3:![0-9]+]]
80; STRIDED:       for.end:
81; STRIDED-NEXT:    ret void
82;
; Input loop: on every iteration the current value of a pointer induction
; variable is stored into a slot of %call selected by an i32 counter.
83entry:
; Byte stride of the pointer IV: %0 shifted left by one (2 * %0). It is
; invariant in the loop but unknown at compile time.
84  %mul = shl i32 %0, 1
85  br label %for.cond
86
87for.cond:                                         ; preds = %for.cond, %entry
; Integer counter: starts at 30 and is incremented by 1 each iteration.
88  %1 = phi i32 [ 30, %entry ], [ %inc, %for.cond ]
; Pointer IV: starts at null and advances by %mul bytes (i8 GEP) per iteration.
89  %p.0 = phi ptr [ null, %entry ], [ %add.ptr, %for.cond ]
90  %add.ptr = getelementptr i8, ptr %p.0, i32 %mul
; Store the pre-increment pointer IV value into element %1 of %call.
91  %arrayidx = getelementptr ptr, ptr %call, i32 %1
92  store ptr %p.0, ptr %arrayidx, align 4
93  %inc = add i32 %1, 1
; The exit test uses the pre-increment counter %1, not %inc. Counting up from
; 30, %1 only becomes 0 after the i32 add wraps around.
94  %tobool.not = icmp eq i32 %1, 0
95  br i1 %tobool.not, label %for.end, label %for.cond
96
97
98for.end:                                          ; preds = %for.cond
99  ret void
100}
101;; NOTE: These prefixes are unused and the list is autogenerated. Do not add tests below this line:
102; CHECK: {{.*}}
103