xref: /llvm-project/llvm/test/Transforms/LoopVectorize/X86/runtime-limit.ll (revision 7d7577256b76e4293f455b8093504d5f7044ab4b)
1be51fa45SRoman Lebedev; RUN: opt < %s -passes=loop-vectorize,dce,instcombine -pass-remarks=loop-vectorize -pass-remarks-analysis=loop-vectorize -pass-remarks-missed=loop-vectorize -S 2>&1 | FileCheck %s
2c773d0f9SFlorian Hahn
3c773d0f9SFlorian Hahntarget datalayout = "e-p:64:64:64-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:64:64-f32:32:32-f64:64:64-v64:64:64-v128:128:128-a0:0:64-s0:64:64-f80:128:128-n8:16:32:64-S128"
4c773d0f9SFlorian Hahn
5c773d0f9SFlorian Hahntarget triple = "x86_64-unknown-linux"
6c773d0f9SFlorian Hahn
7c773d0f9SFlorian Hahn; First loop produced diagnostic pass remark.
8c773d0f9SFlorian Hahn;CHECK: remark: {{.*}}:0:0: vectorized loop (vectorization width: 4, interleaved count: 2)
9c773d0f9SFlorian Hahn; Second loop produces diagnostic analysis remark.
10644a965cSFlorian Hahn;CHECK: remark: {{.*}}:0:0: vectorized loop (vectorization width: 4, interleaved count: 1)
11c773d0f9SFlorian Hahn
12c773d0f9SFlorian Hahn; We are vectorizing with 6 runtime checks.
13c773d0f9SFlorian Hahn;CHECK-LABEL: func1x6(
14c773d0f9SFlorian Hahn;CHECK: <4 x i32>
15c773d0f9SFlorian Hahn;CHECK: ret
16*7d757725SNikita Popovdefine i32 @func1x6(ptr nocapture %out, ptr nocapture %A, ptr nocapture %B, ptr nocapture %C, ptr nocapture %D, ptr nocapture %E, ptr nocapture %F) {
17c773d0f9SFlorian Hahnentry:
18c773d0f9SFlorian Hahn  br label %for.body
19c773d0f9SFlorian Hahn
20c773d0f9SFlorian Hahnfor.body:                                         ; preds = %for.body, %entry
21c773d0f9SFlorian Hahn  %i.016 = phi i64 [ 0, %entry ], [ %inc, %for.body ]
22*7d757725SNikita Popov  %arrayidx = getelementptr inbounds i32, ptr %A, i64 %i.016
23*7d757725SNikita Popov  %0 = load i32, ptr %arrayidx, align 4
24*7d757725SNikita Popov  %arrayidx1 = getelementptr inbounds i32, ptr %B, i64 %i.016
25*7d757725SNikita Popov  %1 = load i32, ptr %arrayidx1, align 4
26c773d0f9SFlorian Hahn  %add = add nsw i32 %1, %0
27*7d757725SNikita Popov  %arrayidx2 = getelementptr inbounds i32, ptr %C, i64 %i.016
28*7d757725SNikita Popov  %2 = load i32, ptr %arrayidx2, align 4
29c773d0f9SFlorian Hahn  %add3 = add nsw i32 %add, %2
30*7d757725SNikita Popov  %arrayidx4 = getelementptr inbounds i32, ptr %E, i64 %i.016
31*7d757725SNikita Popov  %3 = load i32, ptr %arrayidx4, align 4
32c773d0f9SFlorian Hahn  %add5 = add nsw i32 %add3, %3
33*7d757725SNikita Popov  %arrayidx6 = getelementptr inbounds i32, ptr %F, i64 %i.016
34*7d757725SNikita Popov  %4 = load i32, ptr %arrayidx6, align 4
35c773d0f9SFlorian Hahn  %add7 = add nsw i32 %add5, %4
36*7d757725SNikita Popov  %arrayidx8 = getelementptr inbounds i32, ptr %out, i64 %i.016
37*7d757725SNikita Popov  store i32 %add7, ptr %arrayidx8, align 4
38c773d0f9SFlorian Hahn  %inc = add i64 %i.016, 1
39c773d0f9SFlorian Hahn  %exitcond = icmp eq i64 %inc, 256
40c773d0f9SFlorian Hahn  br i1 %exitcond, label %for.end, label %for.body
41c773d0f9SFlorian Hahn
42c773d0f9SFlorian Hahnfor.end:                                          ; preds = %for.body
43c773d0f9SFlorian Hahn  ret i32 undef
44c773d0f9SFlorian Hahn}
45c773d0f9SFlorian Hahn
46644a965cSFlorian Hahn; We are vectorizing with 12 runtime checks.
47c773d0f9SFlorian Hahn;CHECK-LABEL: func2x6(
48644a965cSFlorian Hahn;CHECK: <4 x i32>
49c773d0f9SFlorian Hahn;CHECK: ret
50*7d757725SNikita Popovdefine i32 @func2x6(ptr nocapture %out, ptr nocapture %out2, ptr nocapture %A, ptr nocapture %B, ptr nocapture %C, ptr nocapture %D, ptr nocapture %E, ptr nocapture %F) {
51c773d0f9SFlorian Hahnentry:
52c773d0f9SFlorian Hahn  br label %for.body
53c773d0f9SFlorian Hahn
54c773d0f9SFlorian Hahnfor.body:                                         ; preds = %for.body, %entry
55c773d0f9SFlorian Hahn  %i.037 = phi i64 [ 0, %entry ], [ %inc, %for.body ]
56*7d757725SNikita Popov  %arrayidx = getelementptr inbounds i32, ptr %A, i64 %i.037
57*7d757725SNikita Popov  %0 = load i32, ptr %arrayidx, align 4
58*7d757725SNikita Popov  %arrayidx1 = getelementptr inbounds i32, ptr %B, i64 %i.037
59*7d757725SNikita Popov  %1 = load i32, ptr %arrayidx1, align 4
60c773d0f9SFlorian Hahn  %add = add nsw i32 %1, %0
61*7d757725SNikita Popov  %arrayidx2 = getelementptr inbounds i32, ptr %C, i64 %i.037
62*7d757725SNikita Popov  %2 = load i32, ptr %arrayidx2, align 4
63c773d0f9SFlorian Hahn  %add3 = add nsw i32 %add, %2
64*7d757725SNikita Popov  %arrayidx4 = getelementptr inbounds i32, ptr %E, i64 %i.037
65*7d757725SNikita Popov  %3 = load i32, ptr %arrayidx4, align 4
66c773d0f9SFlorian Hahn  %add5 = add nsw i32 %add3, %3
67*7d757725SNikita Popov  %arrayidx6 = getelementptr inbounds i32, ptr %F, i64 %i.037
68*7d757725SNikita Popov  %4 = load i32, ptr %arrayidx6, align 4
69c773d0f9SFlorian Hahn  %add7 = add nsw i32 %add5, %4
70*7d757725SNikita Popov  %arrayidx8 = getelementptr inbounds i32, ptr %out, i64 %i.037
71*7d757725SNikita Popov  store i32 %add7, ptr %arrayidx8, align 4
72*7d757725SNikita Popov  %5 = load i32, ptr %arrayidx, align 4
73*7d757725SNikita Popov  %6 = load i32, ptr %arrayidx1, align 4
74c773d0f9SFlorian Hahn  %add11 = add nsw i32 %6, %5
75*7d757725SNikita Popov  %7 = load i32, ptr %arrayidx2, align 4
76c773d0f9SFlorian Hahn  %add13 = add nsw i32 %add11, %7
77*7d757725SNikita Popov  %8 = load i32, ptr %arrayidx4, align 4
78c773d0f9SFlorian Hahn  %add15 = add nsw i32 %add13, %8
79*7d757725SNikita Popov  %9 = load i32, ptr %arrayidx6, align 4
80c773d0f9SFlorian Hahn  %add17 = add nsw i32 %add15, %9
81*7d757725SNikita Popov  %arrayidx18 = getelementptr inbounds i32, ptr %out2, i64 %i.037
82*7d757725SNikita Popov  store i32 %add17, ptr %arrayidx18, align 4
83c773d0f9SFlorian Hahn  %inc = add i64 %i.037, 1
84c773d0f9SFlorian Hahn  %exitcond = icmp eq i64 %inc, 256
85c773d0f9SFlorian Hahn  br i1 %exitcond, label %for.end, label %for.body
86c773d0f9SFlorian Hahn
87c773d0f9SFlorian Hahnfor.end:                                          ; preds = %for.body
88c773d0f9SFlorian Hahn  ret i32 undef
89c773d0f9SFlorian Hahn}
90