; xref: /llvm-project/llvm/test/Transforms/CodeExtractor/PartialInlinePGOMultiRegion.ll (revision bbbbbfbdcb1ab1ba9857138dfa0f2355da8e4499)
; RUN: opt -S -passes=partial-inliner -min-block-execution=1 -skip-partial-inlining-cost-analysis < %s | FileCheck %s
; A dummy block (if.then.b) is required as the successor of if.then because the
; partial inliner (PI) requires a region to contain more than one basic block.
; @bar is the callee that @foo calls in this test.
;
; It runs two back-to-back loops with the same shape. Each iteration tests
; whether %value is a multiple of 20 and then accumulates into %sum either
;   value + i * 5   (if.then / if.then2), or
;   value - i       (if.else / if.else2).
; Branch weights !32 give the if.then / if.then2 edges a weight of 0, which
; marks them as the never-taken side of the profile. Each of those blocks is
; followed by an otherwise empty successor (if.then.b / if.then2.b).
;
; The function ends with a callbr to inline asm whose indirect target and
; fallthrough both reach l_yes, where %sum is returned.
; NOTE(review): presumably the callbr is here to exercise the pass on a callee
; that contains asm-goto control flow -- confirm against the original commit.
define signext i32 @bar(i32 signext %value, i32 signext %ub) #0 !prof !30 {
entry:
  ; Spill both arguments and zero-initialise the accumulator and the counter.
  %value.addr = alloca i32, align 4
  %ub.addr = alloca i32, align 4
  %sum = alloca i32, align 4
  %i = alloca i32, align 4
  store i32 %value, ptr %value.addr, align 4
  store i32 %ub, ptr %ub.addr, align 4
  store i32 0, ptr %sum, align 4
  store i32 0, ptr %i, align 4
  br label %for.cond

; ---- first loop -----------------------------------------------------------

for.cond:                                         ; preds = %for.inc, %entry
  ; Continue while i < ub.
  %0 = load i32, ptr %i, align 4
  %1 = load i32, ptr %ub.addr, align 4
  %cmp = icmp slt i32 %0, %1
  br i1 %cmp, label %for.body, label %for.cond2, !prof !31

for.body:                                         ; preds = %for.cond
  ; value % 20 == 0 selects if.then; !32 gives that edge weight 0.
  %2 = load i32, ptr %value.addr, align 4
  %rem = srem i32 %2, 20
  %cmp1 = icmp eq i32 %rem, 0
  br i1 %cmp1, label %if.then, label %if.else, !prof !32

if.then:                                          ; preds = %for.body
  ; sum += value + i * 5
  %3 = load i32, ptr %value.addr, align 4
  %4 = load i32, ptr %i, align 4
  %mul = mul nsw i32 %4, 5
  %add = add nsw i32 %3, %mul
  %5 = load i32, ptr %sum, align 4
  %add2 = add nsw i32 %5, %add
  store i32 %add2, ptr %sum, align 4
  br label %if.then.b

if.then.b:                                        ; preds = %if.then
  ; Dummy block: gives the if.then region a second basic block.
  br label %if.end

if.else:                                          ; preds = %for.body
  ; sum += value - i
  %6 = load i32, ptr %value.addr, align 4
  %7 = load i32, ptr %i, align 4
  %sub = sub nsw i32 %6, %7
  %8 = load i32, ptr %sum, align 4
  %add3 = add nsw i32 %8, %sub
  store i32 %add3, ptr %sum, align 4
  br label %if.end

if.end:                                           ; preds = %if.else, %if.then.b
  br label %for.inc

for.inc:                                          ; preds = %if.end
  ; ++i
  %9 = load i32, ptr %i, align 4
  %inc = add nsw i32 %9, 1
  store i32 %inc, ptr %i, align 4
  br label %for.cond

; ---- second loop (same shape; %i is not reset in between) -----------------

for.cond2:                                        ; preds = %for.inc2, %for.cond
  ; Continue while i < ub.
  %10 = load i32, ptr %i, align 4
  %11 = load i32, ptr %ub.addr, align 4
  %cmp2 = icmp slt i32 %10, %11
  br i1 %cmp2, label %for.body2, label %for.end, !prof !31

for.body2:                                        ; preds = %for.cond2
  ; value % 20 == 0 selects if.then2; !32 gives that edge weight 0.
  %12 = load i32, ptr %value.addr, align 4
  %rem2 = srem i32 %12, 20
  %cmp3 = icmp eq i32 %rem2, 0
  br i1 %cmp3, label %if.then2, label %if.else2, !prof !32

if.then2:                                         ; preds = %for.body2
  ; sum += value + i * 5
  %13 = load i32, ptr %value.addr, align 4
  %14 = load i32, ptr %i, align 4
  %mul2 = mul nsw i32 %14, 5
  %add4 = add nsw i32 %13, %mul2
  %15 = load i32, ptr %sum, align 4
  %add5 = add nsw i32 %15, %add4
  store i32 %add5, ptr %sum, align 4
  br label %if.then2.b

if.then2.b:                                       ; preds = %if.then2
  ; Dummy block: gives the if.then2 region a second basic block.
  br label %if.end2

if.else2:                                         ; preds = %for.body2
  ; sum += value - i
  %16 = load i32, ptr %value.addr, align 4
  %17 = load i32, ptr %i, align 4
  %sub2 = sub nsw i32 %16, %17
  %18 = load i32, ptr %sum, align 4
  %add6 = add nsw i32 %18, %sub2
  store i32 %add6, ptr %sum, align 4
  br label %if.end2

if.end2:                                          ; preds = %if.else2, %if.then2.b
  br label %for.inc2

for.inc2:                                         ; preds = %if.end2
  ; ++i
  %19 = load i32, ptr %i, align 4
  %inc2 = add nsw i32 %19, 1
  store i32 %inc2, ptr %i, align 4
  br label %for.cond2

; ---- exit -----------------------------------------------------------------

for.end:                                          ; preds = %for.cond2
  ; callbr to inline asm: falls through to asm.fallthrough, or transfers to the
  ; indirect target l_yes (the "!i" label constraint, referenced as ${0:l}).
  callbr void asm sideeffect "1: nop\0A\09.quad b, ${0:l}, $$5\0A\09", "!i,~{dirflag},~{fpsr},~{flags}"()
          to label %asm.fallthrough [label %l_yes]

asm.fallthrough:                                  ; preds = %for.end
  br label %l_yes

l_yes:                                            ; preds = %asm.fallthrough, %for.end
  ; Both callbr successors end up here; return the accumulated sum.
  %20 = load i32, ptr %sum, align 4
  ret i32 %20
}
112
; @foo is the caller under test: it spills its two arguments, reloads them and
; forwards them to @bar, returning @bar's result unchanged.
;
; The FileCheck directives placed inside the body describe the expected output
; of the pass for @foo: the direct call to @bar must not appear ahead of the
; first codeRepl block, and calls to the two outlined functions
; (@bar.1.if.then and @bar.1.if.then2) must be present.
define signext i32 @foo(i32 signext %value, i32 signext %ub) #0 !prof !30 {
; CHECK-LABEL: @foo
; CHECK-NOT: call signext i32 @bar
; CHECK: codeRepl1.i:
; CHECK: call void @bar.1.if.then
; CHECK: codeRepl.i:
; CHECK: call void @bar.1.if.then2
entry:
  ; Stack slots for the incoming arguments.
  %value.addr = alloca i32, align 4
  %ub.addr = alloca i32, align 4
  store i32 %value, ptr %value.addr, align 4
  store i32 %ub, ptr %ub.addr, align 4
  ; Reload the arguments and make the single call site of @bar.
  %0 = load i32, ptr %value.addr, align 4
  %1 = load i32, ptr %ub.addr, align 4
  %call = call signext i32 @bar(i32 signext %0, i32 signext %1)
  ret i32 %call
}
130
; CHECK-LABEL: define internal void @bar.1.if.then2
; CHECK: .exitStub:
; CHECK: ret void
134
; CHECK-LABEL: define internal void @bar.1.if.then
; CHECK: .exitStub:
; CHECK: ret void
138
; Module-level metadata: module flags (including the profile summary), the
; producer identification string, and the !prof nodes referenced by @bar and
; @foo.
!llvm.module.flags = !{!0, !1, !2}
!llvm.ident = !{!29}

!0 = !{i32 1, !"wchar_size", i32 4}
!1 = !{i32 7, !"PIC Level", i32 2}

; Profile summary (instrumentation-based profile format).
!2 = !{i32 1, !"ProfileSummary", !3}
!3 = !{!4, !5, !6, !7, !8, !9, !10, !11}
!4 = !{!"ProfileFormat", !"InstrProf"}
!5 = !{!"TotalCount", i64 103}
!6 = !{!"MaxCount", i64 100}
!7 = !{!"MaxInternalCount", i64 1}
!8 = !{!"MaxFunctionCount", i64 100}
!9 = !{!"NumCounts", i64 5}
!10 = !{!"NumFunctions", i64 3}
!11 = !{!"DetailedSummary", !12}

; Detailed summary entries; each node below is a (cutoff, min count, number of
; counts) triple.
; NOTE(review): !18 and !19 are each listed twice in !12. Kept exactly as found;
; confirm whether the repetition is intentional before removing it.
!12 = !{!13, !14, !15, !16, !17, !18, !18, !19, !19, !20, !21, !22, !23, !24, !25, !26, !27, !28}
!13 = !{i32 10000, i64 100, i32 1}
!14 = !{i32 100000, i64 100, i32 1}
!15 = !{i32 200000, i64 100, i32 1}
!16 = !{i32 300000, i64 100, i32 1}
!17 = !{i32 400000, i64 100, i32 1}
!18 = !{i32 500000, i64 100, i32 1}
!19 = !{i32 600000, i64 100, i32 1}
!20 = !{i32 700000, i64 100, i32 1}
!21 = !{i32 800000, i64 100, i32 1}
!22 = !{i32 900000, i64 100, i32 1}
!23 = !{i32 950000, i64 100, i32 1}
!24 = !{i32 990000, i64 1, i32 4}
!25 = !{i32 999000, i64 1, i32 4}
!26 = !{i32 999900, i64 1, i32 4}
!27 = !{i32 999990, i64 1, i32 4}
!28 = !{i32 999999, i64 1, i32 4}

!29 = !{!"clang version 6.0.0 (123456)"}

; !prof attachments.
; !30: entry count attached to both @bar and @foo.
!30 = !{!"function_entry_count", i64 2}
; !31: loop-condition branches in @bar (loop body 100, loop exit 1).
!31 = !{!"branch_weights", i32 100, i32 1}
; !32: value % 20 == 0 branches in @bar (if.then* 0, if.else* 100).
!32 = !{!"branch_weights", i32 0, i32 100}
175