xref: /llvm-project/llvm/test/Transforms/PGOProfile/cspgo_sample.ll (revision b4fcaa137f057e68a9011b26c11627a16a8c9374)
1b1ca2a95Sxur-llvm; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 2
2b1ca2a95Sxur-llvm; REQUIRES: x86-registered-target
3b1ca2a95Sxur-llvm
; Test pipeline: run `opt -module-summary` on this module and on
; Inputs/cspgo_bar_sample.ll, link the two bitcode files with llvm-lto2 using
; -lto-cspgo-gen together with -enable-sampled-instrumentation, then
; disassemble %t.1.4.opt.bc (presumably one of the -save-temps outputs --
; confirm) and match it against the CSGEN check prefix. The -r= options give
; the per-module symbol resolutions for every symbol named in this test.
4b1ca2a95Sxur-llvm; RUN: opt -module-summary %s -o %t1.bc
5b1ca2a95Sxur-llvm; RUN: opt -module-summary %S/Inputs/cspgo_bar_sample.ll -o %t2.bc
6b1ca2a95Sxur-llvm; RUN: llvm-lto2 run -lto-cspgo-profile-file=alloc -enable-sampled-instrumentation -lto-cspgo-gen -save-temps -o %t %t1.bc %t2.bc \
7b1ca2a95Sxur-llvm; RUN:   -r=%t1.bc,foo,pl \
8b1ca2a95Sxur-llvm; RUN:   -r=%t1.bc,bar,l \
9b1ca2a95Sxur-llvm; RUN:   -r=%t1.bc,main,plx \
10b1ca2a95Sxur-llvm; RUN:   -r=%t1.bc,__llvm_profile_filename,plx \
11b1ca2a95Sxur-llvm; RUN:   -r=%t1.bc,__llvm_profile_raw_version,plx \
12b1ca2a95Sxur-llvm; RUN:   -r=%t1.bc,__llvm_profile_sampling,pl \
13b1ca2a95Sxur-llvm; RUN:   -r=%t2.bc,bar,pl \
14b1ca2a95Sxur-llvm; RUN:   -r=%t2.bc,odd,pl \
15b1ca2a95Sxur-llvm; RUN:   -r=%t2.bc,even,pl \
16b1ca2a95Sxur-llvm; RUN:   -r=%t2.bc,__llvm_profile_filename,x \
17b1ca2a95Sxur-llvm; RUN:   -r=%t2.bc,__llvm_profile_raw_version,x \
18b1ca2a95Sxur-llvm; RUN:   -r=%t2.bc,__llvm_profile_sampling,
19b1ca2a95Sxur-llvm; RUN: llvm-dis %t.1.4.opt.bc -o - | FileCheck %s --check-prefix=CSGEN
20b1ca2a95Sxur-llvm
21b1ca2a95Sxur-llvm; CSGEN: @__llvm_profile_sampling = thread_local global i16 0, comdat
22b1ca2a95Sxur-llvm; CSGEN: @__profc_
23b1ca2a95Sxur-llvm; CSGEN: @__profd_
24b1ca2a95Sxur-llvm
; Module prelude: source/target identification, then one comdat and one global
; for each of the three __llvm_profile_* symbols that the llvm-lto2 -r=
; resolutions at the top of this file refer to. The filename and raw-version
; globals are constants; the sampling counter is a thread_local i16 that
; starts at 0.
25b1ca2a95Sxur-llvmsource_filename = "cspgo.c"
26b1ca2a95Sxur-llvmtarget datalayout = "e-m:e-i64:64-f80:128-n8:16:32:64-S128"
27b1ca2a95Sxur-llvmtarget triple = "x86_64-unknown-linux-gnu"
28b1ca2a95Sxur-llvm
29b1ca2a95Sxur-llvm$__llvm_profile_filename = comdat any
30b1ca2a95Sxur-llvm$__llvm_profile_raw_version = comdat any
31b1ca2a95Sxur-llvm$__llvm_profile_sampling = comdat any
32b1ca2a95Sxur-llvm@__llvm_profile_filename = local_unnamed_addr constant [25 x i8] c"pass2/default_%m.profraw\00", comdat
33b1ca2a95Sxur-llvm@__llvm_profile_raw_version = local_unnamed_addr constant i64 216172782113783812, comdat
34b1ca2a95Sxur-llvm@__llvm_profile_sampling = thread_local global i16 0, comdat
; List the sampling counter in llvm.used. Uses opaque `ptr` syntax (as the
; check lines in this file already do) so that no pointee type has to be
; spelled out for the i16 global and no bitcast is needed.
35b1ca2a95Sxur-llvm@llvm.used = appending global [1 x ptr] [ptr @__llvm_profile_sampling], section "llvm.metadata"
36b1ca2a95Sxur-llvm
; foo: counted loop that calls @bar twice per iteration, first with the
; induction value %i.06 and then with %i.06 | 1. %i.06 starts at 0 and is
; advanced by 2 each iteration; the loop exits once the next value is no
; longer below 200000. The function carries entry count !30 and the loop
; back-edge branch carries the branch weights in !31.
; NOTE(review): both calls reference attribute group #3, but only #0 is
; defined in this file -- confirm that the dangling reference is intentional.
37b1ca2a95Sxur-llvmdefine dso_local void @foo() #0 !prof !30 {
38b1ca2a95Sxur-llvmentry:
39b1ca2a95Sxur-llvm  br label %for.body
40b1ca2a95Sxur-llvm
41b1ca2a95Sxur-llvmfor.body:
42b1ca2a95Sxur-llvm  %i.06 = phi i32 [ 0, %entry ], [ %add1, %for.body ]
43b1ca2a95Sxur-llvm  tail call void @bar(i32 %i.06) #3
44b1ca2a95Sxur-llvm  %add = or i32 %i.06, 1
45b1ca2a95Sxur-llvm  tail call void @bar(i32 %add) #3
46b1ca2a95Sxur-llvm  %add1 = add nuw nsw i32 %i.06, 2
47b1ca2a95Sxur-llvm  %cmp = icmp ult i32 %add1, 200000
48b1ca2a95Sxur-llvm  br i1 %cmp, label %for.body, label %for.end, !prof !31
49b1ca2a95Sxur-llvm
50b1ca2a95Sxur-llvmfor.end:
51b1ca2a95Sxur-llvm  ret void
52b1ca2a95Sxur-llvm}
53b1ca2a95Sxur-llvm
54b1ca2a95Sxur-llvm; CSGEN-LABEL: @foo
55b1ca2a95Sxur-llvm; CSGEN:        [[TMP0:%.*]]  = load i16, ptr @__llvm_profile_sampling, align 2
56*b4fcaa13SMichael O'Farrell; CSGEN-NEXT:   [[TMP1:%.*]] = icmp ult i16 [[TMP0]], 200
57b1ca2a95Sxur-llvm; CSGEN-NEXT:   br i1 [[TMP1]], label %{{.*}}, label %{{.*}}, !prof [[PROF:![0-9]+]]
58b1ca2a95Sxur-llvm; CSGEN:        [[TMP2:%.*]] = add i16 {{.*}}, 1
59b1ca2a95Sxur-llvm; CSGEN-NEXT:   store i16 [[TMP2]], ptr @__llvm_profile_sampling, align 2
60b1ca2a95Sxur-llvm
; bar is only declared in this module.
; NOTE(review): presumably defined by Inputs/cspgo_bar_sample.ll, which the
; test links in as the second bitcode file -- confirm against that input.
61b1ca2a95Sxur-llvmdeclare dso_local void @bar(i32)
62b1ca2a95Sxur-llvm
; main: calls @foo once and returns 0. Annotated with entry count !30.
63b1ca2a95Sxur-llvmdefine dso_local i32 @main() !prof !30 {
64b1ca2a95Sxur-llvmentry:
65b1ca2a95Sxur-llvm  tail call void @foo()
66b1ca2a95Sxur-llvm  ret i32 0
67b1ca2a95Sxur-llvm}
68b1ca2a95Sxur-llvm; CSGEN-LABEL: @main
69b1ca2a95Sxur-llvm; CSGEN:        [[TMP0:%.*]]  = load i16, ptr @__llvm_profile_sampling, align 2
70*b4fcaa13SMichael O'Farrell; CSGEN-NEXT:   [[TMP1:%.*]] = icmp ult i16 [[TMP0]], 200
71b1ca2a95Sxur-llvm; CSGEN-NEXT:   br i1 [[TMP1]], label %{{.*}}, label %{{.*}}, !prof [[PROF:![0-9]+]]
72b1ca2a95Sxur-llvm; CSGEN:        [[TMP2:%.*]] = add i16 {{.*}}, 1
73b1ca2a95Sxur-llvm; CSGEN-NEXT:   store i16 [[TMP2]], ptr @__llvm_profile_sampling, align 2
74b1ca2a95Sxur-llvm
; Attribute group #0, referenced by @foo: sets "target-cpu" to "x86-64".
75b1ca2a95Sxur-llvmattributes #0 = { "target-cpu"="x86-64" }
76b1ca2a95Sxur-llvm
; Module flags and profile metadata. !2 attaches a ProfileSummary (!3) in
; "InstrProf" format: total/max counts, counter and function totals, and the
; detailed summary list !12 (entries !13 through !28). !30 is the
; function_entry_count attached to @foo and @main, and !31 holds the
; branch_weights for the loop back-edge in @foo. There is no !29.
77b1ca2a95Sxur-llvm!llvm.module.flags = !{!0, !1, !2}
78b1ca2a95Sxur-llvm
79b1ca2a95Sxur-llvm!0 = !{i32 1, !"wchar_size", i32 4}
80b1ca2a95Sxur-llvm!1 = !{i32 1, !"EnableSplitLTOUnit", i32 0}
81b1ca2a95Sxur-llvm!2 = !{i32 1, !"ProfileSummary", !3}
82b1ca2a95Sxur-llvm!3 = !{!4, !5, !6, !7, !8, !9, !10, !11}
83b1ca2a95Sxur-llvm!4 = !{!"ProfileFormat", !"InstrProf"}
84b1ca2a95Sxur-llvm!5 = !{!"TotalCount", i64 500002}
85b1ca2a95Sxur-llvm!6 = !{!"MaxCount", i64 200000}
86b1ca2a95Sxur-llvm!7 = !{!"MaxInternalCount", i64 100000}
87b1ca2a95Sxur-llvm!8 = !{!"MaxFunctionCount", i64 200000}
88b1ca2a95Sxur-llvm!9 = !{!"NumCounts", i64 6}
89b1ca2a95Sxur-llvm!10 = !{!"NumFunctions", i64 4}
90b1ca2a95Sxur-llvm!11 = !{!"DetailedSummary", !12}
91b1ca2a95Sxur-llvm!12 = !{!13, !14, !15, !16, !17, !18, !19, !20, !21, !22, !23, !24, !25, !26, !27, !28}
92b1ca2a95Sxur-llvm!13 = !{i32 10000, i64 200000, i32 1}
93b1ca2a95Sxur-llvm!14 = !{i32 100000, i64 200000, i32 1}
94b1ca2a95Sxur-llvm!15 = !{i32 200000, i64 200000, i32 1}
95b1ca2a95Sxur-llvm!16 = !{i32 300000, i64 200000, i32 1}
96b1ca2a95Sxur-llvm!17 = !{i32 400000, i64 200000, i32 1}
97b1ca2a95Sxur-llvm!18 = !{i32 500000, i64 100000, i32 4}
98b1ca2a95Sxur-llvm!19 = !{i32 600000, i64 100000, i32 4}
99b1ca2a95Sxur-llvm!20 = !{i32 700000, i64 100000, i32 4}
100b1ca2a95Sxur-llvm!21 = !{i32 800000, i64 100000, i32 4}
101b1ca2a95Sxur-llvm!22 = !{i32 900000, i64 100000, i32 4}
102b1ca2a95Sxur-llvm!23 = !{i32 950000, i64 100000, i32 4}
103b1ca2a95Sxur-llvm!24 = !{i32 990000, i64 100000, i32 4}
104b1ca2a95Sxur-llvm!25 = !{i32 999000, i64 100000, i32 4}
105b1ca2a95Sxur-llvm!26 = !{i32 999900, i64 100000, i32 4}
106b1ca2a95Sxur-llvm!27 = !{i32 999990, i64 100000, i32 4}
107b1ca2a95Sxur-llvm!28 = !{i32 999999, i64 1, i32 6}
108b1ca2a95Sxur-llvm!30 = !{!"function_entry_count", i64 1}
109b1ca2a95Sxur-llvm!31 = !{!"branch_weights", i32 100000, i32 1}
110b1ca2a95Sxur-llvm
111b1ca2a95Sxur-llvm; CSGEN: [[PROF]] = !{!"branch_weights", i32 200, i32 65336}
112b1ca2a95Sxur-llvm
113