xref: /llvm-project/llvm/test/Transforms/Inline/memprof_inline.ll (revision 35c7e457e8b00a4772b00b0100748f9a517ea0c2)
1;; Test for memprof metadata propagation, ensuring metadata is simplified
2;; to function attributes appropriately after inlining profiled call chains.
3;;
4;; The C++ source below was used to generate the IR in this file and its
5;; memprof profile:
6;;
7;; #include <stdlib.h>
8;; #include <string.h>
9;; #include <unistd.h>
10;; char *foo() {
11;;   return new char[10];
12;; }
13;; char *foo2() {
14;;   return foo();
15;; }
16;; int main(int argc, char **argv) {
17;;   char *c = foo();
18;;   char *d = foo();
19;;   char *e = foo2();
20;;   memset(c, 0, 10);
21;;   memset(d, 0, 10);
22;;   memset(e, 0, 10);
23;;   delete[] c;
24;;   sleep(200);
25;;   delete[] d;
26;;   delete[] e;
27;;   return 0;
28;; }
29
30
31; RUN: opt -passes=inline %s -S | FileCheck %s
32
33; ModuleID = 'memprof_inline.cc'
34source_filename = "memprof_inline.cc"
35target datalayout = "e-m:e-p270:32:32-p271:32:32-p272:64:64-i64:64-f80:128-n8:16:32:64-S128"
36target triple = "x86_64-unknown-linux-gnu"
37
38; Function Attrs: mustprogress uwtable
;; foo(): the allocating function. Its operator new[] call carries the profiled
;; contexts (!memprof !43) and its own stack id (!callsite !50). The callee
;; @_Znam is only declared in this module, so there is nothing to inline here
;; and the call is expected to be printed with its !memprof attachment.
39; CHECK-LABEL: define dso_local noundef ptr @_Z3foov
40define dso_local noundef ptr @_Z3foov() #0 !dbg !39 {
41entry:
42  ;; We should keep the original memprof metadata intact.
43  ; CHECK: call {{.*}} @_Znam{{.*}} !memprof ![[ORIGMEMPROF:[0-9]+]]
44  %call = call noalias noundef nonnull ptr @_Znam(i64 noundef 10) #6, !dbg !42, !memprof !43, !callsite !50
45  ; CHECK-NEXT: ret
46  ret ptr %call, !dbg !51
47}
48
49; Function Attrs: nobuiltin allocsize(0)
;; Itanium-mangled operator new[](unsigned long); called from foo() for
;; `new char[10]`. Declaration only, so it is never an inlining candidate.
50declare noundef nonnull ptr @_Znam(i64 noundef) #1
51
52; Function Attrs: mustprogress uwtable
;; foo2(): thin wrapper that calls foo(). Its !callsite id (!54) equals the
;; second stack id of exactly one profiled context (!49, tagged "cold"), so once
;; foo() is inlined here the operator new[] call is expected to carry the cold
;; attribute group instead of !memprof metadata.
53; CHECK-LABEL: define dso_local noundef ptr @_Z4foo2v
54define dso_local noundef ptr @_Z4foo2v() #0 !dbg !52 {
55entry:
56  ; CHECK: call {{.*}} @_Znam{{.*}} #[[COLD:[0-9]+]]
57  %call = call noundef ptr @_Z3foov(), !dbg !53, !callsite !54
58  ret ptr %call, !dbg !55
59}
60
61; Function Attrs: mustprogress norecurse uwtable
;; main(): makes three allocations through foo()/foo2(), memsets each buffer,
;; then frees them with a sleep(200) between the first and the remaining two
;; deletes. Each of the three call sites below is expected to end up as an
;; inlined operator new[] call whose attribute group reflects the single
;; profiled context that matches that site's !callsite id.
62; CHECK-LABEL: define dso_local noundef i32 @main
63define dso_local noundef i32 @main(i32 noundef %argc, ptr noundef %argv) #2 !dbg !56 {
64entry:
65  %retval = alloca i32, align 4
66  %argc.addr = alloca i32, align 4
67  %argv.addr = alloca ptr, align 8
68  %c = alloca ptr, align 8
69  %d = alloca ptr, align 8
70  %e = alloca ptr, align 8
71  store i32 0, ptr %retval, align 4
72  store i32 %argc, ptr %argc.addr, align 4
73  store ptr %argv, ptr %argv.addr, align 8
  ;; c = foo(): callsite !58 matches the second id of stack !47 ("notcold").
74  ; CHECK: call {{.*}} @_Znam{{.*}} #[[NOTCOLD:[0-9]+]]
75  %call = call noundef ptr @_Z3foov(), !dbg !57, !callsite !58
76  store ptr %call, ptr %c, align 8, !dbg !59
  ;; d = foo(): callsite !61 matches the second id of stack !45 ("cold").
77  ; CHECK: call {{.*}} @_Znam{{.*}} #[[COLD]]
78  %call1 = call noundef ptr @_Z3foov(), !dbg !60, !callsite !61
79  store ptr %call1, ptr %d, align 8, !dbg !62
  ;; e = foo2(): this site's id (!64) appears in no profiled stack; the frame
  ;; that matches a context is foo2's own call to foo (!54 -> stack !49, "cold").
80  ; CHECK: call {{.*}} @_Znam{{.*}} #[[COLD]]
81  %call2 = call noundef ptr @_Z4foo2v(), !dbg !63, !callsite !64
82  store ptr %call2, ptr %e, align 8, !dbg !65
  ;; memset(c/d/e, 0, 10)
83  %0 = load ptr, ptr %c, align 8, !dbg !66
84  call void @llvm.memset.p0.i64(ptr align 1 %0, i8 0, i64 10, i1 false), !dbg !67
85  %1 = load ptr, ptr %d, align 8, !dbg !68
86  call void @llvm.memset.p0.i64(ptr align 1 %1, i8 0, i64 10, i1 false), !dbg !69
87  %2 = load ptr, ptr %e, align 8, !dbg !70
88  call void @llvm.memset.p0.i64(ptr align 1 %2, i8 0, i64 10, i1 false), !dbg !71
  ;; delete[] c: operator delete[] is only called when the pointer is non-null.
89  %3 = load ptr, ptr %c, align 8, !dbg !72
90  %isnull = icmp eq ptr %3, null, !dbg !73
91  br i1 %isnull, label %delete.end, label %delete.notnull, !dbg !73
92
93delete.notnull:                                   ; preds = %entry
94  call void @_ZdaPv(ptr noundef %3) #7, !dbg !74
95  br label %delete.end, !dbg !74
96
97delete.end:                                       ; preds = %delete.notnull, %entry
  ;; sleep(200), then delete[] d with the same null-guarded pattern.
98  %call4 = call i32 @sleep(i32 noundef 200), !dbg !76
99  %4 = load ptr, ptr %d, align 8, !dbg !77
100  %isnull5 = icmp eq ptr %4, null, !dbg !78
101  br i1 %isnull5, label %delete.end7, label %delete.notnull6, !dbg !78
102
103delete.notnull6:                                  ; preds = %delete.end
104  call void @_ZdaPv(ptr noundef %4) #7, !dbg !79
105  br label %delete.end7, !dbg !79
106
107delete.end7:                                      ; preds = %delete.notnull6, %delete.end
  ;; delete[] e
108  %5 = load ptr, ptr %e, align 8, !dbg !80
109  %isnull8 = icmp eq ptr %5, null, !dbg !81
110  br i1 %isnull8, label %delete.end10, label %delete.notnull9, !dbg !81
111
112delete.notnull9:                                  ; preds = %delete.end7
113  call void @_ZdaPv(ptr noundef %5) #7, !dbg !82
114  br label %delete.end10, !dbg !82
115
116delete.end10:                                     ; preds = %delete.notnull9, %delete.end7
117  ret i32 0, !dbg !83
118}
119
120; Function Attrs: argmemonly nofree nounwind willreturn writeonly
;; External declarations used by main(): the memset intrinsic, the
;; Itanium-mangled operator delete[](void*) (@_ZdaPv), and sleep().
121declare void @llvm.memset.p0.i64(ptr nocapture writeonly, i8, i64, i1 immarg) #3
122
123; Function Attrs: nobuiltin nounwind
124declare void @_ZdaPv(ptr noundef) #4
125
126declare i32 @sleep(i32 noundef) #5
127
128; CHECK: attributes #[[COLD]] = { builtin allocsize(0) "memprof"="cold" }
129; CHECK: attributes #[[NOTCOLD]] = { builtin allocsize(0) "memprof"="notcold" }
;; The two expected groups above are the operator new[] call-site group (#6
;; below: builtin allocsize(0)) extended with a "memprof" string attribute.
130
;; Group usage in this file:
;;   #0 foo and foo2 definitions    #1 @_Znam declaration
;;   #2 main definition             #3 llvm.memset declaration
;;   #4 @_ZdaPv declaration         #5 @sleep declaration
;;   #6 call site of @_Znam         #7 call sites of @_ZdaPv
131attributes #0 = { mustprogress uwtable "disable-tail-calls"="true" "frame-pointer"="all" "min-legal-vector-width"="0" "no-trapping-math"="true" "stack-protector-buffer-size"="8" "target-cpu"="x86-64" "target-features"="+cx8,+fxsr,+mmx,+sse,+sse2,+x87" "tune-cpu"="generic" }
132attributes #1 = { nobuiltin allocsize(0) "disable-tail-calls"="true" "frame-pointer"="all" "no-trapping-math"="true" "stack-protector-buffer-size"="8" "target-cpu"="x86-64" "target-features"="+cx8,+fxsr,+mmx,+sse,+sse2,+x87" "tune-cpu"="generic" }
133attributes #2 = { mustprogress norecurse uwtable "disable-tail-calls"="true" "frame-pointer"="all" "min-legal-vector-width"="0" "no-trapping-math"="true" "stack-protector-buffer-size"="8" "target-cpu"="x86-64" "target-features"="+cx8,+fxsr,+mmx,+sse,+sse2,+x87" "tune-cpu"="generic" }
134attributes #3 = { argmemonly nofree nounwind willreturn writeonly }
135attributes #4 = { nobuiltin nounwind "disable-tail-calls"="true" "frame-pointer"="all" "no-trapping-math"="true" "stack-protector-buffer-size"="8" "target-cpu"="x86-64" "target-features"="+cx8,+fxsr,+mmx,+sse,+sse2,+x87" "tune-cpu"="generic" }
136attributes #5 = { "disable-tail-calls"="true" "frame-pointer"="all" "no-trapping-math"="true" "stack-protector-buffer-size"="8" "target-cpu"="x86-64" "target-features"="+cx8,+fxsr,+mmx,+sse,+sse2,+x87" "tune-cpu"="generic" }
137attributes #6 = { builtin allocsize(0) }
138attributes #7 = { builtin nounwind }
139
140!llvm.dbg.cu = !{!0}
141!llvm.module.flags = !{!2, !3, !4, !5, !6, !7, !8, !9}
142!llvm.ident = !{!38}
143
;; Module-level metadata: compile unit and source file (!0, !1), module flags
;; (!2-!9), and the producer string (!38). The compile unit uses line-tables-only
;; debug info with debugInfoForProfiling enabled.
144!0 = distinct !DICompileUnit(language: DW_LANG_C_plus_plus_14, file: !1, producer: "clang version 15.0.0 (https://github.com/llvm/llvm-project.git e09c924f98ec157adeaa74819b0aec9a07a1b552)", isOptimized: false, runtimeVersion: 0, emissionKind: LineTablesOnly, splitDebugInlining: false, debugInfoForProfiling: true, nameTableKind: None)
145!1 = !DIFile(filename: "memprof_inline.cc", directory: "/usr/local/google/home/tejohnson/llvm/tmp", checksumkind: CSK_MD5, checksum: "8711f6fd269e6cb5611fef48bc906eab")
146!2 = !{i32 7, !"Dwarf Version", i32 5}
147!3 = !{i32 2, !"Debug Info Version", i32 3}
148!4 = !{i32 1, !"wchar_size", i32 4}
149!5 = !{i32 7, !"PIC Level", i32 2}
150!6 = !{i32 7, !"PIE Level", i32 2}
151!7 = !{i32 7, !"uwtable", i32 2}
152!8 = !{i32 7, !"frame-pointer", i32 2}
;; ProfileSummary module flag (!9 -> !10): InstrProf format with every count and
;; every detailed-summary entry (!22-!37) set to zero.
153!9 = !{i32 1, !"ProfileSummary", !10}
154!10 = !{!11, !12, !13, !14, !15, !16, !17, !18, !19, !20}
155!11 = !{!"ProfileFormat", !"InstrProf"}
156!12 = !{!"TotalCount", i64 0}
157!13 = !{!"MaxCount", i64 0}
158!14 = !{!"MaxInternalCount", i64 0}
159!15 = !{!"MaxFunctionCount", i64 0}
160!16 = !{!"NumCounts", i64 0}
161!17 = !{!"NumFunctions", i64 0}
162!18 = !{!"IsPartialProfile", i64 0}
163!19 = !{!"PartialProfileRatio", double 0.000000e+00}
164!20 = !{!"DetailedSummary", !21}
165!21 = !{!22, !23, !24, !25, !26, !27, !28, !29, !30, !31, !32, !33, !34, !35, !36, !37}
166!22 = !{i32 10000, i64 0, i32 0}
167!23 = !{i32 100000, i64 0, i32 0}
168!24 = !{i32 200000, i64 0, i32 0}
169!25 = !{i32 300000, i64 0, i32 0}
170!26 = !{i32 400000, i64 0, i32 0}
171!27 = !{i32 500000, i64 0, i32 0}
172!28 = !{i32 600000, i64 0, i32 0}
173!29 = !{i32 700000, i64 0, i32 0}
174!30 = !{i32 800000, i64 0, i32 0}
175!31 = !{i32 900000, i64 0, i32 0}
176!32 = !{i32 950000, i64 0, i32 0}
177!33 = !{i32 990000, i64 0, i32 0}
178!34 = !{i32 999000, i64 0, i32 0}
179!35 = !{i32 999900, i64 0, i32 0}
180!36 = !{i32 999990, i64 0, i32 0}
181!37 = !{i32 999999, i64 0, i32 0}
182!38 = !{!"clang version 15.0.0 (https://github.com/llvm/llvm-project.git e09c924f98ec157adeaa74819b0aec9a07a1b552)"}
183!39 = distinct !DISubprogram(name: "foo", linkageName: "_Z3foov", scope: !1, file: !1, line: 4, type: !40, scopeLine: 4, flags: DIFlagPrototyped, spFlags: DISPFlagDefinition, unit: !0, retainedNodes: !41)
184!40 = !DISubroutineType(types: !41)
185!41 = !{}
186!42 = !DILocation(line: 5, column: 10, scope: !39)
;; !43 is the !memprof attachment on the operator new[] call in foo(): a list of
;; three profiled contexts (!44, !46, !48). Each context pairs a stack-id list
;; with an allocation type string. Every stack begins with the same id as the
;; allocation call's own !callsite (!50) and ends with the id of one caller:
;;   !45 -> second foo() call in main (!61), "cold"
;;   !47 -> first foo() call in main (!58), "notcold"
;;   !49 -> foo() call in foo2 (!54),       "cold"
;; The FileCheck directives interleaved below expect this metadata to be printed
;; with the same structure and values for the un-inlined copy of foo().
187!43 = !{!44, !46, !48}
188!44 = !{!45, !"cold"}
189!45 = !{i64 -2458008693472584243, i64 7394638144382192936}
190!46 = !{!47, !"notcold"}
191!47 = !{i64 -2458008693472584243, i64 -8908997186479157179}
192!48 = !{!49, !"cold"}
193!49 = !{i64 -2458008693472584243, i64 -8079659623765193173}
194; CHECK: ![[ORIGMEMPROF]] = !{![[ORIGMIB1:[0-9]+]], ![[ORIGMIB2:[0-9]+]], ![[ORIGMIB3:[0-9]+]]}
195; CHECK: ![[ORIGMIB1]] = !{![[ORIGMIBSTACK1:[0-9]+]], !"cold"}
196; CHECK: ![[ORIGMIBSTACK1]] = !{i64 -2458008693472584243, i64 7394638144382192936}
197; CHECK: ![[ORIGMIB2]] = !{![[ORIGMIBSTACK2:[0-9]+]], !"notcold"}
198; CHECK: ![[ORIGMIBSTACK2]] = !{i64 -2458008693472584243, i64 -8908997186479157179}
199; CHECK: ![[ORIGMIB3]] = !{![[ORIGMIBSTACK3:[0-9]+]], !"cold"}
200; CHECK: ![[ORIGMIBSTACK3]] = !{i64 -2458008693472584243, i64 -8079659623765193173}
;; !50: stack id of the operator new[] call itself (first id of every stack above).
201!50 = !{i64 -2458008693472584243}
202!51 = !DILocation(line: 5, column: 3, scope: !39)
;; Debug locations for foo2 (!52) and main (!56), interleaved with the !callsite
;; stack ids attached to their calls:
;;   !54 foo2 -> foo     (equals the second id of profiled stack !49)
;;   !58 main -> foo #1  (equals the second id of profiled stack !47)
;;   !61 main -> foo #2  (equals the second id of profiled stack !45)
;;   !64 main -> foo2    (appears in no profiled stack)
203!52 = distinct !DISubprogram(name: "foo2", linkageName: "_Z4foo2v", scope: !1, file: !1, line: 7, type: !40, scopeLine: 7, flags: DIFlagPrototyped, spFlags: DISPFlagDefinition, unit: !0, retainedNodes: !41)
204!53 = !DILocation(line: 8, column: 10, scope: !52)
205!54 = !{i64 -8079659623765193173}
206!55 = !DILocation(line: 8, column: 3, scope: !52)
207!56 = distinct !DISubprogram(name: "main", scope: !1, file: !1, line: 16, type: !40, scopeLine: 16, flags: DIFlagPrototyped, spFlags: DISPFlagDefinition, unit: !0, retainedNodes: !41)
208!57 = !DILocation(line: 17, column: 13, scope: !56)
209!58 = !{i64 -8908997186479157179}
210!59 = !DILocation(line: 17, column: 9, scope: !56)
211!60 = !DILocation(line: 18, column: 13, scope: !56)
212!61 = !{i64 7394638144382192936}
213!62 = !DILocation(line: 18, column: 9, scope: !56)
214!63 = !DILocation(line: 19, column: 13, scope: !56)
215!64 = !{i64 -5510257407004945023}
216!65 = !DILocation(line: 19, column: 9, scope: !56)
217!66 = !DILocation(line: 21, column: 10, scope: !56)
218!67 = !DILocation(line: 21, column: 3, scope: !56)
219!68 = !DILocation(line: 22, column: 10, scope: !56)
220!69 = !DILocation(line: 22, column: 3, scope: !56)
221!70 = !DILocation(line: 23, column: 10, scope: !56)
222!71 = !DILocation(line: 23, column: 3, scope: !56)
223!72 = !DILocation(line: 25, column: 12, scope: !56)
224!73 = !DILocation(line: 25, column: 3, scope: !56)
;; !74, !79 and !82 (the operator delete[] calls) are scoped to !75, a lexical
;; block file with discriminator 2 inside main.
225!74 = !DILocation(line: 25, column: 3, scope: !75)
226!75 = !DILexicalBlockFile(scope: !56, file: !1, discriminator: 2)
227!76 = !DILocation(line: 26, column: 3, scope: !56)
228!77 = !DILocation(line: 27, column: 12, scope: !56)
229!78 = !DILocation(line: 27, column: 3, scope: !56)
230!79 = !DILocation(line: 27, column: 3, scope: !75)
231!80 = !DILocation(line: 28, column: 12, scope: !56)
232!81 = !DILocation(line: 28, column: 3, scope: !56)
233!82 = !DILocation(line: 28, column: 3, scope: !75)
234!83 = !DILocation(line: 30, column: 3, scope: !56)
235