; Sample-profile staleness test.
;
; opt loads Inputs/profile-mismatch.prof with staleness reporting and
; persistence enabled. The test then verifies, in order:
;   1. the human-readable staleness summary written to stderr,
;   2. the staleness counters attached to the output module as metadata,
;   3. that the object file produced by llc has a .llvm_stats section,
;   4. the key/value strings llc prints for those counters in assembly.
;
; REQUIRES: x86_64-linux
; RUN: opt < %s -passes=sample-profile -sample-profile-file=%S/Inputs/profile-mismatch.prof -report-profile-staleness -persist-profile-staleness -S 2>%t -o %t.ll
; RUN: FileCheck %s --input-file %t
; RUN: FileCheck %s --input-file %t.ll -check-prefix=CHECK-MD
; RUN: llc < %t.ll -filetype=obj -o %t.obj
; RUN: llvm-objdump --section-headers %t.obj | FileCheck %s --check-prefix=CHECK-OBJ
; RUN: llc < %t.ll -filetype=asm -o - | FileCheck %s --check-prefix=CHECK-ASM

; Summary line expected on stderr (main below contains three call sites).
; CHECK: (1/3) of callsites' profile are invalid and (15/50) of samples are discarded due to callsite location mismatch.

; The same counters, persisted as name/value pairs in module metadata.
; CHECK-MD: ![[#]] = !{!"NumMismatchedCallsites", i64 1, !"NumRecoveredCallsites", i64 0, !"TotalProfiledCallsites", i64 3, !"MismatchedCallsiteSamples", i64 15, !"RecoveredCallsiteSamples", i64 0}

; CHECK-OBJ: .llvm_stats

; Each counter is expected as a key string followed by a value string, with a
; length byte in front of each string (21/22/25/24 are the lengths of the key
; names that follow them; 4 is the length of each value string).
; NOTE(review): the value strings look like base64 of the decimal counters
; ("MQ==" -> 1, "MA==" -> 0, "Mw==" -> 3, "MTU=" -> 15) - confirm against the
; emitter. The length byte preceding the first key is not checked here.
; CHECK-ASM: .ascii "NumMismatchedCallsites"
; CHECK-ASM: .byte 4
; CHECK-ASM: .ascii "MQ=="
; CHECK-ASM: .byte 21
; CHECK-ASM: .ascii "NumRecoveredCallsites"
; CHECK-ASM: .byte 4
; CHECK-ASM: .ascii "MA=="
; CHECK-ASM: .byte 22
; CHECK-ASM: .ascii "TotalProfiledCallsites"
; CHECK-ASM: .byte 4
; CHECK-ASM: .ascii "Mw=="
; CHECK-ASM: .byte 25
; CHECK-ASM: .ascii "MismatchedCallsiteSamples"
; CHECK-ASM: .byte 4
; CHECK-ASM: .ascii "MTU="
; CHECK-ASM: .byte 24
; CHECK-ASM: .ascii "RecoveredCallsiteSamples"
; CHECK-ASM: .byte 4
; CHECK-ASM: .ascii "MA=="


target datalayout = "e-m:e-p270:32:32-p271:32:32-p272:64:64-i64:64-f80:128-n8:16:32:64-S128"
target triple = "x86_64-unknown-linux-gnu"

; Global accessed only through volatile loads/stores in main.
@x = dso_local global i32 0, align 4, !dbg !0

; foo(x): writes x + 1 to a volatile local, reads it back and returns the
; reloaded value + 1. Uses attribute group #0, which lacks noinline.
; Function Attrs: nounwind uwtable
define dso_local i32 @foo(i32 noundef %x) #0 !dbg !12 {
entry:
  %y = alloca i32, align 4
  call void @llvm.dbg.value(metadata i32 %x, metadata !16, metadata !DIExpression()), !dbg !18
  call void @llvm.lifetime.start.p0(i64 4, ptr nonnull %y), !dbg !19
  call void @llvm.dbg.declare(metadata ptr %y, metadata !17, metadata !DIExpression()), !dbg !20
  %add = add nsw i32 %x, 1, !dbg !21
  store volatile i32 %add, ptr %y, align 4, !dbg !20, !tbaa !22
  %y.0. = load volatile i32, ptr %y, align 4, !dbg !26, !tbaa !22
  %add1 = add nsw i32 %y.0., 1, !dbg !27
  call void @llvm.lifetime.end.p0(i64 4, ptr nonnull %y), !dbg !28
  ret i32 %add1, !dbg !29
}

; Function Attrs: mustprogress nocallback nofree nosync nounwind readnone speculatable willreturn
declare void @llvm.dbg.declare(metadata, metadata, metadata) #1

; Function Attrs: argmemonly mustprogress nocallback nofree nosync nounwind willreturn
declare void @llvm.lifetime.start.p0(i64 immarg, ptr nocapture) #2

; Function Attrs: argmemonly mustprogress nocallback nofree nosync nounwind willreturn
declare void @llvm.lifetime.end.p0(i64 immarg, ptr nocapture) #2

; bar(x): returns x + 2. Marked noinline via attribute group #3.
; Function Attrs: noinline nounwind uwtable
define dso_local i32 @bar(i32 noundef %x) #3 !dbg !30 {
entry:
  call void @llvm.dbg.value(metadata i32 %x, metadata !32, metadata !DIExpression()), !dbg !33
  %add = add nsw i32 %x, 2, !dbg !34
  ret i32 %add, !dbg !35
}

; matched(x): returns x + 3. Marked noinline via attribute group #3.
; Function Attrs: noinline nounwind uwtable
define dso_local i32 @matched(i32 noundef %x) #3 !dbg !36 {
entry:
  call void @llvm.dbg.value(metadata i32 %x, metadata !38, metadata !DIExpression()), !dbg !39
  %add = add nsw i32 %x, 3, !dbg !40
  ret i32 %add, !dbg !41
}

; main: a 1000-iteration outer loop around a 10000-iteration inner loop. The
; inner body holds the three call sites (matched, foo, bar, on source lines
; 18, 19 and 20 per the attached debug locations), each fed from and stored
; back to the volatile global @x.
; Function Attrs: nounwind uwtable
define dso_local i32 @main() #0 !dbg !42 {
entry:
  call void @llvm.dbg.value(metadata i32 0, metadata !46, metadata !DIExpression()), !dbg !52
  br label %for.cond, !dbg !53

for.cond:                                         ; preds = %for.cond.cleanup3, %entry
  %i.0 = phi i32 [ 0, %entry ], [ %inc8, %for.cond.cleanup3 ], !dbg !52
  call void @llvm.dbg.value(metadata i32 %i.0, metadata !46, metadata !DIExpression()), !dbg !52
  %cmp = icmp ult i32 %i.0, 1000, !dbg !54
  br i1 %cmp, label %for.body, label %for.cond.cleanup, !dbg !56

for.cond.cleanup:                                 ; preds = %for.cond
  ret i32 0, !dbg !58

for.body:                                         ; preds = %for.cond
  call void @llvm.dbg.value(metadata i32 0, metadata !48, metadata !DIExpression()), !dbg !59
  br label %for.cond1, !dbg !60

for.cond1:                                        ; preds = %for.body4, %for.body
  %a.0 = phi i32 [ 0, %for.body ], [ %inc, %for.body4 ], !dbg !59
  call void @llvm.dbg.value(metadata i32 %a.0, metadata !48, metadata !DIExpression()), !dbg !59
  %cmp2 = icmp ult i32 %a.0, 10000, !dbg !61
  br i1 %cmp2, label %for.body4, label %for.cond.cleanup3, !dbg !64

for.cond.cleanup3:                                ; preds = %for.cond1
  %inc8 = add nuw nsw i32 %i.0, 1, !dbg !66
  call void @llvm.dbg.value(metadata i32 %inc8, metadata !46, metadata !DIExpression()), !dbg !52
  br label %for.cond, !dbg !68, !llvm.loop !69

for.body4:                                        ; preds = %for.cond1
  %0 = load volatile i32, ptr @x, align 4, !dbg !73, !tbaa !22
  %call = call i32 @matched(i32 noundef %0), !dbg !75
  store volatile i32 %call, ptr @x, align 4, !dbg !76, !tbaa !22
  %1 = load volatile i32, ptr @x, align 4, !dbg !77, !tbaa !22
  %call5 = call i32 @foo(i32 noundef %1), !dbg !78
  store volatile i32 %call5, ptr @x, align 4, !dbg !79, !tbaa !22
  %2 = load volatile i32, ptr @x, align 4, !dbg !80, !tbaa !22
  %call6 = call i32 @bar(i32 noundef %2), !dbg !81
  store volatile i32 %call6, ptr @x, align 4, !dbg !82, !tbaa !22
  %inc = add nuw nsw i32 %a.0, 1, !dbg !83
  call void @llvm.dbg.value(metadata i32 %inc, metadata !48, metadata !DIExpression()), !dbg !59
  br label %for.cond1, !dbg !85, !llvm.loop !86
}

; Function Attrs: nocallback nofree nosync nounwind readnone speculatable willreturn
declare void @llvm.dbg.value(metadata, metadata, metadata) #4

; Both defining attribute groups (#0 and #3) carry "use-sample-profile"; they
; differ only in that #3 adds noinline.
attributes #0 = { nounwind uwtable "frame-pointer"="none" "min-legal-vector-width"="0" "no-trapping-math"="true" "stack-protector-buffer-size"="8" "target-cpu"="x86-64" "target-features"="+cx8,+fxsr,+mmx,+sse,+sse2,+x87" "tune-cpu"="generic" "use-sample-profile" }
attributes #1 = { mustprogress nocallback nofree nosync nounwind readnone speculatable willreturn }
attributes #2 = { argmemonly mustprogress nocallback nofree nosync nounwind willreturn }
attributes #3 = { noinline nounwind uwtable "frame-pointer"="none" "min-legal-vector-width"="0" "no-trapping-math"="true" "stack-protector-buffer-size"="8" "target-cpu"="x86-64" "target-features"="+cx8,+fxsr,+mmx,+sse,+sse2,+x87" "tune-cpu"="generic" "use-sample-profile" }
attributes #4 = { nocallback nofree nosync nounwind readnone speculatable willreturn }

!llvm.dbg.cu = !{!2}
!llvm.module.flags = !{!7, !8, !9, !10}
!llvm.ident = !{!11}

; Debug info for test.c; the compile unit sets debugInfoForProfiling: true.
!0 = !DIGlobalVariableExpression(var: !1, expr: !DIExpression())
!1 = distinct !DIGlobalVariable(name: "x", scope: !2, file: !3, line: 1, type: !5, isLocal: false, isDefinition: true)
!2 = distinct !DICompileUnit(language: DW_LANG_C99, file: !3, producer: "clang", isOptimized: true, runtimeVersion: 0, emissionKind: FullDebug, globals: !4, splitDebugInlining: false, debugInfoForProfiling: true, nameTableKind: None)
!3 = !DIFile(filename: "test.c", directory: "test")
!4 = !{!0}
!5 = !DIDerivedType(tag: DW_TAG_volatile_type, baseType: !6)
!6 = !DIBasicType(name: "int", size: 32, encoding: DW_ATE_signed)
!7 = !{i32 7, !"Dwarf Version", i32 5}
!8 = !{i32 2, !"Debug Info Version", i32 3}
!9 = !{i32 1, !"wchar_size", i32 4}
!10 = !{i32 7, !"uwtable", i32 2}
!11 = !{!""}
!12 = distinct !DISubprogram(name: "foo", scope: !3, file: !3, line: 2, type: !13, scopeLine: 2, flags: DIFlagPrototyped | DIFlagAllCallsDescribed, spFlags: DISPFlagDefinition | DISPFlagOptimized, unit: !2, retainedNodes: !15)
!13 = !DISubroutineType(types: !14)
!14 = !{!6, !6}
!15 = !{!16, !17}
!16 = !DILocalVariable(name: "x", arg: 1, scope: !12, file: !3, line: 2, type: !6)
!17 = !DILocalVariable(name: "y", scope: !12, file: !3, line: 3, type: !5)
!18 = !DILocation(line: 0, scope: !12)
!19 = !DILocation(line: 3, column: 3, scope: !12)
!20 = !DILocation(line: 3, column: 16, scope: !12)
!21 = !DILocation(line: 3, column: 22, scope: !12)
!22 = !{!23, !23, i64 0}
!23 = !{!"int", !24, i64 0}
!24 = !{!"omnipotent char", !25, i64 0}
!25 = !{!"Simple C/C++ TBAA"}
!26 = !DILocation(line: 4, column: 10, scope: !12)
!27 = !DILocation(line: 4, column: 12, scope: !12)
!28 = !DILocation(line: 5, column: 1, scope: !12)
!29 = !DILocation(line: 4, column: 3, scope: !12)
!30 = distinct !DISubprogram(name: "bar", scope: !3, file: !3, line: 7, type: !13, scopeLine: 7, flags: DIFlagPrototyped | DIFlagAllCallsDescribed, spFlags: DISPFlagDefinition | DISPFlagOptimized, unit: !2, retainedNodes: !31)
!31 = !{!32}
!32 = !DILocalVariable(name: "x", arg: 1, scope: !30, file: !3, line: 7, type: !6)
!33 = !DILocation(line: 0, scope: !30)
!34 = !DILocation(line: 8, column: 12, scope: !30)
!35 = !DILocation(line: 8, column: 3, scope: !30)
!36 = distinct !DISubprogram(name: "matched", scope: !3, file: !3, line: 11, type: !13, scopeLine: 11, flags: DIFlagPrototyped | DIFlagAllCallsDescribed, spFlags: DISPFlagDefinition | DISPFlagOptimized, unit: !2, retainedNodes: !37)
!37 = !{!38}
!38 = !DILocalVariable(name: "x", arg: 1, scope: !36, file: !3, line: 11, type: !6)
!39 = !DILocation(line: 0, scope: !36)
!40 = !DILocation(line: 12, column: 12, scope: !36)
!41 = !DILocation(line: 12, column: 3, scope: !36)
!42 = distinct !DISubprogram(name: "main", scope: !3, file: !3, line: 15, type: !43, scopeLine: 15, flags: DIFlagPrototyped | DIFlagAllCallsDescribed, spFlags: DISPFlagDefinition | DISPFlagOptimized, unit: !2, retainedNodes: !45)
!43 = !DISubroutineType(types: !44)
!44 = !{!6}
!45 = !{!46, !48}
!46 = !DILocalVariable(name: "i", scope: !47, file: !3, line: 16, type: !6)
!47 = distinct !DILexicalBlock(scope: !42, file: !3, line: 16, column: 3)
!48 = !DILocalVariable(name: "a", scope: !49, file: !3, line: 17, type: !6)
!49 = distinct !DILexicalBlock(scope: !50, file: !3, line: 17, column: 5)
!50 = distinct !DILexicalBlock(scope: !51, file: !3, line: 16, column: 34)
!51 = distinct !DILexicalBlock(scope: !47, file: !3, line: 16, column: 3)
!52 = !DILocation(line: 0, scope: !47)
!53 = !DILocation(line: 16, column: 8, scope: !47)
!54 = !DILocation(line: 16, column: 21, scope: !55)
!55 = !DILexicalBlockFile(scope: !51, file: !3, discriminator: 2)
!56 = !DILocation(line: 16, column: 3, scope: !57)
!57 = !DILexicalBlockFile(scope: !47, file: !3, discriminator: 2)
!58 = !DILocation(line: 23, column: 1, scope: !42)
!59 = !DILocation(line: 0, scope: !49)
!60 = !DILocation(line: 17, column: 10, scope: !49)
!61 = !DILocation(line: 17, column: 23, scope: !62)
!62 = !DILexicalBlockFile(scope: !63, file: !3, discriminator: 2)
!63 = distinct !DILexicalBlock(scope: !49, file: !3, line: 17, column: 5)
!64 = !DILocation(line: 17, column: 5, scope: !65)
!65 = !DILexicalBlockFile(scope: !49, file: !3, discriminator: 2)
!66 = !DILocation(line: 16, column: 30, scope: !67)
!67 = !DILexicalBlockFile(scope: !51, file: !3, discriminator: 4)
!68 = !DILocation(line: 16, column: 3, scope: !67)
!69 = distinct !{!69, !70, !71, !72}
!70 = !DILocation(line: 16, column: 3, scope: !47)
!71 = !DILocation(line: 22, column: 3, scope: !47)
!72 = !{!"llvm.loop.mustprogress"}
!73 = !DILocation(line: 18, column: 19, scope: !74)
!74 = distinct !DILexicalBlock(scope: !63, file: !3, line: 17, column: 37)
!75 = !DILocation(line: 18, column: 11, scope: !74)
!76 = !DILocation(line: 18, column: 9, scope: !74)
!77 = !DILocation(line: 19, column: 15, scope: !74)
!78 = !DILocation(line: 19, column: 11, scope: !74)
!79 = !DILocation(line: 19, column: 9, scope: !74)
!80 = !DILocation(line: 20, column: 15, scope: !74)
!81 = !DILocation(line: 20, column: 11, scope: !74)
!82 = !DILocation(line: 20, column: 9, scope: !74)
!83 = !DILocation(line: 17, column: 33, scope: !84)
!84 = !DILexicalBlockFile(scope: !63, file: !3, discriminator: 4)
!85 = !DILocation(line: 17, column: 5, scope: !84)
!86 = distinct !{!86, !87, !88, !72}
!87 = !DILocation(line: 17, column: 5, scope: !49)
!88 = !DILocation(line: 21, column: 5, scope: !49)