| ; REQUIRES: x86_64-linux |
| ; RUN: opt < %s -passes=sample-profile -sample-profile-file=%S/Inputs/pseudo-probe-profile-mismatch.prof -report-profile-staleness -persist-profile-staleness -S 2>%t -o %t.ll |
| ; RUN: FileCheck %s --input-file %t |
| ; RUN: FileCheck %s --input-file %t.ll -check-prefix=CHECK-MD |
| ; RUN: llc < %t.ll -filetype=obj -o %t.obj |
| ; RUN: llvm-objdump --section-headers %t.obj | FileCheck %s --check-prefix=CHECK-OBJ |
| ; RUN: llc < %t.ll -filetype=asm -o - | FileCheck %s --check-prefix=CHECK-ASM |
| |
| ; RUN: opt < %s -passes=sample-profile -sample-profile-file=%S/Inputs/pseudo-probe-profile-mismatch-nested.prof -report-profile-staleness -persist-profile-staleness -S 2>&1 | FileCheck %s --check-prefix=CHECK-NESTED |
| |
| |
| ; CHECK: (1/3) of functions' profile are invalid and (10/50) of samples are discarded due to function hash mismatch. |
| ; CHECK: (2/3) of callsites' profile are invalid and (20/30) of samples are discarded due to callsite location mismatch. |
| |
| ; CHECK-MD: ![[#]] = !{!"NumMismatchedFuncHash", i64 1, !"TotalProfiledFunc", i64 3, !"MismatchedFuncHashSamples", i64 10, !"TotalFuncHashSamples", i64 50, !"NumMismatchedCallsites", i64 2, !"TotalProfiledCallsites", i64 3, !"MismatchedCallsiteSamples", i64 20, !"TotalCallsiteSamples", i64 30} |
| |
| ; CHECK-OBJ: .llvm_stats |
| |
| ; CHECK-ASM: .section .llvm_stats,"",@progbits |
| ; CHECK-ASM: .byte 21 |
| ; CHECK-ASM: .ascii "NumMismatchedFuncHash" |
| ; CHECK-ASM: .byte 4 |
| ; CHECK-ASM: .ascii "MQ==" |
| ; CHECK-ASM: .byte 17 |
| ; CHECK-ASM: .ascii "TotalProfiledFunc" |
| ; CHECK-ASM: .byte 4 |
| ; CHECK-ASM: .ascii "Mw==" |
| ; CHECK-ASM: .byte 25 |
| ; CHECK-ASM: .ascii "MismatchedFuncHashSamples" |
| ; CHECK-ASM: .byte 4 |
| ; CHECK-ASM: .ascii "MTA=" |
| ; CHECK-ASM: .byte 20 |
| ; CHECK-ASM: .ascii "TotalFuncHashSamples" |
| ; CHECK-ASM: .byte 4 |
| ; CHECK-ASM: .ascii "NTA=" |
| ; CHECK-ASM: .byte 22 |
| ; CHECK-ASM: .ascii "NumMismatchedCallsites" |
| ; CHECK-ASM: .byte 4 |
| ; CHECK-ASM: .ascii "Mg==" |
| ; CHECK-ASM: .byte 22 |
| ; CHECK-ASM: .ascii "TotalProfiledCallsites" |
| ; CHECK-ASM: .byte 4 |
| ; CHECK-ASM: .ascii "Mw==" |
| ; CHECK-ASM: .byte 25 |
| ; CHECK-ASM: .ascii "MismatchedCallsiteSamples" |
| ; CHECK-ASM: .byte 4 |
| ; CHECK-ASM: .ascii "MjA=" |
| ; CHECK-ASM: .byte 20 |
| ; CHECK-ASM: .ascii "TotalCallsiteSamples" |
| ; CHECK-ASM: .byte 4 |
| ; CHECK-ASM: .ascii "MzA=" |
| |
| ; CHECK-NESTED: (1/2) of functions' profile are invalid and (211/311) of samples are discarded due to function hash mismatch. |
| |
| |
| ; Module targets x86-64 Linux (ELF), matching the REQUIRES line of this test. |
| target datalayout = "e-m:e-p270:32:32-p271:32:32-p272:64:64-i64:64-f80:128-n8:16:32:64-S128" |
| target triple = "x86_64-unknown-linux-gnu" |
| |
| ; 32-bit global, zero-initialized; main reads and writes it with volatile |
| ; accesses. Its debug info (!0) names it "x" with a volatile int type. |
| @x = dso_local global i32 0, align 4, !dbg !0 |
| |
| ; foo(x): stores x+1 into the stack slot %y with a volatile store, reloads it |
| ; with a volatile load, and returns the reloaded value plus 1. |
| ; Carries a single pseudo probe (id 1) whose first operand equals the GUID in |
| ; foo's !llvm.pseudo_probe_desc entry (!12). |
| ; Function Attrs: nounwind uwtable |
| define dso_local i32 @foo(i32 noundef %x) #0 !dbg !16 { |
| entry: |
| %y = alloca i32, align 4 |
| call void @llvm.dbg.value(metadata i32 %x, metadata !20, metadata !DIExpression()), !dbg !22 |
| call void @llvm.lifetime.start.p0(i64 4, ptr nonnull %y), !dbg !23 |
| call void @llvm.dbg.declare(metadata ptr %y, metadata !21, metadata !DIExpression()), !dbg !24 |
| ; Entry-block probe for foo. |
| call void @llvm.pseudoprobe(i64 6699318081062747564, i64 1, i32 0, i64 -1), !dbg !25 |
| %add = add nsw i32 %x, 1, !dbg !26 |
| ; Volatile store/load pair round-trips the value through %y. |
| store volatile i32 %add, ptr %y, align 4, !dbg !24, !tbaa !27 |
| %y.0. = load volatile i32, ptr %y, align 4, !dbg !31, !tbaa !27 |
| %add1 = add nsw i32 %y.0., 1, !dbg !32 |
| call void @llvm.lifetime.end.p0(i64 4, ptr nonnull %y), !dbg !33 |
| ret i32 %add1, !dbg !34 |
| } |
| |
| ; Intrinsics used by foo: llvm.dbg.declare describes the %y stack slot and the |
| ; lifetime.start/end pair brackets its live range. |
| ; Function Attrs: mustprogress nocallback nofree nosync nounwind readnone speculatable willreturn |
| declare void @llvm.dbg.declare(metadata, metadata, metadata) #1 |
| |
| ; Function Attrs: argmemonly mustprogress nocallback nofree nosync nounwind willreturn |
| declare void @llvm.lifetime.start.p0(i64 immarg, ptr nocapture) #2 |
| |
| ; Function Attrs: argmemonly mustprogress nocallback nofree nosync nounwind willreturn |
| declare void @llvm.lifetime.end.p0(i64 immarg, ptr nocapture) #2 |
| |
| ; bar(x): returns x + 2. Marked noinline through attribute group #3. |
| ; Carries a single pseudo probe (id 1) whose first operand equals the GUID in |
| ; bar's !llvm.pseudo_probe_desc entry (!13). |
| ; Function Attrs: noinline nounwind uwtable |
| define dso_local i32 @bar(i32 noundef %x) #3 !dbg !35 { |
| entry: |
| call void @llvm.dbg.value(metadata i32 %x, metadata !37, metadata !DIExpression()), !dbg !38 |
| call void @llvm.pseudoprobe(i64 -2012135647395072713, i64 1, i32 0, i64 -1), !dbg !39 |
| %add = add nsw i32 %x, 2, !dbg !40 |
| ret i32 %add, !dbg !41 |
| } |
| |
| ; matched(x): returns x + 3. Marked noinline through attribute group #3. |
| ; Carries a single pseudo probe (id 1) whose first operand equals the GUID in |
| ; matched's !llvm.pseudo_probe_desc entry (!14). |
| ; NOTE(review): the name suggests this is the function whose profile still |
| ; matches; that depends on the .prof input, which is not visible here. |
| ; Function Attrs: noinline nounwind uwtable |
| define dso_local i32 @matched(i32 noundef %x) #3 !dbg !42 { |
| entry: |
| call void @llvm.dbg.value(metadata i32 %x, metadata !44, metadata !DIExpression()), !dbg !45 |
| call void @llvm.pseudoprobe(i64 -5844448289301669773, i64 1, i32 0, i64 -1), !dbg !46 |
| %add = add nsw i32 %x, 3, !dbg !47 |
| ret i32 %add, !dbg !48 |
| } |
| |
| ; main(): two nested counted loops. The outer loop runs while %i.0 <u 1000 and |
| ; the inner loop while %a.0 <u 10000. Each inner iteration passes @x through |
| ; matched, foo and bar in that order, using volatile loads and stores of @x. |
| ; Returns 0. |
| ; Block probes 1-11 all use the GUID from main's !llvm.pseudo_probe_desc entry |
| ; (!15). The three calls carry !dbg scopes with non-zero discriminators |
| ; (!89, !93, !97) -- presumably the encoded callsite probes; confirm against |
| ; the pseudo-probe discriminator encoding. |
| ; Function Attrs: nounwind uwtable |
| define dso_local i32 @main() #0 !dbg !49 { |
| entry: |
| call void @llvm.pseudoprobe(i64 -2624081020897602054, i64 1, i32 0, i64 -1), !dbg !59 |
| call void @llvm.dbg.value(metadata i32 0, metadata !53, metadata !DIExpression()), !dbg !60 |
| br label %for.cond, !dbg !61 |
| |
| ; Outer loop header: %i.0 is the outer induction variable. |
| for.cond: ; preds = %for.cond.cleanup3, %entry |
| %i.0 = phi i32 [ 0, %entry ], [ %inc8, %for.cond.cleanup3 ], !dbg !60 |
| call void @llvm.dbg.value(metadata i32 %i.0, metadata !53, metadata !DIExpression()), !dbg !60 |
| call void @llvm.pseudoprobe(i64 -2624081020897602054, i64 2, i32 0, i64 -1), !dbg !62 |
| %cmp = icmp ult i32 %i.0, 1000, !dbg !64 |
| br i1 %cmp, label %for.body, label %for.cond.cleanup, !dbg !65 |
| |
| ; Outer loop exit: function returns 0. |
| for.cond.cleanup: ; preds = %for.cond |
| call void @llvm.pseudoprobe(i64 -2624081020897602054, i64 3, i32 0, i64 -1), !dbg !67 |
| call void @llvm.pseudoprobe(i64 -2624081020897602054, i64 11, i32 0, i64 -1), !dbg !68 |
| ret i32 0, !dbg !68 |
| |
| ; Outer loop body: enters the inner loop with its counter starting at 0. |
| for.body: ; preds = %for.cond |
| call void @llvm.pseudoprobe(i64 -2624081020897602054, i64 4, i32 0, i64 -1), !dbg !69 |
| call void @llvm.dbg.value(metadata i32 0, metadata !55, metadata !DIExpression()), !dbg !70 |
| br label %for.cond1, !dbg !71 |
| |
| ; Inner loop header: %a.0 is the inner induction variable. |
| for.cond1: ; preds = %for.body4, %for.body |
| %a.0 = phi i32 [ 0, %for.body ], [ %inc, %for.body4 ], !dbg !70 |
| call void @llvm.dbg.value(metadata i32 %a.0, metadata !55, metadata !DIExpression()), !dbg !70 |
| call void @llvm.pseudoprobe(i64 -2624081020897602054, i64 5, i32 0, i64 -1), !dbg !72 |
| %cmp2 = icmp ult i32 %a.0, 10000, !dbg !75 |
| br i1 %cmp2, label %for.body4, label %for.cond.cleanup3, !dbg !76 |
| |
| ; Inner loop exit / outer loop latch: increments %i.0 and branches back. |
| for.cond.cleanup3: ; preds = %for.cond1 |
| call void @llvm.pseudoprobe(i64 -2624081020897602054, i64 6, i32 0, i64 -1), !dbg !67 |
| call void @llvm.pseudoprobe(i64 -2624081020897602054, i64 9, i32 0, i64 -1), !dbg !78 |
| call void @llvm.pseudoprobe(i64 -2624081020897602054, i64 10, i32 0, i64 -1), !dbg !79 |
| %inc8 = add nuw nsw i32 %i.0, 1, !dbg !79 |
| call void @llvm.dbg.value(metadata i32 %inc8, metadata !53, metadata !DIExpression()), !dbg !60 |
| br label %for.cond, !dbg !81, !llvm.loop !82 |
| |
| ; Inner loop body and latch: x = matched(x); x = foo(x); x = bar(x), each step |
| ; going through a volatile load and a volatile store of @x. |
| for.body4: ; preds = %for.cond1 |
| call void @llvm.pseudoprobe(i64 -2624081020897602054, i64 7, i32 0, i64 -1), !dbg !86 |
| %0 = load volatile i32, ptr @x, align 4, !dbg !86, !tbaa !27 |
| %call = call i32 @matched(i32 noundef %0), !dbg !88 |
| store volatile i32 %call, ptr @x, align 4, !dbg !90, !tbaa !27 |
| %1 = load volatile i32, ptr @x, align 4, !dbg !91, !tbaa !27 |
| %call5 = call i32 @foo(i32 noundef %1), !dbg !92 |
| store volatile i32 %call5, ptr @x, align 4, !dbg !94, !tbaa !27 |
| %2 = load volatile i32, ptr @x, align 4, !dbg !95, !tbaa !27 |
| %call6 = call i32 @bar(i32 noundef %2), !dbg !96 |
| store volatile i32 %call6, ptr @x, align 4, !dbg !98, !tbaa !27 |
| call void @llvm.pseudoprobe(i64 -2624081020897602054, i64 8, i32 0, i64 -1), !dbg !99 |
| %inc = add nuw nsw i32 %a.0, 1, !dbg !99 |
| call void @llvm.dbg.value(metadata i32 %inc, metadata !55, metadata !DIExpression()), !dbg !70 |
| br label %for.cond1, !dbg !101, !llvm.loop !102 |
| } |
| |
| ; llvm.pseudoprobe is called in every basic block of the functions above. In |
| ; each call the first operand equals the enclosing function's GUID from |
| ; !llvm.pseudo_probe_desc and the second is the probe id within that function. |
| ; Function Attrs: inaccessiblememonly mustprogress nocallback nofree nosync nounwind willreturn |
| declare void @llvm.pseudoprobe(i64, i64, i32, i64) #4 |
| |
| ; llvm.dbg.value binds SSA values to the source variables described by the |
| ; DILocalVariable nodes. |
| ; Function Attrs: nocallback nofree nosync nounwind readnone speculatable willreturn |
| declare void @llvm.dbg.value(metadata, metadata, metadata) #5 |
| |
| ; Attribute groups. |
| ; #0: foo and main. #3: bar and matched; identical to #0 plus noinline. |
| ; Both carry "use-sample-profile". |
| ; #1: llvm.dbg.declare. #2: llvm.lifetime.start/end. #4: llvm.pseudoprobe. |
| ; #5: llvm.dbg.value. |
| attributes #0 = { nounwind uwtable "frame-pointer"="none" "min-legal-vector-width"="0" "no-trapping-math"="true" "stack-protector-buffer-size"="8" "target-cpu"="x86-64" "target-features"="+cx8,+fxsr,+mmx,+sse,+sse2,+x87" "tune-cpu"="generic" "use-sample-profile" } |
| attributes #1 = { mustprogress nocallback nofree nosync nounwind readnone speculatable willreturn } |
| attributes #2 = { argmemonly mustprogress nocallback nofree nosync nounwind willreturn } |
| attributes #3 = { noinline nounwind uwtable "frame-pointer"="none" "min-legal-vector-width"="0" "no-trapping-math"="true" "stack-protector-buffer-size"="8" "target-cpu"="x86-64" "target-features"="+cx8,+fxsr,+mmx,+sse,+sse2,+x87" "tune-cpu"="generic" "use-sample-profile" } |
| attributes #4 = { inaccessiblememonly mustprogress nocallback nofree nosync nounwind willreturn } |
| attributes #5 = { nocallback nofree nosync nounwind readnone speculatable willreturn } |
| |
| ; Named metadata: the single compile unit, the module flags, the producer |
| ; ident, and one pseudo-probe descriptor per defined function (foo, bar, |
| ; matched, main). |
| !llvm.dbg.cu = !{!2} |
| !llvm.module.flags = !{!7, !8, !9, !10} |
| !llvm.ident = !{!11} |
| !llvm.pseudo_probe_desc = !{!12, !13, !14, !15} |
| |
| ; Debug info for the global @x and the compile unit for test.c. |
| !0 = !DIGlobalVariableExpression(var: !1, expr: !DIExpression()) |
| !1 = distinct !DIGlobalVariable(name: "x", scope: !2, file: !3, line: 1, type: !5, isLocal: false, isDefinition: true) |
| !2 = distinct !DICompileUnit(language: DW_LANG_C99, file: !3, producer: "", isOptimized: true, runtimeVersion: 0, emissionKind: FullDebug, globals: !4, splitDebugInlining: false, debugInfoForProfiling: true, nameTableKind: None) |
| !3 = !DIFile(filename: "test.c", directory: "") |
| !4 = !{!0} |
| !5 = !DIDerivedType(tag: DW_TAG_volatile_type, baseType: !6) |
| !6 = !DIBasicType(name: "int", size: 32, encoding: DW_ATE_signed) |
| ; Module flags (!7-!10) and the empty producer ident string (!11). |
| !7 = !{i32 7, !"Dwarf Version", i32 5} |
| !8 = !{i32 2, !"Debug Info Version", i32 3} |
| !9 = !{i32 1, !"wchar_size", i32 4} |
| !10 = !{i32 7, !"uwtable", i32 2} |
| !11 = !{!""} |
| ; Pseudo-probe descriptors: {GUID, second i64, function name}. The GUID is the |
| ; first operand of every llvm.pseudoprobe call in that function. |
| ; NOTE(review): the second field is presumably the function hash compared |
| ; against the profile for the "function hash mismatch" statistic -- confirm. |
| ; foo, bar and matched share 4294967295; main uses a different value. |
| !12 = !{i64 6699318081062747564, i64 4294967295, !"foo"} |
| !13 = !{i64 -2012135647395072713, i64 4294967295, !"bar"} |
| !14 = !{i64 -5844448289301669773, i64 4294967295, !"matched"} |
| !15 = !{i64 -2624081020897602054, i64 844635331715433, !"main"} |
| ; Debug info for foo: subprogram, subroutine type, locals x and y, and the |
| ; source locations used inside the function. |
| !16 = distinct !DISubprogram(name: "foo", scope: !3, file: !3, line: 2, type: !17, scopeLine: 2, flags: DIFlagPrototyped | DIFlagAllCallsDescribed, spFlags: DISPFlagDefinition | DISPFlagOptimized, unit: !2, retainedNodes: !19) |
| !17 = !DISubroutineType(types: !18) |
| !18 = !{!6, !6} |
| !19 = !{!20, !21} |
| !20 = !DILocalVariable(name: "x", arg: 1, scope: !16, file: !3, line: 2, type: !6) |
| !21 = !DILocalVariable(name: "y", scope: !16, file: !3, line: 3, type: !5) |
| !22 = !DILocation(line: 0, scope: !16) |
| !23 = !DILocation(line: 3, column: 3, scope: !16) |
| !24 = !DILocation(line: 3, column: 16, scope: !16) |
| !25 = !DILocation(line: 3, column: 20, scope: !16) |
| !26 = !DILocation(line: 3, column: 22, scope: !16) |
| ; TBAA descriptors for "int"; !27 is the !tbaa tag on every volatile load and |
| ; store in this file. |
| !27 = !{!28, !28, i64 0} |
| !28 = !{!"int", !29, i64 0} |
| !29 = !{!"omnipotent char", !30, i64 0} |
| !30 = !{!"Simple C/C++ TBAA"} |
| !31 = !DILocation(line: 4, column: 10, scope: !16) |
| !32 = !DILocation(line: 4, column: 12, scope: !16) |
| !33 = !DILocation(line: 5, column: 1, scope: !16) |
| !34 = !DILocation(line: 4, column: 3, scope: !16) |
| ; Debug info for bar. |
| !35 = distinct !DISubprogram(name: "bar", scope: !3, file: !3, line: 7, type: !17, scopeLine: 7, flags: DIFlagPrototyped | DIFlagAllCallsDescribed, spFlags: DISPFlagDefinition | DISPFlagOptimized, unit: !2, retainedNodes: !36) |
| !36 = !{!37} |
| !37 = !DILocalVariable(name: "x", arg: 1, scope: !35, file: !3, line: 7, type: !6) |
| !38 = !DILocation(line: 0, scope: !35) |
| !39 = !DILocation(line: 8, column: 10, scope: !35) |
| !40 = !DILocation(line: 8, column: 12, scope: !35) |
| !41 = !DILocation(line: 8, column: 3, scope: !35) |
| ; Debug info for matched. |
| !42 = distinct !DISubprogram(name: "matched", scope: !3, file: !3, line: 11, type: !17, scopeLine: 11, flags: DIFlagPrototyped | DIFlagAllCallsDescribed, spFlags: DISPFlagDefinition | DISPFlagOptimized, unit: !2, retainedNodes: !43) |
| !43 = !{!44} |
| !44 = !DILocalVariable(name: "x", arg: 1, scope: !42, file: !3, line: 11, type: !6) |
| !45 = !DILocation(line: 0, scope: !42) |
| !46 = !DILocation(line: 12, column: 10, scope: !42) |
| !47 = !DILocation(line: 12, column: 12, scope: !42) |
| !48 = !DILocation(line: 12, column: 3, scope: !42) |
| ; Debug info for main: subprogram, loop variables i and a, the lexical blocks |
| ; of the two nested loops, and the source locations used inside the function. |
| !49 = distinct !DISubprogram(name: "main", scope: !3, file: !3, line: 15, type: !50, scopeLine: 15, flags: DIFlagPrototyped | DIFlagAllCallsDescribed, spFlags: DISPFlagDefinition | DISPFlagOptimized, unit: !2, retainedNodes: !52) |
| !50 = !DISubroutineType(types: !51) |
| !51 = !{!6} |
| !52 = !{!53, !55} |
| !53 = !DILocalVariable(name: "i", scope: !54, file: !3, line: 16, type: !6) |
| !54 = distinct !DILexicalBlock(scope: !49, file: !3, line: 16, column: 3) |
| !55 = !DILocalVariable(name: "a", scope: !56, file: !3, line: 17, type: !6) |
| !56 = distinct !DILexicalBlock(scope: !57, file: !3, line: 17, column: 5) |
| !57 = distinct !DILexicalBlock(scope: !58, file: !3, line: 16, column: 34) |
| !58 = distinct !DILexicalBlock(scope: !54, file: !3, line: 16, column: 3) |
| !59 = !DILocation(line: 16, column: 12, scope: !54) |
| !60 = !DILocation(line: 0, scope: !54) |
| !61 = !DILocation(line: 16, column: 8, scope: !54) |
| !62 = !DILocation(line: 16, column: 19, scope: !63) |
| !63 = !DILexicalBlockFile(scope: !58, file: !3, discriminator: 0) |
| !64 = !DILocation(line: 16, column: 21, scope: !63) |
| !65 = !DILocation(line: 16, column: 3, scope: !66) |
| !66 = !DILexicalBlockFile(scope: !54, file: !3, discriminator: 0) |
| !67 = !DILocation(line: 0, scope: !49) |
| !68 = !DILocation(line: 23, column: 1, scope: !49) |
| !69 = !DILocation(line: 17, column: 14, scope: !56) |
| !70 = !DILocation(line: 0, scope: !56) |
| !71 = !DILocation(line: 17, column: 10, scope: !56) |
| !72 = !DILocation(line: 17, column: 21, scope: !73) |
| !73 = !DILexicalBlockFile(scope: !74, file: !3, discriminator: 0) |
| !74 = distinct !DILexicalBlock(scope: !56, file: !3, line: 17, column: 5) |
| !75 = !DILocation(line: 17, column: 23, scope: !73) |
| !76 = !DILocation(line: 17, column: 5, scope: !77) |
| !77 = !DILexicalBlockFile(scope: !56, file: !3, discriminator: 0) |
| !78 = !DILocation(line: 22, column: 3, scope: !57) |
| !79 = !DILocation(line: 16, column: 30, scope: !80) |
| !80 = !DILexicalBlockFile(scope: !58, file: !3, discriminator: 0) |
| !81 = !DILocation(line: 16, column: 3, scope: !80) |
| ; Loop metadata attached to the outer loop's back-edge branch. |
| !82 = distinct !{!82, !83, !84, !85} |
| !83 = !DILocation(line: 16, column: 3, scope: !54) |
| !84 = !DILocation(line: 22, column: 3, scope: !54) |
| !85 = !{!"llvm.loop.mustprogress"} |
| !86 = !DILocation(line: 18, column: 19, scope: !87) |
| !87 = distinct !DILexicalBlock(scope: !74, file: !3, line: 17, column: 37) |
| ; Call-site locations. !88, !92 and !96 are the !dbg of the calls to matched, |
| ; foo and bar; their scopes !89, !93 and !97 carry distinct non-zero |
| ; discriminators. |
| !88 = !DILocation(line: 18, column: 11, scope: !89) |
| !89 = !DILexicalBlockFile(scope: !87, file: !3, discriminator: 186646631) |
| !90 = !DILocation(line: 18, column: 9, scope: !87) |
| !91 = !DILocation(line: 19, column: 15, scope: !87) |
| !92 = !DILocation(line: 19, column: 11, scope: !93) |
| !93 = !DILexicalBlockFile(scope: !87, file: !3, discriminator: 186646639) |
| !94 = !DILocation(line: 19, column: 9, scope: !87) |
| !95 = !DILocation(line: 20, column: 15, scope: !87) |
| !96 = !DILocation(line: 20, column: 11, scope: !97) |
| !97 = !DILexicalBlockFile(scope: !87, file: !3, discriminator: 186646647) |
| !98 = !DILocation(line: 20, column: 9, scope: !87) |
| !99 = !DILocation(line: 17, column: 33, scope: !100) |
| !100 = !DILexicalBlockFile(scope: !74, file: !3, discriminator: 0) |
| !101 = !DILocation(line: 17, column: 5, scope: !100) |
| ; Loop metadata attached to the inner loop's back-edge branch. |
| !102 = distinct !{!102, !103, !104, !85} |
| !103 = !DILocation(line: 17, column: 5, scope: !56) |
| !104 = !DILocation(line: 21, column: 5, scope: !56) |