| ; Test for CSSPGO's sample loader inlining to make sure it can use llvm-profgen preinliner's decision |
| |
| ; RUN: opt < %s -passes=sample-profile -sample-profile-file=%S/Inputs/csspgo-use-preinliner.prof -pass-remarks=inline -sample-profile-prioritized-inline -profile-sample-accurate -sample-profile-use-preinliner=0 -S 2>&1 | FileCheck %s --check-prefix=DEFAULT |
| ; RUN: opt < %s -passes=sample-profile -sample-profile-file=%S/Inputs/csspgo-use-preinliner.prof -pass-remarks=inline -sample-profile-prioritized-inline -profile-sample-accurate -sample-profile-use-preinliner=1 -S 2>&1 | FileCheck %s --check-prefix=PREINLINE |
| |
| ; RUN: llvm-profdata merge --sample --text --convert-sample-profile-layout=nest -generate-merged-base-profiles=0 %S/Inputs/csspgo-use-preinliner.prof -o %t.prof |
| ; RUN: opt < %s -passes=sample-profile -sample-profile-file=%t.prof -pass-remarks=inline -sample-profile-prioritized-inline -profile-sample-accurate -sample-profile-use-preinliner=0 -S 2>&1 | FileCheck %s --check-prefix=DEFAULT |
| ; RUN: opt < %s -passes=sample-profile -sample-profile-file=%t.prof -pass-remarks=inline -sample-profile-prioritized-inline -profile-sample-accurate -sample-profile-use-preinliner=1 -S 2>&1 | FileCheck %s --check-prefix=PREINLINE |
| |
| ; DEFAULT: '_Z5funcAi' inlined into 'main' |
| ; DEFAULT-NOT: inlined into |
| |
| ; PREINLINE-NOT: inlined into |
| ; `[main:3 @ _Z5funcAi]` does not have preinline decision, so it's up for loader inliner to decided. |
| ; PREINLINE: '_Z5funcAi' inlined into 'main' |
| ; `[main:3 @ _Z5funcAi:1 @ _Z8funcLeafi]` is inlined according to preinline decision. |
| ; PREINLINE: '_Z8funcLeafi' inlined into 'main' |
| ; Even though `[main:3.1 @ _Z5funcBi]` context is marked should inline, `_Z5funcBi` is a noinline function, so we honor that and don't inline. |
| ; When _Z5funcBi is promoted to be top level context-less profile, `[_Z5funcBi:1 @ _Z8funcLeafi]` becomes synthetic context, so preinline decision is ignored and we don't inline `_Z8funcLeafi`. |
| ; PREINLINE-NOT: inlined into |
| |
| @factor = dso_local global i32 3, align 4, !dbg !0 |
| |
| define dso_local i32 @main() local_unnamed_addr #0 !dbg !18 { |
| entry: |
| br label %for.body, !dbg !25 |
| |
| for.cond.cleanup: ; preds = %for.body |
| ret i32 %add3, !dbg !27 |
| |
| for.body: ; preds = %for.body, %entry |
| %x.011 = phi i32 [ 300000, %entry ], [ %dec, %for.body ] |
| %r.010 = phi i32 [ 0, %entry ], [ %add3, %for.body ] |
| %call = tail call i32 @_Z5funcBi(i32 %x.011), !dbg !32 |
| %add = add nuw nsw i32 %x.011, 1, !dbg !31 |
| %call1 = tail call i32 @_Z5funcAi(i32 %add), !dbg !28 |
| %add2 = add i32 %call, %r.010, !dbg !34 |
| %add3 = add i32 %add2, %call1, !dbg !35 |
| %dec = add nsw i32 %x.011, -1, !dbg !36 |
| %cmp = icmp eq i32 %x.011, 0, !dbg !38 |
| br i1 %cmp, label %for.cond.cleanup, label %for.body, !dbg !25 |
| } |
| |
| define dso_local i32 @_Z5funcAi(i32 %x) local_unnamed_addr #1 !dbg !40 { |
| entry: |
| %add = add nsw i32 %x, 100000, !dbg !44 |
| %call = tail call i32 @_Z8funcLeafi(i32 %add), !dbg !45 |
| ret i32 %call, !dbg !46 |
| } |
| |
| define dso_local i32 @_Z8funcLeafi(i32 %x) local_unnamed_addr #1 !dbg !54 { |
| entry: |
| %cmp = icmp sgt i32 %x, 0, !dbg !57 |
| br i1 %cmp, label %while.body, label %while.cond2.preheader, !dbg !59 |
| |
| while.cond2.preheader: ; preds = %entry |
| %cmp313 = icmp slt i32 %x, 0, !dbg !60 |
| br i1 %cmp313, label %while.body4, label %if.end, !dbg !63 |
| |
| while.body: ; preds = %while.body, %entry |
| %x.addr.016 = phi i32 [ %sub, %while.body ], [ %x, %entry ] |
| %tmp = load volatile i32, ptr @factor, align 4, !dbg !64 |
| %call = tail call i32 @_Z3fibi(i32 %tmp), !dbg !67 |
| %sub = sub nsw i32 %x.addr.016, %call, !dbg !68 |
| %cmp1 = icmp sgt i32 %sub, 0, !dbg !69 |
| br i1 %cmp1, label %while.body, label %if.end, !dbg !71 |
| |
| while.body4: ; preds = %while.body4, %while.cond2.preheader |
| %x.addr.114 = phi i32 [ %add, %while.body4 ], [ %x, %while.cond2.preheader ] |
| %tmp1 = load volatile i32, ptr @factor, align 4, !dbg !72 |
| %call5 = tail call i32 @_Z3fibi(i32 %tmp1), !dbg !74 |
| %add = add nsw i32 %call5, %x.addr.114, !dbg !75 |
| %cmp3 = icmp slt i32 %add, 0, !dbg !60 |
| br i1 %cmp3, label %while.body4, label %if.end, !dbg !63 |
| |
| if.end: ; preds = %while.body4, %while.body, %while.cond2.preheader |
| %x.addr.2 = phi i32 [ 0, %while.cond2.preheader ], [ %sub, %while.body ], [ %add, %while.body4 ] |
| ret i32 %x.addr.2, !dbg !76 |
| } |
| |
| define dso_local i32 @_Z5funcBi(i32 %x) local_unnamed_addr #0 !dbg !47 { |
| entry: |
| %sub = add nsw i32 %x, -100000, !dbg !51 |
| %call = tail call i32 @_Z8funcLeafi(i32 %sub), !dbg !52 |
| ret i32 %call, !dbg !53 |
| } |
| |
| declare i32 @_Z3fibi(i32) |
| |
| attributes #0 = { nofree noinline norecurse nounwind uwtable "correctly-rounded-divide-sqrt-fp-math"="false" "disable-tail-calls"="false" "frame-pointer"="none" "less-precise-fpmad"="false" "min-legal-vector-width"="0" "no-infs-fp-math"="false" "no-jump-tables"="false" "no-nans-fp-math"="false" "no-signed-zeros-fp-math"="false" "no-trapping-math"="false" "stack-protector-buffer-size"="8" "target-cpu"="x86-64" "target-features"="+cx8,+fxsr,+mmx,+sse,+sse2,+x87" "unsafe-fp-math"="false" "use-soft-float"="false" "use-sample-profile" } |
| attributes #1 = { nofree norecurse nounwind uwtable "correctly-rounded-divide-sqrt-fp-math"="false" "disable-tail-calls"="false" "frame-pointer"="none" "less-precise-fpmad"="false" "min-legal-vector-width"="0" "no-infs-fp-math"="false" "no-jump-tables"="false" "no-nans-fp-math"="false" "no-signed-zeros-fp-math"="false" "no-trapping-math"="false" "stack-protector-buffer-size"="8" "target-cpu"="x86-64" "target-features"="+cx8,+fxsr,+mmx,+sse,+sse2,+x87" "unsafe-fp-math"="false" "use-soft-float"="false" "use-sample-profile" } |
| |
| !llvm.dbg.cu = !{!2} |
| !llvm.module.flags = !{!14, !15, !16} |
| !llvm.ident = !{!17} |
| |
| !0 = !DIGlobalVariableExpression(var: !1, expr: !DIExpression()) |
| !1 = distinct !DIGlobalVariable(name: "factor", scope: !2, file: !3, line: 21, type: !13, isLocal: false, isDefinition: true) |
| !2 = distinct !DICompileUnit(language: DW_LANG_C_plus_plus_14, file: !3, producer: "clang version 11.0.0", isOptimized: true, runtimeVersion: 0, emissionKind: FullDebug, enums: !4, retainedTypes: !5, globals: !12, splitDebugInlining: false, debugInfoForProfiling: true, nameTableKind: None) |
| !3 = !DIFile(filename: "merged.cpp", directory: "/local/autofdo") |
| !4 = !{} |
| !5 = !{!6, !10, !11} |
| !6 = !DISubprogram(name: "funcA", linkageName: "_Z5funcAi", scope: !3, file: !3, line: 6, type: !7, flags: DIFlagPrototyped, spFlags: DISPFlagOptimized, retainedNodes: !4) |
| !7 = !DISubroutineType(types: !8) |
| !8 = !{!9, !9} |
| !9 = !DIBasicType(name: "int", size: 32, encoding: DW_ATE_signed) |
| !10 = !DISubprogram(name: "funcB", linkageName: "_Z5funcBi", scope: !3, file: !3, line: 7, type: !7, flags: DIFlagPrototyped, spFlags: DISPFlagOptimized, retainedNodes: !4) |
| !11 = !DISubprogram(name: "funcLeaf", linkageName: "_Z8funcLeafi", scope: !3, file: !3, line: 22, type: !7, flags: DIFlagPrototyped, spFlags: DISPFlagOptimized, retainedNodes: !4) |
| !12 = !{!0} |
| !13 = !DIDerivedType(tag: DW_TAG_volatile_type, baseType: !9) |
| !14 = !{i32 7, !"Dwarf Version", i32 4} |
| !15 = !{i32 2, !"Debug Info Version", i32 3} |
| !16 = !{i32 1, !"wchar_size", i32 4} |
| !17 = !{!"clang version 11.0.0"} |
| !18 = distinct !DISubprogram(name: "main", scope: !3, file: !3, line: 11, type: !19, scopeLine: 11, flags: DIFlagPrototyped | DIFlagAllCallsDescribed, spFlags: DISPFlagDefinition | DISPFlagOptimized, unit: !2, retainedNodes: !21) |
| !19 = !DISubroutineType(types: !20) |
| !20 = !{!9} |
| !21 = !{!22, !23} |
| !22 = !DILocalVariable(name: "r", scope: !18, file: !3, line: 12, type: !9) |
| !23 = !DILocalVariable(name: "x", scope: !24, file: !3, line: 13, type: !9) |
| !24 = distinct !DILexicalBlock(scope: !18, file: !3, line: 13, column: 3) |
| !25 = !DILocation(line: 13, column: 3, scope: !26) |
| !26 = !DILexicalBlockFile(scope: !24, file: !3, discriminator: 2) |
| !27 = !DILocation(line: 17, column: 3, scope: !18) |
| !28 = !DILocation(line: 14, column: 10, scope: !29) |
| !29 = distinct !DILexicalBlock(scope: !30, file: !3, line: 13, column: 37) |
| !30 = distinct !DILexicalBlock(scope: !24, file: !3, line: 13, column: 3) |
| !31 = !DILocation(line: 14, column: 29, scope: !29) |
| !32 = !DILocation(line: 14, column: 21, scope: !33) |
| !33 = !DILexicalBlockFile(scope: !29, file: !3, discriminator: 2) |
| !34 = !DILocation(line: 14, column: 19, scope: !29) |
| !35 = !DILocation(line: 14, column: 7, scope: !29) |
| !36 = !DILocation(line: 13, column: 33, scope: !37) |
| !37 = !DILexicalBlockFile(scope: !30, file: !3, discriminator: 6) |
| !38 = !DILocation(line: 13, column: 26, scope: !39) |
| !39 = !DILexicalBlockFile(scope: !30, file: !3, discriminator: 2) |
| !40 = distinct !DISubprogram(name: "funcA", linkageName: "_Z5funcAi", scope: !3, file: !3, line: 26, type: !7, scopeLine: 26, flags: DIFlagPrototyped | DIFlagAllCallsDescribed, spFlags: DISPFlagDefinition | DISPFlagOptimized, unit: !2) |
| !44 = !DILocation(line: 27, column: 22, scope: !40) |
| !45 = !DILocation(line: 27, column: 11, scope: !40) |
| !46 = !DILocation(line: 29, column: 3, scope: !40) |
| !47 = distinct !DISubprogram(name: "funcB", linkageName: "_Z5funcBi", scope: !3, file: !3, line: 32, type: !7, scopeLine: 32, flags: DIFlagPrototyped | DIFlagAllCallsDescribed, spFlags: DISPFlagDefinition | DISPFlagOptimized, unit: !2) |
| !51 = !DILocation(line: 33, column: 22, scope: !47) |
| !52 = !DILocation(line: 33, column: 11, scope: !47) |
| !53 = !DILocation(line: 35, column: 3, scope: !47) |
| !54 = distinct !DISubprogram(name: "funcLeaf", linkageName: "_Z8funcLeafi", scope: !3, file: !3, line: 48, type: !7, scopeLine: 48, flags: DIFlagPrototyped | DIFlagAllCallsDescribed, spFlags: DISPFlagDefinition | DISPFlagOptimized, unit: !2) |
| !57 = !DILocation(line: 49, column: 9, scope: !58) |
| !58 = distinct !DILexicalBlock(scope: !54, file: !3, line: 49, column: 7) |
| !59 = !DILocation(line: 49, column: 7, scope: !54) |
| !60 = !DILocation(line: 58, column: 14, scope: !61) |
| !61 = !DILexicalBlockFile(scope: !62, file: !3, discriminator: 2) |
| !62 = distinct !DILexicalBlock(scope: !58, file: !3, line: 56, column: 8) |
| !63 = !DILocation(line: 58, column: 5, scope: !61) |
| !64 = !DILocation(line: 52, column: 16, scope: !65) |
| !65 = distinct !DILexicalBlock(scope: !66, file: !3, line: 51, column: 19) |
| !66 = distinct !DILexicalBlock(scope: !58, file: !3, line: 49, column: 14) |
| !67 = !DILocation(line: 52, column: 12, scope: !65) |
| !68 = !DILocation(line: 52, column: 9, scope: !65) |
| !69 = !DILocation(line: 51, column: 14, scope: !70) |
| !70 = !DILexicalBlockFile(scope: !66, file: !3, discriminator: 2) |
| !71 = !DILocation(line: 51, column: 5, scope: !70) |
| !72 = !DILocation(line: 59, column: 16, scope: !73) |
| !73 = distinct !DILexicalBlock(scope: !62, file: !3, line: 58, column: 19) |
| !74 = !DILocation(line: 59, column: 12, scope: !73) |
| !75 = !DILocation(line: 59, column: 9, scope: !73) |
| !76 = !DILocation(line: 63, column: 3, scope: !54) |