blob: 6daf4f502004374d532794e6ea158eecb4c5889e [file] [log] [blame]
; REQUIRES: x86_64-linux
;
; RUN: rm -rf %t
; RUN: split-file %s %t
; RUN: llvm-ctxprof-util fromYAML --input=%t/profile.yaml --output=%t/profile.ctxprofdata
; RUN: opt -module-summary -passes='thinlto-pre-link<O2>' -use-ctx-profile=%t/profile.ctxprofdata \
; RUN: %t/example.ll -S -o %t/4909520559318251808.ll
; RUN: FileCheck --input-file %t/4909520559318251808.ll %s --check-prefix=PRELINK
; RUN: opt -passes='ctx-prof-flatten' -use-ctx-profile=%t/profile.ctxprofdata %t/4909520559318251808.ll -S | FileCheck %s --check-prefix=POSTLINK
;
;
; Check that instrumentation occurs where expected: the "no" block for both foo and
; @an_entrypoint - which explains the subsequent branch weights
;
; PRELINK-LABEL: @foo
; PRELINK-LABEL: yes:
; PRELINK-LABEL: no:
; PRELINK-NEXT: call void @llvm.instrprof.increment(ptr @foo, i64 [[#]], i32 2, i32 1)
; PRELINK-LABEL: @an_entrypoint
; PRELINK: br i1 %t, label %yes, label %common.ret, !prof ![[PREPROF:[0-9]+]]
; PRELINK-LABEL: yes:
; PRELINK-NEXT: call void @llvm.instrprof.increment(ptr @an_entrypoint, i64 [[#]], i32 2, i32 1)
; PRELINK: ![[#]] = !{i32 1, !"ProfileSummary", !1}
; PRELINK: ![[#]] = !{!"TotalCount", i64 3595}
; PRELINK: ![[#]] = !{!"MaxCount", i64 3000}
; PRELINK: ![[#]] = !{!"MaxInternalCount", i64 3000}
; PRELINK: ![[#]] = !{!"MaxFunctionCount", i64 300}
; PRELINK: ![[#]] = !{!"NumCounts", i64 6}
; PRELINK: ![[#]] = !{!"NumFunctions", i64 3}
; PRELINK: ![[PREPROF]] = !{!"branch_weights", i32 40, i32 60}
; Check that the output has:
; - no instrumentation
; - the 2 functions have an entry count
; - each conditional branch has profile annotation
;
; POSTLINK-NOT: call void @llvm.instrprof
;
; make sure we have function entry counts, branch weights, and a profile summary.
; POSTLINK-LABEL: @foo
; POSTLINK-SAME: !prof ![[FOO_EP:[0-9]+]]
; POSTLINK: br i1 %t, label %yes, label %no, !prof ![[FOO_BW:[0-9]+]]
; POSTLINK-LABEL: @an_entrypoint
; POSTLINK-SAME: !prof ![[AN_ENTRYPOINT_EP:[0-9]+]]
; POSTLINK: br i1 %t, label %yes, label %common.ret, !prof ![[AN_ENTRYPOINT_BW:[0-9]+]]
; The postlink summary is restricted to the stuff under the root - including the
; "unhandled" data.
; POSTLINK: ![[#]] = !{i32 1, !"ProfileSummary", !1}
; POSTLINK: ![[#]] = !{!"TotalCount", i64 1495}
; POSTLINK: ![[#]] = !{!"MaxCount", i64 1000}
; POSTLINK: ![[#]] = !{!"MaxInternalCount", i64 1000}
; POSTLINK: ![[#]] = !{!"MaxFunctionCount", i64 200}
; POSTLINK: ![[#]] = !{!"NumCounts", i64 6}
; POSTLINK: ![[#]] = !{!"NumFunctions", i64 3}
;
; @foo will be called both unconditionally and conditionally, on the "yes" branch
; which has a count of 40. So 140 times.
; POSTLINK: ![[FOO_EP]] = !{!"function_entry_count", i64 140}
; foo's "no" branch is taken 10+5 times (from the 2 contexts belonging to foo).
; Which means its "yes" branch is taken 140 - 15 times.
; POSTLINK: ![[FOO_BW]] = !{!"branch_weights", i32 125, i32 15}
; POSTLINK: ![[AN_ENTRYPOINT_EP]] = !{!"function_entry_count", i64 100}
; POSTLINK: ![[AN_ENTRYPOINT_BW]] = !{!"branch_weights", i32 40, i32 60}
;--- profile.yaml
Contexts:
- Guid: 4909520559318251808
TotalRootEntryCount: 100
Unhandled:
- Guid: 1234
Counters: [200, 1000]
Counters: [100, 40]
Callsites: -
- Guid: 11872291593386833696
Counters: [ 100, 5 ]
-
- Guid: 11872291593386833696
Counters: [ 40, 10 ]
FlatProfiles:
- Guid: 1234
Counters: [ 100, 2000 ]
;--- example.ll
declare void @bar()
define void @foo(i32 %a, ptr %fct) #0 !guid !0 {
%t = icmp sgt i32 %a, 7
br i1 %t, label %yes, label %no
yes:
call void %fct(i32 %a)
br label %exit
no:
call void @bar()
br label %exit
exit:
ret void
}
define void @an_entrypoint(i32 %a) !guid !1 {
%t = icmp sgt i32 %a, 0
call void @foo(i32 10, ptr null)
br i1 %t, label %yes, label %no
yes:
call void @foo(i32 1, ptr null)
ret void
no:
ret void
}
attributes #0 = { noinline }
!0 = !{ i64 11872291593386833696 }
!1 = !{i64 4909520559318251808}