| ;; Test to make sure that missing tail call frames in memprof profiles are |
| ;; identified but not cloned when there are multiple non-unique possible |
| ;; tail call chains between the profiled frames. |
| |
| ;; -stats requires asserts |
| ; REQUIRES: asserts |
| |
| ; RUN: opt -passes=memprof-context-disambiguation -supports-hot-cold-new \ |
| ; RUN: -memprof-export-to-dot -memprof-dot-file-path-prefix=%t. \ |
| ; RUN: -stats -debug %s -S 2>&1 | FileCheck %s --check-prefix=STATS \ |
| ; RUN: --check-prefix=IR --check-prefix=DEBUG |
| |
| ; DEBUG: Not found through unique tail call chain: _Z3barv from main that actually called xyz (found multiple possible chains) |
| |
| ;; Graph fixup should have nulled the call in the node that could not be |
| ;; resolved via tail call fixup. That happens in between the initial |
| ;; stack update and the end of graph building. |
| ; RUN: cat %t.ccg.poststackupdate.dot | FileCheck %s --check-prefix=DOTPOSTSTACKUPDATE |
| ; DOTPOSTSTACKUPDATE: {OrigId: 15025054523792398438\nmain -\> xyz} |
| ; RUN: cat %t.ccg.postbuild.dot | FileCheck %s --check-prefix=DOTPOSTBUILD |
| ; DOTPOSTBUILD: {OrigId: 15025054523792398438\nnull call (external)} |
| |
| ;; Check that all calls in the IR are to the original functions, leading to a |
| ;; non-cold operator new call. |
| |
| source_filename = "tailcall-nonunique.cc" |
| target datalayout = "e-m:e-p270:32:32-p271:32:32-p272:64:64-i64:64-i128:128-f80:128-n8:16:32:64-S128" |
| target triple = "x86_64-unknown-linux-gnu" |
| |
| ; Function Attrs: noinline |
| ; IR-LABEL: @_Z3barv() |
| define dso_local ptr @_Z3barv() local_unnamed_addr #0 { |
| entry: |
| ; IR: call ptr @_Znam(i64 10) #[[NOTCOLD:[0-9]+]] |
| %call = tail call ptr @_Znam(i64 10) #2, !memprof !0, !callsite !9 |
| ret ptr %call |
| } |
| |
| ; Function Attrs: nobuiltin allocsize(0) |
| declare ptr @_Znam(i64) #1 |
| |
| ; Function Attrs: noinline |
| ; IR-LABEL: @_Z5blah1v() |
| define dso_local ptr @_Z5blah1v() local_unnamed_addr #0 { |
| entry: |
| ; IR: call ptr @_Z3barv() |
| %call = tail call ptr @_Z3barv() |
| ret ptr %call |
| } |
| |
| ; Function Attrs: noinline |
| ; IR-LABEL: @_Z5blah2v() |
| define dso_local ptr @_Z5blah2v() local_unnamed_addr #0 { |
| entry: |
| ; IR: call ptr @_Z3barv() |
| %call = tail call ptr @_Z3barv() |
| ret ptr %call |
| } |
| |
| ; Function Attrs: noinline |
| ; IR-LABEL: @_Z4baz1v() |
| define dso_local ptr @_Z4baz1v() local_unnamed_addr #0 { |
| entry: |
| ; IR: call ptr @_Z5blah1v() |
| %call = tail call ptr @_Z5blah1v() |
| ret ptr %call |
| } |
| |
| ; Function Attrs: noinline |
| ; IR-LABEL: @_Z4baz2v() |
| define dso_local ptr @_Z4baz2v() local_unnamed_addr #0 { |
| entry: |
| ; IR: call ptr @_Z5blah2v() |
| %call = tail call ptr @_Z5blah2v() |
| ret ptr %call |
| } |
| |
| ; Function Attrs: noinline |
| ; IR-LABEL: @_Z3foob(i1 %b) |
| define dso_local ptr @_Z3foob(i1 %b) local_unnamed_addr #0 { |
| entry: |
| br i1 %b, label %if.then, label %if.else |
| |
| if.then: ; preds = %entry |
| ; IR: call ptr @_Z4baz1v() |
| %call = tail call ptr @_Z4baz1v() |
| br label %return |
| |
| if.else: ; preds = %entry |
| ; IR: call ptr @_Z4baz2v() |
| %call1 = tail call ptr @_Z4baz2v() |
| br label %return |
| |
| return: ; preds = %if.else, %if.then |
| %retval.0 = phi ptr [ %call, %if.then ], [ %call1, %if.else ] |
| ret ptr %retval.0 |
| } |
| |
| ; Function Attrs: noinline |
| ; IR-LABEL: @xyz() |
| define dso_local i32 @xyz() local_unnamed_addr #0 { |
| ; IR: call ptr @_Z3foob(i1 true) |
| %call = tail call ptr @_Z3foob(i1 true) |
| ; IR: call ptr @_Z3foob(i1 true) |
| %call1 = tail call ptr @_Z3foob(i1 true) |
| ; IR: call ptr @_Z3foob(i1 false) |
| %call2 = tail call ptr @_Z3foob(i1 false) |
| ; IR: call ptr @_Z3foob(i1 false) |
| %call3 = tail call ptr @_Z3foob(i1 false) |
| ret i32 0 |
| } |
| |
| define dso_local i32 @main() local_unnamed_addr #0 { |
| ; IR: call i32 @xyz() |
| %call1 = tail call i32 @xyz(), !callsite !11 |
| ret i32 0 |
| } |
| |
| ; IR: attributes #[[NOTCOLD]] = { builtin allocsize(0) "memprof"="notcold" } |
| |
| ; STATS: 1 memprof-context-disambiguation - Number of profiled callees found via multiple tail call chains |
| |
| attributes #0 = { noinline } |
| attributes #1 = { nobuiltin allocsize(0) } |
| attributes #2 = { builtin allocsize(0) } |
| |
| !0 = !{!5, !7} |
| !5 = !{!6, !"notcold"} |
| !6 = !{i64 3186456655321080972, i64 8632435727821051414} |
| !7 = !{!8, !"cold"} |
| !8 = !{i64 3186456655321080972, i64 -3421689549917153178} |
| !9 = !{i64 3186456655321080972} |
| !11 = !{i64 -3421689549917153178} |