| ; REQUIRES: asserts |
| ; asserts are required for -debug-only=<pass-name> |
| |
| ; RUN: rm -rf %t && split-file %s %t && cd %t |
| |
| ;; Read text profiles and merge them into indexed profiles. |
| ; RUN: llvm-profdata merge --memprof-version=4 memprof.yaml -o memprof.profdata |
| ; RUN: llvm-profdata merge --memprof-version=4 memprof-no-dap.yaml -o memprof-no-dap.profdata |
| |
| ;; Run optimizer pass on an IR module without IR functions, and test that global |
| ;; variables in the module could be annotated (i.e., no early return), |
| ; RUN: opt -passes='memprof-use<profile-filename=memprof.profdata>' -memprof-annotate-static-data-prefix \ |
| ; RUN: -debug-only=memprof -stats -S funcless-module.ll -o - 2>&1 | FileCheck %s --check-prefixes=LOG,IR,STAT |
| |
| ;; Run optimizer pass on the IR, and check the section prefix. |
| ; RUN: opt -passes='memprof-use<profile-filename=memprof.profdata>' -memprof-annotate-static-data-prefix \ |
| ; RUN: -debug-only=memprof -stats -S input.ll -o - 2>&1 | FileCheck %s --check-prefixes=LOG,IR,STAT |
| |
| ;; Run memprof without providing memprof data. Test that IR has module flag |
| ;; `EnableDataAccessProf` as 0. |
| ; RUN: opt -passes='memprof-use<profile-filename=memprof-no-dap.profdata>' -memprof-annotate-static-data-prefix \ |
| ; RUN: -debug-only=memprof -stats -S input.ll -o - 2>&1 | FileCheck %s --check-prefix=FLAG |
| |
| ;; Run memprof without explicitly setting -memprof-annotate-static-data-prefix. |
| ;; The output text IR shouldn't have `section_prefix` or EnableDataAccessProf module flag. |
| ; RUN: opt -passes='memprof-use<profile-filename=memprof.profdata>' \ |
| ; RUN: -debug-only=memprof -stats -S input.ll -o - | FileCheck %s --check-prefix=FLAGLESS --implicit-check-not="section_prefix" |
| |
| ; LOG: Skip annotating string literal .str |
| ; LOG: Global variable var1 is annotated as hot |
| ; LOG: Global variable var2.llvm.125 is annotated as hot |
| ; LOG: Global variable bar is not annotated |
| ; LOG: Global variable foo is annotated as unlikely |
| ; LOG: Skip annotation for var3 due to explicit section name. |
| ; LOG: Skip annotation for var4 due to explicit section name. |
| ; LOG: Skip annotation for llvm.fake_var due to name starts with `llvm.`. |
| ; LOG: Skip annotation for qux due to linker declaration. |
| |
| ;; String literals are not annotated. |
| ; IR: @.str = unnamed_addr constant [5 x i8] c"abcde" |
| ; IR-NOT: section_prefix |
| ; IR: @var1 = global i32 123, !section_prefix !0 |
| |
| ;; @var.llvm.125 will be canonicalized to @var2 for profile look-up. |
| ; IR-NEXT: @var2.llvm.125 = global i64 0, !section_prefix !0 |
| |
| ;; @bar is not seen in hot symbol or known symbol set, so it won't get a section |
| ;; prefix. Test this by testing that there is no section_prefix between @bar and |
| ;; @foo. |
| ; IR-NEXT: @bar = global i16 3 |
| ; IR-NOT: !section_prefix |
| |
| ;; @foo is unlikely. |
| ; IR-NEXT: @foo = global i8 2, !section_prefix !1 |
| |
| ; IR-NEXT: @var3 = constant [2 x i32] [i32 12345, i32 6789], section "sec1" |
| ; IR-NEXT: @var4 = constant [1 x i64] [i64 98765] #0 |
| |
| ; IR: @llvm.fake_var = global i32 123 |
| ; IR-NOT: !section_prefix |
| ; IR: @qux = external global i64 |
| ; IR-NOT: !section_prefix |
| |
| ; IR: attributes #0 = { "rodata-section"="sec2" } |
| |
| ; IR: !0 = !{!"section_prefix", !"hot"} |
| ; IR-NEXT: !1 = !{!"section_prefix", !"unlikely"} |
| ; IR-NEXT: !2 = !{i32 2, !"EnableDataAccessProf", i32 1} |
| |
| ; FLAG: !{i32 2, !"EnableDataAccessProf", i32 0} |
| ; FLAGLESS-NOT: EnableDataAccessProf |
| |
| ; STAT: 1 memprof - Number of global vars annotated with 'unlikely' section prefix. |
| ; STAT: 2 memprof - Number of global vars with user-specified section (not annotated). |
| ; STAT: 2 memprof - Number of global vars annotated with 'hot' section prefix. |
| ; STAT: 1 memprof - Number of global vars with unknown hotness (no section prefix). |
| |
| ;--- memprof.yaml |
| --- |
| DataAccessProfiles: |
| SampledRecords: |
| - Symbol: var1 |
| AccessCount: 1000 |
| - Symbol: var2 |
| AccessCount: 5 |
| - Hash: 101010 |
| AccessCount: 145 |
| KnownColdSymbols: |
| - foo |
| KnownColdStrHashes: [ 999, 1001 ] |
| ... |
| ;--- memprof-no-dap.yaml |
| --- |
| # A memprof file with without data access profiles. The heap records are simplified |
| # to pass profile parsing and don't need to match the IR. |
| HeapProfileRecords: |
| - GUID: 0xdeadbeef12345678 |
| AllocSites: |
| - Callstack: |
| - { Function: 0x1111111111111111, LineOffset: 11, Column: 10, IsInlineFrame: true } |
| MemInfoBlock: |
| AllocCount: 111 |
| TotalSize: 222 |
| TotalLifetime: 333 |
| TotalLifetimeAccessDensity: 444 |
| CallSites: |
| - Frames: |
| - { Function: 0x5555555555555555, LineOffset: 55, Column: 50, IsInlineFrame: true } |
| ... |
| ;--- input.ll |
| |
| target datalayout = "e-m:e-p270:32:32-p271:32:32-p272:64:64-i64:64-i128:128-f80:128-n8:16:32:64-S128" |
| target triple = "x86_64-unknown-linux-gnu" |
| |
| @.str = unnamed_addr constant [5 x i8] c"abcde" |
| @var1 = global i32 123 |
| @var2.llvm.125 = global i64 0 |
| @bar = global i16 3 |
| @foo = global i8 2 |
| @var3 = constant [2 x i32][i32 12345, i32 6789], section "sec1" |
| @var4 = constant [1 x i64][i64 98765] #0 |
| @llvm.fake_var = global i32 123 |
| @qux = external global i64 |
| |
| define i32 @func() { |
| %a = load i32, ptr @var1 |
| %b = load i32, ptr @var2.llvm.125 |
| %c = load i32, ptr @llvm.fake_var |
| %ret = call i32 (...) @func_taking_arbitrary_param(i32 %a, i32 %b, i32 %c) |
| ret i32 %ret |
| } |
| |
| declare i32 @func_taking_arbitrary_param(...) |
| |
| attributes #0 = { "rodata-section"="sec2" } |
| |
| ;--- funcless-module.ll |
| |
| target datalayout = "e-m:e-p270:32:32-p271:32:32-p272:64:64-i64:64-i128:128-f80:128-n8:16:32:64-S128" |
| target triple = "x86_64-unknown-linux-gnu" |
| |
| @.str = unnamed_addr constant [5 x i8] c"abcde" |
| @var1 = global i32 123 |
| @var2.llvm.125 = global i64 0 |
| @bar = global i16 3 |
| @foo = global i8 2 |
| @var3 = constant [2 x i32][i32 12345, i32 6789], section "sec1" |
| @var4 = constant [1 x i64][i64 98765] #0 |
| @llvm.fake_var = global i32 123 |
| @qux = external global i64 |
| |
| |
| attributes #0 = { "rodata-section"="sec2" } |