| ; The static-data-splitter processes data from @cold_func first, |
| ; @unprofiled_func secondly, and @hot_func after the two functions above. |
| ; Tests that data hotness is based on aggregated module-wide profile |
| ; information. This way linker-mergable data is emitted once per module. |
| |
| target datalayout = "e-m:e-p270:32:32-p271:32:32-p272:64:64-i64:64-i128:128-f80:128-n8:16:32:64-S128" |
| target triple = "x86_64-unknown-linux-gnu" |
| |
| ; The three RUN commands set `-relocation-model=pic` so `hot_relro_array` and |
| ; `cold_relro_array` are placed in the .data.rel.ro-prefixed section. |
| |
| ; This RUN command sets `-data-sections=true -unique-section-names=true` so data |
| ; sections are uniqufied by numbers. |
| ; RUN: llc -mtriple=x86_64-unknown-linux-gnu -relocation-model=pic \ |
| ; RUN: -partition-static-data-sections=true \ |
| ; RUN: -data-sections=true -unique-section-names=true \ |
| ; RUN: %s -o - 2>&1 | FileCheck %s --check-prefixes=SYM,COMMON --dump-input=always |
| |
| ; This RUN command sets `-data-sections=true -unique-section-names=false` so |
| ; data sections are uniqufied by variable names. |
| ; RUN: llc -mtriple=x86_64-unknown-linux-gnu -relocation-model=pic \ |
| ; RUN: -partition-static-data-sections=true \ |
| ; RUN: -data-sections=true -unique-section-names=false \ |
| ; RUN: %s -o - 2>&1 | FileCheck %s --check-prefixes=UNIQ,COMMON --dump-input=always |
| |
| ; This RUN command sets `-data-sections=false -unique-section-names=false`. |
| ; RUN: llc -mtriple=x86_64-unknown-linux-gnu -relocation-model=pic \ |
| ; RUN: -partition-static-data-sections=true \ |
| ; RUN: -data-sections=false -unique-section-names=false \ |
| ; RUN: %s -o - 2>&1 | FileCheck %s --check-prefixes=AGG,COMMON --dump-input=always |
| |
| ; For @.str and @.str.1 |
| ; COMMON: .type .L.str,@object |
| ; SYM-NEXT: .section .rodata.str1.1.hot. |
| ; UNIQ-NEXT: .section .rodata.str1.1.hot.,"aMS",@progbits,1 |
| ; AGG-NEXT: .section .rodata.str1.1.hot |
| ; COMMON-NEXT: .L.str: |
| ; COMMON-NEXT: "hot\t" |
| ; COMMON: .L.str.1: |
| ; COMMON-NEXT: "%d\t%d\t%d\n" |
| |
| ; For @hot_relro_array |
| ; COMMON: .type hot_relro_array,@object |
| ; SYM-NEXT: .section .data.rel.ro.hot.hot_relro_array |
| ; UNIQ-NEXT: .section .data.rel.ro.hot.,"aw",@progbits,unique,1 |
| ; AGG-NEXT: .section .data.rel.ro.hot.,"aw",@progbits |
| |
| ; For @hot_data, which is accessed by {cold_func, unprofiled_func, hot_func}. |
| ; COMMON: .type hot_data,@object |
| ; SYM-NEXT: .section .data.hot.hot_data,"aw",@progbits |
| ; UNIQ-NEXT: .section .data.hot.,"aw",@progbits,unique,2 |
| ; AGG-NEXT: .section .data.hot.,"aw",@progbits |
| |
| ; For @hot_bss, which is accessed by {unprofiled_func, hot_func}. |
| ; COMMON: .type hot_bss,@object |
| ; SYM-NEXT: .section .bss.hot.hot_bss,"aw",@nobits |
| ; UNIQ-NEXT: .section .bss.hot.,"aw",@nobits,unique,3 |
| ; AGG-NEXT: .section .bss.hot.,"aw",@nobits |
| |
| ; For @.str.2 |
| ; COMMON: .type .L.str.2,@object |
| ; SYM-NEXT: .section .rodata.str1.1.unlikely.,"aMS",@progbits,1 |
| ; UNIQ-NEXT: .section .rodata.str1.1.unlikely.,"aMS",@progbits,1 |
| ; AGG-NEXT: .section .rodata.str1.1.unlikely.,"aMS",@progbits,1 |
| ; COMMON-NEXT: .L.str.2: |
| ; COMMON-NEXT: "cold%d\t%d\t%d\n" |
| |
| ; For @cold_bss |
| ; COMMON: .type cold_bss,@object |
| ; SYM-NEXT: .section .bss.unlikely.cold_bss,"aw",@nobits |
| ; UNIQ-NEXT: .section .bss.unlikely.,"aw",@nobits,unique,4 |
| ; AGG-NEXT: .section .bss.unlikely.,"aw",@nobits |
| |
| ; For @cold_data |
| ; COMMON: .type cold_data,@object |
| ; SYM-NEXT: .section .data.unlikely.cold_data,"aw",@progbits |
| ; UNIQ-NEXT: .section .data.unlikely.,"aw",@progbits,unique,5 |
| ; AGG-NEXT: .section .data.unlikely.,"aw",@progbits |
| |
| ; For @cold_data_custom_foo_section |
| ; It has an explicit section 'foo' and shouldn't have hot or unlikely suffix. |
| ; COMMON: .type cold_data_custom_foo_section,@object |
| ; SYM-NEXT: .section foo,"aw",@progbits |
| ; UNIQ-NEXT: .section foo,"aw",@progbits |
| ; AGG-NEXT: .section foo,"aw",@progbits |
| |
| ; For @cold_relro_array |
| ; COMMON: .type cold_relro_array,@object |
| ; SYM-NEXT: .section .data.rel.ro.unlikely.cold_relro_array,"aw",@progbits |
| ; UNIQ-NEXT: .section .data.rel.ro.unlikely.,"aw",@progbits,unique,6 |
| ; AGG-NEXT: .section .data.rel.ro.unlikely.,"aw",@progbits |
| |
| ; Currently static-data-splitter only analyzes access from code. |
| ; @bss2 and @data3 are indirectly accessed by code through @hot_relro_array |
| ; and @cold_relro_array. A follow-up item is to analyze indirect access via data |
| ; and prune the unlikely list. |
| ; For @bss2 |
| ; COMMON: .type bss2,@object |
| ; SYM-NEXT: .section .bss.unlikely.bss2,"aw",@nobits |
| ; UNIQ-NEXT: .section .bss.unlikely.,"aw",@nobits,unique,7 |
| ; AGG-NEXT: .section .bss.unlikely.,"aw",@nobits |
| |
| ; For @data3 |
| ; COMMON: .type data3,@object |
| ; SYM-NEXT: .section .data.unlikely.data3,"aw",@progbits |
| ; UNIQ-NEXT: .section .data.unlikely.,"aw",@progbits,unique,8 |
| ; AGG-NEXT: .section .data.unlikely.,"aw",@progbits |
| |
| ; For @data_with_unknown_hotness |
| ; SYM: .type .Ldata_with_unknown_hotness,@object # @data_with_unknown_hotness |
| ; SYM: .section .data..Ldata_with_unknown_hotness,"aw",@progbits |
| ; UNIQ: .section .data,"aw",@progbits,unique,9 |
| ; The `.section` directive is omitted for .data with -unique-section-names=false. |
| ; See MCSectionELF::shouldOmitSectionDirective for the implementation details. |
| ; AGG: .data |
| ; COMMON: .Ldata_with_unknown_hotness: |
| |
| ; For @hot_data_custom_bar_section |
| ; It has an explicit section attribute 'var' and shouldn't have hot or unlikely suffix. |
| ; COMMON: .type hot_data_custom_bar_section,@object |
| ; SYM-NEXT: .section bar,"aw",@progbits |
| ; SYM: hot_data_custom_bar_section |
| ; UNIQ: .section bar,"aw",@progbits |
| ; AGG: .section bar,"aw",@progbits |
| |
| @.str = private unnamed_addr constant [5 x i8] c"hot\09\00", align 1 |
| @.str.1 = private unnamed_addr constant [10 x i8] c"%d\09%d\09%d\0A\00", align 1 |
| @hot_relro_array = internal constant [2 x ptr] [ptr @bss2, ptr @data3] |
| @hot_data = internal global i32 5 |
| @hot_bss = internal global i32 0 |
| @.str.2 = private unnamed_addr constant [14 x i8] c"cold%d\09%d\09%d\0A\00", align 1 |
| @cold_bss = internal global i32 0 |
| @cold_data = internal global i32 4 |
| @cold_data_custom_foo_section = internal global i32 100, section "foo" |
| @cold_relro_array = internal constant [2 x ptr] [ptr @data3, ptr @bss2] |
| @bss2 = internal global i32 0 |
| @data3 = internal global i32 3 |
| @data_with_unknown_hotness = private global i32 5 |
| @hot_data_custom_bar_section = internal global i32 101 #0 |
| |
| define void @cold_func(i32 %0) !prof !15 { |
| %2 = load i32, ptr @cold_bss |
| %3 = load i32, ptr @cold_data |
| %4 = srem i32 %0, 2 |
| %5 = sext i32 %4 to i64 |
| %6 = getelementptr inbounds [2 x ptr], ptr @cold_relro_array, i64 0, i64 %5 |
| %7 = load ptr, ptr %6 |
| %8 = load i32, ptr %7 |
| %9 = load i32, ptr @data_with_unknown_hotness |
| %11 = load i32, ptr @hot_data |
| %12 = load i32, ptr @cold_data_custom_foo_section |
| %13 = call i32 (...) @func_taking_arbitrary_param(ptr @.str.2, i32 %2, i32 %3, i32 %8, i32 %9, i32 %11, i32 %12) |
| ret void |
| } |
| |
| define i32 @unprofiled_func() { |
| %a = load i32, ptr @data_with_unknown_hotness |
| %b = load i32, ptr @hot_data |
| %c = load i32, ptr @hot_bss |
| %ret = call i32 (...) @func_taking_arbitrary_param(i32 %a, i32 %b, i32 %c) |
| ret i32 %ret |
| } |
| |
| define void @hot_func(i32 %0) !prof !14 { |
| %2 = call i32 (...) @func_taking_arbitrary_param(ptr @.str) |
| %3 = srem i32 %0, 2 |
| %4 = sext i32 %3 to i64 |
| %5 = getelementptr inbounds [2 x ptr], ptr @hot_relro_array, i64 0, i64 %4 |
| %6 = load ptr, ptr %5 |
| %7 = load i32, ptr %6 |
| %8 = load i32, ptr @hot_data |
| %9 = load i32, ptr @hot_bss |
| %10 = load i32, ptr @hot_data_custom_bar_section |
| %11 = call i32 (...) @func_taking_arbitrary_param(ptr @.str.1, i32 %7, i32 %8, i32 %9, i32 %10) |
| ret void |
| } |
| |
| define i32 @main(i32 %0, ptr %1) !prof !15 { |
| br label %11 |
| |
| 5: ; preds = %11 |
| %6 = call i32 @rand() |
| store i32 %6, ptr @cold_bss |
| store i32 %6, ptr @cold_data |
| store i32 %6, ptr @bss2 |
| store i32 %6, ptr @data3 |
| call void @cold_func(i32 %6) |
| ret i32 0 |
| |
| 11: ; preds = %11, %2 |
| %12 = phi i32 [ 0, %2 ], [ %19, %11 ] |
| %13 = call i32 @rand() |
| %14 = srem i32 %13, 2 |
| %15 = sext i32 %14 to i64 |
| %16 = getelementptr inbounds [2 x ptr], ptr @hot_relro_array, i64 0, i64 %15 |
| %17 = load ptr, ptr %16 |
| store i32 %13, ptr %17 |
| store i32 %13, ptr @hot_data |
| %18 = add i32 %13, 1 |
| store i32 %18, ptr @hot_bss |
| call void @hot_func(i32 %12) |
| %19 = add i32 %12, 1 |
| %20 = icmp eq i32 %19, 100000 |
| br i1 %20, label %5, label %11, !prof !16 |
| } |
| |
| declare i32 @rand() |
| declare i32 @func_taking_arbitrary_param(...) |
| |
| attributes #0 = {"data-section"="bar"} |
| |
| !llvm.module.flags = !{!1} |
| |
| !1 = !{i32 1, !"ProfileSummary", !2} |
| !2 = !{!3, !4, !5, !6, !7, !8, !9, !10} |
| !3 = !{!"ProfileFormat", !"InstrProf"} |
| !4 = !{!"TotalCount", i64 1460183} |
| !5 = !{!"MaxCount", i64 849024} |
| !6 = !{!"MaxInternalCount", i64 32769} |
| !7 = !{!"MaxFunctionCount", i64 849024} |
| !8 = !{!"NumCounts", i64 23627} |
| !9 = !{!"NumFunctions", i64 3271} |
| !10 = !{!"DetailedSummary", !11} |
| !11 = !{!12, !13} |
| !12 = !{i32 990000, i64 166, i32 73} |
| !13 = !{i32 999999, i64 3, i32 1443} |
| !14 = !{!"function_entry_count", i64 100000} |
| !15 = !{!"function_entry_count", i64 1} |
| !16 = !{!"branch_weights", i32 1, i32 99999} |