blob: ce06d1712f8409c15ed2189ee3367c5269be6013 [file] [log] [blame]
; The static-data-splitter processes data from @cold_func first,
; @unprofiled_func secondly, and @hot_func after the two functions above.
; Tests that data hotness is based on aggregated module-wide profile
; information. This way linker-mergable data is emitted once per module.
target datalayout = "e-m:e-p270:32:32-p271:32:32-p272:64:64-i64:64-i128:128-f80:128-n8:16:32:64-S128"
target triple = "x86_64-unknown-linux-gnu"
; The three RUN commands set `-relocation-model=pic` so `hot_relro_array` and
; `cold_relro_array` are placed in the .data.rel.ro-prefixed section.
; This RUN command sets `-data-sections=true -unique-section-names=true` so data
; sections are uniqufied by numbers.
; RUN: llc -mtriple=x86_64-unknown-linux-gnu -relocation-model=pic \
; RUN: -partition-static-data-sections=true \
; RUN: -data-sections=true -unique-section-names=true \
; RUN: %s -o - 2>&1 | FileCheck %s --check-prefixes=SYM,COMMON --dump-input=always
; This RUN command sets `-data-sections=true -unique-section-names=false` so
; data sections are uniqufied by variable names.
; RUN: llc -mtriple=x86_64-unknown-linux-gnu -relocation-model=pic \
; RUN: -partition-static-data-sections=true \
; RUN: -data-sections=true -unique-section-names=false \
; RUN: %s -o - 2>&1 | FileCheck %s --check-prefixes=UNIQ,COMMON --dump-input=always
; This RUN command sets `-data-sections=false -unique-section-names=false`.
; RUN: llc -mtriple=x86_64-unknown-linux-gnu -relocation-model=pic \
; RUN: -partition-static-data-sections=true \
; RUN: -data-sections=false -unique-section-names=false \
; RUN: %s -o - 2>&1 | FileCheck %s --check-prefixes=AGG,COMMON --dump-input=always
; For @.str and @.str.1
; COMMON: .type .L.str,@object
; SYM-NEXT: .section .rodata.str1.1.hot.
; UNIQ-NEXT: .section .rodata.str1.1.hot.,"aMS",@progbits,1
; AGG-NEXT: .section .rodata.str1.1.hot
; COMMON-NEXT: .L.str:
; COMMON-NEXT: "hot\t"
; COMMON: .L.str.1:
; COMMON-NEXT: "%d\t%d\t%d\n"
; For @hot_relro_array
; COMMON: .type hot_relro_array,@object
; SYM-NEXT: .section .data.rel.ro.hot.hot_relro_array
; UNIQ-NEXT: .section .data.rel.ro.hot.,"aw",@progbits,unique,1
; AGG-NEXT: .section .data.rel.ro.hot.,"aw",@progbits
; For @hot_data, which is accessed by {cold_func, unprofiled_func, hot_func}.
; COMMON: .type hot_data,@object
; SYM-NEXT: .section .data.hot.hot_data,"aw",@progbits
; UNIQ-NEXT: .section .data.hot.,"aw",@progbits,unique,2
; AGG-NEXT: .section .data.hot.,"aw",@progbits
; For @hot_bss, which is accessed by {unprofiled_func, hot_func}.
; COMMON: .type hot_bss,@object
; SYM-NEXT: .section .bss.hot.hot_bss,"aw",@nobits
; UNIQ-NEXT: .section .bss.hot.,"aw",@nobits,unique,3
; AGG-NEXT: .section .bss.hot.,"aw",@nobits
; For @.str.2
; COMMON: .type .L.str.2,@object
; SYM-NEXT: .section .rodata.str1.1.unlikely.,"aMS",@progbits,1
; UNIQ-NEXT: .section .rodata.str1.1.unlikely.,"aMS",@progbits,1
; AGG-NEXT: .section .rodata.str1.1.unlikely.,"aMS",@progbits,1
; COMMON-NEXT: .L.str.2:
; COMMON-NEXT: "cold%d\t%d\t%d\n"
; For @cold_bss
; COMMON: .type cold_bss,@object
; SYM-NEXT: .section .bss.unlikely.cold_bss,"aw",@nobits
; UNIQ-NEXT: .section .bss.unlikely.,"aw",@nobits,unique,4
; AGG-NEXT: .section .bss.unlikely.,"aw",@nobits
; For @cold_data
; COMMON: .type cold_data,@object
; SYM-NEXT: .section .data.unlikely.cold_data,"aw",@progbits
; UNIQ-NEXT: .section .data.unlikely.,"aw",@progbits,unique,5
; AGG-NEXT: .section .data.unlikely.,"aw",@progbits
; For @cold_data_custom_foo_section
; It has an explicit section 'foo' and shouldn't have hot or unlikely suffix.
; COMMON: .type cold_data_custom_foo_section,@object
; SYM-NEXT: .section foo,"aw",@progbits
; UNIQ-NEXT: .section foo,"aw",@progbits
; AGG-NEXT: .section foo,"aw",@progbits
; For @cold_relro_array
; COMMON: .type cold_relro_array,@object
; SYM-NEXT: .section .data.rel.ro.unlikely.cold_relro_array,"aw",@progbits
; UNIQ-NEXT: .section .data.rel.ro.unlikely.,"aw",@progbits,unique,6
; AGG-NEXT: .section .data.rel.ro.unlikely.,"aw",@progbits
; Currently static-data-splitter only analyzes access from code.
; @bss2 and @data3 are indirectly accessed by code through @hot_relro_array
; and @cold_relro_array. A follow-up item is to analyze indirect access via data
; and prune the unlikely list.
; For @bss2
; COMMON: .type bss2,@object
; SYM-NEXT: .section .bss.unlikely.bss2,"aw",@nobits
; UNIQ-NEXT: .section .bss.unlikely.,"aw",@nobits,unique,7
; AGG-NEXT: .section .bss.unlikely.,"aw",@nobits
; For @data3
; COMMON: .type data3,@object
; SYM-NEXT: .section .data.unlikely.data3,"aw",@progbits
; UNIQ-NEXT: .section .data.unlikely.,"aw",@progbits,unique,8
; AGG-NEXT: .section .data.unlikely.,"aw",@progbits
; For @data_with_unknown_hotness
; SYM: .type .Ldata_with_unknown_hotness,@object # @data_with_unknown_hotness
; SYM: .section .data..Ldata_with_unknown_hotness,"aw",@progbits
; UNIQ: .section .data,"aw",@progbits,unique,9
; The `.section` directive is omitted for .data with -unique-section-names=false.
; See MCSectionELF::shouldOmitSectionDirective for the implementation details.
; AGG: .data
; COMMON: .Ldata_with_unknown_hotness:
; For @hot_data_custom_bar_section
; It has an explicit section attribute 'var' and shouldn't have hot or unlikely suffix.
; COMMON: .type hot_data_custom_bar_section,@object
; SYM-NEXT: .section bar,"aw",@progbits
; SYM: hot_data_custom_bar_section
; UNIQ: .section bar,"aw",@progbits
; AGG: .section bar,"aw",@progbits
@.str = private unnamed_addr constant [5 x i8] c"hot\09\00", align 1
@.str.1 = private unnamed_addr constant [10 x i8] c"%d\09%d\09%d\0A\00", align 1
@hot_relro_array = internal constant [2 x ptr] [ptr @bss2, ptr @data3]
@hot_data = internal global i32 5
@hot_bss = internal global i32 0
@.str.2 = private unnamed_addr constant [14 x i8] c"cold%d\09%d\09%d\0A\00", align 1
@cold_bss = internal global i32 0
@cold_data = internal global i32 4
@cold_data_custom_foo_section = internal global i32 100, section "foo"
@cold_relro_array = internal constant [2 x ptr] [ptr @data3, ptr @bss2]
@bss2 = internal global i32 0
@data3 = internal global i32 3
@data_with_unknown_hotness = private global i32 5
@hot_data_custom_bar_section = internal global i32 101 #0
define void @cold_func(i32 %0) !prof !15 {
%2 = load i32, ptr @cold_bss
%3 = load i32, ptr @cold_data
%4 = srem i32 %0, 2
%5 = sext i32 %4 to i64
%6 = getelementptr inbounds [2 x ptr], ptr @cold_relro_array, i64 0, i64 %5
%7 = load ptr, ptr %6
%8 = load i32, ptr %7
%9 = load i32, ptr @data_with_unknown_hotness
%11 = load i32, ptr @hot_data
%12 = load i32, ptr @cold_data_custom_foo_section
%13 = call i32 (...) @func_taking_arbitrary_param(ptr @.str.2, i32 %2, i32 %3, i32 %8, i32 %9, i32 %11, i32 %12)
ret void
}
define i32 @unprofiled_func() {
%a = load i32, ptr @data_with_unknown_hotness
%b = load i32, ptr @hot_data
%c = load i32, ptr @hot_bss
%ret = call i32 (...) @func_taking_arbitrary_param(i32 %a, i32 %b, i32 %c)
ret i32 %ret
}
define void @hot_func(i32 %0) !prof !14 {
%2 = call i32 (...) @func_taking_arbitrary_param(ptr @.str)
%3 = srem i32 %0, 2
%4 = sext i32 %3 to i64
%5 = getelementptr inbounds [2 x ptr], ptr @hot_relro_array, i64 0, i64 %4
%6 = load ptr, ptr %5
%7 = load i32, ptr %6
%8 = load i32, ptr @hot_data
%9 = load i32, ptr @hot_bss
%10 = load i32, ptr @hot_data_custom_bar_section
%11 = call i32 (...) @func_taking_arbitrary_param(ptr @.str.1, i32 %7, i32 %8, i32 %9, i32 %10)
ret void
}
define i32 @main(i32 %0, ptr %1) !prof !15 {
br label %11
5: ; preds = %11
%6 = call i32 @rand()
store i32 %6, ptr @cold_bss
store i32 %6, ptr @cold_data
store i32 %6, ptr @bss2
store i32 %6, ptr @data3
call void @cold_func(i32 %6)
ret i32 0
11: ; preds = %11, %2
%12 = phi i32 [ 0, %2 ], [ %19, %11 ]
%13 = call i32 @rand()
%14 = srem i32 %13, 2
%15 = sext i32 %14 to i64
%16 = getelementptr inbounds [2 x ptr], ptr @hot_relro_array, i64 0, i64 %15
%17 = load ptr, ptr %16
store i32 %13, ptr %17
store i32 %13, ptr @hot_data
%18 = add i32 %13, 1
store i32 %18, ptr @hot_bss
call void @hot_func(i32 %12)
%19 = add i32 %12, 1
%20 = icmp eq i32 %19, 100000
br i1 %20, label %5, label %11, !prof !16
}
declare i32 @rand()
declare i32 @func_taking_arbitrary_param(...)
attributes #0 = {"data-section"="bar"}
!llvm.module.flags = !{!1}
!1 = !{i32 1, !"ProfileSummary", !2}
!2 = !{!3, !4, !5, !6, !7, !8, !9, !10}
!3 = !{!"ProfileFormat", !"InstrProf"}
!4 = !{!"TotalCount", i64 1460183}
!5 = !{!"MaxCount", i64 849024}
!6 = !{!"MaxInternalCount", i64 32769}
!7 = !{!"MaxFunctionCount", i64 849024}
!8 = !{!"NumCounts", i64 23627}
!9 = !{!"NumFunctions", i64 3271}
!10 = !{!"DetailedSummary", !11}
!11 = !{!12, !13}
!12 = !{i32 990000, i64 166, i32 73}
!13 = !{i32 999999, i64 3, i32 1443}
!14 = !{!"function_entry_count", i64 100000}
!15 = !{!"function_entry_count", i64 1}
!16 = !{!"branch_weights", i32 1, i32 99999}