
Per discussion in https://github.com/llvm/llvm-project/pull/129781#discussion_r2017489088, we'd like to refactor out the requirement of MFS.
230 lines
9.1 KiB
LLVM
230 lines
9.1 KiB
LLVM
; The static-data-splitter processes data from @cold_func first,
|
|
; @unprofiled_func secondly, and @hot_func after the two functions above.
|
|
; Tests that data hotness is based on aggregated module-wide profile
|
|
; information. This way linker-mergable data is emitted once per module.
|
|
|
|
target datalayout = "e-m:e-p270:32:32-p271:32:32-p272:64:64-i64:64-i128:128-f80:128-n8:16:32:64-S128"
|
|
target triple = "x86_64-unknown-linux-gnu"
|
|
|
|
; The three RUN commands set `-relocation-model=pic` so `hot_relro_array` and
|
|
; `cold_relro_array` are placed in the .data.rel.ro-prefixed section.
|
|
|
|
; This RUN command sets `-data-sections=true -unique-section-names=true` so data
|
|
; sections are uniqufied by numbers.
|
|
; RUN: llc -mtriple=x86_64-unknown-linux-gnu -relocation-model=pic \
|
|
; RUN: -partition-static-data-sections=true \
|
|
; RUN: -data-sections=true -unique-section-names=true \
|
|
; RUN: %s -o - 2>&1 | FileCheck %s --check-prefixes=SYM,COMMON --dump-input=always
|
|
|
|
; This RUN command sets `-data-sections=true -unique-section-names=false` so
|
|
; data sections are uniqufied by variable names.
|
|
; RUN: llc -mtriple=x86_64-unknown-linux-gnu -relocation-model=pic \
|
|
; RUN: -partition-static-data-sections=true \
|
|
; RUN: -data-sections=true -unique-section-names=false \
|
|
; RUN: %s -o - 2>&1 | FileCheck %s --check-prefixes=UNIQ,COMMON --dump-input=always
|
|
|
|
; This RUN command sets `-data-sections=false -unique-section-names=false`.
|
|
; RUN: llc -mtriple=x86_64-unknown-linux-gnu -relocation-model=pic \
|
|
; RUN: -partition-static-data-sections=true \
|
|
; RUN: -data-sections=false -unique-section-names=false \
|
|
; RUN: %s -o - 2>&1 | FileCheck %s --check-prefixes=AGG,COMMON --dump-input=always
|
|
|
|
; For @.str and @.str.1
|
|
; COMMON: .type .L.str,@object
|
|
; SYM-NEXT: .section .rodata.str1.1.hot.
|
|
; UNIQ-NEXT: .section .rodata.str1.1.hot.,"aMS",@progbits,1
|
|
; AGG-NEXT: .section .rodata.str1.1.hot
|
|
; COMMON-NEXT: .L.str:
|
|
; COMMON-NEXT: "hot\t"
|
|
; COMMON: .L.str.1:
|
|
; COMMON-NEXT: "%d\t%d\t%d\n"
|
|
|
|
; For @hot_relro_array
|
|
; COMMON: .type hot_relro_array,@object
|
|
; SYM-NEXT: .section .data.rel.ro.hot.hot_relro_array
|
|
; UNIQ-NEXT: .section .data.rel.ro.hot.,"aw",@progbits,unique,1
|
|
; AGG-NEXT: .section .data.rel.ro.hot.,"aw",@progbits
|
|
|
|
; For @hot_data, which is accessed by {cold_func, unprofiled_func, hot_func}.
|
|
; COMMON: .type hot_data,@object
|
|
; SYM-NEXT: .section .data.hot.hot_data,"aw",@progbits
|
|
; UNIQ-NEXT: .section .data.hot.,"aw",@progbits,unique,2
|
|
; AGG-NEXT: .section .data.hot.,"aw",@progbits
|
|
|
|
; For @hot_bss, which is accessed by {unprofiled_func, hot_func}.
|
|
; COMMON: .type hot_bss,@object
|
|
; SYM-NEXT: .section .bss.hot.hot_bss,"aw",@nobits
|
|
; UNIQ-NEXT: .section .bss.hot.,"aw",@nobits,unique,3
|
|
; AGG-NEXT: .section .bss.hot.,"aw",@nobits
|
|
|
|
; For @.str.2
|
|
; COMMON: .type .L.str.2,@object
|
|
; SYM-NEXT: .section .rodata.str1.1.unlikely.,"aMS",@progbits,1
|
|
; UNIQ-NEXT: .section .rodata.str1.1.unlikely.,"aMS",@progbits,1
|
|
; AGG-NEXT: .section .rodata.str1.1.unlikely.,"aMS",@progbits,1
|
|
; COMMON-NEXT: .L.str.2:
|
|
; COMMON-NEXT: "cold%d\t%d\t%d\n"
|
|
|
|
; For @cold_bss
|
|
; COMMON: .type cold_bss,@object
|
|
; SYM-NEXT: .section .bss.unlikely.cold_bss,"aw",@nobits
|
|
; UNIQ-NEXT: .section .bss.unlikely.,"aw",@nobits,unique,4
|
|
; AGG-NEXT: .section .bss.unlikely.,"aw",@nobits
|
|
|
|
; For @cold_data
|
|
; COMMON: .type cold_data,@object
|
|
; SYM-NEXT: .section .data.unlikely.cold_data,"aw",@progbits
|
|
; UNIQ-NEXT: .section .data.unlikely.,"aw",@progbits,unique,5
|
|
; AGG-NEXT: .section .data.unlikely.,"aw",@progbits
|
|
|
|
; For @cold_data_custom_foo_section
|
|
; It has an explicit section 'foo' and shouldn't have hot or unlikely suffix.
|
|
; COMMON: .type cold_data_custom_foo_section,@object
|
|
; SYM-NEXT: .section foo,"aw",@progbits
|
|
; UNIQ-NEXT: .section foo,"aw",@progbits
|
|
; AGG-NEXT: .section foo,"aw",@progbits
|
|
|
|
; For @cold_relro_array
|
|
; COMMON: .type cold_relro_array,@object
|
|
; SYM-NEXT: .section .data.rel.ro.unlikely.cold_relro_array,"aw",@progbits
|
|
; UNIQ-NEXT: .section .data.rel.ro.unlikely.,"aw",@progbits,unique,6
|
|
; AGG-NEXT: .section .data.rel.ro.unlikely.,"aw",@progbits
|
|
|
|
; Currently static-data-splitter only analyzes access from code.
|
|
; @bss2 and @data3 are indirectly accessed by code through @hot_relro_array
|
|
; and @cold_relro_array. A follow-up item is to analyze indirect access via data
|
|
; and prune the unlikely list.
|
|
; For @bss2
|
|
; COMMON: .type bss2,@object
|
|
; SYM-NEXT: .section .bss.unlikely.bss2,"aw",@nobits
|
|
; UNIQ-NEXT: .section .bss.unlikely.,"aw",@nobits,unique,7
|
|
; AGG-NEXT: .section .bss.unlikely.,"aw",@nobits
|
|
|
|
; For @data3
|
|
; COMMON: .type data3,@object
|
|
; SYM-NEXT: .section .data.unlikely.data3,"aw",@progbits
|
|
; UNIQ-NEXT: .section .data.unlikely.,"aw",@progbits,unique,8
|
|
; AGG-NEXT: .section .data.unlikely.,"aw",@progbits
|
|
|
|
; For @data_with_unknown_hotness
|
|
; SYM: .type .Ldata_with_unknown_hotness,@object # @data_with_unknown_hotness
|
|
; SYM: .section .data..Ldata_with_unknown_hotness,"aw",@progbits
|
|
; UNIQ: .section .data,"aw",@progbits,unique,9
|
|
; The `.section` directive is omitted for .data with -unique-section-names=false.
|
|
; See MCSectionELF::shouldOmitSectionDirective for the implementation details.
|
|
; AGG: .data
|
|
; COMMON: .Ldata_with_unknown_hotness:
|
|
|
|
; For @hot_data_custom_bar_section
|
|
; It has an explicit section attribute 'var' and shouldn't have hot or unlikely suffix.
|
|
; COMMON: .type hot_data_custom_bar_section,@object
|
|
; SYM-NEXT: .section bar,"aw",@progbits
|
|
; SYM: hot_data_custom_bar_section
|
|
; UNIQ: .section bar,"aw",@progbits
|
|
; AGG: .section bar,"aw",@progbits
|
|
|
|
@.str = private unnamed_addr constant [5 x i8] c"hot\09\00", align 1
|
|
@.str.1 = private unnamed_addr constant [10 x i8] c"%d\09%d\09%d\0A\00", align 1
|
|
@hot_relro_array = internal constant [2 x ptr] [ptr @bss2, ptr @data3]
|
|
@hot_data = internal global i32 5
|
|
@hot_bss = internal global i32 0
|
|
@.str.2 = private unnamed_addr constant [14 x i8] c"cold%d\09%d\09%d\0A\00", align 1
|
|
@cold_bss = internal global i32 0
|
|
@cold_data = internal global i32 4
|
|
@cold_data_custom_foo_section = internal global i32 100, section "foo"
|
|
@cold_relro_array = internal constant [2 x ptr] [ptr @data3, ptr @bss2]
|
|
@bss2 = internal global i32 0
|
|
@data3 = internal global i32 3
|
|
@data_with_unknown_hotness = private global i32 5
|
|
@hot_data_custom_bar_section = internal global i32 101 #0
|
|
|
|
define void @cold_func(i32 %0) !prof !15 {
|
|
%2 = load i32, ptr @cold_bss
|
|
%3 = load i32, ptr @cold_data
|
|
%4 = srem i32 %0, 2
|
|
%5 = sext i32 %4 to i64
|
|
%6 = getelementptr inbounds [2 x ptr], ptr @cold_relro_array, i64 0, i64 %5
|
|
%7 = load ptr, ptr %6
|
|
%8 = load i32, ptr %7
|
|
%9 = load i32, ptr @data_with_unknown_hotness
|
|
%11 = load i32, ptr @hot_data
|
|
%12 = load i32, ptr @cold_data_custom_foo_section
|
|
%13 = call i32 (...) @func_taking_arbitrary_param(ptr @.str.2, i32 %2, i32 %3, i32 %8, i32 %9, i32 %11, i32 %12)
|
|
ret void
|
|
}
|
|
|
|
define i32 @unprofiled_func() {
|
|
%a = load i32, ptr @data_with_unknown_hotness
|
|
%b = load i32, ptr @hot_data
|
|
%c = load i32, ptr @hot_bss
|
|
%ret = call i32 (...) @func_taking_arbitrary_param(i32 %a, i32 %b, i32 %c)
|
|
ret i32 %ret
|
|
}
|
|
|
|
define void @hot_func(i32 %0) !prof !14 {
|
|
%2 = call i32 (...) @func_taking_arbitrary_param(ptr @.str)
|
|
%3 = srem i32 %0, 2
|
|
%4 = sext i32 %3 to i64
|
|
%5 = getelementptr inbounds [2 x ptr], ptr @hot_relro_array, i64 0, i64 %4
|
|
%6 = load ptr, ptr %5
|
|
%7 = load i32, ptr %6
|
|
%8 = load i32, ptr @hot_data
|
|
%9 = load i32, ptr @hot_bss
|
|
%10 = load i32, ptr @hot_data_custom_bar_section
|
|
%11 = call i32 (...) @func_taking_arbitrary_param(ptr @.str.1, i32 %7, i32 %8, i32 %9, i32 %10)
|
|
ret void
|
|
}
|
|
|
|
define i32 @main(i32 %0, ptr %1) !prof !15 {
|
|
br label %11
|
|
|
|
5: ; preds = %11
|
|
%6 = call i32 @rand()
|
|
store i32 %6, ptr @cold_bss
|
|
store i32 %6, ptr @cold_data
|
|
store i32 %6, ptr @bss2
|
|
store i32 %6, ptr @data3
|
|
call void @cold_func(i32 %6)
|
|
ret i32 0
|
|
|
|
11: ; preds = %11, %2
|
|
%12 = phi i32 [ 0, %2 ], [ %19, %11 ]
|
|
%13 = call i32 @rand()
|
|
%14 = srem i32 %13, 2
|
|
%15 = sext i32 %14 to i64
|
|
%16 = getelementptr inbounds [2 x ptr], ptr @hot_relro_array, i64 0, i64 %15
|
|
%17 = load ptr, ptr %16
|
|
store i32 %13, ptr %17
|
|
store i32 %13, ptr @hot_data
|
|
%18 = add i32 %13, 1
|
|
store i32 %18, ptr @hot_bss
|
|
call void @hot_func(i32 %12)
|
|
%19 = add i32 %12, 1
|
|
%20 = icmp eq i32 %19, 100000
|
|
br i1 %20, label %5, label %11, !prof !16
|
|
}
|
|
|
|
declare i32 @rand()
|
|
declare i32 @func_taking_arbitrary_param(...)
|
|
|
|
attributes #0 = {"data-section"="bar"}
|
|
|
|
!llvm.module.flags = !{!1}
|
|
|
|
!1 = !{i32 1, !"ProfileSummary", !2}
|
|
!2 = !{!3, !4, !5, !6, !7, !8, !9, !10}
|
|
!3 = !{!"ProfileFormat", !"InstrProf"}
|
|
!4 = !{!"TotalCount", i64 1460183}
|
|
!5 = !{!"MaxCount", i64 849024}
|
|
!6 = !{!"MaxInternalCount", i64 32769}
|
|
!7 = !{!"MaxFunctionCount", i64 849024}
|
|
!8 = !{!"NumCounts", i64 23627}
|
|
!9 = !{!"NumFunctions", i64 3271}
|
|
!10 = !{!"DetailedSummary", !11}
|
|
!11 = !{!12, !13}
|
|
!12 = !{i32 990000, i64 166, i32 73}
|
|
!13 = !{i32 999999, i64 3, i32 1443}
|
|
!14 = !{!"function_entry_count", i64 100000}
|
|
!15 = !{!"function_entry_count", i64 1}
|
|
!16 = !{!"branch_weights", i32 1, i32 99999}
|