mirror of
https://github.com/RPCS3/llvm-mirror.git
synced 2024-11-22 18:54:02 +01:00
8e4adad70b
alloca-dbgdeclare-merge.ll: alloca-merge-align.ll: array_merge.ll: NPM inliner does not merge allocas delete-call.ll: NPM inliner does not delete readonly calls externally_available.ll: NPM inliner does not delete available_externally functions inline-cold-callee.ll: inline-hot-callee.ll: inline-hot-callee.ll has a comment saying it only applies to legacy PM, I assume same for inline-cold-callee.ll devirtualize-2.ll: inline-hot-callsite: monster_scc.ll: pr22285.ll: already has legacy and new PM RUN lines inline-cold.ll: profile-summary required to see callee as cold prof-update-sample.ll: profile-summary required to update branch_weights Reviewed By: davidxl Differential Revision: https://reviews.llvm.org/D89093
122 lines
3.4 KiB
LLVM
122 lines
3.4 KiB
LLVM
; This tests that a hot callsite gets the (higher) inlinehint-threshold even without
|
|
; without inline hints and gets inlined because the cost is less than
|
|
; inlinehint-threshold. A cold callee with identical body does not get inlined because
|
|
; cost exceeds the inline-threshold
|
|
|
|
; RUN: opt < %s -inline -inline-threshold=0 -hot-callsite-threshold=100 -S -enable-new-pm=0 | FileCheck %s
|
|
; RUN: opt < %s -passes='require<profile-summary>,cgscc(inline)' -inline-threshold=0 -hot-callsite-threshold=100 -S | FileCheck %s
|
|
|
|
; Run this with the default O2 pipeline to test that profile summary analysis
|
|
; is available during inlining.
|
|
; RUN: opt < %s -passes='default<O2>' -inline-threshold=0 -hot-callsite-threshold=100 -S | FileCheck %s
|
|
|
|
define i32 @callee1(i32 %x) {
|
|
%x1 = add i32 %x, 1
|
|
%x2 = add i32 %x1, 1
|
|
%x3 = add i32 %x2, 1
|
|
call void @extern()
|
|
call void @extern()
|
|
ret i32 %x3
|
|
}
|
|
|
|
define i32 @callee2(i32 %x) {
|
|
; CHECK-LABEL: @callee2(
|
|
%x1 = add i32 %x, 1
|
|
%x2 = add i32 %x1, 1
|
|
%x3 = add i32 %x2, 1
|
|
call void @extern()
|
|
call void @extern()
|
|
ret i32 %x3
|
|
}
|
|
|
|
define i32 @caller2(i32 %y1) {
|
|
; CHECK-LABEL: @caller2(
|
|
; CHECK: call i32 @callee2
|
|
; CHECK-NOT: call i32 @callee1
|
|
; CHECK: ret i32 %x3.i
|
|
%y2 = call i32 @callee2(i32 %y1), !prof !22
|
|
%y3 = call i32 @callee1(i32 %y2), !prof !21
|
|
ret i32 %y3
|
|
}
|
|
|
|
declare i32 @__gxx_personality_v0(...)
|
|
|
|
define i32 @invoker2(i32 %y1) personality i8* bitcast (i32 (...)* @__gxx_personality_v0 to i8*) {
|
|
; CHECK-LABEL: @invoker2(
|
|
; CHECK: invoke i32 @callee2
|
|
; CHECK-NOT: invoke i32 @callee1
|
|
; CHECK: ret i32
|
|
%y2 = invoke i32 @callee2(i32 %y1) to label %next unwind label %lpad, !prof !22
|
|
|
|
next:
|
|
%y3 = invoke i32 @callee1(i32 %y2) to label %exit unwind label %lpad, !prof !21
|
|
|
|
exit:
|
|
ret i32 1
|
|
|
|
lpad:
|
|
%ll = landingpad { i8*, i32 } cleanup
|
|
ret i32 1
|
|
}
|
|
|
|
define i32 @invoker3(i32 %y1) personality i8* bitcast (i32 (...)* @__gxx_personality_v0 to i8*) {
|
|
; CHECK-LABEL: @invoker3(
|
|
; CHECK: invoke i32 @callee2
|
|
; CHECK-NOT: invoke i32 @callee1
|
|
; CHECK: ret i32
|
|
%y2 = invoke i32 @callee2(i32 %y1) to label %next unwind label %lpad,
|
|
!prof !{!"branch_weights", i64 1, i64 0}
|
|
|
|
next:
|
|
%y3 = invoke i32 @callee1(i32 %y2) to label %exit unwind label %lpad,
|
|
!prof !{!"branch_weights", i64 300, i64 1}
|
|
|
|
exit:
|
|
ret i32 1
|
|
|
|
lpad:
|
|
%ll = landingpad { i8*, i32 } cleanup
|
|
ret i32 1
|
|
}
|
|
|
|
define i32 @invoker4(i32 %y1) personality i8* bitcast (i32 (...)* @__gxx_personality_v0 to i8*) {
|
|
; CHECK-LABEL: @invoker4(
|
|
; CHECK: invoke i32 @callee2
|
|
; CHECK-NOT: invoke i32 @callee1
|
|
; CHECK: ret i32
|
|
%y2 = invoke i32 @callee2(i32 %y1) to label %next unwind label %lpad,
|
|
!prof !{!"branch_weights", i64 1, i64 0}
|
|
|
|
next:
|
|
%y3 = invoke i32 @callee1(i32 %y2) to label %exit unwind label %lpad,
|
|
!prof !{!"branch_weights", i64 0, i64 300}
|
|
|
|
exit:
|
|
ret i32 1
|
|
|
|
lpad:
|
|
%ll = landingpad { i8*, i32 } cleanup
|
|
ret i32 1
|
|
}
|
|
|
|
declare void @extern()
|
|
|
|
!llvm.module.flags = !{!1}
|
|
!21 = !{!"branch_weights", i64 300}
|
|
!22 = !{!"branch_weights", i64 1}
|
|
|
|
!1 = !{i32 1, !"ProfileSummary", !2}
|
|
!2 = !{!3, !4, !5, !6, !7, !8, !9, !10}
|
|
!3 = !{!"ProfileFormat", !"SampleProfile"}
|
|
!4 = !{!"TotalCount", i64 10000}
|
|
!5 = !{!"MaxCount", i64 1000}
|
|
!6 = !{!"MaxInternalCount", i64 1}
|
|
!7 = !{!"MaxFunctionCount", i64 1000}
|
|
!8 = !{!"NumCounts", i64 3}
|
|
!9 = !{!"NumFunctions", i64 3}
|
|
!10 = !{!"DetailedSummary", !11}
|
|
!11 = !{!12, !13, !14}
|
|
!12 = !{i32 10000, i64 100, i32 1}
|
|
!13 = !{i32 999000, i64 100, i32 1}
|
|
!14 = !{i32 999999, i64 1, i32 2}
|