mirror of
https://github.com/RPCS3/llvm-mirror.git
synced 2024-11-25 04:02:41 +01:00
f4af38fa5f
Summary: This is largely NFC*, in preparation for utilizing ProfileSummaryInfo and BranchFrequencyInfo analyses. In this patch I am only doing the splitting for the New PM, but I can do the same for the legacy PM as a follow-on if this looks good. *Not NFC since for partial unrolling we lose the updates done to the loop traversal (adding new sibling and child loops) - according to Chandler this is not very useful for partial unrolling, but it also means that the debugging flag -unroll-revisit-child-loops no longer works for partial unrolling. Reviewers: chandlerc Subscribers: mehdi_amini, mzolotukhin, eraman, llvm-commits Differential Revision: https://reviews.llvm.org/D36157 llvm-svn: 309886
54 lines
1.6 KiB
LLVM
54 lines
1.6 KiB
LLVM
; The goal of this test is checking if LastCallToStaticBonus is applied
|
|
; correctly while deciding inline deferral. For the test code below, when
|
|
; inliner evaluates the callsite of bar->baz, it checks if inlining of bar->baz
|
|
; prevents ininling of foo->bar, even when foo->bar inlining is more beneficial
|
|
; than bar->baz inlining. As LastCallToStaticBonus has a massive value, and
|
|
; both baz and bar has only one caller, the cost of foo->bar inlining and
|
|
; bar->baz inlining should be non-trivial for inliner to compute that bar->baz
|
|
; inlining can actaully prevent foo->bar inlining. To make the cost of these
|
|
; callsites big enough, loop unrolling pass with very high threshold is used to
|
|
; preprocess the test.
|
|
|
|
; RUN: opt < %s -loop-unroll -inline -unroll-threshold=15000 -inline-threshold=250 -S | FileCheck %s
|
|
; RUN: opt < %s -passes='function(require<opt-remark-emit>,unroll),require<profile-summary>,cgscc(inline)' -unroll-threshold=15000 -inline-threshold=250 -S | FileCheck %s
|
|
; CHECK-LABEL: define internal i32 @bar()
|
|
|
|
define internal i32 @baz() {
|
|
entry:
|
|
br label %bb1
|
|
|
|
bb1:
|
|
%ind = phi i32 [ 0, %entry ], [ %inc, %bb1 ]
|
|
call void @extern()
|
|
%inc = add nsw i32 %ind, 1
|
|
%cmp = icmp sgt i32 %inc, 510
|
|
br i1 %cmp, label %ret, label %bb1
|
|
|
|
ret:
|
|
ret i32 0
|
|
}
|
|
|
|
define internal i32 @bar() {
|
|
entry:
|
|
br label %bb1
|
|
|
|
bb1:
|
|
%ind = phi i32 [ 0, %entry ], [ %inc, %bb1 ]
|
|
call void @extern()
|
|
%inc = add nsw i32 %ind, 1
|
|
%cmp = icmp sgt i32 %inc, 510
|
|
br i1 %cmp, label %ret, label %bb1
|
|
|
|
ret:
|
|
call i32 @baz()
|
|
ret i32 0
|
|
}
|
|
|
|
define i32 @foo() {
|
|
entry:
|
|
call i32 @bar()
|
|
ret i32 0
|
|
}
|
|
|
|
declare void @extern()
|