1
0
mirror of https://github.com/RPCS3/llvm-mirror.git synced 2024-11-26 04:32:44 +01:00
llvm-mirror/test/Transforms/PGOProfile/indirect_call_promotion_musttail.ll
Teresa Johnson 01add29a48 [ICP] Don't promote when target not defined in module
This guards against cases where the symbol was dead code eliminated in
the binary by ThinLTO, and we have a sample profile collected for one
binary but used to optimize another.

Most of the benefit from ICP comes from inlining the target, which we
can't do with only a declaration anyway. If this is in the pre-ThinLTO
link step (e.g. for instrumentation based PGO), we will attempt the
promotion again in the ThinLTO backend after importing anyway, and we
don't need the early promotion to facilitate that.

Differential Revision: https://reviews.llvm.org/D92804
2020-12-08 07:45:36 -08:00

77 lines
3.0 KiB
LLVM

; RUN: opt < %s -pgo-icall-prom -S | FileCheck %s --check-prefix=ICALL-PROM
; RUN: opt < %s -passes=pgo-icall-prom -S | FileCheck %s --check-prefix=ICALL-PROM
target datalayout = "e-m:e-p270:32:32-p271:32:32-p272:64:64-i64:64-f80:128-n8:16:32:64-S128"
target triple = "x86_64-unknown-linux-gnu"
@foo = common global i32* ()* null, align 8
define i32* @func1() {
ret i32* null
}
define i32* @func2() {
ret i32* null
}
define i32* @func3() {
ret i32* null
}
define i32* @func4() {
ret i32* null
}
define i32* @bar() {
entry:
%tmp = load i32* ()*, i32* ()** @foo, align 8
; ICALL-PROM: [[CMP1:%[0-9]+]] = icmp eq i32* ()* %tmp, @func4
; ICALL-PROM: br i1 [[CMP1]], label %if.true.direct_targ, label %[[L1:[0-9]+]], !prof [[BRANCH_WEIGHT1:![0-9]+]]
; ICALL-PROM: if.true.direct_targ:
; ICALL-PROM: [[DIRCALL_RET1:%[0-9]+]] = musttail call i32* @func4()
; ICALL-PROM: ret i32* [[DIRCALL_RET1]]
; ICALL-PROM: [[L1]]:
; ICALL-PROM: [[CMP2:%[0-9]+]] = icmp eq i32* ()* %tmp, @func2
; ICALL-PROM: br i1 [[CMP2]], label %if.true.direct_targ1, label %[[L2:[0-9]+]], !prof [[BRANCH_WEIGHT2:![0-9]+]]
; ICALL-PROM: if.true.direct_targ1:
; ICALL-PROM: [[DIRCALL_RET2:%[0-9]+]] = musttail call i32* @func2()
; ICALL-PROM: ret i32* [[DIRCALL_RET2]]
; ICALL-PROM: [[L2]]:
; ICALL-PROM: [[CMP3:%[0-9]+]] = icmp eq i32* ()* %tmp, @func3
; ICALL-PROM: br i1 [[CMP3]], label %if.true.direct_targ2, label %[[L3:[0-9]+]], !prof [[BRANCH_WEIGHT3:![0-9]+]]
; ICALL-PROM: if.true.direct_targ2:
; ICALL-PROM: [[DIRCALL_RET3:%[0-9]+]] = musttail call i32* @func3()
; ICALL-PROM: ret i32* [[DIRCALL_RET3]]
; ICALL-PROM: [[L3]]:
; ICALL-PROM: %call = musttail call i32* %tmp()
; ICALL-PROM: ret i32* %call
%call = musttail call i32* %tmp(), !prof !1
ret i32* %call
}
define i64* @bar2() {
entry:
%tmp = load i32* ()*, i32* ()** @foo, align 8
; ICALL-PROM: [[CMP1:%[0-9]+]] = icmp eq i32* ()* %tmp, @func4
; ICALL-PROM: br i1 [[CMP1]], label %if.true.direct_targ, label %[[L4:[0-9]+]], !prof [[BRANCH_WEIGHT4:![0-9]+]]
; ICALL-PROM: if.true.direct_targ:
; ICALL-PROM: [[DIRCALL_RET1:%[0-9]+]] = musttail call i32* @func4()
; ICALL-PROM: [[DIRCALL_RET2:%[0-9]+]] = bitcast i32* [[DIRCALL_RET1]] to i64*
; ICALL-PROM: ret i64* [[DIRCALL_RET2]]
; ICALL-PROM: [[L4]]:
; ICALL-PROM: %call = musttail call i32* %tmp()
; ICALL-PROM: %rv = bitcast i32* %call to i64*
; ICALL-PROM: ret i64* %rv
%call = musttail call i32* %tmp(), !prof !2
%rv = bitcast i32* %call to i64*
ret i64* %rv
}
!1 = !{!"VP", i32 0, i64 1600, i64 7651369219802541373, i64 1030, i64 -4377547752858689819, i64 410, i64 -6929281286627296573, i64 150, i64 -2545542355363006406, i64 10}
!2 = !{!"VP", i32 0, i64 100, i64 7651369219802541373, i64 100}
; ICALL-PROM: [[BRANCH_WEIGHT1]] = !{!"branch_weights", i32 1030, i32 570}
; ICALL-PROM: [[BRANCH_WEIGHT2]] = !{!"branch_weights", i32 410, i32 160}
; ICALL-PROM: [[BRANCH_WEIGHT3]] = !{!"branch_weights", i32 150, i32 10}
; ICALL-PROM: [[BRANCH_WEIGHT4]] = !{!"branch_weights", i32 100, i32 0}