mirror of
https://github.com/RPCS3/llvm-mirror.git
synced 2024-11-23 11:13:28 +01:00
54e8749794
This pass implements whole program optimization of virtual calls in cases where we know (via bitset information) that the list of callees is fixed. This includes the following: - Single implementation devirtualization: if a virtual call has a single possible callee, replace all calls with a direct call to that callee. - Virtual constant propagation: if the virtual function's return type is an integer <=64 bits and all possible callees are readnone, for each class and each list of constant arguments: evaluate the function, store the return value alongside the virtual table, and rewrite each virtual call as a load from the virtual table. - Uniform return value optimization: if the conditions for virtual constant propagation hold and each function returns the same constant value, replace each virtual call with that constant. - Unique return value optimization for i1 return values: if the conditions for virtual constant propagation hold and a single vtable's function returns 0, or a single vtable's function returns 1, replace each virtual call with a comparison of the vptr against that vtable's address. Differential Revision: http://reviews.llvm.org/D16795 llvm-svn: 260312
138 lines
5.7 KiB
LLVM
138 lines
5.7 KiB
LLVM
; RUN: opt -S -wholeprogramdevirt %s | FileCheck %s
|
|
|
|
target datalayout = "e-p:64:64"
|
|
target triple = "x86_64-unknown-linux-gnu"
|
|
|
|
; CHECK: [[VT1DATA:@[^ ]*]] = private constant { [8 x i8], [3 x i8*], [0 x i8] } { [8 x i8] c"\00\00\00\01\01\00\00\00", [3 x i8*] [i8* bitcast (i1 (i8*)* @vf0i1 to i8*), i8* bitcast (i1 (i8*)* @vf1i1 to i8*), i8* bitcast (i32 (i8*)* @vf1i32 to i8*)], [0 x i8] zeroinitializer }, section "vt1sec"
|
|
@vt1 = constant [3 x i8*] [
|
|
i8* bitcast (i1 (i8*)* @vf0i1 to i8*),
|
|
i8* bitcast (i1 (i8*)* @vf1i1 to i8*),
|
|
i8* bitcast (i32 (i8*)* @vf1i32 to i8*)
|
|
], section "vt1sec"
|
|
|
|
; CHECK: [[VT2DATA:@[^ ]*]] = private constant { [8 x i8], [3 x i8*], [0 x i8] } { [8 x i8] c"\00\00\00\02\02\00\00\00", [3 x i8*] [i8* bitcast (i1 (i8*)* @vf1i1 to i8*), i8* bitcast (i1 (i8*)* @vf0i1 to i8*), i8* bitcast (i32 (i8*)* @vf2i32 to i8*)], [0 x i8] zeroinitializer }{{$}}
|
|
@vt2 = constant [3 x i8*] [
|
|
i8* bitcast (i1 (i8*)* @vf1i1 to i8*),
|
|
i8* bitcast (i1 (i8*)* @vf0i1 to i8*),
|
|
i8* bitcast (i32 (i8*)* @vf2i32 to i8*)
|
|
]
|
|
|
|
; CHECK: [[VT3DATA:@[^ ]*]] = private constant { [8 x i8], [3 x i8*], [0 x i8] } { [8 x i8] c"\00\00\00\01\03\00\00\00", [3 x i8*] [i8* bitcast (i1 (i8*)* @vf0i1 to i8*), i8* bitcast (i1 (i8*)* @vf1i1 to i8*), i8* bitcast (i32 (i8*)* @vf3i32 to i8*)], [0 x i8] zeroinitializer }{{$}}
|
|
@vt3 = constant [3 x i8*] [
|
|
i8* bitcast (i1 (i8*)* @vf0i1 to i8*),
|
|
i8* bitcast (i1 (i8*)* @vf1i1 to i8*),
|
|
i8* bitcast (i32 (i8*)* @vf3i32 to i8*)
|
|
]
|
|
|
|
; CHECK: [[VT4DATA:@[^ ]*]] = private constant { [8 x i8], [3 x i8*], [0 x i8] } { [8 x i8] c"\00\00\00\02\04\00\00\00", [3 x i8*] [i8* bitcast (i1 (i8*)* @vf1i1 to i8*), i8* bitcast (i1 (i8*)* @vf0i1 to i8*), i8* bitcast (i32 (i8*)* @vf4i32 to i8*)], [0 x i8] zeroinitializer }{{$}}
|
|
@vt4 = constant [3 x i8*] [
|
|
i8* bitcast (i1 (i8*)* @vf1i1 to i8*),
|
|
i8* bitcast (i1 (i8*)* @vf0i1 to i8*),
|
|
i8* bitcast (i32 (i8*)* @vf4i32 to i8*)
|
|
]
|
|
|
|
@vt5 = constant [3 x i8*] [
|
|
i8* bitcast (void ()* @__cxa_pure_virtual to i8*),
|
|
i8* bitcast (void ()* @__cxa_pure_virtual to i8*),
|
|
i8* bitcast (void ()* @__cxa_pure_virtual to i8*)
|
|
]
|
|
|
|
; CHECK: @vt1 = alias [3 x i8*], getelementptr inbounds ({ [8 x i8], [3 x i8*], [0 x i8] }, { [8 x i8], [3 x i8*], [0 x i8] }* [[VT1DATA]], i32 0, i32 1)
|
|
; CHECK: @vt2 = alias [3 x i8*], getelementptr inbounds ({ [8 x i8], [3 x i8*], [0 x i8] }, { [8 x i8], [3 x i8*], [0 x i8] }* [[VT2DATA]], i32 0, i32 1)
|
|
; CHECK: @vt3 = alias [3 x i8*], getelementptr inbounds ({ [8 x i8], [3 x i8*], [0 x i8] }, { [8 x i8], [3 x i8*], [0 x i8] }* [[VT3DATA]], i32 0, i32 1)
|
|
; CHECK: @vt4 = alias [3 x i8*], getelementptr inbounds ({ [8 x i8], [3 x i8*], [0 x i8] }, { [8 x i8], [3 x i8*], [0 x i8] }* [[VT4DATA]], i32 0, i32 1)
|
|
|
|
define i1 @vf0i1(i8* %this) readnone {
|
|
ret i1 0
|
|
}
|
|
|
|
define i1 @vf1i1(i8* %this) readnone {
|
|
ret i1 1
|
|
}
|
|
|
|
define i32 @vf1i32(i8* %this) readnone {
|
|
ret i32 1
|
|
}
|
|
|
|
define i32 @vf2i32(i8* %this) readnone {
|
|
ret i32 2
|
|
}
|
|
|
|
define i32 @vf3i32(i8* %this) readnone {
|
|
ret i32 3
|
|
}
|
|
|
|
define i32 @vf4i32(i8* %this) readnone {
|
|
ret i32 4
|
|
}
|
|
|
|
; CHECK: define i1 @call1(
|
|
define i1 @call1(i8* %obj) {
|
|
%vtableptr = bitcast i8* %obj to [3 x i8*]**
|
|
%vtable = load [3 x i8*]*, [3 x i8*]** %vtableptr
|
|
; CHECK: [[VT1:%[^ ]*]] = bitcast [3 x i8*]* {{.*}} to i8*
|
|
%vtablei8 = bitcast [3 x i8*]* %vtable to i8*
|
|
%p = call i1 @llvm.bitset.test(i8* %vtablei8, metadata !"bitset")
|
|
call void @llvm.assume(i1 %p)
|
|
%fptrptr = getelementptr [3 x i8*], [3 x i8*]* %vtable, i32 0, i32 0
|
|
%fptr = load i8*, i8** %fptrptr
|
|
%fptr_casted = bitcast i8* %fptr to i1 (i8*)*
|
|
; CHECK: [[VTGEP1:%[^ ]*]] = getelementptr i8, i8* [[VT1]], i64 -5
|
|
; CHECK: [[VTLOAD1:%[^ ]*]] = load i8, i8* [[VTGEP1]]
|
|
; CHECK: [[VTAND1:%[^ ]*]] = and i8 [[VTLOAD1]], 2
|
|
; CHECK: [[VTCMP1:%[^ ]*]] = icmp ne i8 [[VTAND1]], 0
|
|
%result = call i1 %fptr_casted(i8* %obj)
|
|
; CHECK: ret i1 [[VTCMP1]]
|
|
ret i1 %result
|
|
}
|
|
|
|
; CHECK: define i1 @call2(
|
|
define i1 @call2(i8* %obj) {
|
|
%vtableptr = bitcast i8* %obj to [3 x i8*]**
|
|
%vtable = load [3 x i8*]*, [3 x i8*]** %vtableptr
|
|
; CHECK: [[VT2:%[^ ]*]] = bitcast [3 x i8*]* {{.*}} to i8*
|
|
%vtablei8 = bitcast [3 x i8*]* %vtable to i8*
|
|
%p = call i1 @llvm.bitset.test(i8* %vtablei8, metadata !"bitset")
|
|
call void @llvm.assume(i1 %p)
|
|
%fptrptr = getelementptr [3 x i8*], [3 x i8*]* %vtable, i32 0, i32 1
|
|
%fptr = load i8*, i8** %fptrptr
|
|
%fptr_casted = bitcast i8* %fptr to i1 (i8*)*
|
|
; CHECK: [[VTGEP2:%[^ ]*]] = getelementptr i8, i8* [[VT2]], i64 -5
|
|
; CHECK: [[VTLOAD2:%[^ ]*]] = load i8, i8* [[VTGEP2]]
|
|
; CHECK: [[VTAND2:%[^ ]*]] = and i8 [[VTLOAD2]], 1
|
|
; CHECK: [[VTCMP2:%[^ ]*]] = icmp ne i8 [[VTAND2]], 0
|
|
%result = call i1 %fptr_casted(i8* %obj)
|
|
; CHECK: ret i1 [[VTCMP2]]
|
|
ret i1 %result
|
|
}
|
|
|
|
; CHECK: define i32 @call3(
|
|
define i32 @call3(i8* %obj) {
|
|
%vtableptr = bitcast i8* %obj to [3 x i8*]**
|
|
%vtable = load [3 x i8*]*, [3 x i8*]** %vtableptr
|
|
; CHECK: [[VT3:%[^ ]*]] = bitcast [3 x i8*]* {{.*}} to i8*
|
|
%vtablei8 = bitcast [3 x i8*]* %vtable to i8*
|
|
%p = call i1 @llvm.bitset.test(i8* %vtablei8, metadata !"bitset")
|
|
call void @llvm.assume(i1 %p)
|
|
%fptrptr = getelementptr [3 x i8*], [3 x i8*]* %vtable, i32 0, i32 2
|
|
%fptr = load i8*, i8** %fptrptr
|
|
%fptr_casted = bitcast i8* %fptr to i32 (i8*)*
|
|
; CHECK: [[VTGEP3:%[^ ]*]] = getelementptr i8, i8* [[VT3]], i64 -4
|
|
; CHECK: [[VTBC3:%[^ ]*]] = bitcast i8* [[VTGEP3]] to i32*
|
|
; CHECK: [[VTLOAD3:%[^ ]*]] = load i32, i32* [[VTBC3]]
|
|
%result = call i32 %fptr_casted(i8* %obj)
|
|
; CHECK: ret i32 [[VTLOAD3]]
|
|
ret i32 %result
|
|
}
|
|
|
|
declare i1 @llvm.bitset.test(i8*, metadata)
|
|
declare void @llvm.assume(i1)
|
|
declare void @__cxa_pure_virtual()
|
|
|
|
!0 = !{!"bitset", [3 x i8*]* @vt1, i32 0}
|
|
!1 = !{!"bitset", [3 x i8*]* @vt2, i32 0}
|
|
!2 = !{!"bitset", [3 x i8*]* @vt3, i32 0}
|
|
!3 = !{!"bitset", [3 x i8*]* @vt4, i32 0}
|
|
!4 = !{!"bitset", [3 x i8*]* @vt5, i32 0}
|
|
!llvm.bitsets = !{!0, !1, !2, !3, !4}
|