mirror of
https://github.com/RPCS3/llvm-mirror.git
synced 2025-01-31 20:51:52 +01:00
1ba93908c7
AMDGPU currently only supports direct calls, but at lower optimisation levels it fails to lower statically direct calls which appear indirect due to a bitcast. Add a pass to visit all CallSites and use CallPromotionUtils to "devirtualize" calls. Differential Revision: https://reviews.llvm.org/D52741 llvm-svn: 345382
28 lines
975 B
LLVM
28 lines
975 B
LLVM
; RUN: opt -data-layout=A5 -S -mtriple=amdgcn-unknown-unknown -amdgpu-promote-alloca -disable-promote-alloca-to-vector < %s | FileCheck %s
|
|
|
|
; Make sure that AMDGPUPromoteAlloca doesn't crash if the called
|
|
; function is a constantexpr cast of a function.
|
|
|
|
declare void @foo(float addrspace(5)*) #0
|
|
declare void @foo.varargs(...) #0
|
|
|
|
; CHECK-LABEL: @crash_call_constexpr_cast(
|
|
; CHECK: alloca
|
|
; CHECK: call void
|
|
define amdgpu_kernel void @crash_call_constexpr_cast() #0 {
|
|
%alloca = alloca i32, addrspace(5)
|
|
call void bitcast (void (float addrspace(5)*)* @foo to void (i32 addrspace(5)*)*)(i32 addrspace(5)* %alloca) #0
|
|
ret void
|
|
}
|
|
|
|
; CHECK-LABEL: @crash_call_constexpr_cast_varargs(
|
|
; CHECK: alloca
|
|
; CHECK: call void
|
|
define amdgpu_kernel void @crash_call_constexpr_cast_varargs() #0 {
|
|
%alloca = alloca i32, addrspace(5)
|
|
call void bitcast (void (...)* @foo.varargs to void (i32 addrspace(5)*)*)(i32 addrspace(5)* %alloca) #0
|
|
ret void
|
|
}
|
|
|
|
attributes #0 = { nounwind }
|