mirror of
https://github.com/RPCS3/llvm-mirror.git
synced 2024-10-24 05:23:45 +02:00
dd9ab77318
Currently the default C calling convention functions are treated the same as compute kernels. Make this explicit so the default calling convention can be changed to a non-kernel. Converted with perl -pi -e 's/define void/define amdgpu_kernel void/' on the relevant test directories (and undoing in one place that actually wanted a non-kernel). llvm-svn: 298444
84 lines
2.9 KiB
LLVM
84 lines
2.9 KiB
LLVM
; RUN: llc -march=amdgcn -mcpu=bonaire -verify-machineinstrs < %s | FileCheck %s

; Intrinsics exercised by the tests in this file. Each call passes a metadata
; node whose string names the register to read; the i32 and i64 variants
; return the register contents as an integer of that width.
declare i32 @llvm.read_register.i32(metadata) #0
declare i64 @llvm.read_register.i64(metadata) #0

; Reads the register named by !0 ("m0") as an i32 and stores it to %out.
; The expected output begins with m0 being set to -1, then copies m0 through
; an SGPR into a VGPR before the store.
; NOTE(review): the volatile store to addrspace(3) is presumably what forces
; the backend to initialize m0 before the read -- confirm.
; FIXME: Should be able to eliminate copy
; CHECK-LABEL: {{^}}test_read_m0:
; CHECK: s_mov_b32 m0, -1
; CHECK: s_mov_b32 [[COPY_M0:s[0-9]+]], m0
; CHECK: v_mov_b32_e32 [[COPY:v[0-9]+]], [[COPY_M0]]
; CHECK: buffer_store_dword [[COPY]]
define amdgpu_kernel void @test_read_m0(i32 addrspace(1)* %out) #0 {
  store volatile i32 0, i32 addrspace(3)* undef
  %m0 = call i32 @llvm.read_register.i32(metadata !0)
  store i32 %m0, i32 addrspace(1)* %out
  ret void
}

; Reads the register named by !1 ("exec") as an i64 and stores it to %out.
; The expected output moves exec_lo and exec_hi into two VGPRs and stores
; that register pair with a single 64-bit buffer store.
; CHECK-LABEL: {{^}}test_read_exec:
; CHECK: v_mov_b32_e32 v[[LO:[0-9]+]], exec_lo
; CHECK: v_mov_b32_e32 v[[HI:[0-9]+]], exec_hi
; CHECK: buffer_store_dwordx2 v{{\[}}[[LO]]:[[HI]]{{\]}}
define amdgpu_kernel void @test_read_exec(i64 addrspace(1)* %out) #0 {
  %exec = call i64 @llvm.read_register.i64(metadata !1)
  store i64 %exec, i64 addrspace(1)* %out
  ret void
}

; Reads the register named by !2 ("flat_scratch") as an i64 and stores it to
; %out. The expected output moves flat_scratch_lo and flat_scratch_hi into two
; VGPRs and stores that register pair with a single 64-bit buffer store.
; CHECK-LABEL: {{^}}test_read_flat_scratch:
; CHECK: v_mov_b32_e32 v[[LO:[0-9]+]], flat_scratch_lo
; CHECK: v_mov_b32_e32 v[[HI:[0-9]+]], flat_scratch_hi
; CHECK: buffer_store_dwordx2 v{{\[}}[[LO]]:[[HI]]{{\]}}
define amdgpu_kernel void @test_read_flat_scratch(i64 addrspace(1)* %out) #0 {
  %flat_scratch = call i64 @llvm.read_register.i64(metadata !2)
  store i64 %flat_scratch, i64 addrspace(1)* %out
  ret void
}

; Reads the register named by !3 ("flat_scratch_lo") as an i32 and stores it
; to %out. The expected output is one move into a VGPR followed by a 32-bit
; buffer store of that VGPR.
; CHECK-LABEL: {{^}}test_read_flat_scratch_lo:
; CHECK: v_mov_b32_e32 [[COPY:v[0-9]+]], flat_scratch_lo
; CHECK: buffer_store_dword [[COPY]]
define amdgpu_kernel void @test_read_flat_scratch_lo(i32 addrspace(1)* %out) #0 {
  %flat_scratch_lo = call i32 @llvm.read_register.i32(metadata !3)
  store i32 %flat_scratch_lo, i32 addrspace(1)* %out
  ret void
}

; Reads the register named by !4 ("flat_scratch_hi") as an i32 and stores it
; to %out. The expected output is one move into a VGPR followed by a 32-bit
; buffer store of that VGPR.
; CHECK-LABEL: {{^}}test_read_flat_scratch_hi:
; CHECK: v_mov_b32_e32 [[COPY:v[0-9]+]], flat_scratch_hi
; CHECK: buffer_store_dword [[COPY]]
define amdgpu_kernel void @test_read_flat_scratch_hi(i32 addrspace(1)* %out) #0 {
  %flat_scratch_hi = call i32 @llvm.read_register.i32(metadata !4)
  store i32 %flat_scratch_hi, i32 addrspace(1)* %out
  ret void
}

; Reads the register named by !5 ("exec_lo") as an i32 and stores it to %out.
; The expected output is one move into a VGPR followed by a 32-bit buffer
; store of that VGPR.
; CHECK-LABEL: {{^}}test_read_exec_lo:
; CHECK: v_mov_b32_e32 [[COPY:v[0-9]+]], exec_lo
; CHECK: buffer_store_dword [[COPY]]
define amdgpu_kernel void @test_read_exec_lo(i32 addrspace(1)* %out) #0 {
  %exec_lo = call i32 @llvm.read_register.i32(metadata !5)
  store i32 %exec_lo, i32 addrspace(1)* %out
  ret void
}

; Reads the register named by !6 ("exec_hi") as an i32 and stores it to %out.
; The expected output is one move into a VGPR followed by a 32-bit buffer
; store of that VGPR.
; CHECK-LABEL: {{^}}test_read_exec_hi:
; CHECK: v_mov_b32_e32 [[COPY:v[0-9]+]], exec_hi
; CHECK: buffer_store_dword [[COPY]]
define amdgpu_kernel void @test_read_exec_hi(i32 addrspace(1)* %out) #0 {
  %exec_hi = call i32 @llvm.read_register.i32(metadata !6)
  store i32 %exec_hi, i32 addrspace(1)* %out
  ret void
}

; Attribute group applied to every declaration and kernel in this file.
attributes #0 = { nounwind }

; Register-name metadata nodes passed to llvm.read_register, one per test.
!0 = !{!"m0"}
!1 = !{!"exec"}
!2 = !{!"flat_scratch"}
!3 = !{!"flat_scratch_lo"}
!4 = !{!"flat_scratch_hi"}
!5 = !{!"exec_lo"}
!6 = !{!"exec_hi"}