; Mirror of https://github.com/RPCS3/llvm-mirror.git
; (synced 2024-11-24 03:33:20 +01:00), commit dd9ab77318.
;
; Commit message: Currently the default C calling convention functions are
; treated the same as compute kernels. Make this explicit so the default
; calling convention can be changed to a non-kernel. Converted with
; perl -pi -e 's/define void/define amdgpu_kernel void/' on the relevant test
; directories (and undoing in one place that actually wanted a non-kernel).
; llvm-svn: 298444
;
; File listing: 94 lines, 2.8 KiB, LLVM.
; RUN: llc -march=amdgcn -verify-machineinstrs < %s | FileCheck -check-prefix=SI %s
; RUN: llc -march=amdgcn -mcpu=tonga -mattr=-flat-for-global -verify-machineinstrs < %s | FileCheck -check-prefix=SI %s

; test_i64_eq: 64-bit integer equality compare.
; Compares the two i64 arguments with `icmp eq`, sign-extends the i1 result to
; i32 and stores it through %out. The generated code is expected to contain a
; v_cmp_eq_u64 instruction.
; SI-LABEL: {{^}}test_i64_eq:
; SI: v_cmp_eq_u64
define amdgpu_kernel void @test_i64_eq(i32 addrspace(1)* %out, i64 %a, i64 %b) nounwind {
  %cmp = icmp eq i64 %a, %b
  %result = sext i1 %cmp to i32            ; i1 true -> -1 (all ones), false -> 0
  store i32 %result, i32 addrspace(1)* %out, align 4
  ret void
}

; test_i64_ne: 64-bit integer inequality compare.
; Compares the two i64 arguments with `icmp ne`, sign-extends the i1 result to
; i32 and stores it through %out. The generated code is expected to contain a
; v_cmp_ne_u64 instruction.
; SI-LABEL: {{^}}test_i64_ne:
; SI: v_cmp_ne_u64
define amdgpu_kernel void @test_i64_ne(i32 addrspace(1)* %out, i64 %a, i64 %b) nounwind {
  %cmp = icmp ne i64 %a, %b
  %result = sext i1 %cmp to i32            ; i1 true -> -1 (all ones), false -> 0
  store i32 %result, i32 addrspace(1)* %out, align 4
  ret void
}

; test_i64_slt: 64-bit signed less-than compare.
; Compares the two i64 arguments with `icmp slt`, sign-extends the i1 result
; to i32 and stores it through %out. The generated code is expected to contain
; the signed form, v_cmp_lt_i64.
; SI-LABEL: {{^}}test_i64_slt:
; SI: v_cmp_lt_i64
define amdgpu_kernel void @test_i64_slt(i32 addrspace(1)* %out, i64 %a, i64 %b) nounwind {
  %cmp = icmp slt i64 %a, %b
  %result = sext i1 %cmp to i32            ; i1 true -> -1 (all ones), false -> 0
  store i32 %result, i32 addrspace(1)* %out, align 4
  ret void
}

; test_i64_ult: 64-bit unsigned less-than compare.
; Compares the two i64 arguments with `icmp ult`, sign-extends the i1 result
; to i32 and stores it through %out. The generated code is expected to contain
; the unsigned form, v_cmp_lt_u64.
; SI-LABEL: {{^}}test_i64_ult:
; SI: v_cmp_lt_u64
define amdgpu_kernel void @test_i64_ult(i32 addrspace(1)* %out, i64 %a, i64 %b) nounwind {
  %cmp = icmp ult i64 %a, %b
  %result = sext i1 %cmp to i32            ; i1 true -> -1 (all ones), false -> 0
  store i32 %result, i32 addrspace(1)* %out, align 4
  ret void
}

; test_i64_sle: 64-bit signed less-than-or-equal compare.
; Compares the two i64 arguments with `icmp sle`, sign-extends the i1 result
; to i32 and stores it through %out. The generated code is expected to contain
; the signed form, v_cmp_le_i64.
; SI-LABEL: {{^}}test_i64_sle:
; SI: v_cmp_le_i64
define amdgpu_kernel void @test_i64_sle(i32 addrspace(1)* %out, i64 %a, i64 %b) nounwind {
  %cmp = icmp sle i64 %a, %b
  %result = sext i1 %cmp to i32            ; i1 true -> -1 (all ones), false -> 0
  store i32 %result, i32 addrspace(1)* %out, align 4
  ret void
}

; test_i64_ule: 64-bit unsigned less-than-or-equal compare.
; Compares the two i64 arguments with `icmp ule`, sign-extends the i1 result
; to i32 and stores it through %out. The generated code is expected to contain
; the unsigned form, v_cmp_le_u64.
; SI-LABEL: {{^}}test_i64_ule:
; SI: v_cmp_le_u64
define amdgpu_kernel void @test_i64_ule(i32 addrspace(1)* %out, i64 %a, i64 %b) nounwind {
  %cmp = icmp ule i64 %a, %b
  %result = sext i1 %cmp to i32            ; i1 true -> -1 (all ones), false -> 0
  store i32 %result, i32 addrspace(1)* %out, align 4
  ret void
}

; test_i64_sgt: 64-bit signed greater-than compare.
; Compares the two i64 arguments with `icmp sgt`, sign-extends the i1 result
; to i32 and stores it through %out. The generated code is expected to contain
; the signed form, v_cmp_gt_i64.
; SI-LABEL: {{^}}test_i64_sgt:
; SI: v_cmp_gt_i64
define amdgpu_kernel void @test_i64_sgt(i32 addrspace(1)* %out, i64 %a, i64 %b) nounwind {
  %cmp = icmp sgt i64 %a, %b
  %result = sext i1 %cmp to i32            ; i1 true -> -1 (all ones), false -> 0
  store i32 %result, i32 addrspace(1)* %out, align 4
  ret void
}

; test_i64_ugt: 64-bit unsigned greater-than compare.
; Compares the two i64 arguments with `icmp ugt`, sign-extends the i1 result
; to i32 and stores it through %out. The generated code is expected to contain
; the unsigned form, v_cmp_gt_u64.
; SI-LABEL: {{^}}test_i64_ugt:
; SI: v_cmp_gt_u64
define amdgpu_kernel void @test_i64_ugt(i32 addrspace(1)* %out, i64 %a, i64 %b) nounwind {
  %cmp = icmp ugt i64 %a, %b
  %result = sext i1 %cmp to i32            ; i1 true -> -1 (all ones), false -> 0
  store i32 %result, i32 addrspace(1)* %out, align 4
  ret void
}

; test_i64_sge: 64-bit signed greater-than-or-equal compare.
; Compares the two i64 arguments with `icmp sge`, sign-extends the i1 result
; to i32 and stores it through %out. The generated code is expected to contain
; the signed form, v_cmp_ge_i64.
; SI-LABEL: {{^}}test_i64_sge:
; SI: v_cmp_ge_i64
define amdgpu_kernel void @test_i64_sge(i32 addrspace(1)* %out, i64 %a, i64 %b) nounwind {
  %cmp = icmp sge i64 %a, %b
  %result = sext i1 %cmp to i32            ; i1 true -> -1 (all ones), false -> 0
  store i32 %result, i32 addrspace(1)* %out, align 4
  ret void
}

; test_i64_uge: 64-bit unsigned greater-than-or-equal compare.
; Compares the two i64 arguments with `icmp uge`, sign-extends the i1 result
; to i32 and stores it through %out. The generated code is expected to contain
; the unsigned form, v_cmp_ge_u64.
; SI-LABEL: {{^}}test_i64_uge:
; SI: v_cmp_ge_u64
define amdgpu_kernel void @test_i64_uge(i32 addrspace(1)* %out, i64 %a, i64 %b) nounwind {
  %cmp = icmp uge i64 %a, %b
  %result = sext i1 %cmp to i32            ; i1 true -> -1 (all ones), false -> 0
  store i32 %result, i32 addrspace(1)* %out, align 4
  ret void
}