mirror of
https://github.com/RPCS3/llvm-mirror.git
synced 2024-11-23 11:13:28 +01:00
a0cd02ace9
Summary: ... and after all that refactoring, it's possible to distinguish softfloat floating point values from integers so this patch no longer breaks softfloat to do it. Remove direct handling of i32's in the N32/N64 ABI by promoting them to i64. This more closely reflects the ABI documentation and also fixes problems with stack arguments on big-endian targets. We now rely on signext/zeroext annotations (already generated by clang) and the Assert[SZ]ext nodes to avoid the introduction of unnecessary sign/zero extends. It was not possible to convert three tests to use signext/zeroext. These tests are bswap.ll, ctlz-v.ll, ctlz-v.ll. It's not possible to put signext on a vector type so we just accept the sign extends here for now. These tests don't pass the vectors the same way clang does (clang puts multiple elements in the same argument, these map 1 element to 1 argument) so we don't need to worry too much about it. With this patch, all known N32/N64 bugs should be fixed and we now pass the first 10,000 tests generated by ABITest.py. Subscribers: llvm-commits Differential Revision: http://reviews.llvm.org/D6117 llvm-svn: 221534
389 lines
10 KiB
LLVM
389 lines
10 KiB
LLVM
; RUN: llc -march=mips -mcpu=mips32 -verify-machineinstrs < %s | FileCheck %s -check-prefix=ALL -check-prefix=ACC32 -check-prefix=ACC32-TRAP
|
|
; RUN: llc -march=mips -mcpu=mips32r2 -verify-machineinstrs < %s | FileCheck %s -check-prefix=ALL -check-prefix=ACC32 -check-prefix=ACC32-TRAP
|
|
; RUN: llc -march=mips -mcpu=mips32r6 -verify-machineinstrs < %s | FileCheck %s -check-prefix=ALL -check-prefix=GPR32 -check-prefix=GPR32-TRAP
|
|
; RUN: llc -march=mips64 -mcpu=mips64 -verify-machineinstrs < %s | FileCheck %s -check-prefix=ALL -check-prefix=ACC64 -check-prefix=ACC64-TRAP
|
|
; RUN: llc -march=mips64 -mcpu=mips64r2 -verify-machineinstrs < %s | FileCheck %s -check-prefix=ALL -check-prefix=ACC64 -check-prefix=ACC64-TRAP
|
|
; RUN: llc -march=mips64 -mcpu=mips64r6 -verify-machineinstrs < %s | FileCheck %s -check-prefix=ALL -check-prefix=GPR64 -check-prefix=GPR64-TRAP
|
|
|
|
; RUN: llc -march=mips -mcpu=mips32 -mno-check-zero-division < %s | FileCheck %s -check-prefix=ALL -check-prefix=ACC32 -check-prefix=NOCHECK
|
|
; RUN: llc -march=mips -mcpu=mips32r2 -mno-check-zero-division < %s | FileCheck %s -check-prefix=ALL -check-prefix=ACC32 -check-prefix=NOCHECK
|
|
; RUN: llc -march=mips -mcpu=mips32r6 -mno-check-zero-division < %s | FileCheck %s -check-prefix=ALL -check-prefix=GPR32 -check-prefix=NOCHECK
|
|
; RUN: llc -march=mips64 -mcpu=mips64 -mno-check-zero-division < %s | FileCheck %s -check-prefix=ALL -check-prefix=ACC64 -check-prefix=NOCHECK
|
|
; RUN: llc -march=mips64 -mcpu=mips64r2 -mno-check-zero-division < %s | FileCheck %s -check-prefix=ALL -check-prefix=ACC64 -check-prefix=NOCHECK
|
|
; RUN: llc -march=mips64 -mcpu=mips64r6 -mno-check-zero-division < %s | FileCheck %s -check-prefix=ALL -check-prefix=GPR64 -check-prefix=NOCHECK
|
|
|
|
; FileCheck Prefixes:
|
|
; ALL - All targets
|
|
; ACC32 - Accumulator based multiply/divide on 32-bit targets
|
|
; ACC64 - Same as ACC32 but only for 64-bit targets
|
|
; GPR32 - GPR based multiply/divide on 32-bit targets
|
|
; GPR64 - Same as GPR32 but only for 64-bit targets
|
|
; ACC32-TRAP - Same as TRAP and ACC32 combined
|
|
; ACC64-TRAP - Same as TRAP and ACC64 combined
|
|
; GPR32-TRAP - Same as TRAP and GPR32 combined
|
|
; GPR64-TRAP - Same as TRAP and GPR64 combined
|
|
; NOCHECK - Division by zero will not be detected
|
|
|
|
@g0 = common global i32 0, align 4
|
|
@g1 = common global i32 0, align 4
|
|
|
|
define i32 @sdiv1(i32 signext %a0, i32 signext %a1) nounwind readnone {
|
|
entry:
|
|
; ALL-LABEL: sdiv1:
|
|
|
|
; ACC32: div $zero, $4, $5
|
|
; ACC32-TRAP: teq $5, $zero, 7
|
|
|
|
; ACC64: div $zero, $4, $5
|
|
; ACC64-TRAP: teq $5, $zero, 7
|
|
|
|
; GPR32: div $2, $4, $5
|
|
; GPR32-TRAP: teq $5, $zero, 7
|
|
|
|
; GPR64: div $2, $4, $5
|
|
; GPR64-TRAP: teq $5, $zero, 7
|
|
|
|
; NOCHECK-NOT: teq
|
|
|
|
; ACC32: mflo $2
|
|
; ACC64: mflo $2
|
|
|
|
; ALL: .end sdiv1
|
|
|
|
%div = sdiv i32 %a0, %a1
|
|
ret i32 %div
|
|
}
|
|
|
|
define i32 @srem1(i32 signext %a0, i32 signext %a1) nounwind readnone {
|
|
entry:
|
|
; ALL-LABEL: srem1:
|
|
|
|
; ACC32: div $zero, $4, $5
|
|
; ACC32-TRAP: teq $5, $zero, 7
|
|
|
|
; ACC64: div $zero, $4, $5
|
|
; ACC64-TRAP: teq $5, $zero, 7
|
|
|
|
; GPR32: mod $2, $4, $5
|
|
; GPR32-TRAP: teq $5, $zero, 7
|
|
|
|
; GPR64: mod $2, $4, $5
|
|
; GPR64-TRAP: teq $5, $zero, 7
|
|
|
|
; NOCHECK-NOT: teq
|
|
|
|
; ACC32: mfhi $2
|
|
; ACC64: mfhi $2
|
|
|
|
; ALL: .end srem1
|
|
|
|
%rem = srem i32 %a0, %a1
|
|
ret i32 %rem
|
|
}
|
|
|
|
define i32 @udiv1(i32 zeroext %a0, i32 zeroext %a1) nounwind readnone {
|
|
entry:
|
|
; ALL-LABEL: udiv1:
|
|
|
|
; ACC32: divu $zero, $4, $5
|
|
; ACC32-TRAP: teq $5, $zero, 7
|
|
|
|
; ACC64: divu $zero, $4, $5
|
|
; ACC64-TRAP: teq $5, $zero, 7
|
|
|
|
; GPR32: divu $2, $4, $5
|
|
; GPR32-TRAP: teq $5, $zero, 7
|
|
|
|
; GPR64: divu $2, $4, $5
|
|
; GPR64-TRAP: teq $5, $zero, 7
|
|
|
|
; NOCHECK-NOT: teq
|
|
|
|
; ACC32: mflo $2
|
|
; ACC64: mflo $2
|
|
|
|
; ALL: .end udiv1
|
|
%div = udiv i32 %a0, %a1
|
|
ret i32 %div
|
|
}
|
|
|
|
define i32 @urem1(i32 zeroext %a0, i32 zeroext %a1) nounwind readnone {
|
|
entry:
|
|
; ALL-LABEL: urem1:
|
|
|
|
; ACC32: divu $zero, $4, $5
|
|
; ACC32-TRAP: teq $5, $zero, 7
|
|
|
|
; ACC64: divu $zero, $4, $5
|
|
; ACC64-TRAP: teq $5, $zero, 7
|
|
|
|
; GPR32: modu $2, $4, $5
|
|
; GPR32-TRAP: teq $5, $zero, 7
|
|
|
|
; GPR64: modu $2, $4, $5
|
|
; GPR64-TRAP: teq $5, $zero, 7
|
|
|
|
; NOCHECK-NOT: teq
|
|
|
|
; ACC32: mfhi $2
|
|
; ACC64: mfhi $2
|
|
|
|
; ALL: .end urem1
|
|
|
|
%rem = urem i32 %a0, %a1
|
|
ret i32 %rem
|
|
}
|
|
|
|
define i32 @sdivrem1(i32 signext %a0, i32 signext %a1, i32* nocapture %r) nounwind {
|
|
entry:
|
|
; ALL-LABEL: sdivrem1:
|
|
|
|
; ACC32: div $zero, $4, $5
|
|
; ACC32-TRAP: teq $5, $zero, 7
|
|
; NOCHECK-NOT: teq
|
|
; ACC32: mflo $2
|
|
; ACC32: mfhi $[[R0:[0-9]+]]
|
|
; ACC32: sw $[[R0]], 0(${{[0-9]+}})
|
|
|
|
; ACC64: div $zero, $4, $5
|
|
; ACC64-TRAP: teq $5, $zero, 7
|
|
; NOCHECK-NOT: teq
|
|
; ACC64: mflo $2
|
|
; ACC64: mfhi $[[R0:[0-9]+]]
|
|
; ACC64: sw $[[R0]], 0(${{[0-9]+}})
|
|
|
|
; GPR32: mod $[[R0:[0-9]+]], $4, $5
|
|
; GPR32-TRAP: teq $5, $zero, 7
|
|
; NOCHECK-NOT: teq
|
|
; GPR32: sw $[[R0]], 0(${{[0-9]+}})
|
|
; GPR32-DAG: div $2, $4, $5
|
|
; GPR32-TRAP: teq $5, $zero, 7
|
|
|
|
; GPR64: mod $[[R0:[0-9]+]], $4, $5
|
|
; GPR64-TRAP: teq $5, $zero, 7
|
|
; NOCHECK-NOT: teq
|
|
; GPR64: sw $[[R0]], 0(${{[0-9]+}})
|
|
; GPR64-DAG: div $2, $4, $5
|
|
; GPR64-TRAP: teq $5, $zero, 7
|
|
; NOCHECK-NOT: teq
|
|
|
|
; ALL: .end sdivrem1
|
|
|
|
%rem = srem i32 %a0, %a1
|
|
store i32 %rem, i32* %r, align 4
|
|
%div = sdiv i32 %a0, %a1
|
|
ret i32 %div
|
|
}
|
|
|
|
define i32 @udivrem1(i32 zeroext %a0, i32 zeroext %a1, i32* nocapture %r) nounwind {
|
|
entry:
|
|
; ALL-LABEL: udivrem1:
|
|
|
|
; ACC32: divu $zero, $4, $5
|
|
; ACC32-TRAP: teq $5, $zero, 7
|
|
; NOCHECK-NOT: teq
|
|
; ACC32: mflo $2
|
|
; ACC32: mfhi $[[R0:[0-9]+]]
|
|
; ACC32: sw $[[R0]], 0(${{[0-9]+}})
|
|
|
|
; ACC64: divu $zero, $4, $5
|
|
; ACC64-TRAP: teq $5, $zero, 7
|
|
; NOCHECK-NOT: teq
|
|
; ACC64: mflo $2
|
|
; ACC64: mfhi $[[R0:[0-9]+]]
|
|
; ACC64: sw $[[R0]], 0(${{[0-9]+}})
|
|
|
|
; GPR32: modu $[[R0:[0-9]+]], $4, $5
|
|
; GPR32-TRAP: teq $5, $zero, 7
|
|
; NOCHECK-NOT: teq
|
|
; GPR32: sw $[[R0]], 0(${{[0-9]+}})
|
|
; GPR32-DAG: divu $2, $4, $5
|
|
; GPR32-TRAP: teq $5, $zero, 7
|
|
; NOCHECK-NOT: teq
|
|
|
|
; GPR64: modu $[[R0:[0-9]+]], $4, $5
|
|
; GPR64-TRAP: teq $5, $zero, 7
|
|
; NOCHECK-NOT: teq
|
|
; GPR64: sw $[[R0]], 0(${{[0-9]+}})
|
|
; GPR64-DAG: divu $2, $4, $5
|
|
; GPR64-TRAP: teq $5, $zero, 7
|
|
; NOCHECK-NOT: teq
|
|
|
|
; ALL: .end udivrem1
|
|
|
|
%rem = urem i32 %a0, %a1
|
|
store i32 %rem, i32* %r, align 4
|
|
%div = udiv i32 %a0, %a1
|
|
ret i32 %div
|
|
}
|
|
|
|
; FIXME: It's not clear what this is supposed to test.
|
|
define i32 @killFlags() {
|
|
entry:
|
|
%0 = load i32* @g0, align 4
|
|
%1 = load i32* @g1, align 4
|
|
%div = sdiv i32 %0, %1
|
|
ret i32 %div
|
|
}
|
|
|
|
define i64 @sdiv2(i64 %a0, i64 %a1) nounwind readnone {
|
|
entry:
|
|
; ALL-LABEL: sdiv2:
|
|
|
|
; ACC32: lw $25, %call16(__divdi3)(
|
|
; ACC32: jalr $25
|
|
|
|
; ACC64: ddiv $zero, $4, $5
|
|
; ACC64-TRAP: teq $5, $zero, 7
|
|
|
|
; GPR64: ddiv $2, $4, $5
|
|
; GPR64-TRAP: teq $5, $zero, 7
|
|
|
|
; NOCHECK-NOT: teq
|
|
|
|
; ACC64: mflo $2
|
|
|
|
; ALL: .end sdiv2
|
|
|
|
%div = sdiv i64 %a0, %a1
|
|
ret i64 %div
|
|
}
|
|
|
|
define i64 @srem2(i64 %a0, i64 %a1) nounwind readnone {
|
|
entry:
|
|
; ALL-LABEL: srem2:
|
|
|
|
; ACC32: lw $25, %call16(__moddi3)(
|
|
; ACC32: jalr $25
|
|
|
|
; ACC64: div $zero, $4, $5
|
|
; ACC64-TRAP: teq $5, $zero, 7
|
|
|
|
; GPR64: dmod $2, $4, $5
|
|
; GPR64-TRAP: teq $5, $zero, 7
|
|
|
|
; NOCHECK-NOT: teq
|
|
|
|
; ACC64: mfhi $2
|
|
|
|
; ALL: .end srem2
|
|
|
|
%rem = srem i64 %a0, %a1
|
|
ret i64 %rem
|
|
}
|
|
|
|
define i64 @udiv2(i64 %a0, i64 %a1) nounwind readnone {
|
|
entry:
|
|
; ALL-LABEL: udiv2:
|
|
|
|
; ACC32: lw $25, %call16(__udivdi3)(
|
|
; ACC32: jalr $25
|
|
|
|
; ACC64: divu $zero, $4, $5
|
|
; ACC64-TRAP: teq $5, $zero, 7
|
|
|
|
; GPR64: ddivu $2, $4, $5
|
|
; GPR64-TRAP: teq $5, $zero, 7
|
|
|
|
; NOCHECK-NOT: teq
|
|
|
|
; ACC64: mflo $2
|
|
|
|
; ALL: .end udiv2
|
|
%div = udiv i64 %a0, %a1
|
|
ret i64 %div
|
|
}
|
|
|
|
define i64 @urem2(i64 %a0, i64 %a1) nounwind readnone {
|
|
entry:
|
|
; ALL-LABEL: urem2:
|
|
|
|
; ACC32: lw $25, %call16(__umoddi3)(
|
|
; ACC32: jalr $25
|
|
|
|
; ACC64: divu $zero, $4, $5
|
|
; ACC64-TRAP: teq $5, $zero, 7
|
|
|
|
; GPR64: dmodu $2, $4, $5
|
|
; GPR64-TRAP: teq $5, $zero, 7
|
|
|
|
; NOCHECK-NOT: teq
|
|
|
|
; ACC64: mfhi $2
|
|
|
|
; ALL: .end urem2
|
|
|
|
%rem = urem i64 %a0, %a1
|
|
ret i64 %rem
|
|
}
|
|
|
|
define i64 @sdivrem2(i64 %a0, i64 %a1, i64* nocapture %r) nounwind {
|
|
entry:
|
|
; ALL-LABEL: sdivrem2:
|
|
|
|
; sdivrem2 is too complex to effectively check. We can at least check for the
|
|
; calls though.
|
|
; ACC32: lw $25, %call16(__moddi3)(
|
|
; ACC32: jalr $25
|
|
; ACC32: lw $25, %call16(__divdi3)(
|
|
; ACC32: jalr $25
|
|
|
|
; ACC64: ddiv $zero, $4, $5
|
|
; ACC64-TRAP: teq $5, $zero, 7
|
|
; NOCHECK-NOT: teq
|
|
; ACC64: mflo $2
|
|
; ACC64: mfhi $[[R0:[0-9]+]]
|
|
; ACC64: sd $[[R0]], 0(${{[0-9]+}})
|
|
|
|
; GPR64: dmod $[[R0:[0-9]+]], $4, $5
|
|
; GPR64-TRAP: teq $5, $zero, 7
|
|
; NOCHECK-NOT: teq
|
|
; GPR64: sd $[[R0]], 0(${{[0-9]+}})
|
|
|
|
; GPR64-DAG: ddiv $2, $4, $5
|
|
; GPR64-TRAP: teq $5, $zero, 7
|
|
; NOCHECK-NOT: teq
|
|
|
|
; ALL: .end sdivrem2
|
|
|
|
%rem = srem i64 %a0, %a1
|
|
store i64 %rem, i64* %r, align 8
|
|
%div = sdiv i64 %a0, %a1
|
|
ret i64 %div
|
|
}
|
|
|
|
define i64 @udivrem2(i64 %a0, i64 %a1, i64* nocapture %r) nounwind {
|
|
entry:
|
|
; ALL-LABEL: udivrem2:
|
|
|
|
; udivrem2 is too complex to effectively check. We can at least check for the
|
|
; calls though.
|
|
; ACC32: lw $25, %call16(__umoddi3)(
|
|
; ACC32: jalr $25
|
|
; ACC32: lw $25, %call16(__udivdi3)(
|
|
; ACC32: jalr $25
|
|
|
|
; ACC64: ddivu $zero, $4, $5
|
|
; ACC64-TRAP: teq $5, $zero, 7
|
|
; NOCHECK-NOT: teq
|
|
; ACC64: mflo $2
|
|
; ACC64: mfhi $[[R0:[0-9]+]]
|
|
; ACC64: sd $[[R0]], 0(${{[0-9]+}})
|
|
|
|
; GPR64: dmodu $[[R0:[0-9]+]], $4, $5
|
|
; GPR64-TRAP: teq $5, $zero, 7
|
|
; NOCHECK-NOT: teq
|
|
; GPR64: sd $[[R0]], 0(${{[0-9]+}})
|
|
|
|
; GPR64-DAG: ddivu $2, $4, $5
|
|
; GPR64-TRAP: teq $5, $zero, 7
|
|
; NOCHECK-NOT: teq
|
|
|
|
; ALL: .end udivrem2
|
|
|
|
%rem = urem i64 %a0, %a1
|
|
store i64 %rem, i64* %r, align 8
|
|
%div = udiv i64 %a0, %a1
|
|
ret i64 %div
|
|
}
|