mirror of
https://github.com/RPCS3/llvm-mirror.git
synced 2024-11-01 16:33:37 +01:00
44b06b0096
llvm-svn: 144990
171 lines
5.4 KiB
LLVM
171 lines
5.4 KiB
LLVM
; RUN: llc < %s -march=x86-64 -mattr=+ssse3,-avx | FileCheck %s -check-prefix=SSSE3
|
|
; RUN: llc < %s -march=x86-64 -mattr=-ssse3,+avx | FileCheck %s -check-prefix=AVX
|
|
|
|
; phaddw1 - canonical horizontal add of two <8 x i16> vectors.
; %a holds the even-numbered elements of the concatenation x:y and %b the
; odd-numbered ones, so %r = <x0+x1, x2+x3, x4+x5, x6+x7, y0+y1, y2+y3,
; y4+y5, y6+y7>.
; The instruction checks require an xmm operand after the mnemonic; a bare
; mnemonic is a substring of the symbol name and would match the label or
; its trailing comment even when no horizontal add was selected.
; SSSE3: phaddw1:
; SSSE3-NOT: vphaddw
; SSSE3: phaddw {{.*}}%xmm
; AVX: phaddw1:
; AVX: vphaddw {{.*}}%xmm
define <8 x i16> @phaddw1(<8 x i16> %x, <8 x i16> %y) {
  %a = shufflevector <8 x i16> %x, <8 x i16> %y, <8 x i32> <i32 0, i32 2, i32 4, i32 6, i32 8, i32 10, i32 12, i32 14>
  %b = shufflevector <8 x i16> %x, <8 x i16> %y, <8 x i32> <i32 1, i32 3, i32 5, i32 7, i32 9, i32 11, i32 13, i32 15>
  %r = add <8 x i16> %a, %b
  ret <8 x i16> %r
}
|
|
|
|
; phaddw2 - horizontal add of <8 x i16> with permuted pair members.
; %a = <x1, x2, x5, x6, y1, y2, y5, y6>. The second shuffle takes its inputs
; in the order (y, x), so indices 8..15 select from x and 0..7 from y:
; %b = <x0, x3, x4, x7, y0, y3, y4, y7>. Each lane of %r is still the sum of
; one adjacent pair (x0+x1, x2+x3, ...), only the side of the add on which
; each member appears varies; add is commutative, so this is the same
; horizontal add as phaddw1.
; The instruction checks require an xmm operand after the mnemonic; a bare
; mnemonic is a substring of the symbol name and would match the label or
; its trailing comment even when no horizontal add was selected.
; SSSE3: phaddw2:
; SSSE3-NOT: vphaddw
; SSSE3: phaddw {{.*}}%xmm
; AVX: phaddw2:
; AVX: vphaddw {{.*}}%xmm
define <8 x i16> @phaddw2(<8 x i16> %x, <8 x i16> %y) {
  %a = shufflevector <8 x i16> %x, <8 x i16> %y, <8 x i32> <i32 1, i32 2, i32 5, i32 6, i32 9, i32 10, i32 13, i32 14>
  %b = shufflevector <8 x i16> %y, <8 x i16> %x, <8 x i32> <i32 8, i32 11, i32 12, i32 15, i32 0, i32 3, i32 4, i32 7>
  %r = add <8 x i16> %a, %b
  ret <8 x i16> %r
}
|
|
|
|
; phaddd1 - canonical horizontal add of two <4 x i32> vectors.
; %a = <x0, x2, y0, y2> and %b = <x1, x3, y1, y3>, so
; %r = <x0+x1, x2+x3, y0+y1, y2+y3>.
; The instruction checks require an xmm operand after the mnemonic; a bare
; mnemonic is a substring of the symbol name and would match the label or
; its trailing comment even when no horizontal add was selected.
; SSSE3: phaddd1:
; SSSE3-NOT: vphaddd
; SSSE3: phaddd {{.*}}%xmm
; AVX: phaddd1:
; AVX: vphaddd {{.*}}%xmm
define <4 x i32> @phaddd1(<4 x i32> %x, <4 x i32> %y) {
  %a = shufflevector <4 x i32> %x, <4 x i32> %y, <4 x i32> <i32 0, i32 2, i32 4, i32 6>
  %b = shufflevector <4 x i32> %x, <4 x i32> %y, <4 x i32> <i32 1, i32 3, i32 5, i32 7>
  %r = add <4 x i32> %a, %b
  ret <4 x i32> %r
}
|
|
|
|
; phaddd2 - horizontal add of <4 x i32> with permuted pair members.
; %a = <x1, x2, y1, y2>. The second shuffle takes its inputs in the order
; (y, x), so indices 4..7 select from x and 0..3 from y:
; %b = <x0, x3, y0, y3>. Hence %r = <x1+x0, x2+x3, y1+y0, y2+y3>, which is
; the same set of adjacent-pair sums as phaddd1 because add is commutative.
; The instruction checks require an xmm operand after the mnemonic; a bare
; mnemonic is a substring of the symbol name and would match the label or
; its trailing comment even when no horizontal add was selected.
; SSSE3: phaddd2:
; SSSE3-NOT: vphaddd
; SSSE3: phaddd {{.*}}%xmm
; AVX: phaddd2:
; AVX: vphaddd {{.*}}%xmm
define <4 x i32> @phaddd2(<4 x i32> %x, <4 x i32> %y) {
  %a = shufflevector <4 x i32> %x, <4 x i32> %y, <4 x i32> <i32 1, i32 2, i32 5, i32 6>
  %b = shufflevector <4 x i32> %y, <4 x i32> %x, <4 x i32> <i32 4, i32 7, i32 0, i32 3>
  %r = add <4 x i32> %a, %b
  ret <4 x i32> %r
}
|
|
|
|
; phaddd3 - single-input horizontal add with partially undefined masks.
; Lane 0 of both masks is undef, and indices 4..7 select from the undef
; second shuffle operand, so only lane 1 of %r (x2 + x3) is fully defined.
; A horizontal add is still expected to be selected.
; The instruction checks require an xmm operand after the mnemonic; a bare
; mnemonic is a substring of the symbol name and would match the label or
; its trailing comment even when no horizontal add was selected.
; SSSE3: phaddd3:
; SSSE3-NOT: vphaddd
; SSSE3: phaddd {{.*}}%xmm
; AVX: phaddd3:
; AVX: vphaddd {{.*}}%xmm
define <4 x i32> @phaddd3(<4 x i32> %x) {
  %a = shufflevector <4 x i32> %x, <4 x i32> undef, <4 x i32> <i32 undef, i32 2, i32 4, i32 6>
  %b = shufflevector <4 x i32> %x, <4 x i32> undef, <4 x i32> <i32 undef, i32 3, i32 5, i32 7>
  %r = add <4 x i32> %a, %b
  ret <4 x i32> %r
}
|
|
|
|
; phaddd4 - single-input horizontal add, upper half undefined.
; %a = <x0, x2, undef, undef> and %b = <x1, x3, undef, undef>, so the low
; two lanes of %r are x0+x1 and x2+x3 and the high two lanes are undefined.
; The instruction checks require an xmm operand after the mnemonic; a bare
; mnemonic is a substring of the symbol name and would match the label or
; its trailing comment even when no horizontal add was selected.
; SSSE3: phaddd4:
; SSSE3-NOT: vphaddd
; SSSE3: phaddd {{.*}}%xmm
; AVX: phaddd4:
; AVX: vphaddd {{.*}}%xmm
define <4 x i32> @phaddd4(<4 x i32> %x) {
  %a = shufflevector <4 x i32> %x, <4 x i32> undef, <4 x i32> <i32 0, i32 2, i32 undef, i32 undef>
  %b = shufflevector <4 x i32> %x, <4 x i32> undef, <4 x i32> <i32 1, i32 3, i32 undef, i32 undef>
  %r = add <4 x i32> %a, %b
  ret <4 x i32> %r
}
|
|
|
|
; phaddd5 - single-input horizontal add, pair members swapped in lane 1.
; %a = <x0, x3, undef, undef> and %b = <x1, x2, undef, undef>, so the low
; two lanes of %r are x0+x1 and x3+x2; lane 1 has its pair members on the
; opposite sides of the add compared with phaddd4. The high two lanes are
; undefined.
; The instruction checks require an xmm operand after the mnemonic; a bare
; mnemonic is a substring of the symbol name and would match the label or
; its trailing comment even when no horizontal add was selected.
; SSSE3: phaddd5:
; SSSE3-NOT: vphaddd
; SSSE3: phaddd {{.*}}%xmm
; AVX: phaddd5:
; AVX: vphaddd {{.*}}%xmm
define <4 x i32> @phaddd5(<4 x i32> %x) {
  %a = shufflevector <4 x i32> %x, <4 x i32> undef, <4 x i32> <i32 0, i32 3, i32 undef, i32 undef>
  %b = shufflevector <4 x i32> %x, <4 x i32> undef, <4 x i32> <i32 1, i32 2, i32 undef, i32 undef>
  %r = add <4 x i32> %a, %b
  ret <4 x i32> %r
}
|
|
|
|
; phaddd6 - single-input horizontal add with only lane 0 defined.
; %a = <x0, undef, undef, undef> and %b = <x1, undef, undef, undef>, so
; lane 0 of %r is x0+x1 and every other lane is undefined.
; The instruction checks require an xmm operand after the mnemonic; a bare
; mnemonic is a substring of the symbol name and would match the label or
; its trailing comment even when no horizontal add was selected.
; SSSE3: phaddd6:
; SSSE3-NOT: vphaddd
; SSSE3: phaddd {{.*}}%xmm
; AVX: phaddd6:
; AVX: vphaddd {{.*}}%xmm
define <4 x i32> @phaddd6(<4 x i32> %x) {
  %a = shufflevector <4 x i32> %x, <4 x i32> undef, <4 x i32> <i32 0, i32 undef, i32 undef, i32 undef>
  %b = shufflevector <4 x i32> %x, <4 x i32> undef, <4 x i32> <i32 1, i32 undef, i32 undef, i32 undef>
  %r = add <4 x i32> %a, %b
  ret <4 x i32> %r
}
|
|
|
|
; phaddd7 - single-input horizontal add with only lane 1 defined, swapped.
; %a = <undef, x3, undef, undef> and %b = <undef, x2, undef, undef>, so
; lane 1 of %r is x3+x2 (pair members on swapped sides of the add) and
; every other lane is undefined.
; The instruction checks require an xmm operand after the mnemonic; a bare
; mnemonic is a substring of the symbol name and would match the label or
; its trailing comment even when no horizontal add was selected.
; SSSE3: phaddd7:
; SSSE3-NOT: vphaddd
; SSSE3: phaddd {{.*}}%xmm
; AVX: phaddd7:
; AVX: vphaddd {{.*}}%xmm
define <4 x i32> @phaddd7(<4 x i32> %x) {
  %a = shufflevector <4 x i32> %x, <4 x i32> undef, <4 x i32> <i32 undef, i32 3, i32 undef, i32 undef>
  %b = shufflevector <4 x i32> %x, <4 x i32> undef, <4 x i32> <i32 undef, i32 2, i32 undef, i32 undef>
  %r = add <4 x i32> %a, %b
  ret <4 x i32> %r
}
|
|
|
|
; phsubw1 - canonical horizontal subtract of two <8 x i16> vectors.
; %a holds the even-numbered elements of the concatenation x:y and %b the
; odd-numbered ones, so %r = <x0-x1, x2-x3, x4-x5, x6-x7, y0-y1, y2-y3,
; y4-y5, y6-y7>.
; The instruction checks require an xmm operand after the mnemonic; a bare
; mnemonic is a substring of the symbol name and would match the label or
; its trailing comment even when no horizontal subtract was selected.
; SSSE3: phsubw1:
; SSSE3-NOT: vphsubw
; SSSE3: phsubw {{.*}}%xmm
; AVX: phsubw1:
; AVX: vphsubw {{.*}}%xmm
define <8 x i16> @phsubw1(<8 x i16> %x, <8 x i16> %y) {
  %a = shufflevector <8 x i16> %x, <8 x i16> %y, <8 x i32> <i32 0, i32 2, i32 4, i32 6, i32 8, i32 10, i32 12, i32 14>
  %b = shufflevector <8 x i16> %x, <8 x i16> %y, <8 x i32> <i32 1, i32 3, i32 5, i32 7, i32 9, i32 11, i32 13, i32 15>
  %r = sub <8 x i16> %a, %b
  ret <8 x i16> %r
}
|
|
|
|
; phsubd1 - canonical horizontal subtract of two <4 x i32> vectors.
; %a = <x0, x2, y0, y2> and %b = <x1, x3, y1, y3>, so
; %r = <x0-x1, x2-x3, y0-y1, y2-y3>.
; The instruction checks require an xmm operand after the mnemonic; a bare
; mnemonic is a substring of the symbol name and would match the label or
; its trailing comment even when no horizontal subtract was selected.
; SSSE3: phsubd1:
; SSSE3-NOT: vphsubd
; SSSE3: phsubd {{.*}}%xmm
; AVX: phsubd1:
; AVX: vphsubd {{.*}}%xmm
define <4 x i32> @phsubd1(<4 x i32> %x, <4 x i32> %y) {
  %a = shufflevector <4 x i32> %x, <4 x i32> %y, <4 x i32> <i32 0, i32 2, i32 4, i32 6>
  %b = shufflevector <4 x i32> %x, <4 x i32> %y, <4 x i32> <i32 1, i32 3, i32 5, i32 7>
  %r = sub <4 x i32> %a, %b
  ret <4 x i32> %r
}
|
|
|
|
; phsubd2 - single-input horizontal subtract with partially undefined masks.
; Lane 0 of both masks is undef, and indices 4..7 select from the undef
; second shuffle operand, so only lane 1 of %r (x2 - x3) is fully defined.
; A horizontal subtract is still expected to be selected.
; The instruction checks require an xmm operand after the mnemonic; a bare
; mnemonic is a substring of the symbol name and would match the label or
; its trailing comment even when no horizontal subtract was selected.
; SSSE3: phsubd2:
; SSSE3-NOT: vphsubd
; SSSE3: phsubd {{.*}}%xmm
; AVX: phsubd2:
; AVX: vphsubd {{.*}}%xmm
define <4 x i32> @phsubd2(<4 x i32> %x) {
  %a = shufflevector <4 x i32> %x, <4 x i32> undef, <4 x i32> <i32 undef, i32 2, i32 4, i32 6>
  %b = shufflevector <4 x i32> %x, <4 x i32> undef, <4 x i32> <i32 undef, i32 3, i32 5, i32 7>
  %r = sub <4 x i32> %a, %b
  ret <4 x i32> %r
}
|
|
|
|
; phsubd3 - single-input horizontal subtract, upper half undefined.
; %a = <x0, x2, undef, undef> and %b = <x1, x3, undef, undef>, so the low
; two lanes of %r are x0-x1 and x2-x3 and the high two lanes are undefined.
; The instruction checks require an xmm operand after the mnemonic; a bare
; mnemonic is a substring of the symbol name and would match the label or
; its trailing comment even when no horizontal subtract was selected.
; SSSE3: phsubd3:
; SSSE3-NOT: vphsubd
; SSSE3: phsubd {{.*}}%xmm
; AVX: phsubd3:
; AVX: vphsubd {{.*}}%xmm
define <4 x i32> @phsubd3(<4 x i32> %x) {
  %a = shufflevector <4 x i32> %x, <4 x i32> undef, <4 x i32> <i32 0, i32 2, i32 undef, i32 undef>
  %b = shufflevector <4 x i32> %x, <4 x i32> undef, <4 x i32> <i32 1, i32 3, i32 undef, i32 undef>
  %r = sub <4 x i32> %a, %b
  ret <4 x i32> %r
}
|
|
|
|
; phsubd4 - single-input horizontal subtract with only lane 0 defined.
; %a = <x0, undef, undef, undef> and %b = <x1, undef, undef, undef>, so
; lane 0 of %r is x0-x1 and every other lane is undefined.
; The instruction checks require an xmm operand after the mnemonic; a bare
; mnemonic is a substring of the symbol name and would match the label or
; its trailing comment even when no horizontal subtract was selected.
; SSSE3: phsubd4:
; SSSE3-NOT: vphsubd
; SSSE3: phsubd {{.*}}%xmm
; AVX: phsubd4:
; AVX: vphsubd {{.*}}%xmm
define <4 x i32> @phsubd4(<4 x i32> %x) {
  %a = shufflevector <4 x i32> %x, <4 x i32> undef, <4 x i32> <i32 0, i32 undef, i32 undef, i32 undef>
  %b = shufflevector <4 x i32> %x, <4 x i32> undef, <4 x i32> <i32 1, i32 undef, i32 undef, i32 undef>
  %r = sub <4 x i32> %a, %b
  ret <4 x i32> %r
}
|