mirror of
https://github.com/RPCS3/llvm-mirror.git
synced 2024-11-25 12:12:47 +01:00
f7935a3f63
`llc -march` is problematic because it only switches the target architecture, but leaves the operating system unchanged. This occasionally leads to indeterministic tests because the OS from LLVM_DEFAULT_TARGET_TRIPLE is used. However we can simply always use `llc -mtriple` instead. This changes all the tests to do this to avoid people using -march when they copy and paste parts of tests. See also the discussion in https://reviews.llvm.org/D35287 llvm-svn: 309774
46 lines
1.7 KiB
LLVM
46 lines
1.7 KiB
LLVM
; RUN: llc < %s -mtriple=x86_64-- -mcpu=corei7 | FileCheck %s
|
|
|
|
; rdar://11897677
|
|
|
|
;CHECK-LABEL: intrin_pmov:
|
|
;CHECK: pmovzxbw (%{{.*}}), %xmm0
|
|
;CHECK-NEXT: movdqu
|
|
;CHECK-NEXT: ret
|
|
define void @intrin_pmov(i16* noalias %dest, i8* noalias %src) nounwind uwtable ssp {
|
|
%1 = bitcast i8* %src to <2 x i64>*
|
|
%2 = load <2 x i64>, <2 x i64>* %1, align 16
|
|
%3 = bitcast <2 x i64> %2 to <16 x i8>
|
|
%4 = tail call <8 x i16> @llvm.x86.sse41.pmovzxbw(<16 x i8> %3) nounwind
|
|
%5 = bitcast i16* %dest to i8*
|
|
%6 = bitcast <8 x i16> %4 to <16 x i8>
|
|
tail call void @llvm.x86.sse2.storeu.dq(i8* %5, <16 x i8> %6) nounwind
|
|
ret void
|
|
}
|
|
|
|
declare <8 x i16> @llvm.x86.sse41.pmovzxbw(<16 x i8>) nounwind readnone
|
|
declare void @llvm.x86.sse2.storeu.dq(i8*, <16 x i8>) nounwind
|
|
|
|
; rdar://15245794
|
|
|
|
define <4 x i32> @foo0(double %v.coerce) nounwind ssp {
|
|
; CHECK-LABEL: foo0
|
|
; CHECK: pmovzxwd %xmm0, %xmm0
|
|
; CHECK-NEXT: ret
|
|
%tmp = bitcast double %v.coerce to <4 x i16>
|
|
%tmp1 = shufflevector <4 x i16> %tmp, <4 x i16> undef, <8 x i32> <i32 0, i32 1, i32 2, i32 3, i32 undef, i32 undef, i32 undef, i32 undef>
|
|
%tmp2 = tail call <4 x i32> @llvm.x86.sse41.pmovzxwd(<8 x i16> %tmp1) nounwind
|
|
ret <4 x i32> %tmp2
|
|
}
|
|
|
|
define <8 x i16> @foo1(double %v.coerce) nounwind ssp {
|
|
; CHECK-LABEL: foo1
|
|
; CHECK: pmovzxbw %xmm0, %xmm0
|
|
; CHECK-NEXT: ret
|
|
%tmp = bitcast double %v.coerce to <8 x i8>
|
|
%tmp1 = shufflevector <8 x i8> %tmp, <8 x i8> undef, <16 x i32> <i32 0, i32 1, i32 2, i32 3, i32 4, i32 5, i32 6, i32 7, i32 undef, i32 undef, i32 undef, i32 undef, i32 undef, i32 undef, i32 undef, i32 undef>
|
|
%tmp2 = tail call <8 x i16> @llvm.x86.sse41.pmovzxbw(<16 x i8> %tmp1)
|
|
ret <8 x i16> %tmp2
|
|
}
|
|
|
|
declare <4 x i32> @llvm.x86.sse41.pmovzxwd(<8 x i16>) nounwind readnone
|