mirror of
https://github.com/RPCS3/llvm-mirror.git
synced 2024-11-24 03:33:20 +01:00
d464e3d65b
Add earlyclobber constraints to prevent an input register from being allocated as the output register because, according to the Intel spec [1], "If any pair of the index, mask, or destination registers are the same, this instruction results a UD fault." --- [1] http://software.intel.com/sites/default/files/319433-014.pdf llvm-svn: 183327
19 lines
690 B
LLVM
19 lines
690 B
LLVM
; RUN: not llc < %s -mtriple=x86_64-apple-darwin -mcpu=corei7-avx
|
|
; RUN: llc < %s -mtriple=x86_64-apple-darwin -mcpu=core-avx2 | FileCheck %s
|
|
|
|
; Declaration of the AVX2 gather intrinsic that the test function calls.
; Operand types, in order: <4 x float>, i8*, <4 x i32>, <4 x float>, i8;
; the result type is <4 x float>.
declare <4 x float> @llvm.x86.avx2.gather.d.ps(<4 x float>, i8*,
|
|
<4 x i32>, <4 x float>, i8) nounwind readonly
|
|
|
|
; Regression test for the earlyclobber constraint on the gather instruction:
; the register allocated for the result must not be the same register as the
; index or mask operand.
; The function forwards %a1, %idx and %mask to the gather intrinsic, with an
; undef first operand and the constant i8 2 as the last operand, and returns
; the intrinsic's result unchanged.
; NOTE(review): the first operand is presumably the pass-through source and
; the trailing i8 the address scale -- confirm against the intrinsic definition.
define <4 x float> @test_x86_avx2_gather_d_ps(i8* %a1,
|
|
<4 x i32> %idx, <4 x float> %mask) {
|
|
%res = call <4 x float> @llvm.x86.avx2.gather.d.ps(<4 x float> undef,
|
|
i8* %a1, <4 x i32> %idx, <4 x float> %mask, i8 2) ;
|
|
ret <4 x float> %res
|
|
}
|
|
|
|
; Expected llc output, matched in order: the function's name, the text
; vgatherdps, an %xmm register at the end of a line (bound to DST), then ret.
; NOTE(review): the negative directive uses DST before the directive that
; binds it; presumably the tool evaluates it once DST is bound, so that it
; rejects the destination register appearing earlier on the gather line --
; confirm against the FileCheck documentation.
; CHECK: test_x86_avx2_gather_d_ps
|
|
; CHECK: vgatherdps
|
|
; CHECK-NOT: [[DST]]
|
|
; CHECK: [[DST:%xmm[0-9]+]]{{$}}
|
|
; CHECK: ret
|