mirror of
https://github.com/RPCS3/llvm-mirror.git
synced 2024-11-22 18:54:02 +01:00
416a79594b
We currently produce a load, followed by (possibly a move for integers and) a splat as separate instructions. VSX has always had a splatting load for doublewords, but as of Power9, we have it for words as well. This patch just exploits these instructions. Differential revision: https://reviews.llvm.org/D63624 llvm-svn: 372139
56 lines
2.4 KiB
LLVM
56 lines
2.4 KiB
LLVM
; RUN: llc -verify-machineinstrs -mcpu=pwr8 -mtriple=powerpc64le-unknown-linux-gnu -O3 < %s | FileCheck %s
|
|
;
|
|
; This is a regression test based on https://llvm.org/bugs/show_bug.cgi?id=27735
|
|
;
|
|
|
|
; Four <2 x double> globals with constant initializers. None of them is
; referenced by @zg or by the CHECK lines in the visible part of this file.
@G1 = global <2 x double> <double 2.0, double -10.0>
|
|
@G2 = global <2 x double> <double 3.0, double 4.0>
|
|
@G3 = global <2 x double> <double 5.0, double 6.0>
|
|
@G4 = global <2 x double> <double 7.0, double 8.0>
|
|
|
|
; CHECK-LABEL: @zg
|
|
; CHECK: lxvdsx
|
|
; CHECK-NEXT: lxvdsx
|
|
; CHECK-NEXT: xvmuldp
|
|
; CHECK-DAG: xvmuldp
|
|
; CHECK-DAG: xvsubdp
|
|
; CHECK-DAG: xvadddp
|
|
; CHECK-DAG: xxswapd
|
|
; CHECK-DAG: xxpermdi
|
|
; CHECK-DAG: xvsubdp
|
|
; CHECK: xxswapd
|
|
; CHECK-NEXT: stxvd2x
|
|
; CHECK: blr
|
|
|
|
; Function Attrs: noinline
|
|
; @zg - function under test.
;
; Reads a <2 x double> V = (v0, v1) from %.ka0000_391 and two scalars x, y
; from bytes 0..7 and 8..15 of %.G0011_640.0, then updates the <2 x double>
; stored at %.G0012_642.0 in place:
;   lane 0: old0 - (v0*x - v1*y)
;   lane 1: old1 - (v1*x + v0*y)
; (this has the shape of a complex multiply-subtract; NOTE(review): that
; interpretation is inferred from the arithmetic, not stated in the file).
; V is also copied to %JJ.
;
; Parameters:
;   %.G0011_640.0  - i8* to the two scalar doubles x and y (loaded align 1).
;   %.G0012_642.0  - i8* to the <2 x double> accumulator (loaded align 1,
;                    stored align 8).
;   %JJ            - destination for a copy of V.
;   %.ka0000_391   - source of V (loaded align 16).
;   %.unpack, %.unpack66 - not used anywhere in the body.
define void @zg(i8* %.G0011_640.0, i8* %.G0012_642.0, <2 x double>* %JJ, <2 x double>* %.ka0000_391, double %.unpack, double %.unpack66) #0 {
|
|
L.JA291:
|
|
; Load V and copy it to %JJ.
%Z.L.JA291.2 = load <2 x double>, <2 x double>* %.ka0000_391, align 16
|
|
store <2 x double> %Z.L.JA291.2, <2 x double>* %JJ, align 8
|
|
; Load the current accumulator vector through a vector-typed view of the pointer.
%Z.L.JA291.3 = bitcast i8* %.G0012_642.0 to <2 x double>*
|
|
%Z.L.JA291.4 = load <2 x double>, <2 x double>* %Z.L.JA291.3, align 1
|
|
; Load scalar x from offset 0 of %.G0011_640.0.
%.elt136 = bitcast i8* %.G0011_640.0 to double*
|
|
%.unpack137 = load double, double* %.elt136, align 1
|
|
; Load scalar y from offset 8 of %.G0011_640.0.
%.elt138 = getelementptr inbounds i8, i8* %.G0011_640.0, i64 8
|
|
%Z.L.JA291.5 = bitcast i8* %.elt138 to double*
|
|
%.unpack139 = load double, double* %Z.L.JA291.5, align 1
|
|
; Splat x into both lanes: (x, x).
%Z.L.JA291.6 = insertelement <2 x double> undef, double %.unpack137, i32 0
|
|
%Z.L.JA291.7 = insertelement <2 x double> %Z.L.JA291.6, double %.unpack137, i32 1
|
|
; (v0*x, v1*x)
%Z.L.JA291.8 = fmul <2 x double> %Z.L.JA291.2, %Z.L.JA291.7
|
|
; Mask <1, 0> swaps the two lanes of V: (v1, v0).
%Z.L.JA291.9 = shufflevector <2 x double> %Z.L.JA291.2, <2 x double> undef, <2 x i32> <i32 1, i32 0>
|
|
; Splat y into both lanes: (y, y).
%Z.L.JA291.10 = insertelement <2 x double> undef, double %.unpack139, i32 0
|
|
%Z.L.JA291.11 = insertelement <2 x double> %Z.L.JA291.10, double %.unpack139, i32 1
|
|
; (v1*y, v0*y)
%Z.L.JA291.12 = fmul <2 x double> %Z.L.JA291.9, %Z.L.JA291.11
|
|
; Difference and sum of the two products, computed for both lanes.
%Z.L.JA291.13 = fsub <2 x double> %Z.L.JA291.8, %Z.L.JA291.12
|
|
%Z.L.JA291.14 = fadd <2 x double> %Z.L.JA291.8, %Z.L.JA291.12
|
|
; Mask <0, 3>: lane 0 from the difference, lane 1 from the sum (index 3 is
; element 1 of the second operand), giving (v0*x - v1*y, v1*x + v0*y).
%Z.L.JA291.15 = shufflevector <2 x double> %Z.L.JA291.13, <2 x double> %Z.L.JA291.14, <2 x i32> <i32 0, i32 3>
|
|
; Subtract the combined vector from the accumulator and store it back.
%Z.L.JA291.16 = fsub <2 x double> %Z.L.JA291.4, %Z.L.JA291.15
|
|
%Z.L.JA291.17 = bitcast i8* %.G0012_642.0 to <2 x double>*
|
|
store <2 x double> %Z.L.JA291.16, <2 x double>* %Z.L.JA291.17, align 8
|
|
; Reload the first 32 bits of %JJ as an i32. The result %.pre is never used,
; and the load claims align 32 although the earlier store to %JJ used align 8.
; NOTE(review): presumably this load/alignment pattern is what the referenced
; bug report exercises - confirm against the report before changing it.
%.. = bitcast <2 x double>* %JJ to i32*
|
|
%.pre = load i32, i32* %.., align 32
|
|
ret void
|
|
}
|
|
|
|
; Attribute group #0, referenced by the definition of @zg.
attributes #0 = { noinline }
|