mirror of
https://github.com/RPCS3/llvm-mirror.git
synced 2024-11-23 11:13:28 +01:00
e4386158ff
Since z13, the max group size will be 2 if any μop has more than 3 register sources. This has been ignored so far in the SystemZHazardRecognizer, but is now handled by recognizing those instructions and adjusting the tracking of decoding and the cost heuristic for grouping. Review: Ulrich Weigand https://reviews.llvm.org/D49847 llvm-svn: 338368
850 lines
34 KiB
LLVM
850 lines
34 KiB
LLVM
; Test that a vector select with a logic combination of two compares does not
|
|
; produce any unnecessary pack, unpack or shift instructions.
|
|
; And, Or and Xor are tested.
|
|
;
|
|
; RUN: llc < %s -mtriple=s390x-linux-gnu -mcpu=z13 | FileCheck %s
|
|
; RUN: llc < %s -mtriple=s390x-linux-gnu -mcpu=z14 | FileCheck %s -check-prefix=CHECK-Z14
|
|
|
|
; fun0: the AND of two <2 x i8> equality compares selects between <2 x i8>
; values. Compare and select element widths match; z13 is expected to feed the
; vn result straight into vsel.
define <2 x i8> @fun0(<2 x i8> %val1, <2 x i8> %val2, <2 x i8> %val3, <2 x i8> %val4, <2 x i8> %val5, <2 x i8> %val6) {
; CHECK-LABEL: fun0:
; CHECK: # %bb.0:
; CHECK-DAG: vceqb [[REG0:%v[0-9]+]], %v24, %v26
; CHECK-DAG: vceqb [[REG1:%v[0-9]+]], %v28, %v30
; CHECK-NEXT: vn %v0, [[REG0]], [[REG1]]
; CHECK-NEXT: vsel %v24, %v25, %v27, %v0
; CHECK-NEXT: br %r14
  %cmp0 = icmp eq <2 x i8> %val1, %val2
  %cmp1 = icmp eq <2 x i8> %val3, %val4
  %and = and <2 x i1> %cmp0, %cmp1
  %sel = select <2 x i1> %and, <2 x i8> %val5, <2 x i8> %val6
  ret <2 x i8> %sel
}
|
|
|
|
; fun1: the AND of two <2 x i8> equality compares selects between <2 x i16>
; values. The z13 expectations show the byte mask being widened once (vuphb)
; after the vn.
define <2 x i16> @fun1(<2 x i8> %val1, <2 x i8> %val2, <2 x i8> %val3, <2 x i8> %val4, <2 x i16> %val5, <2 x i16> %val6) {
; CHECK-LABEL: fun1:
; CHECK: # %bb.0:
; CHECK-DAG: vceqb [[REG0:%v[0-9]+]], %v24, %v26
; CHECK-DAG: vceqb [[REG1:%v[0-9]+]], %v28, %v30
; CHECK-NEXT: vn %v0, [[REG0]], [[REG1]]
; CHECK-NEXT: vuphb %v0, %v0
; CHECK-NEXT: vsel %v24, %v25, %v27, %v0
; CHECK-NEXT: br %r14
  %cmp0 = icmp eq <2 x i8> %val1, %val2
  %cmp1 = icmp eq <2 x i8> %val3, %val4
  %and = and <2 x i1> %cmp0, %cmp1
  %sel = select <2 x i1> %and, <2 x i16> %val5, <2 x i16> %val6
  ret <2 x i16> %sel
}
|
|
|
|
; fun2: the OR of a <16 x i8> compare and a <16 x i16> compare selects between
; <16 x i8> values. The z13 expectations show the two halfword compare results
; being packed (vpkh) before the vo.
define <16 x i8> @fun2(<16 x i8> %val1, <16 x i8> %val2, <16 x i16> %val3, <16 x i16> %val4, <16 x i8> %val5, <16 x i8> %val6) {
; CHECK-LABEL: fun2:
; CHECK: # %bb.0:
; CHECK-DAG: vceqh [[REG0:%v[0-9]+]], %v30, %v27
; CHECK-DAG: vceqh [[REG1:%v[0-9]+]], %v28, %v25
; CHECK-DAG: vceqb [[REG2:%v[0-9]+]], %v24, %v26
; CHECK-DAG: vpkh [[REG3:%v[0-9]+]], [[REG1]], [[REG0]]
; CHECK-NEXT: vo %v0, [[REG2]], [[REG3]]
; CHECK-NEXT: vsel %v24, %v29, %v31, %v0
; CHECK-NEXT: br %r14
  %cmp0 = icmp eq <16 x i8> %val1, %val2
  %cmp1 = icmp eq <16 x i16> %val3, %val4
  %or = or <16 x i1> %cmp0, %cmp1
  %sel = select <16 x i1> %or, <16 x i8> %val5, <16 x i8> %val6
  ret <16 x i8> %sel
}
|
|
|
|
; fun3: the OR of a <16 x i8> compare and a <16 x i16> compare selects between
; <16 x i16> values. The z13 expectations show the byte mask being split into
; two halfword masks (vuphb, vmrlg + vuphb), each feeding its own vo and vsel.
define <16 x i16> @fun3(<16 x i8> %val1, <16 x i8> %val2, <16 x i16> %val3, <16 x i16> %val4, <16 x i16> %val5, <16 x i16> %val6) {
; CHECK-LABEL: fun3:
; CHECK: # %bb.0:
; CHECK-DAG: vceqb [[REG0:%v[0-9]+]], %v24, %v26
; CHECK-DAG: vuphb [[REG2:%v[0-9]+]], [[REG0]]
; CHECK-DAG: vmrlg [[REG1:%v[0-9]+]], [[REG0]], [[REG0]]
; CHECK-DAG: vuphb [[REG1]], [[REG1]]
; CHECK-DAG: vceqh [[REG3:%v[0-9]+]], %v28, %v25
; CHECK-DAG: vceqh [[REG4:%v[0-9]+]], %v30, %v27
; CHECK-DAG: vl [[REG5:%v[0-9]+]], 176(%r15)
; CHECK-DAG: vl [[REG6:%v[0-9]+]], 160(%r15)
; CHECK-DAG: vo [[REG7:%v[0-9]+]], %v2, [[REG4]]
; CHECK-DAG: vo [[REG8:%v[0-9]+]], [[REG2]], [[REG3]]
; CHECK-DAG: vsel %v24, %v29, [[REG6]], [[REG8]]
; CHECK-DAG: vsel %v26, %v31, [[REG5]], [[REG7]]
; CHECK-NEXT: br %r14
  %cmp0 = icmp eq <16 x i8> %val1, %val2
  %cmp1 = icmp eq <16 x i16> %val3, %val4
  %or = or <16 x i1> %cmp0, %cmp1
  %sel = select <16 x i1> %or, <16 x i16> %val5, <16 x i16> %val6
  ret <16 x i16> %sel
}
|
|
|
|
; fun4: the XOR of two <32 x i8> equality compares selects between <32 x i8>
; values. The z13 expectations show four byte compares, two vx and two vsel,
; with the select operands fetched by vl from %r15-relative slots.
define <32 x i8> @fun4(<32 x i8> %val1, <32 x i8> %val2, <32 x i8> %val3, <32 x i8> %val4, <32 x i8> %val5, <32 x i8> %val6) {
; CHECK-LABEL: fun4:
; CHECK: # %bb.0:
; CHECK-DAG: vceqb [[REG0:%v[0-9]+]], %v24, %v28
; CHECK-DAG: vceqb [[REG1:%v[0-9]+]], %v26, %v30
; CHECK-DAG: vceqb [[REG2:%v[0-9]+]], %v25, %v29
; CHECK-DAG: vceqb [[REG3:%v[0-9]+]], %v27, %v31
; CHECK-DAG: vl [[REG4:%v[0-9]+]], 208(%r15)
; CHECK-DAG: vl [[REG5:%v[0-9]+]], 176(%r15)
; CHECK-DAG: vl [[REG6:%v[0-9]+]], 192(%r15)
; CHECK-DAG: vl [[REG7:%v[0-9]+]], 160(%r15)
; CHECK-DAG: vx [[REG8:%v[0-9]+]], [[REG1]], [[REG3]]
; CHECK-DAG: vx [[REG9:%v[0-9]+]], [[REG0]], [[REG2]]
; CHECK-DAG: vsel %v24, [[REG7]], [[REG6]], [[REG9]]
; CHECK-DAG: vsel %v26, [[REG5]], [[REG4]], [[REG8]]
; CHECK-NEXT: br %r14
  %cmp0 = icmp eq <32 x i8> %val1, %val2
  %cmp1 = icmp eq <32 x i8> %val3, %val4
  %xor = xor <32 x i1> %cmp0, %cmp1
  %sel = select <32 x i1> %xor, <32 x i8> %val5, <32 x i8> %val6
  ret <32 x i8> %sel
}
|
|
|
|
; fun5: the OR of a <2 x i16> compare and a <2 x i8> compare selects between
; <2 x i8> values. The z13 expectations show the halfword mask being packed
; (vpkh) to byte width before the vo.
define <2 x i8> @fun5(<2 x i16> %val1, <2 x i16> %val2, <2 x i8> %val3, <2 x i8> %val4, <2 x i8> %val5, <2 x i8> %val6) {
; CHECK-LABEL: fun5:
; CHECK: # %bb.0:
; CHECK-DAG: vceqh [[REG0:%v[0-9]+]], %v24, %v26
; CHECK-DAG: vpkh [[REG1:%v[0-9]+]], [[REG0]], [[REG0]]
; CHECK-DAG: vceqb [[REG2:%v[0-9]+]], %v28, %v30
; CHECK-DAG: vo %v0, [[REG1]], [[REG2]]
; CHECK-DAG: vsel %v24, %v25, %v27, %v0
; CHECK-NEXT: br %r14
  %cmp0 = icmp eq <2 x i16> %val1, %val2
  %cmp1 = icmp eq <2 x i8> %val3, %val4
  %or = or <2 x i1> %cmp0, %cmp1
  %sel = select <2 x i1> %or, <2 x i8> %val5, <2 x i8> %val6
  ret <2 x i8> %sel
}
|
|
|
|
; fun6: the OR of a <2 x i16> compare and a <2 x i8> compare selects between
; <2 x i16> values. The z13 expectations show the byte mask being widened
; (vuphb) to halfword width before the vo.
define <2 x i16> @fun6(<2 x i16> %val1, <2 x i16> %val2, <2 x i8> %val3, <2 x i8> %val4, <2 x i16> %val5, <2 x i16> %val6) {
; CHECK-LABEL: fun6:
; CHECK: # %bb.0:
; CHECK-NEXT: vceqb %v1, %v28, %v30
; CHECK-NEXT: vceqh %v0, %v24, %v26
; CHECK-NEXT: vuphb %v1, %v1
; CHECK-NEXT: vo %v0, %v0, %v1
; CHECK-NEXT: vsel %v24, %v25, %v27, %v0
; CHECK-NEXT: br %r14
  %cmp0 = icmp eq <2 x i16> %val1, %val2
  %cmp1 = icmp eq <2 x i8> %val3, %val4
  %or = or <2 x i1> %cmp0, %cmp1
  %sel = select <2 x i1> %or, <2 x i16> %val5, <2 x i16> %val6
  ret <2 x i16> %sel
}
|
|
|
|
; fun7: the OR of a <2 x i16> compare and a <2 x i8> compare selects between
; <2 x i32> values. The z13 expectations show the byte mask widened (vuphb)
; before the vo, and the combined mask widened again (vuphh) before the vsel.
define <2 x i32> @fun7(<2 x i16> %val1, <2 x i16> %val2, <2 x i8> %val3, <2 x i8> %val4, <2 x i32> %val5, <2 x i32> %val6) {
; CHECK-LABEL: fun7:
; CHECK: # %bb.0:
; CHECK-NEXT: vceqb %v1, %v28, %v30
; CHECK-NEXT: vceqh %v0, %v24, %v26
; CHECK-NEXT: vuphb %v1, %v1
; CHECK-NEXT: vo %v0, %v0, %v1
; CHECK-NEXT: vuphh %v0, %v0
; CHECK-NEXT: vsel %v24, %v25, %v27, %v0
; CHECK-NEXT: br %r14
  %cmp0 = icmp eq <2 x i16> %val1, %val2
  %cmp1 = icmp eq <2 x i8> %val3, %val4
  %or = or <2 x i1> %cmp0, %cmp1
  %sel = select <2 x i1> %or, <2 x i32> %val5, <2 x i32> %val6
  ret <2 x i32> %sel
}
|
|
|
|
; fun8: the XOR of two <8 x i16> equality compares selects between <8 x i8>
; values. The z13 expectations show the combined halfword mask being packed
; once (vpkh) after the vx.
define <8 x i8> @fun8(<8 x i16> %val1, <8 x i16> %val2, <8 x i16> %val3, <8 x i16> %val4, <8 x i8> %val5, <8 x i8> %val6) {
; CHECK-LABEL: fun8:
; CHECK: # %bb.0:
; CHECK-DAG: vceqh [[REG0:%v[0-9]+]], %v24, %v26
; CHECK-DAG: vceqh [[REG1:%v[0-9]+]], %v28, %v30
; CHECK-NEXT: vx %v0, [[REG0]], [[REG1]]
; CHECK-NEXT: vpkh %v0, %v0, %v0
; CHECK-NEXT: vsel %v24, %v25, %v27, %v0
; CHECK-NEXT: br %r14
  %cmp0 = icmp eq <8 x i16> %val1, %val2
  %cmp1 = icmp eq <8 x i16> %val3, %val4
  %xor = xor <8 x i1> %cmp0, %cmp1
  %sel = select <8 x i1> %xor, <8 x i8> %val5, <8 x i8> %val6
  ret <8 x i8> %sel
}
|
|
|
|
; fun9: the XOR of two <8 x i16> equality compares selects between <8 x i16>
; values. Compare and select element widths match; z13 is expected to feed the
; vx result straight into vsel.
define <8 x i16> @fun9(<8 x i16> %val1, <8 x i16> %val2, <8 x i16> %val3, <8 x i16> %val4, <8 x i16> %val5, <8 x i16> %val6) {
; CHECK-LABEL: fun9:
; CHECK: # %bb.0:
; CHECK-DAG: vceqh [[REG0:%v[0-9]+]], %v24, %v26
; CHECK-DAG: vceqh [[REG1:%v[0-9]+]], %v28, %v30
; CHECK-NEXT: vx %v0, [[REG0]], [[REG1]]
; CHECK-NEXT: vsel %v24, %v25, %v27, %v0
; CHECK-NEXT: br %r14
  %cmp0 = icmp eq <8 x i16> %val1, %val2
  %cmp1 = icmp eq <8 x i16> %val3, %val4
  %xor = xor <8 x i1> %cmp0, %cmp1
  %sel = select <8 x i1> %xor, <8 x i16> %val5, <8 x i16> %val6
  ret <8 x i16> %sel
}
|
|
|
|
; fun10: the XOR of two <8 x i16> equality compares selects between <8 x i32>
; values. The z13 expectations show the combined halfword mask being split
; into two word masks (vuphh, vmrlg + vuphh), one per vsel.
define <8 x i32> @fun10(<8 x i16> %val1, <8 x i16> %val2, <8 x i16> %val3, <8 x i16> %val4, <8 x i32> %val5, <8 x i32> %val6) {
; CHECK-LABEL: fun10:
; CHECK: # %bb.0:
; CHECK-DAG: vceqh [[REG0:%v[0-9]+]], %v24, %v26
; CHECK-DAG: vceqh [[REG1:%v[0-9]+]], %v28, %v30
; CHECK-NEXT: vx [[REG2:%v[0-9]+]], [[REG0]], [[REG1]]
; CHECK-DAG: vuphh [[REG3:%v[0-9]+]], [[REG2]]
; CHECK-DAG: vmrlg [[REG4:%v[0-9]+]], [[REG2]], [[REG2]]
; CHECK-DAG: vuphh [[REG5:%v[0-9]+]], [[REG4]]
; CHECK-NEXT: vsel %v24, %v25, %v29, [[REG3]]
; CHECK-NEXT: vsel %v26, %v27, %v31, [[REG5]]
; CHECK-NEXT: br %r14
  %cmp0 = icmp eq <8 x i16> %val1, %val2
  %cmp1 = icmp eq <8 x i16> %val3, %val4
  %xor = xor <8 x i1> %cmp0, %cmp1
  %sel = select <8 x i1> %xor, <8 x i32> %val5, <8 x i32> %val6
  ret <8 x i32> %sel
}
|
|
|
|
; fun11: the AND of a <16 x i16> compare and a <16 x i32> compare selects
; between <16 x i8> values. The z13 expectations show the word compare results
; packed (vpkf) to halfword width for the vn, and the combined masks packed
; again (vpkh) for the single vsel.
define <16 x i8> @fun11(<16 x i16> %val1, <16 x i16> %val2, <16 x i32> %val3, <16 x i32> %val4, <16 x i8> %val5, <16 x i8> %val6) {
; CHECK-LABEL: fun11:
; CHECK: # %bb.0:
; CHECK-DAG: vl [[REG0:%v[0-9]+]], 192(%r15)
; CHECK-DAG: vl [[REG1:%v[0-9]+]], 208(%r15)
; CHECK-DAG: vl [[REG2:%v[0-9]+]], 160(%r15)
; CHECK-DAG: vl [[REG3:%v[0-9]+]], 176(%r15)
; CHECK-DAG: vceqf [[REG4:%v[0-9]+]], %v27, [[REG3]]
; CHECK-DAG: vceqf [[REG5:%v[0-9]+]], %v25, [[REG2]]
; CHECK-DAG: vceqf [[REG6:%v[0-9]+]], %v31, [[REG1]]
; CHECK-DAG: vceqf [[REG7:%v[0-9]+]], %v29, [[REG0]]
; CHECK-DAG: vceqh [[REG8:%v[0-9]+]], %v24, %v28
; CHECK-DAG: vceqh [[REG9:%v[0-9]+]], %v26, %v30
; CHECK-DAG: vpkf [[REG10:%v[0-9]+]], [[REG5]], [[REG4]]
; CHECK-DAG: vpkf [[REG11:%v[0-9]+]], [[REG7]], [[REG6]]
; CHECK-DAG: vn [[REG12:%v[0-9]+]], [[REG9]], [[REG11]]
; CHECK-DAG: vn [[REG13:%v[0-9]+]], [[REG8]], [[REG10]]
; CHECK-DAG: vl [[REG14:%v[0-9]+]], 240(%r15)
; CHECK-DAG: vl [[REG15:%v[0-9]+]], 224(%r15)
; CHECK-DAG: vpkh [[REG16:%v[0-9]+]], [[REG13]], [[REG12]]
; CHECK-NEXT: vsel %v24, [[REG15]], [[REG14]], [[REG16]]
; CHECK-NEXT: br %r14
  %cmp0 = icmp eq <16 x i16> %val1, %val2
  %cmp1 = icmp eq <16 x i32> %val3, %val4
  %and = and <16 x i1> %cmp0, %cmp1
  %sel = select <16 x i1> %and, <16 x i8> %val5, <16 x i8> %val6
  ret <16 x i8> %sel
}
|
|
|
|
; fun12: the AND of a <16 x i16> compare and a <16 x i32> compare selects
; between <16 x i16> values. The z13 expectations show the word compare
; results packed (vpkf) to halfword width, then two vn and two vsel.
define <16 x i16> @fun12(<16 x i16> %val1, <16 x i16> %val2, <16 x i32> %val3, <16 x i32> %val4, <16 x i16> %val5, <16 x i16> %val6) {
; CHECK-LABEL: fun12:
; CHECK: # %bb.0:
; CHECK-DAG: vl [[REG0:%v[0-9]+]], 192(%r15)
; CHECK-DAG: vl [[REG1:%v[0-9]+]], 208(%r15)
; CHECK-DAG: vl [[REG2:%v[0-9]+]], 160(%r15)
; CHECK-DAG: vl [[REG3:%v[0-9]+]], 176(%r15)
; CHECK-DAG: vceqf [[REG4:%v[0-9]+]], %v27, [[REG3]]
; CHECK-DAG: vceqf [[REG5:%v[0-9]+]], %v25, [[REG2]]
; CHECK-DAG: vceqf [[REG6:%v[0-9]+]], %v31, [[REG1]]
; CHECK-DAG: vceqf [[REG7:%v[0-9]+]], %v29, [[REG0]]
; CHECK-DAG: vceqh [[REG8:%v[0-9]+]], %v24, %v28
; CHECK-DAG: vceqh [[REG9:%v[0-9]+]], %v26, %v30
; CHECK-DAG: vpkf [[REG10:%v[0-9]+]], [[REG5]], [[REG4]]
; CHECK-DAG: vpkf [[REG11:%v[0-9]+]], [[REG7]], [[REG6]]
; CHECK-DAG: vl [[REG12:%v[0-9]+]], 272(%r15)
; CHECK-DAG: vl [[REG13:%v[0-9]+]], 240(%r15)
; CHECK-DAG: vl [[REG14:%v[0-9]+]], 256(%r15)
; CHECK-DAG: vl [[REG15:%v[0-9]+]], 224(%r15)
; CHECK-DAG: vn [[REG16:%v[0-9]+]], [[REG9]], [[REG11]]
; CHECK-DAG: vn [[REG17:%v[0-9]+]], [[REG8]], [[REG10]]
; CHECK-DAG: vsel %v24, [[REG15]], [[REG14]], [[REG17]]
; CHECK-DAG: vsel %v26, [[REG13]], [[REG12]], [[REG16]]
; CHECK-NEXT: br %r14
  %cmp0 = icmp eq <16 x i16> %val1, %val2
  %cmp1 = icmp eq <16 x i32> %val3, %val4
  %and = and <16 x i1> %cmp0, %cmp1
  %sel = select <16 x i1> %and, <16 x i16> %val5, <16 x i16> %val6
  ret <16 x i16> %sel
}
|
|
|
|
; fun13: the XOR of a <2 x i32> compare and a <2 x i64> compare selects
; between <2 x i16> values. The z13 expectations show the doubleword mask
; packed (vpkg) before the vx, and the combined mask packed again (vpkf)
; before the vsel.
define <2 x i16> @fun13(<2 x i32> %val1, <2 x i32> %val2, <2 x i64> %val3, <2 x i64> %val4, <2 x i16> %val5, <2 x i16> %val6) {
; CHECK-LABEL: fun13:
; CHECK: # %bb.0:
; CHECK-NEXT: vceqg %v1, %v28, %v30
; CHECK-NEXT: vceqf %v0, %v24, %v26
; CHECK-NEXT: vpkg %v1, %v1, %v1
; CHECK-NEXT: vx %v0, %v0, %v1
; CHECK-NEXT: vpkf %v0, %v0, %v0
; CHECK-NEXT: vsel %v24, %v25, %v27, %v0
; CHECK-NEXT: br %r14
  %cmp0 = icmp eq <2 x i32> %val1, %val2
  %cmp1 = icmp eq <2 x i64> %val3, %val4
  %xor = xor <2 x i1> %cmp0, %cmp1
  %sel = select <2 x i1> %xor, <2 x i16> %val5, <2 x i16> %val6
  ret <2 x i16> %sel
}
|
|
|
|
; fun14: the XOR of a <2 x i32> compare and a <2 x i64> compare selects
; between <2 x i32> values. The z13 expectations show the doubleword mask
; packed (vpkg) to word width before the vx.
define <2 x i32> @fun14(<2 x i32> %val1, <2 x i32> %val2, <2 x i64> %val3, <2 x i64> %val4, <2 x i32> %val5, <2 x i32> %val6) {
; CHECK-LABEL: fun14:
; CHECK: # %bb.0:
; CHECK-NEXT: vceqg %v1, %v28, %v30
; CHECK-NEXT: vceqf %v0, %v24, %v26
; CHECK-NEXT: vpkg %v1, %v1, %v1
; CHECK-NEXT: vx %v0, %v0, %v1
; CHECK-NEXT: vsel %v24, %v25, %v27, %v0
; CHECK-NEXT: br %r14
  %cmp0 = icmp eq <2 x i32> %val1, %val2
  %cmp1 = icmp eq <2 x i64> %val3, %val4
  %xor = xor <2 x i1> %cmp0, %cmp1
  %sel = select <2 x i1> %xor, <2 x i32> %val5, <2 x i32> %val6
  ret <2 x i32> %sel
}
|
|
|
|
; fun15: the XOR of a <2 x i32> compare and a <2 x i64> compare selects
; between <2 x i64> values. The z13 expectations show the word mask widened
; (vuphf) to doubleword width before the vx.
define <2 x i64> @fun15(<2 x i32> %val1, <2 x i32> %val2, <2 x i64> %val3, <2 x i64> %val4, <2 x i64> %val5, <2 x i64> %val6) {
; CHECK-LABEL: fun15:
; CHECK: # %bb.0:
; CHECK-DAG: vceqf [[REG0:%v[0-9]+]], %v24, %v26
; CHECK-DAG: vuphf [[REG1:%v[0-9]+]], [[REG0]]
; CHECK-DAG: vceqg [[REG2:%v[0-9]+]], %v28, %v30
; CHECK-NEXT: vx %v0, [[REG1]], [[REG2]]
; CHECK-NEXT: vsel %v24, %v25, %v27, %v0
; CHECK-NEXT: br %r14
  %cmp0 = icmp eq <2 x i32> %val1, %val2
  %cmp1 = icmp eq <2 x i64> %val3, %val4
  %xor = xor <2 x i1> %cmp0, %cmp1
  %sel = select <2 x i1> %xor, <2 x i64> %val5, <2 x i64> %val6
  ret <2 x i64> %sel
}
|
|
|
|
; fun16: the AND of a <4 x i32> compare and a <4 x i16> compare selects
; between <4 x i16> values. The z13 expectations show the word mask packed
; (vpkf) to halfword width before the vn.
define <4 x i16> @fun16(<4 x i32> %val1, <4 x i32> %val2, <4 x i16> %val3, <4 x i16> %val4, <4 x i16> %val5, <4 x i16> %val6) {
; CHECK-LABEL: fun16:
; CHECK: # %bb.0:
; CHECK-DAG: vceqf [[REG0:%v[0-9]+]], %v24, %v26
; CHECK-DAG: vpkf [[REG1:%v[0-9]+]], [[REG0]], [[REG0]]
; CHECK-DAG: vceqh [[REG2:%v[0-9]+]], %v28, %v30
; CHECK-NEXT: vn %v0, [[REG1]], [[REG2]]
; CHECK-NEXT: vsel %v24, %v25, %v27, %v0
; CHECK-NEXT: br %r14
  %cmp0 = icmp eq <4 x i32> %val1, %val2
  %cmp1 = icmp eq <4 x i16> %val3, %val4
  %and = and <4 x i1> %cmp0, %cmp1
  %sel = select <4 x i1> %and, <4 x i16> %val5, <4 x i16> %val6
  ret <4 x i16> %sel
}
|
|
|
|
; fun17: the AND of a <4 x i32> compare and a <4 x i16> compare selects
; between <4 x i32> values. The z13 expectations show the halfword mask
; widened (vuphh) to word width before the vn.
define <4 x i32> @fun17(<4 x i32> %val1, <4 x i32> %val2, <4 x i16> %val3, <4 x i16> %val4, <4 x i32> %val5, <4 x i32> %val6) {
; CHECK-LABEL: fun17:
; CHECK: # %bb.0:
; CHECK-NEXT: vceqh %v1, %v28, %v30
; CHECK-NEXT: vceqf %v0, %v24, %v26
; CHECK-NEXT: vuphh %v1, %v1
; CHECK-NEXT: vn %v0, %v0, %v1
; CHECK-NEXT: vsel %v24, %v25, %v27, %v0
; CHECK-NEXT: br %r14
  %cmp0 = icmp eq <4 x i32> %val1, %val2
  %cmp1 = icmp eq <4 x i16> %val3, %val4
  %and = and <4 x i1> %cmp0, %cmp1
  %sel = select <4 x i1> %and, <4 x i32> %val5, <4 x i32> %val6
  ret <4 x i32> %sel
}
|
|
|
|
; fun18: the AND of a <4 x i32> compare and a <4 x i16> compare selects
; between <4 x i64> values. The z13 expectations show the halfword mask
; widened (vuphh) before the vn, then the combined word mask split into two
; doubleword masks (vuphf, vmrlg + vuphf), one per vsel.
define <4 x i64> @fun18(<4 x i32> %val1, <4 x i32> %val2, <4 x i16> %val3, <4 x i16> %val4, <4 x i64> %val5, <4 x i64> %val6) {
; CHECK-LABEL: fun18:
; CHECK: # %bb.0:
; CHECK-NEXT: vceqh %v1, %v28, %v30
; CHECK-NEXT: vceqf %v0, %v24, %v26
; CHECK-NEXT: vuphh %v1, %v1
; CHECK-NEXT: vn %v0, %v0, %v1
; CHECK-DAG: vuphf [[REG0:%v[0-9]+]], %v0
; CHECK-DAG: vmrlg [[REG1:%v[0-9]+]], %v0, %v0
; CHECK-DAG: vuphf [[REG2:%v[0-9]+]], [[REG1]]
; CHECK-NEXT: vsel %v24, %v25, %v29, [[REG0]]
; CHECK-NEXT: vsel %v26, %v27, %v31, [[REG2]]
; CHECK-NEXT: br %r14
  %cmp0 = icmp eq <4 x i32> %val1, %val2
  %cmp1 = icmp eq <4 x i16> %val3, %val4
  %and = and <4 x i1> %cmp0, %cmp1
  %sel = select <4 x i1> %and, <4 x i64> %val5, <4 x i64> %val6
  ret <4 x i64> %sel
}
|
|
|
|
; fun19: the OR of two <8 x i32> equality compares selects between <8 x i16>
; values. The z13 expectations show two vo on the word masks, followed by one
; pack (vpkf) producing the mask for the single vsel.
define <8 x i16> @fun19(<8 x i32> %val1, <8 x i32> %val2, <8 x i32> %val3, <8 x i32> %val4, <8 x i16> %val5, <8 x i16> %val6) {
; CHECK-LABEL: fun19:
; CHECK: # %bb.0:
; CHECK-DAG: vceqf [[REG0:%v[0-9]+]], %v24, %v28
; CHECK-DAG: vceqf [[REG1:%v[0-9]+]], %v26, %v30
; CHECK-DAG: vceqf [[REG2:%v[0-9]+]], %v25, %v29
; CHECK-DAG: vceqf [[REG3:%v[0-9]+]], %v27, %v31
; CHECK-DAG: vo [[REG4:%v[0-9]+]], [[REG1]], [[REG3]]
; CHECK-DAG: vo [[REG5:%v[0-9]+]], [[REG0]], [[REG2]]
; CHECK-DAG: vl [[REG6:%v[0-9]+]], 176(%r15)
; CHECK-DAG: vl [[REG7:%v[0-9]+]], 160(%r15)
; CHECK-DAG: vpkf [[REG8:%v[0-9]+]], [[REG5]], [[REG4]]
; CHECK-NEXT: vsel %v24, [[REG7]], [[REG6]], [[REG8]]
; CHECK-NEXT: br %r14
  %cmp0 = icmp eq <8 x i32> %val1, %val2
  %cmp1 = icmp eq <8 x i32> %val3, %val4
  %or = or <8 x i1> %cmp0, %cmp1
  %sel = select <8 x i1> %or, <8 x i16> %val5, <8 x i16> %val6
  ret <8 x i16> %sel
}
|
|
|
|
; fun20: the OR of two <8 x i32> equality compares selects between <8 x i32>
; values. The z13 expectations show four word compares, two vo and two vsel,
; with the select operands fetched by vl from %r15-relative slots.
define <8 x i32> @fun20(<8 x i32> %val1, <8 x i32> %val2, <8 x i32> %val3, <8 x i32> %val4, <8 x i32> %val5, <8 x i32> %val6) {
; CHECK-LABEL: fun20:
; CHECK: # %bb.0:
; CHECK-DAG: vceqf [[REG0:%v[0-9]+]], %v24, %v28
; CHECK-DAG: vceqf [[REG1:%v[0-9]+]], %v26, %v30
; CHECK-DAG: vceqf [[REG2:%v[0-9]+]], %v25, %v29
; CHECK-DAG: vceqf [[REG3:%v[0-9]+]], %v27, %v31
; CHECK-DAG: vl [[REG4:%v[0-9]+]], 208(%r15)
; CHECK-DAG: vl [[REG5:%v[0-9]+]], 176(%r15)
; CHECK-DAG: vl [[REG6:%v[0-9]+]], 192(%r15)
; CHECK-DAG: vl [[REG7:%v[0-9]+]], 160(%r15)
; CHECK-DAG: vo [[REG8:%v[0-9]+]], [[REG1]], [[REG3]]
; CHECK-DAG: vo [[REG9:%v[0-9]+]], [[REG0]], [[REG2]]
; CHECK-DAG: vsel %v24, [[REG7]], [[REG6]], [[REG9]]
; CHECK-DAG: vsel %v26, [[REG5]], [[REG4]], [[REG8]]
; CHECK-NEXT: br %r14
  %cmp0 = icmp eq <8 x i32> %val1, %val2
  %cmp1 = icmp eq <8 x i32> %val3, %val4
  %or = or <8 x i1> %cmp0, %cmp1
  %sel = select <8 x i1> %or, <8 x i32> %val5, <8 x i32> %val6
  ret <8 x i32> %sel
}
|
|
|
|
; fun21: the AND of two <2 x i64> equality compares selects between <2 x i32>
; values. The z13 expectations show the combined doubleword mask being packed
; once (vpkg) after the vn.
define <2 x i32> @fun21(<2 x i64> %val1, <2 x i64> %val2, <2 x i64> %val3, <2 x i64> %val4, <2 x i32> %val5, <2 x i32> %val6) {
; CHECK-LABEL: fun21:
; CHECK: # %bb.0:
; CHECK-DAG: vceqg [[REG0:%v[0-9]+]], %v24, %v26
; CHECK-DAG: vceqg [[REG1:%v[0-9]+]], %v28, %v30
; CHECK-NEXT: vn %v0, [[REG0]], [[REG1]]
; CHECK-NEXT: vpkg %v0, %v0, %v0
; CHECK-NEXT: vsel %v24, %v25, %v27, %v0
; CHECK-NEXT: br %r14
  %cmp0 = icmp eq <2 x i64> %val1, %val2
  %cmp1 = icmp eq <2 x i64> %val3, %val4
  %and = and <2 x i1> %cmp0, %cmp1
  %sel = select <2 x i1> %and, <2 x i32> %val5, <2 x i32> %val6
  ret <2 x i32> %sel
}
|
|
|
|
; fun22: the AND of two <2 x i64> equality compares selects between <2 x i64>
; values. Compare and select element widths match; z13 is expected to feed the
; vn result straight into vsel.
define <2 x i64> @fun22(<2 x i64> %val1, <2 x i64> %val2, <2 x i64> %val3, <2 x i64> %val4, <2 x i64> %val5, <2 x i64> %val6) {
; CHECK-LABEL: fun22:
; CHECK: # %bb.0:
; CHECK-DAG: vceqg [[REG0:%v[0-9]+]], %v24, %v26
; CHECK-DAG: vceqg [[REG1:%v[0-9]+]], %v28, %v30
; CHECK-NEXT: vn %v0, [[REG0]], [[REG1]]
; CHECK-NEXT: vsel %v24, %v25, %v27, %v0
; CHECK-NEXT: br %r14
  %cmp0 = icmp eq <2 x i64> %val1, %val2
  %cmp1 = icmp eq <2 x i64> %val3, %val4
  %and = and <2 x i1> %cmp0, %cmp1
  %sel = select <2 x i1> %and, <2 x i64> %val5, <2 x i64> %val6
  ret <2 x i64> %sel
}
|
|
|
|
; fun23: the XOR of a <4 x i64> compare and a <4 x i32> compare selects
; between <4 x i32> values. The z13 expectations show the two doubleword
; compare results packed (vpkg) to word width before the vx.
define <4 x i32> @fun23(<4 x i64> %val1, <4 x i64> %val2, <4 x i32> %val3, <4 x i32> %val4, <4 x i32> %val5, <4 x i32> %val6) {
; CHECK-LABEL: fun23:
; CHECK: # %bb.0:
; CHECK-NEXT: vceqg %v0, %v26, %v30
; CHECK-NEXT: vceqg %v1, %v24, %v28
; CHECK-NEXT: vpkg %v0, %v1, %v0
; CHECK-NEXT: vceqf %v1, %v25, %v27
; CHECK-NEXT: vx %v0, %v0, %v1
; CHECK-NEXT: vsel %v24, %v29, %v31, %v0
; CHECK-NEXT: br %r14
  %cmp0 = icmp eq <4 x i64> %val1, %val2
  %cmp1 = icmp eq <4 x i32> %val3, %val4
  %xor = xor <4 x i1> %cmp0, %cmp1
  %sel = select <4 x i1> %xor, <4 x i32> %val5, <4 x i32> %val6
  ret <4 x i32> %sel
}
|
|
|
|
; fun24: the XOR of a <4 x i64> compare and a <4 x i32> compare selects
; between <4 x i64> values. The z13 expectations show the word mask split into
; two doubleword masks (vuphf, vmrlg + vuphf), each feeding its own vx and
; vsel.
define <4 x i64> @fun24(<4 x i64> %val1, <4 x i64> %val2, <4 x i32> %val3, <4 x i32> %val4, <4 x i64> %val5, <4 x i64> %val6) {
; CHECK-LABEL: fun24:
; CHECK: # %bb.0:
; CHECK-NEXT: vceqf [[REG0:%v[0-9]+]], %v25, %v27
; CHECK-NEXT: vuphf [[REG1:%v[0-9]+]], [[REG0]]
; CHECK-NEXT: vmrlg [[REG2:%v[0-9]+]], [[REG0]], [[REG0]]
; CHECK-DAG: vceqg [[REG3:%v[0-9]+]], %v24, %v28
; CHECK-DAG: vceqg [[REG4:%v[0-9]+]], %v26, %v30
; CHECK-DAG: vuphf [[REG5:%v[0-9]+]], [[REG2]]
; CHECK-DAG: vl [[REG6:%v[0-9]+]], 176(%r15)
; CHECK-DAG: vl [[REG7:%v[0-9]+]], 160(%r15)
; CHECK-DAG: vx [[REG8:%v[0-9]+]], [[REG4]], [[REG5]]
; CHECK-DAG: vx [[REG9:%v[0-9]+]], [[REG3]], [[REG1]]
; CHECK-DAG: vsel %v24, %v29, [[REG7]], [[REG9]]
; CHECK-DAG: vsel %v26, %v31, [[REG6]], [[REG8]]
; CHECK-NEXT: br %r14
  %cmp0 = icmp eq <4 x i64> %val1, %val2
  %cmp1 = icmp eq <4 x i32> %val3, %val4
  %xor = xor <4 x i1> %cmp0, %cmp1
  %sel = select <4 x i1> %xor, <4 x i64> %val5, <4 x i64> %val6
  ret <4 x i64> %sel
}
|
|
|
|
; fun25: the OR of a <2 x float> ogt compare and a <2 x double> ogt compare
; selects between <2 x float> values. The z13 expectations show the float
; operands extended (vldeb) and compared with vfchdb; the z14 expectations use
; vfchsb on the float operands directly.
define <2 x float> @fun25(<2 x float> %val1, <2 x float> %val2, <2 x double> %val3, <2 x double> %val4, <2 x float> %val5, <2 x float> %val6) {
; CHECK-LABEL: fun25:
; CHECK: # %bb.0:
; CHECK-NEXT: vmrlf %v0, %v26, %v26
; CHECK-NEXT: vmrlf %v1, %v24, %v24
; CHECK-NEXT: vldeb %v0, %v0
; CHECK-NEXT: vldeb %v1, %v1
; CHECK-NEXT: vfchdb %v0, %v1, %v0
; CHECK-NEXT: vmrhf %v1, %v26, %v26
; CHECK-NEXT: vmrhf %v2, %v24, %v24
; CHECK-NEXT: vldeb %v1, %v1
; CHECK-NEXT: vldeb %v2, %v2
; CHECK-NEXT: vfchdb %v1, %v2, %v1
; CHECK-NEXT: vpkg %v0, %v1, %v0
; CHECK-NEXT: vfchdb %v1, %v28, %v30
; CHECK-NEXT: vpkg %v1, %v1, %v1
; CHECK-NEXT: vo %v0, %v0, %v1
; CHECK-NEXT: vsel %v24, %v25, %v27, %v0
; CHECK-NEXT: br %r14
;
; CHECK-Z14-LABEL: fun25:
; CHECK-Z14: # %bb.0:
; CHECK-Z14-NEXT: vfchdb %v1, %v28, %v30
; CHECK-Z14-NEXT: vfchsb %v0, %v24, %v26
; CHECK-Z14-NEXT: vpkg %v1, %v1, %v1
; CHECK-Z14-NEXT: vo %v0, %v0, %v1
; CHECK-Z14-NEXT: vsel %v24, %v25, %v27, %v0
; CHECK-Z14-NEXT: br %r14
  %cmp0 = fcmp ogt <2 x float> %val1, %val2
  %cmp1 = fcmp ogt <2 x double> %val3, %val4
  %or = or <2 x i1> %cmp0, %cmp1
  %sel = select <2 x i1> %or, <2 x float> %val5, <2 x float> %val6
  ret <2 x float> %sel
}
|
|
|
|
; fun26: the OR of a <2 x float> ogt compare and a <2 x double> ogt compare
; selects between <2 x double> values. In both the z13 and z14 expectations
; the float-compare mask is widened (vuphf) before the vo; z14 uses vfchsb for
; the float compare instead of the vldeb/vfchdb sequence.
define <2 x double> @fun26(<2 x float> %val1, <2 x float> %val2, <2 x double> %val3, <2 x double> %val4, <2 x double> %val5, <2 x double> %val6) {
; CHECK-LABEL: fun26:
; CHECK: # %bb.0:
; CHECK-NEXT: vmrlf %v0, %v26, %v26
; CHECK-NEXT: vmrlf %v1, %v24, %v24
; CHECK-NEXT: vldeb %v0, %v0
; CHECK-NEXT: vldeb %v1, %v1
; CHECK-NEXT: vfchdb %v0, %v1, %v0
; CHECK-NEXT: vmrhf %v1, %v26, %v26
; CHECK-NEXT: vmrhf %v2, %v24, %v24
; CHECK-NEXT: vldeb %v1, %v1
; CHECK-NEXT: vldeb %v2, %v2
; CHECK-NEXT: vfchdb %v1, %v2, %v1
; CHECK-NEXT: vpkg %v0, %v1, %v0
; CHECK-NEXT: vuphf %v0, %v0
; CHECK-NEXT: vfchdb %v1, %v28, %v30
; CHECK-NEXT: vo %v0, %v0, %v1
; CHECK-NEXT: vsel %v24, %v25, %v27, %v0
; CHECK-NEXT: br %r14
;
; CHECK-Z14-LABEL: fun26:
; CHECK-Z14: # %bb.0:
; CHECK-Z14-NEXT: vfchsb %v0, %v24, %v26
; CHECK-Z14-NEXT: vuphf %v0, %v0
; CHECK-Z14-NEXT: vfchdb %v1, %v28, %v30
; CHECK-Z14-NEXT: vo %v0, %v0, %v1
; CHECK-Z14-NEXT: vsel %v24, %v25, %v27, %v0
; CHECK-Z14-NEXT: br %r14
  %cmp0 = fcmp ogt <2 x float> %val1, %val2
  %cmp1 = fcmp ogt <2 x double> %val3, %val4
  %or = or <2 x i1> %cmp0, %cmp1
  %sel = select <2 x i1> %or, <2 x double> %val5, <2 x double> %val6
  ret <2 x double> %sel
}
|
|
|
|
; Also check a widening select of a vector of floats
|
|
; fun27: the OR of two <2 x i8> equality compares selects between <2 x float>
; values. The z13 expectations show the byte mask being widened twice (vuphb,
; vuphh) after the vo.
define <2 x float> @fun27(<2 x i8> %val1, <2 x i8> %val2, <2 x i8> %val3, <2 x i8> %val4, <2 x float> %val5, <2 x float> %val6) {
; CHECK-LABEL: fun27:
; CHECK: # %bb.0:
; CHECK-DAG: vceqb [[REG0:%v[0-9]+]], %v24, %v26
; CHECK-DAG: vceqb [[REG1:%v[0-9]+]], %v28, %v30
; CHECK-NEXT: vo %v0, [[REG0]], [[REG1]]
; CHECK-NEXT: vuphb %v0, %v0
; CHECK-NEXT: vuphh %v0, %v0
; CHECK-NEXT: vsel %v24, %v25, %v27, %v0
; CHECK-NEXT: br %r14
  %cmp0 = icmp eq <2 x i8> %val1, %val2
  %cmp1 = icmp eq <2 x i8> %val3, %val4
  %or = or <2 x i1> %cmp0, %cmp1
  %sel = select <2 x i1> %or, <2 x float> %val5, <2 x float> %val6
  ret <2 x float> %sel
}
|
|
|
|
; fun28: the XOR of two <4 x float> ogt compares selects between <4 x float>
; values. The z13 expectations show each float compare done as vldeb
; extensions plus vfchdb, with the results packed (vpkg); the z14 expectations
; use two vfchsb directly.
define <4 x float> @fun28(<4 x float> %val1, <4 x float> %val2, <4 x float> %val3, <4 x float> %val4, <4 x float> %val5, <4 x float> %val6) {
; CHECK-LABEL: fun28:
; CHECK: # %bb.0:
; CHECK-DAG: vmrlf [[REG0:%v[0-9]+]], %v26, %v26
; CHECK-DAG: vmrlf [[REG1:%v[0-9]+]], %v24, %v24
; CHECK-DAG: vldeb [[REG2:%v[0-9]+]], [[REG0]]
; CHECK-DAG: vldeb [[REG3:%v[0-9]+]], [[REG1]]
; CHECK-DAG: vfchdb [[REG4:%v[0-9]+]], [[REG3]], [[REG2]]
; CHECK-DAG: vmrhf [[REG5:%v[0-9]+]], %v26, %v26
; CHECK-DAG: vmrhf [[REG6:%v[0-9]+]], %v24, %v24
; CHECK-DAG: vldeb [[REG7:%v[0-9]+]], [[REG5]]
; CHECK-DAG: vmrhf [[REG8:%v[0-9]+]], %v28, %v28
; CHECK-DAG: vldeb [[REG9:%v[0-9]+]], [[REG6]]
; CHECK-DAG: vfchdb [[REG10:%v[0-9]+]], [[REG9]], [[REG7]]
; CHECK-DAG: vpkg [[REG11:%v[0-9]+]], [[REG10]], [[REG4]]
; CHECK-DAG: vmrlf [[REG12:%v[0-9]+]], %v30, %v30
; CHECK-DAG: vmrlf [[REG13:%v[0-9]+]], %v28, %v28
; CHECK-DAG: vldeb [[REG14:%v[0-9]+]], [[REG12]]
; CHECK-DAG: vldeb [[REG15:%v[0-9]+]], [[REG13]]
; CHECK-DAG: vfchdb [[REG16:%v[0-9]+]], [[REG15]], [[REG14]]
; CHECK-DAG: vmrhf [[REG17:%v[0-9]+]], %v30, %v30
; CHECK-DAG: vldeb [[REG19:%v[0-9]+]], [[REG17]]
; CHECK-DAG: vldeb [[REG20:%v[0-9]+]], [[REG8]]
; CHECK-NEXT: vfchdb %v2, [[REG20]], [[REG19]]
; CHECK-NEXT: vpkg [[REG21:%v[0-9]+]], %v2, [[REG16]]
; CHECK-NEXT: vx %v0, [[REG11]], [[REG21]]
; CHECK-NEXT: vsel %v24, %v25, %v27, %v0
; CHECK-NEXT: br %r14
;
; CHECK-Z14-LABEL: fun28:
; CHECK-Z14: # %bb.0:
; CHECK-Z14-NEXT: vfchsb %v0, %v24, %v26
; CHECK-Z14-NEXT: vfchsb %v1, %v28, %v30
; CHECK-Z14-NEXT: vx %v0, %v0, %v1
; CHECK-Z14-NEXT: vsel %v24, %v25, %v27, %v0
; CHECK-Z14-NEXT: br %r14
  %cmp0 = fcmp ogt <4 x float> %val1, %val2
  %cmp1 = fcmp ogt <4 x float> %val3, %val4
  %xor = xor <4 x i1> %cmp0, %cmp1
  %sel = select <4 x i1> %xor, <4 x float> %val5, <4 x float> %val6
  ret <4 x float> %sel
}
|
|
|
|
; fun29: the XOR of two <4 x float> ogt compares selects between <4 x double>
; values. In both the z13 and z14 expectations the combined word mask is split
; into two doubleword masks (vmrlg + vuphf, vuphf), one per vsel; z14 uses
; vfchsb for the float compares.
define <4 x double> @fun29(<4 x float> %val1, <4 x float> %val2, <4 x float> %val3, <4 x float> %val4, <4 x double> %val5, <4 x double> %val6) {
; CHECK-LABEL: fun29:
; CHECK: # %bb.0:
; CHECK-NEXT: vmrlf %v0, %v26, %v26
; CHECK-NEXT: vmrlf %v1, %v24, %v24
; CHECK-NEXT: vldeb %v0, %v0
; CHECK-NEXT: vldeb %v1, %v1
; CHECK-NEXT: vfchdb %v0, %v1, %v0
; CHECK-NEXT: vmrhf %v1, %v26, %v26
; CHECK-NEXT: vmrhf %v2, %v24, %v24
; CHECK-NEXT: vldeb %v1, %v1
; CHECK-NEXT: vmrhf %v3, %v28, %v28
; CHECK-NEXT: vldeb %v2, %v2
; CHECK-NEXT: vfchdb %v1, %v2, %v1
; CHECK-NEXT: vpkg %v0, %v1, %v0
; CHECK-NEXT: vmrlf %v1, %v30, %v30
; CHECK-NEXT: vmrlf %v2, %v28, %v28
; CHECK-NEXT: vldeb %v1, %v1
; CHECK-NEXT: vldeb %v2, %v2
; CHECK-NEXT: vfchdb %v1, %v2, %v1
; CHECK-NEXT: vmrhf %v2, %v30, %v30
; CHECK-NEXT: vldeb %v2, %v2
; CHECK-NEXT: vldeb %v3, %v3
; CHECK-NEXT: vfchdb %v2, %v3, %v2
; CHECK-NEXT: vpkg %v1, %v2, %v1
; CHECK-NEXT: vx %v0, %v0, %v1
; CHECK-NEXT: vmrlg %v1, %v0, %v0
; CHECK-NEXT: vuphf %v1, %v1
; CHECK-NEXT: vuphf %v0, %v0
; CHECK-NEXT: vsel %v24, %v25, %v29, %v0
; CHECK-NEXT: vsel %v26, %v27, %v31, %v1
; CHECK-NEXT: br %r14
;
; CHECK-Z14-LABEL: fun29:
; CHECK-Z14: # %bb.0:
; CHECK-Z14-NEXT: vfchsb %v0, %v24, %v26
; CHECK-Z14-NEXT: vfchsb %v1, %v28, %v30
; CHECK-Z14-NEXT: vx %v0, %v0, %v1
; CHECK-Z14-NEXT: vmrlg %v1, %v0, %v0
; CHECK-Z14-NEXT: vuphf %v1, %v1
; CHECK-Z14-NEXT: vuphf %v0, %v0
; CHECK-Z14-NEXT: vsel %v24, %v25, %v29, %v0
; CHECK-Z14-NEXT: vsel %v26, %v27, %v31, %v1
; CHECK-Z14-NEXT: br %r14
  %cmp0 = fcmp ogt <4 x float> %val1, %val2
  %cmp1 = fcmp ogt <4 x float> %val3, %val4
  %xor = xor <4 x i1> %cmp0, %cmp1
  %sel = select <4 x i1> %xor, <4 x double> %val5, <4 x double> %val6
  ret <4 x double> %sel
}
|
|
|
|
; fun30: the AND of an <8 x float> ogt compare and an <8 x double> ogt compare
; selects between <8 x float> values. In both the z13 and z14 expectations the
; double-compare results are packed (vpkg) before the vn; z14 uses vfchsb for
; the float compares instead of the vldeb/vfchdb sequences.
define <8 x float> @fun30(<8 x float> %val1, <8 x float> %val2, <8 x double> %val3, <8 x double> %val4, <8 x float> %val5, <8 x float> %val6) {
; CHECK-LABEL: fun30:
; CHECK: # %bb.0:
; CHECK-NEXT: vmrlf %v16, %v28, %v28
; CHECK-NEXT: vmrlf %v17, %v24, %v24
; CHECK-NEXT: vldeb %v16, %v16
; CHECK-NEXT: vldeb %v17, %v17
; CHECK-NEXT: vfchdb %v16, %v17, %v16
; CHECK-NEXT: vmrhf %v17, %v28, %v28
; CHECK-NEXT: vmrhf %v18, %v24, %v24
; CHECK-NEXT: vldeb %v17, %v17
; CHECK-NEXT: vl %v4, 192(%r15)
; CHECK-NEXT: vldeb %v18, %v18
; CHECK-NEXT: vl %v5, 208(%r15)
; CHECK-NEXT: vl %v6, 160(%r15)
; CHECK-NEXT: vl %v7, 176(%r15)
; CHECK-NEXT: vl %v0, 272(%r15)
; CHECK-NEXT: vl %v1, 240(%r15)
; CHECK-NEXT: vfchdb %v17, %v18, %v17
; CHECK-NEXT: vl %v2, 256(%r15)
; CHECK-NEXT: vl %v3, 224(%r15)
; CHECK-NEXT: vpkg %v16, %v17, %v16
; CHECK-NEXT: vmrlf %v17, %v30, %v30
; CHECK-NEXT: vmrlf %v18, %v26, %v26
; CHECK-NEXT: vmrhf %v19, %v26, %v26
; CHECK-NEXT: vfchdb %v7, %v27, %v7
; CHECK-NEXT: vfchdb %v6, %v25, %v6
; CHECK-NEXT: vfchdb %v5, %v31, %v5
; CHECK-NEXT: vfchdb %v4, %v29, %v4
; CHECK-NEXT: vpkg %v6, %v6, %v7
; CHECK-NEXT: vpkg %v4, %v4, %v5
; CHECK-NEXT: vn %v5, %v16, %v6
; CHECK-DAG: vsel %v24, %v3, %v2, %v5
; CHECK-DAG: vldeb %v17, %v17
; CHECK-NEXT: vldeb %v18, %v18
; CHECK-NEXT: vfchdb %v17, %v18, %v17
; CHECK-NEXT: vmrhf %v18, %v30, %v30
; CHECK-NEXT: vldeb %v18, %v18
; CHECK-NEXT: vldeb %v19, %v19
; CHECK-NEXT: vfchdb %v18, %v19, %v18
; CHECK-NEXT: vpkg %v17, %v18, %v17
; CHECK-NEXT: vn %v4, %v17, %v4
; CHECK-NEXT: vsel %v26, %v1, %v0, %v4
; CHECK-NEXT: br %r14
;
; CHECK-Z14-LABEL: fun30:
; CHECK-Z14: # %bb.0:
; CHECK-Z14-NEXT: vl %v4, 192(%r15)
; CHECK-Z14-NEXT: vl %v5, 208(%r15)
; CHECK-Z14-NEXT: vl %v6, 160(%r15)
; CHECK-Z14-NEXT: vl %v7, 176(%r15)
; CHECK-Z14-NEXT: vfchdb %v7, %v27, %v7
; CHECK-Z14-NEXT: vfchdb %v6, %v25, %v6
; CHECK-Z14-NEXT: vfchdb %v5, %v31, %v5
; CHECK-Z14-NEXT: vfchdb %v4, %v29, %v4
; CHECK-Z14-DAG: vfchsb %v16, %v24, %v28
; CHECK-Z14-DAG: vfchsb %v17, %v26, %v30
; CHECK-Z14-DAG: vpkg %v6, %v6, %v7
; CHECK-Z14-DAG: vpkg %v4, %v4, %v5
; CHECK-Z14-DAG: vl %v0, 272(%r15)
; CHECK-Z14-DAG: vl %v1, 240(%r15)
; CHECK-Z14-DAG: vl %v2, 256(%r15)
; CHECK-Z14-DAG: vl %v3, 224(%r15)
; CHECK-Z14-NEXT: vn %v4, %v17, %v4
; CHECK-Z14-NEXT: vn %v5, %v16, %v6
; CHECK-Z14-NEXT: vsel %v24, %v3, %v2, %v5
; CHECK-Z14-NEXT: vsel %v26, %v1, %v0, %v4
; CHECK-Z14-NEXT: br %r14
  %cmp0 = fcmp ogt <8 x float> %val1, %val2
  %cmp1 = fcmp ogt <8 x double> %val3, %val4
  %and = and <8 x i1> %cmp0, %cmp1
  %sel = select <8 x i1> %and, <8 x float> %val5, <8 x float> %val6
  ret <8 x float> %sel
}
|
|
|
|
; fun31: the XOR of two <2 x double> ogt compares selects between <2 x float>
; values. The z13 expectations show the combined doubleword mask being packed
; once (vpkg) after the vx.
define <2 x float> @fun31(<2 x double> %val1, <2 x double> %val2, <2 x double> %val3, <2 x double> %val4, <2 x float> %val5, <2 x float> %val6) {
; CHECK-LABEL: fun31:
; CHECK: # %bb.0:
; CHECK-DAG: vfchdb [[REG0:%v[0-9]+]], %v24, %v26
; CHECK-DAG: vfchdb [[REG1:%v[0-9]+]], %v28, %v30
; CHECK-NEXT: vx %v0, [[REG0]], [[REG1]]
; CHECK-NEXT: vpkg %v0, %v0, %v0
; CHECK-NEXT: vsel %v24, %v25, %v27, %v0
; CHECK-NEXT: br %r14
  %cmp0 = fcmp ogt <2 x double> %val1, %val2
  %cmp1 = fcmp ogt <2 x double> %val3, %val4
  %xor = xor <2 x i1> %cmp0, %cmp1
  %sel = select <2 x i1> %xor, <2 x float> %val5, <2 x float> %val6
  ret <2 x float> %sel
}
|
|
|
|
; fun32: select between two <2 x double> values using the XOR of two
; <2 x double> ordered-greater-than compares.
; Compare and select element types match here, so the z13 expectations go
; straight from vx to vsel with no pack/unpack in between. The two vfchdb
; compares may appear in either order. No z14-specific expectations are given.
define <2 x double> @fun32(<2 x double> %val1, <2 x double> %val2, <2 x double> %val3, <2 x double> %val4, <2 x double> %val5, <2 x double> %val6) {
; CHECK-LABEL: fun32:
; CHECK: # %bb.0:
; CHECK-DAG: vfchdb [[REG0:%v[0-9]+]], %v24, %v26
; CHECK-DAG: vfchdb [[REG1:%v[0-9]+]], %v28, %v30
; CHECK-NEXT: vx %v0, [[REG0]], [[REG1]]
; CHECK-NEXT: vsel %v24, %v25, %v27, %v0
; CHECK-NEXT: br %r14
  %cmp0 = fcmp ogt <2 x double> %val1, %val2
  %cmp1 = fcmp ogt <2 x double> %val3, %val4
  ; The mask is an exclusive-or of the two compares; name it accordingly.
  %xor = xor <2 x i1> %cmp0, %cmp1
  %sel = select <2 x i1> %xor, <2 x double> %val5, <2 x double> %val6
  ret <2 x double> %sel
}
|
|
|
|
; fun33: select between two <4 x float> values using the AND of a
; <4 x double> compare and a <4 x float> compare (both ordered-greater-than).
; z13 expectations: the float operands are split with vmrlf/vmrhf, widened
; with vldeb and compared with vfchdb, then packed with vpkg before the vn.
; z14 expectations: the float compare is a single vfchsb, so only the double
; compare results need the vpkg.
define <4 x float> @fun33(<4 x double> %val1, <4 x double> %val2, <4 x float> %val3, <4 x float> %val4, <4 x float> %val5, <4 x float> %val6) {
; CHECK-LABEL: fun33:
; CHECK: # %bb.0:
; CHECK-NEXT: vfchdb %v0, %v26, %v30
; CHECK-NEXT: vfchdb %v1, %v24, %v28
; CHECK-NEXT: vpkg %v0, %v1, %v0
; CHECK-NEXT: vmrlf %v1, %v27, %v27
; CHECK-NEXT: vmrlf %v2, %v25, %v25
; CHECK-NEXT: vldeb %v1, %v1
; CHECK-NEXT: vldeb %v2, %v2
; CHECK-NEXT: vfchdb %v1, %v2, %v1
; CHECK-NEXT: vmrhf %v2, %v27, %v27
; CHECK-NEXT: vmrhf %v3, %v25, %v25
; CHECK-NEXT: vldeb %v2, %v2
; CHECK-NEXT: vldeb %v3, %v3
; CHECK-NEXT: vfchdb %v2, %v3, %v2
; CHECK-NEXT: vpkg %v1, %v2, %v1
; CHECK-NEXT: vn %v0, %v0, %v1
; CHECK-NEXT: vsel %v24, %v29, %v31, %v0
; CHECK-NEXT: br %r14
;
; CHECK-Z14-LABEL: fun33:
; CHECK-Z14: # %bb.0:
; CHECK-Z14-NEXT: vfchdb %v0, %v26, %v30
; CHECK-Z14-NEXT: vfchdb %v1, %v24, %v28
; CHECK-Z14-NEXT: vpkg %v0, %v1, %v0
; CHECK-Z14-NEXT: vfchsb %v1, %v25, %v27
; CHECK-Z14-NEXT: vn %v0, %v0, %v1
; CHECK-Z14-NEXT: vsel %v24, %v29, %v31, %v0
; CHECK-Z14-NEXT: br %r14
  ; Per-element compare results for the double and the float operand pairs.
  %gt.f64 = fcmp ogt <4 x double> %val1, %val2
  %gt.f32 = fcmp ogt <4 x float> %val3, %val4
  ; Both compares must hold for an element to take %val5.
  %mask = and <4 x i1> %gt.f64, %gt.f32
  %res = select <4 x i1> %mask, <4 x float> %val5, <4 x float> %val6
  ret <4 x float> %res
}
|
|
|
|
; fun34: select between two <4 x double> values using the AND of a
; <4 x double> compare and a <4 x float> compare (both ordered-greater-than).
; In both sets of expectations the float-compare mask is expanded with
; vuphf / vmrlg to line up with the two halves of the double compare, and the
; false operands of the two vsel instructions come from vl loads at
; 160(%r15) and 176(%r15).
; z13 builds the float compare from vmrlf/vmrhf + vldeb + vfchdb + vpkg, while
; z14 uses a single vfchsb.
define <4 x double> @fun34(<4 x double> %val1, <4 x double> %val2, <4 x float> %val3, <4 x float> %val4, <4 x double> %val5, <4 x double> %val6) {
; CHECK-LABEL: fun34:
; CHECK: # %bb.0:
; CHECK-NEXT: vmrlf [[REG0:%v[0-9]+]], %v27, %v27
; CHECK-NEXT: vmrlf [[REG1:%v[0-9]+]], %v25, %v25
; CHECK-NEXT: vldeb [[REG2:%v[0-9]+]], [[REG0]]
; CHECK-NEXT: vldeb [[REG3:%v[0-9]+]], [[REG1]]
; CHECK-NEXT: vfchdb [[REG4:%v[0-9]+]], [[REG3]], [[REG2]]
; CHECK-NEXT: vmrhf [[REG5:%v[0-9]+]], %v27, %v27
; CHECK-NEXT: vmrhf [[REG6:%v[0-9]+]], %v25, %v25
; CHECK-DAG: vldeb [[REG7:%v[0-9]+]], [[REG5]]
; CHECK-DAG: vl [[REG8:%v[0-9]+]], 176(%r15)
; CHECK-DAG: vldeb [[REG9:%v[0-9]+]], [[REG6]]
; CHECK-DAG: vl [[REG10:%v[0-9]+]], 160(%r15)
; CHECK-DAG: vfchdb [[REG11:%v[0-9]+]], [[REG9]], [[REG7]]
; CHECK-DAG: vpkg [[REG12:%v[0-9]+]], [[REG11]], [[REG4]]
; CHECK-DAG: vuphf [[REG13:%v[0-9]+]], [[REG12]]
; CHECK-DAG: vmrlg [[REG14:%v[0-9]+]], [[REG12]], [[REG12]]
; CHECK-NEXT: vfchdb [[REG15:%v[0-9]+]], %v24, %v28
; CHECK-NEXT: vfchdb [[REG16:%v[0-9]+]], %v26, %v30
; CHECK-NEXT: vuphf [[REG17:%v[0-9]+]], [[REG14]]
; CHECK-NEXT: vn [[REG18:%v[0-9]+]], [[REG16]], [[REG17]]
; CHECK-NEXT: vn [[REG19:%v[0-9]+]], [[REG15]], [[REG13]]
; CHECK-NEXT: vsel %v24, %v29, [[REG10]], [[REG19]]
; CHECK-NEXT: vsel %v26, %v31, [[REG8]], [[REG18]]
; CHECK-NEXT: br %r14
;
; CHECK-Z14-LABEL: fun34:
; CHECK-Z14: # %bb.0:
; CHECK-Z14-NEXT: vfchsb %v4, %v25, %v27
; CHECK-Z14-NEXT: vuphf %v5, %v4
; CHECK-Z14-NEXT: vmrlg %v4, %v4, %v4
; CHECK-Z14-DAG: vfchdb %v2, %v24, %v28
; CHECK-Z14-DAG: vfchdb %v3, %v26, %v30
; CHECK-Z14-DAG: vuphf %v4, %v4
; CHECK-Z14-DAG: vl %v0, 176(%r15)
; CHECK-Z14-DAG: vl %v1, 160(%r15)
; CHECK-Z14-NEXT: vn %v3, %v3, %v4
; CHECK-Z14-NEXT: vn %v2, %v2, %v5
; CHECK-Z14-NEXT: vsel %v24, %v29, %v1, %v2
; CHECK-Z14-NEXT: vsel %v26, %v31, %v0, %v3
; CHECK-Z14-NEXT: br %r14
  ; Per-element compare results for the double and the float operand pairs.
  %gt.f64 = fcmp ogt <4 x double> %val1, %val2
  %gt.f32 = fcmp ogt <4 x float> %val3, %val4
  ; Both compares must hold for an element to take %val5.
  %mask = and <4 x i1> %gt.f64, %gt.f32
  %res = select <4 x i1> %mask, <4 x double> %val5, <4 x double> %val6
  ret <4 x double> %res
}
|