mirror of
https://github.com/RPCS3/llvm-mirror.git
synced 2024-11-25 20:23:11 +01:00
90d0031df7
On SystemZ, a ZERO_EXTEND of an i1 vector handled by WidenVecRes_Convert() always ended up being scalarized, because the type action of the input is promotion which was previously an unhandled case in this method. This fixes https://bugs.llvm.org/show_bug.cgi?id=47132. Differential Revision: https://reviews.llvm.org/D86268 Patch by Eli Friedman. Review: Ulrich Weigand
111 lines
2.8 KiB
LLVM
111 lines
2.8 KiB
LLVM
; Test that vector zexts are done efficently also in case of fewer elements
|
|
; than allowed, e.g. <2 x i32>.
|
|
;
|
|
; RUN: llc < %s -mtriple=s390x-linux-gnu -mcpu=z13 | FileCheck %s
|
|
|
|
|
|
define <2 x i16> @fun1(<2 x i8> %val1) {
|
|
; CHECK-LABEL: fun1:
|
|
; CHECK: vuplhb %v24, %v24
|
|
; CHECK-NEXT: br %r14
|
|
%z = zext <2 x i8> %val1 to <2 x i16>
|
|
ret <2 x i16> %z
|
|
}
|
|
|
|
define <2 x i32> @fun2(<2 x i8> %val1) {
|
|
; CHECK-LABEL: fun2:
|
|
; CHECK: larl %r1, .LCPI1_0
|
|
; CHECK-NEXT: vl %v0, 0(%r1), 3
|
|
; CHECK-NEXT: vperm %v24, %v0, %v24, %v0
|
|
; CHECK-NEXT: br %r14
|
|
%z = zext <2 x i8> %val1 to <2 x i32>
|
|
ret <2 x i32> %z
|
|
}
|
|
|
|
define <2 x i64> @fun3(<2 x i8> %val1) {
|
|
; CHECK-LABEL: fun3:
|
|
; CHECK: larl %r1, .LCPI2_0
|
|
; CHECK-NEXT: vl %v0, 0(%r1), 3
|
|
; CHECK-NEXT: vperm %v24, %v0, %v24, %v0
|
|
; CHECK-NEXT: br %r14
|
|
%z = zext <2 x i8> %val1 to <2 x i64>
|
|
ret <2 x i64> %z
|
|
}
|
|
|
|
define <2 x i32> @fun4(<2 x i16> %val1) {
|
|
; CHECK-LABEL: fun4:
|
|
; CHECK: vuplhh %v24, %v24
|
|
; CHECK-NEXT: br %r14
|
|
%z = zext <2 x i16> %val1 to <2 x i32>
|
|
ret <2 x i32> %z
|
|
}
|
|
|
|
define <2 x i64> @fun5(<2 x i16> %val1) {
|
|
; CHECK-LABEL: fun5:
|
|
; CHECK: larl %r1, .LCPI4_0
|
|
; CHECK-NEXT: vl %v0, 0(%r1), 3
|
|
; CHECK-NEXT: vperm %v24, %v0, %v24, %v0
|
|
; CHECK-NEXT: br %r14
|
|
%z = zext <2 x i16> %val1 to <2 x i64>
|
|
ret <2 x i64> %z
|
|
}
|
|
|
|
define <2 x i64> @fun6(<2 x i32> %val1) {
|
|
; CHECK-LABEL: fun6:
|
|
; CHECK: vuplhf %v24, %v24
|
|
; CHECK-NEXT: br %r14
|
|
%z = zext <2 x i32> %val1 to <2 x i64>
|
|
ret <2 x i64> %z
|
|
}
|
|
|
|
define <4 x i16> @fun7(<4 x i8> %val1) {
|
|
; CHECK-LABEL: fun7:
|
|
; CHECK: vuplhb %v24, %v24
|
|
; CHECK-NEXT: br %r14
|
|
%z = zext <4 x i8> %val1 to <4 x i16>
|
|
ret <4 x i16> %z
|
|
}
|
|
|
|
define <4 x i32> @fun8(<4 x i8> %val1) {
|
|
; CHECK-LABEL: fun8:
|
|
; CHECK: larl %r1, .LCPI7_0
|
|
; CHECK-NEXT: vl %v0, 0(%r1), 3
|
|
; CHECK-NEXT: vperm %v24, %v0, %v24, %v0
|
|
; CHECK-NEXT: br %r14
|
|
%z = zext <4 x i8> %val1 to <4 x i32>
|
|
ret <4 x i32> %z
|
|
}
|
|
|
|
define <4 x i32> @fun9(<4 x i16> %val1) {
|
|
; CHECK-LABEL: fun9:
|
|
; CHECK: vuplhh %v24, %v24
|
|
; CHECK-NEXT: br %r14
|
|
%z = zext <4 x i16> %val1 to <4 x i32>
|
|
ret <4 x i32> %z
|
|
}
|
|
|
|
define <8 x i16> @fun10(<8 x i8> %val1) {
|
|
; CHECK-LABEL: fun10:
|
|
; CHECK: vuplhb %v24, %v24
|
|
; CHECK-NEXT: br %r14
|
|
%z = zext <8 x i8> %val1 to <8 x i16>
|
|
ret <8 x i16> %z
|
|
}
|
|
|
|
define <2 x i32> @fun11(<2 x i64> %Arg1, <2 x i64> %Arg2) {
|
|
; CHECK-LABEL: fun11:
|
|
; CHECK: vgbm %v0, 0
|
|
; CHECK-NEXT: vceqg %v1, %v24, %v0
|
|
; CHECK-NEXT: vceqg %v0, %v26, %v0
|
|
; CHECK-NEXT: vo %v0, %v1, %v0
|
|
; CHECK-NEXT: vrepig %v1, 1
|
|
; CHECK-NEXT: vn %v0, %v0, %v1
|
|
; CHECK-NEXT: vpkg %v24, %v0, %v0
|
|
; CHECK-NEXT: br %r14
|
|
%i3 = icmp eq <2 x i64> %Arg1, zeroinitializer
|
|
%i5 = icmp eq <2 x i64> %Arg2, zeroinitializer
|
|
%i6 = or <2 x i1> %i3, %i5
|
|
%i7 = zext <2 x i1> %i6 to <2 x i32>
|
|
ret <2 x i32> %i7
|
|
}
|