mirror of
https://github.com/RPCS3/llvm-mirror.git
synced 2025-01-31 20:51:52 +01:00
e5babc6bd2
Summary: This patch adds AArch64ISD nodes for [S|U]MIN_PRED and [S|U]MAX_PRED, and lowers both SVE intrinsics and IR operations for min and max to these nodes. There are two forms of these instructions for SVE: a predicated form and an immediate (unpredicated) form. The patterns which existed for the latter have been updated to match a predicated node with an immediate and map this to the immediate instruction. Reviewers: sdesmalen, efriedma, dancgr, rengolin Reviewed By: efriedma Subscribers: huihuiz, tschuett, kristof.beyls, hiraditya, rkruppe, psnobl, cfe-commits, llvm-commits Tags: #llvm Differential Revision: https://reviews.llvm.org/D79087
222 lines
7.1 KiB
LLVM
222 lines
7.1 KiB
LLVM
; RUN: llc -mtriple=aarch64-linux-gnu -mattr=+sve < %s | FileCheck %s
|
|
|
|
;
|
|
; SDIV
|
|
;
|
|
|
|
define <vscale x 4 x i32> @sdiv_i32(<vscale x 4 x i32> %a, <vscale x 4 x i32> %b) {
|
|
; CHECK-LABEL: @sdiv_i32
|
|
; CHECK-DAG: ptrue p0.s
|
|
; CHECK-DAG: sdiv z0.s, p0/m, z0.s, z1.s
|
|
; CHECK-NEXT: ret
|
|
%div = sdiv <vscale x 4 x i32> %a, %b
|
|
ret <vscale x 4 x i32> %div
|
|
}
|
|
|
|
define <vscale x 2 x i64> @sdiv_i64(<vscale x 2 x i64> %a, <vscale x 2 x i64> %b) {
|
|
; CHECK-LABEL: @sdiv_i64
|
|
; CHECK-DAG: ptrue p0.d
|
|
; CHECK-DAG: sdiv z0.d, p0/m, z0.d, z1.d
|
|
; CHECK-NEXT: ret
|
|
%div = sdiv <vscale x 2 x i64> %a, %b
|
|
ret <vscale x 2 x i64> %div
|
|
}
|
|
|
|
;
|
|
; UDIV
|
|
;
|
|
|
|
define <vscale x 4 x i32> @udiv_i32(<vscale x 4 x i32> %a, <vscale x 4 x i32> %b) {
|
|
; CHECK-LABEL: @udiv_i32
|
|
; CHECK-DAG: ptrue p0.s
|
|
; CHECK-DAG: udiv z0.s, p0/m, z0.s, z1.s
|
|
; CHECK-NEXT: ret
|
|
%div = udiv <vscale x 4 x i32> %a, %b
|
|
ret <vscale x 4 x i32> %div
|
|
}
|
|
|
|
define <vscale x 2 x i64> @udiv_i64(<vscale x 2 x i64> %a, <vscale x 2 x i64> %b) {
|
|
; CHECK-LABEL: @udiv_i64
|
|
; CHECK-DAG: ptrue p0.d
|
|
; CHECK-DAG: udiv z0.d, p0/m, z0.d, z1.d
|
|
; CHECK-NEXT: ret
|
|
%div = udiv <vscale x 2 x i64> %a, %b
|
|
ret <vscale x 2 x i64> %div
|
|
}
|
|
|
|
;
|
|
; SMIN
|
|
;
|
|
|
|
define <vscale x 16 x i8> @smin_i8(<vscale x 16 x i8> %a, <vscale x 16 x i8> %b, <vscale x 16 x i8> %c) {
|
|
; CHECK-LABEL: @smin_i8
|
|
; CHECK-DAG: ptrue p0.b
|
|
; CHECK-DAG: smin z0.b, p0/m, z0.b, z1.b
|
|
; CHECK-NEXT: ret
|
|
%cmp = icmp slt <vscale x 16 x i8> %a, %b
|
|
%min = select <vscale x 16 x i1> %cmp, <vscale x 16 x i8> %a, <vscale x 16 x i8> %b
|
|
ret <vscale x 16 x i8> %min
|
|
}
|
|
|
|
define <vscale x 8 x i16> @smin_i16(<vscale x 8 x i16> %a, <vscale x 8 x i16> %b, <vscale x 8 x i16> %c) {
|
|
; CHECK-LABEL: @smin_i16
|
|
; CHECK-DAG: ptrue p0.h
|
|
; CHECK-DAG: smin z0.h, p0/m, z0.h, z1.h
|
|
; CHECK-NEXT: ret
|
|
%cmp = icmp slt <vscale x 8 x i16> %a, %b
|
|
%min = select <vscale x 8 x i1> %cmp, <vscale x 8 x i16> %a, <vscale x 8 x i16> %b
|
|
ret <vscale x 8 x i16> %min
|
|
}
|
|
|
|
define <vscale x 4 x i32> @smin_i32(<vscale x 4 x i32> %a, <vscale x 4 x i32> %b, <vscale x 4 x i32> %c) {
|
|
; CHECK-LABEL: smin_i32:
|
|
; CHECK-DAG: ptrue p0.s
|
|
; CHECK-DAG: smin z0.s, p0/m, z0.s, z1.s
|
|
; CHECK-NEXT: ret
|
|
%cmp = icmp slt <vscale x 4 x i32> %a, %b
|
|
%min = select <vscale x 4 x i1> %cmp, <vscale x 4 x i32> %a, <vscale x 4 x i32> %b
|
|
ret <vscale x 4 x i32> %min
|
|
}
|
|
|
|
define <vscale x 2 x i64> @smin_i64(<vscale x 2 x i64> %a, <vscale x 2 x i64> %b, <vscale x 2 x i64> %c) {
|
|
; CHECK-LABEL: smin_i64:
|
|
; CHECK-DAG: ptrue p0.d
|
|
; CHECK-DAG: smin z0.d, p0/m, z0.d, z1.d
|
|
; CHECK-NEXT: ret
|
|
%cmp = icmp slt <vscale x 2 x i64> %a, %b
|
|
%min = select <vscale x 2 x i1> %cmp, <vscale x 2 x i64> %a, <vscale x 2 x i64> %b
|
|
ret <vscale x 2 x i64> %min
|
|
}
|
|
|
|
;
|
|
; UMIN
|
|
;
|
|
|
|
define <vscale x 16 x i8> @umin_i8(<vscale x 16 x i8> %a, <vscale x 16 x i8> %b, <vscale x 16 x i8> %c) {
|
|
; CHECK-LABEL: @umin_i8
|
|
; CHECK-DAG: ptrue p0.b
|
|
; CHECK-DAG: umin z0.b, p0/m, z0.b, z1.b
|
|
; CHECK-NEXT: ret
|
|
%cmp = icmp ult <vscale x 16 x i8> %a, %b
|
|
%min = select <vscale x 16 x i1> %cmp, <vscale x 16 x i8> %a, <vscale x 16 x i8> %b
|
|
ret <vscale x 16 x i8> %min
|
|
}
|
|
|
|
define <vscale x 8 x i16> @umin_i16(<vscale x 8 x i16> %a, <vscale x 8 x i16> %b, <vscale x 8 x i16> %c) {
|
|
; CHECK-LABEL: @umin_i16
|
|
; CHECK-DAG: ptrue p0.h
|
|
; CHECK-DAG: umin z0.h, p0/m, z0.h, z1.h
|
|
; CHECK-NEXT: ret
|
|
%cmp = icmp ult <vscale x 8 x i16> %a, %b
|
|
%min = select <vscale x 8 x i1> %cmp, <vscale x 8 x i16> %a, <vscale x 8 x i16> %b
|
|
ret <vscale x 8 x i16> %min
|
|
}
|
|
|
|
define <vscale x 4 x i32> @umin_i32(<vscale x 4 x i32> %a, <vscale x 4 x i32> %b, <vscale x 4 x i32> %c) {
|
|
; CHECK-LABEL: umin_i32:
|
|
; CHECK-DAG: ptrue p0.s
|
|
; CHECK-DAG: umin z0.s, p0/m, z0.s, z1.s
|
|
; CHECK-NEXT: ret
|
|
%cmp = icmp ult <vscale x 4 x i32> %a, %b
|
|
%min = select <vscale x 4 x i1> %cmp, <vscale x 4 x i32> %a, <vscale x 4 x i32> %b
|
|
ret <vscale x 4 x i32> %min
|
|
}
|
|
|
|
define <vscale x 2 x i64> @umin_i64(<vscale x 2 x i64> %a, <vscale x 2 x i64> %b, <vscale x 2 x i64> %c) {
|
|
; CHECK-LABEL: umin_i64:
|
|
; CHECK-DAG: ptrue p0.d
|
|
; CHECK-DAG: umin z0.d, p0/m, z0.d, z1.d
|
|
; CHECK-NEXT: ret
|
|
%cmp = icmp ult <vscale x 2 x i64> %a, %b
|
|
%min = select <vscale x 2 x i1> %cmp, <vscale x 2 x i64> %a, <vscale x 2 x i64> %b
|
|
ret <vscale x 2 x i64> %min
|
|
}
|
|
|
|
;
|
|
; SMAX
|
|
;
|
|
|
|
define <vscale x 16 x i8> @smax_i8(<vscale x 16 x i8> %a, <vscale x 16 x i8> %b, <vscale x 16 x i8> %c) {
|
|
; CHECK-LABEL: @smax_i8
|
|
; CHECK-DAG: ptrue p0.b
|
|
; CHECK-DAG: smax z0.b, p0/m, z0.b, z1.b
|
|
; CHECK-NEXT: ret
|
|
%cmp = icmp sgt <vscale x 16 x i8> %a, %b
|
|
%min = select <vscale x 16 x i1> %cmp, <vscale x 16 x i8> %a, <vscale x 16 x i8> %b
|
|
ret <vscale x 16 x i8> %min
|
|
}
|
|
|
|
define <vscale x 8 x i16> @smax_i16(<vscale x 8 x i16> %a, <vscale x 8 x i16> %b, <vscale x 8 x i16> %c) {
|
|
; CHECK-LABEL: @smax_i16
|
|
; CHECK-DAG: ptrue p0.h
|
|
; CHECK-DAG: smax z0.h, p0/m, z0.h, z1.h
|
|
; CHECK-NEXT: ret
|
|
%cmp = icmp sgt <vscale x 8 x i16> %a, %b
|
|
%min = select <vscale x 8 x i1> %cmp, <vscale x 8 x i16> %a, <vscale x 8 x i16> %b
|
|
ret <vscale x 8 x i16> %min
|
|
}
|
|
|
|
define <vscale x 4 x i32> @smax_i32(<vscale x 4 x i32> %a, <vscale x 4 x i32> %b, <vscale x 4 x i32> %c) {
|
|
; CHECK-LABEL: smax_i32:
|
|
; CHECK-DAG: ptrue p0.s
|
|
; CHECK-DAG: smax z0.s, p0/m, z0.s, z1.s
|
|
; CHECK-NEXT: ret
|
|
%cmp = icmp sgt <vscale x 4 x i32> %a, %b
|
|
%min = select <vscale x 4 x i1> %cmp, <vscale x 4 x i32> %a, <vscale x 4 x i32> %b
|
|
ret <vscale x 4 x i32> %min
|
|
}
|
|
|
|
define <vscale x 2 x i64> @smax_i64(<vscale x 2 x i64> %a, <vscale x 2 x i64> %b, <vscale x 2 x i64> %c) {
|
|
; CHECK-LABEL: smax_i64:
|
|
; CHECK-DAG: ptrue p0.d
|
|
; CHECK-DAG: smax z0.d, p0/m, z0.d, z1.d
|
|
; CHECK-NEXT: ret
|
|
%cmp = icmp sgt <vscale x 2 x i64> %a, %b
|
|
%min = select <vscale x 2 x i1> %cmp, <vscale x 2 x i64> %a, <vscale x 2 x i64> %b
|
|
ret <vscale x 2 x i64> %min
|
|
}
|
|
|
|
;
|
|
; UMAX
|
|
;
|
|
|
|
define <vscale x 16 x i8> @umax_i8(<vscale x 16 x i8> %a, <vscale x 16 x i8> %b, <vscale x 16 x i8> %c) {
|
|
; CHECK-LABEL: @umax_i8
|
|
; CHECK-DAG: ptrue p0.b
|
|
; CHECK-DAG: umax z0.b, p0/m, z0.b, z1.b
|
|
; CHECK-NEXT: ret
|
|
%cmp = icmp ugt <vscale x 16 x i8> %a, %b
|
|
%min = select <vscale x 16 x i1> %cmp, <vscale x 16 x i8> %a, <vscale x 16 x i8> %b
|
|
ret <vscale x 16 x i8> %min
|
|
}
|
|
|
|
define <vscale x 8 x i16> @umax_i16(<vscale x 8 x i16> %a, <vscale x 8 x i16> %b, <vscale x 8 x i16> %c) {
|
|
; CHECK-LABEL: @umax_i16
|
|
; CHECK-DAG: ptrue p0.h
|
|
; CHECK-DAG: umax z0.h, p0/m, z0.h, z1.h
|
|
; CHECK-NEXT: ret
|
|
%cmp = icmp ugt <vscale x 8 x i16> %a, %b
|
|
%min = select <vscale x 8 x i1> %cmp, <vscale x 8 x i16> %a, <vscale x 8 x i16> %b
|
|
ret <vscale x 8 x i16> %min
|
|
}
|
|
|
|
define <vscale x 4 x i32> @umax_i32(<vscale x 4 x i32> %a, <vscale x 4 x i32> %b, <vscale x 4 x i32> %c) {
|
|
; CHECK-LABEL: umax_i32:
|
|
; CHECK-DAG: ptrue p0.s
|
|
; CHECK-DAG: umax z0.s, p0/m, z0.s, z1.s
|
|
; CHECK-NEXT: ret
|
|
%cmp = icmp ugt <vscale x 4 x i32> %a, %b
|
|
%min = select <vscale x 4 x i1> %cmp, <vscale x 4 x i32> %a, <vscale x 4 x i32> %b
|
|
ret <vscale x 4 x i32> %min
|
|
}
|
|
|
|
define <vscale x 2 x i64> @umax_i64(<vscale x 2 x i64> %a, <vscale x 2 x i64> %b, <vscale x 2 x i64> %c) {
|
|
; CHECK-LABEL: umax_i64:
|
|
; CHECK-DAG: ptrue p0.d
|
|
; CHECK-DAG: umax z0.d, p0/m, z0.d, z1.d
|
|
; CHECK-NEXT: ret
|
|
%cmp = icmp ugt <vscale x 2 x i64> %a, %b
|
|
%min = select <vscale x 2 x i1> %cmp, <vscale x 2 x i64> %a, <vscale x 2 x i64> %b
|
|
ret <vscale x 2 x i64> %min
|
|
}
|