mirror of
https://github.com/RPCS3/llvm-mirror.git
synced 2024-11-22 18:54:02 +01:00
2b3fd0441a
This patch added generation of SIMD bitwise insert BIT/BIF instructions. In the absence of GCC-like functionality for optimal constraints satisfaction during register allocation the bitwise insert and select patterns are matched by pseudo bitwise select BSP instruction with not tied def. It is expanded later after register allocation with def tied to BSL/BIT/BIF depending on operands registers. This allows to get rid of redundant moves. Reviewers: t.p.northover, samparker, dmgreen Reviewed By: dmgreen Differential Revision: https://reviews.llvm.org/D74147
147 lines
4.3 KiB
LLVM
147 lines
4.3 KiB
LLVM
; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
|
|
; RUN: llc -mtriple=aarch64-unknown-linux-gnu < %s | FileCheck %s
|
|
|
|
; BIF Bitwise Insert if False
|
|
;
|
|
; 8-bit vectors tests
|
|
|
|
define <1 x i8> @test_bitf_v1i8(<1 x i8> %A, <1 x i8> %B, <1 x i8> %C) {
|
|
; CHECK-LABEL: test_bitf_v1i8:
|
|
; CHECK: // %bb.0:
|
|
; CHECK-NEXT: bif v0.8b, v1.8b, v2.8b
|
|
; CHECK-NEXT: ret
|
|
%neg = xor <1 x i8> %C, <i8 -1>
|
|
%and = and <1 x i8> %neg, %B
|
|
%and1 = and <1 x i8> %C, %A
|
|
%or = or <1 x i8> %and, %and1
|
|
ret <1 x i8> %or
|
|
}
|
|
|
|
; 16-bit vectors tests
|
|
|
|
define <1 x i16> @test_bitf_v1i16(<1 x i16> %A, <1 x i16> %B, <1 x i16> %C) {
|
|
; CHECK-LABEL: test_bitf_v1i16:
|
|
; CHECK: // %bb.0:
|
|
; CHECK-NEXT: bif v0.8b, v1.8b, v2.8b
|
|
; CHECK-NEXT: ret
|
|
%neg = xor <1 x i16> %C, <i16 -1>
|
|
%and = and <1 x i16> %neg, %B
|
|
%and1 = and <1 x i16> %C, %A
|
|
%or = or <1 x i16> %and, %and1
|
|
ret <1 x i16> %or
|
|
}
|
|
|
|
; 32-bit vectors tests
|
|
|
|
define <1 x i32> @test_bitf_v1i32(<1 x i32> %A, <1 x i32> %B, <1 x i32> %C) {
|
|
; CHECK-LABEL: test_bitf_v1i32:
|
|
; CHECK: // %bb.0:
|
|
; CHECK-NEXT: bif v0.8b, v1.8b, v2.8b
|
|
; CHECK-NEXT: ret
|
|
%neg = xor <1 x i32> %C, <i32 -1>
|
|
%and = and <1 x i32> %neg, %B
|
|
%and1 = and <1 x i32> %C, %A
|
|
%or = or <1 x i32> %and, %and1
|
|
ret <1 x i32> %or
|
|
}
|
|
|
|
; 64-bit vectors tests
|
|
|
|
define <1 x i64> @test_bitf_v1i64(<1 x i64> %A, <1 x i64> %B, <1 x i64> %C) {
|
|
; CHECK-LABEL: test_bitf_v1i64:
|
|
; CHECK: // %bb.0:
|
|
; CHECK-NEXT: bif v0.8b, v1.8b, v2.8b
|
|
; CHECK-NEXT: ret
|
|
%neg = xor <1 x i64> %C, <i64 -1>
|
|
%and = and <1 x i64> %neg, %B
|
|
%and1 = and <1 x i64> %C, %A
|
|
%or = or <1 x i64> %and, %and1
|
|
ret <1 x i64> %or
|
|
}
|
|
|
|
define <2 x i32> @test_bitf_v2i32(<2 x i32> %A, <2 x i32> %B, <2 x i32> %C) {
|
|
; CHECK-LABEL: test_bitf_v2i32:
|
|
; CHECK: // %bb.0:
|
|
; CHECK-NEXT: bif v0.8b, v1.8b, v2.8b
|
|
; CHECK-NEXT: ret
|
|
%neg = xor <2 x i32> %C, <i32 -1, i32 -1>
|
|
%and = and <2 x i32> %neg, %B
|
|
%and1 = and <2 x i32> %C, %A
|
|
%or = or <2 x i32> %and, %and1
|
|
ret <2 x i32> %or
|
|
}
|
|
|
|
define <4 x i16> @test_bitf_v4i16(<4 x i16> %A, <4 x i16> %B, <4 x i16> %C) {
|
|
; CHECK-LABEL: test_bitf_v4i16:
|
|
; CHECK: // %bb.0:
|
|
; CHECK-NEXT: bif v0.8b, v1.8b, v2.8b
|
|
; CHECK-NEXT: ret
|
|
%neg = xor <4 x i16> %C, <i16 -1, i16 -1, i16 -1, i16 -1>
|
|
%and = and <4 x i16> %neg, %B
|
|
%and1 = and <4 x i16> %C, %A
|
|
%or = or <4 x i16> %and, %and1
|
|
ret <4 x i16> %or
|
|
}
|
|
|
|
define <8 x i8> @test_bitf_v8i8(<8 x i8> %A, <8 x i8> %B, <8 x i8> %C) {
|
|
; CHECK-LABEL: test_bitf_v8i8:
|
|
; CHECK: // %bb.0:
|
|
; CHECK-NEXT: bif v0.8b, v1.8b, v2.8b
|
|
; CHECK-NEXT: ret
|
|
%neg = xor <8 x i8> %C, <i8 -1, i8 -1, i8 -1, i8 -1, i8 -1, i8 -1, i8 -1, i8 -1>
|
|
%and = and <8 x i8> %neg, %B
|
|
%and1 = and <8 x i8> %C, %A
|
|
%or = or <8 x i8> %and, %and1
|
|
ret <8 x i8> %or
|
|
}
|
|
|
|
; 128-bit vectors tests
|
|
|
|
define <2 x i64> @test_bitf_v2i64(<2 x i64> %A, <2 x i64> %B, <2 x i64> %C) {
|
|
; CHECK-LABEL: test_bitf_v2i64:
|
|
; CHECK: // %bb.0:
|
|
; CHECK-NEXT: bif v0.16b, v1.16b, v2.16b
|
|
; CHECK-NEXT: ret
|
|
%neg = xor <2 x i64> %C, <i64 -1, i64 -1>
|
|
%and = and <2 x i64> %neg, %B
|
|
%and1 = and <2 x i64> %C, %A
|
|
%or = or <2 x i64> %and, %and1
|
|
ret <2 x i64> %or
|
|
}
|
|
|
|
define <4 x i32> @test_bitf_v4i32(<4 x i32> %A, <4 x i32> %B, <4 x i32> %C) {
|
|
; CHECK-LABEL: test_bitf_v4i32:
|
|
; CHECK: // %bb.0:
|
|
; CHECK-NEXT: bif v0.16b, v1.16b, v2.16b
|
|
; CHECK-NEXT: ret
|
|
%neg = xor <4 x i32> %C, <i32 -1, i32 -1, i32 -1, i32 -1>
|
|
%and = and <4 x i32> %neg, %B
|
|
%and1 = and <4 x i32> %C, %A
|
|
%or = or <4 x i32> %and, %and1
|
|
ret <4 x i32> %or
|
|
}
|
|
|
|
define <8 x i16> @test_bitf_v8i16(<8 x i16> %A, <8 x i16> %B, <8 x i16> %C) {
|
|
; CHECK-LABEL: test_bitf_v8i16:
|
|
; CHECK: // %bb.0:
|
|
; CHECK-NEXT: bif v0.16b, v1.16b, v2.16b
|
|
; CHECK-NEXT: ret
|
|
%neg = xor <8 x i16> %C, <i16 -1, i16 -1, i16 -1, i16 -1, i16 -1, i16 -1, i16 -1, i16 -1>
|
|
%and = and <8 x i16> %neg, %B
|
|
%and1 = and <8 x i16> %C, %A
|
|
%or = or <8 x i16> %and, %and1
|
|
ret <8 x i16> %or
|
|
}
|
|
|
|
define <16 x i8> @test_bitf_v16i8(<16 x i8> %A, <16 x i8> %B, <16 x i8> %C) {
|
|
; CHECK-LABEL: test_bitf_v16i8:
|
|
; CHECK: // %bb.0:
|
|
; CHECK-NEXT: bif v0.16b, v1.16b, v2.16b
|
|
; CHECK-NEXT: ret
|
|
%neg = xor <16 x i8> %C, <i8 -1, i8 -1, i8 -1, i8 -1, i8 -1, i8 -1, i8 -1, i8 -1, i8 -1, i8 -1, i8 -1, i8 -1, i8 -1, i8 -1, i8 -1, i8 -1>
|
|
%and = and <16 x i8> %neg, %B
|
|
%and1 = and <16 x i8> %C, %A
|
|
%or = or <16 x i8> %and, %and1
|
|
ret <16 x i8> %or
|
|
}
|