mirror of
https://github.com/RPCS3/llvm-mirror.git
synced 2024-11-26 04:32:44 +01:00
bcefc6091f
Summary: This change implements ACLE CDE intrinsics that translate to instructions working with general-purpose registers. The specification is available at https://static.docs.arm.com/101028/0010/ACLE_2019Q4_release-0010.pdf Each ACLE intrinsic gets a corresponding LLVM IR intrinsic (because they have distinct function prototypes). Dual-register operands are represented as pairs of i32 values. Because of this the instruction selection for these intrinsics cannot be represented as TableGen patterns and requires custom C++ code. Reviewers: simon_tatham, MarkMurrayARM, dmgreen, ostannard Reviewed By: MarkMurrayARM Subscribers: kristof.beyls, hiraditya, danielkiss, cfe-commits Tags: #clang Differential Revision: https://reviews.llvm.org/D76296
190 lines
5.9 KiB
LLVM
190 lines
5.9 KiB
LLVM
; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
|
|
; RUN: llc -mtriple=thumbv8.1m.main -mattr=+cdecp0 -mattr=+cdecp1 -verify-machineinstrs -o - %s | FileCheck %s
|
|
; RUN: llc -mtriple=thumbebv8.1m.main -mattr=+cdecp0 -mattr=+cdecp1 -verify-machineinstrs -o - %s | FileCheck %s
|
|
|
|
declare i32 @llvm.arm.cde.cx1(i32 immarg, i32 immarg)
|
|
declare i32 @llvm.arm.cde.cx1a(i32 immarg, i32, i32 immarg)
|
|
declare { i32, i32 } @llvm.arm.cde.cx1d(i32 immarg, i32 immarg)
|
|
declare { i32, i32 } @llvm.arm.cde.cx1da(i32 immarg, i32, i32, i32 immarg)
|
|
|
|
declare i32 @llvm.arm.cde.cx2(i32 immarg, i32, i32 immarg)
|
|
declare i32 @llvm.arm.cde.cx2a(i32 immarg, i32, i32, i32 immarg)
|
|
declare { i32, i32 } @llvm.arm.cde.cx2d(i32 immarg, i32, i32 immarg)
|
|
declare { i32, i32 } @llvm.arm.cde.cx2da(i32 immarg, i32, i32, i32, i32 immarg)
|
|
|
|
declare i32 @llvm.arm.cde.cx3(i32 immarg, i32, i32, i32 immarg)
|
|
declare i32 @llvm.arm.cde.cx3a(i32 immarg, i32, i32, i32, i32 immarg)
|
|
declare { i32, i32 } @llvm.arm.cde.cx3d(i32 immarg, i32, i32, i32 immarg)
|
|
declare { i32, i32 } @llvm.arm.cde.cx3da(i32 immarg, i32, i32, i32, i32, i32 immarg)
|
|
|
|
define arm_aapcs_vfpcc i32 @test_cx1() {
|
|
; CHECK-LABEL: test_cx1:
|
|
; CHECK: @ %bb.0: @ %entry
|
|
; CHECK-NEXT: cx1 p0, r0, #123
|
|
; CHECK-NEXT: bx lr
|
|
entry:
|
|
%0 = call i32 @llvm.arm.cde.cx1(i32 0, i32 123)
|
|
ret i32 %0
|
|
}
|
|
|
|
define arm_aapcs_vfpcc i32 @test_cx1a(i32 %acc) {
|
|
; CHECK-LABEL: test_cx1a:
|
|
; CHECK: @ %bb.0: @ %entry
|
|
; CHECK-NEXT: cx1a p0, r0, #345
|
|
; CHECK-NEXT: bx lr
|
|
entry:
|
|
%0 = call i32 @llvm.arm.cde.cx1a(i32 0, i32 %acc, i32 345)
|
|
ret i32 %0
|
|
}
|
|
|
|
define arm_aapcs_vfpcc i64 @test_cx1d() {
|
|
; CHECK-LABEL: test_cx1d:
|
|
; CHECK: @ %bb.0: @ %entry
|
|
; CHECK-NEXT: cx1d p1, r0, r1, #567
|
|
; CHECK-NEXT: bx lr
|
|
entry:
|
|
%0 = call { i32, i32 } @llvm.arm.cde.cx1d(i32 1, i32 567)
|
|
%1 = extractvalue { i32, i32 } %0, 1
|
|
%2 = zext i32 %1 to i64
|
|
%3 = shl i64 %2, 32
|
|
%4 = extractvalue { i32, i32 } %0, 0
|
|
%5 = zext i32 %4 to i64
|
|
%6 = or i64 %3, %5
|
|
ret i64 %6
|
|
}
|
|
|
|
define arm_aapcs_vfpcc i64 @test_cx1da(i64 %acc) {
|
|
; CHECK-LABEL: test_cx1da:
|
|
; CHECK: @ %bb.0: @ %entry
|
|
; CHECK-NEXT: @ kill: def $r1 killed $r1 killed $r0_r1 def $r0_r1
|
|
; CHECK-NEXT: @ kill: def $r0 killed $r0 killed $r0_r1 def $r0_r1
|
|
; CHECK-NEXT: cx1da p0, r0, r1, #789
|
|
; CHECK-NEXT: bx lr
|
|
entry:
|
|
%0 = lshr i64 %acc, 32
|
|
%1 = trunc i64 %0 to i32
|
|
%2 = trunc i64 %acc to i32
|
|
%3 = call { i32, i32 } @llvm.arm.cde.cx1da(i32 0, i32 %2, i32 %1, i32 789)
|
|
%4 = extractvalue { i32, i32 } %3, 1
|
|
%5 = zext i32 %4 to i64
|
|
%6 = shl i64 %5, 32
|
|
%7 = extractvalue { i32, i32 } %3, 0
|
|
%8 = zext i32 %7 to i64
|
|
%9 = or i64 %6, %8
|
|
ret i64 %9
|
|
}
|
|
|
|
define arm_aapcs_vfpcc i32 @test_cx2(i32 %n) {
|
|
; CHECK-LABEL: test_cx2:
|
|
; CHECK: @ %bb.0: @ %entry
|
|
; CHECK-NEXT: cx2 p0, r0, r0, #11
|
|
; CHECK-NEXT: bx lr
|
|
entry:
|
|
%0 = call i32 @llvm.arm.cde.cx2(i32 0, i32 %n, i32 11)
|
|
ret i32 %0
|
|
}
|
|
|
|
define arm_aapcs_vfpcc i32 @test_cx2a(i32 %acc, i32 %n) {
|
|
; CHECK-LABEL: test_cx2a:
|
|
; CHECK: @ %bb.0: @ %entry
|
|
; CHECK-NEXT: cx2a p1, r0, r1, #22
|
|
; CHECK-NEXT: bx lr
|
|
entry:
|
|
%0 = call i32 @llvm.arm.cde.cx2a(i32 1, i32 %acc, i32 %n, i32 22)
|
|
ret i32 %0
|
|
}
|
|
|
|
define arm_aapcs_vfpcc i64 @test_cx2d(i32 %n) #0 {
|
|
; CHECK-LABEL: test_cx2d:
|
|
; CHECK: @ %bb.0: @ %entry
|
|
; CHECK-NEXT: cx2d p1, r0, r1, r0, #33
|
|
; CHECK-NEXT: bx lr
|
|
entry:
|
|
%0 = call { i32, i32 } @llvm.arm.cde.cx2d(i32 1, i32 %n, i32 33)
|
|
%1 = extractvalue { i32, i32 } %0, 1
|
|
%2 = zext i32 %1 to i64
|
|
%3 = shl i64 %2, 32
|
|
%4 = extractvalue { i32, i32 } %0, 0
|
|
%5 = zext i32 %4 to i64
|
|
%6 = or i64 %3, %5
|
|
ret i64 %6
|
|
}
|
|
|
|
define arm_aapcs_vfpcc i64 @test_cx2da(i64 %acc, i32 %n) {
|
|
; CHECK-LABEL: test_cx2da:
|
|
; CHECK: @ %bb.0: @ %entry
|
|
; CHECK-NEXT: @ kill: def $r1 killed $r1 killed $r0_r1 def $r0_r1
|
|
; CHECK-NEXT: @ kill: def $r0 killed $r0 killed $r0_r1 def $r0_r1
|
|
; CHECK-NEXT: cx2da p0, r0, r1, r2, #44
|
|
; CHECK-NEXT: bx lr
|
|
entry:
|
|
%0 = lshr i64 %acc, 32
|
|
%1 = trunc i64 %0 to i32
|
|
%2 = trunc i64 %acc to i32
|
|
%3 = call { i32, i32 } @llvm.arm.cde.cx2da(i32 0, i32 %2, i32 %1, i32 %n, i32 44)
|
|
%4 = extractvalue { i32, i32 } %3, 1
|
|
%5 = zext i32 %4 to i64
|
|
%6 = shl i64 %5, 32
|
|
%7 = extractvalue { i32, i32 } %3, 0
|
|
%8 = zext i32 %7 to i64
|
|
%9 = or i64 %6, %8
|
|
ret i64 %9
|
|
}
|
|
|
|
define arm_aapcs_vfpcc i32 @test_cx3(i32 %n, i32 %m) {
|
|
; CHECK-LABEL: test_cx3:
|
|
; CHECK: @ %bb.0: @ %entry
|
|
; CHECK-NEXT: cx3 p0, r0, r0, r1, #1
|
|
; CHECK-NEXT: bx lr
|
|
entry:
|
|
%0 = call i32 @llvm.arm.cde.cx3(i32 0, i32 %n, i32 %m, i32 1)
|
|
ret i32 %0
|
|
}
|
|
|
|
define arm_aapcs_vfpcc i32 @test_cx3a(i32 %acc, i32 %n, i32 %m) {
|
|
; CHECK-LABEL: test_cx3a:
|
|
; CHECK: @ %bb.0: @ %entry
|
|
; CHECK-NEXT: cx3a p1, r0, r1, r2, #2
|
|
; CHECK-NEXT: bx lr
|
|
entry:
|
|
%0 = call i32 @llvm.arm.cde.cx3a(i32 1, i32 %acc, i32 %n, i32 %m, i32 2)
|
|
ret i32 %0
|
|
}
|
|
|
|
define arm_aapcs_vfpcc i64 @test_cx3d(i32 %n, i32 %m) {
|
|
; CHECK-LABEL: test_cx3d:
|
|
; CHECK: @ %bb.0: @ %entry
|
|
; CHECK-NEXT: cx3d p1, r0, r1, r0, r1, #3
|
|
; CHECK-NEXT: bx lr
|
|
entry:
|
|
%0 = call { i32, i32 } @llvm.arm.cde.cx3d(i32 1, i32 %n, i32 %m, i32 3)
|
|
%1 = extractvalue { i32, i32 } %0, 1
|
|
%2 = zext i32 %1 to i64
|
|
%3 = shl i64 %2, 32
|
|
%4 = extractvalue { i32, i32 } %0, 0
|
|
%5 = zext i32 %4 to i64
|
|
%6 = or i64 %3, %5
|
|
ret i64 %6
|
|
}
|
|
|
|
define arm_aapcs_vfpcc i64 @test_cx3da(i64 %acc, i32 %n, i32 %m) {
|
|
; CHECK-LABEL: test_cx3da:
|
|
; CHECK: @ %bb.0: @ %entry
|
|
; CHECK-NEXT: @ kill: def $r1 killed $r1 killed $r0_r1 def $r0_r1
|
|
; CHECK-NEXT: @ kill: def $r0 killed $r0 killed $r0_r1 def $r0_r1
|
|
; CHECK-NEXT: cx3da p0, r0, r1, r2, r3, #4
|
|
; CHECK-NEXT: bx lr
|
|
entry:
|
|
%0 = lshr i64 %acc, 32
|
|
%1 = trunc i64 %0 to i32
|
|
%2 = trunc i64 %acc to i32
|
|
%3 = call { i32, i32 } @llvm.arm.cde.cx3da(i32 0, i32 %2, i32 %1, i32 %n, i32 %m, i32 4)
|
|
%4 = extractvalue { i32, i32 } %3, 1
|
|
%5 = zext i32 %4 to i64
|
|
%6 = shl i64 %5, 32
|
|
%7 = extractvalue { i32, i32 } %3, 0
|
|
%8 = zext i32 %7 to i64
|
|
%9 = or i64 %6, %8
|
|
ret i64 %9
|
|
}
|