mirror of
https://github.com/RPCS3/llvm-mirror.git
synced 2024-11-25 20:23:11 +01:00
7dcf1654f8
Based ontop of D104598, which is a NFCI-ish refactoring. Here, a restriction, that only empty blocks can be merged, is lifted. Reviewed By: rnk Differential Revision: https://reviews.llvm.org/D104597
210 lines
5.6 KiB
LLVM
210 lines
5.6 KiB
LLVM
; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
|
|
; RUN: llc -mtriple=aarch64-apple-darwin -fast-isel -fast-isel-abort=1 -verify-machineinstrs < %s | FileCheck %s
|
|
|
|
define i64 @test_or(i32 %a, i32 %b) {
|
|
; CHECK-LABEL: test_or:
|
|
; CHECK: ; %bb.0: ; %bb1
|
|
; CHECK-NEXT: mov w8, w0
|
|
; CHECK-NEXT: mov x0, xzr
|
|
; CHECK-NEXT: cbnz w8, LBB0_2
|
|
; CHECK-NEXT: LBB0_1: ; %common.ret
|
|
; CHECK-NEXT: ret
|
|
; CHECK-NEXT: LBB0_2: ; %bb1.cond.split
|
|
; CHECK-NEXT: mov x0, xzr
|
|
; CHECK-NEXT: cbz w1, LBB0_1
|
|
; CHECK-NEXT: ; %bb.3: ; %bb4
|
|
; CHECK-NEXT: stp x29, x30, [sp, #-16]! ; 16-byte Folded Spill
|
|
; CHECK-NEXT: .cfi_def_cfa_offset 16
|
|
; CHECK-NEXT: .cfi_offset w30, -8
|
|
; CHECK-NEXT: .cfi_offset w29, -16
|
|
; CHECK-NEXT: bl _bar
|
|
; CHECK-NEXT: ldp x29, x30, [sp], #16 ; 16-byte Folded Reload
|
|
; CHECK-NEXT: ret
|
|
bb1:
|
|
%0 = icmp eq i32 %a, 0
|
|
%1 = icmp eq i32 %b, 0
|
|
%or.cond = or i1 %0, %1
|
|
br i1 %or.cond, label %bb3, label %bb4, !prof !0
|
|
|
|
bb3:
|
|
ret i64 0
|
|
|
|
bb4:
|
|
%2 = call i64 @bar()
|
|
ret i64 %2
|
|
}
|
|
|
|
define i64 @test_or_select(i32 %a, i32 %b) {
|
|
; CHECK-LABEL: test_or_select:
|
|
; CHECK: ; %bb.0: ; %bb1
|
|
; CHECK-NEXT: mov w8, w0
|
|
; CHECK-NEXT: mov x0, xzr
|
|
; CHECK-NEXT: cbnz w8, LBB1_2
|
|
; CHECK-NEXT: LBB1_1: ; %common.ret
|
|
; CHECK-NEXT: ret
|
|
; CHECK-NEXT: LBB1_2: ; %bb1.cond.split
|
|
; CHECK-NEXT: mov x0, xzr
|
|
; CHECK-NEXT: cbz w1, LBB1_1
|
|
; CHECK-NEXT: ; %bb.3: ; %bb4
|
|
; CHECK-NEXT: stp x29, x30, [sp, #-16]! ; 16-byte Folded Spill
|
|
; CHECK-NEXT: .cfi_def_cfa_offset 16
|
|
; CHECK-NEXT: .cfi_offset w30, -8
|
|
; CHECK-NEXT: .cfi_offset w29, -16
|
|
; CHECK-NEXT: bl _bar
|
|
; CHECK-NEXT: ldp x29, x30, [sp], #16 ; 16-byte Folded Reload
|
|
; CHECK-NEXT: ret
|
|
bb1:
|
|
%0 = icmp eq i32 %a, 0
|
|
%1 = icmp eq i32 %b, 0
|
|
%or.cond = select i1 %0, i1 true, i1 %1
|
|
br i1 %or.cond, label %bb3, label %bb4, !prof !0
|
|
|
|
bb3:
|
|
ret i64 0
|
|
|
|
bb4:
|
|
%2 = call i64 @bar()
|
|
ret i64 %2
|
|
}
|
|
|
|
define i64 @test_and(i32 %a, i32 %b) {
|
|
; CHECK-LABEL: test_and:
|
|
; CHECK: ; %bb.0: ; %bb1
|
|
; CHECK-NEXT: mov w8, w0
|
|
; CHECK-NEXT: mov x0, xzr
|
|
; CHECK-NEXT: cbnz w8, LBB2_2
|
|
; CHECK-NEXT: LBB2_1: ; %common.ret
|
|
; CHECK-NEXT: ret
|
|
; CHECK-NEXT: LBB2_2: ; %bb1.cond.split
|
|
; CHECK-NEXT: mov x0, xzr
|
|
; CHECK-NEXT: cbz w1, LBB2_1
|
|
; CHECK-NEXT: ; %bb.3: ; %bb4
|
|
; CHECK-NEXT: stp x29, x30, [sp, #-16]! ; 16-byte Folded Spill
|
|
; CHECK-NEXT: .cfi_def_cfa_offset 16
|
|
; CHECK-NEXT: .cfi_offset w30, -8
|
|
; CHECK-NEXT: .cfi_offset w29, -16
|
|
; CHECK-NEXT: bl _bar
|
|
; CHECK-NEXT: ldp x29, x30, [sp], #16 ; 16-byte Folded Reload
|
|
; CHECK-NEXT: ret
|
|
bb1:
|
|
%0 = icmp ne i32 %a, 0
|
|
%1 = icmp ne i32 %b, 0
|
|
%or.cond = and i1 %0, %1
|
|
br i1 %or.cond, label %bb4, label %bb3, !prof !1
|
|
|
|
bb3:
|
|
ret i64 0
|
|
|
|
bb4:
|
|
%2 = call i64 @bar()
|
|
ret i64 %2
|
|
}
|
|
|
|
define i64 @test_and_select(i32 %a, i32 %b) {
|
|
; CHECK-LABEL: test_and_select:
|
|
; CHECK: ; %bb.0: ; %bb1
|
|
; CHECK-NEXT: mov w8, w0
|
|
; CHECK-NEXT: mov x0, xzr
|
|
; CHECK-NEXT: cbnz w8, LBB3_2
|
|
; CHECK-NEXT: LBB3_1: ; %common.ret
|
|
; CHECK-NEXT: ret
|
|
; CHECK-NEXT: LBB3_2: ; %bb1.cond.split
|
|
; CHECK-NEXT: mov x0, xzr
|
|
; CHECK-NEXT: cbz w1, LBB3_1
|
|
; CHECK-NEXT: ; %bb.3: ; %bb4
|
|
; CHECK-NEXT: stp x29, x30, [sp, #-16]! ; 16-byte Folded Spill
|
|
; CHECK-NEXT: .cfi_def_cfa_offset 16
|
|
; CHECK-NEXT: .cfi_offset w30, -8
|
|
; CHECK-NEXT: .cfi_offset w29, -16
|
|
; CHECK-NEXT: bl _bar
|
|
; CHECK-NEXT: ldp x29, x30, [sp], #16 ; 16-byte Folded Reload
|
|
; CHECK-NEXT: ret
|
|
bb1:
|
|
%0 = icmp ne i32 %a, 0
|
|
%1 = icmp ne i32 %b, 0
|
|
%or.cond = select i1 %0, i1 %1, i1 false
|
|
br i1 %or.cond, label %bb4, label %bb3, !prof !1
|
|
|
|
bb3:
|
|
ret i64 0
|
|
|
|
bb4:
|
|
%2 = call i64 @bar()
|
|
ret i64 %2
|
|
}
|
|
|
|
; If the branch is unpredictable, don't add another branch.
|
|
|
|
define i64 @test_or_unpredictable(i32 %a, i32 %b) {
|
|
; CHECK-LABEL: test_or_unpredictable:
|
|
; CHECK: ; %bb.0: ; %bb1
|
|
; CHECK-NEXT: cmp w0, #0 ; =0
|
|
; CHECK-NEXT: cset w8, eq
|
|
; CHECK-NEXT: cmp w1, #0 ; =0
|
|
; CHECK-NEXT: cset w9, eq
|
|
; CHECK-NEXT: orr w8, w8, w9
|
|
; CHECK-NEXT: mov x0, xzr
|
|
; CHECK-NEXT: tbnz w8, #0, LBB4_2
|
|
; CHECK-NEXT: ; %bb.1: ; %bb4
|
|
; CHECK-NEXT: stp x29, x30, [sp, #-16]! ; 16-byte Folded Spill
|
|
; CHECK-NEXT: .cfi_def_cfa_offset 16
|
|
; CHECK-NEXT: .cfi_offset w30, -8
|
|
; CHECK-NEXT: .cfi_offset w29, -16
|
|
; CHECK-NEXT: bl _bar
|
|
; CHECK-NEXT: ldp x29, x30, [sp], #16 ; 16-byte Folded Reload
|
|
; CHECK-NEXT: LBB4_2: ; %common.ret
|
|
; CHECK-NEXT: ret
|
|
bb1:
|
|
%0 = icmp eq i32 %a, 0
|
|
%1 = icmp eq i32 %b, 0
|
|
%or.cond = or i1 %0, %1
|
|
br i1 %or.cond, label %bb3, label %bb4, !unpredictable !2
|
|
|
|
bb3:
|
|
ret i64 0
|
|
|
|
bb4:
|
|
%2 = call i64 @bar()
|
|
ret i64 %2
|
|
}
|
|
|
|
define i64 @test_and_unpredictable(i32 %a, i32 %b) {
|
|
; CHECK-LABEL: test_and_unpredictable:
|
|
; CHECK: ; %bb.0: ; %bb1
|
|
; CHECK-NEXT: cmp w0, #0 ; =0
|
|
; CHECK-NEXT: cset w8, ne
|
|
; CHECK-NEXT: cmp w1, #0 ; =0
|
|
; CHECK-NEXT: cset w9, ne
|
|
; CHECK-NEXT: and w8, w8, w9
|
|
; CHECK-NEXT: mov x0, xzr
|
|
; CHECK-NEXT: tbz w8, #0, LBB5_2
|
|
; CHECK-NEXT: ; %bb.1: ; %bb4
|
|
; CHECK-NEXT: stp x29, x30, [sp, #-16]! ; 16-byte Folded Spill
|
|
; CHECK-NEXT: .cfi_def_cfa_offset 16
|
|
; CHECK-NEXT: .cfi_offset w30, -8
|
|
; CHECK-NEXT: .cfi_offset w29, -16
|
|
; CHECK-NEXT: bl _bar
|
|
; CHECK-NEXT: ldp x29, x30, [sp], #16 ; 16-byte Folded Reload
|
|
; CHECK-NEXT: LBB5_2: ; %common.ret
|
|
; CHECK-NEXT: ret
|
|
bb1:
|
|
%0 = icmp ne i32 %a, 0
|
|
%1 = icmp ne i32 %b, 0
|
|
%or.cond = and i1 %0, %1
|
|
br i1 %or.cond, label %bb4, label %bb3, !unpredictable !2
|
|
|
|
bb3:
|
|
ret i64 0
|
|
|
|
bb4:
|
|
%2 = call i64 @bar()
|
|
ret i64 %2
|
|
}
|
|
|
|
declare i64 @bar()
|
|
|
|
!0 = !{!"branch_weights", i32 5128, i32 32}
|
|
!1 = !{!"branch_weights", i32 1024, i32 4136}
|
|
!2 = !{}
|
|
|