mirror of
https://github.com/RPCS3/llvm-mirror.git
synced 2024-11-22 18:54:02 +01:00
19cfa09971
This reverts commit 329aeb5db43f5e69df038fb20d2def77fe6f8595, and relands commit 61f006ac655431bd44b9e089f74c73bec0c1a48c. This is a continuation of D89456. As it was suggested there, now that SCEV models `PtrToInt`, we can try to improve SCEV's pointer handling. In particular, i believe, i will need this in the future to further fix `SCEVAddExpr`operation type handling. This removes special handling of `ConstantPointerNull` from `ScalarEvolution::createSCEV()`, and add constant folding into `ScalarEvolution::getPtrToIntExpr()`. This way, `null` constants stay as such in SCEV's, but gracefully become zero integers when asked. Reviewed By: Meinersbur Differential Revision: https://reviews.llvm.org/D98147
311 lines
9.5 KiB
LLVM
311 lines
9.5 KiB
LLVM
; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
|
|
; RUN: llc -mcpu=pwr8 -ppc-asm-full-reg-names -ppc-vsr-nums-as-vr \
|
|
; RUN: -mtriple=powerpc64le-unknown-unknown < %s | FileCheck %s
|
|
; RUN: llc -mcpu=pwr9 -ppc-asm-full-reg-names -ppc-vsr-nums-as-vr \
|
|
; RUN: -mtriple=powerpc64le-unknown-unknown < %s | FileCheck %s \
|
|
; RUN: -check-prefix=CHECK-P9
|
|
|
|
define void @julia__typed_vcat_20() #0 {
|
|
; CHECK-LABEL: julia__typed_vcat_20:
|
|
; CHECK: # %bb.0: # %bb
|
|
; CHECK-NEXT: mflr r0
|
|
; CHECK-NEXT: std r30, -16(r1) # 8-byte Folded Spill
|
|
; CHECK-NEXT: std r0, 16(r1)
|
|
; CHECK-NEXT: stdu r1, -48(r1)
|
|
; CHECK-NEXT: li r3, 1
|
|
; CHECK-NEXT: li r30, 0
|
|
; CHECK-NEXT: .p2align 4
|
|
; CHECK-NEXT: .LBB0_1: # %bb3
|
|
; CHECK-NEXT: #
|
|
; CHECK-NEXT: addi r3, r3, -1
|
|
; CHECK-NEXT: mtfprd f0, r3
|
|
; CHECK-NEXT: xscvsxdsp f1, f0
|
|
; CHECK-NEXT: bl __gnu_f2h_ieee
|
|
; CHECK-NEXT: nop
|
|
; CHECK-NEXT: clrldi r3, r3, 48
|
|
; CHECK-NEXT: bl __gnu_h2f_ieee
|
|
; CHECK-NEXT: nop
|
|
; CHECK-NEXT: addi r30, r30, -1
|
|
; CHECK-NEXT: li r3, 0
|
|
; CHECK-NEXT: cmpldi r30, 0
|
|
; CHECK-NEXT: bne+ cr0, .LBB0_1
|
|
; CHECK-NEXT: # %bb.2: # %bb11
|
|
; CHECK-NEXT: bl __gnu_f2h_ieee
|
|
; CHECK-NEXT: nop
|
|
; CHECK-NEXT: sth r3, 0(r3)
|
|
;
|
|
; CHECK-P9-LABEL: julia__typed_vcat_20:
|
|
; CHECK-P9: # %bb.0: # %bb
|
|
; CHECK-P9-NEXT: li r3, 0
|
|
; CHECK-P9-NEXT: mtctr r3
|
|
; CHECK-P9-NEXT: li r3, 1
|
|
; CHECK-P9-NEXT: .p2align 4
|
|
; CHECK-P9-NEXT: .LBB0_1: # %bb3
|
|
; CHECK-P9-NEXT: #
|
|
; CHECK-P9-NEXT: addi r3, r3, -1
|
|
; CHECK-P9-NEXT: mtfprd f0, r3
|
|
; CHECK-P9-NEXT: xscvsxdsp f0, f0
|
|
; CHECK-P9-NEXT: xscvdphp f0, f0
|
|
; CHECK-P9-NEXT: mffprwz r3, f0
|
|
; CHECK-P9-NEXT: clrlwi r3, r3, 16
|
|
; CHECK-P9-NEXT: mtfprwz f0, r3
|
|
; CHECK-P9-NEXT: li r3, 0
|
|
; CHECK-P9-NEXT: xscvhpdp f0, f0
|
|
; CHECK-P9-NEXT: bdnz .LBB0_1
|
|
; CHECK-P9-NEXT: # %bb.2: # %bb11
|
|
; CHECK-P9-NEXT: xscvdphp f0, f0
|
|
; CHECK-P9-NEXT: stxsihx f0, 0, r3
|
|
bb:
|
|
%i = load i64, i64 addrspace(11)* null, align 8
|
|
%i1 = call { i64, i1 } @llvm.ssub.with.overflow.i64(i64 %i, i64 0)
|
|
%i2 = extractvalue { i64, i1 } %i1, 0
|
|
br label %bb3
|
|
|
|
bb3: ; preds = %bb3, %bb
|
|
%i4 = phi i64 [ %i10, %bb3 ], [ 1, %bb ]
|
|
%i5 = phi i64 [ 0, %bb3 ], [ 1, %bb ]
|
|
%i6 = add nsw i64 %i5, -1
|
|
%i7 = add i64 %i6, 0
|
|
%i8 = sitofp i64 %i7 to half
|
|
store half %i8, half addrspace(13)* undef, align 2
|
|
%i9 = icmp eq i64 %i4, 0
|
|
%i10 = add i64 %i4, 1
|
|
br i1 %i9, label %bb11, label %bb3
|
|
|
|
bb11: ; preds = %bb3
|
|
unreachable
|
|
}
|
|
|
|
declare { i64, i1 } @llvm.ssub.with.overflow.i64(i64, i64) #0
|
|
|
|
define void @julia__hypot_17() #0 {
|
|
; CHECK-LABEL: julia__hypot_17:
|
|
; CHECK: # %bb.0: # %bb
|
|
; CHECK-NEXT: mflr r0
|
|
; CHECK-NEXT: std r30, -16(r1) # 8-byte Folded Spill
|
|
; CHECK-NEXT: std r0, 16(r1)
|
|
; CHECK-NEXT: stdu r1, -48(r1)
|
|
; CHECK-NEXT: li r30, 3
|
|
; CHECK-NEXT: .p2align 5
|
|
; CHECK-NEXT: .LBB1_1: # %bb1
|
|
; CHECK-NEXT: #
|
|
; CHECK-NEXT: addi r30, r30, -1
|
|
; CHECK-NEXT: cmpldi r30, 0
|
|
; CHECK-NEXT: beq cr0, .LBB1_3
|
|
; CHECK-NEXT: # %bb.2: # %bb3
|
|
; CHECK-NEXT: #
|
|
; CHECK-NEXT: lhz r3, 0(0)
|
|
; CHECK-NEXT: bl __gnu_h2f_ieee
|
|
; CHECK-NEXT: nop
|
|
; CHECK-NEXT: fcmpu cr0, f1, f1
|
|
; CHECK-NEXT: bun cr0, .LBB1_1
|
|
; CHECK-NEXT: .LBB1_3: # %bb9
|
|
; CHECK-NEXT: addi r1, r1, 48
|
|
; CHECK-NEXT: ld r0, 16(r1)
|
|
; CHECK-NEXT: ld r30, -16(r1) # 8-byte Folded Reload
|
|
; CHECK-NEXT: mtlr r0
|
|
; CHECK-NEXT: blr
|
|
;
|
|
; CHECK-P9-LABEL: julia__hypot_17:
|
|
; CHECK-P9: # %bb.0: # %bb
|
|
; CHECK-P9-NEXT: li r3, 3
|
|
; CHECK-P9-NEXT: mtctr r3
|
|
; CHECK-P9-NEXT: li r3, 0
|
|
; CHECK-P9-NEXT: .p2align 5
|
|
; CHECK-P9-NEXT: .LBB1_1: # %bb1
|
|
; CHECK-P9-NEXT: #
|
|
; CHECK-P9-NEXT: bdzlr
|
|
; CHECK-P9-NEXT: # %bb.2: # %bb3
|
|
; CHECK-P9-NEXT: #
|
|
; CHECK-P9-NEXT: lxsihzx f0, 0, r3
|
|
; CHECK-P9-NEXT: xscvhpdp f0, f0
|
|
; CHECK-P9-NEXT: fcmpu cr0, f0, f0
|
|
; CHECK-P9-NEXT: bun cr0, .LBB1_1
|
|
; CHECK-P9-NEXT: # %bb.3: # %bb9
|
|
; CHECK-P9-NEXT: blr
|
|
bb:
|
|
br label %bb1
|
|
|
|
bb1: ; preds = %bb3, %bb
|
|
%i = phi i64 [ %i4, %bb3 ], [ 2, %bb ]
|
|
%i2 = icmp eq i64 %i, 4
|
|
br i1 %i2, label %bb9, label %bb3
|
|
|
|
bb3: ; preds = %bb1
|
|
%i4 = add nuw nsw i64 %i, 1
|
|
%i5 = load half, half* null, align 2
|
|
%i6 = fpext half %i5 to float
|
|
%i7 = fcmp uno float %i6, 0.000000e+00
|
|
%i8 = or i1 %i7, false
|
|
br i1 %i8, label %bb1, label %bb9
|
|
|
|
bb9: ; preds = %bb3, %bb1
|
|
ret void
|
|
}
|
|
|
|
define void @func_48786() #0 {
|
|
; CHECK-LABEL: func_48786:
|
|
; CHECK: # %bb.0: # %bb
|
|
; CHECK-NEXT: mfocrf r12, 32
|
|
; CHECK-NEXT: mflr r0
|
|
; CHECK-NEXT: std r0, 16(r1)
|
|
; CHECK-NEXT: stw r12, 8(r1)
|
|
; CHECK-NEXT: stdu r1, -48(r1)
|
|
; CHECK-NEXT: ld r3, 0(r3)
|
|
; CHECK-NEXT: std r30, 32(r1) # 8-byte Folded Spill
|
|
; CHECK-NEXT: # implicit-def: $x30
|
|
; CHECK-NEXT: cmpdi r3, 0
|
|
; CHECK-NEXT: crnot 4*cr2+lt, eq
|
|
; CHECK-NEXT: bc 12, 4*cr5+lt, .LBB2_3
|
|
; CHECK-NEXT: .p2align 4
|
|
; CHECK-NEXT: .LBB2_1: # %bb4
|
|
; CHECK-NEXT: lhz r3, 0(r3)
|
|
; CHECK-NEXT: bl __gnu_h2f_ieee
|
|
; CHECK-NEXT: nop
|
|
; CHECK-NEXT: bc 4, 4*cr2+lt, .LBB2_6
|
|
; CHECK-NEXT: # %bb.2: # %bb8
|
|
; CHECK-NEXT: bl __gnu_f2h_ieee
|
|
; CHECK-NEXT: nop
|
|
; CHECK-NEXT: sth r3, 0(0)
|
|
; CHECK-NEXT: .LBB2_3: # %bb10
|
|
; CHECK-NEXT: #
|
|
; CHECK-NEXT: cmpldi r30, 0
|
|
; CHECK-NEXT: beq cr0, .LBB2_5
|
|
; CHECK-NEXT: # %bb.4: # %bb12
|
|
; CHECK-NEXT: #
|
|
; CHECK-NEXT: addi r30, r30, 1
|
|
; CHECK-NEXT: bc 4, 4*cr5+lt, .LBB2_1
|
|
; CHECK-NEXT: b .LBB2_3
|
|
; CHECK-NEXT: .LBB2_5: # %bb14
|
|
; CHECK-NEXT: ld r30, 32(r1) # 8-byte Folded Reload
|
|
; CHECK-NEXT: addi r1, r1, 48
|
|
; CHECK-NEXT: ld r0, 16(r1)
|
|
; CHECK-NEXT: lwz r12, 8(r1)
|
|
; CHECK-NEXT: mtocrf 32, r12
|
|
; CHECK-NEXT: mtlr r0
|
|
; CHECK-NEXT: blr
|
|
; CHECK-NEXT: .LBB2_6: # %bb15
|
|
;
|
|
; CHECK-P9-LABEL: func_48786:
|
|
; CHECK-P9: # %bb.0: # %bb
|
|
; CHECK-P9-NEXT: ld r3, 0(r3)
|
|
; CHECK-P9-NEXT: cmpdi r3, 0
|
|
; CHECK-P9-NEXT: mtctr r3
|
|
; CHECK-P9-NEXT: li r3, 0
|
|
; CHECK-P9-NEXT: crnot 4*cr5+lt, eq
|
|
; CHECK-P9-NEXT: b .LBB2_2
|
|
; CHECK-P9-NEXT: .p2align 5
|
|
; CHECK-P9-NEXT: .LBB2_1: # %bb10
|
|
; CHECK-P9-NEXT: #
|
|
; CHECK-P9-NEXT: bdzlr
|
|
; CHECK-P9-NEXT: .LBB2_2: # %bb2
|
|
; CHECK-P9-NEXT: #
|
|
; CHECK-P9-NEXT: bc 12, 4*cr5+lt, .LBB2_1
|
|
; CHECK-P9-NEXT: # %bb.3: # %bb4
|
|
; CHECK-P9-NEXT: #
|
|
; CHECK-P9-NEXT: lxsihzx f0, 0, r3
|
|
; CHECK-P9-NEXT: xscvhpdp f0, f0
|
|
; CHECK-P9-NEXT: bc 4, 4*cr5+lt, .LBB2_5
|
|
; CHECK-P9-NEXT: # %bb.4: # %bb8
|
|
; CHECK-P9-NEXT: #
|
|
; CHECK-P9-NEXT: xscvdphp f0, f0
|
|
; CHECK-P9-NEXT: stxsihx f0, 0, r3
|
|
; CHECK-P9-NEXT: b .LBB2_1
|
|
; CHECK-P9-NEXT: .LBB2_5: # %bb15
|
|
bb:
|
|
%i = load i64, i64 addrspace(11)* undef, align 8
|
|
%i1 = load i64, i64 addrspace(11)* undef, align 8
|
|
br label %bb2
|
|
|
|
bb2: ; preds = %bb12, %bb
|
|
%i3 = phi i64 [ undef, %bb ], [ %i13, %bb12 ]
|
|
br i1 undef, label %bb10, label %bb4
|
|
|
|
bb4: ; preds = %bb2
|
|
switch i32 undef, label %bb9 [
|
|
i32 1426063360, label %bb5
|
|
i32 1275068416, label %bb5
|
|
]
|
|
|
|
bb5: ; preds = %bb4, %bb4
|
|
%i6 = load half, half addrspace(13)* undef, align 2
|
|
%i7 = icmp ult i64 0, %i1
|
|
br i1 %i7, label %bb8, label %bb15
|
|
|
|
bb8: ; preds = %bb5
|
|
store half %i6, half addrspace(13)* null, align 2
|
|
br label %bb10
|
|
|
|
bb9: ; preds = %bb4
|
|
unreachable
|
|
|
|
bb10: ; preds = %bb8, %bb2
|
|
%i11 = icmp eq i64 %i3, 0
|
|
br i1 %i11, label %bb14, label %bb12
|
|
|
|
bb12: ; preds = %bb10
|
|
%i13 = add i64 %i3, 1
|
|
br label %bb2
|
|
|
|
bb14: ; preds = %bb10
|
|
ret void
|
|
|
|
bb15: ; preds = %bb5
|
|
unreachable
|
|
}
|
|
|
|
define void @func_48785(half %arg) #0 {
|
|
; CHECK-LABEL: func_48785:
|
|
; CHECK: # %bb.0: # %bb
|
|
; CHECK-NEXT: mflr r0
|
|
; CHECK-NEXT: std r29, -32(r1) # 8-byte Folded Spill
|
|
; CHECK-NEXT: std r30, -24(r1) # 8-byte Folded Spill
|
|
; CHECK-NEXT: stfd f31, -8(r1) # 8-byte Folded Spill
|
|
; CHECK-NEXT: std r0, 16(r1)
|
|
; CHECK-NEXT: stdu r1, -64(r1)
|
|
; CHECK-NEXT: fmr f31, f1
|
|
; CHECK-NEXT: li r30, 0
|
|
; CHECK-NEXT: li r29, 0
|
|
; CHECK-NEXT: .p2align 5
|
|
; CHECK-NEXT: .LBB3_1: # %bb1
|
|
; CHECK-NEXT: #
|
|
; CHECK-NEXT: fmr f1, f31
|
|
; CHECK-NEXT: bl __gnu_f2h_ieee
|
|
; CHECK-NEXT: nop
|
|
; CHECK-NEXT: addi r29, r29, -12
|
|
; CHECK-NEXT: sth r3, 0(r30)
|
|
; CHECK-NEXT: addi r30, r30, 24
|
|
; CHECK-NEXT: cmpldi r29, 0
|
|
; CHECK-NEXT: bne+ cr0, .LBB3_1
|
|
; CHECK-NEXT: # %bb.2: # %bb5
|
|
;
|
|
; CHECK-P9-LABEL: func_48785:
|
|
; CHECK-P9: # %bb.0: # %bb
|
|
; CHECK-P9-NEXT: li r3, 1
|
|
; CHECK-P9-NEXT: rldic r3, r3, 62, 1
|
|
; CHECK-P9-NEXT: mtctr r3
|
|
; CHECK-P9-NEXT: li r3, 0
|
|
; CHECK-P9-NEXT: .p2align 4
|
|
; CHECK-P9-NEXT: .LBB3_1: # %bb1
|
|
; CHECK-P9-NEXT: #
|
|
; CHECK-P9-NEXT: xscvdphp f0, f1
|
|
; CHECK-P9-NEXT: stxsihx f0, 0, r3
|
|
; CHECK-P9-NEXT: addi r3, r3, 24
|
|
; CHECK-P9-NEXT: bdnz .LBB3_1
|
|
; CHECK-P9-NEXT: # %bb.2: # %bb5
|
|
bb:
|
|
br label %bb1
|
|
|
|
bb1: ; preds = %bb1, %bb
|
|
%i = phi i64 [ 0, %bb ], [ %i3, %bb1 ]
|
|
%i2 = getelementptr inbounds half, half addrspace(13)* null, i64 %i
|
|
store half %arg, half addrspace(13)* %i2, align 2
|
|
%i3 = add i64 %i, 12
|
|
%i4 = icmp eq i64 %i3, 0
|
|
br i1 %i4, label %bb5, label %bb1
|
|
|
|
bb5: ; preds = %bb1
|
|
unreachable
|
|
}
|
|
attributes #0 = { nounwind }
|