mirror of
https://github.com/RPCS3/llvm-mirror.git
synced 2024-11-22 10:42:39 +01:00
437b6055f0
On subtargets that have a red zone, we will copy the stack pointer to the base pointer in the prologue prior to updating the stack pointer. There are no other updates to the base pointer after that. This suggests that we should be able to restore the stack pointer from the base pointer rather than loading it from the back chain or adding the frame size back to either the stack pointer or the frame pointer. This came about because functions that call setjmp need to restore the SP from the FP because the back chain might have been clobbered (see https://reviews.llvm.org/D92906). However, if the stack is realigned, the restored SP might be incorrect (which is what caused the failures in the two ASan test cases). This patch was tested quite extensively both with sanitizer runtimes and general code. Differential revision: https://reviews.llvm.org/D93327
225 lines
6.7 KiB
LLVM
225 lines
6.7 KiB
LLVM
; Test drivers. Each of the four lines below runs llc on this file for one
; configuration and pipes the assembly into FileCheck. The first uses the
; default check prefix; the others select the FP, 32 and 32-PIC prefixes via
; -check-prefix. The last three also pass -frame-pointer=all, and the final
; one additionally passes -relocation-model=pic.
; RUN: llc -mtriple=powerpc64-unknown-linux-gnu -mcpu=pwr7 < %s | FileCheck %s
|
|
; RUN: llc -mtriple=powerpc64-unknown-linux-gnu -mcpu=pwr7 -frame-pointer=all < %s | FileCheck -check-prefix=CHECK-FP %s
|
|
; RUN: llc -mtriple=powerpc-unknown-linux-gnu -frame-pointer=all < %s | FileCheck -check-prefix=CHECK-32 %s
|
|
; RUN: llc -mtriple=powerpc-unknown-linux-gnu -frame-pointer=all -relocation-model=pic < %s | FileCheck -check-prefix=CHECK-32-PIC %s
|
|
; Module-level data layout and triple name the 64-bit PowerPC Linux target.
; The two 32-bit runs above pass their own -mtriple on the llc command line.
target datalayout = "E-p:64:64:64-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:64:64-f32:32:32-f64:64:64-f128:128:128-v128:128:128-n32:64"
|
|
target triple = "powerpc64-unknown-linux-gnu"
|
|
|
|
; Aggregate of two i32 fields; @goo, @hoo and @loo each receive one byval.
%struct.s = type { i32, i32 }
|
|
|
|
; Declared here without a body. Every test function calls it with a pointer
; to element 0 of its 32-byte-aligned local array.
declare void @bar(i32*)
|
|
|
|
; External i32 global; only @goo loads from it.
; NOTE(review): presumably present so the PIC run needs a PIC base register
; (the 32-PIC checks for @goo save r29) -- confirm.
@barbaz = external global i32
|
|
|
|
; @goo: small-frame case.
; Takes a %struct.s byval, fills a 32-byte-aligned two-element i32 array and
; passes a pointer to that array to @bar.
define void @goo(%struct.s* byval(%struct.s) nocapture readonly %a) {
|
|
entry:
|
|
; Local array with a 32-byte alignment request.
; NOTE(review): presumably this over-alignment is what forces the stack
; realignment sequence that the checks after this function look for -- confirm.
%x = alloca [2 x i32], align 32
|
|
; x[0] = a->field0
%a1 = getelementptr inbounds %struct.s, %struct.s* %a, i64 0, i32 0
|
|
%0 = load i32, i32* %a1, align 4
|
|
%arrayidx = getelementptr inbounds [2 x i32], [2 x i32]* %x, i64 0, i64 0
|
|
store i32 %0, i32* %arrayidx, align 32
|
|
; a->field1 is loaded into %1, but %1 has no users in this function.
%b = getelementptr inbounds %struct.s, %struct.s* %a, i64 0, i32 1
|
|
%1 = load i32, i32* %b, align 4
|
|
; x[1] = @barbaz (the global's value, not %1, is what gets stored).
%2 = load i32, i32* @barbaz, align 4
|
|
%arrayidx2 = getelementptr inbounds [2 x i32], [2 x i32]* %x, i64 0, i64 1
|
|
store i32 %2, i32* %arrayidx2, align 4
|
|
; Pass &x[0] to the external callee.
call void @bar(i32* %arrayidx)
|
|
ret void
|
|
}
|
|
|
|
; CHECK-LABEL: @goo
|
|
|
|
; CHECK-DAG: mflr {{[0-9]+}}
|
|
; CHECK-DAG: clrldi [[REG:[0-9]+]], 1, 59
|
|
; CHECK-DAG: std 30, -16(1)
|
|
; CHECK-DAG: mr 30, 1
|
|
; CHECK-DAG: std 0, 16(1)
|
|
; CHECK-DAG: subfic 0, [[REG]], -160
|
|
; CHECK: stdux 1, 1, 0
|
|
|
|
; CHECK: .cfi_def_cfa_register r30
|
|
; CHECK: .cfi_offset r30, -16
|
|
; CHECK: .cfi_offset lr, 16
|
|
|
|
; CHECK: std 3, 48(30)
|
|
|
|
; CHECK: mr 1, 30
|
|
; CHECK-DAG: ld [[SR:[0-9]+]], 16(1)
|
|
; CHECK-DAG: ld 30, -16(1)
|
|
; CHECK-DAG: mtlr [[SR]]
|
|
; CHECK: blr
|
|
|
|
; CHECK-FP-LABEL: @goo
|
|
|
|
; CHECK-FP-DAG: mflr {{[0-9]+}}
|
|
; CHECK-FP-DAG: clrldi [[REG:[0-9]+]], 1, 59
|
|
; CHECK-FP-DAG: std 31, -8(1)
|
|
; CHECK-FP-DAG: std 30, -16(1)
|
|
; CHECK-FP-DAG: mr 30, 1
|
|
; CHECK-FP-DAG: std 0, 16(1)
|
|
; CHECK-FP-DAG: subfic 0, [[REG]], -160
|
|
; CHECK-FP: stdux 1, 1, 0
|
|
|
|
; CHECK-FP: .cfi_def_cfa_register r30
|
|
; CHECK-FP: .cfi_offset r31, -8
|
|
; CHECK-FP: .cfi_offset r30, -16
|
|
; CHECK-FP: .cfi_offset lr, 16
|
|
|
|
; CHECK-FP: mr 31, 1
|
|
|
|
; CHECK-FP: std 3, 48(30)
|
|
|
|
; CHECK-FP: mr 1, 30
|
|
; CHECK-FP-DAG: ld [[SR:[0-9]+]], 16(1)
|
|
; CHECK-FP-DAG: ld 31, -8(1)
|
|
; CHECK-FP-DAG: ld 30, -16(1)
|
|
; CHECK-FP-DAG: mtlr [[SR]]
|
|
; CHECK-FP: blr
|
|
|
|
; CHECK-32-LABEL: @goo
|
|
; CHECK-32-DAG: mflr [[LR:[0-9]+]]
|
|
; CHECK-32-DAG: clrlwi [[REG:[0-9]+]], 1, 27
|
|
; CHECK-32-DAG: stw [[LR]], 4(1)
|
|
; CHECK-32-DAG: subfic 0, [[REG]], -64
|
|
; CHECK-32: stwux 1, 1, 0
|
|
; CHECK-32: sub 0, 1, 0
|
|
; CHECK-32: addic 0, 0, -4
|
|
; CHECK-32: stwx 31, 0, 0
|
|
; CHECK-32: addic 0, 0, -4
|
|
; CHECK-32: stwx 30, 0, 0
|
|
; CHECK-32: addic 30, 0, 8
|
|
|
|
; CHECK-32-PIC-LABEL: @goo
|
|
; CHECK-32-PIC-DAG: mflr [[LR:[0-9]+]]
|
|
; CHECK-32-PIC-DAG: clrlwi [[REG:[0-9]+]], 1, 27
|
|
; CHECK-32-PIC-DAG: stw [[LR]], 4(1)
|
|
; CHECK-32-PIC-DAG: subfic 0, [[REG]], -64
|
|
; CHECK-32-PIC: stwux 1, 1, 0
|
|
; CHECK-32-PIC: sub 0, 1, 0
|
|
; CHECK-32-PIC: addic 0, 0, -4
|
|
; CHECK-32-PIC: stwx 31, 0, 0
|
|
; CHECK-32-PIC: addic 0, 0, -4
|
|
; CHECK-32-PIC: stwx 30, 0, 0
|
|
; CHECK-32-PIC: addic 0, 0, -4
|
|
; CHECK-32-PIC: stwx 29, 0, 0
|
|
; CHECK-32-PIC: addic 29, 0, 12
|
|
|
|
; The large-frame-size case.
|
|
; @hoo: same shape as the small-frame function, but the local array has
; 200000 i32 elements, so the frame is large. Both fields of the byval struct
; are copied into the first two array elements before calling @bar.
define void @hoo(%struct.s* byval(%struct.s) nocapture readonly %a) {
|
|
entry:
|
|
; 200000 x i32 local, still requesting 32-byte alignment.
%x = alloca [200000 x i32], align 32
|
|
; x[0] = a->field0
%a1 = getelementptr inbounds %struct.s, %struct.s* %a, i64 0, i32 0
|
|
%0 = load i32, i32* %a1, align 4
|
|
%arrayidx = getelementptr inbounds [200000 x i32], [200000 x i32]* %x, i64 0, i64 0
|
|
store i32 %0, i32* %arrayidx, align 32
|
|
; x[1] = a->field1
%b = getelementptr inbounds %struct.s, %struct.s* %a, i64 0, i32 1
|
|
%1 = load i32, i32* %b, align 4
|
|
%arrayidx2 = getelementptr inbounds [200000 x i32], [200000 x i32]* %x, i64 0, i64 1
|
|
store i32 %1, i32* %arrayidx2, align 4
|
|
; Pass &x[0] to the external callee.
call void @bar(i32* %arrayidx)
|
|
ret void
|
|
}
|
|
|
|
; CHECK-LABEL: @hoo
|
|
|
|
; CHECK-DAG: lis [[REG1:[0-9]+]], -13
|
|
; CHECK-DAG: clrldi [[REG3:[0-9]+]], 1, 59
|
|
; CHECK-DAG: mflr {{[0-9]+}}
|
|
; CHECK-DAG: ori [[REG2:[0-9]+]], [[REG1]], 51808
|
|
; CHECK-DAG: std 30, -16(1)
|
|
; CHECK-DAG: mr 30, 1
|
|
; CHECK-DAG: std 0, 16(1)
|
|
; CHECK-DAG: subc 0, [[REG2]], [[REG3]]
|
|
; CHECK: stdux 1, 1, 0
|
|
|
|
; CHECK: .cfi_def_cfa_register r30
|
|
|
|
; CHECK: blr
|
|
|
|
; CHECK-32-LABEL: @hoo
|
|
|
|
; CHECK-32-DAG: lis [[REG1:[0-9]+]], -13
|
|
; CHECK-32-DAG: clrlwi [[REG3:[0-9]+]], 1, 27
|
|
; CHECK-32-DAG: mflr [[LR:[0-9]+]]
|
|
; CHECK-32-DAG: ori [[REG2:[0-9]+]], [[REG1]], 51904
|
|
; CHECK-32-DAG: stw [[LR]], 4(1)
|
|
; CHECK-32-DAG: subc 0, [[REG2]], [[REG3]]
|
|
; CHECK-32: stwux 1, 1, 0
|
|
; CHECK-32: sub 0, 1, 0
|
|
; CHECK-32: addic 0, 0, -4
|
|
; CHECK-32: stwx 31, 0, 0
|
|
; CHECK-32: addic 0, 0, -4
|
|
; CHECK-32: stwx 30, 0, 0
|
|
; CHECK-32: addic 30, 0, 8
|
|
|
|
; CHECK-32: blr
|
|
|
|
; CHECK-32-PIC-LABEL: @hoo
|
|
|
|
; CHECK-32-PIC-DAG: lis [[REG1:[0-9]+]], -13
|
|
; CHECK-32-PIC-DAG: clrlwi [[REG3:[0-9]+]], 1, 27
|
|
; CHECK-32-PIC-DAG: mflr {{[0-9]+}}
|
|
; CHECK-32-PIC-DAG: ori [[REG2:[0-9]+]], [[REG1]], 51904
|
|
; CHECK-32-PIC-DAG: stw 0, 4(1)
|
|
; CHECK-32-PIC-DAG: subc 0, [[REG2]], [[REG3]]
|
|
; CHECK-32-PIC: stwux 1, 1, 0
|
|
; CHECK-32-PIC: sub 0, 1, 0
|
|
; CHECK-32-PIC: addic 0, 0, -4
|
|
; CHECK-32-PIC: stwx 31, 0, 0
|
|
; CHECK-32-PIC: addic 0, 0, -8
|
|
; CHECK-32-PIC: stwx 29, 0, 0
|
|
; CHECK-32-PIC: addic 29, 0, 12
|
|
|
|
; CHECK-32-PIC: blr
|
|
|
|
; Make sure that the FP save area is still allocated correctly relative to
|
|
; where r30 is saved.
|
|
; @loo: small-frame body (two-element, 32-byte-aligned array filled from the
; byval struct and passed to @bar) followed by an inline asm that lists f30
; as clobbered. The checks after this function expect an stfd of f30 at
; -16(30) and r30 saved at -32(1).
define void @loo(%struct.s* byval(%struct.s) nocapture readonly %a) {
|
|
entry:
|
|
; Two-element i32 local requesting 32-byte alignment.
%x = alloca [2 x i32], align 32
|
|
; x[0] = a->field0
%a1 = getelementptr inbounds %struct.s, %struct.s* %a, i64 0, i32 0
|
|
%0 = load i32, i32* %a1, align 4
|
|
%arrayidx = getelementptr inbounds [2 x i32], [2 x i32]* %x, i64 0, i64 0
|
|
store i32 %0, i32* %arrayidx, align 32
|
|
; x[1] = a->field1
%b = getelementptr inbounds %struct.s, %struct.s* %a, i64 0, i32 1
|
|
%1 = load i32, i32* %b, align 4
|
|
%arrayidx2 = getelementptr inbounds [2 x i32], [2 x i32]* %x, i64 0, i64 1
|
|
store i32 %1, i32* %arrayidx2, align 4
|
|
; Pass &x[0] to the external callee.
call void @bar(i32* %arrayidx)
|
|
; Empty asm string; its only constraint is the f30 clobber.
; NOTE(review): presumably this exists to force a floating-point
; callee-saved spill into the frame -- confirm.
call void asm sideeffect "", "~{f30}"() nounwind
|
|
ret void
|
|
}
|
|
|
|
; CHECK-LABEL: @loo
|
|
|
|
; CHECK-DAG: mflr {{[0-9]+}}
|
|
; CHECK-DAG: clrldi [[REG:[0-9]+]], 1, 59
|
|
; CHECK-DAG: std 30, -32(1)
|
|
; CHECK-DAG: mr 30, 1
|
|
; CHECK-DAG: std 0, 16(1)
|
|
; CHECK-DAG: subfic 0, [[REG]], -192
|
|
; CHECK: stdux 1, 1, 0
|
|
|
|
; CHECK: .cfi_def_cfa_register r30
|
|
|
|
; CHECK: stfd 30, -16(30)
|
|
|
|
; CHECK: blr
|
|
|
|
; CHECK-FP-LABEL: @loo
|
|
|
|
; CHECK-FP-DAG: mflr {{[0-9]+}}
|
|
; CHECK-FP-DAG: clrldi [[REG:[0-9]+]], 1, 59
|
|
; CHECK-FP-DAG: std 31, -24(1)
|
|
; CHECK-FP-DAG: std 30, -32(1)
|
|
; CHECK-FP-DAG: mr 30, 1
|
|
; CHECK-FP-DAG: std 0, 16(1)
|
|
; CHECK-FP-DAG: subfic 0, [[REG]], -192
|
|
; CHECK-FP: stdux 1, 1, 0
|
|
|
|
; CHECK-FP: .cfi_def_cfa_register r30
|
|
|
|
; CHECK-FP: stfd 30, -16(30)
|
|
|
|
; CHECK-FP: blr
|