mirror of
https://github.com/RPCS3/llvm-mirror.git
synced 2025-01-31 20:51:52 +01:00
d53723ece8
In the presence of packed structures (#pragma pack(1)) where elements are referenced through pointers, there will be stores/loads with alignment values matching the default alignments for the element types while the elements are in fact unaligned. Strictly speaking this is incorrect source code, but is unfortunately part of existing code and therefore now addressed. This patch improves the pattern predicate for PC-relative loads and stores by not only checking the alignment value of the instruction, but also making sure that the symbol (and element) itself is aligned. Fixes https://bugs.llvm.org/show_bug.cgi?id=44405 Review: Ulrich Weigand Differential Revision: https://reviews.llvm.org/D87510
210 lines
5.7 KiB
LLVM
210 lines
5.7 KiB
LLVM
; RUN: llc < %s -mtriple=s390x-linux-gnu | FileCheck %s
|
|
;
|
|
; Test PC-relative memory accesses of globals with packed struct types.
|
|
; PC-relative memory accesses cannot be used when the address is not
|
|
; aligned. This can happen with programs like the following (which are not
|
|
; strictly correct):
|
|
;
|
|
; #pragma pack(1)
|
|
; struct {
|
|
; short a;
|
|
; int b;
|
|
; } c;
|
|
;
|
|
; void main() {
|
|
; int *e = &c.b;
|
|
; *e = 0;
|
|
; }
|
|
;
|
|
|
|
%packed.i16i32 = type <{ i16, i32 }>
|
|
%packed.i16i32i16i32 = type <{ i16, i32, i16, i32 }>
|
|
%packed.i16i64 = type <{ i16, i64 }>
|
|
%packed.i8i16 = type <{ i8, i16 }>
|
|
|
|
@A_align2 = global %packed.i16i32 zeroinitializer, align 2
|
|
@B_align2 = global %packed.i16i32i16i32 zeroinitializer, align 2
|
|
@C_align2 = global %packed.i16i64 zeroinitializer, align 2
|
|
@D_align4 = global %packed.i16i32 zeroinitializer, align 4
|
|
@E_align4 = global %packed.i16i32i16i32 zeroinitializer, align 4
|
|
@F_align2 = global %packed.i8i16 zeroinitializer, align 2
|
|
|
|
;;; Stores
|
|
|
|
; unaligned packed struct + 2 -> unaligned address
|
|
define void @f1() {
|
|
; CHECK-LABEL: f1:
|
|
; CHECK: larl %r1, A_align2
|
|
; CHECK: mvhi 2(%r1), 0
|
|
; CHECK: br %r14
|
|
store i32 0, i32* getelementptr inbounds (%packed.i16i32, %packed.i16i32* @A_align2, i64 0, i32 1), align 4
|
|
ret void
|
|
}
|
|
|
|
; unaligned packed struct + 8 -> unaligned address
|
|
define void @f2() {
|
|
; CHECK-LABEL: f2:
|
|
; CHECK: larl %r1, B_align2
|
|
; CHECK: mvhi 8(%r1), 0
|
|
; CHECK: br %r14
|
|
store i32 0, i32* getelementptr inbounds (%packed.i16i32i16i32, %packed.i16i32i16i32* @B_align2, i64 0, i32 3), align 4
|
|
ret void
|
|
}
|
|
|
|
; aligned packed struct + 2 -> unaligned address
|
|
define void @f3() {
|
|
; CHECK-LABEL: f3:
|
|
; CHECK: larl %r1, D_align4
|
|
; CHECK: mvhi 2(%r1), 0
|
|
; CHECK: br %r14
|
|
store i32 0, i32* getelementptr inbounds (%packed.i16i32, %packed.i16i32* @D_align4, i64 0, i32 1), align 4
|
|
ret void
|
|
}
|
|
|
|
; aligned packed struct + 8 -> aligned address
|
|
define void @f4() {
|
|
; CHECK-LABEL: f4:
|
|
; CHECK: lhi %r0, 0
|
|
; CHECK: strl %r0, E_align4+8
|
|
; CHECK: br %r14
|
|
store i32 0, i32* getelementptr inbounds (%packed.i16i32i16i32, %packed.i16i32i16i32* @E_align4, i64 0, i32 3), align 4
|
|
ret void
|
|
}
|
|
|
|
define void @f5() {
|
|
; CHECK-LABEL: f5:
|
|
; CHECK: larl %r1, C_align2
|
|
; CHECK: mvghi 2(%r1), 0
|
|
; CHECK: br %r14
|
|
store i64 0, i64* getelementptr inbounds (%packed.i16i64, %packed.i16i64* @C_align2, i64 0, i32 1), align 8
|
|
ret void
|
|
}
|
|
|
|
define void @f6() {
|
|
; CHECK-LABEL: f6:
|
|
; CHECK-NOT: sthrl
|
|
store i16 0, i16* getelementptr inbounds (%packed.i8i16, %packed.i8i16* @F_align2, i64 0, i32 1), align 2
|
|
ret void
|
|
}
|
|
|
|
define void @f7(i64* %Src) {
|
|
; CHECK-LABEL: f7:
|
|
; CHECK: lg %r0, 0(%r2)
|
|
; CHECK: larl %r1, D_align4
|
|
; CHECK: st %r0, 2(%r1)
|
|
; CHECK: br %r14
|
|
%L = load i64, i64* %Src
|
|
%T = trunc i64 %L to i32
|
|
store i32 %T, i32* getelementptr inbounds (%packed.i16i32, %packed.i16i32* @D_align4, i64 0, i32 1), align 4
|
|
ret void
|
|
}
|
|
|
|
define void @f8(i64* %Src) {
|
|
; CHECK-LABEL: f8:
|
|
; CHECK-NOT: sthrl
|
|
%L = load i64, i64* %Src
|
|
%T = trunc i64 %L to i16
|
|
store i16 %T, i16* getelementptr inbounds (%packed.i8i16, %packed.i8i16* @F_align2, i64 0, i32 1), align 2
|
|
ret void
|
|
}
|
|
|
|
;;; Loads
|
|
|
|
; unaligned packed struct + 2 -> unaligned address
|
|
define i32 @f9() {
|
|
; CHECK-LABEL: f9:
|
|
; CHECK: larl %r1, A_align2
|
|
; CHECK: l %r2, 2(%r1)
|
|
; CHECK: br %r14
|
|
%L = load i32, i32* getelementptr inbounds (%packed.i16i32, %packed.i16i32* @A_align2, i64 0, i32 1), align 4
|
|
ret i32 %L
|
|
}
|
|
|
|
; unaligned packed struct + 8 -> unaligned address
|
|
define i32 @f10() {
|
|
; CHECK-LABEL: f10:
|
|
; CHECK: larl %r1, B_align2
|
|
; CHECK: l %r2, 8(%r1)
|
|
; CHECK: br %r14
|
|
%L = load i32, i32* getelementptr inbounds (%packed.i16i32i16i32, %packed.i16i32i16i32* @B_align2, i64 0, i32 3), align 4
|
|
ret i32 %L
|
|
}
|
|
|
|
; aligned packed struct + 2 -> unaligned address
|
|
define i32 @f11() {
|
|
; CHECK-LABEL: f11:
|
|
; CHECK: larl %r1, D_align4
|
|
; CHECK: l %r2, 2(%r1)
|
|
; CHECK: br %r14
|
|
%L = load i32, i32* getelementptr inbounds (%packed.i16i32, %packed.i16i32* @D_align4, i64 0, i32 1), align 4
|
|
ret i32 %L
|
|
}
|
|
|
|
; aligned packed struct + 8 -> aligned address
|
|
define i32 @f12() {
|
|
; CHECK-LABEL: f12:
|
|
; CHECK: lrl %r2, E_align4+8
|
|
; CHECK: br %r14
|
|
%L = load i32, i32* getelementptr inbounds (%packed.i16i32i16i32, %packed.i16i32i16i32* @E_align4, i64 0, i32 3), align 4
|
|
ret i32 %L
|
|
}
|
|
|
|
define i64 @f13() {
|
|
; CHECK-LABEL: f13:
|
|
; CHECK: larl %r1, C_align2
|
|
; CHECK: lg %r2, 2(%r1)
|
|
; CHECK: br %r14
|
|
%L = load i64, i64* getelementptr inbounds (%packed.i16i64, %packed.i16i64* @C_align2, i64 0, i32 1), align 8
|
|
ret i64 %L
|
|
}
|
|
|
|
define i32 @f14() {
|
|
; CHECK-LABEL: f14:
|
|
; CHECK-NOT: lhrl
|
|
%L = load i16, i16* getelementptr inbounds (%packed.i8i16, %packed.i8i16* @F_align2, i64 0, i32 1), align 2
|
|
%ext = sext i16 %L to i32
|
|
ret i32 %ext
|
|
}
|
|
|
|
define i64 @f15() {
|
|
; CHECK-LABEL: f15:
|
|
; CHECK-NOT: llghrl
|
|
%L = load i16, i16* getelementptr inbounds (%packed.i8i16, %packed.i8i16* @F_align2, i64 0, i32 1), align 2
|
|
%ext = zext i16 %L to i64
|
|
ret i64 %ext
|
|
}
|
|
|
|
;;; Loads folded into compare instructions
|
|
|
|
define i32 @f16(i32 %src1) {
|
|
; CHECK-LABEL: f16:
|
|
; CHECK: larl %r1, A_align2
|
|
; CHECK: c %r2, 2(%r1)
|
|
entry:
|
|
%src2 = load i32, i32* getelementptr inbounds (%packed.i16i32, %packed.i16i32* @A_align2, i64 0, i32 1), align 4
|
|
%cond = icmp slt i32 %src1, %src2
|
|
br i1 %cond, label %exit, label %mulb
|
|
mulb:
|
|
%mul = mul i32 %src1, %src1
|
|
br label %exit
|
|
exit:
|
|
%res = phi i32 [ %src1, %entry ], [ %mul, %mulb ]
|
|
ret i32 %res
|
|
}
|
|
|
|
define i64 @f17(i64 %src1) {
|
|
; CHECK-LABEL: f17:
|
|
; CHECK: larl %r1, C_align2
|
|
; CHECK: clg %r2, 2(%r1)
|
|
entry:
|
|
%src2 = load i64, i64* getelementptr inbounds (%packed.i16i64, %packed.i16i64* @C_align2, i64 0, i32 1), align 8
|
|
%cond = icmp ult i64 %src1, %src2
|
|
br i1 %cond, label %exit, label %mulb
|
|
mulb:
|
|
%mul = mul i64 %src1, %src1
|
|
br label %exit
|
|
exit:
|
|
%res = phi i64 [ %src1, %entry ], [ %mul, %mulb ]
|
|
ret i64 %res
|
|
}
|