mirror of
https://github.com/RPCS3/llvm-mirror.git
synced 2025-02-01 05:01:59 +01:00
07981cc027
This patch fixes PR39695. The original LoopSink only considers memory alias in loop body. But PR39695 shows that instructions following sink candidate in preheader should also be checked. This is a conservative patch, it simply adds whole preheader block to alias set. It may lose some optimization opportunity, but I think that is very rare because: 1 in the most common case st/ld to the same address, the load should already be optimized away. 2 usually preheader is not very large. Differential Revision: https://reviews.llvm.org/D54659 llvm-svn: 347325
38 lines
1.2 KiB
LLVM
38 lines
1.2 KiB
LLVM
; RUN: opt -S -loop-sink < %s | FileCheck %s
|
|
|
|
; The load instruction should not be sunk into following loop.
|
|
; CHECK: @foo
|
|
; CHECK-NEXT: entry
|
|
; CHECK-NEXT: %ptr = load i8*, i8** %pp, align 8
|
|
; CHECK-NEXT: store i8* null, i8** %pp, align 8
|
|
|
|
define i32 @foo(i32 %n, i8** %pp) !prof !0 {
|
|
entry:
|
|
%ptr = load i8*, i8** %pp, align 8
|
|
store i8* null, i8** %pp, align 8
|
|
br label %for.cond
|
|
|
|
for.cond: ; preds = %for.body, %entry
|
|
%i.0 = phi i32 [ 0, %entry ], [ %inc, %for.body ]
|
|
%cmp = icmp ult i32 %i.0, %n
|
|
br i1 %cmp, label %for.body, label %for.end, !prof !1
|
|
|
|
for.body: ; preds = %for.cond
|
|
%0 = sext i32 %i.0 to i64
|
|
%arrayidx = getelementptr inbounds i8, i8* %ptr, i64 %0
|
|
%1 = load i8, i8* %arrayidx, align 1
|
|
%or19 = call i8 @llvm.bitreverse.i8(i8 %1)
|
|
%v = sext i8 %or19 to i32
|
|
%inc = add i32 %i.0, %v
|
|
br label %for.cond
|
|
|
|
for.end: ; preds = %for.cond
|
|
ret i32 %i.0
|
|
}
|
|
|
|
declare i8 @llvm.bitreverse.i8(i8) #0
|
|
attributes #0 = { nounwind readnone speculatable }
|
|
|
|
!0 = !{!"function_entry_count", i64 1}
|
|
!1 = !{!"branch_weights", i32 1, i32 2000}
|