mirror of
https://github.com/RPCS3/llvm-mirror.git
synced 2024-11-23 11:13:28 +01:00
[LICM] When we are recomputing the alias sets for a subloop, we cannot
skip sub-subloops. The logic to skip subloops dated from when this code was shared with the cached case. Once it was factored out to only run in the case of recomputed subloops it became a dangerous bug. If a subsubloop contained an interfering instruction it would be silently skipped from the alias sets for LICM. With the old pass manager this was extremely hard to trigger as it would require failing to visit these subloops with the LICM pass but then visiting the outer loop somehow. I've not yet contrived any test case that actually manages to trigger this. But with the new pass manager we don't do the cross-loop caching hack that the old PM does and so we recompute alias set information from first principles. While this seems much cleaner and simpler it exposed this bug and would subtly miscompile code due to failing to correctly model the aliasing constraints of deeply nested loops. llvm-svn: 293273
This commit is contained in:
parent
e87466a278
commit
7ddff7f375
@ -1224,10 +1224,7 @@ LoopInvariantCodeMotion::collectAliasInfoForLoop(Loop *L, LoopInfo *LI,
|
||||
|
||||
auto mergeLoop = [&](Loop *L) {
|
||||
// Loop over the body of this loop, looking for calls, invokes, and stores.
|
||||
// Because subloops have already been incorporated into AST, we skip blocks
|
||||
// in subloops.
|
||||
for (BasicBlock *BB : L->blocks())
|
||||
if (LI->getLoopFor(BB) == L) // Ignore blocks in subloops.
|
||||
CurAST->add(*BB); // Incorporate the specified basic block
|
||||
};
|
||||
|
||||
|
76
test/Transforms/LICM/unrolled-deeply-nested.ll
Normal file
76
test/Transforms/LICM/unrolled-deeply-nested.ll
Normal file
@ -0,0 +1,76 @@
|
||||
; Test that LICM correctly detects conflicting accesses to memory in deeply
|
||||
; nested subloops. This works in the legacy PM due to a special retained map of
|
||||
; alias information for inner loops, and in the new PM it is recomputed for each
|
||||
; loop.
|
||||
;
|
||||
; RUN: opt -S -aa-pipeline=basic-aa -passes='require<opt-remark-emit>,loop(licm)' < %s | FileCheck %s
|
||||
; RUN: opt -S -basicaa -licm < %s | FileCheck %s
|
||||
|
||||
define i32 @test(i32* %a, i64 %n.0, i64 %n.0.0, i64 %n.0.0.0, i64 %n.0.0.0.0) nounwind uwtable readonly {
|
||||
; CHECK-LABEL: define i32 @test
|
||||
entry:
|
||||
%b = alloca i32
|
||||
%c = alloca i32
|
||||
%a.i8 = bitcast i32* %a to i8*
|
||||
%b.i8 = bitcast i32* %b to i8*
|
||||
%c.i8 = bitcast i32* %c to i8*
|
||||
br label %l.0.header
|
||||
; CHECK: %b = alloca i32
|
||||
; CHECK: %c = alloca i32
|
||||
; CHECK: %[[AI8:.*]] = bitcast i32* %a to i8*
|
||||
; CHECK: %[[BI8:.*]] = bitcast i32* %b to i8*
|
||||
; CHECK: %[[CI8:.*]] = bitcast i32* %c to i8*
|
||||
; CHECK-NOT: load
|
||||
; CHECK: br
|
||||
|
||||
l.0.header:
|
||||
%iv.0 = phi i64 [ %iv.0.next, %l.0.latch ], [ 0, %entry ]
|
||||
%iv.0.next = add i64 %iv.0, 1
|
||||
%exitcond.0 = icmp eq i64 %iv.0.next, %n.0
|
||||
%a.val = load i32, i32* %a
|
||||
store i32 %a.val, i32* %b
|
||||
%c.val = trunc i64 %iv.0 to i32
|
||||
store i32 %c.val, i32* %c
|
||||
br label %l.0.0.header
|
||||
; CHECK: %[[AV:.*]] = load i32, i32* %a
|
||||
; CHECK: store i32 %[[AV]], i32* %b
|
||||
; CHECK: %[[CT:.*]] = trunc i64 {{.*}} to i32
|
||||
; CHECK: store i32 %[[CT]], i32* %c
|
||||
; CHECK: br
|
||||
|
||||
l.0.0.header:
|
||||
%iv.0.0 = phi i64 [ %iv.0.0.next, %l.0.0.latch ], [ 0, %l.0.header ]
|
||||
%iv.0.0.next = add i64 %iv.0.0, 1
|
||||
%exitcond.0.0 = icmp eq i64 %iv.0.0.next, %n.0.0
|
||||
br label %l.0.0.0.header
|
||||
; CHECK: br
|
||||
|
||||
l.0.0.0.header:
|
||||
%iv.0.0.0 = phi i64 [ %iv.0.0.0.next, %l.0.0.0.header ], [ 0, %l.0.0.header ]
|
||||
%iv.0.0.0.next = add i64 %iv.0.0.0, 1
|
||||
%exitcond.0.0.0 = icmp eq i64 %iv.0.0.0.next, %n.0.0.0
|
||||
call void @llvm.memcpy.p0i8.p0i8.i64(i8* %a.i8, i8* %c.i8, i64 4, i32 1, i1 false)
|
||||
call void @llvm.memcpy.p0i8.p0i8.i64(i8* %b.i8, i8* %c.i8, i64 4, i32 1, i1 false)
|
||||
br i1 %exitcond.0.0.0, label %l.0.0.0.header, label %l.0.0.latch
|
||||
; CHECK: call void @llvm.memcpy.{{.*}}(i8* %[[AI8]], i8* %[[CI8]], i64 4
|
||||
; CHECK: call void @llvm.memcpy.{{.*}}(i8* %[[BI8]], i8* %[[CI8]], i64 4
|
||||
; CHECK: br
|
||||
|
||||
l.0.0.latch:
|
||||
br i1 %exitcond.0.0, label %l.0.0.header, label %l.0.latch
|
||||
; CHECK: br
|
||||
|
||||
l.0.latch:
|
||||
%b.val = load i32, i32* %b
|
||||
br i1 %exitcond.0, label %exit, label %l.0.header
|
||||
; CHECK: %[[BV:.*]] = load i32, i32* %b
|
||||
; CHECK: br
|
||||
|
||||
exit:
|
||||
%result.lcssa = phi i32 [ %b.val, %l.0.latch ]
|
||||
ret i32 %b.val
|
||||
; CHECK: %[[LCSSA:.*]] = phi i32 [ %[[BV]], %{{.*}} ]
|
||||
; CHECK: ret i32 %[[LCSSA]]
|
||||
}
|
||||
|
||||
declare void @llvm.memcpy.p0i8.p0i8.i64(i8* nocapture writeonly, i8* nocapture readonly, i64, i32, i1)
|
Loading…
Reference in New Issue
Block a user