mirror of
https://github.com/RPCS3/llvm-mirror.git
synced 2024-11-23 19:23:23 +01:00
90105ec5c8
The optimisation remarks for loop unrolling with an unrolled remainder looks something like: test.c:7:18: remark: completely unrolled loop with 3 iterations [-Rpass=loop-unroll] C[i] += A[i*N+j]; ^ test.c:6:9: remark: unrolled loop by a factor of 4 with run-time trip count [-Rpass=loop-unroll] for(int j = 0; j < N; j++) ^ This removes the first of the two messages. Differential revision: https://reviews.llvm.org/D38725 llvm-svn: 316986
48 lines
1.8 KiB
LLVM
48 lines
1.8 KiB
LLVM
; RUN: opt < %s -S -loop-unroll -pass-remarks=loop-unroll -unroll-count=16 2>&1 | FileCheck -check-prefix=COMPLETE-UNROLL %s
|
|
; RUN: opt < %s -S -loop-unroll -pass-remarks=loop-unroll -unroll-count=4 2>&1 | FileCheck -check-prefix=PARTIAL-UNROLL %s
|
|
; RUN: opt < %s -S -loop-unroll -pass-remarks=loop-unroll -unroll-count=4 -unroll-runtime=true -unroll-remainder 2>&1 | FileCheck %s --check-prefix=RUNTIME-UNROLL
|
|
|
|
; COMPLETE-UNROLL: remark: {{.*}}: completely unrolled loop with 16 iterations
|
|
; PARTIAL-UNROLL: remark: {{.*}}: unrolled loop by a factor of 4
|
|
; RUNTIME-UNROLL: remark: {{.*}}: unrolled loop by a factor of 4
|
|
|
|
define i32 @sum() {
|
|
entry:
|
|
br label %for.body
|
|
|
|
for.body: ; preds = %for.body, %entry
|
|
%s.06 = phi i32 [ 0, %entry ], [ %add1, %for.body ]
|
|
%i.05 = phi i32 [ 0, %entry ], [ %inc, %for.body ]
|
|
%add = add nsw i32 %i.05, 4
|
|
%call = tail call i32 @baz(i32 %add) #2
|
|
%add1 = add nsw i32 %call, %s.06
|
|
%inc = add nsw i32 %i.05, 1
|
|
%exitcond = icmp eq i32 %inc, 16
|
|
br i1 %exitcond, label %for.end, label %for.body
|
|
|
|
for.end: ; preds = %for.body
|
|
ret i32 %add1
|
|
}
|
|
|
|
; RUNTIME-UNROLL-NOT: remark: {{.*}}: completely unrolled loop with 3 iterations
|
|
; RUNTIME-UNROLL: remark: {{.*}}: unrolled loop by a factor of 4
|
|
|
|
define i32 @runtime(i32 %n) {
|
|
entry:
|
|
br label %for.body
|
|
|
|
for.body: ; preds = %for.body, %entry
|
|
%s.06 = phi i32 [ 0, %entry ], [ %add1, %for.body ]
|
|
%i.05 = phi i32 [ 0, %entry ], [ %inc, %for.body ]
|
|
%add = add nsw i32 %i.05, 4
|
|
%call = tail call i32 @baz(i32 %add) #2
|
|
%add1 = add nsw i32 %call, %s.06
|
|
%inc = add nsw i32 %i.05, 1
|
|
%exitcond = icmp eq i32 %inc, %n
|
|
br i1 %exitcond, label %for.end, label %for.body
|
|
|
|
for.end: ; preds = %for.body
|
|
ret i32 %add1
|
|
}
|
|
|
|
declare i32 @baz(i32) |