mirror of
https://github.com/RPCS3/llvm-mirror.git
synced 2024-11-25 20:23:11 +01:00
d13f674130
and generalize it so that it can be used by IndVarSimplify. Implement the base IndVarSimplify transformation code using IVUsers. This removes TestOrigIVForWrap and associated code, as ScalarEvolution now has enough builtin overflow detection and folding logic to handle all the same cases, and more. Run "opt -iv-users -analyze -disable-output" on your favorite loop for an example of what IVUsers does. This lets IndVarSimplify eliminate IV casts and compute trip counts in more cases. Also, this happens to finally fix the remaining testcases in PR1301. Now that IndVarSimplify is being more aggressive, it occasionally runs into the problem where ScalarEvolutionExpander's code for avoiding duplicate expansions makes it difficult to ensure that all expanded instructions dominate all the instructions that will use them. As a temporary measure, IndVarSimplify now uses a FixUsesBeforeDefs function to fix up instructions inserted by SCEVExpander. Fortunately, this code is contained, and can be easily removed once a more comprehensive solution is available. llvm-svn: 71535
36 lines
994 B
LLVM
36 lines
994 B
LLVM
; RUN: llvm-as < %s | llc -march=x86-64 > %t
|
|
; RUN: grep addl %t
|
|
; RUN: not egrep {movl|movq} %t
|
|
|
|
; @foo(float* %B): an empty counted loop followed by an address computation
; that uses the value the loop counter holds when the loop exits.
;   - bb2/bb3 step an i64 counter from 0 by 1 for as long as it is
;     signed-less-than 20000; the loop does no other work.
;   - bb4 indexes %B by that counter value, converts the resulting pointer to
;     an integer and tests whether its low 32 bits are all zero.
;   - Returns the constant 7.0 when they are zero, otherwise the float loaded
;     from the address %B itself.
; The RUN lines at the top of this file require llc's x86-64 output to contain
; an addl and to contain no movl or movq.
; NOTE(review): the bare '|' lines below are not LLVM IR; they look like
; extraction residue from a web view of this file -- confirm against upstream.
define float @foo(float* %B) nounwind {
|
|
entry:
|
|
br label %bb2
|
|
|
|
; Loop header: the counter is 0 on entry and %indvar.next154 on the back edge.
bb2: ; preds = %bb3, %entry
|
|
%B_addr.0.rec = phi i64 [ %indvar.next154, %bb3 ], [ 0, %entry ] ; <i64> [#uses=2]
|
|
; Signed compare against 20000 decides between another iteration and the exit.
%z = icmp slt i64 %B_addr.0.rec, 20000
|
|
br i1 %z, label %bb3, label %bb4
|
|
|
|
; Loop latch: the increment is the only instruction in the loop body.
bb3: ; preds = %bb2
|
|
%indvar.next154 = add i64 %B_addr.0.rec, 1 ; <i64> [#uses=1]
|
|
br label %bb2
|
|
|
|
; Loop exit: the only use of the counter outside the loop is this address.
bb4: ; preds = %bb2
|
|
%B_addr.0 = getelementptr float* %B, i64 %B_addr.0.rec ; <float*> [#uses=1]
|
|
%t1 = ptrtoint float* %B_addr.0 to i64 ; <i64> [#uses=1]
|
|
; 4294967295 is 2^32 - 1, so the mask keeps only the low 32 bits of the address.
%t2 = and i64 %t1, 4294967295 ; <i64> [#uses=1]
|
|
%t3 = icmp eq i64 %t2, 0 ; <i1> [#uses=1]
|
|
br i1 %t3, label %bb5, label %bb10.preheader
|
|
|
|
; Pass-through block: it only forwards to bb9.
bb10.preheader: ; preds = %bb4
|
|
br label %bb9
|
|
|
|
; Taken when the masked address is zero.
bb5: ; preds = %bb4
|
|
ret float 7.0
|
|
|
|
; Taken when the masked address is non-zero: load and return the float at %B.
bb9: ; preds = %bb10.preheader
|
|
; A getelementptr with index 0 yields %B's own address.
%t5 = getelementptr float* %B, i64 0 ; <float*> [#uses=1]
|
|
%t7 = load float* %t5 ; <float> [#uses=1]
|
|
ret float %t7
|
|
}
|