mirror of
https://github.com/RPCS3/llvm-mirror.git
synced 2024-10-24 21:42:54 +02:00
5a59407f3b
MIPS32 has instructions for efficient count-leading/trailing-zeros, so this should be considered a cheap operation (and therefore fair game for speculation) for any MIPS32 implementation. The net result of allowing this speculation for the regression tests in this patch is that we get this code: ctlz: jr $ra clz $2, $4 cttz: addiu $1, $4, -1 not $2, $4 and $1, $2, $1 clz $1, $1 addiu $2, $zero, 32 jr $ra subu $2, $2, $1 Instead of: ctlz: beqz $4, $BB0_2 addiu $2, $zero, 32 clz $2, $4 $BB0_2: jr $ra nop cttz: beqz $4, $BB1_2 addiu $2, $zero, 32 addiu $1, $4, -1 not $2, $4 and $1, $2, $1 clz $1, $1 addiu $2, $zero, 32 subu $2, $2, $1 $BB1_2: jr $ra nop See D14469 for the larger motivation. Differential Revision: http://reviews.llvm.org/D14500 llvm-svn: 252755
44 lines
1.2 KiB
LLVM
44 lines
1.2 KiB
LLVM
; RUN: opt -S -simplifycfg -mtriple=mips-linux-gnu < %s | FileCheck %s
|
|
|
|
define i32 @ctlz(i32 %A) {
|
|
; CHECK-LABEL: @ctlz(
|
|
; CHECK: [[ICMP:%[A-Za-z0-9]+]] = icmp eq i32 %A, 0
|
|
; CHECK-NEXT: [[CTZ:%[A-Za-z0-9]+]] = tail call i32 @llvm.ctlz.i32(i32 %A, i1 true)
|
|
; CHECK-NEXT: [[SEL:%[A-Za-z0-9.]+]] = select i1 [[ICMP]], i32 32, i32 [[CTZ]]
|
|
; CHECK-NEXT: ret i32 [[SEL]]
|
|
entry:
|
|
%tobool = icmp eq i32 %A, 0
|
|
br i1 %tobool, label %cond.end, label %cond.true
|
|
|
|
cond.true:
|
|
%0 = tail call i32 @llvm.ctlz.i32(i32 %A, i1 true)
|
|
br label %cond.end
|
|
|
|
cond.end:
|
|
%cond = phi i32 [ %0, %cond.true ], [ 32, %entry ]
|
|
ret i32 %cond
|
|
}
|
|
|
|
define i32 @cttz(i32 %A) {
|
|
; CHECK-LABEL: @cttz(
|
|
; CHECK: [[ICMP:%[A-Za-z0-9]+]] = icmp eq i32 %A, 0
|
|
; CHECK-NEXT: [[CTZ:%[A-Za-z0-9]+]] = tail call i32 @llvm.cttz.i32(i32 %A, i1 true)
|
|
; CHECK-NEXT: [[SEL:%[A-Za-z0-9.]+]] = select i1 [[ICMP]], i32 32, i32 [[CTZ]]
|
|
; CHECK-NEXT: ret i32 [[SEL]]
|
|
entry:
|
|
%tobool = icmp eq i32 %A, 0
|
|
br i1 %tobool, label %cond.end, label %cond.true
|
|
|
|
cond.true:
|
|
%0 = tail call i32 @llvm.cttz.i32(i32 %A, i1 true)
|
|
br label %cond.end
|
|
|
|
cond.end:
|
|
%cond = phi i32 [ %0, %cond.true ], [ 32, %entry ]
|
|
ret i32 %cond
|
|
}
|
|
|
|
declare i32 @llvm.ctlz.i32(i32, i1)
|
|
declare i32 @llvm.cttz.i32(i32, i1)
|
|
|