mirror of
https://github.com/RPCS3/llvm-mirror.git
synced 2024-11-25 04:02:41 +01:00
a59eb7c09c
what it does. Enhance it to return false for optimizing vector sign extensions from vector comparisons, which is the idiom used to get a splatted vector for a vector comparison. Doing this breaks vector-casts.ll, so add some compensating transformations to handle the important case they cover without depending on this canonicalization. This fixes rdar://7434900, a serious pessimization of vector compares. llvm-svn: 95855
124 lines
3.4 KiB
LLVM
124 lines
3.4 KiB
LLVM
; RUN: opt < %s -instcombine -S | FileCheck %s

; Truncating <2 x i64> to <2 x i1> keeps only the low bit of every lane.
; This turns into a&1 != 0
; The directives inside the body pin that form: an `and` with a splat of 1
; followed by an `icmp ne` against zero.
define <2 x i1> @test1(<2 x i64> %a) {
  %t = trunc <2 x i64> %a to <2 x i1>
  ret <2 x i1> %t

; CHECK: @test1
; CHECK: and <2 x i64> %a, <i64 1, i64 1>
; CHECK: icmp ne <2 x i64> %tmp, zeroinitializer
}

; The ashr turns into an lshr.
; The mask 65535 leaves the sign bit of every i64 lane clear, so an arithmetic
; and a logical right shift of %b produce the same value.
define <2 x i64> @test2(<2 x i64> %a) {
  %b = and <2 x i64> %a, <i64 65535, i64 65535>
  %t = ashr <2 x i64> %b, <i64 1, i64 1>
  ret <2 x i64> %t

; CHECK: @test2
; CHECK: and <2 x i64> %a, <i64 65535, i64 65535>
; CHECK: lshr <2 x i64> %b, <i64 1, i64 1>
}

; Builds a per-lane mask from two ordered compares: %a and %b are each tested
; with `fcmp ord` against zero, the i1 results are sign-extended to i32 lanes,
; and-ed together, and the result is bitcast to <2 x i64>.
; The directives inside the body expect the two compares to be merged into a
; single `fcmp ord` of %a against %b.
define <2 x i64> @test3(<4 x float> %a, <4 x float> %b) nounwind readnone {
entry:
  %cmp = fcmp ord <4 x float> %a, zeroinitializer
  %sext = sext <4 x i1> %cmp to <4 x i32>
  %cmp4 = fcmp ord <4 x float> %b, zeroinitializer
  %sext5 = sext <4 x i1> %cmp4 to <4 x i32>
  %and = and <4 x i32> %sext, %sext5
  %conv = bitcast <4 x i32> %and to <2 x i64>
  ret <2 x i64> %conv

; CHECK: @test3
; CHECK: fcmp ord <4 x float> %a, %b
}

; Builds a per-lane mask from two unordered compares: %a and %b are each
; tested with `fcmp uno` against zero, the i1 results are sign-extended to i32
; lanes, or-ed together, and the result is bitcast to <2 x i64>.
; The directives inside the body expect the two compares to be merged into a
; single `fcmp uno` of %a against %b.
define <2 x i64> @test4(<4 x float> %a, <4 x float> %b) nounwind readnone {
entry:
  %cmp = fcmp uno <4 x float> %a, zeroinitializer
  %sext = sext <4 x i1> %cmp to <4 x i32>
  %cmp4 = fcmp uno <4 x float> %b, zeroinitializer
  %sext5 = sext <4 x i1> %cmp4 to <4 x i32>
  %or = or <4 x i32> %sext, %sext5
  %conv = bitcast <4 x i32> %or to <2 x i64>
  ret <2 x i64> %conv
; CHECK: @test4
; CHECK: fcmp uno <4 x float> %a, %b
}

; rdar://7434900
; %a and %b are each compared `ult` against zero; every i1 lane is
; sign-extended to i32 (0 or all-ones), the two masks are and-ed, and the
; result is bitcast to <2 x i64>.
; The directives inside the body expect both sign extensions of the compare
; results to still be present in the output.
define <2 x i64> @test5(<4 x float> %a, <4 x float> %b) nounwind readnone {
entry:
  %cmp = fcmp ult <4 x float> %a, zeroinitializer
  %sext = sext <4 x i1> %cmp to <4 x i32>
  %cmp4 = fcmp ult <4 x float> %b, zeroinitializer
  %sext5 = sext <4 x i1> %cmp4 to <4 x i32>
  %and = and <4 x i32> %sext, %sext5
  %conv = bitcast <4 x i32> %and to <2 x i64>
  ret <2 x i64> %conv

; CHECK: @test5
; CHECK: sext <4 x i1> %cmp to <4 x i32>
; CHECK: sext <4 x i1> %cmp4 to <4 x i32>
}

; Truncates every i64 lane of %src to i32, adds 1 to each lane, and stores the
; resulting <2 x i32> through %dst.addr.
; NOTE(review): no output directives are attached to this function in the
; visible file; presumably it only guards against opt failing on this input.
; Confirm before adding expectations.
define void @convert(<2 x i32>* %dst.addr, <2 x i64> %src) nounwind {
entry:
  %val = trunc <2 x i64> %src to <2 x i32>
  %add = add <2 x i32> %val, <i32 1, i32 1>
  store <2 x i32> %add, <2 x i32>* %dst.addr
  ret void
}

; Truncates each i64 lane to i32, then zero-extends it to the wider,
; non-power-of-two lane type i65.
; NOTE(review): no output directives are attached here; presumably a
; must-not-crash case. Confirm.
define <2 x i65> @foo(<2 x i64> %t) {
  %a = trunc <2 x i64> %t to <2 x i32>
  %b = zext <2 x i32> %a to <2 x i65>
  ret <2 x i65> %b
}

; Truncates each i65 lane to i32, then zero-extends it to i64, so the result
; lane type is narrower than the source lane type.
; NOTE(review): no output directives are attached here; presumably a
; must-not-crash case. Confirm.
define <2 x i64> @bar(<2 x i65> %t) {
  %a = trunc <2 x i65> %t to <2 x i32>
  %b = zext <2 x i32> %a to <2 x i64>
  ret <2 x i64> %b
}

; Truncates each i64 lane to i32, then sign-extends it to the wider,
; non-power-of-two lane type i65.
; NOTE(review): no output directives are attached here; presumably a
; must-not-crash case. Confirm.
define <2 x i65> @foos(<2 x i64> %t) {
  %a = trunc <2 x i64> %t to <2 x i32>
  %b = sext <2 x i32> %a to <2 x i65>
  ret <2 x i65> %b
}

; Truncates each i65 lane to i32, then sign-extends it to i64, so the result
; lane type is narrower than the source lane type.
; NOTE(review): no output directives are attached here; presumably a
; must-not-crash case. Confirm.
define <2 x i64> @bars(<2 x i65> %t) {
  %a = trunc <2 x i65> %t to <2 x i32>
  %b = sext <2 x i32> %a to <2 x i64>
  ret <2 x i64> %b
}

; Truncates each i64 lane to i32 and sign-extends it back to i64, i.e. each
; result lane is the sign extension of the low 32 bits of the input lane.
; NOTE(review): no output directives are attached here; presumably a
; must-not-crash case. Confirm.
define <2 x i64> @quxs(<2 x i64> %t) {
  %a = trunc <2 x i64> %t to <2 x i32>
  %b = sext <2 x i32> %a to <2 x i64>
  ret <2 x i64> %b
}

; Shifts each i64 lane left by 32 and then arithmetically right by 32: the
; shift-pair form of sign-extending the low 32 bits of each lane.
; NOTE(review): no output directives are attached here; presumably a
; must-not-crash case. Confirm.
define <2 x i64> @quxt(<2 x i64> %t) {
  %a = shl <2 x i64> %t, <i64 32, i64 32>
  %b = ashr <2 x i64> %a, <i64 32, i64 32>
  ret <2 x i64> %b
}

; Narrows each double lane to float with fptrunc, then widens it back to
; double with fpext.
; NOTE(review): no output directives are attached here; presumably a
; must-not-crash case. Confirm.
define <2 x double> @fa(<2 x double> %t) {
  %a = fptrunc <2 x double> %t to <2 x float>
  %b = fpext <2 x float> %a to <2 x double>
  ret <2 x double> %b
}

; Converts each double lane to an unsigned i64 with fptoui, then back to
; double with uitofp.
; NOTE(review): no output directives are attached here; presumably a
; must-not-crash case. Confirm.
define <2 x double> @fb(<2 x double> %t) {
  %a = fptoui <2 x double> %t to <2 x i64>
  %b = uitofp <2 x i64> %a to <2 x double>
  ret <2 x double> %b
}

; Converts each double lane to a signed i64 with fptosi, then back to double
; with sitofp.
; NOTE(review): no output directives are attached here; presumably a
; must-not-crash case. Confirm.
define <2 x double> @fc(<2 x double> %t) {
  %a = fptosi <2 x double> %t to <2 x i64>
  %b = sitofp <2 x i64> %a to <2 x double>
  ret <2 x double> %b
}