2010-08-27 00:23:39 +02:00
|
|
|
; RUN: opt < %s -instcombine -S | FileCheck %s
|
2010-08-27 22:32:06 +02:00
|
|
|
target datalayout = "e-p:64:64:64-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:64:64-f32:32:32-f64:64:64-v64:64:64-v128:128:128-a0:0:64-s0:64:64-f80:128:128-n8:16:32:64"
|
2009-06-18 01:17:05 +02:00
|
|
|
|
2009-06-18 18:30:21 +02:00
|
|
|
; Instcombine should be able to eliminate all of these ext casts.
|
2009-06-18 01:17:05 +02:00
|
|
|
|
|
|
|
declare void @use(i32)
|
|
|
|
|
2010-08-27 00:23:39 +02:00
|
|
|
define i64 @test1(i64 %a) {
|
2009-06-18 01:17:05 +02:00
|
|
|
%b = trunc i64 %a to i32
|
|
|
|
%c = and i32 %b, 15
|
|
|
|
%d = zext i32 %c to i64
|
|
|
|
call void @use(i32 %b)
|
|
|
|
ret i64 %d
|
2010-08-27 00:23:39 +02:00
|
|
|
; CHECK: @test1
|
|
|
|
; CHECK: %d = and i64 %a, 15
|
|
|
|
; CHECK: ret i64 %d
|
2009-06-18 01:17:05 +02:00
|
|
|
}
|
2010-08-27 00:23:39 +02:00
|
|
|
define i64 @test2(i64 %a) {
|
2009-06-18 01:17:05 +02:00
|
|
|
%b = trunc i64 %a to i32
|
|
|
|
%c = shl i32 %b, 4
|
|
|
|
%q = ashr i32 %c, 4
|
|
|
|
%d = sext i32 %q to i64
|
|
|
|
call void @use(i32 %b)
|
|
|
|
ret i64 %d
|
2010-08-27 00:23:39 +02:00
|
|
|
; CHECK: @test2
|
|
|
|
; CHECK: shl i64 %a, 36
|
|
|
|
; CHECK: %d = ashr i64 {{.*}}, 36
|
|
|
|
; CHECK: ret i64 %d
|
2009-06-18 01:17:05 +02:00
|
|
|
}
|
2010-08-27 00:23:39 +02:00
|
|
|
define i64 @test3(i64 %a) {
|
2009-06-18 18:30:21 +02:00
|
|
|
%b = trunc i64 %a to i32
|
|
|
|
%c = and i32 %b, 8
|
|
|
|
%d = zext i32 %c to i64
|
|
|
|
call void @use(i32 %b)
|
|
|
|
ret i64 %d
|
2010-08-27 00:23:39 +02:00
|
|
|
; CHECK: @test3
|
|
|
|
; CHECK: %d = and i64 %a, 8
|
|
|
|
; CHECK: ret i64 %d
|
2009-06-18 18:30:21 +02:00
|
|
|
}
|
2010-08-27 00:23:39 +02:00
|
|
|
define i64 @test4(i64 %a) {
|
2009-06-18 18:30:21 +02:00
|
|
|
%b = trunc i64 %a to i32
|
|
|
|
%c = and i32 %b, 8
|
|
|
|
%x = xor i32 %c, 8
|
|
|
|
%d = zext i32 %x to i64
|
|
|
|
call void @use(i32 %b)
|
|
|
|
ret i64 %d
|
2010-08-27 00:23:39 +02:00
|
|
|
; CHECK: @test4
|
|
|
|
; CHECK: = and i64 %a, 8
|
|
|
|
; CHECK: %d = xor i64 {{.*}}, 8
|
|
|
|
; CHECK: ret i64 %d
|
2009-06-18 18:30:21 +02:00
|
|
|
}
|
Add an instcombine to clean up a common pattern produced
by the SRoA "promote to large integer" code, eliminating
some type conversions like this:
%94 = zext i16 %93 to i32 ; <i32> [#uses=2]
%96 = lshr i32 %94, 8 ; <i32> [#uses=1]
%101 = trunc i32 %96 to i8 ; <i8> [#uses=1]
This also unblocks other xforms from happening, now clang is able to compile:
struct S { float A, B, C, D; };
float foo(struct S A) { return A.A + A.B+A.C+A.D; }
into:
_foo: ## @foo
## BB#0: ## %entry
pshufd $1, %xmm0, %xmm2
addss %xmm0, %xmm2
movdqa %xmm1, %xmm3
addss %xmm2, %xmm3
pshufd $1, %xmm1, %xmm0
addss %xmm3, %xmm0
ret
on x86-64, instead of:
_foo: ## @foo
## BB#0: ## %entry
movd %xmm0, %rax
shrq $32, %rax
movd %eax, %xmm2
addss %xmm0, %xmm2
movapd %xmm1, %xmm3
addss %xmm2, %xmm3
movd %xmm1, %rax
shrq $32, %rax
movd %eax, %xmm0
addss %xmm3, %xmm0
ret
This seems pretty close to optimal to me, at least without
using horizontal adds. This also triggers in lots of other
code, including SPEC.
llvm-svn: 112278
2010-08-27 20:31:05 +02:00
|
|
|
|
|
|
|
define i32 @test5(i32 %A) {
|
|
|
|
%B = zext i32 %A to i128
|
|
|
|
%C = lshr i128 %B, 16
|
|
|
|
%D = trunc i128 %C to i32
|
|
|
|
ret i32 %D
|
|
|
|
; CHECK: @test5
|
|
|
|
; CHECK: %C = lshr i32 %A, 16
|
|
|
|
; CHECK: ret i32 %C
|
|
|
|
}
|
|
|
|
|
|
|
|
define i32 @test6(i64 %A) {
|
|
|
|
%B = zext i64 %A to i128
|
|
|
|
%C = lshr i128 %B, 32
|
|
|
|
%D = trunc i128 %C to i32
|
|
|
|
ret i32 %D
|
|
|
|
; CHECK: @test6
|
|
|
|
; CHECK: %C = lshr i64 %A, 32
|
|
|
|
; CHECK: %D = trunc i64 %C to i32
|
|
|
|
; CHECK: ret i32 %D
|
|
|
|
}
|
|
|
|
|
|
|
|
define i92 @test7(i64 %A) {
|
|
|
|
%B = zext i64 %A to i128
|
|
|
|
%C = lshr i128 %B, 32
|
|
|
|
%D = trunc i128 %C to i92
|
|
|
|
ret i92 %D
|
|
|
|
; CHECK: @test7
|
2010-08-27 22:32:06 +02:00
|
|
|
; CHECK: %B = zext i64 %A to i92
|
|
|
|
; CHECK: %C = lshr i92 %B, 32
|
|
|
|
; CHECK: ret i92 %C
|
|
|
|
}
|
|
|
|
|
|
|
|
define i64 @test8(i32 %A, i32 %B) {
|
|
|
|
%tmp38 = zext i32 %A to i128
|
|
|
|
%tmp32 = zext i32 %B to i128
|
|
|
|
%tmp33 = shl i128 %tmp32, 32
|
|
|
|
%ins35 = or i128 %tmp33, %tmp38
|
|
|
|
%tmp42 = trunc i128 %ins35 to i64
|
|
|
|
ret i64 %tmp42
|
|
|
|
; CHECK: @test8
|
|
|
|
; CHECK: %tmp38 = zext i32 %A to i64
|
|
|
|
; CHECK: %tmp32 = zext i32 %B to i64
|
|
|
|
; CHECK: %tmp33 = shl i64 %tmp32, 32
|
|
|
|
; CHECK: %ins35 = or i64 %tmp33, %tmp38
|
|
|
|
; CHECK: ret i64 %ins35
|
|
|
|
}
|
|
|
|
|