2009-09-11 20:36:27 +02:00
|
|
|
; RUN: llc < %s -march=cellspu > %t1.s
|
Convert all tests using TCL-style quoting to use shell-style quoting.
This was done through the aid of a terrible Perl creation. I will not
paste any of the horrors here. Suffice to say, it require multiple
staged rounds of replacements, state carried between, and a few
nested-construct-parsing hacks that I'm not proud of. It happens, by
luck, to be able to deal with all the TCL-quoting patterns in evidence
in the LLVM test suite.
If anyone is maintaining large out-of-tree test trees, feel free to poke
me and I'll send you the steps I used to convert things, as well as
answer any painful questions etc. IRC works best for this type of thing
I find.
Once converted, switch the LLVM lit config to use ShTests the same as
Clang. In addition to being able to delete large amounts of Python code
from 'lit', this will also simplify the entire test suite and some of
lit's architecture.
Finally, the test suite runs 33% faster on Linux now. ;]
For my 16-hardware-thread (2x 4-core xeon e5520): 36s -> 24s
llvm-svn: 159525
2012-07-02 14:47:22 +02:00
|
|
|
; RUN: grep 'stqd.*0($3)' %t1.s | count 4
|
|
|
|
; RUN: grep 'stqd.*16($3)' %t1.s | count 4
|
2008-11-25 18:29:43 +01:00
|
|
|
; RUN: grep 16256 %t1.s | count 2
|
|
|
|
; RUN: grep 16384 %t1.s | count 1
|
2008-12-27 05:51:36 +01:00
|
|
|
; RUN: grep 771 %t1.s | count 4
|
|
|
|
; RUN: grep 515 %t1.s | count 2
|
|
|
|
; RUN: grep 1799 %t1.s | count 2
|
2009-03-25 21:20:11 +01:00
|
|
|
; RUN: grep 1543 %t1.s | count 5
|
|
|
|
; RUN: grep 1029 %t1.s | count 3
|
Convert all tests using TCL-style quoting to use shell-style quoting.
This was done through the aid of a terrible Perl creation. I will not
paste any of the horrors here. Suffice to say, it require multiple
staged rounds of replacements, state carried between, and a few
nested-construct-parsing hacks that I'm not proud of. It happens, by
luck, to be able to deal with all the TCL-quoting patterns in evidence
in the LLVM test suite.
If anyone is maintaining large out-of-tree test trees, feel free to poke
me and I'll send you the steps I used to convert things, as well as
answer any painful questions etc. IRC works best for this type of thing
I find.
Once converted, switch the LLVM lit config to use ShTests the same as
Clang. In addition to being able to delete large amounts of Python code
from 'lit', this will also simplify the entire test suite and some of
lit's architecture.
Finally, the test suite runs 33% faster on Linux now. ;]
For my 16-hardware-thread (2x 4-core xeon e5520): 36s -> 24s
llvm-svn: 159525
2012-07-02 14:47:22 +02:00
|
|
|
; RUN: grep 'shli.*, 4' %t1.s | count 4
|
2008-11-25 18:29:43 +01:00
|
|
|
; RUN: grep stqx %t1.s | count 4
|
2009-03-25 21:20:11 +01:00
|
|
|
; RUN: grep ilhu %t1.s | count 11
|
|
|
|
; RUN: grep iohl %t1.s | count 8
|
|
|
|
; RUN: grep shufb %t1.s | count 15
|
2008-12-27 05:51:36 +01:00
|
|
|
; RUN: grep frds %t1.s | count 1
|
2010-11-12 11:14:03 +01:00
|
|
|
; RUN: llc < %s -march=cellspu | FileCheck %s
|
2008-11-21 03:56:16 +01:00
|
|
|
|
|
|
|
; ModuleID = 'stores.bc'
|
|
|
|
target datalayout = "E-p:32:32:128-f64:64:128-f32:32:128-i64:32:128-i32:32:128-i16:16:128-i8:8:128-i1:8:128-a0:0:128-v128:128:128-s0:128:128"
|
|
|
|
target triple = "spu"
|
|
|
|
|
2008-11-25 18:29:43 +01:00
|
|
|
define void @store_v16i8_1(<16 x i8>* %a) nounwind {
|
|
|
|
entry:
|
|
|
|
store <16 x i8> < i8 1, i8 2, i8 1, i8 1, i8 1, i8 2, i8 1, i8 1, i8 1, i8 2, i8 1, i8 1, i8 1, i8 2, i8 1, i8 1 >, <16 x i8>* %a
|
|
|
|
ret void
|
|
|
|
}
|
|
|
|
|
|
|
|
define void @store_v16i8_2(<16 x i8>* %a) nounwind {
|
|
|
|
entry:
|
|
|
|
%arrayidx = getelementptr <16 x i8>* %a, i32 1
|
|
|
|
store <16 x i8> < i8 2, i8 2, i8 2, i8 2, i8 2, i8 2, i8 2, i8 2, i8 2, i8 2, i8 2, i8 2, i8 2, i8 2, i8 2, i8 2 >, <16 x i8>* %arrayidx
|
|
|
|
ret void
|
|
|
|
}
|
|
|
|
|
|
|
|
define void @store_v16i8_3(<16 x i8>* %a, i32 %i) nounwind {
|
|
|
|
entry:
|
|
|
|
%arrayidx = getelementptr <16 x i8>* %a, i32 %i
|
|
|
|
store <16 x i8> < i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1 >, <16 x i8>* %arrayidx
|
|
|
|
ret void
|
|
|
|
}
|
|
|
|
|
|
|
|
define void @store_v8i16_1(<8 x i16>* %a) nounwind {
|
|
|
|
entry:
|
|
|
|
store <8 x i16> < i16 1, i16 2, i16 1, i16 1, i16 1, i16 2, i16 1, i16 1 >, <8 x i16>* %a
|
|
|
|
ret void
|
|
|
|
}
|
|
|
|
|
|
|
|
define void @store_v8i16_2(<8 x i16>* %a) nounwind {
|
|
|
|
entry:
|
|
|
|
%arrayidx = getelementptr <8 x i16>* %a, i16 1
|
|
|
|
store <8 x i16> < i16 2, i16 2, i16 2, i16 2, i16 2, i16 2, i16 2, i16 2 >, <8 x i16>* %arrayidx
|
|
|
|
ret void
|
|
|
|
}
|
|
|
|
|
|
|
|
define void @store_v8i16_3(<8 x i16>* %a, i32 %i) nounwind {
|
|
|
|
entry:
|
|
|
|
%arrayidx = getelementptr <8 x i16>* %a, i32 %i
|
|
|
|
store <8 x i16> < i16 1, i16 1, i16 1, i16 1, i16 1, i16 1, i16 1, i16 1 >, <8 x i16>* %arrayidx
|
|
|
|
ret void
|
|
|
|
}
|
|
|
|
|
|
|
|
define void @store_v4i32_1(<4 x i32>* %a) nounwind {
|
|
|
|
entry:
|
|
|
|
store <4 x i32> < i32 1, i32 2, i32 1, i32 1 >, <4 x i32>* %a
|
|
|
|
ret void
|
|
|
|
}
|
|
|
|
|
|
|
|
define void @store_v4i32_2(<4 x i32>* %a) nounwind {
|
|
|
|
entry:
|
|
|
|
%arrayidx = getelementptr <4 x i32>* %a, i32 1
|
|
|
|
store <4 x i32> < i32 2, i32 2, i32 2, i32 2 >, <4 x i32>* %arrayidx
|
|
|
|
ret void
|
|
|
|
}
|
|
|
|
|
|
|
|
define void @store_v4i32_3(<4 x i32>* %a, i32 %i) nounwind {
|
|
|
|
entry:
|
|
|
|
%arrayidx = getelementptr <4 x i32>* %a, i32 %i
|
|
|
|
store <4 x i32> < i32 1, i32 1, i32 1, i32 1 >, <4 x i32>* %arrayidx
|
|
|
|
ret void
|
|
|
|
}
|
|
|
|
|
2008-11-21 03:56:16 +01:00
|
|
|
define void @store_v4f32_1(<4 x float>* %a) nounwind {
|
|
|
|
entry:
|
|
|
|
store <4 x float> < float 1.000000e+00, float 1.000000e+00, float 1.000000e+00, float 1.000000e+00 >, <4 x float>* %a
|
|
|
|
ret void
|
|
|
|
}
|
|
|
|
|
|
|
|
define void @store_v4f32_2(<4 x float>* %a) nounwind {
|
|
|
|
entry:
|
|
|
|
%arrayidx = getelementptr <4 x float>* %a, i32 1
|
|
|
|
store <4 x float> < float 2.000000e+00, float 2.000000e+00, float 2.000000e+00, float 2.000000e+00 >, <4 x float>* %arrayidx
|
|
|
|
ret void
|
|
|
|
}
|
2008-11-25 18:29:43 +01:00
|
|
|
|
|
|
|
define void @store_v4f32_3(<4 x float>* %a, i32 %i) nounwind {
|
|
|
|
entry:
|
|
|
|
%arrayidx = getelementptr <4 x float>* %a, i32 %i
|
|
|
|
store <4 x float> < float 1.000000e+00, float 1.000000e+00, float 1.000000e+00, float 1.000000e+00 >, <4 x float>* %arrayidx
|
|
|
|
ret void
|
|
|
|
}
|
2008-12-27 05:51:36 +01:00
|
|
|
|
|
|
|
; Test truncating stores:
|
|
|
|
|
|
|
|
define zeroext i8 @tstore_i16_i8(i16 signext %val, i8* %dest) nounwind {
|
|
|
|
entry:
|
|
|
|
%conv = trunc i16 %val to i8
|
|
|
|
store i8 %conv, i8* %dest
|
|
|
|
ret i8 %conv
|
|
|
|
}
|
|
|
|
|
|
|
|
define zeroext i8 @tstore_i32_i8(i32 %val, i8* %dest) nounwind {
|
|
|
|
entry:
|
|
|
|
%conv = trunc i32 %val to i8
|
|
|
|
store i8 %conv, i8* %dest
|
|
|
|
ret i8 %conv
|
|
|
|
}
|
|
|
|
|
|
|
|
define signext i16 @tstore_i32_i16(i32 %val, i16* %dest) nounwind {
|
|
|
|
entry:
|
|
|
|
%conv = trunc i32 %val to i16
|
|
|
|
store i16 %conv, i16* %dest
|
|
|
|
ret i16 %conv
|
|
|
|
}
|
|
|
|
|
|
|
|
define zeroext i8 @tstore_i64_i8(i64 %val, i8* %dest) nounwind {
|
|
|
|
entry:
|
|
|
|
%conv = trunc i64 %val to i8
|
|
|
|
store i8 %conv, i8* %dest
|
|
|
|
ret i8 %conv
|
|
|
|
}
|
|
|
|
|
|
|
|
define signext i16 @tstore_i64_i16(i64 %val, i16* %dest) nounwind {
|
|
|
|
entry:
|
|
|
|
%conv = trunc i64 %val to i16
|
|
|
|
store i16 %conv, i16* %dest
|
|
|
|
ret i16 %conv
|
|
|
|
}
|
|
|
|
|
|
|
|
define i32 @tstore_i64_i32(i64 %val, i32* %dest) nounwind {
|
|
|
|
entry:
|
|
|
|
%conv = trunc i64 %val to i32
|
|
|
|
store i32 %conv, i32* %dest
|
|
|
|
ret i32 %conv
|
|
|
|
}
|
|
|
|
|
|
|
|
define float @tstore_f64_f32(double %val, float* %dest) nounwind {
|
|
|
|
entry:
|
|
|
|
%conv = fptrunc double %val to float
|
|
|
|
store float %conv, float* %dest
|
|
|
|
ret float %conv
|
|
|
|
}
|
2010-11-12 11:14:03 +01:00
|
|
|
|
|
|
|
;Check stores that might span two 16 byte memory blocks
|
|
|
|
define void @store_misaligned( i32 %val, i32* %ptr) {
|
|
|
|
;CHECK: store_misaligned
|
|
|
|
;CHECK: lqd
|
|
|
|
;CHECK: lqd
|
|
|
|
;CHECK: stqd
|
|
|
|
;CHECK: stqd
|
|
|
|
;CHECK: bi $lr
|
|
|
|
store i32 %val, i32*%ptr, align 2
|
|
|
|
ret void
|
|
|
|
}
|
2011-01-17 12:59:20 +01:00
|
|
|
|
|
|
|
define void @store_v8( <8 x float> %val, <8 x float>* %ptr )
|
|
|
|
{
|
|
|
|
;CHECK: stq
|
|
|
|
;CHECK: stq
|
|
|
|
;CHECK: bi $lr
|
|
|
|
store <8 x float> %val, <8 x float>* %ptr
|
|
|
|
ret void
|
|
|
|
}
|
2011-03-04 13:00:11 +01:00
|
|
|
|
|
|
|
define void @store_null_vec( <4 x i32> %val ) {
|
|
|
|
; FIXME - this is for some reason compiled into a il+stqd, not a sta.
|
|
|
|
;CHECK: stqd
|
|
|
|
;CHECK: bi $lr
|
|
|
|
store <4 x i32> %val, <4 x i32>* null
|
|
|
|
ret void
|
|
|
|
}
|