mirror of
https://github.com/RPCS3/llvm-mirror.git
synced 2024-11-23 03:02:36 +01:00
8ed3c99d18
Determine the insert/extractelement costs when performing this as a sequence of aliased loads+stores via the stack.
41 lines
1.5 KiB
LLVM
41 lines
1.5 KiB
LLVM
; RUN: opt < %s -cost-model -analyze -mtriple=x86_64-apple-macosx10.8.0 -mcpu=corei7-avx | FileCheck %s
|
|
|
|
target datalayout = "e-p:64:64:64-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:64:64-f32:32:32-f64:64:64-v64:64:64-v128:128:128-a0:0:64-s0:64:64-f80:128:128-n8:16:32:64-S128"
|
|
target triple = "x86_64-apple-macosx10.8.0"
|
|
|
|
define i32 @insert-extract-at-zero-idx(i32 %arg, float %fl) {
|
|
;CHECK: cost of 0 {{.*}} extract
|
|
%A = extractelement <4 x float> undef, i32 0
|
|
;CHECK: cost of 1 {{.*}} extract
|
|
%B = extractelement <4 x i32> undef, i32 0
|
|
;CHECK: cost of 1 {{.*}} extract
|
|
%C = extractelement <4 x float> undef, i32 1
|
|
|
|
;CHECK: cost of 0 {{.*}} extract
|
|
%D = extractelement <8 x float> undef, i32 0
|
|
;CHECK: cost of 1 {{.*}} extract
|
|
%E = extractelement <8 x float> undef, i32 1
|
|
|
|
;CHECK: cost of 3 {{.*}} extract
|
|
%F = extractelement <8 x float> undef, i32 %arg
|
|
|
|
;CHECK: cost of 0 {{.*}} insert
|
|
%G = insertelement <4 x float> undef, float %fl, i32 0
|
|
;CHECK: cost of 1 {{.*}} insert
|
|
%H = insertelement <4 x float> undef, float %fl, i32 1
|
|
;CHECK: cost of 1 {{.*}} insert
|
|
%I = insertelement <4 x i32> undef, i32 %arg, i32 0
|
|
|
|
;CHECK: cost of 0 {{.*}} insert
|
|
%J = insertelement <4 x double> undef, double undef, i32 0
|
|
|
|
;CHECK: cost of 0 {{.*}} insert
|
|
%K = insertelement <8 x double> undef, double undef, i32 4
|
|
;CHECK: cost of 0 {{.*}} insert
|
|
%L = insertelement <16 x double> undef, double undef, i32 8
|
|
;CHECK: cost of 1 {{.*}} insert
|
|
%M = insertelement <16 x double> undef, double undef, i32 9
|
|
ret i32 0
|
|
}
|
|
|