mirror of
https://github.com/RPCS3/llvm-mirror.git
synced 2024-11-25 12:12:47 +01:00
[CostModel][X86] getCastInstrCost - attempt to match custom cast/conversion before legalized types.
Move the (SSE-only) generic, legalized type conversion matching after the specific, custom conversion cases, allowing us to properly provide cost overrides. The next step will be to clean up some of the weird existing costs and then to enable AVX+ legalized costs, which will let us strip out a lot of the cost table entries.
This commit is contained in:
parent
7a8e30eba0
commit
b53b3c8d1c
@ -1519,9 +1519,11 @@ InstructionCost X86TTIImpl::getCastInstrCost(unsigned Opcode, Type *Dst,
|
||||
return Cost;
|
||||
};
|
||||
|
||||
// The cost tables include both specific, custom (non-legal) src/dst type
|
||||
// conversions and generic, legalized types. We test for customs first, before
|
||||
// falling back to legalization.
|
||||
// FIXME: Need a better design of the cost table to handle non-simple types of
|
||||
// potential massive combinations (elem_num x src_type x dst_type).
|
||||
|
||||
static const TypeConversionCostTblEntry AVX512BWConversionTbl[] {
|
||||
{ ISD::SIGN_EXTEND, MVT::v32i16, MVT::v32i8, 1 },
|
||||
{ ISD::ZERO_EXTEND, MVT::v32i16, MVT::v32i8, 1 },
|
||||
@ -2173,6 +2175,74 @@ InstructionCost X86TTIImpl::getCastInstrCost(unsigned Opcode, Type *Dst,
|
||||
{ ISD::TRUNCATE, MVT::v2i32, MVT::v2i64, 1 }, // PSHUFD
|
||||
};
|
||||
|
||||
// Attempt to map directly to (simple) MVT types to let us match custom entries.
|
||||
EVT SrcTy = TLI->getValueType(DL, Src);
|
||||
EVT DstTy = TLI->getValueType(DL, Dst);
|
||||
|
||||
// The function getSimpleVT only handles simple value types.
|
||||
if (SrcTy.isSimple() && DstTy.isSimple()) {
|
||||
MVT SimpleSrcTy = SrcTy.getSimpleVT();
|
||||
MVT SimpleDstTy = DstTy.getSimpleVT();
|
||||
|
||||
if (ST->useAVX512Regs()) {
|
||||
if (ST->hasBWI())
|
||||
if (const auto *Entry = ConvertCostTableLookup(
|
||||
AVX512BWConversionTbl, ISD, SimpleDstTy, SimpleSrcTy))
|
||||
return AdjustCost(Entry->Cost);
|
||||
|
||||
if (ST->hasDQI())
|
||||
if (const auto *Entry = ConvertCostTableLookup(
|
||||
AVX512DQConversionTbl, ISD, SimpleDstTy, SimpleSrcTy))
|
||||
return AdjustCost(Entry->Cost);
|
||||
|
||||
if (ST->hasAVX512())
|
||||
if (const auto *Entry = ConvertCostTableLookup(
|
||||
AVX512FConversionTbl, ISD, SimpleDstTy, SimpleSrcTy))
|
||||
return AdjustCost(Entry->Cost);
|
||||
}
|
||||
|
||||
if (ST->hasBWI())
|
||||
if (const auto *Entry = ConvertCostTableLookup(
|
||||
AVX512BWVLConversionTbl, ISD, SimpleDstTy, SimpleSrcTy))
|
||||
return AdjustCost(Entry->Cost);
|
||||
|
||||
if (ST->hasDQI())
|
||||
if (const auto *Entry = ConvertCostTableLookup(
|
||||
AVX512DQVLConversionTbl, ISD, SimpleDstTy, SimpleSrcTy))
|
||||
return AdjustCost(Entry->Cost);
|
||||
|
||||
if (ST->hasAVX512())
|
||||
if (const auto *Entry = ConvertCostTableLookup(AVX512VLConversionTbl, ISD,
|
||||
SimpleDstTy, SimpleSrcTy))
|
||||
return AdjustCost(Entry->Cost);
|
||||
|
||||
if (ST->hasAVX2()) {
|
||||
if (const auto *Entry = ConvertCostTableLookup(AVX2ConversionTbl, ISD,
|
||||
SimpleDstTy, SimpleSrcTy))
|
||||
return AdjustCost(Entry->Cost);
|
||||
}
|
||||
|
||||
if (ST->hasAVX()) {
|
||||
if (const auto *Entry = ConvertCostTableLookup(AVXConversionTbl, ISD,
|
||||
SimpleDstTy, SimpleSrcTy))
|
||||
return AdjustCost(Entry->Cost);
|
||||
}
|
||||
|
||||
if (ST->hasSSE41()) {
|
||||
if (const auto *Entry = ConvertCostTableLookup(SSE41ConversionTbl, ISD,
|
||||
SimpleDstTy, SimpleSrcTy))
|
||||
return AdjustCost(Entry->Cost);
|
||||
}
|
||||
|
||||
if (ST->hasSSE2()) {
|
||||
if (const auto *Entry = ConvertCostTableLookup(SSE2ConversionTbl, ISD,
|
||||
SimpleDstTy, SimpleSrcTy))
|
||||
return AdjustCost(Entry->Cost);
|
||||
}
|
||||
}
|
||||
|
||||
// Fall back to legalized types.
|
||||
// TODO: Add AVX support.
|
||||
std::pair<InstructionCost, MVT> LTSrc = TLI->getTypeLegalizationCost(DL, Src);
|
||||
std::pair<InstructionCost, MVT> LTDest =
|
||||
TLI->getTypeLegalizationCost(DL, Dst);
|
||||
@ -2187,72 +2257,6 @@ InstructionCost X86TTIImpl::getCastInstrCost(unsigned Opcode, Type *Dst,
|
||||
LTDest.second, LTSrc.second))
|
||||
return AdjustCost(LTSrc.first * Entry->Cost);
|
||||
|
||||
EVT SrcTy = TLI->getValueType(DL, Src);
|
||||
EVT DstTy = TLI->getValueType(DL, Dst);
|
||||
|
||||
// The function getSimpleVT only handles simple value types.
|
||||
if (!SrcTy.isSimple() || !DstTy.isSimple())
|
||||
return AdjustCost(BaseT::getCastInstrCost(Opcode, Dst, Src, CCH, CostKind));
|
||||
|
||||
MVT SimpleSrcTy = SrcTy.getSimpleVT();
|
||||
MVT SimpleDstTy = DstTy.getSimpleVT();
|
||||
|
||||
if (ST->useAVX512Regs()) {
|
||||
if (ST->hasBWI())
|
||||
if (const auto *Entry = ConvertCostTableLookup(AVX512BWConversionTbl, ISD,
|
||||
SimpleDstTy, SimpleSrcTy))
|
||||
return AdjustCost(Entry->Cost);
|
||||
|
||||
if (ST->hasDQI())
|
||||
if (const auto *Entry = ConvertCostTableLookup(AVX512DQConversionTbl, ISD,
|
||||
SimpleDstTy, SimpleSrcTy))
|
||||
return AdjustCost(Entry->Cost);
|
||||
|
||||
if (ST->hasAVX512())
|
||||
if (const auto *Entry = ConvertCostTableLookup(AVX512FConversionTbl, ISD,
|
||||
SimpleDstTy, SimpleSrcTy))
|
||||
return AdjustCost(Entry->Cost);
|
||||
}
|
||||
|
||||
if (ST->hasBWI())
|
||||
if (const auto *Entry = ConvertCostTableLookup(AVX512BWVLConversionTbl, ISD,
|
||||
SimpleDstTy, SimpleSrcTy))
|
||||
return AdjustCost(Entry->Cost);
|
||||
|
||||
if (ST->hasDQI())
|
||||
if (const auto *Entry = ConvertCostTableLookup(AVX512DQVLConversionTbl, ISD,
|
||||
SimpleDstTy, SimpleSrcTy))
|
||||
return AdjustCost(Entry->Cost);
|
||||
|
||||
if (ST->hasAVX512())
|
||||
if (const auto *Entry = ConvertCostTableLookup(AVX512VLConversionTbl, ISD,
|
||||
SimpleDstTy, SimpleSrcTy))
|
||||
return AdjustCost(Entry->Cost);
|
||||
|
||||
if (ST->hasAVX2()) {
|
||||
if (const auto *Entry = ConvertCostTableLookup(AVX2ConversionTbl, ISD,
|
||||
SimpleDstTy, SimpleSrcTy))
|
||||
return AdjustCost(Entry->Cost);
|
||||
}
|
||||
|
||||
if (ST->hasAVX()) {
|
||||
if (const auto *Entry = ConvertCostTableLookup(AVXConversionTbl, ISD,
|
||||
SimpleDstTy, SimpleSrcTy))
|
||||
return AdjustCost(Entry->Cost);
|
||||
}
|
||||
|
||||
if (ST->hasSSE41()) {
|
||||
if (const auto *Entry = ConvertCostTableLookup(SSE41ConversionTbl, ISD,
|
||||
SimpleDstTy, SimpleSrcTy))
|
||||
return AdjustCost(Entry->Cost);
|
||||
}
|
||||
|
||||
if (ST->hasSSE2()) {
|
||||
if (const auto *Entry = ConvertCostTableLookup(SSE2ConversionTbl, ISD,
|
||||
SimpleDstTy, SimpleSrcTy))
|
||||
return AdjustCost(Entry->Cost);
|
||||
}
|
||||
|
||||
return AdjustCost(
|
||||
BaseT::getCastInstrCost(Opcode, Dst, Src, CCH, CostKind, I));
|
||||
}
|
||||
|
@ -391,7 +391,7 @@ define void @sitofp4(<4 x i1> %a, <4 x i8> %b, <4 x i16> %c, <4 x i32> %d) {
|
||||
; SSE41-NEXT: Cost Model: Found an estimated cost of 15 for instruction: %C1 = sitofp <4 x i16> %c to <4 x float>
|
||||
; SSE41-NEXT: Cost Model: Found an estimated cost of 80 for instruction: %C2 = sitofp <4 x i16> %c to <4 x double>
|
||||
; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %D1 = sitofp <4 x i32> %d to <4 x float>
|
||||
; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %D2 = sitofp <4 x i32> %d to <4 x double>
|
||||
; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %D2 = sitofp <4 x i32> %d to <4 x double>
|
||||
; SSE41-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret void
|
||||
;
|
||||
; AVX1-LABEL: 'sitofp4'
|
||||
|
@ -79,7 +79,7 @@ define i32 @sitofp_i32_double() {
|
||||
; SSE42-LABEL: 'sitofp_i32_double'
|
||||
; SSE42-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %cvt_i32_f64 = sitofp i32 undef to double
|
||||
; SSE42-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %cvt_v2i32_v2f64 = sitofp <2 x i32> undef to <2 x double>
|
||||
; SSE42-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %cvt_v4i32_v4f64 = sitofp <4 x i32> undef to <4 x double>
|
||||
; SSE42-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %cvt_v4i32_v4f64 = sitofp <4 x i32> undef to <4 x double>
|
||||
; SSE42-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %cvt_v8i32_v8f64 = sitofp <8 x i32> undef to <8 x double>
|
||||
; SSE42-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i32 undef
|
||||
;
|
||||
|
Loading…
Reference in New Issue
Block a user