diff options
| -rw-r--r-- | llvm/lib/Target/X86/X86TargetTransformInfo.cpp | 14 | ||||
| -rw-r--r-- | llvm/test/Analysis/CostModel/X86/cmp.ll | 16 | 
2 files changed, 19 insertions, 11 deletions
| diff --git a/llvm/lib/Target/X86/X86TargetTransformInfo.cpp b/llvm/lib/Target/X86/X86TargetTransformInfo.cpp index 6ffef1654ea..28ae96d4108 100644 --- a/llvm/lib/Target/X86/X86TargetTransformInfo.cpp +++ b/llvm/lib/Target/X86/X86TargetTransformInfo.cpp @@ -857,13 +857,17 @@ int X86TTIImpl::getCmpSelInstrCost(unsigned Opcode, Type *ValTy, Type *CondTy) {    int ISD = TLI->InstructionOpcodeToISD(Opcode);    assert(ISD && "Invalid opcode"); +  static const CostTblEntry SSE2CostTbl[] = { +    { ISD::SETCC,   MVT::v2i64,   8 }, +    { ISD::SETCC,   MVT::v4i32,   1 }, +    { ISD::SETCC,   MVT::v8i16,   1 }, +    { ISD::SETCC,   MVT::v16i8,   1 }, +  }; +    static const CostTblEntry SSE42CostTbl[] = {      { ISD::SETCC,   MVT::v2f64,   1 },      { ISD::SETCC,   MVT::v4f32,   1 },      { ISD::SETCC,   MVT::v2i64,   1 }, -    { ISD::SETCC,   MVT::v4i32,   1 }, -    { ISD::SETCC,   MVT::v8i16,   1 }, -    { ISD::SETCC,   MVT::v16i8,   1 },    };    static const CostTblEntry AVX1CostTbl[] = { @@ -906,6 +910,10 @@ int X86TTIImpl::getCmpSelInstrCost(unsigned Opcode, Type *ValTy, Type *CondTy) {      if (const auto *Entry = CostTableLookup(SSE42CostTbl, ISD, MTy))        return LT.first * Entry->Cost; +  if (ST->hasSSE2()) +    if (const auto *Entry = CostTableLookup(SSE2CostTbl, ISD, MTy)) +      return LT.first * Entry->Cost; +    return BaseT::getCmpSelInstrCost(Opcode, ValTy, CondTy);  } diff --git a/llvm/test/Analysis/CostModel/X86/cmp.ll b/llvm/test/Analysis/CostModel/X86/cmp.ll index 80fbbc47089..f4733d6737e 100644 --- a/llvm/test/Analysis/CostModel/X86/cmp.ll +++ b/llvm/test/Analysis/CostModel/X86/cmp.ll @@ -87,18 +87,18 @@ define i32 @cmp(i32 %arg) {    ;AVX:   cost of 1 {{.*}} icmp    %H = icmp eq <4 x i32> undef, undef -  ;SSE2:  cost of 1 {{.*}} icmp -  ;SSE3:  cost of 1 {{.*}} icmp -  ;SSSE3: cost of 1 {{.*}} icmp -  ;SSE41: cost of 1 {{.*}} icmp +  ;SSE2:  cost of 8 {{.*}} icmp +  ;SSE3:  cost of 8 {{.*}} icmp +  ;SSSE3: cost of 8 {{.*}} icmp +  ;SSE41: cost of 8 {{.*}} icmp    ;SSE42: cost of 1 {{.*}} icmp    ;AVX:   cost of 1 {{.*}} icmp    %I = icmp eq <2 x i64> undef, undef -  ;SSE2:  cost of 2 {{.*}} icmp -  ;SSE3:  cost of 2 {{.*}} icmp -  ;SSSE3: cost of 2 {{.*}} icmp -  ;SSE41: cost of 2 {{.*}} icmp +  ;SSE2:  cost of 16 {{.*}} icmp +  ;SSE3:  cost of 16 {{.*}} icmp +  ;SSSE3: cost of 16 {{.*}} icmp +  ;SSE41: cost of 16 {{.*}} icmp    ;SSE42: cost of 2 {{.*}} icmp    ;AVX1:  cost of 4 {{.*}} icmp    ;AVX2:  cost of 1 {{.*}} icmp | 

