ARM cost model: Address computation in vector mem ops not free

[oota-llvm.git] / lib / Target / ARM / ARMTargetTransformInfo.cpp
diff --git a/lib/Target/ARM/ARMTargetTransformInfo.cpp b/lib/Target/ARM/ARMTargetTransformInfo.cpp

index 1f91e0ee362761dafd08e7f0d7a5427982a26c9d..f6fa319970953d2312899b8957e43af5f02b0b7b 100644 (file)
--- a/lib/Target/ARM/ARMTargetTransformInfo.cpp
+++ b/lib/Target/ARM/ARMTargetTransformInfo.cpp
@@ -120,6 +120,8 @@ public:
    unsigned getCmpSelInstrCost(unsigned Opcode, Type *ValTy, Type *CondTy) const;
  
    unsigned getVectorInstrCost(unsigned Opcode, Type *Val, unsigned Index) const;
+
+  unsigned getAddressComputationCost(Type *Val) const;
    /// @}
  };
  
@@ -304,12 +306,13 @@ unsigned ARMTTI::getCastInstrCost(unsigned Opcode, Type *Dst,
  
  unsigned ARMTTI::getVectorInstrCost(unsigned Opcode, Type *ValTy,
                                      unsigned Index) const {
-  // Penalize inserting into an D-subregister.
+  // Penalize inserting into an D-subregister. We end up with a three times
+  // lower estimated throughput on swift.
    if (ST->isSwift() &&
        Opcode == Instruction::InsertElement &&
        ValTy->isVectorTy() &&
        ValTy->getScalarSizeInBits() <= 32)
-    return 2;
+    return 3;
  
    return TargetTransformInfo::getVectorInstrCost(Opcode, ValTy, Index);
  }
@@ -326,3 +329,9 @@ unsigned ARMTTI::getCmpSelInstrCost(unsigned Opcode, Type *ValTy,
  
    return TargetTransformInfo::getCmpSelInstrCost(Opcode, ValTy, CondTy);
  }
+
+unsigned ARMTTI::getAddressComputationCost(Type *Ty) const {
+  // In many cases the address computation is not merged into the instruction
+  // addressing mode.
+  return 1;
+}