switch the flag for using NEON for SP floating point to a subtarget 'feature'

author Jim Grosbach <grosbach@apple.com>

Thu, 25 Mar 2010 23:32:19 +0000 (23:32 +0000)

committer Jim Grosbach <grosbach@apple.com>

Thu, 25 Mar 2010 23:32:19 +0000 (23:32 +0000)
author Jim Grosbach <grosbach@apple.com>
Thu, 25 Mar 2010 23:32:19 +0000 (23:32 +0000)
committer Jim Grosbach <grosbach@apple.com>
Thu, 25 Mar 2010 23:32:19 +0000 (23:32 +0000)
diff --git a/lib/Target/ARM/ARM.td b/lib/Target/ARM/ARM.td

index 50d54b436e076aa4c4dd0c1e222c7a9ccfcdb783..931c81c5b632bf2e91f41e15e5c9d3dbfc29138a 100644 (file)
--- a/lib/Target/ARM/ARM.td
+++ b/lib/Target/ARM/ARM.td
@@ -49,8 +49,14 @@ def FeatureFP16   : SubtargetFeature<"fp16", "HasFP16", "true",
  // FIXME: Currently, this is only flagged for Cortex-A8. It may be true for
  // others as well. We should do more benchmarking and confirm one way or
  // the other.
-def HasSlowVMLx   : SubtargetFeature<"vmlx", "SlowVMLx", "true",
-                                     "Disable VFP MAC instructions">;
+def FeatureHasSlowVMLx   : SubtargetFeature<"vmlx", "SlowVMLx", "true",
+                                            "Disable VFP MAC instructions">;
+// Some processors benefit from using NEON instructions for scalar
+// single-precision FP operations.
+def FeatureNEONForFP : SubtargetFeature<"neonfp", "UseNEONForSinglePrecisionFP",
+                                        "true",
+                                        "Use NEON for single precision FP">;
+
  
  //===----------------------------------------------------------------------===//
  // ARM Processors supported.
@@ -115,7 +121,8 @@ def : Processor<"arm1156t2f-s",    ARMV6Itineraries,
  
  // V7 Processors.
  def : Processor<"cortex-a8",        CortexA8Itineraries,
-                [ArchV7A, FeatureThumb2, FeatureNEON, HasSlowVMLx]>;
+                [ArchV7A, FeatureThumb2, FeatureNEON, FeatureHasSlowVMLx,
+                 FeatureNEONForFP]>;
  def : ProcNoItin<"cortex-a9",       [ArchV7A, FeatureThumb2, FeatureNEON]>;
  
  //===----------------------------------------------------------------------===//
diff --git a/lib/Target/ARM/ARMSubtarget.cpp b/lib/Target/ARM/ARMSubtarget.cpp

index 76ed66fe7df401582a5e43d6242251ffc14212e9..9e55cd870031b4154a0ac2bf45eda8bf945a0e31 100644 (file)
--- a/lib/Target/ARM/ARMSubtarget.cpp
+++ b/lib/Target/ARM/ARMSubtarget.cpp
@@ -22,10 +22,6 @@ using namespace llvm;
  static cl::opt<bool>
  ReserveR9("arm-reserve-r9", cl::Hidden,
            cl::desc("Reserve R9, making it unavailable as GPR"));
-static cl::opt<bool>
-UseNEONFP("arm-use-neon-fp",
-          cl::desc("Use NEON for single-precision FP"),
-          cl::init(false), cl::Hidden);
  
  static cl::opt<bool>
  UseMOVT("arm-use-movt",
@@ -35,7 +31,7 @@ ARMSubtarget::ARMSubtarget(const std::string &TT, const std::string &FS,
                             bool isT)
    : ARMArchVersion(V4)
    , ARMFPUType(None)
-  , UseNEONForSinglePrecisionFP(UseNEONFP)
+  , UseNEONForSinglePrecisionFP(false)
    , SlowVMLx(false)
    , IsThumb(isT)
    , ThumbMode(Thumb1)
@@ -116,14 +112,6 @@ ARMSubtarget::ARMSubtarget(const std::string &TT, const std::string &FS,
  
    if (!isThumb() || hasThumb2())
      PostRAScheduler = true;
-
-  // Set CPU specific features.
-  if (CPUString == "cortex-a8") {
-    // On Cortex-a8, it's faster to perform some single-precision FP
-    // operations with NEON instructions.
-    if (UseNEONFP.getPosition() == 0)
-      UseNEONForSinglePrecisionFP = true;
-  }
  }
  
  /// GVIsIndirectSymbol - true if the GV will be accessed via an indirect symbol.
author	Jim Grosbach <grosbach@apple.com>
	Thu, 25 Mar 2010 23:32:19 +0000 (23:32 +0000)
committer	Jim Grosbach <grosbach@apple.com>
	Thu, 25 Mar 2010 23:32:19 +0000 (23:32 +0000)
lib/Target/ARM/ARM.td		patch \| blob \| history
lib/Target/ARM/ARMSubtarget.cpp		patch \| blob \| history