[TTI] Make the cost APIs in TargetTransformInfo consistently use 'int'

[oota-llvm.git] / lib / Target / X86 / X86TargetMachine.cpp
diff --git a/lib/Target/X86/X86TargetMachine.cpp b/lib/Target/X86/X86TargetMachine.cpp

index 5234f85f24e2557bd687e5f60f44248a157298c4..fb9cb4ba4c86edf8c0c9158fab35d1935b38265e 100644 (file)
--- a/lib/Target/X86/X86TargetMachine.cpp
+++ b/lib/Target/X86/X86TargetMachine.cpp
@@ -94,14 +94,15 @@ static std::string computeDataLayout(const Triple &TT) {
  
  /// X86TargetMachine ctor - Create an X86 target.
  ///
-X86TargetMachine::X86TargetMachine(const Target &T, StringRef TT, StringRef CPU,
-                                   StringRef FS, const TargetOptions &Options,
+X86TargetMachine::X86TargetMachine(const Target &T, const Triple &TT,
+                                   StringRef CPU, StringRef FS,
+                                   const TargetOptions &Options,
                                     Reloc::Model RM, CodeModel::Model CM,
                                     CodeGenOpt::Level OL)
-    : LLVMTargetMachine(T, computeDataLayout(Triple(TT)), TT, CPU, FS, Options,
-                        RM, CM, OL),
-      TLOF(createTLOF(Triple(getTargetTriple()))),
-      Subtarget(Triple(TT), CPU, FS, *this, Options.StackAlignmentOverride) {
+    : LLVMTargetMachine(T, computeDataLayout(TT), TT, CPU, FS, Options, RM, CM,
+                        OL),
+      TLOF(createTLOF(getTargetTriple())),
+      Subtarget(TT, CPU, FS, *this, Options.StackAlignmentOverride) {
    // Windows stack unwinder gets confused when execution flow "falls through"
    // after a call to 'noreturn' function.
    // To prevent that, we emit a trap for 'unreachable' IR instructions.
@@ -109,12 +110,15 @@ X86TargetMachine::X86TargetMachine(const Target &T, StringRef TT, StringRef CPU,
    if (Subtarget.isTargetWin64())
      this->Options.TrapUnreachable = true;
  
-  // TODO: By default, all reciprocal estimate operations are off because
-  // that matches the behavior before TargetRecip was added (except for btver2
-  // which used subtarget features to enable this type of codegen).
-  // We should change this to match GCC behavior where everything but
-  // scalar division estimates are turned on by default with -ffast-math.
-  this->Options.Reciprocals.setDefaults("all", false, 1);
+  // By default (and when -ffast-math is on), enable estimate codegen for
+  // everything except scalar division. By default, use 1 refinement step for
+  // all operations. Defaults may be overridden by using command-line options.
+  // Scalar division estimates are disabled because they break too much
+  // real-world code. These defaults match GCC behavior.
+  this->Options.Reciprocals.setDefaults("sqrtf", true, 1);
+  this->Options.Reciprocals.setDefaults("divf", false, 1);
+  this->Options.Reciprocals.setDefaults("vec-sqrtf", true, 1);
+  this->Options.Reciprocals.setDefaults("vec-divf", true, 1);
  
    initAsmInfo();
  }
@@ -152,7 +156,7 @@ X86TargetMachine::getSubtargetImpl(const Function &F) const {
      // creation will depend on the TM and the code generation flags on the
      // function that reside in TargetOptions.
      resetTargetOptions(F);
-    I = llvm::make_unique<X86Subtarget>(Triple(TargetTriple), CPU, FS, *this,
+    I = llvm::make_unique<X86Subtarget>(TargetTriple, CPU, FS, *this,
                                          Options.StackAlignmentOverride);
    }
    return I.get();
@@ -217,7 +221,7 @@ bool X86PassConfig::addInstSelector() {
    addPass(createX86ISelDag(getX86TargetMachine(), getOptLevel()));
  
    // For ELF, cleanup any local-dynamic TLS accesses.
-  if (Triple(TM->getTargetTriple()).isOSBinFormatELF() &&
+  if (TM->getTargetTriple().isOSBinFormatELF() &&
        getOptLevel() != CodeGenOpt::None)
      addPass(createCleanupLocalDynamicTLSPass());
  
@@ -235,7 +239,7 @@ bool X86PassConfig::addILPOpts() {
  
  bool X86PassConfig::addPreISel() {
    // Only add this pass for 32-bit x86 Windows.
-  Triple TT(TM->getTargetTriple());
+  const Triple &TT = TM->getTargetTriple();
    if (TT.isOSWindows() && TT.getArch() == Triple::x86)
      addPass(createX86WinEHStatePass());
    return true;