Add Triple::isAndroid().

[oota-llvm.git] / lib / Target / PowerPC / PPCTargetMachine.cpp
diff --git a/lib/Target/PowerPC/PPCTargetMachine.cpp b/lib/Target/PowerPC/PPCTargetMachine.cpp

index 50d4395dfbe8c66a45d57b46c380fbf67095312e..df687b2cade30471d23c92d5403ddbf9f75b7b6e 100644 (file)
--- a/lib/Target/PowerPC/PPCTargetMachine.cpp
+++ b/lib/Target/PowerPC/PPCTargetMachine.cpp
@@ -57,6 +57,11 @@ EnableExtraTOCRegDeps("enable-ppc-extra-toc-reg-deps",
                        cl::desc("Add extra TOC register dependencies"),
                        cl::init(true), cl::Hidden);
  
+static cl::opt<bool>
+EnableMachineCombinerPass("ppc-machine-combiner",
+                          cl::desc("Enable the machine combiner pass"),
+                          cl::init(true), cl::Hidden);
+
  extern "C" void LLVMInitializePowerPCTarget() {
    // Register the targets
    RegisterTargetMachine<PPC32TargetMachine> A(ThePPC32Target);
@@ -98,13 +103,12 @@ static std::string getDataLayoutString(const Triple &T) {
    return Ret;
  }
  
-static std::string computeFSAdditions(StringRef FS, CodeGenOpt::Level OL, StringRef TT) {
+static std::string computeFSAdditions(StringRef FS, CodeGenOpt::Level OL,
+                                      const Triple &TT) {
    std::string FullFS = FS;
-  Triple TargetTriple(TT);
  
    // Make sure 64-bit features are available when CPUname is generic
-  if (TargetTriple.getArch() == Triple::ppc64 ||
-      TargetTriple.getArch() == Triple::ppc64le) {
+  if (TT.getArch() == Triple::ppc64 || TT.getArch() == Triple::ppc64le) {
      if (!FullFS.empty())
        FullFS = "+64bit," + FullFS;
      else
@@ -119,7 +123,7 @@ static std::string computeFSAdditions(StringRef FS, CodeGenOpt::Level OL, String
    }
  
    if (OL != CodeGenOpt::None) {
-     if (!FullFS.empty())
+    if (!FullFS.empty())
        FullFS = "+invariant-function-descriptors," + FullFS;
      else
        FullFS = "+invariant-function-descriptors";
@@ -145,7 +149,7 @@ static PPCTargetMachine::PPCABI computeTargetABI(const Triple &TT,
      return PPCTargetMachine::PPC_ABI_ELFv2;
  
    assert(Options.MCOptions.getABIName().empty() &&
-        "Unknown target-abi option!");
+         "Unknown target-abi option!");
  
    if (!TT.isMacOSX()) {
      switch (TT.getArch()) {
@@ -161,18 +165,38 @@ static PPCTargetMachine::PPCABI computeTargetABI(const Triple &TT,
    return PPCTargetMachine::PPC_ABI_UNKNOWN;
  }
  
-// The FeatureString here is a little subtle. We are modifying the feature string
-// with what are (currently) non-function specific overrides as it goes into the
-// LLVMTargetMachine constructor and then using the stored value in the
+// The FeatureString here is a little subtle. We are modifying the feature
+// string with what are (currently) non-function specific overrides as it goes
+// into the LLVMTargetMachine constructor and then using the stored value in the
  // Subtarget constructor below it.
-PPCTargetMachine::PPCTargetMachine(const Target &T, StringRef TT, StringRef CPU,
-                                   StringRef FS, const TargetOptions &Options,
+PPCTargetMachine::PPCTargetMachine(const Target &T, const Triple &TT,
+                                   StringRef CPU, StringRef FS,
+                                   const TargetOptions &Options,
                                     Reloc::Model RM, CodeModel::Model CM,
                                     CodeGenOpt::Level OL)
-    : LLVMTargetMachine(T, getDataLayoutString(Triple(TT)), TT, CPU,
+    : LLVMTargetMachine(T, getDataLayoutString(TT), TT, CPU,
                          computeFSAdditions(FS, OL, TT), Options, RM, CM, OL),
-      TLOF(createTLOF(Triple(getTargetTriple()))),
-      TargetABI(computeTargetABI(Triple(TT), Options)) {
+      TLOF(createTLOF(getTargetTriple())),
+      TargetABI(computeTargetABI(TT, Options)),
+      Subtarget(TargetTriple, CPU, computeFSAdditions(FS, OL, TT), *this) {
+
+  // For the estimates, convergence is quadratic, so we essentially double the
+  // number of correct bits after every iteration. For both FRE and FRSQRTE,
+  // the minimum architected relative accuracy is 2^-5. When hasRecipPrec(),
+  // this is 2^-14. IEEE float has a 23-bit and double a 52-bit fraction field.
+  unsigned RefinementSteps = Subtarget.hasRecipPrec() ? 1 : 3,
+           RefinementSteps64 = RefinementSteps + 1;
+
+  this->Options.Reciprocals.setDefaults("sqrtf", true, RefinementSteps);
+  this->Options.Reciprocals.setDefaults("vec-sqrtf", true, RefinementSteps);
+  this->Options.Reciprocals.setDefaults("divf", true, RefinementSteps);
+  this->Options.Reciprocals.setDefaults("vec-divf", true, RefinementSteps);
+
+  this->Options.Reciprocals.setDefaults("sqrtd", true, RefinementSteps64);
+  this->Options.Reciprocals.setDefaults("vec-sqrtd", true, RefinementSteps64);
+  this->Options.Reciprocals.setDefaults("divd", true, RefinementSteps64);
+  this->Options.Reciprocals.setDefaults("vec-divd", true, RefinementSteps64);
+
    initAsmInfo();
  }
  
@@ -180,23 +204,21 @@ PPCTargetMachine::~PPCTargetMachine() {}
  
  void PPC32TargetMachine::anchor() { }
  
-PPC32TargetMachine::PPC32TargetMachine(const Target &T, StringRef TT,
+PPC32TargetMachine::PPC32TargetMachine(const Target &T, const Triple &TT,
                                         StringRef CPU, StringRef FS,
                                         const TargetOptions &Options,
                                         Reloc::Model RM, CodeModel::Model CM,
                                         CodeGenOpt::Level OL)
-  : PPCTargetMachine(T, TT, CPU, FS, Options, RM, CM, OL) {
-}
+    : PPCTargetMachine(T, TT, CPU, FS, Options, RM, CM, OL) {}
  
  void PPC64TargetMachine::anchor() { }
  
-PPC64TargetMachine::PPC64TargetMachine(const Target &T, StringRef TT,
-                                       StringRef CPU,  StringRef FS,
+PPC64TargetMachine::PPC64TargetMachine(const Target &T, const Triple &TT,
+                                       StringRef CPU, StringRef FS,
                                         const TargetOptions &Options,
                                         Reloc::Model RM, CodeModel::Model CM,
                                         CodeGenOpt::Level OL)
-  : PPCTargetMachine(T, TT, CPU, FS, Options, RM, CM, OL) {
-}
+    : PPCTargetMachine(T, TT, CPU, FS, Options, RM, CM, OL) {}
  
  const PPCSubtarget *
  PPCTargetMachine::getSubtargetImpl(const Function &F) const {
@@ -264,9 +286,8 @@ void PPCPassConfig::addIRPasses() {
  
    // For the BG/Q (or if explicitly requested), add explicit data prefetch
    // intrinsics.
-  bool UsePrefetching =
-    Triple(TM->getTargetTriple()).getVendor() == Triple::BGQ &&           
-    getOptLevel() != CodeGenOpt::None;
+  bool UsePrefetching = TM->getTargetTriple().getVendor() == Triple::BGQ &&
+                        getOptLevel() != CodeGenOpt::None;
    if (EnablePrefetch.getNumOccurrences() > 0)
      UsePrefetching = EnablePrefetch;
    if (UsePrefetching)
@@ -300,6 +321,10 @@ bool PPCPassConfig::addPreISel() {
  
  bool PPCPassConfig::addILPOpts() {
    addPass(&EarlyIfConverterID);
+
+  if (EnableMachineCombinerPass)
+    addPass(&MachineCombinerID);
+
    return true;
  }
  
@@ -320,7 +345,7 @@ void PPCPassConfig::addMachineSSAOptimization() {
    TargetPassConfig::addMachineSSAOptimization();
    // For little endian, remove where possible the vector swap instructions
    // introduced at code generation to normalize vector element order.
-  if (Triple(TM->getTargetTriple()).getArch() == Triple::ppc64le &&
+  if (TM->getTargetTriple().getArch() == Triple::ppc64le &&
        !DisableVSXSwapRemoval)
      addPass(createPPCVSXSwapRemovalPass());
  }
@@ -348,6 +373,7 @@ void PPCPassConfig::addPreEmitPass() {
  }
  
  TargetIRAnalysis PPCTargetMachine::getTargetIRAnalysis() {
-  return TargetIRAnalysis(
-      [this](Function &F) { return TargetTransformInfo(PPCTTIImpl(this, F)); });
+  return TargetIRAnalysis([this](const Function &F) {
+    return TargetTransformInfo(PPCTTIImpl(this, F));
+  });
  }