Move private classes into anonymous namespaces

[oota-llvm.git] / lib / Transforms / Scalar / LoopRerollPass.cpp
diff --git a/lib/Transforms/Scalar/LoopRerollPass.cpp b/lib/Transforms/Scalar/LoopRerollPass.cpp

index 83538fc7cba986b1e22493571c2c7c8637d59d5a..d87781c98f3005b0d36445d28cde6c9b66492477 100644 (file)
--- a/lib/Transforms/Scalar/LoopRerollPass.cpp
+++ b/lib/Transforms/Scalar/LoopRerollPass.cpp
@@ -45,6 +45,12 @@ static cl::opt<unsigned>
  MaxInc("max-reroll-increment", cl::init(2048), cl::Hidden,
    cl::desc("The maximum increment for loop rerolling"));
  
+static cl::opt<unsigned>
+NumToleratedFailedMatches("reroll-num-tolerated-failed-matches", cl::init(400),
+                          cl::Hidden,
+                          cl::desc("The maximum number of failures to tolerate"
+                                   " during fuzzy matching. (default: 400)"));
+
  // This loop re-rolling transformation aims to transform loops like this:
  //
  // int foo(int a);
@@ -154,7 +160,6 @@ namespace {
      AliasAnalysis *AA;
      LoopInfo *LI;
      ScalarEvolution *SE;
-    const DataLayout *DL;
      TargetLibraryInfo *TLI;
      DominatorTree *DT;
  
@@ -361,10 +366,8 @@ namespace {
      struct DAGRootTracker {
        DAGRootTracker(LoopReroll *Parent, Loop *L, Instruction *IV,
                       ScalarEvolution *SE, AliasAnalysis *AA,
-                     TargetLibraryInfo *TLI, const DataLayout *DL)
-        : Parent(Parent), L(L), SE(SE), AA(AA), TLI(TLI),
-          DL(DL), IV(IV) {
-      }
+                     TargetLibraryInfo *TLI)
+          : Parent(Parent), L(L), SE(SE), AA(AA), TLI(TLI), IV(IV) {}
  
        /// Stage 1: Find all the DAG roots for the induction variable.
        bool findRoots();
@@ -394,9 +397,14 @@ namespace {
                                  const SmallInstructionSet &Final,
                                  DenseSet<Instruction *> &Users);
  
-      UsesTy::iterator nextInstr(int Val, UsesTy &In, UsesTy::iterator I);
+      UsesTy::iterator nextInstr(int Val, UsesTy &In,
+                                 const SmallInstructionSet &Exclude,
+                                 UsesTy::iterator *StartI=nullptr);
        bool isBaseInst(Instruction *I);
        bool isRootInst(Instruction *I);
+      bool instrDependsOn(Instruction *I,
+                          UsesTy::iterator Start,
+                          UsesTy::iterator End);
  
        LoopReroll *Parent;
  
@@ -405,7 +413,6 @@ namespace {
        ScalarEvolution *SE;
        AliasAnalysis *AA;
        TargetLibraryInfo *TLI;
-      const DataLayout *DL;
  
        // The loop induction variable.
        Instruction *IV;
@@ -500,6 +507,8 @@ void LoopReroll::SimpleLoopReduction::add(Loop *L) {
    // (including the PHI), except for the last value (which is used by the PHI
    // and also outside the loop).
    Instruction *C = Instructions.front();
+  if (C->user_empty())
+    return;
  
    do {
      C = cast<Instruction>(*C->user_begin());
@@ -706,14 +715,17 @@ collectPossibleRoots(Instruction *Base, std::map<int64_t,Instruction*> &Roots) {
  
    if (Roots.empty())
      return false;
-  
-  assert(Roots.find(0) == Roots.end() && "Didn't expect a zero index!");
  
    // If we found non-loop-inc, non-root users of Base, assume they are
    // for the zeroth root index. This is because "add %a, 0" gets optimized
    // away.
-  if (BaseUsers.size())
+  if (BaseUsers.size()) {
+    if (Roots.find(0) != Roots.end()) {
+      DEBUG(dbgs() << "LRR: Multiple roots found for base - aborting!\n");
+      return false;
+    }
      Roots[0] = Base;
+  }
  
    // Calculate the number of users of the base, or lowest indexed, iteration.
    unsigned NumBaseUses = BaseUsers.size();
@@ -941,10 +953,16 @@ bool LoopReroll::DAGRootTracker::collectUsedInstructions(SmallInstructionSet &Po
  
  }
  
+/// Get the next instruction in "In" that is a member of set Val.
+/// Start searching from StartI, and do not return anything in Exclude.
+/// If StartI is not given, start from In.begin().
  LoopReroll::DAGRootTracker::UsesTy::iterator
  LoopReroll::DAGRootTracker::nextInstr(int Val, UsesTy &In,
-                                      UsesTy::iterator I) {
-  while (I != In.end() && I->second.test(Val) == 0)
+                                      const SmallInstructionSet &Exclude,
+                                      UsesTy::iterator *StartI) {
+  UsesTy::iterator I = StartI ? *StartI : In.begin();
+  while (I != In.end() && (I->second.test(Val) == 0 ||
+                           Exclude.count(I->first) != 0))
      ++I;
    return I;
  }
@@ -965,6 +983,19 @@ bool LoopReroll::DAGRootTracker::isRootInst(Instruction *I) {
    return false;
  }
  
+/// Return true if instruction I depends on any instruction between
+/// Start and End.
+bool LoopReroll::DAGRootTracker::instrDependsOn(Instruction *I,
+                                                UsesTy::iterator Start,
+                                                UsesTy::iterator End) {
+  for (auto *U : I->users()) {
+    for (auto It = Start; It != End; ++It)
+      if (U == It->first)
+        return true;
+  }
+  return false;
+}
+
  bool LoopReroll::DAGRootTracker::validate(ReductionTracker &Reductions) {
    // We now need to check for equivalence of the use graph of each root with
    // that of the primary induction variable (excluding the roots). Our goal
@@ -1022,8 +1053,9 @@ bool LoopReroll::DAGRootTracker::validate(ReductionTracker &Reductions) {
      DenseMap<Value *, Value *> BaseMap;
  
      // Compare iteration Iter to the base.
-    auto BaseIt = nextInstr(0, Uses, Uses.begin());
-    auto RootIt = nextInstr(Iter, Uses, Uses.begin());
+    SmallInstructionSet Visited;
+    auto BaseIt = nextInstr(0, Uses, Visited);
+    auto RootIt = nextInstr(Iter, Uses, Visited);
      auto LastRootIt = Uses.begin();
  
      while (BaseIt != Uses.end() && RootIt != Uses.end()) {
@@ -1033,20 +1065,58 @@ bool LoopReroll::DAGRootTracker::validate(ReductionTracker &Reductions) {
        // Skip over the IV or root instructions; only match their users.
        bool Continue = false;
        if (isBaseInst(BaseInst)) {
-        BaseIt = nextInstr(0, Uses, ++BaseIt);
+        Visited.insert(BaseInst);
+        BaseIt = nextInstr(0, Uses, Visited);
          Continue = true;
        }
        if (isRootInst(RootInst)) {
          LastRootIt = RootIt;
-        RootIt = nextInstr(Iter, Uses, ++RootIt);
+        Visited.insert(RootInst);
+        RootIt = nextInstr(Iter, Uses, Visited);
          Continue = true;
        }
        if (Continue) continue;
  
+      if (!BaseInst->isSameOperationAs(RootInst)) {
+        // Last chance saloon. We don't try and solve the full isomorphism
+        // problem, but try and at least catch the case where two instructions
+        // *of different types* are round the wrong way. We won't be able to
+        // efficiently tell, given two ADD instructions, which way around we
+        // should match them, but given an ADD and a SUB, we can at least infer
+        // which one is which.
+        //
+        // This should allow us to deal with a greater subset of the isomorphism
+        // problem. It does however change a linear algorithm into a quadratic
+        // one, so limit the number of probes we do.
+        auto TryIt = RootIt;
+        unsigned N = NumToleratedFailedMatches;
+        while (TryIt != Uses.end() &&
+               !BaseInst->isSameOperationAs(TryIt->first) &&
+               N--) {
+          ++TryIt;
+          TryIt = nextInstr(Iter, Uses, Visited, &TryIt);
+        }
+
+        if (TryIt == Uses.end() || TryIt == RootIt ||
+            instrDependsOn(TryIt->first, RootIt, TryIt)) {
+          DEBUG(dbgs() << "LRR: iteration root match failed at " << *BaseInst <<
+                " vs. " << *RootInst << "\n");
+          return false;
+        }
+        
+        RootIt = TryIt;
+        RootInst = TryIt->first;
+      }
+
        // All instructions between the last root and this root
-      // belong to some other iteration. If they belong to a 
+      // may belong to some other iteration. If they belong to a 
        // future iteration, then they're dangerous to alias with.
-      for (; LastRootIt != RootIt; ++LastRootIt) {
+      // 
+      // Note that because we allow a limited amount of flexibility in the order
+      // that we visit nodes, LastRootIt might be *before* RootIt, in which
+      // case we've already checked this set of instructions so we shouldn't
+      // do anything.
+      for (; LastRootIt < RootIt; ++LastRootIt) {
          Instruction *I = LastRootIt->first;
          if (LastRootIt->second.find_first() < (int)Iter)
            continue;
@@ -1057,17 +1127,11 @@ bool LoopReroll::DAGRootTracker::validate(ReductionTracker &Reductions) {
          // needed because otherwise isSafeToSpeculativelyExecute returns
          // false on PHI nodes.
          if (!isa<PHINode>(I) && !isSimpleLoadStore(I) &&
-            !isSafeToSpeculativelyExecute(I, DL))
+            !isSafeToSpeculativelyExecute(I))
            // Intervening instructions cause side effects.
            FutureSideEffects = true;
        }
  
-      if (!BaseInst->isSameOperationAs(RootInst)) {
-        DEBUG(dbgs() << "LRR: iteration root match failed at " << *BaseInst <<
-              " vs. " << *RootInst << "\n");
-        return false;
-      }
-
        // Make sure that this instruction, which is in the use set of this
        // root instruction, does not also belong to the base set or the set of
        // some other root instruction.
@@ -1093,11 +1157,10 @@ bool LoopReroll::DAGRootTracker::validate(ReductionTracker &Reductions) {
        // side effects, and this instruction might also, then we can't reorder
        // them, and this matching fails. As an exception, we allow the alias
        // set tracker to handle regular (simple) load/store dependencies.
-      if (FutureSideEffects &&
-            ((!isSimpleLoadStore(BaseInst) &&
-              !isSafeToSpeculativelyExecute(BaseInst, DL)) ||
-             (!isSimpleLoadStore(RootInst) &&
-              !isSafeToSpeculativelyExecute(RootInst, DL)))) {
+      if (FutureSideEffects && ((!isSimpleLoadStore(BaseInst) &&
+                                 !isSafeToSpeculativelyExecute(BaseInst)) ||
+                                (!isSimpleLoadStore(RootInst) &&
+                                 !isSafeToSpeculativelyExecute(RootInst)))) {
          DEBUG(dbgs() << "LRR: iteration root match failed at " << *BaseInst <<
                          " vs. " << *RootInst <<
                          " (side effects prevent reordering)\n");
@@ -1174,8 +1237,10 @@ bool LoopReroll::DAGRootTracker::validate(ReductionTracker &Reductions) {
        BaseMap.insert(std::make_pair(RootInst, BaseInst));
  
        LastRootIt = RootIt;
-      BaseIt = nextInstr(0, Uses, ++BaseIt);
-      RootIt = nextInstr(Iter, Uses, ++RootIt);
+      Visited.insert(BaseInst);
+      Visited.insert(RootInst);
+      BaseIt = nextInstr(0, Uses, Visited);
+      RootIt = nextInstr(Iter, Uses, Visited);
      }
      assert (BaseIt == Uses.end() && RootIt == Uses.end() &&
              "Mismatched set sizes!");
@@ -1202,6 +1267,7 @@ void LoopReroll::DAGRootTracker::replace(const SCEV *IterCount) {
  
      ++J;
    }
+  const DataLayout &DL = Header->getModule()->getDataLayout();
  
    // We need to create a new induction variable for each different BaseInst.
    for (auto &DRS : RootSets) {
@@ -1214,7 +1280,7 @@ void LoopReroll::DAGRootTracker::replace(const SCEV *IterCount) {
                           SE->getConstant(RealIVSCEV->getType(), 1),
                           L, SCEV::FlagAnyWrap));
      { // Limit the lifetime of SCEVExpander.
-      SCEVExpander Expander(*SE, "reroll");
+      SCEVExpander Expander(*SE, DL, "reroll");
        Value *NewIV = Expander.expandCodeFor(H, IV->getType(), Header->begin());
  
        for (auto &KV : Uses) {
@@ -1254,7 +1320,7 @@ void LoopReroll::DAGRootTracker::replace(const SCEV *IterCount) {
      }
    }
  
-  SimplifyInstructionsInBlock(Header, DL, TLI);
+  SimplifyInstructionsInBlock(Header, TLI);
    DeleteDeadPHIs(Header, TLI);
  }
  
@@ -1378,7 +1444,7 @@ void LoopReroll::ReductionTracker::replaceSelected() {
  bool LoopReroll::reroll(Instruction *IV, Loop *L, BasicBlock *Header,
                          const SCEV *IterCount,
                          ReductionTracker &Reductions) {
-  DAGRootTracker DAGRoots(this, L, IV, SE, AA, TLI, DL);
+  DAGRootTracker DAGRoots(this, L, IV, SE, AA, TLI);
  
    if (!DAGRoots.findRoots())
      return false;
@@ -1407,8 +1473,6 @@ bool LoopReroll::runOnLoop(Loop *L, LPPassManager &LPM) {
    LI = &getAnalysis<LoopInfoWrapperPass>().getLoopInfo();
    SE = &getAnalysis<ScalarEvolution>();
    TLI = &getAnalysis<TargetLibraryInfoWrapperPass>().getTLI();
-  DataLayoutPass *DLP = getAnalysisIfAvailable<DataLayoutPass>();
-  DL = DLP ? &DLP->getDataLayout() : nullptr;
    DT = &getAnalysis<DominatorTreeWrapperPass>().getDomTree();
  
    BasicBlock *Header = L->getHeader();