[mips] Correct operand order in DSP's mthi/mtlo

[oota-llvm.git] / lib / Analysis / LoopAccessAnalysis.cpp
diff --git a/lib/Analysis/LoopAccessAnalysis.cpp b/lib/Analysis/LoopAccessAnalysis.cpp

index 58a7d08860ba886645157725231e4173d9fab0c8..8bcdcb862014dc9bd9dc786dd1a63b55914abce8 100644 (file)
--- a/lib/Analysis/LoopAccessAnalysis.cpp
+++ b/lib/Analysis/LoopAccessAnalysis.cpp
@@ -87,11 +87,10 @@ Value *llvm::stripIntegerCast(Value *V) {
    return V;
  }
  
-const SCEV *llvm::replaceSymbolicStrideSCEV(ScalarEvolution *SE,
+const SCEV *llvm::replaceSymbolicStrideSCEV(PredicatedScalarEvolution &PSE,
                                              const ValueToValueMap &PtrToStride,
-                                            SCEVUnionPredicate &Preds,
                                              Value *Ptr, Value *OrigPtr) {
-  const SCEV *OrigSCEV = SE->getSCEV(Ptr);
+  const SCEV *OrigSCEV = PSE.getSCEV(Ptr);
  
    // If there is an entry in the map return the SCEV of the pointer with the
    // symbolic stride replaced by one.
@@ -108,16 +107,17 @@ const SCEV *llvm::replaceSymbolicStrideSCEV(ScalarEvolution *SE,
      ValueToValueMap RewriteMap;
      RewriteMap[StrideVal] = One;
  
+    ScalarEvolution *SE = PSE.getSE();
      const auto *U = cast<SCEVUnknown>(SE->getSCEV(StrideVal));
      const auto *CT =
          static_cast<const SCEVConstant *>(SE->getOne(StrideVal->getType()));
  
-    Preds.add(SE->getEqualPredicate(U, CT));
+    PSE.addPredicate(*SE->getEqualPredicate(U, CT));
+    auto *Expr = PSE.getSCEV(Ptr);
  
-    const SCEV *ByOne = SE->rewriteUsingPredicate(OrigSCEV, Preds);
-    DEBUG(dbgs() << "LAA: Replacing SCEV: " << *OrigSCEV << " by: " << *ByOne
+    DEBUG(dbgs() << "LAA: Replacing SCEV: " << *OrigSCEV << " by: " << *Expr
                   << "\n");
-    return ByOne;
+    return Expr;
    }
  
    // Otherwise, just return the SCEV of the original pointer.
@@ -127,11 +127,12 @@ const SCEV *llvm::replaceSymbolicStrideSCEV(ScalarEvolution *SE,
  void RuntimePointerChecking::insert(Loop *Lp, Value *Ptr, bool WritePtr,
                                      unsigned DepSetId, unsigned ASId,
                                      const ValueToValueMap &Strides,
-                                    SCEVUnionPredicate &Preds) {
+                                    PredicatedScalarEvolution &PSE) {
    // Get the stride replaced scev.
-  const SCEV *Sc = replaceSymbolicStrideSCEV(SE, Strides, Preds, Ptr);
+  const SCEV *Sc = replaceSymbolicStrideSCEV(PSE, Strides, Ptr);
    const SCEVAddRecExpr *AR = dyn_cast<SCEVAddRecExpr>(Sc);
    assert(AR && "Invalid addrec expression");
+  ScalarEvolution *SE = PSE.getSE();
    const SCEV *Ex = SE->getBackedgeTakenCount(Lp);
  
    const SCEV *ScStart = AR->getStart();
@@ -268,7 +269,7 @@ void RuntimePointerChecking::groupChecks(
    // ShouldRetryWithRuntimeCheck is set, and therefore UseDependencies
    // is also false. In this case we will use the fallback path and create
    // separate checking groups for all pointers.
- 
+
    // If we don't have the dependency partitions, construct a new
    // checking pointer group for each pointer. This is also required
    // for correctness, because in this case we can have checking between
@@ -289,7 +290,7 @@ void RuntimePointerChecking::groupChecks(
    // don't process them twice.
    SmallSet<unsigned, 2> Seen;
  
-  // Go through all equivalence classes, get the the "pointer check groups"
+  // Go through all equivalence classes, get the "pointer check groups"
    // and add them to the overall solution. We use the order in which accesses
    // appear in 'Pointers' to enforce determinism.
    for (unsigned I = 0; I < Pointers.size(); ++I) {
@@ -423,9 +424,10 @@ public:
    typedef SmallPtrSet<MemAccessInfo, 8> MemAccessInfoSet;
  
    AccessAnalysis(const DataLayout &Dl, AliasAnalysis *AA, LoopInfo *LI,
-                 MemoryDepChecker::DepCandidates &DA, SCEVUnionPredicate &Preds)
+                 MemoryDepChecker::DepCandidates &DA,
+                 PredicatedScalarEvolution &PSE)
        : DL(Dl), AST(*AA), LI(LI), DepCands(DA), IsRTCheckAnalysisNeeded(false),
-        Preds(Preds) {}
+        PSE(PSE) {}
  
    /// \brief Register a load  and whether it is only read from.
    void addLoad(MemoryLocation &Loc, bool IsReadOnly) {
@@ -512,16 +514,16 @@ private:
    bool IsRTCheckAnalysisNeeded;
  
    /// The SCEV predicate containing all the SCEV-related assumptions.
-  SCEVUnionPredicate &Preds;
+  PredicatedScalarEvolution &PSE;
  };
  
  } // end anonymous namespace
  
  /// \brief Check whether a pointer can participate in a runtime bounds check.
-static bool hasComputableBounds(ScalarEvolution *SE,
+static bool hasComputableBounds(PredicatedScalarEvolution &PSE,
                                  const ValueToValueMap &Strides, Value *Ptr,
-                                Loop *L, SCEVUnionPredicate &Preds) {
-  const SCEV *PtrScev = replaceSymbolicStrideSCEV(SE, Strides, Preds, Ptr);
+                                Loop *L) {
+  const SCEV *PtrScev = replaceSymbolicStrideSCEV(PSE, Strides, Ptr);
    const SCEVAddRecExpr *AR = dyn_cast<SCEVAddRecExpr>(PtrScev);
    if (!AR)
      return false;
@@ -564,11 +566,11 @@ bool AccessAnalysis::canCheckPtrAtRT(RuntimePointerChecking &RtCheck,
        else
          ++NumReadPtrChecks;
  
-      if (hasComputableBounds(SE, StridesMap, Ptr, TheLoop, Preds) &&
+      if (hasComputableBounds(PSE, StridesMap, Ptr, TheLoop) &&
            // When we run after a failing dependency check we have to make sure
            // we don't have wrapping pointers.
            (!ShouldCheckStride ||
-           isStridedPtr(SE, Ptr, TheLoop, StridesMap, Preds) == 1)) {
+           isStridedPtr(PSE, Ptr, TheLoop, StridesMap) == 1)) {
          // The id of the dependence set.
          unsigned DepId;
  
@@ -582,7 +584,7 @@ bool AccessAnalysis::canCheckPtrAtRT(RuntimePointerChecking &RtCheck,
            // Each access has its own dependence set.
            DepId = RunningDepId++;
  
-        RtCheck.insert(TheLoop, Ptr, IsWrite, DepId, ASId, StridesMap, Preds);
+        RtCheck.insert(TheLoop, Ptr, IsWrite, DepId, ASId, StridesMap, PSE);
  
          DEBUG(dbgs() << "LAA: Found a runtime check ptr:" << *Ptr << '\n');
        } else {
@@ -743,6 +745,11 @@ void AccessAnalysis::processMemAccesses() {
            GetUnderlyingObjects(Ptr, TempObjects, DL, LI);
            DEBUG(dbgs() << "Underlying objects for pointer " << *Ptr << "\n");
            for (Value *UnderlyingObj : TempObjects) {
+            // A null pointer never aliases; don't join sets for pointers that
+            // have "null" in their UnderlyingObjects list.
+            if (isa<ConstantPointerNull>(UnderlyingObj))
+              continue;
+
              UnderlyingObjToAccessMap::iterator Prev =
                  ObjToLastAccess.find(UnderlyingObj);
              if (Prev != ObjToLastAccess.end())
@@ -812,9 +819,8 @@ static bool isNoWrapAddRec(Value *Ptr, const SCEVAddRecExpr *AR,
  }
  
  /// \brief Check whether the access through \p Ptr has a constant stride.
-int llvm::isStridedPtr(ScalarEvolution *SE, Value *Ptr, const Loop *Lp,
-                       const ValueToValueMap &StridesMap,
-                       SCEVUnionPredicate &Preds) {
+int llvm::isStridedPtr(PredicatedScalarEvolution &PSE, Value *Ptr,
+                       const Loop *Lp, const ValueToValueMap &StridesMap) {
    Type *Ty = Ptr->getType();
    assert(Ty->isPointerTy() && "Unexpected non-ptr");
  
@@ -826,7 +832,7 @@ int llvm::isStridedPtr(ScalarEvolution *SE, Value *Ptr, const Loop *Lp,
      return 0;
    }
  
-  const SCEV *PtrScev = replaceSymbolicStrideSCEV(SE, StridesMap, Preds, Ptr);
+  const SCEV *PtrScev = replaceSymbolicStrideSCEV(PSE, StridesMap, Ptr);
  
    const SCEVAddRecExpr *AR = dyn_cast<SCEVAddRecExpr>(PtrScev);
    if (!AR) {
@@ -839,6 +845,7 @@ int llvm::isStridedPtr(ScalarEvolution *SE, Value *Ptr, const Loop *Lp,
    if (Lp != AR->getLoop()) {
      DEBUG(dbgs() << "LAA: Bad stride - Not striding over innermost loop " <<
            *Ptr << " SCEV: " << *PtrScev << "\n");
+    return 0;
    }
  
    // The address calculation must not wrap. Otherwise, a dependence could be
@@ -849,16 +856,16 @@ int llvm::isStridedPtr(ScalarEvolution *SE, Value *Ptr, const Loop *Lp,
    // to access the pointer value "0" which is undefined behavior in address
    // space 0, therefore we can also vectorize this case.
    bool IsInBoundsGEP = isInBoundsGep(Ptr);
-  bool IsNoWrapAddRec = isNoWrapAddRec(Ptr, AR, SE, Lp);
+  bool IsNoWrapAddRec = isNoWrapAddRec(Ptr, AR, PSE.getSE(), Lp);
    bool IsInAddressSpaceZero = PtrTy->getAddressSpace() == 0;
    if (!IsNoWrapAddRec && !IsInBoundsGEP && !IsInAddressSpaceZero) {
      DEBUG(dbgs() << "LAA: Bad stride - Pointer may wrap in the address space "
-          << *Ptr << " SCEV: " << *PtrScev << "\n");
+                 << *Ptr << " SCEV: " << *PtrScev << "\n");
      return 0;
    }
  
    // Check the step is constant.
-  const SCEV *Step = AR->getStepRecurrence(*SE);
+  const SCEV *Step = AR->getStepRecurrence(*PSE.getSE());
  
    // Calculate the pointer stride and check if it is constant.
    const SCEVConstant *C = dyn_cast<SCEVConstant>(Step);
@@ -870,7 +877,7 @@ int llvm::isStridedPtr(ScalarEvolution *SE, Value *Ptr, const Loop *Lp,
  
    auto &DL = Lp->getHeader()->getModule()->getDataLayout();
    int64_t Size = DL.getTypeAllocSize(PtrTy->getElementType());
-  const APInt &APStepVal = C->getValue()->getValue();
+  const APInt &APStepVal = C->getAPInt();
  
    // Huge step value - give up.
    if (APStepVal.getBitWidth() > 64)
@@ -1041,11 +1048,11 @@ MemoryDepChecker::isDependent(const MemAccessInfo &A, unsigned AIdx,
        BPtr->getType()->getPointerAddressSpace())
      return Dependence::Unknown;
  
-  const SCEV *AScev = replaceSymbolicStrideSCEV(SE, Strides, Preds, APtr);
-  const SCEV *BScev = replaceSymbolicStrideSCEV(SE, Strides, Preds, BPtr);
+  const SCEV *AScev = replaceSymbolicStrideSCEV(PSE, Strides, APtr);
+  const SCEV *BScev = replaceSymbolicStrideSCEV(PSE, Strides, BPtr);
  
-  int StrideAPtr = isStridedPtr(SE, APtr, InnermostLoop, Strides, Preds);
-  int StrideBPtr = isStridedPtr(SE, BPtr, InnermostLoop, Strides, Preds);
+  int StrideAPtr = isStridedPtr(PSE, APtr, InnermostLoop, Strides);
+  int StrideBPtr = isStridedPtr(PSE, BPtr, InnermostLoop, Strides);
  
    const SCEV *Src = AScev;
    const SCEV *Sink = BScev;
@@ -1062,12 +1069,12 @@ MemoryDepChecker::isDependent(const MemAccessInfo &A, unsigned AIdx,
      std::swap(StrideAPtr, StrideBPtr);
    }
  
-  const SCEV *Dist = SE->getMinusSCEV(Sink, Src);
+  const SCEV *Dist = PSE.getSE()->getMinusSCEV(Sink, Src);
  
    DEBUG(dbgs() << "LAA: Src Scev: " << *Src << "Sink Scev: " << *Sink
-        << "(Induction step: " << StrideAPtr <<  ")\n");
+               << "(Induction step: " << StrideAPtr << ")\n");
    DEBUG(dbgs() << "LAA: Distance for " << *InstMap[AIdx] << " to "
-        << *InstMap[BIdx] << ": " << *Dist << "\n");
+               << *InstMap[BIdx] << ": " << *Dist << "\n");
  
    // Need accesses with constant stride. We don't want to vectorize
    // "A[B[i]] += ..." and similar code or pointer arithmetic that could wrap in
@@ -1090,7 +1097,7 @@ MemoryDepChecker::isDependent(const MemAccessInfo &A, unsigned AIdx,
    unsigned TypeByteSize = DL.getTypeAllocSize(ATy);
  
    // Negative distances are not plausible dependencies.
-  const APInt &Val = C->getValue()->getValue();
+  const APInt &Val = C->getAPInt();
    if (Val.isNegative()) {
      bool IsTrueDataDependence = (AIsWrite && !BIsWrite);
      if (IsTrueDataDependence &&
@@ -1338,10 +1345,10 @@ bool LoopAccessInfo::canAnalyzeLoop() {
    }
  
    // ScalarEvolution needs to be able to find the exit count.
-  const SCEV *ExitCount = SE->getBackedgeTakenCount(TheLoop);
-  if (ExitCount == SE->getCouldNotCompute()) {
-    emitAnalysis(LoopAccessReport() <<
-                 "could not determine number of loop iterations");
+  const SCEV *ExitCount = PSE.getSE()->getBackedgeTakenCount(TheLoop);
+  if (ExitCount == PSE.getSE()->getCouldNotCompute()) {
+    emitAnalysis(LoopAccessReport()
+                 << "could not determine number of loop iterations");
      DEBUG(dbgs() << "LAA: SCEV could not compute the loop exit count.\n");
      return false;
    }
@@ -1442,7 +1449,7 @@ void LoopAccessInfo::analyzeLoop(const ValueToValueMap &Strides) {
  
    MemoryDepChecker::DepCandidates DependentAccesses;
    AccessAnalysis Accesses(TheLoop->getHeader()->getModule()->getDataLayout(),
-                          AA, LI, DependentAccesses, Preds);
+                          AA, LI, DependentAccesses, PSE);
  
    // Holds the analyzed pointers. We don't want to call GetUnderlyingObjects
    // multiple times on the same object. If the ptr is accessed twice, once
@@ -1493,8 +1500,7 @@ void LoopAccessInfo::analyzeLoop(const ValueToValueMap &Strides) {
      // read a few words, modify, and write a few words, and some of the
      // words may be written to the same address.
      bool IsReadOnlyPtr = false;
-    if (Seen.insert(Ptr).second ||
-        !isStridedPtr(SE, Ptr, TheLoop, Strides, Preds)) {
+    if (Seen.insert(Ptr).second || !isStridedPtr(PSE, Ptr, TheLoop, Strides)) {
        ++NumReads;
        IsReadOnlyPtr = true;
      }
@@ -1524,7 +1530,7 @@ void LoopAccessInfo::analyzeLoop(const ValueToValueMap &Strides) {
    // Find pointers with computable bounds. We are going to use this information
    // to place a runtime bound check.
    bool CanDoRTIfNeeded =
-      Accesses.canCheckPtrAtRT(PtrRtChecking, SE, TheLoop, Strides);
+      Accesses.canCheckPtrAtRT(PtrRtChecking, PSE.getSE(), TheLoop, Strides);
    if (!CanDoRTIfNeeded) {
      emitAnalysis(LoopAccessReport() << "cannot identify array bounds");
      DEBUG(dbgs() << "LAA: We can't vectorize because we can't find "
@@ -1551,6 +1557,7 @@ void LoopAccessInfo::analyzeLoop(const ValueToValueMap &Strides) {
        PtrRtChecking.reset();
        PtrRtChecking.Need = true;
  
+      auto *SE = PSE.getSE();
        CanDoRTIfNeeded =
            Accesses.canCheckPtrAtRT(PtrRtChecking, SE, TheLoop, Strides, true);
  
@@ -1593,7 +1600,7 @@ void LoopAccessInfo::emitAnalysis(LoopAccessReport &Message) {
  }
  
  bool LoopAccessInfo::isUniform(Value *V) const {
-  return (SE->isLoopInvariant(SE->getSCEV(V), TheLoop));
+  return (PSE.getSE()->isLoopInvariant(PSE.getSE()->getSCEV(V), TheLoop));
  }
  
  // FIXME: this function is currently a duplicate of the one in
@@ -1674,7 +1681,7 @@ std::pair<Instruction *, Instruction *> LoopAccessInfo::addRuntimeChecks(
      Instruction *Loc,
      const SmallVectorImpl<RuntimePointerChecking::PointerCheck> &PointerChecks)
      const {
-
+  auto *SE = PSE.getSE();
    SCEVExpander Exp(*SE, DL, "induction");
    auto ExpandedChecks =
        expandBounds(PointerChecks, TheLoop, Loc, SE, Exp, PtrRtChecking);
@@ -1744,7 +1751,7 @@ LoopAccessInfo::LoopAccessInfo(Loop *L, ScalarEvolution *SE,
                                 const TargetLibraryInfo *TLI, AliasAnalysis *AA,
                                 DominatorTree *DT, LoopInfo *LI,
                                 const ValueToValueMap &Strides)
-    : PtrRtChecking(SE), DepChecker(SE, L, Preds), TheLoop(L), SE(SE), DL(DL),
+    : PSE(*SE), PtrRtChecking(SE), DepChecker(PSE, L), TheLoop(L), DL(DL),
        TLI(TLI), AA(AA), DT(DT), LI(LI), NumLoads(0), NumStores(0),
        MaxSafeDepDistBytes(-1U), CanVecMem(false),
        StoreToLoopInvariantAddress(false) {
@@ -1781,7 +1788,7 @@ void LoopAccessInfo::print(raw_ostream &OS, unsigned Depth) const {
                     << "found in loop.\n";
  
    OS.indent(Depth) << "SCEV assumptions:\n";
-  Preds.print(OS, Depth);
+  PSE.getUnionPredicate().print(OS, Depth);
  }
  
  const LoopAccessInfo &