raw_ostream: Forward declare OpenFlags and include FileSystem.h only where necessary.

[oota-llvm.git] / lib / Analysis / ValueTracking.cpp
diff --git a/lib/Analysis/ValueTracking.cpp b/lib/Analysis/ValueTracking.cpp

index 8e3994e8f52079b511bbf2e4aacf8dfc9382651e..07720d78bf05c66a6487deca5906efc15c43515e 100644 (file)
--- a/lib/Analysis/ValueTracking.cpp
+++ b/lib/Analysis/ValueTracking.cpp
@@ -15,8 +15,11 @@
  #include "llvm/Analysis/ValueTracking.h"
  #include "llvm/ADT/SmallPtrSet.h"
  #include "llvm/Analysis/InstructionSimplify.h"
+#include "llvm/Analysis/MemoryBuiltins.h"
+#include "llvm/IR/ConstantRange.h"
  #include "llvm/IR/Constants.h"
  #include "llvm/IR/DataLayout.h"
+#include "llvm/IR/GetElementPtrTypeIterator.h"
  #include "llvm/IR/GlobalAlias.h"
  #include "llvm/IR/GlobalVariable.h"
  #include "llvm/IR/Instructions.h"
@@ -24,10 +27,8 @@
  #include "llvm/IR/LLVMContext.h"
  #include "llvm/IR/Metadata.h"
  #include "llvm/IR/Operator.h"
-#include "llvm/Support/ConstantRange.h"
-#include "llvm/Support/GetElementPtrTypeIterator.h"
+#include "llvm/IR/PatternMatch.h"
  #include "llvm/Support/MathExtras.h"
-#include "llvm/Support/PatternMatch.h"
  #include <cstring>
  using namespace llvm;
  using namespace llvm::PatternMatch;
@@ -39,8 +40,8 @@ const unsigned MaxDepth = 6;
  static unsigned getBitWidth(Type *Ty, const DataLayout *TD) {
    if (unsigned BitWidth = Ty->getScalarSizeInBits())
      return BitWidth;
-  assert(isa<PointerType>(Ty) && "Expected a pointer type!");
-  return TD ? TD->getPointerSizeInBits() : 0;
+
+  return TD ? TD->getPointerTypeSizeInBits(Ty) : 0;
  }
  
  static void ComputeMaskedBitsAddSub(bool Add, Value *Op0, Value *Op1, bool NSW,
@@ -290,7 +291,7 @@ void llvm::ComputeMaskedBits(Value *V, APInt &KnownZero, APInt &KnownOne,
      }
      if (Align > 0)
        KnownZero = APInt::getLowBitsSet(BitWidth,
-                                       CountTrailingZeros_32(Align));
+                                       countTrailingZeros(Align));
      else
        KnownZero.clearAllBits();
      KnownOne.clearAllBits();
@@ -310,8 +311,9 @@ void llvm::ComputeMaskedBits(Value *V, APInt &KnownZero, APInt &KnownOne,
    if (Argument *A = dyn_cast<Argument>(V)) {
      unsigned Align = 0;
  
-    if (A->hasByValAttr()) {
-      // Get alignment information off byval arguments if specified in the IR.
+    if (A->hasByValOrInAllocaAttr()) {
+      // Get alignment information off byval/inalloca arguments if specified in
+      // the IR.
        Align = A->getParamAlignment();
      } else if (TD && A->hasStructRetAttr()) {
        // An sret parameter has at least the ABI alignment of the return type.
@@ -321,7 +323,7 @@ void llvm::ComputeMaskedBits(Value *V, APInt &KnownZero, APInt &KnownOne,
      }
  
      if (Align)
-      KnownZero = APInt::getLowBitsSet(BitWidth, CountTrailingZeros_32(Align));
+      KnownZero = APInt::getLowBitsSet(BitWidth, countTrailingZeros(Align));
      return;
    }
  
@@ -613,7 +615,7 @@ void llvm::ComputeMaskedBits(Value *V, APInt &KnownZero, APInt &KnownOne,
        Align = TD->getABITypeAlignment(AI->getType()->getElementType());
  
      if (Align > 0)
-      KnownZero = APInt::getLowBitsSet(BitWidth, CountTrailingZeros_32(Align));
+      KnownZero = APInt::getLowBitsSet(BitWidth, countTrailingZeros(Align));
      break;
    }
    case Instruction::GetElementPtr: {
@@ -629,12 +631,22 @@ void llvm::ComputeMaskedBits(Value *V, APInt &KnownZero, APInt &KnownOne,
        Value *Index = I->getOperand(i);
        if (StructType *STy = dyn_cast<StructType>(*GTI)) {
          // Handle struct member offset arithmetic.
-        if (!TD) return;
-        const StructLayout *SL = TD->getStructLayout(STy);
+        if (!TD)
+          return;
+
+        // Handle the case where the index is a vector zeroinitializer.
+        Constant *CIndex = cast<Constant>(Index);
+        if (CIndex->isZeroValue())
+          continue;
+
+        if (CIndex->getType()->isVectorTy())
+          Index = CIndex->getSplatValue();
+
          unsigned Idx = cast<ConstantInt>(Index)->getZExtValue();
+        const StructLayout *SL = TD->getStructLayout(STy);
          uint64_t Offset = SL->getElementOffset(Idx);
-        TrailZ = std::min(TrailZ,
-                          CountTrailingZeros_64(Offset));
+        TrailZ = std::min<unsigned>(TrailZ,
+                                    countTrailingZeros(Offset));
        } else {
          // Handle array index arithmetic.
          Type *IndexedTy = GTI.getIndexedType();
@@ -644,7 +656,7 @@ void llvm::ComputeMaskedBits(Value *V, APInt &KnownZero, APInt &KnownOne,
          LocalKnownZero = LocalKnownOne = APInt(GEPOpiBits, 0);
          ComputeMaskedBits(Index, LocalKnownZero, LocalKnownOne, TD, Depth+1);
          TrailZ = std::min(TrailZ,
-                          unsigned(CountTrailingZeros_64(TypeSize) +
+                          unsigned(countTrailingZeros(TypeSize) +
                                     LocalKnownZero.countTrailingOnes()));
        }
      }
@@ -749,7 +761,6 @@ void llvm::ComputeMaskedBits(Value *V, APInt &KnownZero, APInt &KnownOne,
          KnownZero = APInt::getHighBitsSet(BitWidth, BitWidth - LowBits);
          break;
        }
-      case Intrinsic::x86_sse42_crc32_64_8:
        case Intrinsic::x86_sse42_crc32_64_64:
          KnownZero = APInt::getHighBitsSet(64, 32);
          break;
@@ -831,7 +842,7 @@ bool llvm::isKnownToBeAPowerOfTwo(Value *V, bool OrZero, unsigned Depth) {
    if (Depth++ == MaxDepth)
      return false;
  
-  Value *X = 0, *Y = 0;
+  Value *X = nullptr, *Y = nullptr;
    // A shift of a power of two is a power of two or zero.
    if (OrZero && (match(V, m_Shl(m_Value(X), m_Value())) ||
                   match(V, m_Shr(m_Value(X), m_Value()))))
@@ -855,6 +866,37 @@ bool llvm::isKnownToBeAPowerOfTwo(Value *V, bool OrZero, unsigned Depth) {
      return false;
    }
  
+  // Adding a power-of-two or zero to the same power-of-two or zero yields
+  // either the original power-of-two, a larger power-of-two or zero.
+  if (match(V, m_Add(m_Value(X), m_Value(Y)))) {
+    OverflowingBinaryOperator *VOBO = cast<OverflowingBinaryOperator>(V);
+    if (OrZero || VOBO->hasNoUnsignedWrap() || VOBO->hasNoSignedWrap()) {
+      if (match(X, m_And(m_Specific(Y), m_Value())) ||
+          match(X, m_And(m_Value(), m_Specific(Y))))
+        if (isKnownToBeAPowerOfTwo(Y, OrZero, Depth))
+          return true;
+      if (match(Y, m_And(m_Specific(X), m_Value())) ||
+          match(Y, m_And(m_Value(), m_Specific(X))))
+        if (isKnownToBeAPowerOfTwo(X, OrZero, Depth))
+          return true;
+
+      unsigned BitWidth = V->getType()->getScalarSizeInBits();
+      APInt LHSZeroBits(BitWidth, 0), LHSOneBits(BitWidth, 0);
+      ComputeMaskedBits(X, LHSZeroBits, LHSOneBits, nullptr, Depth);
+
+      APInt RHSZeroBits(BitWidth, 0), RHSOneBits(BitWidth, 0);
+      ComputeMaskedBits(Y, RHSZeroBits, RHSOneBits, nullptr, Depth);
+      // If i8 V is a power of two or zero:
+      //  ZeroBits: 1 1 1 0 1 1 1 1
+      // ~ZeroBits: 0 0 0 1 0 0 0 0
+      if ((~(LHSZeroBits & RHSZeroBits)).isPowerOf2())
+        // If OrZero isn't set, we cannot give back a zero result.
+        // Make sure either the LHS or RHS has a bit set.
+        if (OrZero || RHSOneBits.getBoolValue() || LHSOneBits.getBoolValue())
+          return true;
+    }
+  }
+
    // An exact divide or right shift can only shift off zero bits, so the result
    // is a power of two only if the first operand is a power of two and not
    // copying a sign bit (sdiv int_min, 2).
@@ -953,6 +995,8 @@ bool llvm::isKnownNonZero(Value *V, const DataLayout *TD, unsigned Depth) {
  
    // Check for pointer simplifications.
    if (V->getType()->isPointerTy()) {
+    if (isKnownNonNull(V))
+      return true; 
      if (GEPOperator *GEP = dyn_cast<GEPOperator>(V))
        if (isGEPKnownNonNull(GEP, TD, Depth))
          return true;
@@ -961,7 +1005,7 @@ bool llvm::isKnownNonZero(Value *V, const DataLayout *TD, unsigned Depth) {
    unsigned BitWidth = getBitWidth(V->getType()->getScalarType(), TD);
  
    // X | Y != 0 if X != 0 or Y != 0.
-  Value *X = 0, *Y = 0;
+  Value *X = nullptr, *Y = nullptr;
    if (match(V, m_Or(m_Value(X), m_Value(Y))))
      return isKnownNonZero(X, TD, Depth) || isKnownNonZero(Y, TD, Depth);
  
@@ -1320,7 +1364,7 @@ bool llvm::ComputeMultiple(Value *V, unsigned Base, Value *&Multiple,
        Op1 = ConstantInt::get(V->getContext(), API);
      }
  
-    Value *Mul0 = NULL;
+    Value *Mul0 = nullptr;
      if (ComputeMultiple(Op0, Base, Mul0, LookThroughSExt, Depth+1)) {
        if (Constant *Op1C = dyn_cast<Constant>(Op1))
          if (Constant *MulC = dyn_cast<Constant>(Mul0)) {
@@ -1344,7 +1388,7 @@ bool llvm::ComputeMultiple(Value *V, unsigned Base, Value *&Multiple,
          }
      }
  
-    Value *Mul1 = NULL;
+    Value *Mul1 = nullptr;
      if (ComputeMultiple(Op1, Base, Mul1, LookThroughSExt, Depth+1)) {
        if (Constant *Op0C = dyn_cast<Constant>(Op0))
          if (Constant *MulC = dyn_cast<Constant>(Mul1)) {
@@ -1388,7 +1432,7 @@ bool llvm::CannotBeNegativeZero(const Value *V, unsigned Depth) {
      return 1;  // Limit search depth.
  
    const Operator *I = dyn_cast<Operator>(V);
-  if (I == 0) return false;
+  if (!I) return false;
  
    // Check if the nsz fast-math flag is set
    if (const FPMathOperator *FPO = dyn_cast<FPMathOperator>(I))
@@ -1396,10 +1440,10 @@ bool llvm::CannotBeNegativeZero(const Value *V, unsigned Depth) {
        return true;
  
    // (add x, 0.0) is guaranteed to return +0.0, not -0.0.
-  if (I->getOpcode() == Instruction::FAdd &&
-      isa<ConstantFP>(I->getOperand(1)) &&
-      cast<ConstantFP>(I->getOperand(1))->isNullValue())
-    return true;
+  if (I->getOpcode() == Instruction::FAdd)
+    if (ConstantFP *CFP = dyn_cast<ConstantFP>(I->getOperand(1)))
+      if (CFP->isNullValue())
+        return true;
  
    // sitofp and uitofp turn into +0.0 for zero.
    if (isa<SIToFPInst>(I) || isa<UIToFPInst>(I))
@@ -1469,7 +1513,7 @@ Value *llvm::isBytewiseValue(Value *V) {
  
          // If the top/bottom halves aren't the same, reject it.
          if (Val != Val2)
-          return 0;
+          return nullptr;
        }
        return ConstantInt::get(V->getContext(), Val);
      }
@@ -1481,11 +1525,11 @@ Value *llvm::isBytewiseValue(Value *V) {
      Value *Elt = CA->getElementAsConstant(0);
      Value *Val = isBytewiseValue(Elt);
      if (!Val)
-      return 0;
+      return nullptr;
  
      for (unsigned I = 1, E = CA->getNumElements(); I != E; ++I)
        if (CA->getElementAsConstant(I) != Elt)
-        return 0;
+        return nullptr;
  
      return Val;
    }
@@ -1496,7 +1540,7 @@ Value *llvm::isBytewiseValue(Value *V) {
    //   %c = or i16 %a, %b
    // but until there is an example that actually needs this, it doesn't seem
    // worth worrying about.
-  return 0;
+  return nullptr;
  }
  
  
@@ -1507,7 +1551,7 @@ Value *llvm::isBytewiseValue(Value *V) {
  // struct. To is the result struct built so far, new insertvalue instructions
  // build on that.
  static Value *BuildSubAggregate(Value *From, Value* To, Type *IndexedType,
-                                SmallVector<unsigned, 10> &Idxs,
+                                SmallVectorImpl<unsigned> &Idxs,
                                  unsigned IdxSkip,
                                  Instruction *InsertBefore) {
    llvm::StructType *STy = dyn_cast<llvm::StructType>(IndexedType);
@@ -1546,7 +1590,7 @@ static Value *BuildSubAggregate(Value *From, Value* To, Type *IndexedType,
    Value *V = FindInsertedValue(From, Idxs);
  
    if (!V)
-    return NULL;
+    return nullptr;
  
    // Insert the value in the new (sub) aggregrate
    return llvm::InsertValueInst::Create(To, V, makeArrayRef(Idxs).slice(IdxSkip),
@@ -1597,7 +1641,7 @@ Value *llvm::FindInsertedValue(Value *V, ArrayRef<unsigned> idx_range,
  
    if (Constant *C = dyn_cast<Constant>(V)) {
      C = C->getAggregateElement(idx_range[0]);
-    if (C == 0) return 0;
+    if (!C) return nullptr;
      return FindInsertedValue(C, idx_range.slice(1), InsertBefore);
    }
  
@@ -1610,7 +1654,7 @@ Value *llvm::FindInsertedValue(Value *V, ArrayRef<unsigned> idx_range,
        if (req_idx == idx_range.end()) {
          // We can't handle this without inserting insertvalues
          if (!InsertBefore)
-          return 0;
+          return nullptr;
  
          // The requested index identifies a part of a nested aggregate. Handle
          // this specially. For example,
@@ -1664,27 +1708,31 @@ Value *llvm::FindInsertedValue(Value *V, ArrayRef<unsigned> idx_range,
    }
    // Otherwise, we don't know (such as, extracting from a function return value
    // or load instruction)
-  return 0;
+  return nullptr;
  }
  
  /// GetPointerBaseWithConstantOffset - Analyze the specified pointer to see if
  /// it can be expressed as a base pointer plus a constant offset.  Return the
  /// base and offset to the caller.
  Value *llvm::GetPointerBaseWithConstantOffset(Value *Ptr, int64_t &Offset,
-                                              const DataLayout *TD) {
+                                              const DataLayout *DL) {
    // Without DataLayout, conservatively assume 64-bit offsets, which is
    // the widest we support.
-  unsigned BitWidth = TD ? TD->getPointerSizeInBits() : 64;
+  unsigned BitWidth = DL ? DL->getPointerTypeSizeInBits(Ptr->getType()) : 64;
    APInt ByteOffset(BitWidth, 0);
    while (1) {
      if (Ptr->getType()->isVectorTy())
        break;
  
      if (GEPOperator *GEP = dyn_cast<GEPOperator>(Ptr)) {
-      APInt GEPOffset(BitWidth, 0);
-      if (TD && !GEP->accumulateConstantOffset(*TD, GEPOffset))
-        break;
-      ByteOffset += GEPOffset;
+      if (DL) {
+        APInt GEPOffset(BitWidth, 0);
+        if (!GEP->accumulateConstantOffset(*DL, GEPOffset))
+          break;
+
+        ByteOffset += GEPOffset;
+      }
+
        Ptr = GEP->getPointerOperand();
      } else if (Operator::getOpcode(Ptr) == Instruction::BitCast) {
        Ptr = cast<Operator>(Ptr)->getOperand(0);
@@ -1721,13 +1769,13 @@ bool llvm::getConstantStringInfo(const Value *V, StringRef &Str,
      // Make sure the index-ee is a pointer to array of i8.
      PointerType *PT = cast<PointerType>(GEP->getOperand(0)->getType());
      ArrayType *AT = dyn_cast<ArrayType>(PT->getElementType());
-    if (AT == 0 || !AT->getElementType()->isIntegerTy(8))
+    if (!AT || !AT->getElementType()->isIntegerTy(8))
        return false;
  
      // Check to make sure that the first operand of the GEP is an integer and
      // has value 0 so that we are sure we're indexing into the initializer.
      const ConstantInt *FirstIdx = dyn_cast<ConstantInt>(GEP->getOperand(1));
-    if (FirstIdx == 0 || !FirstIdx->isZero())
+    if (!FirstIdx || !FirstIdx->isZero())
        return false;
  
      // If the second index isn't a ConstantInt, then this is a variable index
@@ -1759,7 +1807,7 @@ bool llvm::getConstantStringInfo(const Value *V, StringRef &Str,
    // Must be a Constant Array
    const ConstantDataArray *Array =
      dyn_cast<ConstantDataArray>(GV->getInitializer());
-  if (Array == 0 || !Array->isString())
+  if (!Array || !Array->isString())
      return false;
  
    // Get the number of elements in the array
@@ -1865,7 +1913,7 @@ llvm::GetUnderlyingObject(Value *V, const DataLayout *TD, unsigned MaxLookup) {
        // See if InstructionSimplify knows any relevant tricks.
        if (Instruction *I = dyn_cast<Instruction>(V))
          // TODO: Acquire a DominatorTree and use it.
-        if (Value *Simplified = SimplifyInstruction(I, TD, 0)) {
+        if (Value *Simplified = SimplifyInstruction(I, TD, nullptr)) {
            V = Simplified;
            continue;
          }
@@ -1912,9 +1960,8 @@ llvm::GetUnderlyingObjects(Value *V,
  /// are lifetime markers.
  ///
  bool llvm::onlyUsedByLifetimeMarkers(const Value *V) {
-  for (Value::const_use_iterator UI = V->use_begin(), UE = V->use_end();
-       UI != UE; ++UI) {
-    const IntrinsicInst *II = dyn_cast<IntrinsicInst>(*UI);
+  for (const User *U : V->users()) {
+    const IntrinsicInst *II = dyn_cast<IntrinsicInst>(U);
      if (!II) return false;
  
      if (II->getIntrinsicID() != Intrinsic::lifetime_start &&
@@ -1959,7 +2006,9 @@ bool llvm::isSafeToSpeculativelyExecute(const Value *V,
    }
    case Instruction::Load: {
      const LoadInst *LI = cast<LoadInst>(Inst);
-    if (!LI->isUnordered())
+    if (!LI->isUnordered() ||
+        // Speculative load may create a race that did not exist in the source.
+        LI->getParent()->getParent()->hasFnAttribute(Attribute::SanitizeThread))
        return false;
      return LI->getPointerOperand()->isDereferenceablePointer();
    }
@@ -1986,6 +2035,12 @@ bool llvm::isSafeToSpeculativelyExecute(const Value *V,
         case Intrinsic::umul_with_overflow:
         case Intrinsic::usub_with_overflow:
           return true;
+       // Sqrt should be OK, since the llvm sqrt intrinsic isn't defined to set
+       // errno like libm sqrt would. fma and fmuladd are allowed too.
+       case Intrinsic::sqrt:
+       case Intrinsic::fma:
+       case Intrinsic::fmuladd:
+         return true;
         // TODO: some fp intrinsics are marked as having the same error handling
         // as libm. They're safe to speculate when they won't error.
         // TODO: are convert_{from,to}_fp16 safe?
@@ -2017,16 +2072,21 @@ bool llvm::isSafeToSpeculativelyExecute(const Value *V,
  
  /// isKnownNonNull - Return true if we know that the specified value is never
  /// null.
-bool llvm::isKnownNonNull(const Value *V) {
+bool llvm::isKnownNonNull(const Value *V, const TargetLibraryInfo *TLI) {
    // Alloca never returns null, malloc might.
    if (isa<AllocaInst>(V)) return true;
  
-  // A byval argument is never null.
+  // A byval or inalloca argument is never null.
    if (const Argument *A = dyn_cast<Argument>(V))
-    return A->hasByValAttr();
+    return A->hasByValOrInAllocaAttr();
  
    // Global values are not null unless extern weak.
    if (const GlobalValue *GV = dyn_cast<GlobalValue>(V))
      return !GV->hasExternalWeakLinkage();
+
+  // Calls to operator-new-like functions are treated as never returning null.
+  if (isOperatorNewLikeFn(V, TLI, /*LookThroughBitCast=*/true))
+    return true;
+
    return false;
  }