SLPVectorizer: AllSameOpcode* starts "true" only for instructions

[oota-llvm.git] / lib / Support / APFloat.cpp
diff --git a/lib/Support/APFloat.cpp b/lib/Support/APFloat.cpp

index e1fd3c602b789c4671a2b9e7161ac277413c305f..91b3db59d0e3d82e02271a07acf2339c1b6f1087 100644 (file)
--- a/lib/Support/APFloat.cpp
+++ b/lib/Support/APFloat.cpp
@@ -35,8 +35,7 @@ using namespace llvm;
  
  /* Assumed in hexadecimal significand parsing, and conversion to
     hexadecimal strings.  */
-#define COMPILE_TIME_ASSERT(cond) extern int CTAssert[(cond) ? 1 : -1]
-COMPILE_TIME_ASSERT(integerPartWidth % 4 == 0);
+static_assert(integerPartWidth % 4 == 0, "Part width must be divisible by 4!");
  
  namespace llvm {
  
@@ -53,14 +52,17 @@ namespace llvm {
      /* Number of bits in the significand.  This includes the integer
         bit.  */
      unsigned int precision;
+
+    /* Number of bits actually used in the semantics. */
+    unsigned int sizeInBits;
    };
  
-  const fltSemantics APFloat::IEEEhalf = { 15, -14, 11 };
-  const fltSemantics APFloat::IEEEsingle = { 127, -126, 24 };
-  const fltSemantics APFloat::IEEEdouble = { 1023, -1022, 53 };
-  const fltSemantics APFloat::IEEEquad = { 16383, -16382, 113 };
-  const fltSemantics APFloat::x87DoubleExtended = { 16383, -16382, 64 };
-  const fltSemantics APFloat::Bogus = { 0, 0, 0 };
+  const fltSemantics APFloat::IEEEhalf = { 15, -14, 11, 16 };
+  const fltSemantics APFloat::IEEEsingle = { 127, -126, 24, 32 };
+  const fltSemantics APFloat::IEEEdouble = { 1023, -1022, 53, 64 };
+  const fltSemantics APFloat::IEEEquad = { 16383, -16382, 113, 128 };
+  const fltSemantics APFloat::x87DoubleExtended = { 16383, -16382, 64, 80 };
+  const fltSemantics APFloat::Bogus = { 0, 0, 0, 0 };
  
    /* The PowerPC format consists of two doubles.  It does not map cleanly
       onto the usual format above.  It is approximated using twice the
@@ -73,7 +75,7 @@ namespace llvm {
       to represent all possible values held by a PPC double-double number,
       for example: (long double) 1.0 + (long double) 0x1p-106
       Should this be replaced by a full emulation of PPC double-double?  */
-  const fltSemantics APFloat::PPCDoubleDouble = { 1023, -1022 + 53, 53 + 53 };
+  const fltSemantics APFloat::PPCDoubleDouble = { 1023, -1022 + 53, 53 + 53, 128 };
  
    /* A tight upper bound on number of parts required to hold the value
       pow(5, power) is
@@ -212,15 +214,15 @@ skipLeadingZeroesAndAnyDot(StringRef::iterator begin, StringRef::iterator end,
  {
    StringRef::iterator p = begin;
    *dot = end;
-  while (*p == '0' && p != end)
+  while (p != end && *p == '0')
      p++;
  
-  if (*p == '.') {
+  if (p != end && *p == '.') {
      *dot = p++;
  
      assert(end - begin != 1 && "Significand has no digits");
  
-    while (*p == '0' && p != end)
+    while (p != end && *p == '0')
        p++;
    }
  
@@ -775,18 +777,12 @@ APFloat::bitwiseIsEqual(const APFloat &rhs) const {
      return false;
    if (category==fcZero || category==fcInfinity)
      return true;
-  else if (isFiniteNonZero() && exponent!=rhs.exponent)
+
+  if (isFiniteNonZero() && exponent != rhs.exponent)
      return false;
-  else {
-    int i= partCount();
-    const integerPart* p=significandParts();
-    const integerPart* q=rhs.significandParts();
-    for (; i>0; i--, p++, q++) {
-      if (*p != *q)
-        return false;
-    }
-    return true;
-  }
+
+  return std::equal(significandParts(), significandParts() + partCount(),
+                    rhs.significandParts());
  }
  
  APFloat::APFloat(const fltSemantics &ourSemantics, integerPart value) {
@@ -845,6 +841,21 @@ APFloat::semanticsPrecision(const fltSemantics &semantics)
  {
    return semantics.precision;
  }
+APFloat::ExponentType
+APFloat::semanticsMaxExponent(const fltSemantics &semantics)
+{
+  return semantics.maxExponent;
+}
+APFloat::ExponentType
+APFloat::semanticsMinExponent(const fltSemantics &semantics)
+{
+  return semantics.minExponent;
+}
+unsigned int
+APFloat::semanticsSizeInBits(const fltSemantics &semantics)
+{
+  return semantics.sizeInBits;
+}
  
  const integerPart *
  APFloat::significandParts() const
@@ -927,7 +938,10 @@ APFloat::multiplySignificand(const APFloat &rhs, const APFloat *addend)
    assert(semantics == rhs.semantics);
  
    precision = semantics->precision;
-  newPartsCount = partCountForBits(precision * 2);
+
+  // Allocate space for twice as many bits as the original significand, plus one
+  // extra bit for the addition to overflow into.
+  newPartsCount = partCountForBits(precision * 2 + 1);
  
    if (newPartsCount > 4)
      fullSignificand = new integerPart[newPartsCount];
@@ -949,13 +963,14 @@ APFloat::multiplySignificand(const APFloat &rhs, const APFloat *addend)
    //   *this = a23 . a22 ... a0 * 2^e1
    //     rhs = b23 . b22 ... b0 * 2^e2
    // the result of multiplication is:
-  //   *this = c47 c46 . c45 ... c0 * 2^(e1+e2)
-  // Note that there are two significant bits at the left-hand side of the 
-  // radix point. Move the radix point toward left by one bit, and adjust
-  // exponent accordingly.
-  exponent += 1;
-
-  if (addend) {
+  //   *this = c48 c47 c46 . c45 ... c0 * 2^(e1+e2)
+  // Note that there are three significant bits at the left-hand side of the 
+  // radix point: two for the multiplication, and an overflow bit for the
+  // addition (that will always be zero at this point). Move the radix point
+  // toward left by two bits, and adjust exponent accordingly.
+  exponent += 2;
+
+  if (addend && addend->isNonZero()) {
      // The intermediate result of the multiplication has "2 * precision" 
      // signicant bit; adjust the addend to be consistent with mul result.
      //
@@ -965,13 +980,13 @@ APFloat::multiplySignificand(const APFloat &rhs, const APFloat *addend)
      opStatus status;
      unsigned int extendedPrecision;
  
-    /* Normalize our MSB.  */
-    extendedPrecision = 2 * precision;
-    if (omsb != extendedPrecision) {
+    // Normalize our MSB to one below the top bit to allow for overflow.
+    extendedPrecision = 2 * precision + 1;
+    if (omsb != extendedPrecision - 1) {
        assert(extendedPrecision > omsb);
        APInt::tcShiftLeft(fullSignificand, newPartsCount,
-                         extendedPrecision - omsb);
-      exponent -= extendedPrecision - omsb;
+                         (extendedPrecision - 1) - omsb);
+      exponent -= (extendedPrecision - 1) - omsb;
      }
  
      /* Create new semantics.  */
@@ -988,6 +1003,14 @@ APFloat::multiplySignificand(const APFloat &rhs, const APFloat *addend)
      status = extendedAddend.convert(extendedSemantics, rmTowardZero, &ignored);
      assert(status == opOK);
      (void)status;
+
+    // Shift the significand of the addend right by one bit. This guarantees
+    // that the high bit of the significand is zero (same as fullSignificand),
+    // so the addition will overflow (if it does overflow at all) into the top bit.
+    lost_fraction = extendedAddend.shiftSignificandRight(1);
+    assert(lost_fraction == lfExactlyZero &&
+           "Lost precision while shifting addend for fused-multiply-add.");
+
      lost_fraction = addOrSubtractSignificand(extendedAddend, false);
  
      /* Restore our state.  */
@@ -1003,7 +1026,7 @@ APFloat::multiplySignificand(const APFloat &rhs, const APFloat *addend)
    // having "precision" significant-bits. First, move the radix point from 
    // poision "2*precision - 1" to "precision - 1". The exponent need to be
    // adjusted by "2*precision - 1" - "precision - 1" = "precision".
-  exponent -= precision;
+  exponent -= precision + 1;
  
    // In case MSB resides at the left-hand side of radix point, shift the
    // mantissa right by some amount to make sure the MSB reside right before
@@ -1237,10 +1260,10 @@ APFloat::roundAwayFromZero(roundingMode rounding_mode,
      return false;
  
    case rmTowardPositive:
-    return sign == false;
+    return !sign;
  
    case rmTowardNegative:
-    return sign == true;
+    return sign;
    }
    llvm_unreachable("Invalid rounding mode found");
  }
@@ -1358,7 +1381,7 @@ APFloat::addOrSubtractSpecials(const APFloat &rhs, bool subtract)
  {
    switch (PackCategoriesIntoKey(category, rhs.category)) {
    default:
-    llvm_unreachable(0);
+    llvm_unreachable(nullptr);
  
    case PackCategoriesIntoKey(fcNaN, fcZero):
    case PackCategoriesIntoKey(fcNaN, fcNormal):
@@ -1372,7 +1395,9 @@ APFloat::addOrSubtractSpecials(const APFloat &rhs, bool subtract)
    case PackCategoriesIntoKey(fcZero, fcNaN):
    case PackCategoriesIntoKey(fcNormal, fcNaN):
    case PackCategoriesIntoKey(fcInfinity, fcNaN):
-    sign = false;
+    // We need to be sure to flip the sign here for subtraction because we
+    // don't have a separate negate operation so -NaN becomes 0 - NaN here.
+    sign = rhs.sign ^ subtract;
      category = fcNaN;
      copySignificand(rhs);
      return opOK;
@@ -1417,7 +1442,7 @@ APFloat::addOrSubtractSignificand(const APFloat &rhs, bool subtract)
  
    /* Determine if the operation on the absolute values is effectively
       an addition or subtraction.  */
-  subtract ^= (sign ^ rhs.sign) ? true : false;
+  subtract ^= static_cast<bool>(sign ^ rhs.sign);
  
    /* Are we bigger exponent-wise than the RHS?  */
    bits = exponent - rhs.exponent;
@@ -1485,7 +1510,7 @@ APFloat::multiplySpecials(const APFloat &rhs)
  {
    switch (PackCategoriesIntoKey(category, rhs.category)) {
    default:
-    llvm_unreachable(0);
+    llvm_unreachable(nullptr);
  
    case PackCategoriesIntoKey(fcNaN, fcZero):
    case PackCategoriesIntoKey(fcNaN, fcNormal):
@@ -1529,7 +1554,7 @@ APFloat::divideSpecials(const APFloat &rhs)
  {
    switch (PackCategoriesIntoKey(category, rhs.category)) {
    default:
-    llvm_unreachable(0);
+    llvm_unreachable(nullptr);
  
    case PackCategoriesIntoKey(fcZero, fcNaN):
    case PackCategoriesIntoKey(fcNormal, fcNaN):
@@ -1570,7 +1595,7 @@ APFloat::modSpecials(const APFloat &rhs)
  {
    switch (PackCategoriesIntoKey(category, rhs.category)) {
    default:
-    llvm_unreachable(0);
+    llvm_unreachable(nullptr);
  
    case PackCategoriesIntoKey(fcNaN, fcZero):
    case PackCategoriesIntoKey(fcNaN, fcNormal):
@@ -1746,7 +1771,7 @@ APFloat::remainder(const APFloat &rhs)
  /* Normalized llvm frem (C fmod).
     This is not currently correct in all cases.  */
  APFloat::opStatus
-APFloat::mod(const APFloat &rhs, roundingMode rounding_mode)
+APFloat::mod(const APFloat &rhs)
  {
    opStatus fs;
    fs = modSpecials(rhs);
@@ -1771,10 +1796,10 @@ APFloat::mod(const APFloat &rhs, roundingMode rounding_mode)
                                            rmNearestTiesToEven);
      assert(fs==opOK);   // should always work
  
-    fs = V.multiply(rhs, rounding_mode);
+    fs = V.multiply(rhs, rmNearestTiesToEven);
      assert(fs==opOK || fs==opInexact);   // should not overflow or underflow
  
-    fs = subtract(V, rounding_mode);
+    fs = subtract(V, rmNearestTiesToEven);
      assert(fs==opOK || fs==opInexact);   // likewise
  
      if (isZero())
@@ -1799,7 +1824,7 @@ APFloat::fusedMultiplyAdd(const APFloat &multiplicand,
       extended-precision calculation.  */
    if (isFiniteNonZero() &&
        multiplicand.isFiniteNonZero() &&
-      addend.isFiniteNonZero()) {
+      addend.isFinite()) {
      lostFraction lost_fraction;
  
      lost_fraction = multiplySignificand(multiplicand, &addend);
@@ -1810,7 +1835,7 @@ APFloat::fusedMultiplyAdd(const APFloat &multiplicand,
      /* If two numbers add (exactly) to zero, IEEE 754 decrees it is a
         positive zero unless rounding to minus infinity, except that
         adding two like-signed zeroes gives that zero.  */
-    if (category == fcZero && sign != addend.sign)
+    if (category == fcZero && !(fs & opUnderflow) && sign != addend.sign)
        sign = (rounding_mode == rmTowardNegative);
    } else {
      fs = multiplySpecials(multiplicand);
@@ -1882,7 +1907,7 @@ APFloat::compare(const APFloat &rhs) const
  
    switch (PackCategoriesIntoKey(category, rhs.category)) {
    default:
-    llvm_unreachable(0);
+    llvm_unreachable(nullptr);
  
    case PackCategoriesIntoKey(fcNaN, fcZero):
    case PackCategoriesIntoKey(fcNaN, fcNormal):
@@ -2403,7 +2428,7 @@ APFloat::roundSignificandWithExponent(const integerPart *decSigParts,
                                        roundingMode rounding_mode)
  {
    unsigned int parts, pow5PartCount;
-  fltSemantics calcSemantics = { 32767, -32767, 0 };
+  fltSemantics calcSemantics = { 32767, -32767, 0, 0 };
    integerPart pow5Parts[maxPowerOfFiveParts];
    bool isNearest;
  
@@ -3331,7 +3356,7 @@ APFloat::initFromAPInt(const fltSemantics* Sem, const APInt& api)
    if (Sem == &PPCDoubleDouble)
      return initFromPPCDoubleDoubleAPInt(api);
  
-  llvm_unreachable(0);
+  llvm_unreachable(nullptr);
  }
  
  APFloat
@@ -3355,6 +3380,10 @@ APFloat::getAllOnesValue(unsigned BitWidth, bool isIEEE)
    }
  }
  
+unsigned APFloat::getSizeInBits(const fltSemantics &Sem) {
+  return Sem.sizeInBits;
+}
+
  /// Make this number the largest magnitude normal number in the given
  /// semantics.
  void APFloat::makeLargest(bool Negative) {
@@ -3375,7 +3404,9 @@ void APFloat::makeLargest(bool Negative) {
    // internal consistency.
    const unsigned NumUnusedHighBits =
      PartCount*integerPartWidth - semantics->precision;
-  significand[PartCount - 1] = ~integerPart(0) >> NumUnusedHighBits;
+  significand[PartCount - 1] = (NumUnusedHighBits < integerPartWidth)
+                                   ? (~integerPart(0) >> NumUnusedHighBits)
+                                   : 0;
  }
  
  /// Make this number the smallest magnitude denormal number in the given
@@ -3902,3 +3933,20 @@ APFloat::makeZero(bool Negative) {
    exponent = semantics->minExponent-1;
    APInt::tcSet(significandParts(), 0, partCount());  
  }
+
+APFloat llvm::scalbn(APFloat X, int Exp) {
+  if (X.isInfinity() || X.isZero() || X.isNaN())
+    return X;
+
+  auto MaxExp = X.getSemantics().maxExponent;
+  auto MinExp = X.getSemantics().minExponent;
+  if (Exp > (MaxExp - X.exponent))
+    // Overflow saturates to infinity.
+    return APFloat::getInf(X.getSemantics(), X.isNegative());
+  if (Exp < (MinExp - X.exponent))
+    // Underflow saturates to zero.
+    return APFloat::getZero(X.getSemantics(), X.isNegative());
+
+  X.exponent += Exp;
+  return X;
+}