ARM: support .watchos_version_min and .tvos_version_min.

[oota-llvm.git] / lib / Support / APInt.cpp
diff --git a/lib/Support/APInt.cpp b/lib/Support/APInt.cpp

index e7ff15cadb80847034efe686ff5e2a81da5f4f6e..23f89bb66f9e562204cd136d5ed21c9ad5f414a4 100644 (file)
--- a/lib/Support/APInt.cpp
+++ b/lib/Support/APInt.cpp
@@ -12,21 +12,23 @@
  //
  //===----------------------------------------------------------------------===//
  
-#define DEBUG_TYPE "apint"
  #include "llvm/ADT/APInt.h"
-#include "llvm/ADT/StringRef.h"
  #include "llvm/ADT/FoldingSet.h"
+#include "llvm/ADT/Hashing.h"
  #include "llvm/ADT/SmallString.h"
+#include "llvm/ADT/StringRef.h"
  #include "llvm/Support/Debug.h"
  #include "llvm/Support/ErrorHandling.h"
  #include "llvm/Support/MathExtras.h"
  #include "llvm/Support/raw_ostream.h"
  #include <cmath>
-#include <limits>
-#include <cstring>
  #include <cstdlib>
+#include <cstring>
+#include <limits>
  using namespace llvm;
  
+#define DEBUG_TYPE "apint"
+
  /// A utility function for allocating memory, checking for allocation failures,
  /// and ensuring the contents are zeroed.
  inline static uint64_t* getClearedMemory(unsigned numWords) {
@@ -48,18 +50,20 @@ inline static uint64_t* getMemory(unsigned numWords) {
  inline static unsigned getDigit(char cdigit, uint8_t radix) {
    unsigned r;
  
-  if (radix == 16) {
+  if (radix == 16 || radix == 36) {
      r = cdigit - '0';
      if (r <= 9)
        return r;
  
      r = cdigit - 'A';
-    if (r <= 5)
+    if (r <= radix - 11U)
        return r + 10;
  
      r = cdigit - 'a';
-    if (r <= 5)
+    if (r <= radix - 11U)
        return r + 10;
+    
+    radix = 10;
    }
  
    r = cdigit - '0';
@@ -83,25 +87,33 @@ void APInt::initSlowCase(const APInt& that) {
    memcpy(pVal, that.pVal, getNumWords() * APINT_WORD_SIZE);
  }
  
-
-APInt::APInt(unsigned numBits, unsigned numWords, const uint64_t bigVal[])
-  : BitWidth(numBits), VAL(0) {
+void APInt::initFromArray(ArrayRef<uint64_t> bigVal) {
    assert(BitWidth && "Bitwidth too small");
-  assert(bigVal && "Null pointer detected!");
+  assert(bigVal.data() && "Null pointer detected!");
    if (isSingleWord())
      VAL = bigVal[0];
    else {
      // Get memory, cleared to 0
      pVal = getClearedMemory(getNumWords());
      // Calculate the number of words to copy
-    unsigned words = std::min<unsigned>(numWords, getNumWords());
+    unsigned words = std::min<unsigned>(bigVal.size(), getNumWords());
      // Copy the words from bigVal to pVal
-    memcpy(pVal, bigVal, words * APINT_WORD_SIZE);
+    memcpy(pVal, bigVal.data(), words * APINT_WORD_SIZE);
    }
    // Make sure unused high bits are cleared
    clearUnusedBits();
  }
  
+APInt::APInt(unsigned numBits, ArrayRef<uint64_t> bigVal)
+  : BitWidth(numBits), VAL(0) {
+  initFromArray(bigVal);
+}
+
+APInt::APInt(unsigned numBits, unsigned numWords, const uint64_t bigVal[])
+  : BitWidth(numBits), VAL(0) {
+  initFromArray(makeArrayRef(bigVal, numWords));
+}
+
  APInt::APInt(unsigned numbits, StringRef Str, uint8_t radix)
    : BitWidth(numbits), VAL(0) {
    assert(BitWidth && "Bitwidth too small");
@@ -150,7 +162,7 @@ APInt& APInt::operator=(uint64_t RHS) {
    return clearUnusedBits();
  }
  
-/// Profile - This method 'profiles' an APInt for use with FoldingSet.
+/// This method 'profiles' an APInt for use with FoldingSet.
  void APInt::Profile(FoldingSetNodeID& ID) const {
    ID.AddInteger(BitWidth);
  
@@ -164,7 +176,7 @@ void APInt::Profile(FoldingSetNodeID& ID) const {
      ID.AddInteger(pVal[i]);
  }
  
-/// add_1 - This function adds a single "digit" integer, y, to the multiple
+/// This function adds a single "digit" integer, y, to the multiple
  /// "digit" integer array,  x[]. x[] is modified to reflect the addition and
  /// 1 is returned if there is a carry out, otherwise 0 is returned.
  /// @returns the carry of the addition.
@@ -190,7 +202,7 @@ APInt& APInt::operator++() {
    return clearUnusedBits();
  }
  
-/// sub_1 - This function subtracts a single "digit" (64-bit word), y, from
+/// This function subtracts a single "digit" (64-bit word), y, from
  /// the multi-digit integer array, x[], propagating the borrowed 1 value until
  /// no further borrowing is neeeded or it runs out of "digits" in x.  The result
  /// is 1 if "borrowing" exhausted the digits in x, or 0 if x was not exhausted.
@@ -219,7 +231,7 @@ APInt& APInt::operator--() {
    return clearUnusedBits();
  }
  
-/// add - This function adds the integer array x to the integer array Y and
+/// This function adds the integer array x to the integer array Y and
  /// places the result in dest.
  /// @returns the carry out from the addition
  /// @brief General addition of 64-bit integer arrays
@@ -376,6 +388,7 @@ APInt& APInt::operator*=(const APInt& RHS) {
    clearAllBits();
    unsigned wordsToCopy = destWords >= getNumWords() ? getNumWords() : destWords;
    memcpy(pVal, dest, wordsToCopy * APINT_WORD_SIZE);
+  clearUnusedBits();
  
    // delete dest array and return
    delete[] dest;
@@ -441,18 +454,10 @@ APInt APInt::XorSlowCase(const APInt& RHS) const {
    for (unsigned i = 0; i < numWords; ++i)
      val[i] = pVal[i] ^ RHS.pVal[i];
  
+  APInt Result(val, getBitWidth());
    // 0^0==1 so clear the high bits in case they got set.
-  return APInt(val, getBitWidth()).clearUnusedBits();
-}
-
-bool APInt::operator !() const {
-  if (isSingleWord())
-    return !VAL;
-
-  for (unsigned i = 0; i < getNumWords(); ++i)
-    if (pVal[i])
-      return false;
-  return true;
+  Result.clearUnusedBits();
+  return Result;
  }
  
  APInt APInt::operator*(const APInt& RHS) const {
@@ -461,7 +466,7 @@ APInt APInt::operator*(const APInt& RHS) const {
      return APInt(BitWidth, VAL * RHS.VAL);
    APInt Result(*this);
    Result *= RHS;
-  return Result.clearUnusedBits();
+  return Result;
  }
  
  APInt APInt::operator+(const APInt& RHS) const {
@@ -470,7 +475,8 @@ APInt APInt::operator+(const APInt& RHS) const {
      return APInt(BitWidth, VAL + RHS.VAL);
    APInt Result(BitWidth, 0);
    add(Result.pVal, this->pVal, RHS.pVal, getNumWords());
-  return Result.clearUnusedBits();
+  Result.clearUnusedBits();
+  return Result;
  }
  
  APInt APInt::operator-(const APInt& RHS) const {
@@ -479,13 +485,8 @@ APInt APInt::operator-(const APInt& RHS) const {
      return APInt(BitWidth, VAL - RHS.VAL);
    APInt Result(BitWidth, 0);
    sub(Result.pVal, this->pVal, RHS.pVal, getNumWords());
-  return Result.clearUnusedBits();
-}
-
-bool APInt::operator[](unsigned bitPosition) const {
-  assert(bitPosition < getBitWidth() && "Bit position out of bounds!");
-  return (maskBit(bitPosition) &
-          (isSingleWord() ?  VAL : pVal[whichWord(bitPosition)])) != 0;
+  Result.clearUnusedBits();
+  return Result;
  }
  
  bool APInt::EqualSlowCase(const APInt& RHS) const {
@@ -563,12 +564,12 @@ bool APInt::slt(const APInt& RHS) const {
    if (lhsNeg) {
      // Sign bit is set so perform two's complement to make it positive
      lhs.flipAllBits();
-    lhs++;
+    ++lhs;
    }
    if (rhsNeg) {
      // Sign bit is set so perform two's complement to make it positive
      rhs.flipAllBits();
-    rhs++;
+    ++rhs;
    }
  
    // Now we have unsigned values to compare so do the comparison if necessary
@@ -613,8 +614,9 @@ void APInt::flipBit(unsigned bitPosition) {
  
  unsigned APInt::getBitsNeeded(StringRef str, uint8_t radix) {
    assert(!str.empty() && "Invalid string length");
-  assert((radix == 10 || radix == 8 || radix == 16 || radix == 2) &&
-         "Radix should be 2, 8, 10, or 16!");
+  assert((radix == 10 || radix == 8 || radix == 16 || radix == 2 || 
+          radix == 36) &&
+         "Radix should be 2, 8, 10, 16, or 36!");
  
    size_t slen = str.size();
  
@@ -636,6 +638,8 @@ unsigned APInt::getBitsNeeded(StringRef str, uint8_t radix) {
    if (radix == 16)
      return slen * 4 + isNegative;
  
+  // FIXME: base 36
+  
    // This is grossly inefficient but accurate. We could probably do something
    // with a computation of roughly slen*64/20 and then adjust by the value of
    // the first few digits. But, I'm not sure how accurate that could be.
@@ -644,7 +648,9 @@ unsigned APInt::getBitsNeeded(StringRef str, uint8_t radix) {
    // be too large. This avoids the assertion in the constructor. This
    // calculation doesn't work appropriately for the numbers 0-9, so just use 4
    // bits in that case.
-  unsigned sufficient = slen == 1 ? 4 : slen * 64/18;
+  unsigned sufficient 
+    = radix == 10? (slen == 1 ? 4 : slen * 64/18)
+                 : (slen == 1 ? 7 : slen * 16/3);
  
    // Convert to the actual binary value.
    APInt tmp(sufficient, StringRef(p, slen), radix);
@@ -659,101 +665,27 @@ unsigned APInt::getBitsNeeded(StringRef str, uint8_t radix) {
    }
  }
  
-// From http://www.burtleburtle.net, byBob Jenkins.
-// When targeting x86, both GCC and LLVM seem to recognize this as a
-// rotate instruction.
-#define rot(x,k) (((x)<<(k)) | ((x)>>(32-(k))))
-
-// From http://www.burtleburtle.net, by Bob Jenkins.
-#define mix(a,b,c) \
-  { \
-    a -= c;  a ^= rot(c, 4);  c += b; \
-    b -= a;  b ^= rot(a, 6);  a += c; \
-    c -= b;  c ^= rot(b, 8);  b += a; \
-    a -= c;  a ^= rot(c,16);  c += b; \
-    b -= a;  b ^= rot(a,19);  a += c; \
-    c -= b;  c ^= rot(b, 4);  b += a; \
-  }
-
-// From http://www.burtleburtle.net, by Bob Jenkins.
-#define final(a,b,c) \
-  { \
-    c ^= b; c -= rot(b,14); \
-    a ^= c; a -= rot(c,11); \
-    b ^= a; b -= rot(a,25); \
-    c ^= b; c -= rot(b,16); \
-    a ^= c; a -= rot(c,4);  \
-    b ^= a; b -= rot(a,14); \
-    c ^= b; c -= rot(b,24); \
-  }
-
-// hashword() was adapted from http://www.burtleburtle.net, by Bob
-// Jenkins.  k is a pointer to an array of uint32_t values; length is
-// the length of the key, in 32-bit chunks.  This version only handles
-// keys that are a multiple of 32 bits in size.
-static inline uint32_t hashword(const uint64_t *k64, size_t length)
-{
-  const uint32_t *k = reinterpret_cast<const uint32_t *>(k64);
-  uint32_t a,b,c;
-
-  /* Set up the internal state */
-  a = b = c = 0xdeadbeef + (((uint32_t)length)<<2);
-
-  /*------------------------------------------------- handle most of the key */
-  while (length > 3) {
-    a += k[0];
-    b += k[1];
-    c += k[2];
-    mix(a,b,c);
-    length -= 3;
-    k += 3;
-  }
-
-  /*------------------------------------------- handle the last 3 uint32_t's */
-  switch (length) {                  /* all the case statements fall through */
-  case 3 : c+=k[2];
-  case 2 : b+=k[1];
-  case 1 : a+=k[0];
-    final(a,b,c);
-    case 0:     /* case 0: nothing left to add */
-      break;
-    }
-  /*------------------------------------------------------ report the result */
-  return c;
-}
+hash_code llvm::hash_value(const APInt &Arg) {
+  if (Arg.isSingleWord())
+    return hash_combine(Arg.VAL);
  
-// hashword8() was adapted from http://www.burtleburtle.net, by Bob
-// Jenkins.  This computes a 32-bit hash from one 64-bit word.  When
-// targeting x86 (32 or 64 bit), both LLVM and GCC compile this
-// function into about 35 instructions when inlined.
-static inline uint32_t hashword8(const uint64_t k64)
-{
-  uint32_t a,b,c;
-  a = b = c = 0xdeadbeef + 4;
-  b += k64 >> 32;
-  a += k64 & 0xffffffff;
-  final(a,b,c);
-  return c;
+  return hash_combine_range(Arg.pVal, Arg.pVal + Arg.getNumWords());
  }
-#undef final
-#undef mix
-#undef rot
  
-uint64_t APInt::getHashValue() const {
-  uint64_t hash;
-  if (isSingleWord())
-    hash = hashword8(VAL);
-  else
-    hash = hashword(pVal, getNumWords()*2);
-  return hash;
+bool APInt::isSplat(unsigned SplatSizeInBits) const {
+  assert(getBitWidth() % SplatSizeInBits == 0 &&
+         "SplatSizeInBits must divide width!");
+  // We can check that all parts of an integer are equal by making use of a
+  // little trick: rotate and check if it's still the same value.
+  return *this == rotl(SplatSizeInBits);
  }
  
-/// HiBits - This function returns the high "numBits" bits of this APInt.
+/// This function returns the high "numBits" bits of this APInt.
  APInt APInt::getHiBits(unsigned numBits) const {
    return APIntOps::lshr(*this, BitWidth - numBits);
  }
  
-/// LoBits - This function returns the low "numBits" bits of this APInt.
+/// This function returns the low "numBits" bits of this APInt.
  APInt APInt::getLoBits(unsigned numBits) const {
    return APIntOps::lshr(APIntOps::shl(*this, BitWidth - numBits),
                          BitWidth - numBits);
@@ -773,34 +705,23 @@ unsigned APInt::countLeadingZerosSlowCase() const {
    unsigned i = getNumWords();
    integerPart MSW = pVal[i-1] & MSWMask;
    if (MSW)
-    return CountLeadingZeros_64(MSW) - (APINT_BITS_PER_WORD - BitsInMSW);
+    return llvm::countLeadingZeros(MSW) - (APINT_BITS_PER_WORD - BitsInMSW);
  
    unsigned Count = BitsInMSW;
    for (--i; i > 0u; --i) {
      if (pVal[i-1] == 0)
        Count += APINT_BITS_PER_WORD;
      else {
-      Count += CountLeadingZeros_64(pVal[i-1]);
+      Count += llvm::countLeadingZeros(pVal[i-1]);
        break;
      }
    }
    return Count;
  }
  
-static unsigned countLeadingOnes_64(uint64_t V, unsigned skip) {
-  unsigned Count = 0;
-  if (skip)
-    V <<= skip;
-  while (V && (V & (1ULL << 63))) {
-    Count++;
-    V <<= 1;
-  }
-  return Count;
-}
-
  unsigned APInt::countLeadingOnes() const {
    if (isSingleWord())
-    return countLeadingOnes_64(VAL, APINT_BITS_PER_WORD - BitWidth);
+    return llvm::countLeadingOnes(VAL << (APINT_BITS_PER_WORD - BitWidth));
  
    unsigned highWordBits = BitWidth % APINT_BITS_PER_WORD;
    unsigned shift;
@@ -811,13 +732,13 @@ unsigned APInt::countLeadingOnes() const {
      shift = APINT_BITS_PER_WORD - highWordBits;
    }
    int i = getNumWords() - 1;
-  unsigned Count = countLeadingOnes_64(pVal[i], shift);
+  unsigned Count = llvm::countLeadingOnes(pVal[i] << shift);
    if (Count == highWordBits) {
      for (i--; i >= 0; --i) {
        if (pVal[i] == -1ULL)
          Count += APINT_BITS_PER_WORD;
        else {
-        Count += countLeadingOnes_64(pVal[i], 0);
+        Count += llvm::countLeadingOnes(pVal[i]);
          break;
        }
      }
@@ -827,13 +748,13 @@ unsigned APInt::countLeadingOnes() const {
  
  unsigned APInt::countTrailingZeros() const {
    if (isSingleWord())
-    return std::min(unsigned(CountTrailingZeros_64(VAL)), BitWidth);
+    return std::min(unsigned(llvm::countTrailingZeros(VAL)), BitWidth);
    unsigned Count = 0;
    unsigned i = 0;
    for (; i < getNumWords() && pVal[i] == 0; ++i)
      Count += APINT_BITS_PER_WORD;
    if (i < getNumWords())
-    Count += CountTrailingZeros_64(pVal[i]);
+    Count += llvm::countTrailingZeros(pVal[i]);
    return std::min(Count, BitWidth);
  }
  
@@ -843,41 +764,54 @@ unsigned APInt::countTrailingOnesSlowCase() const {
    for (; i < getNumWords() && pVal[i] == -1ULL; ++i)
      Count += APINT_BITS_PER_WORD;
    if (i < getNumWords())
-    Count += CountTrailingOnes_64(pVal[i]);
+    Count += llvm::countTrailingOnes(pVal[i]);
    return std::min(Count, BitWidth);
  }
  
  unsigned APInt::countPopulationSlowCase() const {
    unsigned Count = 0;
    for (unsigned i = 0; i < getNumWords(); ++i)
-    Count += CountPopulation_64(pVal[i]);
+    Count += llvm::countPopulation(pVal[i]);
    return Count;
  }
  
+/// Perform a logical right-shift from Src to Dst, which must be equal or
+/// non-overlapping, of Words words, by Shift, which must be less than 64.
+static void lshrNear(uint64_t *Dst, uint64_t *Src, unsigned Words,
+                     unsigned Shift) {
+  uint64_t Carry = 0;
+  for (int I = Words - 1; I >= 0; --I) {
+    uint64_t Tmp = Src[I];
+    Dst[I] = (Tmp >> Shift) | Carry;
+    Carry = Tmp << (64 - Shift);
+  }
+}
+
  APInt APInt::byteSwap() const {
    assert(BitWidth >= 16 && BitWidth % 16 == 0 && "Cannot byteswap!");
    if (BitWidth == 16)
      return APInt(BitWidth, ByteSwap_16(uint16_t(VAL)));
-  else if (BitWidth == 32)
+  if (BitWidth == 32)
      return APInt(BitWidth, ByteSwap_32(unsigned(VAL)));
-  else if (BitWidth == 48) {
+  if (BitWidth == 48) {
      unsigned Tmp1 = unsigned(VAL >> 16);
      Tmp1 = ByteSwap_32(Tmp1);
      uint16_t Tmp2 = uint16_t(VAL);
      Tmp2 = ByteSwap_16(Tmp2);
      return APInt(BitWidth, (uint64_t(Tmp2) << 32) | Tmp1);
-  } else if (BitWidth == 64)
+  }
+  if (BitWidth == 64)
      return APInt(BitWidth, ByteSwap_64(VAL));
-  else {
-    APInt Result(BitWidth, 0);
-    char *pByte = (char*)Result.pVal;
-    for (unsigned i = 0; i < BitWidth / APINT_WORD_SIZE / 2; ++i) {
-      char Tmp = pByte[i];
-      pByte[i] = pByte[BitWidth / APINT_WORD_SIZE - 1 - i];
-      pByte[BitWidth / APINT_WORD_SIZE - i - 1] = Tmp;
-    }
-    return Result;
+
+  APInt Result(getNumWords() * APINT_BITS_PER_WORD, 0);
+  for (unsigned I = 0, N = getNumWords(); I != N; ++I)
+    Result.pVal[I] = ByteSwap_64(pVal[N - I - 1]);
+  if (Result.BitWidth != BitWidth) {
+    lshrNear(Result.pVal, Result.pVal, getNumWords(),
+             Result.BitWidth - BitWidth);
+    Result.BitWidth = BitWidth;
    }
+  return Result;
  }
  
  APInt llvm::APIntOps::GreatestCommonDivisor(const APInt& API1,
@@ -927,7 +861,7 @@ APInt llvm::APIntOps::RoundDoubleToAPInt(double Double, unsigned width) {
    return isNeg ? -Tmp : Tmp;
  }
  
-/// RoundToDouble - This function converts this APInt to a double.
+/// This function converts this APInt to a double.
  /// The layout for double is as following (IEEE Standard 754):
  ///  --------------------------------------
  /// |  Sign    Exponent    Fraction    Bias |
@@ -995,96 +929,90 @@ double APInt::roundToDouble(bool isSigned) const {
  }
  
  // Truncate to new width.
-APInt &APInt::trunc(unsigned width) {
+APInt APInt::trunc(unsigned width) const {
    assert(width < BitWidth && "Invalid APInt Truncate request");
    assert(width && "Can't truncate to 0 bits");
-  unsigned wordsBefore = getNumWords();
-  BitWidth = width;
-  unsigned wordsAfter = getNumWords();
-  if (wordsBefore != wordsAfter) {
-    if (wordsAfter == 1) {
-      uint64_t *tmp = pVal;
-      VAL = pVal[0];
-      delete [] tmp;
-    } else {
-      uint64_t *newVal = getClearedMemory(wordsAfter);
-      for (unsigned i = 0; i < wordsAfter; ++i)
-        newVal[i] = pVal[i];
-      delete [] pVal;
-      pVal = newVal;
-    }
-  }
-  return clearUnusedBits();
+
+  if (width <= APINT_BITS_PER_WORD)
+    return APInt(width, getRawData()[0]);
+
+  APInt Result(getMemory(getNumWords(width)), width);
+
+  // Copy full words.
+  unsigned i;
+  for (i = 0; i != width / APINT_BITS_PER_WORD; i++)
+    Result.pVal[i] = pVal[i];
+
+  // Truncate and copy any partial word.
+  unsigned bits = (0 - width) % APINT_BITS_PER_WORD;
+  if (bits != 0)
+    Result.pVal[i] = pVal[i] << bits >> bits;
+
+  return Result;
  }
  
  // Sign extend to a new width.
-APInt &APInt::sext(unsigned width) {
+APInt APInt::sext(unsigned width) const {
    assert(width > BitWidth && "Invalid APInt SignExtend request");
-  // If the sign bit isn't set, this is the same as zext.
-  if (!isNegative()) {
-    zext(width);
-    return *this;
+
+  if (width <= APINT_BITS_PER_WORD) {
+    uint64_t val = VAL << (APINT_BITS_PER_WORD - BitWidth);
+    val = (int64_t)val >> (width - BitWidth);
+    return APInt(width, val >> (APINT_BITS_PER_WORD - width));
    }
  
-  // The sign bit is set. First, get some facts
-  unsigned wordsBefore = getNumWords();
-  unsigned wordBits = BitWidth % APINT_BITS_PER_WORD;
-  BitWidth = width;
-  unsigned wordsAfter = getNumWords();
-
-  // Mask the high order word appropriately
-  if (wordsBefore == wordsAfter) {
-    unsigned newWordBits = width % APINT_BITS_PER_WORD;
-    // The extension is contained to the wordsBefore-1th word.
-    uint64_t mask = ~0ULL;
-    if (newWordBits)
-      mask >>= APINT_BITS_PER_WORD - newWordBits;
-    mask <<= wordBits;
-    if (wordsBefore == 1)
-      VAL |= mask;
-    else
-      pVal[wordsBefore-1] |= mask;
-    return clearUnusedBits();
+  APInt Result(getMemory(getNumWords(width)), width);
+
+  // Copy full words.
+  unsigned i;
+  uint64_t word = 0;
+  for (i = 0; i != BitWidth / APINT_BITS_PER_WORD; i++) {
+    word = getRawData()[i];
+    Result.pVal[i] = word;
    }
  
-  uint64_t mask = wordBits == 0 ? 0 : ~0ULL << wordBits;
-  uint64_t *newVal = getMemory(wordsAfter);
-  if (wordsBefore == 1)
-    newVal[0] = VAL | mask;
-  else {
-    for (unsigned i = 0; i < wordsBefore; ++i)
-      newVal[i] = pVal[i];
-    newVal[wordsBefore-1] |= mask;
+  // Read and sign-extend any partial word.
+  unsigned bits = (0 - BitWidth) % APINT_BITS_PER_WORD;
+  if (bits != 0)
+    word = (int64_t)getRawData()[i] << bits >> bits;
+  else
+    word = (int64_t)word >> (APINT_BITS_PER_WORD - 1);
+
+  // Write remaining full words.
+  for (; i != width / APINT_BITS_PER_WORD; i++) {
+    Result.pVal[i] = word;
+    word = (int64_t)word >> (APINT_BITS_PER_WORD - 1);
    }
-  for (unsigned i = wordsBefore; i < wordsAfter; i++)
-    newVal[i] = -1ULL;
-  if (wordsBefore != 1)
-    delete [] pVal;
-  pVal = newVal;
-  return clearUnusedBits();
+
+  // Write any partial word.
+  bits = (0 - width) % APINT_BITS_PER_WORD;
+  if (bits != 0)
+    Result.pVal[i] = word << bits >> bits;
+
+  return Result;
  }
  
  //  Zero extend to a new width.
-APInt &APInt::zext(unsigned width) {
+APInt APInt::zext(unsigned width) const {
    assert(width > BitWidth && "Invalid APInt ZeroExtend request");
-  unsigned wordsBefore = getNumWords();
-  BitWidth = width;
-  unsigned wordsAfter = getNumWords();
-  if (wordsBefore != wordsAfter) {
-    uint64_t *newVal = getClearedMemory(wordsAfter);
-    if (wordsBefore == 1)
-      newVal[0] = VAL;
-    else
-      for (unsigned i = 0; i < wordsBefore; ++i)
-        newVal[i] = pVal[i];
-    if (wordsBefore != 1)
-      delete [] pVal;
-    pVal = newVal;
-  }
-  return *this;
+
+  if (width <= APINT_BITS_PER_WORD)
+    return APInt(width, VAL);
+
+  APInt Result(getMemory(getNumWords(width)), width);
+
+  // Copy words.
+  unsigned i;
+  for (i = 0; i != getNumWords(); i++)
+    Result.pVal[i] = getRawData()[i];
+
+  // Zero remaining words.
+  memset(&Result.pVal[i], 0, (Result.getNumWords() - i) * APINT_WORD_SIZE);
+
+  return Result;
  }
  
-APInt &APInt::zextOrTrunc(unsigned width) {
+APInt APInt::zextOrTrunc(unsigned width) const {
    if (BitWidth < width)
      return zext(width);
    if (BitWidth > width)
@@ -1092,7 +1020,7 @@ APInt &APInt::zextOrTrunc(unsigned width) {
    return *this;
  }
  
-APInt &APInt::sextOrTrunc(unsigned width) {
+APInt APInt::sextOrTrunc(unsigned width) const {
    if (BitWidth < width)
      return sext(width);
    if (BitWidth > width)
@@ -1100,6 +1028,18 @@ APInt &APInt::sextOrTrunc(unsigned width) {
    return *this;
  }
  
+APInt APInt::zextOrSelf(unsigned width) const {
+  if (BitWidth < width)
+    return zext(width);
+  return *this;
+}
+
+APInt APInt::sextOrSelf(unsigned width) const {
+  if (BitWidth < width)
+    return sext(width);
+  return *this;
+}
+
  /// Arithmetic right-shift this APInt by shiftAmt.
  /// @brief Arithmetic right-shift function.
  APInt APInt::ashr(const APInt &shiftAmt) const {
@@ -1169,7 +1109,7 @@ APInt APInt::ashr(unsigned shiftAmt) const {
      // to include in this word.
      val[breakWord] = pVal[breakWord+offset] >> wordShift;
  
-    // Deal with sign extenstion in the break word, and possibly the word before
+    // Deal with sign extension in the break word, and possibly the word before
      // it.
      if (isNegative()) {
        if (wordShift > bitsInWord) {
@@ -1186,7 +1126,9 @@ APInt APInt::ashr(unsigned shiftAmt) const {
    uint64_t fillValue = (isNegative() ? -1ULL : 0);
    for (unsigned i = breakWord+1; i < getNumWords(); ++i)
      val[i] = fillValue;
-  return APInt(val, BitWidth).clearUnusedBits();
+  APInt Result(val, BitWidth);
+  Result.clearUnusedBits();
+  return Result;
  }
  
  /// Logical right-shift this APInt by shiftAmt.
@@ -1199,7 +1141,7 @@ APInt APInt::lshr(const APInt &shiftAmt) const {
  /// @brief Logical right-shift function.
  APInt APInt::lshr(unsigned shiftAmt) const {
    if (isSingleWord()) {
-    if (shiftAmt == BitWidth)
+    if (shiftAmt >= BitWidth)
        return APInt(BitWidth, 0);
      else
        return APInt(BitWidth, this->VAL >> shiftAmt);
@@ -1208,7 +1150,7 @@ APInt APInt::lshr(unsigned shiftAmt) const {
    // If all the bits were shifted out, the result is 0. This avoids issues
    // with shifting by the size of the integer type, which produces undefined
    // results. We define these "undefined results" to always be 0.
-  if (shiftAmt == BitWidth)
+  if (shiftAmt >= BitWidth)
      return APInt(BitWidth, 0);
  
    // If none of the bits are shifted out, the result is *this. This avoids
@@ -1222,12 +1164,10 @@ APInt APInt::lshr(unsigned shiftAmt) const {
  
    // If we are shifting less than a word, compute the shift with a simple carry
    if (shiftAmt < APINT_BITS_PER_WORD) {
-    uint64_t carry = 0;
-    for (int i = getNumWords()-1; i >= 0; --i) {
-      val[i] = (pVal[i] >> shiftAmt) | carry;
-      carry = pVal[i] << (APINT_BITS_PER_WORD - shiftAmt);
-    }
-    return APInt(val, BitWidth).clearUnusedBits();
+    lshrNear(val, pVal, getNumWords(), shiftAmt);
+    APInt Result(val, BitWidth);
+    Result.clearUnusedBits();
+    return Result;
    }
  
    // Compute some values needed by the remaining shift algorithms
@@ -1240,7 +1180,9 @@ APInt APInt::lshr(unsigned shiftAmt) const {
        val[i] = pVal[i+offset];
      for (unsigned i = getNumWords()-offset; i < getNumWords(); i++)
        val[i] = 0;
-    return APInt(val,BitWidth).clearUnusedBits();
+    APInt Result(val, BitWidth);
+    Result.clearUnusedBits();
+    return Result;
    }
  
    // Shift the low order words
@@ -1254,7 +1196,9 @@ APInt APInt::lshr(unsigned shiftAmt) const {
    // Remaining words are 0
    for (unsigned i = breakWord+1; i < getNumWords(); ++i)
      val[i] = 0;
-  return APInt(val, BitWidth).clearUnusedBits();
+  APInt Result(val, BitWidth);
+  Result.clearUnusedBits();
+  return Result;
  }
  
  /// Left-shift this APInt by shiftAmt.
@@ -1287,7 +1231,9 @@ APInt APInt::shlSlowCase(unsigned shiftAmt) const {
        val[i] = pVal[i] << shiftAmt | carry;
        carry = pVal[i] >> (APINT_BITS_PER_WORD - shiftAmt);
      }
-    return APInt(val, BitWidth).clearUnusedBits();
+    APInt Result(val, BitWidth);
+    Result.clearUnusedBits();
+    return Result;
    }
  
    // Compute some values needed by the remaining shift algorithms
@@ -1300,7 +1246,9 @@ APInt APInt::shlSlowCase(unsigned shiftAmt) const {
        val[i] = 0;
      for (unsigned i = offset; i < getNumWords(); i++)
        val[i] = pVal[i-offset];
-    return APInt(val,BitWidth).clearUnusedBits();
+    APInt Result(val, BitWidth);
+    Result.clearUnusedBits();
+    return Result;
    }
  
    // Copy whole words from this to Result.
@@ -1311,7 +1259,9 @@ APInt APInt::shlSlowCase(unsigned shiftAmt) const {
    val[offset] = pVal[0] << wordShift;
    for (i = 0; i < offset; ++i)
      val[i] = 0;
-  return APInt(val, BitWidth).clearUnusedBits();
+  APInt Result(val, BitWidth);
+  Result.clearUnusedBits();
+  return Result;
  }
  
  APInt APInt::rotl(const APInt &rotateAmt) const {
@@ -1319,14 +1269,10 @@ APInt APInt::rotl(const APInt &rotateAmt) const {
  }
  
  APInt APInt::rotl(unsigned rotateAmt) const {
+  rotateAmt %= BitWidth;
    if (rotateAmt == 0)
      return *this;
-  // Don't get too fancy, just use existing shift/or facilities
-  APInt hi(*this);
-  APInt lo(*this);
-  hi.shl(rotateAmt);
-  lo.lshr(BitWidth - rotateAmt);
-  return hi | lo;
+  return shl(rotateAmt) | lshr(BitWidth - rotateAmt);
  }
  
  APInt APInt::rotr(const APInt &rotateAmt) const {
@@ -1334,14 +1280,10 @@ APInt APInt::rotr(const APInt &rotateAmt) const {
  }
  
  APInt APInt::rotr(unsigned rotateAmt) const {
+  rotateAmt %= BitWidth;
    if (rotateAmt == 0)
      return *this;
-  // Don't get too fancy, just use existing shift/or facilities
-  APInt hi(*this);
-  APInt lo(*this);
-  lo.lshr(rotateAmt);
-  hi.shl(BitWidth - rotateAmt);
-  return hi | lo;
+  return lshr(rotateAmt) | shl(BitWidth - rotateAmt);
  }
  
  // Square Root - this method computes and returns the square root of "this".
@@ -1376,18 +1318,13 @@ APInt APInt::sqrt() const {
    // libc sqrt function which will probably use a hardware sqrt computation.
    // This should be faster than the algorithm below.
    if (magnitude < 52) {
-#if HAVE_ROUND
      return APInt(BitWidth,
                   uint64_t(::round(::sqrt(double(isSingleWord()?VAL:pVal[0])))));
-#else
-    return APInt(BitWidth,
-                 uint64_t(::sqrt(double(isSingleWord()?VAL:pVal[0]))) + 0.5);
-#endif
    }
  
    // Okay, all the short cuts are exhausted. We must compute it. The following
    // is a classical Babylonian method for computing the square root. This code
-  // was adapted to APINt from a wikipedia article on such computations.
+  // was adapted to APInt from a wikipedia article on such computations.
    // See http://www.wikipedia.org/ and go to the page named
    // Calculate_an_integer_square_root.
    unsigned nbits = BitWidth, i = 4;
@@ -1421,15 +1358,11 @@ APInt APInt::sqrt() const {
    APInt nextSquare((x_old + 1) * (x_old +1));
    if (this->ult(square))
      return x_old;
-  else if (this->ule(nextSquare)) {
-    APInt midpoint((nextSquare - square).udiv(two));
-    APInt offset(*this - square);
-    if (offset.ult(midpoint))
-      return x_old;
-    else
-      return x_old + 1;
-  } else
-    llvm_unreachable("Error in APInt::sqrt computation");
+  assert(this->ule(nextSquare) && "Error in APInt::sqrt computation");
+  APInt midpoint((nextSquare - square).udiv(two));
+  APInt offset(*this - square);
+  if (offset.ult(midpoint))
+    return x_old;
    return x_old + 1;
  }
  
@@ -1511,7 +1444,7 @@ APInt::ms APInt::magic() const {
        r2 = r2 - ad;
      }
      delta = ad - r2;
-  } while (q1.ule(delta) || (q1 == delta && r1 == 0));
+  } while (q1.ult(delta) || (q1 == delta && r1 == 0));
  
    mag.m = q2 + 1;
    if (d.isNegative()) mag.m = -mag.m;   // resulting magic number
@@ -1523,17 +1456,19 @@ APInt::ms APInt::magic() const {
  /// division by a constant as a sequence of multiplies, adds and shifts.
  /// Requires that the divisor not be 0.  Taken from "Hacker's Delight", Henry
  /// S. Warren, Jr., chapter 10.
-APInt::mu APInt::magicu() const {
+/// LeadingZeros can be used to simplify the calculation if the upper bits
+/// of the divided value are known zero.
+APInt::mu APInt::magicu(unsigned LeadingZeros) const {
    const APInt& d = *this;
    unsigned p;
    APInt nc, delta, q1, r1, q2, r2;
    struct mu magu;
    magu.a = 0;               // initialize "add" indicator
-  APInt allOnes = APInt::getAllOnesValue(d.getBitWidth());
+  APInt allOnes = APInt::getAllOnesValue(d.getBitWidth()).lshr(LeadingZeros);
    APInt signedMin = APInt::getSignedMinValue(d.getBitWidth());
    APInt signedMax = APInt::getSignedMaxValue(d.getBitWidth());
  
-  nc = allOnes - (-d).urem(d);
+  nc = allOnes - (allOnes - d).urem(d);
    p = d.getBitWidth() - 1;  // initialize p
    q1 = signedMin.udiv(nc);  // initialize q1 = 2p/nc
    r1 = signedMin - q1*nc;   // initialize r1 = rem(2p,nc)
@@ -1576,21 +1511,18 @@ static void KnuthDiv(unsigned *u, unsigned *v, unsigned *q, unsigned* r,
    assert(u && "Must provide dividend");
    assert(v && "Must provide divisor");
    assert(q && "Must provide quotient");
-  assert(u != v && u != q && v != q && "Must us different memory");
+  assert(u != v && u != q && v != q && "Must use different memory");
    assert(n>1 && "n must be > 1");
  
-  // Knuth uses the value b as the base of the number system. In our case b
-  // is 2^31 so we just set it to -1u.
-  uint64_t b = uint64_t(1) << 32;
+  // b denotes the base of the number system. In our case b is 2^32.
+  LLVM_CONSTEXPR uint64_t b = uint64_t(1) << 32;
  
-#if 0
    DEBUG(dbgs() << "KnuthDiv: m=" << m << " n=" << n << '\n');
    DEBUG(dbgs() << "KnuthDiv: original:");
    DEBUG(for (int i = m+n; i >=0; i--) dbgs() << " " << u[i]);
    DEBUG(dbgs() << " by");
    DEBUG(for (int i = n; i >0; i--) dbgs() << " " << v[i-1]);
    DEBUG(dbgs() << '\n');
-#endif
    // D1. [Normalize.] Set d = b / (v[n-1] + 1) and multiply all the digits of
    // u and v by d. Note that we have taken Knuth's advice here to use a power
    // of 2 value for d such that d * v[n-1] >= b/2 (b is the base). A power of
@@ -1599,7 +1531,7 @@ static void KnuthDiv(unsigned *u, unsigned *v, unsigned *q, unsigned* r,
    // and v so that its high bits are shifted to the top of v's range without
    // overflow. Note that this can require an extra word in u so that u must
    // be of length m+n+1.
-  unsigned shift = CountLeadingZeros_32(v[n-1]);
+  unsigned shift = countLeadingZeros(v[n-1]);
    unsigned v_carry = 0;
    unsigned u_carry = 0;
    if (shift) {
@@ -1615,13 +1547,12 @@ static void KnuthDiv(unsigned *u, unsigned *v, unsigned *q, unsigned* r,
      }
    }
    u[m+n] = u_carry;
-#if 0
+
    DEBUG(dbgs() << "KnuthDiv:   normal:");
    DEBUG(for (int i = m+n; i >=0; i--) dbgs() << " " << u[i]);
    DEBUG(dbgs() << " by");
    DEBUG(for (int i = n; i >0; i--) dbgs() << " " << v[i-1]);
    DEBUG(dbgs() << '\n');
-#endif
  
    // D2. [Initialize j.]  Set j to m. This is the loop counter over the places.
    int j = m;
@@ -1651,44 +1582,23 @@ static void KnuthDiv(unsigned *u, unsigned *v, unsigned *q, unsigned* r,
      // (u[j+n]u[j+n-1]..u[j]) - qp * (v[n-1]...v[1]v[0]). This computation
      // consists of a simple multiplication by a one-place number, combined with
      // a subtraction.
-    bool isNeg = false;
-    for (unsigned i = 0; i < n; ++i) {
-      uint64_t u_tmp = uint64_t(u[j+i]) | (uint64_t(u[j+i+1]) << 32);
-      uint64_t subtrahend = uint64_t(qp) * uint64_t(v[i]);
-      bool borrow = subtrahend > u_tmp;
-      DEBUG(dbgs() << "KnuthDiv: u_tmp == " << u_tmp
-                   << ", subtrahend == " << subtrahend
-                   << ", borrow = " << borrow << '\n');
-
-      uint64_t result = u_tmp - subtrahend;
-      unsigned k = j + i;
-      u[k++] = (unsigned)(result & (b-1)); // subtract low word
-      u[k++] = (unsigned)(result >> 32);   // subtract high word
-      while (borrow && k <= m+n) { // deal with borrow to the left
-        borrow = u[k] == 0;
-        u[k]--;
-        k++;
-      }
-      isNeg |= borrow;
-      DEBUG(dbgs() << "KnuthDiv: u[j+i] == " << u[j+i] << ",  u[j+i+1] == " <<
-                    u[j+i+1] << '\n');
-    }
-    DEBUG(dbgs() << "KnuthDiv: after subtraction:");
-    DEBUG(for (int i = m+n; i >=0; i--) dbgs() << " " << u[i]);
-    DEBUG(dbgs() << '\n');
      // The digits (u[j+n]...u[j]) should be kept positive; if the result of
      // this step is actually negative, (u[j+n]...u[j]) should be left as the
      // true value plus b**(n+1), namely as the b's complement of
      // the true value, and a "borrow" to the left should be remembered.
-    //
-    if (isNeg) {
-      bool carry = true;  // true because b's complement is "complement + 1"
-      for (unsigned i = 0; i <= m+n; ++i) {
-        u[i] = ~u[i] + carry; // b's complement
-        carry = carry && u[i] == 0;
-      }
+    int64_t borrow = 0;
+    for (unsigned i = 0; i < n; ++i) {
+      uint64_t p = uint64_t(qp) * uint64_t(v[i]);
+      int64_t subres = int64_t(u[j+i]) - borrow - (unsigned)p;
+      u[j+i] = (unsigned)subres;
+      borrow = (p >> 32) - (subres >> 32);
+      DEBUG(dbgs() << "KnuthDiv: u[j+i] = " << u[j+i]
+                   << ", borrow = " << borrow << '\n');
      }
-    DEBUG(dbgs() << "KnuthDiv: after complement:");
+    bool isNeg = u[j+n] < borrow;
+    u[j+n] -= (unsigned)borrow;
+
+    DEBUG(dbgs() << "KnuthDiv: after subtraction:");
      DEBUG(for (int i = m+n; i >=0; i--) dbgs() << " " << u[i]);
      DEBUG(dbgs() << '\n');
  
@@ -1712,7 +1622,7 @@ static void KnuthDiv(unsigned *u, unsigned *v, unsigned *q, unsigned* r,
        u[j+n] += carry;
      }
      DEBUG(dbgs() << "KnuthDiv: after correction:");
-    DEBUG(for (int i = m+n; i >=0; i--) dbgs() <<" " << u[i]);
+    DEBUG(for (int i = m+n; i >=0; i--) dbgs() << " " << u[i]);
      DEBUG(dbgs() << "\nKnuthDiv: digit result = " << q[j] << '\n');
  
    // D7. [Loop on j.]  Decrease j by one. Now if j >= 0, go back to D3.
@@ -1745,9 +1655,7 @@ static void KnuthDiv(unsigned *u, unsigned *v, unsigned *q, unsigned* r,
      }
      DEBUG(dbgs() << '\n');
    }
-#if 0
    DEBUG(dbgs() << '\n');
-#endif
  }
  
  void APInt::divide(const APInt LHS, unsigned lhsWords,
@@ -1770,10 +1678,10 @@ void APInt::divide(const APInt LHS, unsigned lhsWords,
    // Allocate space for the temporary values we need either on the stack, if
    // it will fit, or on the heap if it won't.
    unsigned SPACE[128];
-  unsigned *U = 0;
-  unsigned *V = 0;
-  unsigned *Q = 0;
-  unsigned *R = 0;
+  unsigned *U = nullptr;
+  unsigned *V = nullptr;
+  unsigned *Q = nullptr;
+  unsigned *R = nullptr;
    if ((Remainder?4:3)*n+2*m+1 <= 128) {
      U = &SPACE[0];
      V = &SPACE[m+n+1];
@@ -1871,6 +1779,8 @@ void APInt::divide(const APInt LHS, unsigned lhsWords,
  
      // The quotient is in Q. Reconstitute the quotient into Quotient's low
      // order words.
+    // This case is currently dead as all users of divide() handle trivial cases
+    // earlier.
      if (lhsWords == 1) {
        uint64_t tmp =
          uint64_t(Q[0]) | (uint64_t(Q[1]) << (APINT_BITS_PER_WORD / 2));
@@ -1959,10 +1869,21 @@ APInt APInt::udiv(const APInt& RHS) const {
  
    // We have to compute it the hard way. Invoke the Knuth divide algorithm.
    APInt Quotient(1,0); // to hold result.
-  divide(*this, lhsWords, RHS, rhsWords, &Quotient, 0);
+  divide(*this, lhsWords, RHS, rhsWords, &Quotient, nullptr);
    return Quotient;
  }
  
+APInt APInt::sdiv(const APInt &RHS) const {
+  if (isNegative()) {
+    if (RHS.isNegative())
+      return (-(*this)).udiv(-RHS);
+    return -((-(*this)).udiv(RHS));
+  }
+  if (RHS.isNegative())
+    return -(this->udiv(-RHS));
+  return this->udiv(RHS);
+}
+
  APInt APInt::urem(const APInt& RHS) const {
    assert(BitWidth == RHS.BitWidth && "Bit widths must be the same");
    if (isSingleWord()) {
@@ -1996,12 +1917,35 @@ APInt APInt::urem(const APInt& RHS) const {
  
    // We have to compute it the hard way. Invoke the Knuth divide algorithm.
    APInt Remainder(1,0);
-  divide(*this, lhsWords, RHS, rhsWords, 0, &Remainder);
+  divide(*this, lhsWords, RHS, rhsWords, nullptr, &Remainder);
    return Remainder;
  }
  
+APInt APInt::srem(const APInt &RHS) const {
+  if (isNegative()) {
+    if (RHS.isNegative())
+      return -((-(*this)).urem(-RHS));
+    return -((-(*this)).urem(RHS));
+  }
+  if (RHS.isNegative())
+    return this->urem(-RHS);
+  return this->urem(RHS);
+}
+
  void APInt::udivrem(const APInt &LHS, const APInt &RHS,
                      APInt &Quotient, APInt &Remainder) {
+  assert(LHS.BitWidth == RHS.BitWidth && "Bit widths must be the same");
+
+  // First, deal with the easy case
+  if (LHS.isSingleWord()) {
+    assert(RHS.VAL != 0 && "Divide by zero?");
+    uint64_t QuotVal = LHS.VAL / RHS.VAL;
+    uint64_t RemVal = LHS.VAL % RHS.VAL;
+    Quotient = APInt(LHS.BitWidth, QuotVal);
+    Remainder = APInt(LHS.BitWidth, RemVal);
+    return;
+  }
+
    // Get some size facts about the dividend and divisor
    unsigned lhsBits  = LHS.getActiveBits();
    unsigned lhsWords = !lhsBits ? 0 : (APInt::whichWord(lhsBits - 1) + 1);
@@ -2040,6 +1984,24 @@ void APInt::udivrem(const APInt &LHS, const APInt &RHS,
    divide(LHS, lhsWords, RHS, rhsWords, &Quotient, &Remainder);
  }
  
+void APInt::sdivrem(const APInt &LHS, const APInt &RHS,
+                    APInt &Quotient, APInt &Remainder) {
+  if (LHS.isNegative()) {
+    if (RHS.isNegative())
+      APInt::udivrem(-LHS, -RHS, Quotient, Remainder);
+    else {
+      APInt::udivrem(-LHS, RHS, Quotient, Remainder);
+      Quotient = -Quotient;
+    }
+    Remainder = -Remainder;
+  } else if (RHS.isNegative()) {
+    APInt::udivrem(LHS, -RHS, Quotient, Remainder);
+    Quotient = -Quotient;
+  } else {
+    APInt::udivrem(LHS, RHS, Quotient, Remainder);
+  }
+}
+
  APInt APInt::sadd_ov(const APInt &RHS, bool &Overflow) const {
    APInt Res = *this+RHS;
    Overflow = isNonNegative() == RHS.isNonNegative() &&
@@ -2082,27 +2044,48 @@ APInt APInt::smul_ov(const APInt &RHS, bool &Overflow) const {
    return Res;
  }
  
-APInt APInt::sshl_ov(unsigned ShAmt, bool &Overflow) const {
-  Overflow = ShAmt >= getBitWidth();
+APInt APInt::umul_ov(const APInt &RHS, bool &Overflow) const {
+  APInt Res = *this * RHS;
+
+  if (*this != 0 && RHS != 0)
+    Overflow = Res.udiv(RHS) != *this || Res.udiv(*this) != RHS;
+  else
+    Overflow = false;
+  return Res;
+}
+
+APInt APInt::sshl_ov(const APInt &ShAmt, bool &Overflow) const {
+  Overflow = ShAmt.uge(getBitWidth());
    if (Overflow)
-    ShAmt = getBitWidth()-1;
+    return APInt(BitWidth, 0);
  
    if (isNonNegative()) // Don't allow sign change.
-    Overflow = ShAmt >= countLeadingZeros();
+    Overflow = ShAmt.uge(countLeadingZeros());
    else
-    Overflow = ShAmt >= countLeadingOnes();
+    Overflow = ShAmt.uge(countLeadingOnes());
    
    return *this << ShAmt;
  }
  
+APInt APInt::ushl_ov(const APInt &ShAmt, bool &Overflow) const {
+  Overflow = ShAmt.uge(getBitWidth());
+  if (Overflow)
+    return APInt(BitWidth, 0);
+
+  Overflow = ShAmt.ugt(countLeadingZeros());
+
+  return *this << ShAmt;
+}
+
  
  
  
  void APInt::fromString(unsigned numbits, StringRef str, uint8_t radix) {
    // Check our assumptions here
    assert(!str.empty() && "Invalid string length");
-  assert((radix == 10 || radix == 8 || radix == 16 || radix == 2) &&
-         "Radix should be 2, 8, 10, or 16!");
+  assert((radix == 10 || radix == 8 || radix == 16 || radix == 2 || 
+          radix == 36) &&
+         "Radix should be 2, 8, 10, 16, or 36!");
  
    StringRef::iterator p = str.begin();
    size_t slen = str.size();
@@ -2152,23 +2135,49 @@ void APInt::fromString(unsigned numbits, StringRef str, uint8_t radix) {
    }
    // If its negative, put it in two's complement form
    if (isNeg) {
-    (*this)--;
+    --(*this);
      this->flipAllBits();
    }
  }
  
  void APInt::toString(SmallVectorImpl<char> &Str, unsigned Radix,
-                     bool Signed) const {
-  assert((Radix == 10 || Radix == 8 || Radix == 16 || Radix == 2) &&
-         "Radix should be 2, 8, 10, or 16!");
+                     bool Signed, bool formatAsCLiteral) const {
+  assert((Radix == 10 || Radix == 8 || Radix == 16 || Radix == 2 || 
+          Radix == 36) &&
+         "Radix should be 2, 8, 10, 16, or 36!");
+
+  const char *Prefix = "";
+  if (formatAsCLiteral) {
+    switch (Radix) {
+      case 2:
+        // Binary literals are a non-standard extension added in gcc 4.3:
+        // http://gcc.gnu.org/onlinedocs/gcc-4.3.0/gcc/Binary-constants.html
+        Prefix = "0b";
+        break;
+      case 8:
+        Prefix = "0";
+        break;
+      case 10:
+        break; // No prefix
+      case 16:
+        Prefix = "0x";
+        break;
+      default:
+        llvm_unreachable("Invalid radix!");
+    }
+  }
  
    // First, check for a zero value and just short circuit the logic below.
    if (*this == 0) {
+    while (*Prefix) {
+      Str.push_back(*Prefix);
+      ++Prefix;
+    };
      Str.push_back('0');
      return;
    }
  
-  static const char Digits[] = "0123456789ABCDEF";
+  static const char Digits[] = "0123456789ABCDEFGHIJKLMNOPQRSTUVWXYZ";
  
    if (isSingleWord()) {
      char Buffer[65];
@@ -2187,6 +2196,11 @@ void APInt::toString(SmallVectorImpl<char> &Str, unsigned Radix,
        }
      }
  
+    while (*Prefix) {
+      Str.push_back(*Prefix);
+      ++Prefix;
+    };
+
      while (N) {
        *--BufPtr = Digits[N % Radix];
        N /= Radix;
@@ -2202,17 +2216,22 @@ void APInt::toString(SmallVectorImpl<char> &Str, unsigned Radix,
      // Flip the bits and add one to turn it into the equivalent positive
      // value and put a '-' in the result.
      Tmp.flipAllBits();
-    Tmp++;
+    ++Tmp;
      Str.push_back('-');
    }
  
+  while (*Prefix) {
+    Str.push_back(*Prefix);
+    ++Prefix;
+  };
+
    // We insert the digits backward, then reverse them to get the right order.
    unsigned StartDig = Str.size();
  
    // For the 2, 8 and 16 bit cases, we can just shift instead of divide
    // because the number of bits per digit (1, 3 and 4 respectively) divides
    // equaly.  We just shift until the value is zero.
-  if (Radix != 10) {
+  if (Radix == 2 || Radix == 8 || Radix == 16) {
      // Just shift tmp right for each digit width until it becomes zero
      unsigned ShiftAmt = (Radix == 16 ? 4 : (Radix == 8 ? 3 : 1));
      unsigned MaskAmt = Radix - 1;
@@ -2223,7 +2242,7 @@ void APInt::toString(SmallVectorImpl<char> &Str, unsigned Radix,
        Tmp = Tmp.lshr(ShiftAmt);
      }
    } else {
-    APInt divisor(4, 10);
+    APInt divisor(Radix == 10? 4 : 8, Radix);
      while (Tmp != 0) {
        APInt APdigit(1, 0);
        APInt tmp2(Tmp.getBitWidth(), 0);
@@ -2240,12 +2259,11 @@ void APInt::toString(SmallVectorImpl<char> &Str, unsigned Radix,
    std::reverse(Str.begin()+StartDig, Str.end());
  }
  
-/// toString - This returns the APInt as a std::string.  Note that this is an
-/// inefficient method.  It is better to pass in a SmallVector/SmallString
-/// to the methods above.
+/// Returns the APInt as a std::string. Note that this is an inefficient method.
+/// It is better to pass in a SmallVector/SmallString to the methods above.
  std::string APInt::toString(unsigned Radix = 10, bool Signed = true) const {
    SmallString<40> S;
-  toString(S, Radix, Signed);
+  toString(S, Radix, Signed, /* formatAsCLiteral = */false);
    return S.str();
  }
  
@@ -2255,13 +2273,13 @@ void APInt::dump() const {
    this->toStringUnsigned(U);
    this->toStringSigned(S);
    dbgs() << "APInt(" << BitWidth << "b, "
-         << U.str() << "u " << S.str() << "s)";
+         << U << "u " << S << "s)";
  }
  
  void APInt::print(raw_ostream &OS, bool isSigned) const {
    SmallString<40> S;
-  this->toString(S, 10, isSigned);
-  OS << S.str();
+  this->toString(S, 10, isSigned, /* formatAsCLiteral = */false);
+  OS << S;
  }
  
  // This implements a variety of operations on a representation of
@@ -2269,8 +2287,7 @@ void APInt::print(raw_ostream &OS, bool isSigned) const {
  
  // Assumed by lowHalf, highHalf, partMSB and partLSB.  A fairly safe
  // and unrestricting assumption.
-#define COMPILE_TIME_ASSERT(cond) extern int CTAssert[(cond) ? 1 : -1]
-COMPILE_TIME_ASSERT(integerPartWidth % 2 == 0);
+static_assert(integerPartWidth % 2 == 0, "Part width must be divisible by 2!");
  
  /* Some handy functions local to this file.  */
  namespace {
@@ -2304,24 +2321,7 @@ namespace {
    static unsigned int
    partMSB(integerPart value)
    {
-    unsigned int n, msb;
-
-    if (value == 0)
-      return -1U;
-
-    n = integerPartWidth / 2;
-
-    msb = 0;
-    do {
-      if (value >> n) {
-        value >>= n;
-        msb += n;
-      }
-
-      n >>= 1;
-    } while (n);
-
-    return msb;
+    return findLastSet(value, ZB_Max);
    }
  
    /* Returns the bit number of the least significant set bit of a
@@ -2329,24 +2329,7 @@ namespace {
    static unsigned int
    partLSB(integerPart value)
    {
-    unsigned int n, lsb;
-
-    if (value == 0)
-      return -1U;
-
-    lsb = integerPartWidth - 1;
-    n = integerPartWidth / 2;
-
-    do {
-      if (value << n) {
-        value <<= n;
-        lsb -= n;
-      }
-
-      n >>= 1;
-    } while (n);
-
-    return lsb;
+    return findFirstSet(value, ZB_Max);
    }
  }
  
@@ -2888,6 +2871,20 @@ APInt::tcIncrement(integerPart *dst, unsigned int parts)
    return i == parts;
  }
  
+/* Decrement a bignum in-place, return the borrow flag.  */
+integerPart
+APInt::tcDecrement(integerPart *dst, unsigned int parts) {
+  for (unsigned int i = 0; i < parts; i++) {
+    // If the current word is non-zero, then the decrement has no effect on the
+    // higher-order words of the integer and no borrow can occur. Exit early.
+    if (dst[i]--)
+      return 0;
+  }
+  // If every word was zero, then there is a borrow.
+  return 1;
+}
+
+
  /* Set the least significant BITS bits of a bignum, clear the
     rest.  */
  void