Fix undefined behavior.

[oota-llvm.git] / lib / Support / APInt.cpp
diff --git a/lib/Support/APInt.cpp b/lib/Support/APInt.cpp

index 73bf774b171762301395eaac7c4cc4632ce1b51d..0d4e0f9f752aff20b341283196aacadcb2e871b8 100644 (file)
--- a/lib/Support/APInt.cpp
+++ b/lib/Support/APInt.cpp
@@ -14,9 +14,11 @@
  
  #define DEBUG_TYPE "apint"
  #include "llvm/ADT/APInt.h"
+#include "llvm/ADT/StringRef.h"
  #include "llvm/ADT/FoldingSet.h"
  #include "llvm/ADT/SmallString.h"
  #include "llvm/Support/Debug.h"
+#include "llvm/Support/ErrorHandling.h"
  #include "llvm/Support/MathExtras.h"
  #include "llvm/Support/raw_ostream.h"
  #include <cmath>
@@ -34,7 +36,7 @@ inline static uint64_t* getClearedMemory(unsigned numWords) {
    return result;
  }
  
-/// A utility function for allocating memory and checking for allocation 
+/// A utility function for allocating memory and checking for allocation
  /// failure.  The content is not zeroed.
  inline static uint64_t* getMemory(unsigned numWords) {
    uint64_t * result = new uint64_t[numWords];
@@ -42,10 +44,38 @@ inline static uint64_t* getMemory(unsigned numWords) {
    return result;
  }
  
+/// A utility function that converts a character to a digit.
+inline static unsigned getDigit(char cdigit, uint8_t radix) {
+  unsigned r;
+
+  if (radix == 16 || radix == 36) {
+    r = cdigit - '0';
+    if (r <= 9)
+      return r;
+
+    r = cdigit - 'A';
+    if (r <= radix - 11U)
+      return r + 10;
+
+    r = cdigit - 'a';
+    if (r <= radix - 11U)
+      return r + 10;
+    
+    radix = 10;
+  }
+
+  r = cdigit - '0';
+  if (r < radix)
+    return r;
+
+  return -1U;
+}
+
+
  void APInt::initSlowCase(unsigned numBits, uint64_t val, bool isSigned) {
    pVal = getClearedMemory(getNumWords());
    pVal[0] = val;
-  if (isSigned && int64_t(val) < 0) 
+  if (isSigned && int64_t(val) < 0)
      for (unsigned i = 1; i < getNumWords(); ++i)
        pVal[i] = -1ULL;
  }
@@ -55,30 +85,37 @@ void APInt::initSlowCase(const APInt& that) {
    memcpy(pVal, that.pVal, getNumWords() * APINT_WORD_SIZE);
  }
  
-
-APInt::APInt(unsigned numBits, unsigned numWords, const uint64_t bigVal[])
-  : BitWidth(numBits), VAL(0) {
-  assert(BitWidth && "bitwidth too small");
-  assert(bigVal && "Null pointer detected!");
+void APInt::initFromArray(ArrayRef<uint64_t> bigVal) {
+  assert(BitWidth && "Bitwidth too small");
+  assert(bigVal.data() && "Null pointer detected!");
    if (isSingleWord())
      VAL = bigVal[0];
    else {
      // Get memory, cleared to 0
      pVal = getClearedMemory(getNumWords());
      // Calculate the number of words to copy
-    unsigned words = std::min<unsigned>(numWords, getNumWords());
+    unsigned words = std::min<unsigned>(bigVal.size(), getNumWords());
      // Copy the words from bigVal to pVal
-    memcpy(pVal, bigVal, words * APINT_WORD_SIZE);
+    memcpy(pVal, bigVal.data(), words * APINT_WORD_SIZE);
    }
    // Make sure unused high bits are cleared
    clearUnusedBits();
  }
  
-APInt::APInt(unsigned numbits, const char StrStart[], unsigned slen,
-             uint8_t radix) 
+APInt::APInt(unsigned numBits, ArrayRef<uint64_t> bigVal)
+  : BitWidth(numBits), VAL(0) {
+  initFromArray(bigVal);
+}
+
+APInt::APInt(unsigned numBits, unsigned numWords, const uint64_t bigVal[])
+  : BitWidth(numBits), VAL(0) {
+  initFromArray(makeArrayRef(bigVal, numWords));
+}
+
+APInt::APInt(unsigned numbits, StringRef Str, uint8_t radix)
    : BitWidth(numbits), VAL(0) {
-  assert(BitWidth && "bitwidth too small");
-  fromString(numbits, StrStart, slen, radix);
+  assert(BitWidth && "Bitwidth too small");
+  fromString(numbits, Str, radix);
  }
  
  APInt& APInt::AssignSlowCase(const APInt& RHS) {
@@ -99,7 +136,7 @@ APInt& APInt::AssignSlowCase(const APInt& RHS) {
      VAL = 0;
      pVal = getMemory(RHS.getNumWords());
      memcpy(pVal, RHS.pVal, RHS.getNumWords() * APINT_WORD_SIZE);
-  } else if (getNumWords() == RHS.getNumWords()) 
+  } else if (getNumWords() == RHS.getNumWords())
      memcpy(pVal, RHS.pVal, RHS.getNumWords() * APINT_WORD_SIZE);
    else if (RHS.isSingleWord()) {
      delete [] pVal;
@@ -114,7 +151,7 @@ APInt& APInt::AssignSlowCase(const APInt& RHS) {
  }
  
  APInt& APInt::operator=(uint64_t RHS) {
-  if (isSingleWord()) 
+  if (isSingleWord())
      VAL = RHS;
    else {
      pVal[0] = RHS;
@@ -126,7 +163,7 @@ APInt& APInt::operator=(uint64_t RHS) {
  /// Profile - This method 'profiles' an APInt for use with FoldingSet.
  void APInt::Profile(FoldingSetNodeID& ID) const {
    ID.AddInteger(BitWidth);
-  
+
    if (isSingleWord()) {
      ID.AddInteger(VAL);
      return;
@@ -137,7 +174,7 @@ void APInt::Profile(FoldingSetNodeID& ID) const {
      ID.AddInteger(pVal[i]);
  }
  
-/// add_1 - This function adds a single "digit" integer, y, to the multiple 
+/// add_1 - This function adds a single "digit" integer, y, to the multiple
  /// "digit" integer array,  x[]. x[] is modified to reflect the addition and
  /// 1 is returned if there is a carry out, otherwise 0 is returned.
  /// @returns the carry of the addition.
@@ -156,15 +193,15 @@ static bool add_1(uint64_t dest[], uint64_t x[], unsigned len, uint64_t y) {
  
  /// @brief Prefix increment operator. Increments the APInt by one.
  APInt& APInt::operator++() {
-  if (isSingleWord()) 
+  if (isSingleWord())
      ++VAL;
    else
      add_1(pVal, pVal, getNumWords(), 1);
    return clearUnusedBits();
  }
  
-/// sub_1 - This function subtracts a single "digit" (64-bit word), y, from 
-/// the multi-digit integer array, x[], propagating the borrowed 1 value until 
+/// sub_1 - This function subtracts a single "digit" (64-bit word), y, from
+/// the multi-digit integer array, x[], propagating the borrowed 1 value until
  /// no further borrowing is neeeded or it runs out of "digits" in x.  The result
  /// is 1 if "borrowing" exhausted the digits in x, or 0 if x was not exhausted.
  /// In other words, if y > x then this function returns 1, otherwise 0.
@@ -173,7 +210,7 @@ static bool sub_1(uint64_t x[], unsigned len, uint64_t y) {
    for (unsigned i = 0; i < len; ++i) {
      uint64_t X = x[i];
      x[i] -= y;
-    if (y > X) 
+    if (y > X)
        y = 1;  // We have to "borrow 1" from next "digit"
      else {
        y = 0;  // No need to borrow
@@ -185,7 +222,7 @@ static bool sub_1(uint64_t x[], unsigned len, uint64_t y) {
  
  /// @brief Prefix decrement operator. Decrements the APInt by one.
  APInt& APInt::operator--() {
-  if (isSingleWord()) 
+  if (isSingleWord())
      --VAL;
    else
      sub_1(pVal, getNumWords(), 1);
@@ -193,10 +230,10 @@ APInt& APInt::operator--() {
  }
  
  /// add - This function adds the integer array x to the integer array Y and
-/// places the result in dest. 
+/// places the result in dest.
  /// @returns the carry out from the addition
  /// @brief General addition of 64-bit integer arrays
-static bool add(uint64_t *dest, const uint64_t *x, const uint64_t *y, 
+static bool add(uint64_t *dest, const uint64_t *x, const uint64_t *y,
                  unsigned len) {
    bool carry = false;
    for (unsigned i = 0; i< len; ++i) {
@@ -209,10 +246,10 @@ static bool add(uint64_t *dest, const uint64_t *x, const uint64_t *y,
  
  /// Adds the RHS APint to this APInt.
  /// @returns this, after addition of RHS.
-/// @brief Addition assignment operator. 
+/// @brief Addition assignment operator.
  APInt& APInt::operator+=(const APInt& RHS) {
    assert(BitWidth == RHS.BitWidth && "Bit widths must be the same");
-  if (isSingleWord()) 
+  if (isSingleWord())
      VAL += RHS.VAL;
    else {
      add(pVal, pVal, RHS.pVal, getNumWords());
@@ -220,10 +257,10 @@ APInt& APInt::operator+=(const APInt& RHS) {
    return clearUnusedBits();
  }
  
-/// Subtracts the integer array y from the integer array x 
+/// Subtracts the integer array y from the integer array x
  /// @returns returns the borrow out.
  /// @brief Generalized subtraction of 64-bit integer arrays.
-static bool sub(uint64_t *dest, const uint64_t *x, const uint64_t *y, 
+static bool sub(uint64_t *dest, const uint64_t *x, const uint64_t *y,
                  unsigned len) {
    bool borrow = false;
    for (unsigned i = 0; i < len; ++i) {
@@ -236,18 +273,18 @@ static bool sub(uint64_t *dest, const uint64_t *x, const uint64_t *y,
  
  /// Subtracts the RHS APInt from this APInt
  /// @returns this, after subtraction
-/// @brief Subtraction assignment operator. 
+/// @brief Subtraction assignment operator.
  APInt& APInt::operator-=(const APInt& RHS) {
    assert(BitWidth == RHS.BitWidth && "Bit widths must be the same");
-  if (isSingleWord()) 
+  if (isSingleWord())
      VAL -= RHS.VAL;
    else
      sub(pVal, pVal, RHS.pVal, getNumWords());
    return clearUnusedBits();
  }
  
-/// Multiplies an integer array, x by a a uint64_t integer and places the result
-/// into dest. 
+/// Multiplies an integer array, x, by a uint64_t integer and places the result
+/// into dest.
  /// @returns the carry out of the multiplication.
  /// @brief Multiply a multi-digit APInt by a single digit (64-bit) integer.
  static uint64_t mul_1(uint64_t dest[], uint64_t x[], unsigned len, uint64_t y) {
@@ -269,19 +306,19 @@ static uint64_t mul_1(uint64_t dest[], uint64_t x[], unsigned len, uint64_t y) {
      // Determine if the add above introduces carry.
      hasCarry = (dest[i] < carry) ? 1 : 0;
      carry = hx * ly + (dest[i] >> 32) + (hasCarry ? (1ULL << 32) : 0);
-    // The upper limit of carry can be (2^32 - 1)(2^32 - 1) + 
+    // The upper limit of carry can be (2^32 - 1)(2^32 - 1) +
      // (2^32 - 1) + 2^32 = 2^64.
      hasCarry = (!carry && hasCarry) ? 1 : (!carry ? 2 : 0);
  
      carry += (lx * hy) & 0xffffffffULL;
      dest[i] = (carry << 32) | (dest[i] & 0xffffffffULL);
-    carry = (((!carry && hasCarry != 2) || hasCarry == 1) ? (1ULL << 32) : 0) + 
+    carry = (((!carry && hasCarry != 2) || hasCarry == 1) ? (1ULL << 32) : 0) +
              (carry >> 32) + ((lx * hy) >> 32) + hx * hy;
    }
    return carry;
  }
  
-/// Multiplies integer array x by integer array y and stores the result into 
+/// Multiplies integer array x by integer array y and stores the result into
  /// the integer array dest. Note that dest's size must be >= xlen + ylen.
  /// @brief Generalized multiplicate of integer arrays.
  static void mul(uint64_t dest[], uint64_t x[], unsigned xlen, uint64_t y[],
@@ -307,7 +344,7 @@ static void mul(uint64_t dest[], uint64_t x[], unsigned xlen, uint64_t y[],
        resul = (carry << 32) | (resul & 0xffffffffULL);
        dest[i+j] += resul;
        carry = (((!carry && hasCarry != 2) || hasCarry == 1) ? (1ULL << 32) : 0)+
-              (carry >> 32) + (dest[i+j] < resul ? 1 : 0) + 
+              (carry >> 32) + (dest[i+j] < resul ? 1 : 0) +
                ((lx * hy) >> 32) + hx * hy;
      }
      dest[i+xlen] = carry;
@@ -325,7 +362,7 @@ APInt& APInt::operator*=(const APInt& RHS) {
    // Get some bit facts about LHS and check for zero
    unsigned lhsBits = getActiveBits();
    unsigned lhsWords = !lhsBits ? 0 : whichWord(lhsBits - 1) + 1;
-  if (!lhsWords) 
+  if (!lhsWords)
      // 0 * X ===> 0
      return *this;
  
@@ -334,7 +371,7 @@ APInt& APInt::operator*=(const APInt& RHS) {
    unsigned rhsWords = !rhsBits ? 0 : whichWord(rhsBits - 1) + 1;
    if (!rhsWords) {
      // X * 0 ===> 0
-    clear();
+    clearAllBits();
      return *this;
    }
  
@@ -346,9 +383,10 @@ APInt& APInt::operator*=(const APInt& RHS) {
    mul(dest, pVal, lhsWords, RHS.pVal, rhsWords);
  
    // Copy result back into *this
-  clear();
+  clearAllBits();
    unsigned wordsToCopy = destWords >= getNumWords() ? getNumWords() : destWords;
    memcpy(pVal, dest, wordsToCopy * APINT_WORD_SIZE);
+  clearUnusedBits();
  
    // delete dest array and return
    delete[] dest;
@@ -385,7 +423,7 @@ APInt& APInt::operator^=(const APInt& RHS) {
      VAL ^= RHS.VAL;
      this->clearUnusedBits();
      return *this;
-  } 
+  }
    unsigned numWords = getNumWords();
    for (unsigned i = 0; i < numWords; ++i)
      pVal[i] ^= RHS.pVal[i];
@@ -423,7 +461,7 @@ bool APInt::operator !() const {
      return !VAL;
  
    for (unsigned i = 0; i < getNumWords(); ++i)
-    if (pVal[i]) 
+    if (pVal[i])
        return false;
    return true;
  }
@@ -434,7 +472,7 @@ APInt APInt::operator*(const APInt& RHS) const {
      return APInt(BitWidth, VAL * RHS.VAL);
    APInt Result(*this);
    Result *= RHS;
-  return Result.clearUnusedBits();
+  return Result;
  }
  
  APInt APInt::operator+(const APInt& RHS) const {
@@ -456,7 +494,8 @@ APInt APInt::operator-(const APInt& RHS) const {
  }
  
  bool APInt::operator[](unsigned bitPosition) const {
-  return (maskBit(bitPosition) & 
+  assert(bitPosition < getBitWidth() && "Bit position out of bounds!");
+  return (maskBit(bitPosition) &
            (isSingleWord() ?  VAL : pVal[whichWord(bitPosition)])) != 0;
  }
  
@@ -466,7 +505,7 @@ bool APInt::EqualSlowCase(const APInt& RHS) const {
    unsigned n2 = RHS.getActiveBits();
  
    // If the number of bits isn't the same, they aren't equal
-  if (n1 != n2) 
+  if (n1 != n2)
      return false;
  
    // If the number of bits fits in a word, we only need to compare the low word.
@@ -475,7 +514,7 @@ bool APInt::EqualSlowCase(const APInt& RHS) const {
  
    // Otherwise, compare everything
    for (int i = whichWord(n1 - 1); i >= 0; --i)
-    if (pVal[i] != RHS.pVal[i]) 
+    if (pVal[i] != RHS.pVal[i])
        return false;
    return true;
  }
@@ -512,9 +551,9 @@ bool APInt::ult(const APInt& RHS) const {
    // Otherwise, compare all words
    unsigned topWord = whichWord(std::max(n1,n2)-1);
    for (int i = topWord; i >= 0; --i) {
-    if (pVal[i] > RHS.pVal[i]) 
+    if (pVal[i] > RHS.pVal[i])
        return false;
-    if (pVal[i] < RHS.pVal[i]) 
+    if (pVal[i] < RHS.pVal[i])
        return true;
    }
    return false;
@@ -534,12 +573,12 @@ bool APInt::slt(const APInt& RHS) const {
    bool rhsNeg = rhs.isNegative();
    if (lhsNeg) {
      // Sign bit is set so perform two's complement to make it positive
-    lhs.flip();
+    lhs.flipAllBits();
      lhs++;
    }
    if (rhsNeg) {
      // Sign bit is set so perform two's complement to make it positive
-    rhs.flip();
+    rhs.flipAllBits();
      rhs++;
    }
  
@@ -552,50 +591,54 @@ bool APInt::slt(const APInt& RHS) const {
        return true;
    else if (rhsNeg)
      return false;
-  else 
+  else
      return lhs.ult(rhs);
  }
  
-APInt& APInt::set(unsigned bitPosition) {
-  if (isSingleWord()) 
+void APInt::setBit(unsigned bitPosition) {
+  if (isSingleWord())
      VAL |= maskBit(bitPosition);
-  else 
+  else
      pVal[whichWord(bitPosition)] |= maskBit(bitPosition);
-  return *this;
  }
  
  /// Set the given bit to 0 whose position is given as "bitPosition".
  /// @brief Set a given bit to 0.
-APInt& APInt::clear(unsigned bitPosition) {
-  if (isSingleWord()) 
+void APInt::clearBit(unsigned bitPosition) {
+  if (isSingleWord())
      VAL &= ~maskBit(bitPosition);
-  else 
+  else
      pVal[whichWord(bitPosition)] &= ~maskBit(bitPosition);
-  return *this;
  }
  
  /// @brief Toggle every bit to its opposite value.
  
-/// Toggle a given bit to its opposite value whose position is given 
+/// Toggle a given bit to its opposite value whose position is given
  /// as "bitPosition".
  /// @brief Toggles a given bit to its opposite value.
-APInt& APInt::flip(unsigned bitPosition) {
+void APInt::flipBit(unsigned bitPosition) {
    assert(bitPosition < BitWidth && "Out of the bit-width range!");
-  if ((*this)[bitPosition]) clear(bitPosition);
-  else set(bitPosition);
-  return *this;
+  if ((*this)[bitPosition]) clearBit(bitPosition);
+  else setBit(bitPosition);
  }
  
-unsigned APInt::getBitsNeeded(const char* str, unsigned slen, uint8_t radix) {
-  assert(str != 0 && "Invalid value string");
-  assert(slen > 0 && "Invalid string length");
+unsigned APInt::getBitsNeeded(StringRef str, uint8_t radix) {
+  assert(!str.empty() && "Invalid string length");
+  assert((radix == 10 || radix == 8 || radix == 16 || radix == 2 || 
+          radix == 36) &&
+         "Radix should be 2, 8, 10, 16, or 36!");
  
-  // Each computation below needs to know if its negative
-  unsigned isNegative = str[0] == '-';
-  if (isNegative) {
+  size_t slen = str.size();
+
+  // Each computation below needs to know if it's negative.
+  StringRef::iterator p = str.begin();
+  unsigned isNegative = *p == '-';
+  if (*p == '-' || *p == '+') {
+    p++;
      slen--;
-    str++;
+    assert(slen && "String is only a sign, needs a value.");
    }
+
    // For radixes of power-of-two values, the bits required is accurately and
    // easily computed
    if (radix == 2)
@@ -605,22 +648,31 @@ unsigned APInt::getBitsNeeded(const char* str, unsigned slen, uint8_t radix) {
    if (radix == 16)
      return slen * 4 + isNegative;
  
-  // Otherwise it must be radix == 10, the hard case
-  assert(radix == 10 && "Invalid radix");
-
+  // FIXME: base 36
+  
    // This is grossly inefficient but accurate. We could probably do something
    // with a computation of roughly slen*64/20 and then adjust by the value of
    // the first few digits. But, I'm not sure how accurate that could be.
  
    // Compute a sufficient number of bits that is always large enough but might
-  // be too large. This avoids the assertion in the constructor.
-  unsigned sufficient = slen*64/18;
+  // be too large. This avoids the assertion in the constructor. This
+  // calculation doesn't work appropriately for the numbers 0-9, so just use 4
+  // bits in that case.
+  unsigned sufficient 
+    = radix == 10? (slen == 1 ? 4 : slen * 64/18)
+                 : (slen == 1 ? 7 : slen * 16/3);
  
    // Convert to the actual binary value.
-  APInt tmp(sufficient, str, slen, radix);
+  APInt tmp(sufficient, StringRef(p, slen), radix);
  
-  // Compute how many bits are required.
-  return isNegative + tmp.logBase2() + 1;
+  // Compute how many bits are required. If the log is infinite, assume we need
+  // just bit.
+  unsigned log = tmp.logBase2();
+  if (log == (unsigned)-1) {
+    return isNegative + 1;
+  } else {
+    return isNegative + log + 1;
+  }
  }
  
  // From http://www.burtleburtle.net, byBob Jenkins.
@@ -664,15 +716,14 @@ static inline uint32_t hashword(const uint64_t *k64, size_t length)
    a = b = c = 0xdeadbeef + (((uint32_t)length)<<2);
  
    /*------------------------------------------------- handle most of the key */
-  while (length > 3)
-    {
-      a += k[0];
-      b += k[1];
-      c += k[2];
-      mix(a,b,c);
-      length -= 3;
-      k += 3;
-    }
+  while (length > 3) {
+    a += k[0];
+    b += k[1];
+    c += k[2];
+    mix(a,b,c);
+    length -= 3;
+    k += 3;
+  }
  
    /*------------------------------------------- handle the last 3 uint32_t's */
    switch (length) {                  /* all the case statements fall through */
@@ -720,17 +771,28 @@ APInt APInt::getHiBits(unsigned numBits) const {
  
  /// LoBits - This function returns the low "numBits" bits of this APInt.
  APInt APInt::getLoBits(unsigned numBits) const {
-  return APIntOps::lshr(APIntOps::shl(*this, BitWidth - numBits), 
+  return APIntOps::lshr(APIntOps::shl(*this, BitWidth - numBits),
                          BitWidth - numBits);
  }
  
-bool APInt::isPowerOf2() const {
-  return (!!*this) && !(*this & (*this - APInt(BitWidth,1)));
-}
-
  unsigned APInt::countLeadingZerosSlowCase() const {
-  unsigned Count = 0;
-  for (unsigned i = getNumWords(); i > 0u; --i) {
+  // Treat the most significand word differently because it might have
+  // meaningless bits set beyond the precision.
+  unsigned BitsInMSW = BitWidth % APINT_BITS_PER_WORD;
+  integerPart MSWMask;
+  if (BitsInMSW) MSWMask = (integerPart(1) << BitsInMSW) - 1;
+  else {
+    MSWMask = ~integerPart(0);
+    BitsInMSW = APINT_BITS_PER_WORD;
+  }
+
+  unsigned i = getNumWords();
+  integerPart MSW = pVal[i-1] & MSWMask;
+  if (MSW)
+    return CountLeadingZeros_64(MSW) - (APINT_BITS_PER_WORD - BitsInMSW);
+
+  unsigned Count = BitsInMSW;
+  for (--i; i > 0u; --i) {
      if (pVal[i-1] == 0)
        Count += APINT_BITS_PER_WORD;
      else {
@@ -738,10 +800,7 @@ unsigned APInt::countLeadingZerosSlowCase() const {
        break;
      }
    }
-  unsigned remainder = BitWidth % APINT_BITS_PER_WORD;
-  if (remainder)
-    Count -= APINT_BITS_PER_WORD - remainder;
-  return std::min(Count, BitWidth);
+  return Count;
  }
  
  static unsigned countLeadingOnes_64(uint64_t V, unsigned skip) {
@@ -811,33 +870,46 @@ unsigned APInt::countPopulationSlowCase() const {
    return Count;
  }
  
+/// Perform a logical right-shift from Src to Dst, which must be equal or
+/// non-overlapping, of Words words, by Shift, which must be less than 64.
+static void lshrNear(uint64_t *Dst, uint64_t *Src, unsigned Words,
+                     unsigned Shift) {
+  uint64_t Carry = 0;
+  for (int I = Words - 1; I >= 0; --I) {
+    uint64_t Tmp = Src[I];
+    Dst[I] = (Tmp >> Shift) | Carry;
+    Carry = Tmp << (64 - Shift);
+  }
+}
+
  APInt APInt::byteSwap() const {
    assert(BitWidth >= 16 && BitWidth % 16 == 0 && "Cannot byteswap!");
    if (BitWidth == 16)
      return APInt(BitWidth, ByteSwap_16(uint16_t(VAL)));
-  else if (BitWidth == 32)
+  if (BitWidth == 32)
      return APInt(BitWidth, ByteSwap_32(unsigned(VAL)));
-  else if (BitWidth == 48) {
+  if (BitWidth == 48) {
      unsigned Tmp1 = unsigned(VAL >> 16);
      Tmp1 = ByteSwap_32(Tmp1);
      uint16_t Tmp2 = uint16_t(VAL);
      Tmp2 = ByteSwap_16(Tmp2);
      return APInt(BitWidth, (uint64_t(Tmp2) << 32) | Tmp1);
-  } else if (BitWidth == 64)
+  }
+  if (BitWidth == 64)
      return APInt(BitWidth, ByteSwap_64(VAL));
-  else {
-    APInt Result(BitWidth, 0);
-    char *pByte = (char*)Result.pVal;
-    for (unsigned i = 0; i < BitWidth / APINT_WORD_SIZE / 2; ++i) {
-      char Tmp = pByte[i];
-      pByte[i] = pByte[BitWidth / APINT_WORD_SIZE - 1 - i];
-      pByte[BitWidth / APINT_WORD_SIZE - i - 1] = Tmp;
-    }
-    return Result;
+
+  APInt Result(getNumWords() * APINT_BITS_PER_WORD, 0);
+  for (unsigned I = 0, N = getNumWords(); I != N; ++I)
+    Result.pVal[I] = ByteSwap_64(pVal[N - I - 1]);
+  if (Result.BitWidth != BitWidth) {
+    lshrNear(Result.pVal, Result.pVal, getNumWords(),
+             Result.BitWidth - BitWidth);
+    Result.BitWidth = BitWidth;
    }
+  return Result;
  }
  
-APInt llvm::APIntOps::GreatestCommonDivisor(const APInt& API1, 
+APInt llvm::APIntOps::GreatestCommonDivisor(const APInt& API1,
                                              const APInt& API2) {
    APInt A = API1, B = API2;
    while (!!B) {
@@ -870,7 +942,7 @@ APInt llvm::APIntOps::RoundDoubleToAPInt(double Double, unsigned width) {
  
    // If the exponent doesn't shift all bits out of the mantissa
    if (exp < 52)
-    return isNeg ? -APInt(width, mantissa >> (52 - exp)) : 
+    return isNeg ? -APInt(width, mantissa >> (52 - exp)) :
                      APInt(width, mantissa >> (52 - exp));
  
    // If the client didn't provide enough bits for us to shift the mantissa into
@@ -884,22 +956,23 @@ APInt llvm::APIntOps::RoundDoubleToAPInt(double Double, unsigned width) {
    return isNeg ? -Tmp : Tmp;
  }
  
-/// RoundToDouble - This function convert this APInt to a double.
+/// RoundToDouble - This function converts this APInt to a double.
  /// The layout for double is as following (IEEE Standard 754):
  ///  --------------------------------------
  /// |  Sign    Exponent    Fraction    Bias |
  /// |-------------------------------------- |
  /// |  1[63]   11[62-52]   52[51-00]   1023 |
-///  -------------------------------------- 
+///  --------------------------------------
  double APInt::roundToDouble(bool isSigned) const {
  
    // Handle the simple case where the value is contained in one uint64_t.
+  // It is wrong to optimize getWord(0) to VAL; there might be more than one word.
    if (isSingleWord() || getActiveBits() <= APINT_BITS_PER_WORD) {
      if (isSigned) {
-      int64_t sext = (int64_t(VAL) << (64-BitWidth)) >> (64-BitWidth);
+      int64_t sext = (int64_t(getWord(0)) << (64-BitWidth)) >> (64-BitWidth);
        return double(sext);
      } else
-      return double(VAL);
+      return double(getWord(0));
    }
  
    // Determine if the value is negative.
@@ -920,7 +993,7 @@ double APInt::roundToDouble(bool isSigned) const {
    if (exp > 1023) {
      if (!isSigned || !isNeg)
        return std::numeric_limits<double>::infinity();
-    else 
+    else
        return -std::numeric_limits<double>::infinity();
    }
    exp += 1023; // Increment for 1023 bias
@@ -951,96 +1024,90 @@ double APInt::roundToDouble(bool isSigned) const {
  }
  
  // Truncate to new width.
-APInt &APInt::trunc(unsigned width) {
+APInt APInt::trunc(unsigned width) const {
    assert(width < BitWidth && "Invalid APInt Truncate request");
    assert(width && "Can't truncate to 0 bits");
-  unsigned wordsBefore = getNumWords();
-  BitWidth = width;
-  unsigned wordsAfter = getNumWords();
-  if (wordsBefore != wordsAfter) {
-    if (wordsAfter == 1) {
-      uint64_t *tmp = pVal;
-      VAL = pVal[0];
-      delete [] tmp;
-    } else {
-      uint64_t *newVal = getClearedMemory(wordsAfter);
-      for (unsigned i = 0; i < wordsAfter; ++i)
-        newVal[i] = pVal[i];
-      delete [] pVal;
-      pVal = newVal;
-    }
-  }
-  return clearUnusedBits();
+
+  if (width <= APINT_BITS_PER_WORD)
+    return APInt(width, getRawData()[0]);
+
+  APInt Result(getMemory(getNumWords(width)), width);
+
+  // Copy full words.
+  unsigned i;
+  for (i = 0; i != width / APINT_BITS_PER_WORD; i++)
+    Result.pVal[i] = pVal[i];
+
+  // Truncate and copy any partial word.
+  unsigned bits = (0 - width) % APINT_BITS_PER_WORD;
+  if (bits != 0)
+    Result.pVal[i] = pVal[i] << bits >> bits;
+
+  return Result;
  }
  
  // Sign extend to a new width.
-APInt &APInt::sext(unsigned width) {
+APInt APInt::sext(unsigned width) const {
    assert(width > BitWidth && "Invalid APInt SignExtend request");
-  // If the sign bit isn't set, this is the same as zext.
-  if (!isNegative()) {
-    zext(width);
-    return *this;
+
+  if (width <= APINT_BITS_PER_WORD) {
+    uint64_t val = VAL << (APINT_BITS_PER_WORD - BitWidth);
+    val = (int64_t)val >> (width - BitWidth);
+    return APInt(width, val >> (APINT_BITS_PER_WORD - width));
    }
  
-  // The sign bit is set. First, get some facts
-  unsigned wordsBefore = getNumWords();
-  unsigned wordBits = BitWidth % APINT_BITS_PER_WORD;
-  BitWidth = width;
-  unsigned wordsAfter = getNumWords();
-
-  // Mask the high order word appropriately
-  if (wordsBefore == wordsAfter) {
-    unsigned newWordBits = width % APINT_BITS_PER_WORD;
-    // The extension is contained to the wordsBefore-1th word.
-    uint64_t mask = ~0ULL;
-    if (newWordBits)
-      mask >>= APINT_BITS_PER_WORD - newWordBits;
-    mask <<= wordBits;
-    if (wordsBefore == 1)
-      VAL |= mask;
-    else
-      pVal[wordsBefore-1] |= mask;
-    return clearUnusedBits();
+  APInt Result(getMemory(getNumWords(width)), width);
+
+  // Copy full words.
+  unsigned i;
+  uint64_t word = 0;
+  for (i = 0; i != BitWidth / APINT_BITS_PER_WORD; i++) {
+    word = getRawData()[i];
+    Result.pVal[i] = word;
    }
  
-  uint64_t mask = wordBits == 0 ? 0 : ~0ULL << wordBits;
-  uint64_t *newVal = getMemory(wordsAfter);
-  if (wordsBefore == 1)
-    newVal[0] = VAL | mask;
-  else {
-    for (unsigned i = 0; i < wordsBefore; ++i)
-      newVal[i] = pVal[i];
-    newVal[wordsBefore-1] |= mask;
+  // Read and sign-extend any partial word.
+  unsigned bits = (0 - BitWidth) % APINT_BITS_PER_WORD;
+  if (bits != 0)
+    word = (int64_t)getRawData()[i] << bits >> bits;
+  else
+    word = (int64_t)word >> (APINT_BITS_PER_WORD - 1);
+
+  // Write remaining full words.
+  for (; i != width / APINT_BITS_PER_WORD; i++) {
+    Result.pVal[i] = word;
+    word = (int64_t)word >> (APINT_BITS_PER_WORD - 1);
    }
-  for (unsigned i = wordsBefore; i < wordsAfter; i++)
-    newVal[i] = -1ULL;
-  if (wordsBefore != 1)
-    delete [] pVal;
-  pVal = newVal;
-  return clearUnusedBits();
+
+  // Write any partial word.
+  bits = (0 - width) % APINT_BITS_PER_WORD;
+  if (bits != 0)
+    Result.pVal[i] = word << bits >> bits;
+
+  return Result;
  }
  
  //  Zero extend to a new width.
-APInt &APInt::zext(unsigned width) {
+APInt APInt::zext(unsigned width) const {
    assert(width > BitWidth && "Invalid APInt ZeroExtend request");
-  unsigned wordsBefore = getNumWords();
-  BitWidth = width;
-  unsigned wordsAfter = getNumWords();
-  if (wordsBefore != wordsAfter) {
-    uint64_t *newVal = getClearedMemory(wordsAfter);
-    if (wordsBefore == 1)
-      newVal[0] = VAL;
-    else 
-      for (unsigned i = 0; i < wordsBefore; ++i)
-        newVal[i] = pVal[i];
-    if (wordsBefore != 1)
-      delete [] pVal;
-    pVal = newVal;
-  }
-  return *this;
+
+  if (width <= APINT_BITS_PER_WORD)
+    return APInt(width, VAL);
+
+  APInt Result(getMemory(getNumWords(width)), width);
+
+  // Copy words.
+  unsigned i;
+  for (i = 0; i != getNumWords(); i++)
+    Result.pVal[i] = getRawData()[i];
+
+  // Zero remaining words.
+  memset(&Result.pVal[i], 0, (Result.getNumWords() - i) * APINT_WORD_SIZE);
+
+  return Result;
  }
  
-APInt &APInt::zextOrTrunc(unsigned width) {
+APInt APInt::zextOrTrunc(unsigned width) const {
    if (BitWidth < width)
      return zext(width);
    if (BitWidth > width)
@@ -1048,7 +1115,7 @@ APInt &APInt::zextOrTrunc(unsigned width) {
    return *this;
  }
  
-APInt &APInt::sextOrTrunc(unsigned width) {
+APInt APInt::sextOrTrunc(unsigned width) const {
    if (BitWidth < width)
      return sext(width);
    if (BitWidth > width)
@@ -1056,6 +1123,18 @@ APInt &APInt::sextOrTrunc(unsigned width) {
    return *this;
  }
  
+APInt APInt::zextOrSelf(unsigned width) const {
+  if (BitWidth < width)
+    return zext(width);
+  return *this;
+}
+
+APInt APInt::sextOrSelf(unsigned width) const {
+  if (BitWidth < width)
+    return sext(width);
+  return *this;
+}
+
  /// Arithmetic right-shift this APInt by shiftAmt.
  /// @brief Arithmetic right-shift function.
  APInt APInt::ashr(const APInt &shiftAmt) const {
@@ -1076,7 +1155,7 @@ APInt APInt::ashr(unsigned shiftAmt) const {
        return APInt(BitWidth, 0); // undefined
      else {
        unsigned SignBit = APINT_BITS_PER_WORD - BitWidth;
-      return APInt(BitWidth, 
+      return APInt(BitWidth,
          (((int64_t(VAL) << SignBit) >> SignBit) >> shiftAmt));
      }
    }
@@ -1113,11 +1192,11 @@ APInt APInt::ashr(unsigned shiftAmt) const {
        if (bitsInWord < APINT_BITS_PER_WORD)
          val[breakWord] |= ~0ULL << bitsInWord; // set high bits
    } else {
-    // Shift the low order words 
+    // Shift the low order words
      for (unsigned i = 0; i < breakWord; ++i) {
        // This combines the shifted corresponding word with the low bits from
        // the next word (shifted into this word's high bits).
-      val[i] = (pVal[i+offset] >> wordShift) | 
+      val[i] = (pVal[i+offset] >> wordShift) |
                 (pVal[i+offset+1] << (APINT_BITS_PER_WORD - wordShift));
      }
  
@@ -1130,10 +1209,10 @@ APInt APInt::ashr(unsigned shiftAmt) const {
      if (isNegative()) {
        if (wordShift > bitsInWord) {
          if (breakWord > 0)
-          val[breakWord-1] |= 
+          val[breakWord-1] |=
              ~0ULL << (APINT_BITS_PER_WORD - (wordShift - bitsInWord));
          val[breakWord] |= ~0ULL;
-      } else 
+      } else
          val[breakWord] |= (~0ULL << (bitsInWord - wordShift));
      }
    }
@@ -1155,9 +1234,9 @@ APInt APInt::lshr(const APInt &shiftAmt) const {
  /// @brief Logical right-shift function.
  APInt APInt::lshr(unsigned shiftAmt) const {
    if (isSingleWord()) {
-    if (shiftAmt == BitWidth)
+    if (shiftAmt >= BitWidth)
        return APInt(BitWidth, 0);
-    else 
+    else
        return APInt(BitWidth, this->VAL >> shiftAmt);
    }
  
@@ -1168,7 +1247,7 @@ APInt APInt::lshr(unsigned shiftAmt) const {
      return APInt(BitWidth, 0);
  
    // If none of the bits are shifted out, the result is *this. This avoids
-  // issues with shifting by the size of the integer type, which produces 
+  // issues with shifting by the size of the integer type, which produces
    // undefined results in the code below. This is also an optimization.
    if (shiftAmt == 0)
      return *this;
@@ -1178,11 +1257,7 @@ APInt APInt::lshr(unsigned shiftAmt) const {
  
    // If we are shifting less than a word, compute the shift with a simple carry
    if (shiftAmt < APINT_BITS_PER_WORD) {
-    uint64_t carry = 0;
-    for (int i = getNumWords()-1; i >= 0; --i) {
-      val[i] = (pVal[i] >> shiftAmt) | carry;
-      carry = pVal[i] << (APINT_BITS_PER_WORD - shiftAmt);
-    }
+    lshrNear(val, pVal, getNumWords(), shiftAmt);
      return APInt(val, BitWidth).clearUnusedBits();
    }
  
@@ -1199,7 +1274,7 @@ APInt APInt::lshr(unsigned shiftAmt) const {
      return APInt(val,BitWidth).clearUnusedBits();
    }
  
-  // Shift the low order words 
+  // Shift the low order words
    unsigned breakWord = getNumWords() - offset -1;
    for (unsigned i = 0; i < breakWord; ++i)
      val[i] = (pVal[i+offset] >> wordShift) |
@@ -1275,14 +1350,10 @@ APInt APInt::rotl(const APInt &rotateAmt) const {
  }
  
  APInt APInt::rotl(unsigned rotateAmt) const {
+  rotateAmt %= BitWidth;
    if (rotateAmt == 0)
      return *this;
-  // Don't get too fancy, just use existing shift/or facilities
-  APInt hi(*this);
-  APInt lo(*this);
-  hi.shl(rotateAmt);
-  lo.lshr(BitWidth - rotateAmt);
-  return hi | lo;
+  return shl(rotateAmt) | lshr(BitWidth - rotateAmt);
  }
  
  APInt APInt::rotr(const APInt &rotateAmt) const {
@@ -1290,14 +1361,10 @@ APInt APInt::rotr(const APInt &rotateAmt) const {
  }
  
  APInt APInt::rotr(unsigned rotateAmt) const {
+  rotateAmt %= BitWidth;
    if (rotateAmt == 0)
      return *this;
-  // Don't get too fancy, just use existing shift/or facilities
-  APInt hi(*this);
-  APInt lo(*this);
-  lo.lshr(rotateAmt);
-  hi.shl(BitWidth - rotateAmt);
-  return hi | lo;
+  return lshr(rotateAmt) | shl(BitWidth - rotateAmt);
  }
  
  // Square Root - this method computes and returns the square root of "this".
@@ -1306,7 +1373,7 @@ APInt APInt::rotr(unsigned rotateAmt) const {
  // values using less than 52 bits, the value is converted to double and then
  // the libc sqrt function is called. The result is rounded and then converted
  // back to a uint64_t which is then used to construct the result. Finally,
-// the Babylonian method for computing square roots is used. 
+// the Babylonian method for computing square roots is used.
  APInt APInt::sqrt() const {
  
    // Determine the magnitude of the value.
@@ -1318,7 +1385,7 @@ APInt APInt::sqrt() const {
      static const uint8_t results[32] = {
        /*     0 */ 0,
        /*  1- 2 */ 1, 1,
-      /*  3- 6 */ 2, 2, 2, 2, 
+      /*  3- 6 */ 2, 2, 2, 2,
        /*  7-12 */ 3, 3, 3, 3, 3, 3,
        /* 13-20 */ 4, 4, 4, 4, 4, 4, 4, 4,
        /* 21-30 */ 5, 5, 5, 5, 5, 5, 5, 5, 5, 5,
@@ -1332,13 +1399,12 @@ APInt APInt::sqrt() const {
    // libc sqrt function which will probably use a hardware sqrt computation.
    // This should be faster than the algorithm below.
    if (magnitude < 52) {
-#ifdef _MSC_VER
-    // Amazingly, VC++ doesn't have round().
-    return APInt(BitWidth, 
-                 uint64_t(::sqrt(double(isSingleWord()?VAL:pVal[0]))) + 0.5);
-#else
-    return APInt(BitWidth, 
+#if HAVE_ROUND
+    return APInt(BitWidth,
                   uint64_t(::round(::sqrt(double(isSingleWord()?VAL:pVal[0])))));
+#else
+    return APInt(BitWidth,
+                 uint64_t(::sqrt(double(isSingleWord()?VAL:pVal[0])) + 0.5));
  #endif
    }
  
@@ -1346,7 +1412,7 @@ APInt APInt::sqrt() const {
    // is a classical Babylonian method for computing the square root. This code
    // was adapted to APINt from a wikipedia article on such computations.
    // See http://www.wikipedia.org/ and go to the page named
-  // Calculate_an_integer_square_root. 
+  // Calculate_an_integer_square_root.
    unsigned nbits = BitWidth, i = 4;
    APInt testy(BitWidth, 16);
    APInt x_old(BitWidth, 1);
@@ -1354,13 +1420,13 @@ APInt APInt::sqrt() const {
    APInt two(BitWidth, 2);
  
    // Select a good starting value using binary logarithms.
-  for (;; i += 2, testy = testy.shl(2)) 
+  for (;; i += 2, testy = testy.shl(2))
      if (i >= nbits || this->ule(testy)) {
        x_old = x_old.shl(i / 2);
        break;
      }
  
-  // Use the Babylonian method to arrive at the integer square root: 
+  // Use the Babylonian method to arrive at the integer square root:
    for (;;) {
      x_new = (this->udiv(x_old) + x_old).udiv(two);
      if (x_old.ule(x_new))
@@ -1369,24 +1435,20 @@ APInt APInt::sqrt() const {
    }
  
    // Make sure we return the closest approximation
-  // NOTE: The rounding calculation below is correct. It will produce an 
+  // NOTE: The rounding calculation below is correct. It will produce an
    // off-by-one discrepancy with results from pari/gp. That discrepancy has been
-  // determined to be a rounding issue with pari/gp as it begins to use a 
+  // determined to be a rounding issue with pari/gp as it begins to use a
    // floating point representation after 192 bits. There are no discrepancies
    // between this algorithm and pari/gp for bit widths < 192 bits.
    APInt square(x_old * x_old);
    APInt nextSquare((x_old + 1) * (x_old +1));
    if (this->ult(square))
      return x_old;
-  else if (this->ule(nextSquare)) {
-    APInt midpoint((nextSquare - square).udiv(two));
-    APInt offset(*this - square);
-    if (offset.ult(midpoint))
-      return x_old;
-    else
-      return x_old + 1;
-  } else
-    assert(0 && "Error in APInt::sqrt computation");
+  assert(this->ule(nextSquare) && "Error in APInt::sqrt computation");
+  APInt midpoint((nextSquare - square).udiv(two));
+  APInt offset(*this - square);
+  if (offset.ult(midpoint))
+    return x_old;
    return x_old + 1;
  }
  
@@ -1409,7 +1471,7 @@ APInt APInt::multiplicativeInverse(const APInt& modulo) const {
    APInt r[2] = { modulo, *this };
    APInt t[2] = { APInt(BitWidth, 0), APInt(BitWidth, 1) };
    APInt q(BitWidth, 0);
-  
+
    unsigned i;
    for (i = 0; r[i^1] != 0; i ^= 1) {
      // An overview of the math without the confusing bit-flipping:
@@ -1442,11 +1504,9 @@ APInt::ms APInt::magic() const {
    const APInt& d = *this;
    unsigned p;
    APInt ad, anc, delta, q1, r1, q2, r2, t;
-  APInt allOnes = APInt::getAllOnesValue(d.getBitWidth());
    APInt signedMin = APInt::getSignedMinValue(d.getBitWidth());
-  APInt signedMax = APInt::getSignedMaxValue(d.getBitWidth());
    struct ms mag;
-  
+
    ad = d.abs();
    t = signedMin + (d.lshr(d.getBitWidth() - 1));
    anc = t - 1 - t.urem(ad);   // absolute value of nc
@@ -1470,8 +1530,8 @@ APInt::ms APInt::magic() const {
        r2 = r2 - ad;
      }
      delta = ad - r2;
-  } while (q1.ule(delta) || (q1 == delta && r1 == 0));
-  
+  } while (q1.ult(delta) || (q1 == delta && r1 == 0));
+
    mag.m = q2 + 1;
    if (d.isNegative()) mag.m = -mag.m;   // resulting magic number
    mag.s = p - d.getBitWidth();          // resulting shift
@@ -1482,13 +1542,15 @@ APInt::ms APInt::magic() const {
  /// division by a constant as a sequence of multiplies, adds and shifts.
  /// Requires that the divisor not be 0.  Taken from "Hacker's Delight", Henry
  /// S. Warren, Jr., chapter 10.
-APInt::mu APInt::magicu() const {
+/// LeadingZeros can be used to simplify the calculation if the upper bits
+/// of the divided value are known zero.
+APInt::mu APInt::magicu(unsigned LeadingZeros) const {
    const APInt& d = *this;
    unsigned p;
    APInt nc, delta, q1, r1, q2, r2;
    struct mu magu;
    magu.a = 0;               // initialize "add" indicator
-  APInt allOnes = APInt::getAllOnesValue(d.getBitWidth());
+  APInt allOnes = APInt::getAllOnesValue(d.getBitWidth()).lshr(LeadingZeros);
    APInt signedMin = APInt::getSignedMinValue(d.getBitWidth());
    APInt signedMax = APInt::getSignedMaxValue(d.getBitWidth());
  
@@ -1543,17 +1605,17 @@ static void KnuthDiv(unsigned *u, unsigned *v, unsigned *q, unsigned* r,
    uint64_t b = uint64_t(1) << 32;
  
  #if 0
-  DEBUG(cerr << "KnuthDiv: m=" << m << " n=" << n << '\n');
-  DEBUG(cerr << "KnuthDiv: original:");
-  DEBUG(for (int i = m+n; i >=0; i--) cerr << " " << std::setbase(16) << u[i]);
-  DEBUG(cerr << " by");
-  DEBUG(for (int i = n; i >0; i--) cerr << " " << std::setbase(16) << v[i-1]);
-  DEBUG(cerr << '\n');
+  DEBUG(dbgs() << "KnuthDiv: m=" << m << " n=" << n << '\n');
+  DEBUG(dbgs() << "KnuthDiv: original:");
+  DEBUG(for (int i = m+n; i >=0; i--) dbgs() << " " << u[i]);
+  DEBUG(dbgs() << " by");
+  DEBUG(for (int i = n; i >0; i--) dbgs() << " " << v[i-1]);
+  DEBUG(dbgs() << '\n');
  #endif
-  // D1. [Normalize.] Set d = b / (v[n-1] + 1) and multiply all the digits of 
-  // u and v by d. Note that we have taken Knuth's advice here to use a power 
-  // of 2 value for d such that d * v[n-1] >= b/2 (b is the base). A power of 
-  // 2 allows us to shift instead of multiply and it is easy to determine the 
+  // D1. [Normalize.] Set d = b / (v[n-1] + 1) and multiply all the digits of
+  // u and v by d. Note that we have taken Knuth's advice here to use a power
+  // of 2 value for d such that d * v[n-1] >= b/2 (b is the base). A power of
+  // 2 allows us to shift instead of multiply and it is easy to determine the
    // shift amount from the leading zeros.  We are basically normalizing the u
    // and v so that its high bits are shifted to the top of v's range without
    // overflow. Note that this can require an extra word in u so that u must
@@ -1575,27 +1637,27 @@ static void KnuthDiv(unsigned *u, unsigned *v, unsigned *q, unsigned* r,
    }
    u[m+n] = u_carry;
  #if 0
-  DEBUG(cerr << "KnuthDiv:   normal:");
-  DEBUG(for (int i = m+n; i >=0; i--) cerr << " " << std::setbase(16) << u[i]);
-  DEBUG(cerr << " by");
-  DEBUG(for (int i = n; i >0; i--) cerr << " " << std::setbase(16) << v[i-1]);
-  DEBUG(cerr << '\n');
+  DEBUG(dbgs() << "KnuthDiv:   normal:");
+  DEBUG(for (int i = m+n; i >=0; i--) dbgs() << " " << u[i]);
+  DEBUG(dbgs() << " by");
+  DEBUG(for (int i = n; i >0; i--) dbgs() << " " << v[i-1]);
+  DEBUG(dbgs() << '\n');
  #endif
  
    // D2. [Initialize j.]  Set j to m. This is the loop counter over the places.
    int j = m;
    do {
-    DEBUG(cerr << "KnuthDiv: quotient digit #" << j << '\n');
-    // D3. [Calculate q'.]. 
+    DEBUG(dbgs() << "KnuthDiv: quotient digit #" << j << '\n');
+    // D3. [Calculate q'.].
      //     Set qp = (u[j+n]*b + u[j+n-1]) / v[n-1]. (qp=qprime=q')
      //     Set rp = (u[j+n]*b + u[j+n-1]) % v[n-1]. (rp=rprime=r')
      // Now test if qp == b or qp*v[n-2] > b*rp + u[j+n-2]; if so, decrease
      // qp by 1, inrease rp by v[n-1], and repeat this test if rp < b. The test
      // on v[n-2] determines at high speed most of the cases in which the trial
-    // value qp is one too large, and it eliminates all cases where qp is two 
-    // too large. 
+    // value qp is one too large, and it eliminates all cases where qp is two
+    // too large.
      uint64_t dividend = ((uint64_t(u[j+n]) << 32) + u[j+n-1]);
-    DEBUG(cerr << "KnuthDiv: dividend == " << dividend << '\n');
+    DEBUG(dbgs() << "KnuthDiv: dividend == " << dividend << '\n');
      uint64_t qp = dividend / v[n-1];
      uint64_t rp = dividend % v[n-1];
      if (qp == b || qp*v[n-2] > b*rp + u[j+n-2]) {
@@ -1604,20 +1666,20 @@ static void KnuthDiv(unsigned *u, unsigned *v, unsigned *q, unsigned* r,
        if (rp < b && (qp == b || qp*v[n-2] > b*rp + u[j+n-2]))
          qp--;
      }
-    DEBUG(cerr << "KnuthDiv: qp == " << qp << ", rp == " << rp << '\n');
+    DEBUG(dbgs() << "KnuthDiv: qp == " << qp << ", rp == " << rp << '\n');
  
      // D4. [Multiply and subtract.] Replace (u[j+n]u[j+n-1]...u[j]) with
      // (u[j+n]u[j+n-1]..u[j]) - qp * (v[n-1]...v[1]v[0]). This computation
      // consists of a simple multiplication by a one-place number, combined with
-    // a subtraction. 
+    // a subtraction.
      bool isNeg = false;
      for (unsigned i = 0; i < n; ++i) {
        uint64_t u_tmp = uint64_t(u[j+i]) | (uint64_t(u[j+i+1]) << 32);
        uint64_t subtrahend = uint64_t(qp) * uint64_t(v[i]);
        bool borrow = subtrahend > u_tmp;
-      DEBUG(cerr << "KnuthDiv: u_tmp == " << u_tmp 
-                 << ", subtrahend == " << subtrahend
-                 << ", borrow = " << borrow << '\n');
+      DEBUG(dbgs() << "KnuthDiv: u_tmp == " << u_tmp
+                   << ", subtrahend == " << subtrahend
+                   << ", borrow = " << borrow << '\n');
  
        uint64_t result = u_tmp - subtrahend;
        unsigned k = j + i;
@@ -1629,14 +1691,14 @@ static void KnuthDiv(unsigned *u, unsigned *v, unsigned *q, unsigned* r,
          k++;
        }
        isNeg |= borrow;
-      DEBUG(cerr << "KnuthDiv: u[j+i] == " << u[j+i] << ",  u[j+i+1] == " << 
-                    u[j+i+1] << '\n'); 
+      DEBUG(dbgs() << "KnuthDiv: u[j+i] == " << u[j+i] << ",  u[j+i+1] == " <<
+                    u[j+i+1] << '\n');
      }
-    DEBUG(cerr << "KnuthDiv: after subtraction:");
-    DEBUG(for (int i = m+n; i >=0; i--) cerr << " " << u[i]);
-    DEBUG(cerr << '\n');
-    // The digits (u[j+n]...u[j]) should be kept positive; if the result of 
-    // this step is actually negative, (u[j+n]...u[j]) should be left as the 
+    DEBUG(dbgs() << "KnuthDiv: after subtraction:");
+    DEBUG(for (int i = m+n; i >=0; i--) dbgs() << " " << u[i]);
+    DEBUG(dbgs() << '\n');
+    // The digits (u[j+n]...u[j]) should be kept positive; if the result of
+    // this step is actually negative, (u[j+n]...u[j]) should be left as the
      // true value plus b**(n+1), namely as the b's complement of
      // the true value, and a "borrow" to the left should be remembered.
      //
@@ -1647,20 +1709,20 @@ static void KnuthDiv(unsigned *u, unsigned *v, unsigned *q, unsigned* r,
          carry = carry && u[i] == 0;
        }
      }
-    DEBUG(cerr << "KnuthDiv: after complement:");
-    DEBUG(for (int i = m+n; i >=0; i--) cerr << " " << u[i]);
-    DEBUG(cerr << '\n');
+    DEBUG(dbgs() << "KnuthDiv: after complement:");
+    DEBUG(for (int i = m+n; i >=0; i--) dbgs() << " " << u[i]);
+    DEBUG(dbgs() << '\n');
  
-    // D5. [Test remainder.] Set q[j] = qp. If the result of step D4 was 
+    // D5. [Test remainder.] Set q[j] = qp. If the result of step D4 was
      // negative, go to step D6; otherwise go on to step D7.
      q[j] = (unsigned)qp;
      if (isNeg) {
-      // D6. [Add back]. The probability that this step is necessary is very 
+      // D6. [Add back]. The probability that this step is necessary is very
        // small, on the order of only 2/b. Make sure that test data accounts for
-      // this possibility. Decrease q[j] by 1 
+      // this possibility. Decrease q[j] by 1
        q[j]--;
-      // and add (0v[n-1]...v[1]v[0]) to (u[j+n]u[j+n-1]...u[j+1]u[j]). 
-      // A carry will occur to the left of u[j+n], and it should be ignored 
+      // and add (0v[n-1]...v[1]v[0]) to (u[j+n]u[j+n-1]...u[j+1]u[j]).
+      // A carry will occur to the left of u[j+n], and it should be ignored
        // since it cancels with the borrow that occurred in D4.
        bool carry = false;
        for (unsigned i = 0; i < n; i++) {
@@ -1670,16 +1732,16 @@ static void KnuthDiv(unsigned *u, unsigned *v, unsigned *q, unsigned* r,
        }
        u[j+n] += carry;
      }
-    DEBUG(cerr << "KnuthDiv: after correction:");
-    DEBUG(for (int i = m+n; i >=0; i--) cerr <<" " << u[i]);
-    DEBUG(cerr << "\nKnuthDiv: digit result = " << q[j] << '\n');
+    DEBUG(dbgs() << "KnuthDiv: after correction:");
+    DEBUG(for (int i = m+n; i >=0; i--) dbgs() <<" " << u[i]);
+    DEBUG(dbgs() << "\nKnuthDiv: digit result = " << q[j] << '\n');
  
    // D7. [Loop on j.]  Decrease j by one. Now if j >= 0, go back to D3.
    } while (--j >= 0);
  
-  DEBUG(cerr << "KnuthDiv: quotient:");
-  DEBUG(for (int i = m; i >=0; i--) cerr <<" " << q[i]);
-  DEBUG(cerr << '\n');
+  DEBUG(dbgs() << "KnuthDiv: quotient:");
+  DEBUG(for (int i = m; i >=0; i--) dbgs() <<" " << q[i]);
+  DEBUG(dbgs() << '\n');
  
    // D8. [Unnormalize]. Now q[...] is the desired quotient, and the desired
    // remainder may be obtained by dividing u[...] by d. If r is non-null we
@@ -1690,22 +1752,22 @@ static void KnuthDiv(unsigned *u, unsigned *v, unsigned *q, unsigned* r,
      // shift right here. In order to mak
      if (shift) {
        unsigned carry = 0;
-      DEBUG(cerr << "KnuthDiv: remainder:");
+      DEBUG(dbgs() << "KnuthDiv: remainder:");
        for (int i = n-1; i >= 0; i--) {
          r[i] = (u[i] >> shift) | carry;
          carry = u[i] << (32 - shift);
-        DEBUG(cerr << " " << r[i]);
+        DEBUG(dbgs() << " " << r[i]);
        }
      } else {
        for (int i = n-1; i >= 0; i--) {
          r[i] = u[i];
-        DEBUG(cerr << " " << r[i]);
+        DEBUG(dbgs() << " " << r[i]);
        }
      }
-    DEBUG(cerr << '\n');
+    DEBUG(dbgs() << '\n');
    }
  #if 0
-  DEBUG(cerr << std::setbase(10) << '\n');
+  DEBUG(dbgs() << '\n');
  #endif
  }
  
@@ -1715,12 +1777,12 @@ void APInt::divide(const APInt LHS, unsigned lhsWords,
  {
    assert(lhsWords >= rhsWords && "Fractional result");
  
-  // First, compose the values into an array of 32-bit words instead of 
+  // First, compose the values into an array of 32-bit words instead of
    // 64-bit words. This is a necessity of both the "short division" algorithm
-  // and the the Knuth "classical algorithm" which requires there to be native 
-  // operations for +, -, and * on an m bit value with an m*2 bit result. We 
-  // can't use 64-bit operands here because we don't have native results of 
-  // 128-bits. Furthermore, casting the 64-bit values to 32-bit values won't 
+  // and the Knuth "classical algorithm" which requires there to be native
+  // operations for +, -, and * on an m bit value with an m*2 bit result. We
+  // can't use 64-bit operands here because we don't have native results of
+  // 128-bits. Furthermore, casting the 64-bit values to 32-bit values won't
    // work on large-endian machines.
    uint64_t mask = ~0ull >> (sizeof(unsigned)*CHAR_BIT);
    unsigned n = rhsWords * 2;
@@ -1769,9 +1831,9 @@ void APInt::divide(const APInt LHS, unsigned lhsWords,
    if (Remainder)
      memset(R, 0, n * sizeof(unsigned));
  
-  // Now, adjust m and n for the Knuth division. n is the number of words in 
+  // Now, adjust m and n for the Knuth division. n is the number of words in
    // the divisor. m is the number of words by which the dividend exceeds the
-  // divisor (i.e. m+n is the length of the dividend). These sizes must not 
+  // divisor (i.e. m+n is the length of the dividend). These sizes must not
    // contain any zero words or the Knuth algorithm fails.
    for (unsigned i = n; i > 0 && V[i-1] == 0; i--) {
      n--;
@@ -1826,12 +1888,12 @@ void APInt::divide(const APInt LHS, unsigned lhsWords,
        if (!Quotient->isSingleWord())
          Quotient->pVal = getClearedMemory(Quotient->getNumWords());
      } else
-      Quotient->clear();
+      Quotient->clearAllBits();
  
-    // The quotient is in Q. Reconstitute the quotient into Quotient's low 
+    // The quotient is in Q. Reconstitute the quotient into Quotient's low
      // order words.
      if (lhsWords == 1) {
-      uint64_t tmp = 
+      uint64_t tmp =
          uint64_t(Q[0]) | (uint64_t(Q[1]) << (APINT_BITS_PER_WORD / 2));
        if (Quotient->isSingleWord())
          Quotient->VAL = tmp;
@@ -1840,7 +1902,7 @@ void APInt::divide(const APInt LHS, unsigned lhsWords,
      } else {
        assert(!Quotient->isSingleWord() && "Quotient APInt not large enough");
        for (unsigned i = 0; i < lhsWords; ++i)
-        Quotient->pVal[i] = 
+        Quotient->pVal[i] =
            uint64_t(Q[i*2]) | (uint64_t(Q[i*2+1]) << (APINT_BITS_PER_WORD / 2));
      }
    }
@@ -1857,12 +1919,12 @@ void APInt::divide(const APInt LHS, unsigned lhsWords,
        if (!Remainder->isSingleWord())
          Remainder->pVal = getClearedMemory(Remainder->getNumWords());
      } else
-      Remainder->clear();
+      Remainder->clearAllBits();
  
      // The remainder is in R. Reconstitute the remainder into Remainder's low
      // order words.
      if (rhsWords == 1) {
-      uint64_t tmp = 
+      uint64_t tmp =
          uint64_t(R[0]) | (uint64_t(R[1]) << (APINT_BITS_PER_WORD / 2));
        if (Remainder->isSingleWord())
          Remainder->VAL = tmp;
@@ -1871,7 +1933,7 @@ void APInt::divide(const APInt LHS, unsigned lhsWords,
      } else {
        assert(!Remainder->isSingleWord() && "Remainder APInt not large enough");
        for (unsigned i = 0; i < rhsWords; ++i)
-        Remainder->pVal[i] = 
+        Remainder->pVal[i] =
            uint64_t(R[i*2]) | (uint64_t(R[i*2+1]) << (APINT_BITS_PER_WORD / 2));
      }
    }
@@ -1902,9 +1964,9 @@ APInt APInt::udiv(const APInt& RHS) const {
    unsigned lhsWords = !lhsBits ? 0 : (APInt::whichWord(lhsBits - 1) + 1);
  
    // Deal with some degenerate cases
-  if (!lhsWords) 
+  if (!lhsWords)
      // 0 / X ===> 0
-    return APInt(BitWidth, 0); 
+    return APInt(BitWidth, 0);
    else if (lhsWords < rhsWords || this->ult(RHS)) {
      // X / Y ===> 0, iff X < Y
      return APInt(BitWidth, 0);
@@ -1959,7 +2021,7 @@ APInt APInt::urem(const APInt& RHS) const {
    return Remainder;
  }
  
-void APInt::udivrem(const APInt &LHS, const APInt &RHS, 
+void APInt::udivrem(const APInt &LHS, const APInt &RHS,
                      APInt &Quotient, APInt &Remainder) {
    // Get some size facts about the dividend and divisor
    unsigned lhsBits  = LHS.getActiveBits();
@@ -1968,24 +2030,24 @@ void APInt::udivrem(const APInt &LHS, const APInt &RHS,
    unsigned rhsWords = !rhsBits ? 0 : (APInt::whichWord(rhsBits - 1) + 1);
  
    // Check the degenerate cases
-  if (lhsWords == 0) {              
+  if (lhsWords == 0) {
      Quotient = 0;                // 0 / Y ===> 0
      Remainder = 0;               // 0 % Y ===> 0
      return;
-  } 
-  
-  if (lhsWords < rhsWords || LHS.ult(RHS)) { 
-    Quotient = 0;               // X / Y ===> 0, iff X < Y
+  }
+
+  if (lhsWords < rhsWords || LHS.ult(RHS)) {
      Remainder = LHS;            // X % Y ===> X, iff X < Y
+    Quotient = 0;               // X / Y ===> 0, iff X < Y
      return;
-  } 
-  
+  }
+
    if (LHS == RHS) {
      Quotient  = 1;              // X / X ===> 1
      Remainder = 0;              // X % X ===> 0;
      return;
-  } 
-  
+  }
+
    if (lhsWords == 1 && rhsWords == 1) {
      // There is only one word to consider so use the native versions.
      uint64_t lhsValue = LHS.isSingleWord() ? LHS.VAL : LHS.pVal[0];
@@ -1999,19 +2061,94 @@ void APInt::udivrem(const APInt &LHS, const APInt &RHS,
    divide(LHS, lhsWords, RHS, rhsWords, &Quotient, &Remainder);
  }
  
-void APInt::fromString(unsigned numbits, const char *str, unsigned slen,
-                       uint8_t radix) {
+APInt APInt::sadd_ov(const APInt &RHS, bool &Overflow) const {
+  APInt Res = *this+RHS;
+  Overflow = isNonNegative() == RHS.isNonNegative() &&
+             Res.isNonNegative() != isNonNegative();
+  return Res;
+}
+
+APInt APInt::uadd_ov(const APInt &RHS, bool &Overflow) const {
+  APInt Res = *this+RHS;
+  Overflow = Res.ult(RHS);
+  return Res;
+}
+
+APInt APInt::ssub_ov(const APInt &RHS, bool &Overflow) const {
+  APInt Res = *this - RHS;
+  Overflow = isNonNegative() != RHS.isNonNegative() &&
+             Res.isNonNegative() != isNonNegative();
+  return Res;
+}
+
+APInt APInt::usub_ov(const APInt &RHS, bool &Overflow) const {
+  APInt Res = *this-RHS;
+  Overflow = Res.ugt(*this);
+  return Res;
+}
+
+APInt APInt::sdiv_ov(const APInt &RHS, bool &Overflow) const {
+  // MININT/-1  -->  overflow.
+  Overflow = isMinSignedValue() && RHS.isAllOnesValue();
+  return sdiv(RHS);
+}
+
+APInt APInt::smul_ov(const APInt &RHS, bool &Overflow) const {
+  APInt Res = *this * RHS;
+  
+  if (*this != 0 && RHS != 0)
+    Overflow = Res.sdiv(RHS) != *this || Res.sdiv(*this) != RHS;
+  else
+    Overflow = false;
+  return Res;
+}
+
+APInt APInt::umul_ov(const APInt &RHS, bool &Overflow) const {
+  APInt Res = *this * RHS;
+
+  if (*this != 0 && RHS != 0)
+    Overflow = Res.udiv(RHS) != *this || Res.udiv(*this) != RHS;
+  else
+    Overflow = false;
+  return Res;
+}
+
+APInt APInt::sshl_ov(unsigned ShAmt, bool &Overflow) const {
+  Overflow = ShAmt >= getBitWidth();
+  if (Overflow)
+    ShAmt = getBitWidth()-1;
+
+  if (isNonNegative()) // Don't allow sign change.
+    Overflow = ShAmt >= countLeadingZeros();
+  else
+    Overflow = ShAmt >= countLeadingOnes();
+  
+  return *this << ShAmt;
+}
+
+
+
+
+void APInt::fromString(unsigned numbits, StringRef str, uint8_t radix) {
    // Check our assumptions here
-  assert((radix == 10 || radix == 8 || radix == 16 || radix == 2) &&
-         "Radix should be 2, 8, 10, or 16!");
-  assert(str && "String is null?");
-  bool isNeg = str[0] == '-';
-  if (isNeg)
-    str++, slen--;
+  assert(!str.empty() && "Invalid string length");
+  assert((radix == 10 || radix == 8 || radix == 16 || radix == 2 || 
+          radix == 36) &&
+         "Radix should be 2, 8, 10, 16, or 36!");
+
+  StringRef::iterator p = str.begin();
+  size_t slen = str.size();
+  bool isNeg = *p == '-';
+  if (*p == '-' || *p == '+') {
+    p++;
+    slen--;
+    assert(slen && "String is only a sign, needs a value.");
+  }
    assert((slen <= numbits || radix != 2) && "Insufficient bit width");
    assert(((slen-1)*3 <= numbits || radix != 8) && "Insufficient bit width");
    assert(((slen-1)*4 <= numbits || radix != 16) && "Insufficient bit width");
-  assert((((slen-1)*64)/22 <= numbits || radix != 10) && "Insufficient bit width");
+  assert((((slen-1)*64)/22 <= numbits || radix != 10) &&
+         "Insufficient bit width");
  
    // Allocate memory
    if (!isSingleWord())
@@ -2026,30 +2163,9 @@ void APInt::fromString(unsigned numbits, const char *str, unsigned slen,
    APInt apradix(getBitWidth(), radix);
  
    // Enter digit traversal loop
-  for (unsigned i = 0; i < slen; i++) {
-    // Get a digit
-    unsigned digit = 0;
-    char cdigit = str[i];
-    if (radix == 16) {
-      if (!isxdigit(cdigit))
-        assert(0 && "Invalid hex digit in string");
-      if (isdigit(cdigit))
-        digit = cdigit - '0';
-      else if (cdigit >= 'a')
-        digit = cdigit - 'a' + 10;
-      else if (cdigit >= 'A')
-        digit = cdigit - 'A' + 10;
-      else
-        assert(0 && "huh? we shouldn't get here");
-    } else if (isdigit(cdigit)) {
-      digit = cdigit - '0';
-      assert((radix == 10 ||
-              (radix == 8 && digit != 8 && digit != 9) ||
-              (radix == 2 && (digit == 0 || digit == 1))) &&
-             "Invalid digit in string for given radix");
-    } else {
-      assert(0 && "Invalid character in digit string");
-    }
+  for (StringRef::iterator e = str.end(); p != e; ++p) {
+    unsigned digit = getDigit(*p, radix);
+    assert(digit < radix && "Invalid character in digit string");
  
      // Shift or multiply the value by the radix
      if (slen > 1) {
@@ -2069,39 +2185,71 @@ void APInt::fromString(unsigned numbits, const char *str, unsigned slen,
    // If its negative, put it in two's complement form
    if (isNeg) {
      (*this)--;
-    this->flip();
+    this->flipAllBits();
    }
  }
  
  void APInt::toString(SmallVectorImpl<char> &Str, unsigned Radix,
-                     bool Signed) const {
-  assert((Radix == 10 || Radix == 8 || Radix == 16 || Radix == 2) &&
-         "Radix should be 2, 8, 10, or 16!");
-  
+                     bool Signed, bool formatAsCLiteral) const {
+  assert((Radix == 10 || Radix == 8 || Radix == 16 || Radix == 2 || 
+          Radix == 36) &&
+         "Radix should be 2, 8, 10, 16, or 36!");
+
+  const char *Prefix = "";
+  if (formatAsCLiteral) {
+    switch (Radix) {
+      case 2:
+        // Binary literals are a non-standard extension added in gcc 4.3:
+        // http://gcc.gnu.org/onlinedocs/gcc-4.3.0/gcc/Binary-constants.html
+        Prefix = "0b";
+        break;
+      case 8:
+        Prefix = "0";
+        break;
+      case 10:
+        break; // No prefix
+      case 16:
+        Prefix = "0x";
+        break;
+      default:
+        llvm_unreachable("Invalid radix!");
+    }
+  }
+
    // First, check for a zero value and just short circuit the logic below.
    if (*this == 0) {
+    while (*Prefix) {
+      Str.push_back(*Prefix);
+      ++Prefix;
+    };
      Str.push_back('0');
      return;
    }
-  
-  static const char Digits[] = "0123456789ABCDEF";
-  
+
+  static const char Digits[] = "0123456789ABCDEFGHIJKLMNOPQRSTUVWXYZ";
+
    if (isSingleWord()) {
      char Buffer[65];
      char *BufPtr = Buffer+65;
-    
+
      uint64_t N;
-    if (Signed) {
+    if (!Signed) {
+      N = getZExtValue();
+    } else {
        int64_t I = getSExtValue();
-      if (I < 0) {
+      if (I >= 0) {
+        N = I;
+      } else {
          Str.push_back('-');
-        I = -I;
+        N = -(uint64_t)I;
        }
-      N = I;
-    } else {
-      N = getZExtValue();
      }
-    
+
+    while (*Prefix) {
+      Str.push_back(*Prefix);
+      ++Prefix;
+    };
+
      while (N) {
        *--BufPtr = Digits[N % Radix];
        N /= Radix;
@@ -2111,38 +2259,43 @@ void APInt::toString(SmallVectorImpl<char> &Str, unsigned Radix,
    }
  
    APInt Tmp(*this);
-  
+
    if (Signed && isNegative()) {
      // They want to print the signed version and it is a negative value
      // Flip the bits and add one to turn it into the equivalent positive
      // value and put a '-' in the result.
-    Tmp.flip();
+    Tmp.flipAllBits();
      Tmp++;
      Str.push_back('-');
    }
-  
+
+  while (*Prefix) {
+    Str.push_back(*Prefix);
+    ++Prefix;
+  };
+
    // We insert the digits backward, then reverse them to get the right order.
    unsigned StartDig = Str.size();
-  
-  // For the 2, 8 and 16 bit cases, we can just shift instead of divide 
-  // because the number of bits per digit (1, 3 and 4 respectively) divides 
+
+  // For the 2, 8 and 16 bit cases, we can just shift instead of divide
+  // because the number of bits per digit (1, 3 and 4 respectively) divides
    // equaly.  We just shift until the value is zero.
-  if (Radix != 10) {
+  if (Radix == 2 || Radix == 8 || Radix == 16) {
      // Just shift tmp right for each digit width until it becomes zero
      unsigned ShiftAmt = (Radix == 16 ? 4 : (Radix == 8 ? 3 : 1));
      unsigned MaskAmt = Radix - 1;
-    
+
      while (Tmp != 0) {
        unsigned Digit = unsigned(Tmp.getRawData()[0]) & MaskAmt;
        Str.push_back(Digits[Digit]);
        Tmp = Tmp.lshr(ShiftAmt);
      }
    } else {
-    APInt divisor(4, 10);
+    APInt divisor(Radix == 10? 4 : 8, Radix);
      while (Tmp != 0) {
        APInt APdigit(1, 0);
        APInt tmp2(Tmp.getBitWidth(), 0);
-      divide(Tmp, Tmp.getNumWords(), divisor, divisor.getNumWords(), &tmp2, 
+      divide(Tmp, Tmp.getNumWords(), divisor, divisor.getNumWords(), &tmp2,
               &APdigit);
        unsigned Digit = (unsigned)APdigit.getZExtValue();
        assert(Digit < Radix && "divide failed");
@@ -2150,7 +2303,7 @@ void APInt::toString(SmallVectorImpl<char> &Str, unsigned Radix,
        Tmp = tmp2;
      }
    }
-  
+
    // Reverse the digits before returning.
    std::reverse(Str.begin()+StartDig, Str.end());
  }
@@ -2160,8 +2313,8 @@ void APInt::toString(SmallVectorImpl<char> &Str, unsigned Radix,
  /// to the methods above.
  std::string APInt::toString(unsigned Radix = 10, bool Signed = true) const {
    SmallString<40> S;
-  toString(S, Radix, Signed);
-  return S.c_str();
+  toString(S, Radix, Signed, /* formatAsCLiteral = */false);
+  return S.str();
  }
  
  
@@ -2169,20 +2322,21 @@ void APInt::dump() const {
    SmallString<40> S, U;
    this->toStringUnsigned(U);
    this->toStringSigned(S);
-  fprintf(stderr, "APInt(%db, %su %ss)", BitWidth, U.c_str(), S.c_str());
+  dbgs() << "APInt(" << BitWidth << "b, "
+         << U.str() << "u " << S.str() << "s)";
  }
  
  void APInt::print(raw_ostream &OS, bool isSigned) const {
    SmallString<40> S;
-  this->toString(S, 10, isSigned);
-  OS << S.c_str();
+  this->toString(S, 10, isSigned, /* formatAsCLiteral = */false);
+  OS << S.str();
  }
  
  // This implements a variety of operations on a representation of
  // arbitrary precision, two's-complement, bignum integer values.
  
-/* Assumed by lowHalf, highHalf, partMSB and partLSB.  A fairly safe
-   and unrestricting assumption.  */
+// Assumed by lowHalf, highHalf, partMSB and partLSB.  A fairly safe
+// and unrestricting assumption.
  #define COMPILE_TIME_ASSERT(cond) extern int CTAssert[(cond) ? 1 : -1]
  COMPILE_TIME_ASSERT(integerPartWidth % 2 == 0);
  
@@ -2194,7 +2348,7 @@ namespace {
    static inline integerPart
    lowBitMask(unsigned int bits)
    {
-    assert (bits != 0 && bits <= integerPartWidth);
+    assert(bits != 0 && bits <= integerPartWidth);
  
      return ~(integerPart) 0 >> (integerPartWidth - bits);
    }
@@ -2271,10 +2425,10 @@ APInt::tcSet(integerPart *dst, integerPart part, unsigned int parts)
  {
    unsigned int i;
  
-  assert (parts > 0);
+  assert(parts > 0);
  
    dst[0] = part;
-  for(i = 1; i < parts; i++)
+  for (i = 1; i < parts; i++)
      dst[i] = 0;
  }
  
@@ -2284,7 +2438,7 @@ APInt::tcAssign(integerPart *dst, const integerPart *src, unsigned int parts)
  {
    unsigned int i;
  
-  for(i = 0; i < parts; i++)
+  for (i = 0; i < parts; i++)
      dst[i] = src[i];
  }
  
@@ -2294,7 +2448,7 @@ APInt::tcIsZero(const integerPart *src, unsigned int parts)
  {
    unsigned int i;
  
-  for(i = 0; i < parts; i++)
+  for (i = 0; i < parts; i++)
      if (src[i])
        return false;
  
@@ -2305,17 +2459,25 @@ APInt::tcIsZero(const integerPart *src, unsigned int parts)
  int
  APInt::tcExtractBit(const integerPart *parts, unsigned int bit)
  {
-  return(parts[bit / integerPartWidth]
-         & ((integerPart) 1 << bit % integerPartWidth)) != 0;
+  return (parts[bit / integerPartWidth] &
+          ((integerPart) 1 << bit % integerPartWidth)) != 0;
  }
  
-/* Set the given bit of a bignum.  */
+/* Set the given bit of a bignum. */
  void
  APInt::tcSetBit(integerPart *parts, unsigned int bit)
  {
    parts[bit / integerPartWidth] |= (integerPart) 1 << (bit % integerPartWidth);
  }
  
+/* Clears the given bit of a bignum. */
+void
+APInt::tcClearBit(integerPart *parts, unsigned int bit)
+{
+  parts[bit / integerPartWidth] &=
+    ~((integerPart) 1 << (bit % integerPartWidth));
+}
+
  /* Returns the bit number of the least significant set bit of a
     number.  If the input number has no bits set -1U is returned.  */
  unsigned int
@@ -2323,7 +2485,7 @@ APInt::tcLSB(const integerPart *parts, unsigned int n)
  {
    unsigned int i, lsb;
  
-  for(i = 0; i < n; i++) {
+  for (i = 0; i < n; i++) {
        if (parts[i] != 0) {
            lsb = partLSB(parts[i]);
  
@@ -2342,13 +2504,13 @@ APInt::tcMSB(const integerPart *parts, unsigned int n)
    unsigned int msb;
  
    do {
-      --n;
+    --n;
  
-      if (parts[n] != 0) {
-          msb = partMSB(parts[n]);
+    if (parts[n] != 0) {
+      msb = partMSB(parts[n]);
  
-          return msb + n * integerPartWidth;
-      }
+      return msb + n * integerPartWidth;
+    }
    } while (n);
  
    return -1U;
@@ -2365,7 +2527,7 @@ APInt::tcExtract(integerPart *dst, unsigned int dstCount,const integerPart *src,
    unsigned int firstSrcPart, dstParts, shift, n;
  
    dstParts = (srcBits + integerPartWidth - 1) / integerPartWidth;
-  assert (dstParts <= dstCount);
+  assert(dstParts <= dstCount);
  
    firstSrcPart = srcLSB / integerPartWidth;
    tcAssign (dst, src + firstSrcPart, dstParts);
@@ -2400,7 +2562,7 @@ APInt::tcAdd(integerPart *dst, const integerPart *rhs,
  
    assert(c <= 1);
  
-  for(i = 0; i < parts; i++) {
+  for (i = 0; i < parts; i++) {
      integerPart l;
  
      l = dst[i];
@@ -2425,7 +2587,7 @@ APInt::tcSubtract(integerPart *dst, const integerPart *rhs,
  
    assert(c <= 1);
  
-  for(i = 0; i < parts; i++) {
+  for (i = 0; i < parts; i++) {
      integerPart l;
  
      l = dst[i];
@@ -2475,7 +2637,7 @@ APInt::tcMultiplyPart(integerPart *dst, const integerPart *src,
    /* N loops; minimum of dstParts and srcParts.  */
    n = dstParts < srcParts ? dstParts: srcParts;
  
-  for(i = 0; i < n; i++) {
+  for (i = 0; i < n; i++) {
      integerPart low, mid, high, srcPart;
  
        /* [ LOW, HIGH ] = MULTIPLIER * SRC[i] + DST[i] + CARRY.
@@ -2540,7 +2702,7 @@ APInt::tcMultiplyPart(integerPart *dst, const integerPart *src,
         non-zero.  This is true if any remaining src parts are non-zero
         and the multiplier is non-zero.  */
      if (multiplier)
-      for(; i < srcParts; i++)
+      for (; i < srcParts; i++)
          if (src[i])
            return 1;
  
@@ -2565,7 +2727,7 @@ APInt::tcMultiply(integerPart *dst, const integerPart *lhs,
    overflow = 0;
    tcSet(dst, 0, parts);
  
-  for(i = 0; i < parts; i++)
+  for (i = 0; i < parts; i++)
      overflow |= tcMultiplyPart(&dst[i], lhs, rhs[i], 0, parts,
                                 parts - i, true);
  
@@ -2591,7 +2753,7 @@ APInt::tcFullMultiply(integerPart *dst, const integerPart *lhs,
  
      tcSet(dst, 0, rhsParts);
  
-    for(n = 0; n < lhsParts; n++)
+    for (n = 0; n < lhsParts; n++)
        tcMultiplyPart(&dst[n], rhs, lhs[n], 0, rhsParts, rhsParts + 1, true);
  
      n = lhsParts + rhsParts;
@@ -2635,7 +2797,7 @@ APInt::tcDivide(integerPart *lhs, const integerPart *rhs,
  
    /* Loop, subtracting SRHS if REMAINDER is greater and adding that to
       the total.  */
-  for(;;) {
+  for (;;) {
        int compare;
  
        compare = tcCompare(remainder, srhs, parts);
@@ -2703,7 +2865,7 @@ APInt::tcShiftRight(integerPart *dst, unsigned int parts, unsigned int count)
  
      /* Perform the shift.  This leaves the most significant COUNT bits
         of the result at zero.  */
-    for(i = 0; i < parts; i++) {
+    for (i = 0; i < parts; i++) {
        integerPart part;
  
        if (i + jump >= parts) {
@@ -2728,7 +2890,7 @@ APInt::tcAnd(integerPart *dst, const integerPart *rhs, unsigned int parts)
  {
    unsigned int i;
  
-  for(i = 0; i < parts; i++)
+  for (i = 0; i < parts; i++)
      dst[i] &= rhs[i];
  }
  
@@ -2738,7 +2900,7 @@ APInt::tcOr(integerPart *dst, const integerPart *rhs, unsigned int parts)
  {
    unsigned int i;
  
-  for(i = 0; i < parts; i++)
+  for (i = 0; i < parts; i++)
      dst[i] |= rhs[i];
  }
  
@@ -2748,7 +2910,7 @@ APInt::tcXor(integerPart *dst, const integerPart *rhs, unsigned int parts)
  {
    unsigned int i;
  
-  for(i = 0; i < parts; i++)
+  for (i = 0; i < parts; i++)
      dst[i] ^= rhs[i];
  }
  
@@ -2758,7 +2920,7 @@ APInt::tcComplement(integerPart *dst, unsigned int parts)
  {
    unsigned int i;
  
-  for(i = 0; i < parts; i++)
+  for (i = 0; i < parts; i++)
      dst[i] = ~dst[i];
  }
  
@@ -2787,7 +2949,7 @@ APInt::tcIncrement(integerPart *dst, unsigned int parts)
  {
    unsigned int i;
  
-  for(i = 0; i < parts; i++)
+  for (i = 0; i < parts; i++)
      if (++dst[i] != 0)
        break;