X-Git-Url: http://plrg.eecs.uci.edu/git/?p=oota-llvm.git;a=blobdiff_plain;f=include%2Fllvm%2FSupport%2FMathExtras.h;h=d853e8a21e4d0c59cf2be94dbf86ed081dbb9b00;hp=53aad36e929f588832145a9dca4801351dfa225a;hb=f2bc179203d0e17bfcfa28bd5b9c1ba1d04cd6fe;hpb=e5c2c47f2fbe37712e50765d405e17cc46694e12

diff --git a/include/llvm/Support/MathExtras.h b/include/llvm/Support/MathExtras.h
index 53aad36e929..d853e8a21e4 100644
--- a/include/llvm/Support/MathExtras.h
+++ b/include/llvm/Support/MathExtras.h
@@ -671,12 +671,30 @@ SaturatingAdd(T X, T Y) {
 template <typename T>
 typename std::enable_if<std::is_unsigned<T>::value, T>::type
 SaturatingMultiply(T X, T Y) {
-  // Hacker's Delight, p. 30
-  T Z = X * Y;
-  if (Y != 0 && Z / Y != X)
-    return std::numeric_limits<T>::max();
-  else
-    return Z;
+  // Hacker's Delight, p. 30 has a different algorithm, but we don't use that
+  // because it fails for uint16_t (where multiplication can have undefined
+  // behavior due to promotion to int), and requires a division in addition
+  // to the multiplication.
+
+  // Log2(Z) would be either Log2Z or Log2Z + 1.
+  // Special case: if X or Y is 0, Log2_64 gives -1, and Log2Z
+  // will necessarily be less than Log2Max as desired.
+  int Log2Z = Log2_64(X) + Log2_64(Y);
+  const T Max = std::numeric_limits<T>::max();
+  int Log2Max = Log2_64(Max);
+  if (Log2Z < Log2Max)
+    return X * Y;
+  if (Log2Z > Log2Max)
+    return Max;
+
+  // We're going to use the top bit, and maybe overflow one
+  // bit past it. Multiply all but the bottom bit then add
+  // that on at the end.
+  T Z = (X >> 1) * Y;
+  if (Z & ~(Max >> 1))
+    return Max;
+  Z <<= 1;
+  return (X & 1) ? SaturatingAdd(Z, Y) : Z;
 }
 
 extern const float huge_valf;