Make MemoryBuiltins aware of TargetLibraryInfo.

[oota-llvm.git] / lib / Transforms / Scalar / SimplifyLibCalls.cpp
diff --git a/lib/Transforms/Scalar/SimplifyLibCalls.cpp b/lib/Transforms/Scalar/SimplifyLibCalls.cpp

index 9f136d4e3077a2821469d5454b2ca7fa6af008a5..65311fe72dcf02deaa4c29cc9c48f706d587ffed 100644 (file)
--- a/lib/Transforms/Scalar/SimplifyLibCalls.cpp
+++ b/lib/Transforms/Scalar/SimplifyLibCalls.cpp
@@ -18,26 +18,31 @@
  #define DEBUG_TYPE "simplify-libcalls"
  #include "llvm/Transforms/Scalar.h"
  #include "llvm/Transforms/Utils/BuildLibCalls.h"
+#include "llvm/IRBuilder.h"
  #include "llvm/Intrinsics.h"
  #include "llvm/LLVMContext.h"
  #include "llvm/Module.h"
  #include "llvm/Pass.h"
-#include "llvm/Support/IRBuilder.h"
-#include "llvm/Analysis/ValueTracking.h"
-#include "llvm/Target/TargetData.h"
-#include "llvm/Target/TargetLibraryInfo.h"
+#include "llvm/ADT/STLExtras.h"
  #include "llvm/ADT/SmallPtrSet.h"
-#include "llvm/ADT/StringMap.h"
  #include "llvm/ADT/Statistic.h"
-#include "llvm/ADT/STLExtras.h"
+#include "llvm/ADT/StringMap.h"
+#include "llvm/Analysis/ValueTracking.h"
+#include "llvm/Support/CommandLine.h"
  #include "llvm/Support/Debug.h"
  #include "llvm/Support/raw_ostream.h"
+#include "llvm/Target/TargetData.h"
+#include "llvm/Target/TargetLibraryInfo.h"
  #include "llvm/Config/config.h"            // FIXME: Shouldn't depend on host!
  using namespace llvm;
  
  STATISTIC(NumSimplified, "Number of library calls simplified");
  STATISTIC(NumAnnotated, "Number of attributes added to library functions");
  
+// Hidden flag, off by default: opts in to double -> float libcall shrinking.
+static cl::opt<bool> UnsafeFPShrink("enable-double-float-shrink", cl::Hidden,
+    cl::init(false), cl::desc("Enable unsafe double to float "
+                              "shrinking for math lib calls"));
  //===----------------------------------------------------------------------===//
  // Optimizer Base Class
  //===----------------------------------------------------------------------===//
@@ -49,6 +54,7 @@ class LibCallOptimization {
  protected:
    Function *Caller;
    const TargetData *TD;
+  const TargetLibraryInfo *TLI;
    LLVMContext* Context;
  public:
    LibCallOptimization() { }
@@ -62,9 +68,11 @@ public:
    virtual Value *CallOptimizer(Function *Callee, CallInst *CI, IRBuilder<> &B)
      =0;
  
-  Value *OptimizeCall(CallInst *CI, const TargetData *TD, IRBuilder<> &B) {
+  Value *OptimizeCall(CallInst *CI, const TargetData *TD,
+                      const TargetLibraryInfo *TLI, IRBuilder<> &B) {
      Caller = CI->getParent()->getParent();
      this->TD = TD;
+    this->TLI = TLI;
      if (CI->getCalledFunction())
        Context = &CI->getCalledFunction()->getContext();
  
@@ -98,6 +106,15 @@ static bool IsOnlyUsedInZeroEqualityComparison(Value *V) {
    return true;
  }
  
+static bool CallHasFloatingPointArgument(const CallInst *CI) {
+  // Report whether any operand of the call instruction has an FP type.
+  CallInst::const_op_iterator OpI = CI->op_begin(), OpE = CI->op_end();
+  for (; OpI != OpE; ++OpI)
+    if ((*OpI)->getType()->isFloatingPointTy())
+      return true;
+  return false;
+}
+
  /// IsOnlyUsedInEqualityComparison - Return true if it is only used in equality
  /// comparisons with With.
  static bool IsOnlyUsedInEqualityComparison(Value *V, Value *With) {
@@ -122,7 +139,7 @@ namespace {
  struct StrCatOpt : public LibCallOptimization {
    virtual Value *CallOptimizer(Function *Callee, CallInst *CI, IRBuilder<> &B) {
      // Verify the "strcat" function prototype.
-    const FunctionType *FT = Callee->getFunctionType();
+    FunctionType *FT = Callee->getFunctionType();
      if (FT->getNumParams() != 2 ||
          FT->getReturnType() != B.getInt8PtrTy() ||
          FT->getParamType(0) != FT->getReturnType() ||
@@ -145,14 +162,15 @@ struct StrCatOpt : public LibCallOptimization {
      // These optimizations require TargetData.
      if (!TD) return 0;
  
-    EmitStrLenMemCpy(Src, Dst, Len, B);
-    return Dst;
+    return EmitStrLenMemCpy(Src, Dst, Len, B);
    }
  
-  void EmitStrLenMemCpy(Value *Src, Value *Dst, uint64_t Len, IRBuilder<> &B) {
+  Value *EmitStrLenMemCpy(Value *Src, Value *Dst, uint64_t Len, IRBuilder<> &B) {
      // We need to find the end of the destination string.  That's where the
      // memory is to be moved to. We just generate a call to strlen.
-    Value *DstLen = EmitStrLen(Dst, B, TD);
+    Value *DstLen = EmitStrLen(Dst, B, TD, TLI);
+    if (!DstLen)
+      return 0;
  
      // Now that we have the destination's length, we must index into the
      // destination's pointer to get the actual memcpy destination (end of
@@ -163,6 +181,7 @@ struct StrCatOpt : public LibCallOptimization {
      // concatenation for us.  Make a memcpy to copy the nul byte with align = 1.
      B.CreateMemCpy(CpyDst, Src,
                     ConstantInt::get(TD->getIntPtrType(*Context), Len + 1), 1);
+    return Dst;
    }
  };
  
@@ -172,7 +191,7 @@ struct StrCatOpt : public LibCallOptimization {
  struct StrNCatOpt : public StrCatOpt {
    virtual Value *CallOptimizer(Function *Callee, CallInst *CI, IRBuilder<> &B) {
      // Verify the "strncat" function prototype.
-    const FunctionType *FT = Callee->getFunctionType();
+    FunctionType *FT = Callee->getFunctionType();
      if (FT->getNumParams() != 3 ||
          FT->getReturnType() != B.getInt8PtrTy() ||
          FT->getParamType(0) != FT->getReturnType() ||
@@ -209,8 +228,7 @@ struct StrNCatOpt : public StrCatOpt {
  
      // strncat(x, s, c) -> strcat(x, s)
      // s is constant so the strcat can be optimized further
-    EmitStrLenMemCpy(Src, Dst, SrcLen, B);
-    return Dst;
+    return EmitStrLenMemCpy(Src, Dst, SrcLen, B);
    }
  };
  
@@ -220,7 +238,7 @@ struct StrNCatOpt : public StrCatOpt {
  struct StrChrOpt : public LibCallOptimization {
    virtual Value *CallOptimizer(Function *Callee, CallInst *CI, IRBuilder<> &B) {
      // Verify the "strchr" function prototype.
-    const FunctionType *FT = Callee->getFunctionType();
+    FunctionType *FT = Callee->getFunctionType();
      if (FT->getNumParams() != 2 ||
          FT->getReturnType() != B.getInt8PtrTy() ||
          FT->getParamType(0) != FT->getReturnType() ||
@@ -242,21 +260,20 @@ struct StrChrOpt : public LibCallOptimization {
  
        return EmitMemChr(SrcStr, CI->getArgOperand(1), // include nul.
                          ConstantInt::get(TD->getIntPtrType(*Context), Len),
-                        B, TD);
+                        B, TD, TLI);
      }
  
      // Otherwise, the character is a constant, see if the first argument is
      // a string literal.  If so, we can constant fold.
-    std::string Str;
-    if (!GetConstantStringInfo(SrcStr, Str))
+    StringRef Str;
+    if (!getConstantStringInfo(SrcStr, Str))
        return 0;
  
-    // strchr can find the nul character.
-    Str += '\0';
-
-    // Compute the offset.
-    size_t I = Str.find(CharC->getSExtValue());
-    if (I == std::string::npos) // Didn't find the char.  strchr returns null.
+    // Compute the offset, make sure to handle the case when we're searching for
+    // zero (a weird way to spell strlen).
+    size_t I = CharC->getSExtValue() == 0 ?
+        Str.size() : Str.find(CharC->getSExtValue());
+    if (I == StringRef::npos) // Didn't find the char.  strchr returns null.
        return Constant::getNullValue(CI->getType());
  
      // strchr(s+n,c)  -> gep(s+n+i,c)
@@ -270,7 +287,7 @@ struct StrChrOpt : public LibCallOptimization {
  struct StrRChrOpt : public LibCallOptimization {
    virtual Value *CallOptimizer(Function *Callee, CallInst *CI, IRBuilder<> &B) {
      // Verify the "strrchr" function prototype.
-    const FunctionType *FT = Callee->getFunctionType();
+    FunctionType *FT = Callee->getFunctionType();
      if (FT->getNumParams() != 2 ||
          FT->getReturnType() != B.getInt8PtrTy() ||
          FT->getParamType(0) != FT->getReturnType() ||
@@ -284,20 +301,18 @@ struct StrRChrOpt : public LibCallOptimization {
      if (!CharC)
        return 0;
  
-    std::string Str;
-    if (!GetConstantStringInfo(SrcStr, Str)) {
+    StringRef Str;
+    if (!getConstantStringInfo(SrcStr, Str)) {
        // strrchr(s, 0) -> strchr(s, 0)
        if (TD && CharC->isZero())
-        return EmitStrChr(SrcStr, '\0', B, TD);
+        return EmitStrChr(SrcStr, '\0', B, TD, TLI);
        return 0;
      }
  
-    // strrchr can find the nul character.
-    Str += '\0';
-
      // Compute the offset.
-    size_t I = Str.rfind(CharC->getSExtValue());
-    if (I == std::string::npos) // Didn't find the char. Return null.
+    size_t I = CharC->getSExtValue() == 0 ?
+        Str.size() : Str.rfind(CharC->getSExtValue());
+    if (I == StringRef::npos) // Didn't find the char. Return null.
        return Constant::getNullValue(CI->getType());
  
      // strrchr(s+n,c) -> gep(s+n+i,c)
@@ -311,7 +326,7 @@ struct StrRChrOpt : public LibCallOptimization {
  struct StrCmpOpt : public LibCallOptimization {
    virtual Value *CallOptimizer(Function *Callee, CallInst *CI, IRBuilder<> &B) {
      // Verify the "strcmp" function prototype.
-    const FunctionType *FT = Callee->getFunctionType();
+    FunctionType *FT = Callee->getFunctionType();
      if (FT->getNumParams() != 2 ||
          !FT->getReturnType()->isIntegerTy(32) ||
          FT->getParamType(0) != FT->getParamType(1) ||
@@ -322,21 +337,21 @@ struct StrCmpOpt : public LibCallOptimization {
      if (Str1P == Str2P)      // strcmp(x,x)  -> 0
        return ConstantInt::get(CI->getType(), 0);
  
-    std::string Str1, Str2;
-    bool HasStr1 = GetConstantStringInfo(Str1P, Str1);
-    bool HasStr2 = GetConstantStringInfo(Str2P, Str2);
+    StringRef Str1, Str2;
+    bool HasStr1 = getConstantStringInfo(Str1P, Str1);
+    bool HasStr2 = getConstantStringInfo(Str2P, Str2);
  
-    if (HasStr1 && Str1.empty()) // strcmp("", x) -> *x
-      return B.CreateZExt(B.CreateLoad(Str2P, "strcmpload"), CI->getType());
+    // strcmp(x, y)  -> cnst  (if both x and y are constant strings)
+    if (HasStr1 && HasStr2)
+      return ConstantInt::get(CI->getType(), Str1.compare(Str2));
+
+    if (HasStr1 && Str1.empty()) // strcmp("", x) -> -*x
+      return B.CreateNeg(B.CreateZExt(B.CreateLoad(Str2P, "strcmpload"),
+                                      CI->getType()));
  
      if (HasStr2 && Str2.empty()) // strcmp(x,"") -> *x
        return B.CreateZExt(B.CreateLoad(Str1P, "strcmpload"), CI->getType());
  
-    // strcmp(x, y)  -> cnst  (if both x and y are constant strings)
-    if (HasStr1 && HasStr2)
-      return ConstantInt::get(CI->getType(),
-                                     strcmp(Str1.c_str(),Str2.c_str()));
-
      // strcmp(P, "x") -> memcmp(P, "x", 2)
      uint64_t Len1 = GetStringLength(Str1P);
      uint64_t Len2 = GetStringLength(Str2P);
@@ -346,7 +361,7 @@ struct StrCmpOpt : public LibCallOptimization {
  
        return EmitMemCmp(Str1P, Str2P,
                          ConstantInt::get(TD->getIntPtrType(*Context),
-                        std::min(Len1, Len2)), B, TD);
+                        std::min(Len1, Len2)), B, TD, TLI);
      }
  
      return 0;
@@ -359,7 +374,7 @@ struct StrCmpOpt : public LibCallOptimization {
  struct StrNCmpOpt : public LibCallOptimization {
    virtual Value *CallOptimizer(Function *Callee, CallInst *CI, IRBuilder<> &B) {
      // Verify the "strncmp" function prototype.
-    const FunctionType *FT = Callee->getFunctionType();
+    FunctionType *FT = Callee->getFunctionType();
      if (FT->getNumParams() != 3 ||
          !FT->getReturnType()->isIntegerTy(32) ||
          FT->getParamType(0) != FT->getParamType(1) ||
@@ -382,22 +397,26 @@ struct StrNCmpOpt : public LibCallOptimization {
        return ConstantInt::get(CI->getType(), 0);
  
      if (TD && Length == 1) // strncmp(x,y,1) -> memcmp(x,y,1)
-      return EmitMemCmp(Str1P, Str2P, CI->getArgOperand(2), B, TD);
+      return EmitMemCmp(Str1P, Str2P, CI->getArgOperand(2), B, TD, TLI);
  
-    std::string Str1, Str2;
-    bool HasStr1 = GetConstantStringInfo(Str1P, Str1);
-    bool HasStr2 = GetConstantStringInfo(Str2P, Str2);
+    StringRef Str1, Str2;
+    bool HasStr1 = getConstantStringInfo(Str1P, Str1);
+    bool HasStr2 = getConstantStringInfo(Str2P, Str2);
  
-    if (HasStr1 && Str1.empty())  // strncmp("", x, n) -> *x
-      return B.CreateZExt(B.CreateLoad(Str2P, "strcmpload"), CI->getType());
+    // strncmp(x, y, n)  -> cnst  (if both x and y are constant strings)
+    if (HasStr1 && HasStr2) {
+      StringRef SubStr1 = Str1.substr(0, Length);
+      StringRef SubStr2 = Str2.substr(0, Length);
+      return ConstantInt::get(CI->getType(), SubStr1.compare(SubStr2));
+    }
+
+    if (HasStr1 && Str1.empty())  // strncmp("", x, n) -> -*x
+      return B.CreateNeg(B.CreateZExt(B.CreateLoad(Str2P, "strcmpload"),
+                                      CI->getType()));
  
      if (HasStr2 && Str2.empty())  // strncmp(x, "", n) -> *x
        return B.CreateZExt(B.CreateLoad(Str1P, "strcmpload"), CI->getType());
  
-    // strncmp(x, y)  -> cnst  (if both x and y are constant strings)
-    if (HasStr1 && HasStr2)
-      return ConstantInt::get(CI->getType(),
-                              strncmp(Str1.c_str(), Str2.c_str(), Length));
      return 0;
    }
  };
@@ -414,7 +433,7 @@ struct StrCpyOpt : public LibCallOptimization {
    virtual Value *CallOptimizer(Function *Callee, CallInst *CI, IRBuilder<> &B) {
      // Verify the "strcpy" function prototype.
      unsigned NumParams = OptChkCall ? 3 : 2;
-    const FunctionType *FT = Callee->getFunctionType();
+    FunctionType *FT = Callee->getFunctionType();
      if (FT->getNumParams() != NumParams ||
          FT->getReturnType() != FT->getParamType(0) ||
          FT->getParamType(0) != FT->getParamType(1) ||
@@ -434,23 +453,67 @@ struct StrCpyOpt : public LibCallOptimization {
  
      // We have enough information to now generate the memcpy call to do the
      // concatenation for us.  Make a memcpy to copy the nul byte with align = 1.
-    if (OptChkCall)
-      EmitMemCpyChk(Dst, Src,
-                    ConstantInt::get(TD->getIntPtrType(*Context), Len),
-                    CI->getArgOperand(2), B, TD);
-    else
+    if (!OptChkCall ||
+        !EmitMemCpyChk(Dst, Src,
+                       ConstantInt::get(TD->getIntPtrType(*Context), Len),
+                       CI->getArgOperand(2), B, TD, TLI))
        B.CreateMemCpy(Dst, Src,
                       ConstantInt::get(TD->getIntPtrType(*Context), Len), 1);
      return Dst;
    }
  };
  
+//===---------------------------------------===//
+// 'stpcpy' Optimizations
+
+struct StpCpyOpt: public LibCallOptimization {
+  bool OptChkCall;  // Set when the call being optimized is __stpcpy_chk.
+
+  StpCpyOpt(bool c) : OptChkCall(c) {}
+
+  virtual Value *CallOptimizer(Function *Callee, CallInst *CI, IRBuilder<> &B) {
+    // Prototype: i8* (i8*, i8*), plus a third parameter for __stpcpy_chk.
+    FunctionType *FT = Callee->getFunctionType();
+    if (FT->getNumParams() != (OptChkCall ? 3u : 2u))
+      return 0;
+    if (FT->getParamType(0) != B.getInt8PtrTy() ||
+        FT->getParamType(1) != FT->getParamType(0) ||
+        FT->getReturnType() != FT->getParamType(0))
+      return 0;
+
+    if (!TD)  // These optimizations require TargetData.
+      return 0;
+
+    Value *Src = CI->getArgOperand(1), *Dst = CI->getArgOperand(0);
+    if (Dst == Src) {  // stpcpy(x,x)  -> x+strlen(x)
+      if (Value *StrLen = EmitStrLen(Src, B, TD, TLI))
+        return B.CreateInBoundsGEP(Dst, StrLen);
+      return 0;
+    }
+
+    // Try to compute the source string's length; give up if that yields 0.
+    uint64_t Len = GetStringLength(Src);
+    if (Len == 0)
+      return 0;
+
+    // The call's result is Dst advanced by Len - 1; the copy moves Len bytes.
+    Value *LenV = ConstantInt::get(TD->getIntPtrType(*Context), Len);
+    Value *EndOff = ConstantInt::get(TD->getIntPtrType(*Context), Len - 1);
+    Value *DstEnd = B.CreateGEP(Dst, EndOff);
+    // Copy with align = 1; plain memcpy unless EmitMemCpyChk yields a value.
+    if (!OptChkCall ||
+        !EmitMemCpyChk(Dst, Src, LenV, CI->getArgOperand(2), B, TD, TLI))
+      B.CreateMemCpy(Dst, Src, LenV, 1);
+    return DstEnd;
+  }
+};
+
  //===---------------------------------------===//
  // 'strncpy' Optimizations
  
  struct StrNCpyOpt : public LibCallOptimization {
    virtual Value *CallOptimizer(Function *Callee, CallInst *CI, IRBuilder<> &B) {
-    const FunctionType *FT = Callee->getFunctionType();
+    FunctionType *FT = Callee->getFunctionType();
      if (FT->getNumParams() != 3 || FT->getReturnType() != FT->getParamType(0) ||
          FT->getParamType(0) != FT->getParamType(1) ||
          FT->getParamType(0) != B.getInt8PtrTy() ||
@@ -499,7 +562,7 @@ struct StrNCpyOpt : public LibCallOptimization {
  
  struct StrLenOpt : public LibCallOptimization {
    virtual Value *CallOptimizer(Function *Callee, CallInst *CI, IRBuilder<> &B) {
-    const FunctionType *FT = Callee->getFunctionType();
+    FunctionType *FT = Callee->getFunctionType();
      if (FT->getNumParams() != 1 ||
          FT->getParamType(0) != B.getInt8PtrTy() ||
          !FT->getReturnType()->isIntegerTy())
@@ -525,16 +588,16 @@ struct StrLenOpt : public LibCallOptimization {
  
  struct StrPBrkOpt : public LibCallOptimization {
    virtual Value *CallOptimizer(Function *Callee, CallInst *CI, IRBuilder<> &B) {
-    const FunctionType *FT = Callee->getFunctionType();
+    FunctionType *FT = Callee->getFunctionType();
      if (FT->getNumParams() != 2 ||
          FT->getParamType(0) != B.getInt8PtrTy() ||
          FT->getParamType(1) != FT->getParamType(0) ||
          FT->getReturnType() != FT->getParamType(0))
        return 0;
  
-    std::string S1, S2;
-    bool HasS1 = GetConstantStringInfo(CI->getArgOperand(0), S1);
-    bool HasS2 = GetConstantStringInfo(CI->getArgOperand(1), S2);
+    StringRef S1, S2;
+    bool HasS1 = getConstantStringInfo(CI->getArgOperand(0), S1);
+    bool HasS2 = getConstantStringInfo(CI->getArgOperand(1), S2);
  
      // strpbrk(s, "") -> NULL
      // strpbrk("", s) -> NULL
@@ -552,7 +615,7 @@ struct StrPBrkOpt : public LibCallOptimization {
  
      // strpbrk(s, "a") -> strchr(s, 'a')
      if (TD && HasS2 && S2.size() == 1)
-      return EmitStrChr(CI->getArgOperand(0), S2[0], B, TD);
+      return EmitStrChr(CI->getArgOperand(0), S2[0], B, TD, TLI);
  
      return 0;
    }
@@ -563,7 +626,7 @@ struct StrPBrkOpt : public LibCallOptimization {
  
  struct StrToOpt : public LibCallOptimization {
    virtual Value *CallOptimizer(Function *Callee, CallInst *CI, IRBuilder<> &B) {
-    const FunctionType *FT = Callee->getFunctionType();
+    FunctionType *FT = Callee->getFunctionType();
      if ((FT->getNumParams() != 2 && FT->getNumParams() != 3) ||
          !FT->getParamType(0)->isPointerTy() ||
          !FT->getParamType(1)->isPointerTy())
@@ -585,16 +648,16 @@ struct StrToOpt : public LibCallOptimization {
  
  struct StrSpnOpt : public LibCallOptimization {
    virtual Value *CallOptimizer(Function *Callee, CallInst *CI, IRBuilder<> &B) {
-    const FunctionType *FT = Callee->getFunctionType();
+    FunctionType *FT = Callee->getFunctionType();
      if (FT->getNumParams() != 2 ||
          FT->getParamType(0) != B.getInt8PtrTy() ||
          FT->getParamType(1) != FT->getParamType(0) ||
          !FT->getReturnType()->isIntegerTy())
        return 0;
  
-    std::string S1, S2;
-    bool HasS1 = GetConstantStringInfo(CI->getArgOperand(0), S1);
-    bool HasS2 = GetConstantStringInfo(CI->getArgOperand(1), S2);
+    StringRef S1, S2;
+    bool HasS1 = getConstantStringInfo(CI->getArgOperand(0), S1);
+    bool HasS2 = getConstantStringInfo(CI->getArgOperand(1), S2);
  
      // strspn(s, "") -> 0
      // strspn("", s) -> 0
@@ -602,8 +665,11 @@ struct StrSpnOpt : public LibCallOptimization {
        return Constant::getNullValue(CI->getType());
  
      // Constant folding.
-    if (HasS1 && HasS2)
-      return ConstantInt::get(CI->getType(), strspn(S1.c_str(), S2.c_str()));
+    if (HasS1 && HasS2) {
+      size_t Pos = S1.find_first_not_of(S2);
+      if (Pos == StringRef::npos) Pos = S1.size();
+      return ConstantInt::get(CI->getType(), Pos);
+    }
  
      return 0;
    }
@@ -614,28 +680,31 @@ struct StrSpnOpt : public LibCallOptimization {
  
  struct StrCSpnOpt : public LibCallOptimization {
    virtual Value *CallOptimizer(Function *Callee, CallInst *CI, IRBuilder<> &B) {
-    const FunctionType *FT = Callee->getFunctionType();
+    FunctionType *FT = Callee->getFunctionType();
      if (FT->getNumParams() != 2 ||
          FT->getParamType(0) != B.getInt8PtrTy() ||
          FT->getParamType(1) != FT->getParamType(0) ||
          !FT->getReturnType()->isIntegerTy())
        return 0;
  
-    std::string S1, S2;
-    bool HasS1 = GetConstantStringInfo(CI->getArgOperand(0), S1);
-    bool HasS2 = GetConstantStringInfo(CI->getArgOperand(1), S2);
+    StringRef S1, S2;
+    bool HasS1 = getConstantStringInfo(CI->getArgOperand(0), S1);
+    bool HasS2 = getConstantStringInfo(CI->getArgOperand(1), S2);
  
      // strcspn("", s) -> 0
      if (HasS1 && S1.empty())
        return Constant::getNullValue(CI->getType());
  
      // Constant folding.
-    if (HasS1 && HasS2)
-      return ConstantInt::get(CI->getType(), strcspn(S1.c_str(), S2.c_str()));
+    if (HasS1 && HasS2) {
+      size_t Pos = S1.find_first_of(S2);
+      if (Pos == StringRef::npos) Pos = S1.size();
+      return ConstantInt::get(CI->getType(), Pos);
+    }
  
      // strcspn(s, "") -> strlen(s)
      if (TD && HasS2 && S2.empty())
-      return EmitStrLen(CI->getArgOperand(0), B, TD);
+      return EmitStrLen(CI->getArgOperand(0), B, TD, TLI);
  
      return 0;
    }
@@ -646,7 +715,7 @@ struct StrCSpnOpt : public LibCallOptimization {
  
  struct StrStrOpt : public LibCallOptimization {
    virtual Value *CallOptimizer(Function *Callee, CallInst *CI, IRBuilder<> &B) {
-    const FunctionType *FT = Callee->getFunctionType();
+    FunctionType *FT = Callee->getFunctionType();
      if (FT->getNumParams() != 2 ||
          !FT->getParamType(0)->isPointerTy() ||
          !FT->getParamType(1)->isPointerTy() ||
@@ -659,9 +728,13 @@ struct StrStrOpt : public LibCallOptimization {
  
      // fold strstr(a, b) == a -> strncmp(a, b, strlen(b)) == 0
      if (TD && IsOnlyUsedInEqualityComparison(CI, CI->getArgOperand(0))) {
-      Value *StrLen = EmitStrLen(CI->getArgOperand(1), B, TD);
+      Value *StrLen = EmitStrLen(CI->getArgOperand(1), B, TD, TLI);
+      if (!StrLen)
+        return 0;
        Value *StrNCmp = EmitStrNCmp(CI->getArgOperand(0), CI->getArgOperand(1),
-                                   StrLen, B, TD);
+                                   StrLen, B, TD, TLI);
+      if (!StrNCmp)
+        return 0;
        for (Value::use_iterator UI = CI->use_begin(), UE = CI->use_end();
             UI != UE; ) {
          ICmpInst *Old = cast<ICmpInst>(*UI++);
@@ -675,9 +748,9 @@ struct StrStrOpt : public LibCallOptimization {
      }
  
      // See if either input string is a constant string.
-    std::string SearchStr, ToFindStr;
-    bool HasStr1 = GetConstantStringInfo(CI->getArgOperand(0), SearchStr);
-    bool HasStr2 = GetConstantStringInfo(CI->getArgOperand(1), ToFindStr);
+    StringRef SearchStr, ToFindStr;
+    bool HasStr1 = getConstantStringInfo(CI->getArgOperand(0), SearchStr);
+    bool HasStr2 = getConstantStringInfo(CI->getArgOperand(1), ToFindStr);
  
      // fold strstr(x, "") -> x.
      if (HasStr2 && ToFindStr.empty())
@@ -687,7 +760,7 @@ struct StrStrOpt : public LibCallOptimization {
      if (HasStr1 && HasStr2) {
        std::string::size_type Offset = SearchStr.find(ToFindStr);
  
-      if (Offset == std::string::npos) // strstr("foo", "bar") -> null
+      if (Offset == StringRef::npos) // strstr("foo", "bar") -> null
          return Constant::getNullValue(CI->getType());
  
        // strstr("abcd", "bc") -> gep((char*)"abcd", 1)
@@ -697,9 +770,10 @@ struct StrStrOpt : public LibCallOptimization {
      }
  
      // fold strstr(x, "y") -> strchr(x, 'y').
-    if (HasStr2 && ToFindStr.size() == 1)
-      return B.CreateBitCast(EmitStrChr(CI->getArgOperand(0),
-                             ToFindStr[0], B, TD), CI->getType());
+    if (HasStr2 && ToFindStr.size() == 1) {
+      Value *StrChr= EmitStrChr(CI->getArgOperand(0), ToFindStr[0], B, TD, TLI);
+      return StrChr ? B.CreateBitCast(StrChr, CI->getType()) : 0;
+    }
      return 0;
    }
  };
@@ -710,7 +784,7 @@ struct StrStrOpt : public LibCallOptimization {
  
  struct MemCmpOpt : public LibCallOptimization {
    virtual Value *CallOptimizer(Function *Callee, CallInst *CI, IRBuilder<> &B) {
-    const FunctionType *FT = Callee->getFunctionType();
+    FunctionType *FT = Callee->getFunctionType();
      if (FT->getNumParams() != 3 || !FT->getParamType(0)->isPointerTy() ||
          !FT->getParamType(1)->isPointerTy() ||
          !FT->getReturnType()->isIntegerTy(32))
@@ -739,11 +813,11 @@ struct MemCmpOpt : public LibCallOptimization {
      }
  
      // Constant folding: memcmp(x, y, l) -> cnst (all arguments are constant)
-    std::string LHSStr, RHSStr;
-    if (GetConstantStringInfo(LHS, LHSStr) &&
-        GetConstantStringInfo(RHS, RHSStr)) {
+    StringRef LHSStr, RHSStr;
+    if (getConstantStringInfo(LHS, LHSStr) &&
+        getConstantStringInfo(RHS, RHSStr)) {
        // Make sure we're not reading out-of-bounds memory.
-      if (Len > LHSStr.length() || Len > RHSStr.length())
+      if (Len > LHSStr.size() || Len > RHSStr.size())
          return 0;
        uint64_t Ret = memcmp(LHSStr.data(), RHSStr.data(), Len);
        return ConstantInt::get(CI->getType(), Ret);
@@ -761,7 +835,7 @@ struct MemCpyOpt : public LibCallOptimization {
      // These optimizations require TargetData.
      if (!TD) return 0;
  
-    const FunctionType *FT = Callee->getFunctionType();
+    FunctionType *FT = Callee->getFunctionType();
      if (FT->getNumParams() != 3 || FT->getReturnType() != FT->getParamType(0) ||
          !FT->getParamType(0)->isPointerTy() ||
          !FT->getParamType(1)->isPointerTy() ||
@@ -783,7 +857,7 @@ struct MemMoveOpt : public LibCallOptimization {
      // These optimizations require TargetData.
      if (!TD) return 0;
  
-    const FunctionType *FT = Callee->getFunctionType();
+    FunctionType *FT = Callee->getFunctionType();
      if (FT->getNumParams() != 3 || FT->getReturnType() != FT->getParamType(0) ||
          !FT->getParamType(0)->isPointerTy() ||
          !FT->getParamType(1)->isPointerTy() ||
@@ -805,7 +879,7 @@ struct MemSetOpt : public LibCallOptimization {
      // These optimizations require TargetData.
      if (!TD) return 0;
  
-    const FunctionType *FT = Callee->getFunctionType();
+    FunctionType *FT = Callee->getFunctionType();
      if (FT->getNumParams() != 3 || FT->getReturnType() != FT->getParamType(0) ||
          !FT->getParamType(0)->isPointerTy() ||
          !FT->getParamType(1)->isIntegerTy() ||
@@ -823,18 +897,87 @@ struct MemSetOpt : public LibCallOptimization {
  // Math Library Optimizations
  //===----------------------------------------------------------------------===//
  
+//===---------------------------------------===//
+// Double -> Float Shrinking Optimizations for Unary Functions like 'floor'
+
+struct UnaryDoubleFPOpt : public LibCallOptimization {
+  bool CheckRetType;  // If set, all users of the call must be fptrunc to float.
+  UnaryDoubleFPOpt(bool CheckReturnType): CheckRetType(CheckReturnType) {}
+  virtual Value *CallOptimizer(Function *Callee, CallInst *CI, IRBuilder<> &B) {
+    // Only a 'double f(double)' prototype qualifies.
+    FunctionType *FT = Callee->getFunctionType();
+    if (FT->getNumParams() != 1 || !FT->getParamType(0)->isDoubleTy() ||
+        !FT->getReturnType()->isDoubleTy())
+      return 0;
+
+    // For functions like 'sin', require that each use is an fptrunc to float.
+    if (CheckRetType)
+      for (Value::use_iterator UI = CI->use_begin(), UE = CI->use_end();
+           UI != UE; ++UI) {
+        FPTruncInst *Trunc = dyn_cast<FPTruncInst>(*UI);
+        if (!Trunc || !Trunc->getType()->isFloatTy())
+          return 0;
+      }
+
+    // The argument must be an fpext from float: 'floor((double)floatval)'.
+    FPExtInst *Ext = dyn_cast<FPExtInst>(CI->getArgOperand(0));
+    if (!Ext || !Ext->getOperand(0)->getType()->isFloatTy())
+      return 0;
+
+    // floor((double)floatval) -> (double)floorf(floatval)
+    Value *Narrow = EmitUnaryFloatFnCall(Ext->getOperand(0), Callee->getName(),
+                                         B, Callee->getAttributes());
+    return B.CreateFPExt(Narrow, B.getDoubleTy());
+  }
+};
+
+//===---------------------------------------===//
+// 'cos*' Optimizations
+struct CosOpt : public LibCallOptimization {
+  virtual Value *CallOptimizer(Function *Callee, CallInst *CI, IRBuilder<> &B) {
+    // With unsafe shrinking enabled, first try to turn cos into cosf when the
+    // target library info reports cosf as available.
+    Value *Shrunk = NULL;
+    if (UnsafeFPShrink && Callee->getName() == "cos" && TLI->has(LibFunc::cosf))
+      Shrunk = UnaryDoubleFPOpt(true).CallOptimizer(Callee, CI, B);
+
+    // The remaining fold requires exactly one FP parameter whose type equals
+    // the return type.
+    FunctionType *FT = Callee->getFunctionType();
+    bool ProtoOK = FT->getNumParams() == 1 &&
+                   FT->getReturnType() == FT->getParamType(0) &&
+                   FT->getParamType(0)->isFloatingPointTy();
+    if (!ProtoOK)
+      return Shrunk;
+
+    // cos(-x) -> cos(x)
+    Value *Arg = CI->getArgOperand(0);
+    if (!BinaryOperator::isFNeg(Arg))
+      return Shrunk;
+    Value *Negated = cast<BinaryOperator>(Arg)->getOperand(1);
+    return B.CreateCall(Callee, Negated, "cos");
+  }
+};
+
  //===---------------------------------------===//
  // 'pow*' Optimizations
  
  struct PowOpt : public LibCallOptimization {
    virtual Value *CallOptimizer(Function *Callee, CallInst *CI, IRBuilder<> &B) {
-    const FunctionType *FT = Callee->getFunctionType();
+    Value *Ret = NULL;
+    if (UnsafeFPShrink && Callee->getName() == "pow" &&
+        TLI->has(LibFunc::powf)) {
+      UnaryDoubleFPOpt UnsafeUnaryDoubleFP(true);
+      Ret = UnsafeUnaryDoubleFP.CallOptimizer(Callee, CI, B);
+    }
+
+    FunctionType *FT = Callee->getFunctionType();
      // Just make sure this has 2 arguments of the same FP type, which match the
      // result type.
      if (FT->getNumParams() != 2 || FT->getReturnType() != FT->getParamType(0) ||
          FT->getParamType(0) != FT->getParamType(1) ||
          !FT->getParamType(0)->isFloatingPointTy())
-      return 0;
+      return Ret;
  
      Value *Op1 = CI->getArgOperand(0), *Op2 = CI->getArgOperand(1);
      if (ConstantFP *Op1C = dyn_cast<ConstantFP>(Op1)) {
@@ -845,7 +988,7 @@ struct PowOpt : public LibCallOptimization {
      }
  
      ConstantFP *Op2C = dyn_cast<ConstantFP>(Op2);
-    if (Op2C == 0) return 0;
+    if (Op2C == 0) return Ret;
  
      if (Op2C->getValueAPF().isZero())  // pow(x, 0.0) -> 1.0
        return ConstantFP::get(CI->getType(), 1.0);
@@ -853,7 +996,7 @@ struct PowOpt : public LibCallOptimization {
      if (Op2C->isExactlyValue(0.5)) {
        // Expand pow(x, 0.5) to (x == -infinity ? +infinity : fabs(sqrt(x))).
        // This is faster than calling pow, and still handles negative zero
-      // and negative infinite correctly.
+      // and negative infinity correctly.
        // TODO: In fast-math mode, this could be just sqrt(x).
        // TODO: In finite-only mode, this could be just fabs(sqrt(x)).
        Value *Inf = ConstantFP::getInfinity(CI->getType());
@@ -862,8 +1005,8 @@ struct PowOpt : public LibCallOptimization {
                                           Callee->getAttributes());
        Value *FAbs = EmitUnaryFloatFnCall(Sqrt, "fabs", B,
                                           Callee->getAttributes());
-      Value *FCmp = B.CreateFCmpOEQ(Op1, NegInf, "tmp");
-      Value *Sel = B.CreateSelect(FCmp, Inf, FAbs, "tmp");
+      Value *FCmp = B.CreateFCmpOEQ(Op1, NegInf);
+      Value *Sel = B.CreateSelect(FCmp, Inf, FAbs);
        return Sel;
      }
  
@@ -883,12 +1026,19 @@ struct PowOpt : public LibCallOptimization {
  
  struct Exp2Opt : public LibCallOptimization {
    virtual Value *CallOptimizer(Function *Callee, CallInst *CI, IRBuilder<> &B) {
-    const FunctionType *FT = Callee->getFunctionType();
+    Value *Ret = NULL;
+    if (UnsafeFPShrink && Callee->getName() == "exp2" &&
+        TLI->has(LibFunc::exp2)) {
+      UnaryDoubleFPOpt UnsafeUnaryDoubleFP(true);
+      Ret = UnsafeUnaryDoubleFP.CallOptimizer(Callee, CI, B);
+    }
+
+    FunctionType *FT = Callee->getFunctionType();
      // Just make sure this has 1 argument of FP type, which matches the
      // result type.
      if (FT->getNumParams() != 1 || FT->getReturnType() != FT->getParamType(0) ||
          !FT->getParamType(0)->isFloatingPointTy())
-      return 0;
+      return Ret;
  
      Value *Op = CI->getArgOperand(0);
      // Turn exp2(sitofp(x)) -> ldexp(1.0, sext(x))  if sizeof(x) <= 32
@@ -896,10 +1046,10 @@ struct Exp2Opt : public LibCallOptimization {
      Value *LdExpArg = 0;
      if (SIToFPInst *OpC = dyn_cast<SIToFPInst>(Op)) {
        if (OpC->getOperand(0)->getType()->getPrimitiveSizeInBits() <= 32)
-        LdExpArg = B.CreateSExt(OpC->getOperand(0), B.getInt32Ty(), "tmp");
+        LdExpArg = B.CreateSExt(OpC->getOperand(0), B.getInt32Ty());
      } else if (UIToFPInst *OpC = dyn_cast<UIToFPInst>(Op)) {
        if (OpC->getOperand(0)->getType()->getPrimitiveSizeInBits() < 32)
-        LdExpArg = B.CreateZExt(OpC->getOperand(0), B.getInt32Ty(), "tmp");
+        LdExpArg = B.CreateZExt(OpC->getOperand(0), B.getInt32Ty());
      }
  
      if (LdExpArg) {
@@ -925,30 +1075,7 @@ struct Exp2Opt : public LibCallOptimization {
  
        return CI;
      }
-    return 0;
-  }
-};
-
-//===---------------------------------------===//
-// Double -> Float Shrinking Optimizations for Unary Functions like 'floor'
-
-struct UnaryDoubleFPOpt : public LibCallOptimization {
-  virtual Value *CallOptimizer(Function *Callee, CallInst *CI, IRBuilder<> &B) {
-    const FunctionType *FT = Callee->getFunctionType();
-    if (FT->getNumParams() != 1 || !FT->getReturnType()->isDoubleTy() ||
-        !FT->getParamType(0)->isDoubleTy())
-      return 0;
-
-    // If this is something like 'floor((double)floatval)', convert to floorf.
-    FPExtInst *Cast = dyn_cast<FPExtInst>(CI->getArgOperand(0));
-    if (Cast == 0 || !Cast->getOperand(0)->getType()->isFloatTy())
-      return 0;
-
-    // floor((double)floatval) -> (double)floorf(floatval)
-    Value *V = Cast->getOperand(0);
-    V = EmitUnaryFloatFnCall(V, Callee->getName().data(), B,
-                             Callee->getAttributes());
-    return B.CreateFPExt(V, B.getDoubleTy());
+    return Ret;
    }
  };
  
@@ -961,7 +1088,7 @@ struct UnaryDoubleFPOpt : public LibCallOptimization {
  
  struct FFSOpt : public LibCallOptimization {
    virtual Value *CallOptimizer(Function *Callee, CallInst *CI, IRBuilder<> &B) {
-    const FunctionType *FT = Callee->getFunctionType();
+    FunctionType *FT = Callee->getFunctionType();
      // Just make sure this has 2 arguments of the same FP type, which match the
      // result type.
      if (FT->getNumParams() != 1 ||
@@ -980,14 +1107,14 @@ struct FFSOpt : public LibCallOptimization {
      }
  
      // ffs(x) -> x != 0 ? (i32)llvm.cttz(x)+1 : 0
-    const Type *ArgType = Op->getType();
+    Type *ArgType = Op->getType();
      Value *F = Intrinsic::getDeclaration(Callee->getParent(),
-                                         Intrinsic::cttz, &ArgType, 1);
-    Value *V = B.CreateCall(F, Op, "cttz");
-    V = B.CreateAdd(V, ConstantInt::get(V->getType(), 1), "tmp");
-    V = B.CreateIntCast(V, B.getInt32Ty(), false, "tmp");
+                                         Intrinsic::cttz, ArgType);
+    Value *V = B.CreateCall2(F, Op, B.getFalse(), "cttz");
+    V = B.CreateAdd(V, ConstantInt::get(V->getType(), 1));
+    V = B.CreateIntCast(V, B.getInt32Ty(), false);
  
-    Value *Cond = B.CreateICmpNE(Op, Constant::getNullValue(ArgType), "tmp");
+    Value *Cond = B.CreateICmpNE(Op, Constant::getNullValue(ArgType));
      return B.CreateSelect(Cond, V, B.getInt32(0));
    }
  };
@@ -997,7 +1124,7 @@ struct FFSOpt : public LibCallOptimization {
  
  struct IsDigitOpt : public LibCallOptimization {
    virtual Value *CallOptimizer(Function *Callee, CallInst *CI, IRBuilder<> &B) {
-    const FunctionType *FT = Callee->getFunctionType();
+    FunctionType *FT = Callee->getFunctionType();
      // We require integer(i32)
      if (FT->getNumParams() != 1 || !FT->getReturnType()->isIntegerTy() ||
          !FT->getParamType(0)->isIntegerTy(32))
@@ -1016,7 +1143,7 @@ struct IsDigitOpt : public LibCallOptimization {
  
  struct IsAsciiOpt : public LibCallOptimization {
    virtual Value *CallOptimizer(Function *Callee, CallInst *CI, IRBuilder<> &B) {
-    const FunctionType *FT = Callee->getFunctionType();
+    FunctionType *FT = Callee->getFunctionType();
      // We require integer(i32)
      if (FT->getNumParams() != 1 || !FT->getReturnType()->isIntegerTy() ||
          !FT->getParamType(0)->isIntegerTy(32))
@@ -1034,7 +1161,7 @@ struct IsAsciiOpt : public LibCallOptimization {
  
  struct AbsOpt : public LibCallOptimization {
    virtual Value *CallOptimizer(Function *Callee, CallInst *CI, IRBuilder<> &B) {
-    const FunctionType *FT = Callee->getFunctionType();
+    FunctionType *FT = Callee->getFunctionType();
      // We require integer(integer) where the types agree.
      if (FT->getNumParams() != 1 || !FT->getReturnType()->isIntegerTy() ||
          FT->getParamType(0) != FT->getReturnType())
@@ -1055,7 +1182,7 @@ struct AbsOpt : public LibCallOptimization {
  
  struct ToAsciiOpt : public LibCallOptimization {
    virtual Value *CallOptimizer(Function *Callee, CallInst *CI, IRBuilder<> &B) {
-    const FunctionType *FT = Callee->getFunctionType();
+    FunctionType *FT = Callee->getFunctionType();
      // We require i32(i32)
      if (FT->getNumParams() != 1 || FT->getReturnType() != FT->getParamType(0) ||
          !FT->getParamType(0)->isIntegerTy(32))
@@ -1075,17 +1202,11 @@ struct ToAsciiOpt : public LibCallOptimization {
  // 'printf' Optimizations
  
  struct PrintFOpt : public LibCallOptimization {
-  virtual Value *CallOptimizer(Function *Callee, CallInst *CI, IRBuilder<> &B) {
-    // Require one fixed pointer argument and an integer/void result.
-    const FunctionType *FT = Callee->getFunctionType();
-    if (FT->getNumParams() < 1 || !FT->getParamType(0)->isPointerTy() ||
-        !(FT->getReturnType()->isIntegerTy() ||
-          FT->getReturnType()->isVoidTy()))
-      return 0;
-
+  Value *OptimizeFixedFormatString(Function *Callee, CallInst *CI,
+                                   IRBuilder<> &B) {
      // Check for a fixed format string.
-    std::string FormatStr;
-    if (!GetConstantStringInfo(CI->getArgOperand(0), FormatStr))
+    StringRef FormatStr;
+    if (!getConstantStringInfo(CI->getArgOperand(0), FormatStr))
        return 0;
  
      // Empty format string -> noop.
@@ -1101,8 +1222,8 @@ struct PrintFOpt : public LibCallOptimization {
  
      // printf("x") -> putchar('x'), even for '%'.
      if (FormatStr.size() == 1) {
-      Value *Res = EmitPutChar(B.getInt32(FormatStr[0]), B, TD);
-      if (CI->use_empty()) return CI;
+      Value *Res = EmitPutChar(B.getInt32(FormatStr[0]), B, TD, TLI);
+      if (CI->use_empty() || !Res) return Res;
        return B.CreateIntCast(Res, CI->getType(), true);
      }
  
@@ -1111,30 +1232,54 @@ struct PrintFOpt : public LibCallOptimization {
          FormatStr.find('%') == std::string::npos) {  // no format characters.
        // Create a string literal with no \n on it.  We expect the constant merge
        // pass to be run after this pass, to merge duplicate strings.
-      FormatStr.erase(FormatStr.end()-1);
-      Constant *C = ConstantArray::get(*Context, FormatStr, true);
-      C = new GlobalVariable(*Callee->getParent(), C->getType(), true,
-                             GlobalVariable::InternalLinkage, C, "str");
-      EmitPutS(C, B, TD);
-      return CI->use_empty() ? (Value*)CI :
-                    ConstantInt::get(CI->getType(), FormatStr.size()+1);
+      FormatStr = FormatStr.drop_back();
+      Value *GV = B.CreateGlobalString(FormatStr, "str");
+      Value *NewCI = EmitPutS(GV, B, TD, TLI);
+      return (CI->use_empty() || !NewCI) ?
+              NewCI :
+              ConstantInt::get(CI->getType(), FormatStr.size()+1);
      }
  
      // Optimize specific format strings.
      // printf("%c", chr) --> putchar(chr)
      if (FormatStr == "%c" && CI->getNumArgOperands() > 1 &&
          CI->getArgOperand(1)->getType()->isIntegerTy()) {
-      Value *Res = EmitPutChar(CI->getArgOperand(1), B, TD);
+      Value *Res = EmitPutChar(CI->getArgOperand(1), B, TD, TLI);
  
-      if (CI->use_empty()) return CI;
+      if (CI->use_empty() || !Res) return Res;
        return B.CreateIntCast(Res, CI->getType(), true);
      }
  
      // printf("%s\n", str) --> puts(str)
      if (FormatStr == "%s\n" && CI->getNumArgOperands() > 1 &&
          CI->getArgOperand(1)->getType()->isPointerTy()) {
-      EmitPutS(CI->getArgOperand(1), B, TD);
-      return CI;
+      return EmitPutS(CI->getArgOperand(1), B, TD, TLI);
+    }
+    return 0;
+  }
+
+  virtual Value *CallOptimizer(Function *Callee, CallInst *CI, IRBuilder<> &B) {
+    // Require at least one fixed pointer argument and an integer/void result.
+    FunctionType *FT = Callee->getFunctionType();
+    if (FT->getNumParams() < 1 || !FT->getParamType(0)->isPointerTy() ||
+        !(FT->getReturnType()->isIntegerTy() ||
+          FT->getReturnType()->isVoidTy()))
+      return 0;  // Unexpected prototype: no simplification.
+
+    if (Value *V = OptimizeFixedFormatString(Callee, CI, B)) {
+      return V;  // A fixed-format-string rewrite applied; use its result.
+    }
+
+    // printf(format, ...) -> iprintf(format, ...) if the target library has
+    // iprintf and the call passes no floating point arguments.
+    if (TLI->has(LibFunc::iprintf) && !CallHasFloatingPointArgument(CI)) {
+      Module *M = B.GetInsertBlock()->getParent()->getParent();
+      Constant *IPrintFFn =
+        M->getOrInsertFunction("iprintf", FT, Callee->getAttributes());
+      CallInst *New = cast<CallInst>(CI->clone());  // Copy of CI, retargeted below.
+      New->setCalledFunction(IPrintFFn);
+      B.Insert(New);
+      return New;
      }
      return 0;
    }
@@ -1144,17 +1289,11 @@ struct PrintFOpt : public LibCallOptimization {
  // 'sprintf' Optimizations
  
  struct SPrintFOpt : public LibCallOptimization {
-  virtual Value *CallOptimizer(Function *Callee, CallInst *CI, IRBuilder<> &B) {
-    // Require two fixed pointer arguments and an integer result.
-    const FunctionType *FT = Callee->getFunctionType();
-    if (FT->getNumParams() != 2 || !FT->getParamType(0)->isPointerTy() ||
-        !FT->getParamType(1)->isPointerTy() ||
-        !FT->getReturnType()->isIntegerTy())
-      return 0;
-
+  Value *OptimizeFixedFormatString(Function *Callee, CallInst *CI,
+                                   IRBuilder<> &B) {
      // Check for a fixed format string.
-    std::string FormatStr;
-    if (!GetConstantStringInfo(CI->getArgOperand(1), FormatStr))
+    StringRef FormatStr;
+    if (!getConstantStringInfo(CI->getArgOperand(1), FormatStr))
        return 0;
  
      // If we just have a format string (nothing else crazy) transform it.
@@ -1201,7 +1340,9 @@ struct SPrintFOpt : public LibCallOptimization {
        // sprintf(dest, "%s", str) -> llvm.memcpy(dest, str, strlen(str)+1, 1)
        if (!CI->getArgOperand(2)->getType()->isPointerTy()) return 0;
  
-      Value *Len = EmitStrLen(CI->getArgOperand(2), B, TD);
+      Value *Len = EmitStrLen(CI->getArgOperand(2), B, TD, TLI);
+      if (!Len)
+        return 0;
        Value *IncLen = B.CreateAdd(Len,
                                    ConstantInt::get(Len->getType(), 1),
                                    "leninc");
@@ -1212,6 +1353,32 @@ struct SPrintFOpt : public LibCallOptimization {
      }
      return 0;
    }
+
+  virtual Value *CallOptimizer(Function *Callee, CallInst *CI, IRBuilder<> &B) {
+    // Require exactly two fixed pointer arguments and an integer result.
+    FunctionType *FT = Callee->getFunctionType();
+    if (FT->getNumParams() != 2 || !FT->getParamType(0)->isPointerTy() ||
+        !FT->getParamType(1)->isPointerTy() ||
+        !FT->getReturnType()->isIntegerTy())
+      return 0;  // Unexpected prototype: no simplification.
+
+    if (Value *V = OptimizeFixedFormatString(Callee, CI, B)) {
+      return V;  // A fixed-format-string rewrite applied; use its result.
+    }
+
+    // sprintf(str, format, ...) -> siprintf(str, format, ...) if the target
+    // library has siprintf and the call passes no floating point arguments.
+    if (TLI->has(LibFunc::siprintf) && !CallHasFloatingPointArgument(CI)) {
+      Module *M = B.GetInsertBlock()->getParent()->getParent();
+      Constant *SIPrintFFn =
+        M->getOrInsertFunction("siprintf", FT, Callee->getAttributes());
+      CallInst *New = cast<CallInst>(CI->clone());  // Copy of CI, retargeted below.
+      New->setCalledFunction(SIPrintFFn);
+      B.Insert(New);
+      return New;
+    }
+    return 0;
+  }
  };
  
  //===---------------------------------------===//
@@ -1220,7 +1387,7 @@ struct SPrintFOpt : public LibCallOptimization {
  struct FWriteOpt : public LibCallOptimization {
    virtual Value *CallOptimizer(Function *Callee, CallInst *CI, IRBuilder<> &B) {
      // Require a pointer, an integer, an integer, a pointer, returning integer.
-    const FunctionType *FT = Callee->getFunctionType();
+    FunctionType *FT = Callee->getFunctionType();
      if (FT->getNumParams() != 4 || !FT->getParamType(0)->isPointerTy() ||
          !FT->getParamType(1)->isIntegerTy() ||
          !FT->getParamType(2)->isIntegerTy() ||
@@ -1239,10 +1406,11 @@ struct FWriteOpt : public LibCallOptimization {
        return ConstantInt::get(CI->getType(), 0);
  
      // If this is writing one byte, turn it into fputc.
-    if (Bytes == 1) {  // fwrite(S,1,1,F) -> fputc(S[0],F)
+    // This optimization is only valid if the return value is unused.
+    if (Bytes == 1 && CI->use_empty()) {  // fwrite(S,1,1,F) -> fputc(S[0],F)
        Value *Char = B.CreateLoad(CastToCStr(CI->getArgOperand(0), B), "char");
-      EmitFPutC(Char, CI->getArgOperand(3), B, TD);
-      return ConstantInt::get(CI->getType(), 1);
+      Value *NewCI = EmitFPutC(Char, CI->getArgOperand(3), B, TD, TLI);
+      return NewCI ? ConstantInt::get(CI->getType(), 1) : 0;
      }
  
      return 0;
@@ -1258,7 +1426,7 @@ struct FPutsOpt : public LibCallOptimization {
      if (!TD) return 0;
  
      // Require two pointers.  Also, we can't optimize if return value is used.
-    const FunctionType *FT = Callee->getFunctionType();
+    FunctionType *FT = Callee->getFunctionType();
      if (FT->getNumParams() != 2 || !FT->getParamType(0)->isPointerTy() ||
          !FT->getParamType(1)->isPointerTy() ||
          !CI->use_empty())
@@ -1267,10 +1435,10 @@ struct FPutsOpt : public LibCallOptimization {
      // fputs(s,F) --> fwrite(s,1,strlen(s),F)
      uint64_t Len = GetStringLength(CI->getArgOperand(0));
      if (!Len) return 0;
-    EmitFWrite(CI->getArgOperand(0),
-               ConstantInt::get(TD->getIntPtrType(*Context), Len-1),
-               CI->getArgOperand(1), B, TD);
-    return CI;  // Known to have no uses (see above).
+    // Known to have no uses (see above).
+    return EmitFWrite(CI->getArgOperand(0),
+                      ConstantInt::get(TD->getIntPtrType(*Context), Len-1),
+                      CI->getArgOperand(1), B, TD, TLI);
    }
  };
  
@@ -1278,17 +1446,11 @@ struct FPutsOpt : public LibCallOptimization {
  // 'fprintf' Optimizations
  
  struct FPrintFOpt : public LibCallOptimization {
-  virtual Value *CallOptimizer(Function *Callee, CallInst *CI, IRBuilder<> &B) {
-    // Require two fixed paramters as pointers and integer result.
-    const FunctionType *FT = Callee->getFunctionType();
-    if (FT->getNumParams() != 2 || !FT->getParamType(0)->isPointerTy() ||
-        !FT->getParamType(1)->isPointerTy() ||
-        !FT->getReturnType()->isIntegerTy())
-      return 0;
-
+  Value *OptimizeFixedFormatString(Function *Callee, CallInst *CI,
+                                   IRBuilder<> &B) {
      // All the optimizations depend on the format string.
-    std::string FormatStr;
-    if (!GetConstantStringInfo(CI->getArgOperand(1), FormatStr))
+    StringRef FormatStr;
+    if (!getConstantStringInfo(CI->getArgOperand(1), FormatStr))
        return 0;
  
      // fprintf(F, "foo") --> fwrite("foo", 3, 1, F)
@@ -1300,11 +1462,11 @@ struct FPrintFOpt : public LibCallOptimization {
        // These optimizations require TargetData.
        if (!TD) return 0;
  
-      EmitFWrite(CI->getArgOperand(1),
-                 ConstantInt::get(TD->getIntPtrType(*Context),
-                                  FormatStr.size()),
-                 CI->getArgOperand(0), B, TD);
-      return ConstantInt::get(CI->getType(), FormatStr.size());
+      Value *NewCI = EmitFWrite(CI->getArgOperand(1),
+                                ConstantInt::get(TD->getIntPtrType(*Context),
+                                                 FormatStr.size()),
+                                CI->getArgOperand(0), B, TD, TLI);
+      return NewCI ? ConstantInt::get(CI->getType(), FormatStr.size()) : 0;
      }
  
      // The remaining optimizations require the format string to be "%s" or "%c"
@@ -1317,16 +1479,42 @@ struct FPrintFOpt : public LibCallOptimization {
      if (FormatStr[1] == 'c') {
        // fprintf(F, "%c", chr) --> fputc(chr, F)
        if (!CI->getArgOperand(2)->getType()->isIntegerTy()) return 0;
-      EmitFPutC(CI->getArgOperand(2), CI->getArgOperand(0), B, TD);
-      return ConstantInt::get(CI->getType(), 1);
+      Value *NewCI = EmitFPutC(CI->getArgOperand(2), CI->getArgOperand(0), B,
+                               TD, TLI);
+      return NewCI ? ConstantInt::get(CI->getType(), 1) : 0;
      }
  
      if (FormatStr[1] == 's') {
        // fprintf(F, "%s", str) --> fputs(str, F)
        if (!CI->getArgOperand(2)->getType()->isPointerTy() || !CI->use_empty())
          return 0;
-      EmitFPutS(CI->getArgOperand(2), CI->getArgOperand(0), B, TD);
-      return CI;
+      return EmitFPutS(CI->getArgOperand(2), CI->getArgOperand(0), B, TD, TLI);
+    }
+    return 0;
+  }
+
+  virtual Value *CallOptimizer(Function *Callee, CallInst *CI, IRBuilder<> &B) {
+    // Require two fixed parameters as pointers and an integer result.
+    FunctionType *FT = Callee->getFunctionType();
+    if (FT->getNumParams() != 2 || !FT->getParamType(0)->isPointerTy() ||
+        !FT->getParamType(1)->isPointerTy() ||
+        !FT->getReturnType()->isIntegerTy())
+      return 0;  // Unexpected prototype: no simplification.
+
+    if (Value *V = OptimizeFixedFormatString(Callee, CI, B)) {
+      return V;  // A fixed-format-string rewrite applied; use its result.
+    }
+
+    // fprintf(stream, format, ...) -> fiprintf(stream, format, ...) if the
+    // target library has fiprintf and no floating point arguments are passed.
+    if (TLI->has(LibFunc::fiprintf) && !CallHasFloatingPointArgument(CI)) {
+      Module *M = B.GetInsertBlock()->getParent()->getParent();
+      Constant *FIPrintFFn =
+        M->getOrInsertFunction("fiprintf", FT, Callee->getAttributes());
+      CallInst *New = cast<CallInst>(CI->clone());  // Copy of CI, retargeted below.
+      New->setCalledFunction(FIPrintFFn);
+      B.Insert(New);
+      return New;
      }
      return 0;
    }
@@ -1338,21 +1526,21 @@ struct FPrintFOpt : public LibCallOptimization {
  struct PutsOpt : public LibCallOptimization {
    virtual Value *CallOptimizer(Function *Callee, CallInst *CI, IRBuilder<> &B) {
      // Require one fixed pointer argument and an integer/void result.
-    const FunctionType *FT = Callee->getFunctionType();
+    FunctionType *FT = Callee->getFunctionType();
      if (FT->getNumParams() < 1 || !FT->getParamType(0)->isPointerTy() ||
          !(FT->getReturnType()->isIntegerTy() ||
            FT->getReturnType()->isVoidTy()))
        return 0;
  
      // Check for a constant string.
-    std::string Str;
-    if (!GetConstantStringInfo(CI->getArgOperand(0), Str))
+    StringRef Str;
+    if (!getConstantStringInfo(CI->getArgOperand(0), Str))
        return 0;
  
      if (Str.empty() && CI->use_empty()) {
        // puts("") -> putchar('\n')
-      Value *Res = EmitPutChar(B.getInt32('\n'), B, TD);
-      if (CI->use_empty()) return CI;
+      Value *Res = EmitPutChar(B.getInt32('\n'), B, TD, TLI);
+      if (CI->use_empty() || !Res) return Res;
        return B.CreateIntCast(Res, CI->getType(), true);
      }
  
@@ -1371,16 +1559,20 @@ namespace {
    ///
    class SimplifyLibCalls : public FunctionPass {
      TargetLibraryInfo *TLI;
-    
+
      StringMap<LibCallOptimization*> Optimizations;
      // String and Memory LibCall Optimizations
      StrCatOpt StrCat; StrNCatOpt StrNCat; StrChrOpt StrChr; StrRChrOpt StrRChr;
-    StrCmpOpt StrCmp; StrNCmpOpt StrNCmp; StrCpyOpt StrCpy; StrCpyOpt StrCpyChk;
-    StrNCpyOpt StrNCpy; StrLenOpt StrLen; StrPBrkOpt StrPBrk;
+    StrCmpOpt StrCmp; StrNCmpOpt StrNCmp;
+    StrCpyOpt StrCpy; StrCpyOpt StrCpyChk;
+    StpCpyOpt StpCpy; StpCpyOpt StpCpyChk;
+    StrNCpyOpt StrNCpy;
+    StrLenOpt StrLen; StrPBrkOpt StrPBrk;
      StrToOpt StrTo; StrSpnOpt StrSpn; StrCSpnOpt StrCSpn; StrStrOpt StrStr;
      MemCmpOpt MemCmp; MemCpyOpt MemCpy; MemMoveOpt MemMove; MemSetOpt MemSet;
      // Math Library Optimizations
-    PowOpt Pow; Exp2Opt Exp2; UnaryDoubleFPOpt UnaryDoubleFP;
+    CosOpt Cos; PowOpt Pow; Exp2Opt Exp2;
+    UnaryDoubleFPOpt UnaryDoubleFP, UnsafeUnaryDoubleFP;
      // Integer Optimizations
      FFSOpt FFS; AbsOpt Abs; IsDigitOpt IsDigit; IsAsciiOpt IsAscii;
      ToAsciiOpt ToAscii;
@@ -1388,13 +1580,18 @@ namespace {
      SPrintFOpt SPrintF; PrintFOpt PrintF;
      FWriteOpt FWrite; FPutsOpt FPuts; FPrintFOpt FPrintF;
      PutsOpt Puts;
-    
+
      bool Modified;  // This is only used by doInitialization.
    public:
      static char ID; // Pass identification
-    SimplifyLibCalls() : FunctionPass(ID), StrCpy(false), StrCpyChk(true) {
+    SimplifyLibCalls() : FunctionPass(ID), StrCpy(false), StrCpyChk(true),
+                         StpCpy(false), StpCpyChk(true),
+                         UnaryDoubleFP(false), UnsafeUnaryDoubleFP(true) {
        initializeSimplifyLibCallsPass(*PassRegistry::getPassRegistry());
      }
+    void AddOpt(LibFunc::Func F, LibCallOptimization* Opt);
+    void AddOpt(LibFunc::Func F1, LibFunc::Func F2, LibCallOptimization* Opt);
+
      void InitOptimizations();
      bool runOnFunction(Function &F);
  
@@ -1425,6 +1622,17 @@ FunctionPass *llvm::createSimplifyLibCallsPass() {
    return new SimplifyLibCalls();
  }
  
+void SimplifyLibCalls::AddOpt(LibFunc::Func F, LibCallOptimization* Opt) {
+  if (TLI->has(F))  // Register Opt only when TLI reports F as available.
+    Optimizations[TLI->getName(F)] = Opt;  // Keyed by the name TLI gives F.
+}
+
+void SimplifyLibCalls::AddOpt(LibFunc::Func F1, LibFunc::Func F2,
+                              LibCallOptimization* Opt) {
+  if (TLI->has(F1) && TLI->has(F2))  // Both F1 and F2 must be available.
+    Optimizations[TLI->getName(F1)] = Opt;  // Only F1's name is registered.
+}
+
  /// Optimizations - Populate the Optimizations map with all the optimizations
  /// we know.
  void SimplifyLibCalls::InitOptimizations() {
@@ -1437,6 +1645,7 @@ void SimplifyLibCalls::InitOptimizations() {
    Optimizations["strncmp"] = &StrNCmp;
    Optimizations["strcpy"] = &StrCpy;
    Optimizations["strncpy"] = &StrNCpy;
+  Optimizations["stpcpy"] = &StpCpy;
    Optimizations["strlen"] = &StrLen;
    Optimizations["strpbrk"] = &StrPBrk;
    Optimizations["strtol"] = &StrTo;
@@ -1450,14 +1659,18 @@ void SimplifyLibCalls::InitOptimizations() {
    Optimizations["strcspn"] = &StrCSpn;
    Optimizations["strstr"] = &StrStr;
    Optimizations["memcmp"] = &MemCmp;
-  if (TLI->has(LibFunc::memcpy)) Optimizations["memcpy"] = &MemCpy;
+  AddOpt(LibFunc::memcpy, &MemCpy);
    Optimizations["memmove"] = &MemMove;
-  if (TLI->has(LibFunc::memset)) Optimizations["memset"] = &MemSet;
+  AddOpt(LibFunc::memset, &MemSet);
  
    // _chk variants of String and Memory LibCall Optimizations.
    Optimizations["__strcpy_chk"] = &StrCpyChk;
+  Optimizations["__stpcpy_chk"] = &StpCpyChk;
  
    // Math Library Optimizations
+  Optimizations["cosf"] = &Cos;
+  Optimizations["cos"] = &Cos;
+  Optimizations["cosl"] = &Cos;
    Optimizations["powf"] = &Pow;
    Optimizations["pow"] = &Pow;
    Optimizations["powl"] = &Pow;
@@ -1475,21 +1688,37 @@ void SimplifyLibCalls::InitOptimizations() {
    Optimizations["llvm.exp2.f64"] = &Exp2;
    Optimizations["llvm.exp2.f32"] = &Exp2;
  
-#ifdef HAVE_FLOORF
-  Optimizations["floor"] = &UnaryDoubleFP;
-#endif
-#ifdef HAVE_CEILF
-  Optimizations["ceil"] = &UnaryDoubleFP;
-#endif
-#ifdef HAVE_ROUNDF
-  Optimizations["round"] = &UnaryDoubleFP;
-#endif
-#ifdef HAVE_RINTF
-  Optimizations["rint"] = &UnaryDoubleFP;
-#endif
-#ifdef HAVE_NEARBYINTF
-  Optimizations["nearbyint"] = &UnaryDoubleFP;
-#endif
+  AddOpt(LibFunc::ceil, LibFunc::ceilf, &UnaryDoubleFP);
+  AddOpt(LibFunc::fabs, LibFunc::fabsf, &UnaryDoubleFP);
+  AddOpt(LibFunc::floor, LibFunc::floorf, &UnaryDoubleFP);
+  AddOpt(LibFunc::rint, LibFunc::rintf, &UnaryDoubleFP);
+  AddOpt(LibFunc::round, LibFunc::roundf, &UnaryDoubleFP);
+  AddOpt(LibFunc::nearbyint, LibFunc::nearbyintf, &UnaryDoubleFP);
+  AddOpt(LibFunc::trunc, LibFunc::truncf, &UnaryDoubleFP);
+
+  if(UnsafeFPShrink) {
+    AddOpt(LibFunc::acos, LibFunc::acosf, &UnsafeUnaryDoubleFP);
+    AddOpt(LibFunc::acosh, LibFunc::acoshf, &UnsafeUnaryDoubleFP);
+    AddOpt(LibFunc::asin, LibFunc::asinf, &UnsafeUnaryDoubleFP);
+    AddOpt(LibFunc::asinh, LibFunc::asinhf, &UnsafeUnaryDoubleFP);
+    AddOpt(LibFunc::atan, LibFunc::atanf, &UnsafeUnaryDoubleFP);
+    AddOpt(LibFunc::atanh, LibFunc::atanhf, &UnsafeUnaryDoubleFP);
+    AddOpt(LibFunc::cbrt, LibFunc::cbrtf, &UnsafeUnaryDoubleFP);
+    AddOpt(LibFunc::cosh, LibFunc::coshf, &UnsafeUnaryDoubleFP);
+    AddOpt(LibFunc::exp, LibFunc::expf, &UnsafeUnaryDoubleFP);
+    AddOpt(LibFunc::exp10, LibFunc::exp10f, &UnsafeUnaryDoubleFP);
+    AddOpt(LibFunc::expm1, LibFunc::expm1f, &UnsafeUnaryDoubleFP);
+    AddOpt(LibFunc::log, LibFunc::logf, &UnsafeUnaryDoubleFP);
+    AddOpt(LibFunc::log10, LibFunc::log10f, &UnsafeUnaryDoubleFP);
+    AddOpt(LibFunc::log1p, LibFunc::log1pf, &UnsafeUnaryDoubleFP);
+    AddOpt(LibFunc::log2, LibFunc::log2f, &UnsafeUnaryDoubleFP);
+    AddOpt(LibFunc::logb, LibFunc::logbf, &UnsafeUnaryDoubleFP);
+    AddOpt(LibFunc::sin, LibFunc::sinf, &UnsafeUnaryDoubleFP);
+    AddOpt(LibFunc::sinh, LibFunc::sinhf, &UnsafeUnaryDoubleFP);
+    AddOpt(LibFunc::sqrt, LibFunc::sqrtf, &UnsafeUnaryDoubleFP);
+    AddOpt(LibFunc::tan, LibFunc::tanf, &UnsafeUnaryDoubleFP);
+    AddOpt(LibFunc::tanh, LibFunc::tanhf, &UnsafeUnaryDoubleFP);
+  }
  
    // Integer Optimizations
    Optimizations["ffs"] = &FFS;
@@ -1505,8 +1734,8 @@ void SimplifyLibCalls::InitOptimizations() {
    // Formatting and IO Optimizations
    Optimizations["sprintf"] = &SPrintF;
    Optimizations["printf"] = &PrintF;
-  Optimizations["fwrite"] = &FWrite;
-  Optimizations["fputs"] = &FPuts;
+  AddOpt(LibFunc::fwrite, &FWrite);
+  AddOpt(LibFunc::fputs, &FPuts);
    Optimizations["fprintf"] = &FPrintF;
    Optimizations["puts"] = &Puts;
  }
@@ -1544,8 +1773,11 @@ bool SimplifyLibCalls::runOnFunction(Function &F) {
        // Set the builder to the instruction after the call.
        Builder.SetInsertPoint(BB, I);
  
+      // Use debug location of CI for all new instructions.
+      Builder.SetCurrentDebugLocation(CI->getDebugLoc());
+
        // Try to optimize this call.
-      Value *Result = LCO->OptimizeCall(CI, TD, Builder);
+      Value *Result = LCO->OptimizeCall(CI, TD, TLI, Builder);
        if (Result == 0) continue;
  
        DEBUG(dbgs() << "SimplifyLibCalls simplified: " << *CI;
@@ -1610,8 +1842,8 @@ void SimplifyLibCalls::setDoesNotAlias(Function &F, unsigned n) {
  
  
  void SimplifyLibCalls::inferPrototypeAttributes(Function &F) {
-  const FunctionType *FTy = F.getFunctionType();
-  
+  FunctionType *FTy = F.getFunctionType();
+
    StringRef Name = F.getName();
    switch (Name[0]) {
    case 's':
@@ -1640,6 +1872,7 @@ void SimplifyLibCalls::inferPrototypeAttributes(Function &F) {
                 Name == "strtold" ||
                 Name == "strncat" ||
                 Name == "strncpy" ||
+               Name == "stpncpy" ||
                 Name == "strtoull") {
        if (FTy->getNumParams() < 2 ||
            !FTy->getParamType(1)->isPointerTy())
@@ -2268,9 +2501,6 @@ bool SimplifyLibCalls::doInitialization(Module &M) {
  //   * cbrt(sqrt(x))  -> pow(x,1/6)
  //   * cbrt(sqrt(x))  -> pow(x,1/9)
  //
-// cos, cosf, cosl:
-//   * cos(-x)  -> cos(x)
-//
  // exp, expf, expl:
  //   * exp(log(x))  -> x
  //
@@ -2303,10 +2533,8 @@ bool SimplifyLibCalls::doInitialization(Module &M) {
  //   * sqrt(Nroot(x)) -> pow(x,1/(2*N))
  //   * sqrt(pow(x,y)) -> pow(|x|,y*0.5)
  //
-// stpcpy:
-//   * stpcpy(str, "literal") ->
-//           llvm.memcpy(str,"literal",strlen("literal")+1,1)
-//
+// strchr:
+//   * strchr(p, 0) -> p + strlen(p)
+//
  // tan, tanf, tanl:
  //   * tan(atan(x)) -> x
  //