Make the sqrt intrinsic return undef for a negative input.

author Sanjay Patel <spatel@rotateright.com>

Wed, 1 Oct 2014 20:36:33 +0000 (20:36 +0000)

committer Sanjay Patel <spatel@rotateright.com>

Wed, 1 Oct 2014 20:36:33 +0000 (20:36 +0000)
author Sanjay Patel <spatel@rotateright.com>
Wed, 1 Oct 2014 20:36:33 +0000 (20:36 +0000)
committer Sanjay Patel <spatel@rotateright.com>
Wed, 1 Oct 2014 20:36:33 +0000 (20:36 +0000)
diff --git a/lib/Analysis/ConstantFolding.cpp b/lib/Analysis/ConstantFolding.cpp

index 88e255832f1d2329fba7179cca2d18c75cea9e81..c703491ace22267058010ec067318e0feac9ff9c 100644 (file)
--- a/lib/Analysis/ConstantFolding.cpp
+++ b/lib/Analysis/ConstantFolding.cpp
@@ -1520,8 +1520,14 @@ static Constant *ConstantFoldScalarCall(StringRef Name, unsigned IntrinsicID,
                   (Ty->isHalfTy() || Ty->isFloatTy() || Ty->isDoubleTy())) {
            if (V >= -0.0)
              return ConstantFoldFP(sqrt, V, Ty);
-          else // Undefined
-            return Constant::getNullValue(Ty);
+          else {
+            // Unlike the sqrt definitions in C/C++, POSIX, and IEEE-754 - which
+            // all guarantee or favor returning NaN - the square root of a
+            // negative number is not defined for the LLVM sqrt intrinsic.
+            // This is because the intrinsic should only be emitted in place of
+            // libm's sqrt function when using "no-nans-fp-math".
+            return UndefValue::get(Ty);
+          }
          }
          break;
        case 's':
diff --git a/test/Transforms/InstCombine/constant-fold-math.ll b/test/Transforms/InstCombine/constant-fold-math.ll

index 14377df37299b9d536766a9095fdcd18744e93ec..ce8d337c08bfc97eeef001b5466c88d8125798d2 100644 (file)
--- a/test/Transforms/InstCombine/constant-fold-math.ll
+++ b/test/Transforms/InstCombine/constant-fold-math.ll
@@ -7,6 +7,7 @@ declare <4 x float> @llvm.fma.v4f32(<4 x float>, <4 x float>, <4 x float>) #0
  declare double @llvm.fma.f64(double, double, double) #0
  declare double @llvm.fmuladd.f64(double, double, double) #0
  
+declare double @llvm.sqrt.f64(double) #0
  
  
  ; CHECK-LABEL: @constant_fold_fma_f32
@@ -44,4 +45,12 @@ define double @constant_fold_fmuladd_f64() #0 {
    ret double %x
  }
  
+; The sqrt intrinsic is undefined for negative inputs besides -0.0.
+; CHECK-LABEL: @bad_sqrt
+; CHECK-NEXT: ret double undef
+define double @bad_sqrt() {
+  %x = call double @llvm.sqrt.f64(double -2.000000e+00)
+  ret double %x
+}
+
  attributes #0 = { nounwind readnone }
author	Sanjay Patel <spatel@rotateright.com>
	Wed, 1 Oct 2014 20:36:33 +0000 (20:36 +0000)
committer	Sanjay Patel <spatel@rotateright.com>
	Wed, 1 Oct 2014 20:36:33 +0000 (20:36 +0000)
lib/Analysis/ConstantFolding.cpp		patch \| blob \| history
test/Transforms/InstCombine/constant-fold-math.ll		patch \| blob \| history