Teach SimplifyDemandedBits how to look through fpext and fptrunc to simplify their...

author Pete Cooper <peter_cooper@apple.com>

Thu, 26 Jul 2012 22:37:04 +0000 (22:37 +0000)

committer Pete Cooper <peter_cooper@apple.com>

Thu, 26 Jul 2012 22:37:04 +0000 (22:37 +0000)
author Pete Cooper <peter_cooper@apple.com>
Thu, 26 Jul 2012 22:37:04 +0000 (22:37 +0000)
committer Pete Cooper <peter_cooper@apple.com>
Thu, 26 Jul 2012 22:37:04 +0000 (22:37 +0000)
diff --git a/lib/Transforms/InstCombine/InstCombineSimplifyDemanded.cpp b/lib/Transforms/InstCombine/InstCombineSimplifyDemanded.cpp

index 125c74a89a119e458c2c9605ef25c33acc6091c8..46ba83b6513661a13072fec3df5e9e33eaad8040 100644 (file)
--- a/lib/Transforms/InstCombine/InstCombineSimplifyDemanded.cpp
+++ b/lib/Transforms/InstCombine/InstCombineSimplifyDemanded.cpp
@@ -1074,6 +1074,12 @@ Value *InstCombiner::SimplifyDemandedVectorElts(Value *V, APInt DemandedElts,
      // like undef&0.  The result is known zero, not undef.
      UndefElts &= UndefElts2;
      break;
+  case Instruction::FPTrunc:
+  case Instruction::FPExt:
+    TmpV = SimplifyDemandedVectorElts(I->getOperand(0), DemandedElts,
+                                      UndefElts, Depth+1);
+    if (TmpV) { I->setOperand(0, TmpV); MadeChange = true; }
+    break;
      
    case Instruction::Call: {
      IntrinsicInst *II = dyn_cast<IntrinsicInst>(I);
diff --git a/test/Transforms/InstCombine/vec_demanded_elts.ll b/test/Transforms/InstCombine/vec_demanded_elts.ll

index cc63371eded671103dfa9154e16ece7a193d136e..d904196d13b010d71199e455c703c33603c9833f 100644 (file)
--- a/test/Transforms/InstCombine/vec_demanded_elts.ll
+++ b/test/Transforms/InstCombine/vec_demanded_elts.ll
@@ -162,4 +162,32 @@ entry:
    ret <4 x float> %shuffle9.i
  }
  
+define <2 x float> @test_fptrunc(double %f) {
+; CHECK: @test_fptrunc
+; CHECK: insertelement
+; CHECK: insertelement
+; CHECK-NOT: insertelement
+  %tmp9 = insertelement <4 x double> undef, double %f, i32 0
+  %tmp10 = insertelement <4 x double> %tmp9, double 0.000000e+00, i32 1
+  %tmp11 = insertelement <4 x double> %tmp10, double 0.000000e+00, i32 2
+  %tmp12 = insertelement <4 x double> %tmp11, double 0.000000e+00, i32 3
+  %tmp5 = fptrunc <4 x double> %tmp12 to <4 x float>
+  %ret = shufflevector <4 x float> %tmp5, <4 x float> undef, <2 x i32> <i32 0, i32 1>
+  ret <2 x float> %ret
+}
+
+define <2 x double> @test_fpext(float %f) {
+; CHECK: @test_fpext
+; CHECK: insertelement
+; CHECK: insertelement
+; CHECK-NOT: insertelement
+  %tmp9 = insertelement <4 x float> undef, float %f, i32 0
+  %tmp10 = insertelement <4 x float> %tmp9, float 0.000000e+00, i32 1
+  %tmp11 = insertelement <4 x float> %tmp10, float 0.000000e+00, i32 2
+  %tmp12 = insertelement <4 x float> %tmp11, float 0.000000e+00, i32 3
+  %tmp5 = fpext <4 x float> %tmp12 to <4 x double>
+  %ret = shufflevector <4 x double> %tmp5, <4 x double> undef, <2 x i32> <i32 0, i32 1>
+  ret <2 x double> %ret
+}
+
author	Pete Cooper <peter_cooper@apple.com>
	Thu, 26 Jul 2012 22:37:04 +0000 (22:37 +0000)
committer	Pete Cooper <peter_cooper@apple.com>
	Thu, 26 Jul 2012 22:37:04 +0000 (22:37 +0000)
lib/Transforms/InstCombine/InstCombineSimplifyDemanded.cpp		patch | blob | history
test/Transforms/InstCombine/vec_demanded_elts.ll		patch | blob | history