InstCombine: Don't assume that m_ZExt matches an Instruction

[oota-llvm.git] / lib / Transforms / InstCombine / InstCombineCompares.cpp
diff --git a/lib/Transforms/InstCombine/InstCombineCompares.cpp b/lib/Transforms/InstCombine/InstCombineCompares.cpp

index 4cf836c03b213795355d623300e6a8a090dfe2b5..f7eb16cbb96dd5f985f0103db2db646176e2d4b8 100644 (file)
--- a/lib/Transforms/InstCombine/InstCombineCompares.cpp
+++ b/lib/Transforms/InstCombine/InstCombineCompares.cpp
@@ -740,21 +740,6 @@ Instruction *InstCombiner::FoldGEPICmp(GEPOperator *GEPLHS, Value *RHS,
  Instruction *InstCombiner::FoldICmpAddOpCst(Instruction &ICI,
                                              Value *X, ConstantInt *CI,
                                              ICmpInst::Predicate Pred) {
-  // If we have X+0, exit early (simplifying logic below) and let it get folded
-  // elsewhere.   icmp X+0, X  -> icmp X, X
-  if (CI->isZero()) {
-    bool isTrue = ICmpInst::isTrueWhenEqual(Pred);
-    return ReplaceInstUsesWith(ICI, ConstantInt::get(ICI.getType(), isTrue));
-  }
-
-  // (X+4) == X -> false.
-  if (Pred == ICmpInst::ICMP_EQ)
-    return ReplaceInstUsesWith(ICI, Builder->getFalse());
-
-  // (X+4) != X -> true.
-  if (Pred == ICmpInst::ICMP_NE)
-    return ReplaceInstUsesWith(ICI, Builder->getTrue());
-
    // From this point on, we know that (X+C <= X) --> (X+C < X) because C != 0,
    // so the values can never be equal.  Similarly for all other "or equals"
    // operators.
@@ -1067,62 +1052,83 @@ Instruction *InstCombiner::FoldICmpCstShrCst(ICmpInst &I, Value *Op, Value *A,
    APInt AP1 = CI1->getValue();
    APInt AP2 = CI2->getValue();
  
-  if (!AP1) {
-    if (!AP2) {
-      // Both Constants are 0.
-      return getConstant(true);
-    }
-
-    if (cast<BinaryOperator>(Op)->isExact())
-      return getConstant(false);
-
-    if (AP2.isNegative()) {
-      // MSB is set, so a lshr with a large enough 'A' would be undefined.
-      return getConstant(false);
-    }
+  // Don't bother doing any work for cases which InstSimplify handles.
+  if (AP2 == 0)
+    return nullptr;
+  bool IsAShr = isa<AShrOperator>(Op);
+  if (IsAShr) {
+    if (AP2.isAllOnesValue())
+      return nullptr;
+    if (AP2.isNegative() != AP1.isNegative())
+      return nullptr;
+    if (AP2.sgt(AP1))
+      return nullptr;
+  }
  
+  if (!AP1)
      // 'A' must be large enough to shift out the highest set bit.
      return getICmp(I.ICMP_UGT, A,
                     ConstantInt::get(A->getType(), AP2.logBase2()));
-  }
  
-  if (!AP2) {
-    // Shifting 0 by any value gives 0.
-    return getConstant(false);
-  }
-
-  bool IsAShr = isa<AShrOperator>(Op);
-  if (AP1 == AP2) {
-    if (AP1.isAllOnesValue() && IsAShr) {
-      // Arithmatic shift of -1 is always -1.
-      return getConstant(true);
-    }
+  if (AP1 == AP2)
      return getICmp(I.ICMP_EQ, A, ConstantInt::getNullValue(A->getType()));
-  }
  
-  if (IsAShr) {
-    if (AP1.isNegative() != AP2.isNegative()) {
-      // Arithmetic shift will never change the sign.
-      return getConstant(false);
-    }
-    // Both the constants are negative, take their positive to calculate
-    // log.
-    if (AP1.isNegative()) {
-      AP1 = -AP1;
-      AP2 = -AP2;
-    }
-  }
+  // Get the distance between the highest bit that's set.
+  int Shift;
+  // If both constants are negative, measure the distance on their complements.
+  if (IsAShr && AP1.isNegative())
+    // Get the ones' complement of AP2 and AP1 when computing the distance.
+    Shift = (~AP2).logBase2() - (~AP1).logBase2();
+  else
+    Shift = AP2.logBase2() - AP1.logBase2();
  
-  if (AP1.ugt(AP2)) {
-    // Right-shifting will not increase the value.
-    return getConstant(false);
+  if (Shift > 0) {
+    if (IsAShr ? AP1 == AP2.ashr(Shift) : AP1 == AP2.lshr(Shift))
+      return getICmp(I.ICMP_EQ, A, ConstantInt::get(A->getType(), Shift));
    }
+  // Shifting const2 will never be equal to const1.
+  return getConstant(false);
+}
  
-  // Get the distance between the highest bit that's set.
-  int Shift = AP2.logBase2() - AP1.logBase2();
+/// FoldICmpCstShlCst - Handle "(icmp eq/ne (shl const2, A), const1)" ->
+/// (icmp eq/ne A, TrailingZeros(const1) - TrailingZeros(const2)).
+Instruction *InstCombiner::FoldICmpCstShlCst(ICmpInst &I, Value *Op, Value *A,
+                                             ConstantInt *CI1,
+                                             ConstantInt *CI2) {
+  assert(I.isEquality() && "Cannot fold icmp gt/lt");
+
+  auto getConstant = [&I, this](bool IsTrue) {
+    if (I.getPredicate() == I.ICMP_NE)
+      IsTrue = !IsTrue;
+    return ReplaceInstUsesWith(I, ConstantInt::get(I.getType(), IsTrue));
+  };
+
+  auto getICmp = [&I](CmpInst::Predicate Pred, Value *LHS, Value *RHS) {
+    if (I.getPredicate() == I.ICMP_NE)
+      Pred = CmpInst::getInversePredicate(Pred);
+    return new ICmpInst(Pred, LHS, RHS);
+  };
  
-  // Use lshr here, since we've canonicalized to +ve numbers.
-  if (AP1 == AP2.lshr(Shift))
+  APInt AP1 = CI1->getValue();
+  APInt AP2 = CI2->getValue();
+
+  // Don't bother doing any work for cases which InstSimplify handles.
+  if (AP2 == 0)
+    return nullptr;
+
+  unsigned AP2TrailingZeros = AP2.countTrailingZeros();
+
+  if (!AP1 && AP2TrailingZeros != 0)
+    return getICmp(I.ICMP_UGE, A,
+                   ConstantInt::get(A->getType(), AP2.getBitWidth() - AP2TrailingZeros));
+
+  if (AP1 == AP2)
+    return getICmp(I.ICMP_EQ, A, ConstantInt::getNullValue(A->getType()));
+
+  // Get the distance between the lowest bits that are set.
+  int Shift = AP1.countTrailingZeros() - AP2TrailingZeros;
+
+  if (Shift > 0 && AP2.shl(Shift) == AP1)
      return getICmp(I.ICMP_EQ, A, ConstantInt::get(A->getType(), Shift));
  
    // Shifting const2 will never be equal to const1.
@@ -1144,7 +1150,7 @@ Instruction *InstCombiner::visitICmpInstWithInstAndIntCst(ICmpInst &ICI,
        unsigned DstBits = LHSI->getType()->getPrimitiveSizeInBits(),
               SrcBits = LHSI->getOperand(0)->getType()->getPrimitiveSizeInBits();
        APInt KnownZero(SrcBits, 0), KnownOne(SrcBits, 0);
-      computeKnownBits(LHSI->getOperand(0), KnownZero, KnownOne);
+      computeKnownBits(LHSI->getOperand(0), KnownZero, KnownOne, 0, &ICI);
  
        // If all the high bits are known, we can do this xform.
        if ((KnownZero|KnownOne).countLeadingOnes() >= SrcBits-DstBits) {
@@ -1503,16 +1509,10 @@ Instruction *InstCombiner::visitICmpInstWithInstAndIntCst(ICmpInst &ICI,
            unsigned RHSLog2 = RHSV.logBase2();
  
            // (1 << X) >= 2147483648 -> X >= 31 -> X == 31
-          // (1 << X) >  2147483648 -> X >  31 -> false
-          // (1 << X) <= 2147483648 -> X <= 31 -> true
            // (1 << X) <  2147483648 -> X <  31 -> X != 31
            if (RHSLog2 == TypeBits-1) {
              if (Pred == ICmpInst::ICMP_UGE)
                Pred = ICmpInst::ICMP_EQ;
-            else if (Pred == ICmpInst::ICMP_UGT)
-              return ReplaceInstUsesWith(ICI, Builder->getFalse());
-            else if (Pred == ICmpInst::ICMP_ULE)
-              return ReplaceInstUsesWith(ICI, Builder->getTrue());
              else if (Pred == ICmpInst::ICMP_ULT)
                Pred = ICmpInst::ICMP_NE;
            }
@@ -1547,10 +1547,6 @@ Instruction *InstCombiner::visitICmpInstWithInstAndIntCst(ICmpInst &ICI,
            if (RHSVIsPowerOf2)
              return new ICmpInst(
                  Pred, X, ConstantInt::get(RHS->getType(), RHSV.logBase2()));
-
-          return ReplaceInstUsesWith(
-              ICI, Pred == ICmpInst::ICMP_EQ ? Builder->getFalse()
-                                             : Builder->getTrue());
          }
        }
        break;
@@ -2058,8 +2054,8 @@ static Instruction *ProcessUGT_ADDCST_ADD(ICmpInst &I, Value *A, Value *B,
    // sign-extended; check for that condition. For example, if CI2 is 2^31 and
    // the operands of the add are 64 bits wide, we need at least 33 sign bits.
    unsigned NeededSignBits = CI1->getBitWidth() - NewWidth + 1;
-  if (IC.ComputeNumSignBits(A) < NeededSignBits ||
-      IC.ComputeNumSignBits(B) < NeededSignBits)
+  if (IC.ComputeNumSignBits(A, 0, &I) < NeededSignBits ||
+      IC.ComputeNumSignBits(B, 0, &I) < NeededSignBits)
      return nullptr;
  
    // In order to replace the original add with a narrower
@@ -2164,8 +2160,8 @@ static Instruction *ProcessUMulZExtIdiom(ICmpInst &I, Value *MulVal,
    Instruction *MulInstr = cast<Instruction>(MulVal);
    assert(MulInstr->getOpcode() == Instruction::Mul);
  
-  Instruction *LHS = cast<Instruction>(MulInstr->getOperand(0)),
-              *RHS = cast<Instruction>(MulInstr->getOperand(1));
+  auto *LHS = cast<ZExtOperator>(MulInstr->getOperand(0)),
+       *RHS = cast<ZExtOperator>(MulInstr->getOperand(1));
    assert(LHS->getOpcode() == Instruction::ZExt);
    assert(RHS->getOpcode() == Instruction::ZExt);
    Value *A = LHS->getOperand(0), *B = RHS->getOperand(0);
@@ -2467,7 +2463,7 @@ Instruction *InstCombiner::visitICmpInst(ICmpInst &I) {
      Changed = true;
    }
  
-  if (Value *V = SimplifyICmpInst(I.getPredicate(), Op0, Op1, DL))
+  if (Value *V = SimplifyICmpInst(I.getPredicate(), Op0, Op1, DL, TLI, DT, AT))
      return ReplaceInstUsesWith(I, V);
  
    // comparing -val or val with non-zero is the same as just comparing val
@@ -2595,12 +2591,18 @@ Instruction *InstCombiner::visitICmpInst(ICmpInst &I) {
                            Builder->getInt(CI->getValue()-1));
      }
  
-    // (icmp eq/ne (ashr/lshr const2, A), const1)
      if (I.isEquality()) {
        ConstantInt *CI2;
        if (match(Op0, m_AShr(m_ConstantInt(CI2), m_Value(A))) ||
            match(Op0, m_LShr(m_ConstantInt(CI2), m_Value(A)))) {
-        return FoldICmpCstShrCst(I, Op0, A, CI, CI2);
+        // (icmp eq/ne (ashr/lshr const2, A), const1)
+        if (Instruction *Inst = FoldICmpCstShrCst(I, Op0, A, CI, CI2))
+          return Inst;
+      }
+      if (match(Op0, m_Shl(m_ConstantInt(CI2), m_Value(A)))) {
+        // (icmp eq/ne (shl const2, A), const1)
+        if (Instruction *Inst = FoldICmpCstShlCst(I, Op0, A, CI, CI2))
+          return Inst;
        }
      }
  
@@ -3013,6 +3015,12 @@ Instruction *InstCombiner::visitICmpInst(ICmpInst &I) {
      if (BO1 && BO1->getOpcode() == Instruction::Add)
        C = BO1->getOperand(0), D = BO1->getOperand(1);
  
+    // icmp (X+cst) < 0 --> X < -cst
+    if (NoOp0WrapProblem && ICmpInst::isSigned(Pred) && match(Op1, m_Zero()))
+      if (ConstantInt *RHSC = dyn_cast_or_null<ConstantInt>(B))
+        if (!RHSC->isMinValue(/*isSigned=*/true))
+          return new ICmpInst(Pred, A, ConstantExpr::getNeg(RHSC));
+
      // icmp (X+Y), X -> icmp Y, 0 for equalities or if there is no overflow.
      if ((A == Op1 || B == Op1) && NoOp0WrapProblem)
        return new ICmpInst(Pred, A == Op1 ? B : A,
@@ -3247,7 +3255,9 @@ Instruction *InstCombiner::visitICmpInst(ICmpInst &I) {
      // and       (A & ~B) != 0 --> (A & B) == 0
      // if A is a power of 2.
      if (match(Op0, m_And(m_Value(A), m_Not(m_Value(B)))) &&
-        match(Op1, m_Zero()) && isKnownToBeAPowerOfTwo(A) && I.isEquality())
+        match(Op1, m_Zero()) && isKnownToBeAPowerOfTwo(A, false,
+                                                       0, AT, &I, DT) &&
+                                I.isEquality())
        return new ICmpInst(I.getInversePredicate(),
                            Builder->CreateAnd(A, B),
                            Op1);
@@ -3637,7 +3647,7 @@ Instruction *InstCombiner::visitFCmpInst(FCmpInst &I) {
  
    Value *Op0 = I.getOperand(0), *Op1 = I.getOperand(1);
  
-  if (Value *V = SimplifyFCmpInst(I.getPredicate(), Op0, Op1, DL))
+  if (Value *V = SimplifyFCmpInst(I.getPredicate(), Op0, Op1, DL, TLI, DT, AT))
      return ReplaceInstUsesWith(I, V);
  
    // Simplify 'fcmp pred X, X'