[InstCombine] mark ADD with nuw if no unsigned overflow

author Jingyue Wu <jingyue@google.com>

Tue, 17 Jun 2014 00:42:07 +0000 (00:42 +0000)

committer Jingyue Wu <jingyue@google.com>

Tue, 17 Jun 2014 00:42:07 +0000 (00:42 +0000)
author Jingyue Wu <jingyue@google.com>
Tue, 17 Jun 2014 00:42:07 +0000 (00:42 +0000)
committer Jingyue Wu <jingyue@google.com>
Tue, 17 Jun 2014 00:42:07 +0000 (00:42 +0000)
diff --git a/lib/Transforms/InstCombine/InstCombine.h b/lib/Transforms/InstCombine/InstCombine.h

index ea1839c3bcf8a256ecd83c5733f2da5195eed463..ab4dc1ce23e664cc4898345ec97af86014aa3a0e 100644 (file)
--- a/lib/Transforms/InstCombine/InstCombine.h
+++ b/lib/Transforms/InstCombine/InstCombine.h
@@ -247,6 +247,7 @@ private:
                                   bool DoXform = true);
    Instruction *transformSExtICmp(ICmpInst *ICI, Instruction &CI);
    bool WillNotOverflowSignedAdd(Value *LHS, Value *RHS);
+  bool WillNotOverflowUnsignedAdd(Value *LHS, Value *RHS);
    Value *EmitGEPOffset(User *GEP);
    Instruction *scalarizePHI(ExtractElementInst &EI, PHINode *PN);
    Value *EvaluateInDifferentElementOrder(Value *V, ArrayRef<int> Mask);
diff --git a/lib/Transforms/InstCombine/InstCombineAddSub.cpp b/lib/Transforms/InstCombine/InstCombineAddSub.cpp

index 63c440afcd71eed8a6765c4e41361f1153484286..f6658964ae851f82995180b058bab8aea56d63cf 100644 (file)
--- a/lib/Transforms/InstCombine/InstCombineAddSub.cpp
+++ b/lib/Transforms/InstCombine/InstCombineAddSub.cpp
@@ -965,6 +965,21 @@ bool InstCombiner::WillNotOverflowSignedAdd(Value *LHS, Value *RHS) {
    return false;
  }
  
+/// WillNotOverflowUnsignedAdd - Return true if we can prove that:
+///    (zext (add LHS, RHS))  === (add (zext LHS), (zext RHS))
+bool InstCombiner::WillNotOverflowUnsignedAdd(Value *LHS, Value *RHS) {
+  // There are different heuristics we can use for this. Here is a simple one.
+  // If the sign bit of LHS and that of RHS are both zero, no unsigned wrap.
+  bool LHSKnownNonNegative, LHSKnownNegative;
+  bool RHSKnownNonNegative, RHSKnownNegative;
+  ComputeSignBit(LHS, LHSKnownNonNegative, LHSKnownNegative, DL, 0);
+  ComputeSignBit(RHS, RHSKnownNonNegative, RHSKnownNegative, DL, 0);
+  if (LHSKnownNonNegative && RHSKnownNonNegative)
+    return true;
+
+  return false;
+}
+
  Instruction *InstCombiner::visitAdd(BinaryOperator &I) {
    bool Changed = SimplifyAssociativeOrCommutative(I);
    Value *LHS = I.getOperand(0), *RHS = I.getOperand(1);
@@ -1240,10 +1255,17 @@ Instruction *InstCombiner::visitAdd(BinaryOperator &I) {
        return BinaryOperator::CreateOr(A, B);
    }
  
+  // TODO(jingyue): Consider WillNotOverflowSignedAdd and
+  // WillNotOverflowUnsignedAdd to reduce the number of invocations of
+  // computeKnownBits.
    if (!I.hasNoSignedWrap() && WillNotOverflowSignedAdd(LHS, RHS)) {
      Changed = true;
      I.setHasNoSignedWrap(true);
    }
+  if (!I.hasNoUnsignedWrap() && WillNotOverflowUnsignedAdd(LHS, RHS)) {
+    Changed = true;
+    I.setHasNoUnsignedWrap(true);
+  }
  
    return Changed ? &I : nullptr;
  }
diff --git a/test/Transforms/InstCombine/AddOverFlow.ll b/test/Transforms/InstCombine/AddOverFlow.ll

index 590c65af01fa902339130f5d0331df5639e301ec..70178ec83b6ea5e1b80feb4da3df976cd8a7997a 100644 (file)
--- a/test/Transforms/InstCombine/AddOverFlow.ll
+++ b/test/Transforms/InstCombine/AddOverFlow.ll
@@ -12,6 +12,28 @@ define i16 @oppositesign(i16 %x, i16 %y) {
    ret i16 %c
  }
  
+define i16 @zero_sign_bit(i16 %a) {
+; CHECK-LABEL: @zero_sign_bit(
+; CHECK-NEXT: and
+; CHECK-NEXT: add nuw
+; CHECK-NEXT: ret
+  %1 = and i16 %a, 32767
+  %2 = add i16 %1, 512
+  ret i16 %2
+}
+
+define i16 @zero_sign_bit2(i16 %a, i16 %b) {
+; CHECK-LABEL: @zero_sign_bit2(
+; CHECK-NEXT: and
+; CHECK-NEXT: and
+; CHECK-NEXT: add nuw
+; CHECK-NEXT: ret
+  %1 = and i16 %a, 32767
+  %2 = and i16 %b, 32767
+  %3 = add i16 %1, %2
+  ret i16 %3
+}
+
  ; CHECK-LABEL: @ripple_nsw1
  ; CHECK: add nsw i16 %a, %b
  define i16 @ripple_nsw1(i16 %x, i16 %y) {
@@ -45,7 +67,7 @@ define i32 @ripple_no_nsw1(i32 %x, i32 %y) {
  }
  
  ; CHECK-LABEL: @ripple_no_nsw2
-; CHECK: add i16 %a, %b
+; CHECK: add nuw i16 %a, %b
  define i16 @ripple_no_nsw2(i16 %x, i16 %y) {
  ; %a has at most one bit set
    %a = and i16 %y, 1
diff --git a/test/Transforms/InstCombine/add-sitofp.ll b/test/Transforms/InstCombine/add-sitofp.ll

index 40edf7114a068845703f3e34738a27489630cb18..3b5485e005284ee0684ee8aad03e767cbf4544a1 100644 (file)
--- a/test/Transforms/InstCombine/add-sitofp.ll
+++ b/test/Transforms/InstCombine/add-sitofp.ll
@@ -1,4 +1,4 @@
-; RUN: opt < %s -instcombine -S | grep "add nsw i32"
+; RUN: opt < %s -instcombine -S | grep "add nuw nsw i32"
  
  define double @x(i32 %a, i32 %b) nounwind {
    %m = lshr i32 %a, 24
diff --git a/test/Transforms/InstCombine/ffs-1.ll b/test/Transforms/InstCombine/ffs-1.ll

index 261f488613007691bbb240c4478f4a93e75d8b9b..c8763dc199a97e87687b7d2351ee33122c225e35 100644 (file)
--- a/test/Transforms/InstCombine/ffs-1.ll
+++ b/test/Transforms/InstCombine/ffs-1.ll
@@ -103,7 +103,7 @@ define i32 @test_simplify13(i32 %x) {
  ; CHECK-LABEL: @test_simplify13(
    %ret = call i32 @ffs(i32 %x)
  ; CHECK-NEXT: [[CTTZ:%[a-z0-9]+]] = call i32 @llvm.cttz.i32(i32 %x, i1 false)
-; CHECK-NEXT: [[INC:%[a-z0-9]+]] = add nsw i32 [[CTTZ]], 1
+; CHECK-NEXT: [[INC:%[a-z0-9]+]] = add nuw nsw i32 [[CTTZ]], 1
  ; CHECK-NEXT: [[CMP:%[a-z0-9]+]] = icmp ne i32 %x, 0
  ; CHECK-NEXT: [[RET:%[a-z0-9]+]] = select i1 [[CMP]], i32 [[INC]], i32 0
    ret i32 %ret
@@ -114,7 +114,7 @@ define i32 @test_simplify14(i32 %x) {
  ; CHECK-LINUX-LABEL: @test_simplify14(
    %ret = call i32 @ffsl(i32 %x)
  ; CHECK-LINUX-NEXT: [[CTTZ:%[a-z0-9]+]] = call i32 @llvm.cttz.i32(i32 %x, i1 false)
-; CHECK-LINUX-NEXT: [[INC:%[a-z0-9]+]] = add nsw i32 [[CTTZ]], 1
+; CHECK-LINUX-NEXT: [[INC:%[a-z0-9]+]] = add nuw nsw i32 [[CTTZ]], 1
  ; CHECK-LINUX-NEXT: [[CMP:%[a-z0-9]+]] = icmp ne i32 %x, 0
  ; CHECK-LINUX-NEXT: [[RET:%[a-z0-9]+]] = select i1 [[CMP]], i32 [[INC]], i32 0
    ret i32 %ret
@@ -125,7 +125,7 @@ define i32 @test_simplify15(i64 %x) {
  ; CHECK-LINUX-LABEL: @test_simplify15(
    %ret = call i32 @ffsll(i64 %x)
  ; CHECK-LINUX-NEXT: [[CTTZ:%[a-z0-9]+]] = call i64 @llvm.cttz.i64(i64 %x, i1 false)
-; CHECK-LINUX-NEXT: [[INC:%[a-z0-9]+]] = add nsw i64 [[CTTZ]], 1
+; CHECK-LINUX-NEXT: [[INC:%[a-z0-9]+]] = add nuw nsw i64 [[CTTZ]], 1
  ; CHECK-LINUX-NEXT: [[TRUNC:%[a-z0-9]+]] = trunc i64 [[INC]] to i32
  ; CHECK-LINUX-NEXT: [[CMP:%[a-z0-9]+]] = icmp ne i64 %x, 0
  ; CHECK-LINUX-NEXT: [[RET:%[a-z0-9]+]] = select i1 [[CMP]], i32 [[TRUNC]], i32 0
diff --git a/test/Transforms/InstCombine/select.ll b/test/Transforms/InstCombine/select.ll

index 762a9dad9f156441eeadb65f1cd04ff0a4280706..d625f3b1b33d6fe5993165b8d82b18de6f8b8ddf 100644 (file)
--- a/test/Transforms/InstCombine/select.ll
+++ b/test/Transforms/InstCombine/select.ll
@@ -281,7 +281,7 @@ define i32 @test15i(i32 %X) {
  ; CHECK-NEXT: %t1 = shl i32 %X, 8
  ; CHECK-NEXT: %1 = and i32 %t1, 512
  ; CHECK-NEXT: %2 = xor i32 %1, 512
-; CHECK-NEXT: %3 = add nsw i32 %2, 577
+; CHECK-NEXT: %3 = add nuw nsw i32 %2, 577
  ; CHECK-NEXT: ret i32 %3
  }
  
@@ -294,7 +294,7 @@ define i32 @test15j(i32 %X) {
  ; CHECK-LABEL: @test15j(
  ; CHECK-NEXT: %t1 = shl i32 %X, 8
  ; CHECK-NEXT: %1 = and i32 %t1, 512
-; CHECK-NEXT: %2 = add nsw i32 %1, 577
+; CHECK-NEXT: %2 = add nuw nsw i32 %1, 577
  ; CHECK-NEXT: ret i32 %2
  }
  
@@ -521,7 +521,7 @@ define i32 @test35(i32 %x) {
  ; CHECK-LABEL: @test35(
  ; CHECK: ashr i32 %x, 31
  ; CHECK: and i32 {{.*}}, 40
-; CHECK: add nsw i32 {{.*}}, 60
+; CHECK: add nuw nsw i32 {{.*}}, 60
  ; CHECK: ret
  }
  
@@ -1235,4 +1235,4 @@ define i32 @test75(i32 %x) {
  ; CHECK-NEXT: [[CMP:%[a-z0-9]+]] = icmp ult i32 %x, 68
  ; CHECK-NEXT: [[SEL:%[a-z0-9]+]] = select i1 [[CMP]], i32 68, i32 %x
  ; CHECK-NEXT: ret i32 [[SEL]]
-}
-\ No newline at end of file
+}
author	Jingyue Wu <jingyue@google.com>
	Tue, 17 Jun 2014 00:42:07 +0000 (00:42 +0000)
committer	Jingyue Wu <jingyue@google.com>
	Tue, 17 Jun 2014 00:42:07 +0000 (00:42 +0000)
lib/Transforms/InstCombine/InstCombine.h		patch \| blob \| history
lib/Transforms/InstCombine/InstCombineAddSub.cpp		patch \| blob \| history
test/Transforms/InstCombine/AddOverFlow.ll		patch \| blob \| history
test/Transforms/InstCombine/add-sitofp.ll		patch \| blob \| history
test/Transforms/InstCombine/ffs-1.ll		patch \| blob \| history
test/Transforms/InstCombine/select.ll		patch \| blob \| history