When sinking an insn in InstCombine bring its debug

[oota-llvm.git] / lib / Transforms / Scalar / InstructionCombining.cpp
diff --git a/lib/Transforms/Scalar/InstructionCombining.cpp b/lib/Transforms/Scalar/InstructionCombining.cpp

index bca6abc60515e3d64a87d60148e01fbc46192c0b..e0d3ac4d4282ce918c2c0fcb626e4fd0b8563790 100644 (file)
--- a/lib/Transforms/Scalar/InstructionCombining.cpp
+++ b/lib/Transforms/Scalar/InstructionCombining.cpp
@@ -5822,7 +5822,7 @@ Instruction *InstCombiner::visitICmpInst(ICmpInst &I) {
  
    // See if we are doing a comparison with a constant.
    if (ConstantInt *CI = dyn_cast<ConstantInt>(Op1)) {
-    Value *A, *B;
+    Value *A = 0, *B = 0;
      
      // (icmp ne/eq (sub A B) 0) -> (icmp ne/eq A, B)
      if (I.isEquality() && CI->isNullValue() &&
@@ -7031,7 +7031,12 @@ Instruction *InstCombiner::visitAShr(BinaryOperator &I) {
        MaskedValueIsZero(Op0,
                        APInt::getSignBit(I.getType()->getPrimitiveSizeInBits())))
      return BinaryOperator::CreateLShr(Op0, I.getOperand(1));
-  
+
+  // Arithmetic shifting an all-sign-bit value is a no-op.
+  unsigned NumSignBits = ComputeNumSignBits(Op0);
+  if (NumSignBits == Op0->getType()->getPrimitiveSizeInBits())
+    return ReplaceInstUsesWith(I, Op0);
+
    return 0;
  }
  
@@ -9286,7 +9291,7 @@ unsigned InstCombiner::GetOrEnforceKnownAlignment(Value *V,
  
  Instruction *InstCombiner::SimplifyMemTransfer(MemIntrinsic *MI) {
    unsigned DstAlign = GetOrEnforceKnownAlignment(MI->getOperand(1));
-  unsigned SrcAlign = GetOrEnforceKnownAlignment(MI->getOperand(2), DstAlign);
+  unsigned SrcAlign = GetOrEnforceKnownAlignment(MI->getOperand(2));
    unsigned MinAlign = std::min(DstAlign, SrcAlign);
    unsigned CopyAlign = MI->getAlignment()->getZExtValue();
  
@@ -10180,6 +10185,9 @@ Instruction *InstCombiner::FoldPHIArgGEPIntoPHI(PHINode &PN) {
    
    SmallVector<Value*, 16> FixedOperands(FirstInst->op_begin(), 
                                          FirstInst->op_end());
+  // This is true if all GEP bases are allocas and if all indices into them are
+  // constants.
+  bool AllBasePointersAreAllocas = true;
    
    // Scan to see if all operands are the same opcode, all have one use, and all
    // kill their operands (i.e. the operands have one use).
@@ -10189,6 +10197,12 @@ Instruction *InstCombiner::FoldPHIArgGEPIntoPHI(PHINode &PN) {
        GEP->getNumOperands() != FirstInst->getNumOperands())
        return 0;
  
+    // Keep track of whether or not all GEPs are of alloca pointers.
+    if (AllBasePointersAreAllocas &&
+        (!isa<AllocaInst>(GEP->getOperand(0)) ||
+         !GEP->hasAllConstantIndices()))
+      AllBasePointersAreAllocas = false;
+    
      // Compare the operand lists.
      for (unsigned op = 0, e = FirstInst->getNumOperands(); op != e; ++op) {
        if (FirstInst->getOperand(op) == GEP->getOperand(op))
@@ -10209,6 +10223,15 @@ Instruction *InstCombiner::FoldPHIArgGEPIntoPHI(PHINode &PN) {
      }
    }
    
+  // If all of the base pointers of the PHI'd GEPs are from allocas, don't
+  // bother doing this transformation.  At best, this will just save a bit of
+  // offset calculation, but all the predecessors will have to materialize the
+  // stack address into a register anyway.  We'd actually rather *clone* the
+  // load up into the predecessors so that we have a load of a gep of an alloca,
+  // which can usually all be folded into the load.
+  if (AllBasePointersAreAllocas)
+    return 0;
+  
    // Otherwise, this is safe to transform.  Insert PHI nodes for each operand
    // that is variable.
    SmallVector<PHINode*, 16> OperandPhis(FixedOperands.size());
@@ -10247,15 +10270,15 @@ Instruction *InstCombiner::FoldPHIArgGEPIntoPHI(PHINode &PN) {
  }
  
  
-/// isSafeToSinkLoad - Return true if we know that it is safe sink the load out
-/// of the block that defines it.  This means that it must be obvious the value
-/// of the load is not changed from the point of the load to the end of the
-/// block it is in.
+/// isSafeAndProfitableToSinkLoad - Return true if we know that it is safe to
+/// sink the load out of the block that defines it.  This means that it must be
+/// obvious the value of the load is not changed from the point of the load to
+/// the end of the block it is in.
  ///
  /// Finally, it is safe, but not profitable, to sink a load targetting a
  /// non-address-taken alloca.  Doing so will cause us to not promote the alloca
  /// to a register.
-static bool isSafeToSinkLoad(LoadInst *L) {
+static bool isSafeAndProfitableToSinkLoad(LoadInst *L) {
    BasicBlock::iterator BBI = L, E = L->getParent()->end();
    
    for (++BBI; BBI != E; ++BBI)
@@ -10277,10 +10300,20 @@ static bool isSafeToSinkLoad(LoadInst *L) {
        break;
      }
      
-    if (!isAddressTaken)
+    if (!isAddressTaken && AI->isStaticAlloca())
        return false;
    }
    
+  // If this load is a load from a GEP with a constant offset from an alloca,
+  // then we don't want to sink it.  In its present form, it will be
+  // load [constant stack offset].  Sinking it will cause us to have to
+  // materialize the stack addresses in each predecessor in a register only to
+  // do a shared load from register in the successor.
+  if (GetElementPtrInst *GEP = dyn_cast<GetElementPtrInst>(L->getOperand(0)))
+    if (AllocaInst *AI = dyn_cast<AllocaInst>(GEP->getOperand(0)))
+      if (AI->isStaticAlloca() && GEP->hasAllConstantIndices())
+        return false;
+  
    return true;
  }
  
@@ -10311,7 +10344,7 @@ Instruction *InstCombiner::FoldPHIArgOpIntoPHI(PHINode &PN) {
      // We can't sink the load if the loaded value could be modified between the
      // load and the PHI.
      if (LI->getParent() != PN.getIncomingBlock(0) ||
-        !isSafeToSinkLoad(LI))
+        !isSafeAndProfitableToSinkLoad(LI))
        return 0;
      
      // If the PHI is of volatile loads and the load block has multiple
@@ -10341,7 +10374,7 @@ Instruction *InstCombiner::FoldPHIArgOpIntoPHI(PHINode &PN) {
        // the load and the PHI.
        if (LI->isVolatile() != isVolatile ||
            LI->getParent() != PN.getIncomingBlock(i) ||
-          !isSafeToSinkLoad(LI))
+          !isSafeAndProfitableToSinkLoad(LI))
          return 0;
        
        // If the PHI is of volatile loads and the load block has multiple
@@ -10350,7 +10383,6 @@ Instruction *InstCombiner::FoldPHIArgOpIntoPHI(PHINode &PN) {
        if (isVolatile &&
            LI->getParent()->getTerminator()->getNumSuccessors() != 1)
          return 0;
-
        
      } else if (I->getOperand(1) != ConstantOp) {
        return 0;
@@ -10734,15 +10766,25 @@ Instruction *InstCombiner::visitGetElementPtrInst(GetElementPtrInst &GEP) {
        // transform: GEP (bitcast [10 x i8]* X to [0 x i8]*), i32 0, ...
        // into     : GEP [10 x i8]* X, i32 0, ...
        //
+      // Likewise, transform: GEP (bitcast i8* X to [0 x i8]*), i32 0, ...
+      //           into     : GEP i8* X, ...
+      // 
        // This occurs when the program declares an array extern like "int X[];"
-      //
        const PointerType *CPTy = cast<PointerType>(PtrOp->getType());
        const PointerType *XTy = cast<PointerType>(X->getType());
-      if (const ArrayType *XATy =
-          dyn_cast<ArrayType>(XTy->getElementType()))
-        if (const ArrayType *CATy =
-            dyn_cast<ArrayType>(CPTy->getElementType()))
+      if (const ArrayType *CATy =
+          dyn_cast<ArrayType>(CPTy->getElementType())) {
+        // GEP (bitcast i8* X to [0 x i8]*), i32 0, ... ?
+        if (CATy->getElementType() == XTy->getElementType()) {
+          // -> GEP i8* X, ...
+          SmallVector<Value*, 8> Indices(GEP.idx_begin()+1, GEP.idx_end());
+          return GetElementPtrInst::Create(X, Indices.begin(), Indices.end(),
+                                           GEP.getName());
+        } else if (const ArrayType *XATy =
+                 dyn_cast<ArrayType>(XTy->getElementType())) {
+          // GEP (bitcast [10 x i8]* X to [0 x i8]*), i32 0, ... ?
            if (CATy->getElementType() == XATy->getElementType()) {
+            // -> GEP [10 x i8]* X, i32 0, ...
              // At this point, we know that the cast source type is a pointer
              // to an array of the same type as the destination pointer
              // array.  Because the array type is never stepped over (there
@@ -10750,6 +10792,8 @@ Instruction *InstCombiner::visitGetElementPtrInst(GetElementPtrInst &GEP) {
              GEP.setOperand(0, X);
              return &GEP;
            }
+        }
+      }
      } else if (GEP.getNumOperands() == 2) {
        // Transform things like:
        // %t = getelementptr i32* bitcast ([2 x i32]* %str to i32*), i32 %V
@@ -10805,7 +10849,7 @@ Instruction *InstCombiner::visitGetElementPtrInst(GetElementPtrInst &GEP) {
          // out, perform the transformation. Note, we don't know whether Scale is
          // signed or not. We'll use unsigned version of division/modulo
          // operation after making sure Scale doesn't have the sign bit set.
-        if (Scale && Scale->getSExtValue() >= 0LL &&
+        if (ArrayEltSize && Scale && Scale->getSExtValue() >= 0LL &&
              Scale->getZExtValue() % ArrayEltSize == 0) {
            Scale = ConstantInt::get(Scale->getType(),
                                     Scale->getZExtValue() / ArrayEltSize);
@@ -11001,12 +11045,12 @@ static Instruction *InstCombineLoadCast(InstCombiner &IC, LoadInst &LI,
          APInt SingleChar(numBits, 0);
          if (TD->isLittleEndian()) {
            for (signed i = len-1; i >= 0; i--) {
-            SingleChar = (uint64_t) Str[i];
+            SingleChar = (uint64_t) Str[i] & UCHAR_MAX;
              StrVal = (StrVal << 8) | SingleChar;
            }
          } else {
            for (unsigned i = 0; i < len; i++) {
-            SingleChar = (uint64_t) Str[i];
+            SingleChar = (uint64_t) Str[i] & UCHAR_MAX;
              StrVal = (StrVal << 8) | SingleChar;
            }
            // Append NULL at the end.
@@ -12330,6 +12374,7 @@ static bool TryToSinkInstruction(Instruction *I, BasicBlock *DestBlock) {
  
    BasicBlock::iterator InsertPos = DestBlock->getFirstNonPHI();
  
+  CopyPrecedingStopPoint(I, InsertPos);
    I->moveBefore(InsertPos);
    ++NumSunkInst;
    return true;
@@ -12392,6 +12437,8 @@ static void AddReachableCodeToWorklist(BasicBlock *BB,
            DBI_Prev->eraseFromParent();
          }
          DBI_Prev = DBI_Next;
+      } else {
+        DBI_Prev = 0;
        }
  
        IC.AddToWorkList(Inst);