Add in the first iteration of support for llvm/clang/lldb to allow variable per address space pointer sizes to be optimized correctly.

[oota-llvm.git] / lib / Transforms / InstCombine / InstCombineCasts.cpp
diff --git a/lib/Transforms/InstCombine/InstCombineCasts.cpp b/lib/Transforms/InstCombine/InstCombineCasts.cpp

index ba90bf6b5c56b2ca82efbd3f0ba2218eca7cf74d..f3f3f8f585d1a5e33b1861da5fc59758812e530c 100644 (file)
--- a/lib/Transforms/InstCombine/InstCombineCasts.cpp
+++ b/lib/Transforms/InstCombine/InstCombineCasts.cpp
@@ -13,7 +13,8 @@
  
  #include "InstCombine.h"
  #include "llvm/Analysis/ConstantFolding.h"
-#include "llvm/Target/TargetData.h"
+#include "llvm/DataLayout.h"
+#include "llvm/Target/TargetLibraryInfo.h"
  #include "llvm/Support/PatternMatch.h"
  using namespace llvm;
  using namespace PatternMatch;
@@ -33,7 +34,7 @@ static Value *DecomposeSimpleLinearExpr(Value *Val, unsigned &Scale,
    if (BinaryOperator *I = dyn_cast<BinaryOperator>(Val)) {
      // Cannot look past anything that might overflow.
      OverflowingBinaryOperator *OBI = dyn_cast<OverflowingBinaryOperator>(Val);
-    if (OBI && !OBI->hasNoUnsignedWrap()) {
+    if (OBI && !OBI->hasNoUnsignedWrap() && !OBI->hasNoSignedWrap()) {
        Scale = 1;
        Offset = 0;
        return Val;
@@ -77,7 +78,7 @@ static Value *DecomposeSimpleLinearExpr(Value *Val, unsigned &Scale,
  /// try to eliminate the cast by moving the type information into the alloc.
  Instruction *InstCombiner::PromoteCastOfAllocation(BitCastInst &CI,
                                                     AllocaInst &AI) {
-  // This requires TargetData to get the alloca alignment and size information.
+  // This requires DataLayout to get the alloca alignment and size information.
    if (!TD) return 0;
  
    PointerType *PTy = cast<PointerType>(CI.getType());
@@ -122,13 +123,13 @@ Instruction *InstCombiner::PromoteCastOfAllocation(BitCastInst &CI,
    } else {
      Amt = ConstantInt::get(AI.getArraySize()->getType(), Scale);
      // Insert before the alloca, not before the cast.
-    Amt = AllocaBuilder.CreateMul(Amt, NumElements, "tmp");
+    Amt = AllocaBuilder.CreateMul(Amt, NumElements);
    }
    
    if (uint64_t Offset = (AllocElTySize*ArrayOffset)/CastElTySize) {
      Value *Off = ConstantInt::get(AI.getArraySize()->getType(),
                                    Offset, true);
-    Amt = AllocaBuilder.CreateAdd(Amt, Off, "tmp");
+    Amt = AllocaBuilder.CreateAdd(Amt, Off);
    }
    
    AllocaInst *New = AllocaBuilder.CreateAlloca(CastElTy, Amt);
@@ -147,8 +148,6 @@ Instruction *InstCombiner::PromoteCastOfAllocation(BitCastInst &CI,
    return ReplaceInstUsesWith(CI, New);
  }
  
-
-
  /// EvaluateInDifferentType - Given an expression that 
  /// CanEvaluateTruncated or CanEvaluateSExtd returns true for, actually
  /// insert the code to evaluate the expression.
@@ -158,7 +157,7 @@ Value *InstCombiner::EvaluateInDifferentType(Value *V, Type *Ty,
      C = ConstantExpr::getIntegerCast(C, Ty, isSigned /*Sext or ZExt*/);
      // If we got a constantexpr back, try to simplify it with TD info.
      if (ConstantExpr *CE = dyn_cast<ConstantExpr>(C))
-      C = ConstantFoldConstantExpression(CE, TD);
+      C = ConstantFoldConstantExpression(CE, TD, TLI);
      return C;
    }
  
@@ -216,7 +215,6 @@ Value *InstCombiner::EvaluateInDifferentType(Value *V, Type *Ty,
    default: 
      // TODO: Can handle more cases here.
      llvm_unreachable("Unreachable!");
-    break;
    }
    
    Res->takeName(I);
@@ -231,7 +229,7 @@ isEliminableCastPair(
    const CastInst *CI, ///< The first cast instruction
    unsigned opcode,       ///< The opcode of the second cast instruction
    Type *DstTy,     ///< The target type for the second cast instruction
-  TargetData *TD         ///< The target data for pointer size
+  DataLayout *TD         ///< The target data for pointer size
  ) {
  
    Type *SrcTy = CI->getOperand(0)->getType();   // A from above
@@ -457,7 +455,7 @@ Instruction *InstCombiner::visitTrunc(TruncInst &CI) {
    // Canonicalize trunc x to i1 -> (icmp ne (and x, 1), 0), likewise for vector.
    if (DestTy->getScalarSizeInBits() == 1) {
      Constant *One = ConstantInt::get(Src->getType(), 1);
-    Src = Builder->CreateAnd(Src, One, "tmp");
+    Src = Builder->CreateAnd(Src, One);
      Value *Zero = Constant::getNullValue(Src->getType());
      return new ICmpInst(ICmpInst::ICMP_NE, Src, Zero);
    }
@@ -519,7 +517,7 @@ Instruction *InstCombiner::transformZExtICmp(ICmpInst *ICI, Instruction &CI,
                                     In->getType()->getScalarSizeInBits()-1);
        In = Builder->CreateLShr(In, Sh, In->getName()+".lobit");
        if (In->getType() != CI.getType())
-        In = Builder->CreateIntCast(In, CI.getType(), false/*ZExt*/, "tmp");
+        In = Builder->CreateIntCast(In, CI.getType(), false/*ZExt*/);
  
        if (ICI->getPredicate() == ICmpInst::ICMP_SGT) {
          Constant *One = ConstantInt::get(In->getType(), 1);
@@ -528,9 +526,7 @@ Instruction *InstCombiner::transformZExtICmp(ICmpInst *ICI, Instruction &CI,
  
        return ReplaceInstUsesWith(CI, In);
      }
-      
-      
-      
+
      // zext (X == 0) to i32 --> X^1      iff X has only the low bit set.
      // zext (X == 0) to i32 --> (X>>1)^1 iff X has only the 2nd bit set.
      // zext (X == 1) to i32 --> X        iff X has only the low bit set.
@@ -545,8 +541,7 @@ Instruction *InstCombiner::transformZExtICmp(ICmpInst *ICI, Instruction &CI,
        // If Op1C some other power of two, convert:
        uint32_t BitWidth = Op1C->getType()->getBitWidth();
        APInt KnownZero(BitWidth, 0), KnownOne(BitWidth, 0);
-      APInt TypeMask(APInt::getAllOnesValue(BitWidth));
-      ComputeMaskedBits(ICI->getOperand(0), TypeMask, KnownZero, KnownOne);
+      ComputeMaskedBits(ICI->getOperand(0), KnownZero, KnownOne);
          
        APInt KnownZeroMask(~KnownZero);
        if (KnownZeroMask.isPowerOf2()) { // Exactly 1 possible 1?
@@ -573,7 +568,7 @@ Instruction *InstCombiner::transformZExtICmp(ICmpInst *ICI, Instruction &CI,
            
          if ((Op1CV != 0) == isNE) { // Toggle the low bit.
            Constant *One = ConstantInt::get(In->getType(), 1);
-          In = Builder->CreateXor(In, One, "tmp");
+          In = Builder->CreateXor(In, One);
          }
            
          if (CI.getType() == In->getType())
@@ -594,9 +589,8 @@ Instruction *InstCombiner::transformZExtICmp(ICmpInst *ICI, Instruction &CI,
  
        APInt KnownZeroLHS(BitWidth, 0), KnownOneLHS(BitWidth, 0);
        APInt KnownZeroRHS(BitWidth, 0), KnownOneRHS(BitWidth, 0);
-      APInt TypeMask(APInt::getAllOnesValue(BitWidth));
-      ComputeMaskedBits(LHS, TypeMask, KnownZeroLHS, KnownOneLHS);
-      ComputeMaskedBits(RHS, TypeMask, KnownZeroRHS, KnownOneRHS);
+      ComputeMaskedBits(LHS, KnownZeroLHS, KnownOneLHS);
+      ComputeMaskedBits(RHS, KnownZeroRHS, KnownOneRHS);
  
        if (KnownZeroLHS == KnownZeroRHS && KnownOneLHS == KnownOneRHS) {
          APInt KnownBits = KnownZeroLHS | KnownOneLHS;
@@ -654,10 +648,8 @@ static bool CanEvaluateZExtd(Value *V, Type *Ty, unsigned &BitsToClear) {
    if (!I) return false;
    
    // If the input is a truncate from the destination type, we can trivially
-  // eliminate it, even if it has multiple uses.
-  // FIXME: This is currently disabled until codegen can handle this without
-  // pessimizing code, PR5997.
-  if (0 && isa<TruncInst>(I) && I->getOperand(0)->getType() == Ty)
+  // eliminate it.
+  if (isa<TruncInst>(I) && I->getOperand(0)->getType() == Ty)
      return true;
    
    // We can't extend or shrink something that has multiple uses: doing so would
@@ -821,7 +813,7 @@ Instruction *InstCombiner::visitZExt(ZExtInst &CI) {
                                                             AndValue));
      }
      if (SrcSize > DstSize) {
-      Value *Trunc = Builder->CreateTrunc(A, CI.getType(), "tmp");
+      Value *Trunc = Builder->CreateTrunc(A, CI.getType());
        APInt AndValue(APInt::getLowBitsSet(DstSize, MidSize));
        return BinaryOperator::CreateAnd(Trunc, 
                                         ConstantInt::get(Trunc->getType(),
@@ -868,7 +860,7 @@ Instruction *InstCombiner::visitZExt(ZExtInst &CI) {
              Value *TI0 = TI->getOperand(0);
              if (TI0->getType() == CI.getType()) {
                Constant *ZC = ConstantExpr::getZExt(C, CI.getType());
-              Value *NewAnd = Builder->CreateAnd(TI0, ZC, "tmp");
+              Value *NewAnd = Builder->CreateAnd(TI0, ZC);
                return BinaryOperator::CreateXor(NewAnd, ZC);
              }
            }
@@ -901,7 +893,7 @@ Instruction *InstCombiner::transformSExtICmp(ICmpInst *ICI, Instruction &CI) {
                                     Op0->getType()->getScalarSizeInBits()-1);
        Value *In = Builder->CreateAShr(Op0, Sh, Op0->getName()+".lobit");
        if (In->getType() != CI.getType())
-        In = Builder->CreateIntCast(In, CI.getType(), true/*SExt*/, "tmp");
+        In = Builder->CreateIntCast(In, CI.getType(), true/*SExt*/);
  
        if (Pred == ICmpInst::ICMP_SGT)
          In = Builder->CreateNot(In, In->getName()+".not");
@@ -915,8 +907,7 @@ Instruction *InstCombiner::transformSExtICmp(ICmpInst *ICI, Instruction &CI) {
          ICI->isEquality() && (Op1C->isZero() || Op1C->getValue().isPowerOf2())){
        unsigned BitWidth = Op1C->getType()->getBitWidth();
        APInt KnownZero(BitWidth, 0), KnownOne(BitWidth, 0);
-      APInt TypeMask(APInt::getAllOnesValue(BitWidth));
-      ComputeMaskedBits(Op0, TypeMask, KnownZero, KnownOne);
+      ComputeMaskedBits(Op0, KnownZero, KnownOne);
  
        APInt KnownZeroMask(~KnownZero);
        if (KnownZeroMask.isPowerOf2()) {
@@ -999,11 +990,8 @@ static bool CanEvaluateSExtd(Value *V, Type *Ty) {
    Instruction *I = dyn_cast<Instruction>(V);
    if (!I) return false;
    
-  // If this is a truncate from the dest type, we can trivially eliminate it,
-  // even if it has multiple uses.
-  // FIXME: This is currently disabled until codegen can handle this without
-  // pessimizing code, PR5997.
-  if (0 && isa<TruncInst>(I) && I->getOperand(0)->getType() == Ty)
+  // If this is a truncate from the dest type, we can trivially eliminate it.
+  if (isa<TruncInst>(I) && I->getOperand(0)->getType() == Ty)
      return true;
    
    // We can't extend or shrink something that has multiple uses: doing so would
@@ -1163,6 +1151,9 @@ static Value *LookThroughFPExtensions(Value *V) {
    if (ConstantFP *CFP = dyn_cast<ConstantFP>(V)) {
      if (CFP->getType() == Type::getPPC_FP128Ty(V->getContext()))
        return V;  // No constant folding of this.
+    // See if the value can be truncated to half and then reextended.
+    if (Value *V = FitsInFPType(CFP, APFloat::IEEEhalf))
+      return V;
      // See if the value can be truncated to float and then reextended.
      if (Value *V = FitsInFPType(CFP, APFloat::IEEEsingle))
        return V;
@@ -1213,10 +1204,9 @@ Instruction *InstCombiner::visitFPTrunc(FPTruncInst &CI) {
    }
    
    // Fold (fptrunc (sqrt (fpext x))) -> (sqrtf x)
-  // NOTE: This should be disabled by -fno-builtin-sqrt if we ever support it.
    CallInst *Call = dyn_cast<CallInst>(CI.getOperand(0));
-  if (Call && Call->getCalledFunction() &&
-      Call->getCalledFunction()->getName() == "sqrt" &&
+  if (Call && Call->getCalledFunction() && TLI->has(LibFunc::sqrtf) &&
+      Call->getCalledFunction()->getName() == TLI->getName(LibFunc::sqrt) &&
        Call->getNumArgOperands() == 1 &&
        Call->hasOneUse()) {
      CastInst *Arg = dyn_cast<CastInst>(Call->getArgOperand(0));
@@ -1303,17 +1293,18 @@ Instruction *InstCombiner::visitIntToPtr(IntToPtrInst &CI) {
    // If the source integer type is not the intptr_t type for this target, do a
    // trunc or zext to the intptr_t type, then inttoptr of it.  This allows the
    // cast to be exposed to other transforms.
+  unsigned AS = CI.getAddressSpace();
    if (TD) {
      if (CI.getOperand(0)->getType()->getScalarSizeInBits() >
-        TD->getPointerSizeInBits()) {
+        TD->getPointerSizeInBits(AS)) {
        Value *P = Builder->CreateTrunc(CI.getOperand(0),
-                                      TD->getIntPtrType(CI.getContext()), "tmp");
+                                      TD->getIntPtrType(CI.getContext()));
        return new IntToPtrInst(P, CI.getType());
      }
      if (CI.getOperand(0)->getType()->getScalarSizeInBits() <
-        TD->getPointerSizeInBits()) {
+        TD->getPointerSizeInBits(AS)) {
        Value *P = Builder->CreateZExt(CI.getOperand(0),
-                                     TD->getIntPtrType(CI.getContext()), "tmp");
+                                     TD->getIntPtrType(CI.getContext()));
        return new IntToPtrInst(P, CI.getType());
      }
    }
@@ -1346,10 +1337,9 @@ Instruction *InstCombiner::commonPointerCastTransforms(CastInst &CI) {
      // non-type-safe code.
      if (TD && GEP->hasOneUse() && isa<BitCastInst>(GEP->getOperand(0)) &&
          GEP->hasAllConstantIndices()) {
-      // We are guaranteed to get a constant from EmitGEPOffset.
-      ConstantInt *OffsetV = cast<ConstantInt>(EmitGEPOffset(GEP));
-      int64_t Offset = OffsetV->getSExtValue();
-      
+      SmallVector<Value*, 8> Ops(GEP->idx_begin(), GEP->idx_end());
+      int64_t Offset = TD->getIndexedOffset(GEP->getPointerOperandType(), Ops);
+
        // Get the base pointer input of the bitcast, and the type it points to.
        Value *OrigBase = cast<BitCastInst>(GEP->getOperand(0))->getOperand(0);
        Type *GEPIdxTy =
@@ -1379,17 +1369,16 @@ Instruction *InstCombiner::visitPtrToInt(PtrToIntInst &CI) {
    // If the destination integer type is not the intptr_t type for this target,
    // do a ptrtoint to intptr_t then do a trunc or zext.  This allows the cast
    // to be exposed to other transforms.
+  unsigned AS = CI.getPointerAddressSpace();
    if (TD) {
-    if (CI.getType()->getScalarSizeInBits() < TD->getPointerSizeInBits()) {
+    if (CI.getType()->getScalarSizeInBits() < TD->getPointerSizeInBits(AS)) {
        Value *P = Builder->CreatePtrToInt(CI.getOperand(0),
-                                         TD->getIntPtrType(CI.getContext()),
-                                         "tmp");
+                                         TD->getIntPtrType(CI.getContext()));
        return new TruncInst(P, CI.getType());
      }
-    if (CI.getType()->getScalarSizeInBits() > TD->getPointerSizeInBits()) {
+    if (CI.getType()->getScalarSizeInBits() > TD->getPointerSizeInBits(AS)) {
        Value *P = Builder->CreatePtrToInt(CI.getOperand(0),
-                                         TD->getIntPtrType(CI.getContext()),
-                                         "tmp");
+                                         TD->getIntPtrType(CI.getContext()));
        return new ZExtInst(P, CI.getType());
      }
    }
@@ -1425,16 +1414,15 @@ static Instruction *OptimizeVectorResize(Value *InVal, VectorType *DestTy,
    // Now that the element types match, get the shuffle mask and RHS of the
    // shuffle to use, which depends on whether we're increasing or decreasing the
    // size of the input.
-  SmallVector<Constant*, 16> ShuffleMask;
+  SmallVector<uint32_t, 16> ShuffleMask;
    Value *V2;
-  IntegerType *Int32Ty = Type::getInt32Ty(SrcTy->getContext());
    
    if (SrcTy->getNumElements() > DestTy->getNumElements()) {
      // If we're shrinking the number of elements, just shuffle in the low
      // elements from the input and use undef as the second shuffle input.
      V2 = UndefValue::get(SrcTy);
      for (unsigned i = 0, e = DestTy->getNumElements(); i != e; ++i)
-      ShuffleMask.push_back(ConstantInt::get(Int32Ty, i));
+      ShuffleMask.push_back(i);
      
    } else {
      // If we're increasing the number of elements, shuffle in all of the
@@ -1443,14 +1431,16 @@ static Instruction *OptimizeVectorResize(Value *InVal, VectorType *DestTy,
      V2 = Constant::getNullValue(SrcTy);
      unsigned SrcElts = SrcTy->getNumElements();
      for (unsigned i = 0, e = SrcElts; i != e; ++i)
-      ShuffleMask.push_back(ConstantInt::get(Int32Ty, i));
+      ShuffleMask.push_back(i);
  
      // The excess elements reference the first element of the zero input.
-    ShuffleMask.append(DestTy->getNumElements()-SrcElts,
-                       ConstantInt::get(Int32Ty, SrcElts));
+    for (unsigned i = 0, e = DestTy->getNumElements()-SrcElts; i != e; ++i)
+      ShuffleMask.push_back(SrcElts);
    }
    
-  return new ShuffleVectorInst(InVal, V2, ConstantVector::get(ShuffleMask));
+  return new ShuffleVectorInst(InVal, V2,
+                               ConstantDataVector::get(V2->getContext(),
+                                                       ShuffleMask));
  }
  
  static bool isMultipleOfTypeSize(unsigned Value, Type *Ty) {