Split the init.trampoline intrinsic, which currently combines GCC's

[oota-llvm.git] / lib / CodeGen / SelectionDAG / SelectionDAG.cpp
diff --git a/lib/CodeGen/SelectionDAG/SelectionDAG.cpp b/lib/CodeGen/SelectionDAG/SelectionDAG.cpp

index 019c9feb993d8d03909cdd098c35172bdade12bd..ec7bfbe495ca36fbbebc5c8cb8ab902f07b4aeba 100644 (file)
--- a/lib/CodeGen/SelectionDAG/SelectionDAG.cpp
+++ b/lib/CodeGen/SelectionDAG/SelectionDAG.cpp
@@ -31,7 +31,6 @@
  #include "llvm/CodeGen/PseudoSourceValue.h"
  #include "llvm/Target/TargetRegisterInfo.h"
  #include "llvm/Target/TargetData.h"
-#include "llvm/Target/TargetFrameInfo.h"
  #include "llvm/Target/TargetLowering.h"
  #include "llvm/Target/TargetSelectionDAGInfo.h"
  #include "llvm/Target/TargetOptions.h"
@@ -433,7 +432,9 @@ static void AddNodeIDCustom(FoldingSetNodeID &ID, const SDNode *N) {
    case ISD::ATOMIC_LOAD_MIN:
    case ISD::ATOMIC_LOAD_MAX:
    case ISD::ATOMIC_LOAD_UMIN:
-  case ISD::ATOMIC_LOAD_UMAX: {
+  case ISD::ATOMIC_LOAD_UMAX:
+  case ISD::ATOMIC_LOAD:
+  case ISD::ATOMIC_STORE: {
      const AtomicSDNode *AT = cast<AtomicSDNode>(N);
      ID.AddInteger(AT->getMemoryVT().getRawBits());
      ID.AddInteger(AT->getRawSubclassData());
@@ -491,7 +492,7 @@ encodeMemSDNodeFlags(int ConvType, ISD::MemIndexedMode AM, bool isVolatile,
  
  /// doNotCSE - Return true if CSE should not be performed for this node.
  static bool doNotCSE(SDNode *N) {
-  if (N->getValueType(0) == MVT::Flag)
+  if (N->getValueType(0) == MVT::Glue)
      return true; // Never CSE anything that produces a flag.
  
    switch (N->getOpcode()) {
@@ -503,7 +504,7 @@ static bool doNotCSE(SDNode *N) {
  
    // Check that remaining values produced are not flags.
    for (unsigned i = 1, e = N->getNumValues(); i != e; ++i)
-    if (N->getValueType(i) == MVT::Flag)
+    if (N->getValueType(i) == MVT::Glue)
        return true; // Never CSE anything that produces a flag.
  
    return false;
@@ -599,7 +600,7 @@ void SelectionDAG::DeallocateNode(SDNode *N) {
    Ordering->remove(N);
  
    // If any of the SDDbgValue nodes refer to this SDNode, invalidate them.
-  SmallVector<SDDbgValue*, 2> &DbgVals = DbgInfo->getSDDbgValues(N);
+  ArrayRef<SDDbgValue*> DbgVals = DbgInfo->getSDDbgValues(N);
    for (unsigned i = 0, e = DbgVals.size(); i != e; ++i)
      DbgVals[i]->setIsInvalidated();
  }
@@ -649,7 +650,7 @@ bool SelectionDAG::RemoveNodeFromCSEMaps(SDNode *N) {
    // Verify that the node was actually in one of the CSE maps, unless it has a
    // flag result (which cannot be CSE'd) or is one of the special cases that are
    // not subject to CSE.
-  if (!Erased && N->getValueType(N->getNumValues()-1) != MVT::Flag &&
+  if (!Erased && N->getValueType(N->getNumValues()-1) != MVT::Glue &&
        !N->isMachineOpcode() && !doNotCSE(N)) {
      N->dump(this);
      dbgs() << "\n";
@@ -822,7 +823,7 @@ static void VerifyMachineNode(SDNode *N) {
  /// given type.
  ///
  unsigned SelectionDAG::getEVTAlignment(EVT VT) const {
-  const Type *Ty = VT == MVT::iPTR ?
+  Type *Ty = VT == MVT::iPTR ?
                     PointerType::get(Type::getInt8Ty(*getContext()), 0) :
                     VT.getTypeForEVT(*getContext());
  
@@ -1419,9 +1420,9 @@ SDValue SelectionDAG::getMDNode(const MDNode *MD) {
  
  /// getShiftAmountOperand - Return the specified value casted to
  /// the target's desired shift amount type.
-SDValue SelectionDAG::getShiftAmountOperand(SDValue Op) {
+SDValue SelectionDAG::getShiftAmountOperand(EVT LHSTy, SDValue Op) {
    EVT OpTy = Op.getValueType();
-  MVT ShTy = TLI.getShiftAmountTy();
+  MVT ShTy = TLI.getShiftAmountTy(LHSTy);
    if (OpTy == ShTy || OpTy.isVector()) return Op;
  
    ISD::NodeType Opcode = OpTy.bitsGT(ShTy) ?  ISD::TRUNCATE : ISD::ZERO_EXTEND;
@@ -1433,7 +1434,7 @@ SDValue SelectionDAG::getShiftAmountOperand(SDValue Op) {
  SDValue SelectionDAG::CreateStackTemporary(EVT VT, unsigned minAlign) {
    MachineFrameInfo *FrameInfo = getMachineFunction().getFrameInfo();
    unsigned ByteSize = VT.getStoreSize();
-  const Type *Ty = VT.getTypeForEVT(*getContext());
+  Type *Ty = VT.getTypeForEVT(*getContext());
    unsigned StackAlign =
    std::max((unsigned)TLI.getTargetData()->getPrefTypeAlignment(Ty), minAlign);
  
@@ -1446,8 +1447,8 @@ SDValue SelectionDAG::CreateStackTemporary(EVT VT, unsigned minAlign) {
  SDValue SelectionDAG::CreateStackTemporary(EVT VT1, EVT VT2) {
    unsigned Bytes = std::max(VT1.getStoreSizeInBits(),
                              VT2.getStoreSizeInBits())/8;
-  const Type *Ty1 = VT1.getTypeForEVT(*getContext());
-  const Type *Ty2 = VT2.getTypeForEVT(*getContext());
+  Type *Ty1 = VT1.getTypeForEVT(*getContext());
+  Type *Ty2 = VT2.getTypeForEVT(*getContext());
    const TargetData *TD = TLI.getTargetData();
    unsigned Align = std::max(TD->getPrefTypeAlignment(Ty1),
                              TD->getPrefTypeAlignment(Ty2));
@@ -2041,15 +2042,25 @@ void SelectionDAG::ComputeMaskedBits(SDValue Op, const APInt &Mask,
      KnownZero = APInt::getHighBitsSet(BitWidth, Leaders) & Mask;
      return;
    }
+  case ISD::FrameIndex:
+  case ISD::TargetFrameIndex:
+    if (unsigned Align = InferPtrAlignment(Op)) {
+      // The low bits are known zero if the pointer is aligned.
+      KnownZero = APInt::getLowBitsSet(BitWidth, Log2_32(Align));
+      return;
+    }
+    break;
+
    default:
-    // Allow the target to implement this method for its nodes.
-    if (Op.getOpcode() >= ISD::BUILTIN_OP_END) {
+    if (Op.getOpcode() < ISD::BUILTIN_OP_END)
+      break;
+    // Fallthrough
    case ISD::INTRINSIC_WO_CHAIN:
    case ISD::INTRINSIC_W_CHAIN:
    case ISD::INTRINSIC_VOID:
-      TLI.computeMaskedBitsForTargetNode(Op, Mask, KnownZero, KnownOne, *this,
-                                         Depth);
-    }
+    // Allow the target to implement this method for its nodes.
+    TLI.computeMaskedBitsForTargetNode(Op, Mask, KnownZero, KnownOne, *this,
+                                       Depth);
      return;
    }
  }
@@ -2080,12 +2091,7 @@ unsigned SelectionDAG::ComputeNumSignBits(SDValue Op, unsigned Depth) const{
  
    case ISD::Constant: {
      const APInt &Val = cast<ConstantSDNode>(Op)->getAPIntValue();
-    // If negative, return # leading ones.
-    if (Val.isNegative())
-      return Val.countLeadingOnes();
-
-    // Return # leading zeros.
-    return Val.countLeadingZeros();
+    return Val.getNumSignBits();
    }
  
    case ISD::SIGN_EXTEND:
@@ -2280,6 +2286,25 @@ unsigned SelectionDAG::ComputeNumSignBits(SDValue Op, unsigned Depth) const{
    return std::max(FirstAnswer, std::min(VTBits, Mask.countLeadingZeros()));
  }
  
+/// isBaseWithConstantOffset - Return true if the specified operand is an
+/// ISD::ADD with a ConstantSDNode on the right-hand side, or if it is an
+/// ISD::OR with a ConstantSDNode that is guaranteed to have the same
+/// semantics as an ADD.  This handles the equivalence:
+///     X|Cst == X+Cst iff X&Cst = 0.
+bool SelectionDAG::isBaseWithConstantOffset(SDValue Op) const {
+  if ((Op.getOpcode() != ISD::ADD && Op.getOpcode() != ISD::OR) ||
+      !isa<ConstantSDNode>(Op.getOperand(1)))
+    return false;
+
+  if (Op.getOpcode() == ISD::OR &&
+      !MaskedValueIsZero(Op.getOperand(0),
+                     cast<ConstantSDNode>(Op.getOperand(1))->getAPIntValue()))
+    return false;
+
+  return true;
+}
+
+
  bool SelectionDAG::isKnownNeverNaN(SDValue Op) const {
    // If we're told that NaNs won't happen, assume they won't.
    if (NoNaNsFPMath)
@@ -2300,6 +2325,13 @@ bool SelectionDAG::isKnownNeverZero(SDValue Op) const {
      return !C->isZero();
  
    // TODO: Recognize more cases here.
+  switch (Op.getOpcode()) {
+  default: break;
+  case ISD::OR:
+    if (const ConstantSDNode *C = dyn_cast<ConstantSDNode>(Op.getOperand(1)))
+      return !C->isNullValue();
+    break;
+  }
  
    return false;
  }
@@ -2317,16 +2349,6 @@ bool SelectionDAG::isEqualTo(SDValue A, SDValue B) const {
    return false;
  }
  
-bool SelectionDAG::isVerifiedDebugInfoDesc(SDValue Op) const {
-  GlobalAddressSDNode *GA = dyn_cast<GlobalAddressSDNode>(Op);
-  if (!GA) return false;
-  if (GA->getOffset() != 0) return false;
-  const GlobalVariable *GV = dyn_cast<GlobalVariable>(GA->getGlobal());
-  if (!GV) return false;
-  return MF->getMMI().hasDebugInfo();
-}
-
-
  /// getNode - Gets or creates the specified node.
  ///
  SDValue SelectionDAG::getNode(unsigned Opcode, DebugLoc DL, EVT VT) {
@@ -2417,7 +2439,7 @@ SDValue SelectionDAG::getNode(unsigned Opcode, DebugLoc DL,
                                APFloat::rmTowardZero, &ignored);
          if (s==APFloat::opInvalidOp)     // inexact is OK, in fact usual
            break;
-        APInt api(VT.getSizeInBits(), 2, x);
+        APInt api(VT.getSizeInBits(), x);
          return getConstant(api, VT);
        }
        case ISD::BITCAST:
@@ -2460,6 +2482,9 @@ SDValue SelectionDAG::getNode(unsigned Opcode, DebugLoc DL,
             "Vector element count mismatch!");
      if (OpOpcode == ISD::SIGN_EXTEND || OpOpcode == ISD::ZERO_EXTEND)
        return getNode(OpOpcode, DL, VT, Operand.getNode()->getOperand(0));
+    else if (OpOpcode == ISD::UNDEF)
+      // sext(undef) = 0, because the top bits will all be the same.
+      return getConstant(0, VT);
      break;
    case ISD::ZERO_EXTEND:
      assert(VT.isInteger() && Operand.getValueType().isInteger() &&
@@ -2474,6 +2499,9 @@ SDValue SelectionDAG::getNode(unsigned Opcode, DebugLoc DL,
      if (OpOpcode == ISD::ZERO_EXTEND)   // (zext (zext x)) -> (zext x)
        return getNode(ISD::ZERO_EXTEND, DL, VT,
                       Operand.getNode()->getOperand(0));
+    else if (OpOpcode == ISD::UNDEF)
+      // zext(undef) = 0, because the top bits will be zero.
+      return getConstant(0, VT);
      break;
    case ISD::ANY_EXTEND:
      assert(VT.isInteger() && Operand.getValueType().isInteger() &&
@@ -2490,6 +2518,8 @@ SDValue SelectionDAG::getNode(unsigned Opcode, DebugLoc DL,
          OpOpcode == ISD::ANY_EXTEND)
        // (ext (zext x)) -> (zext x)  and  (ext (sext x)) -> (sext x)
        return getNode(OpOpcode, DL, VT, Operand.getNode()->getOperand(0));
+    else if (OpOpcode == ISD::UNDEF)
+      return getUNDEF(VT);
  
      // (ext (trunx x)) -> x
      if (OpOpcode == ISD::TRUNCATE) {
@@ -2564,7 +2594,7 @@ SDValue SelectionDAG::getNode(unsigned Opcode, DebugLoc DL,
  
    SDNode *N;
    SDVTList VTs = getVTList(VT);
-  if (VT != MVT::Flag) { // Don't CSE flag producing nodes
+  if (VT != MVT::Glue) { // Don't CSE flag producing nodes
      FoldingSetNodeID ID;
      SDValue Ops[1] = { Operand };
      AddNodeIDNode(ID, Opcode, VTs, Ops, 1);
@@ -2721,6 +2751,13 @@ SDValue SelectionDAG::getNode(unsigned Opcode, DebugLoc DL, EVT VT,
             "Shift operators return type must be the same as their first arg");
      assert(VT.isInteger() && N2.getValueType().isInteger() &&
             "Shifts only work on integers");
+    // Verify that the shift amount VT is bit enough to hold valid shift
+    // amounts.  This catches things like trying to shift an i1024 value by an
+    // i8, which is easy to fall into in generic code that uses
+    // TLI.getShiftAmount().
+    assert(N2.getValueType().getSizeInBits() >=
+                   Log2_32_Ceil(N1.getValueType().getSizeInBits()) &&
+           "Invalid use of small shift amount with oversized value!");
  
      // Always fold shifts of i1 values so the code generator doesn't need to
      // handle them.  Since we know the size of the shift has to be less than the
@@ -2849,6 +2886,7 @@ SDValue SelectionDAG::getNode(unsigned Opcode, DebugLoc DL, EVT VT,
      assert(N2C && (unsigned)N2C->getZExtValue() < 2 && "Bad EXTRACT_ELEMENT!");
      assert(!N1.getValueType().isVector() && !VT.isVector() &&
             (N1.getValueType().isInteger() == VT.isInteger()) &&
+           N1.getValueType() != VT &&
             "Wrong types for EXTRACT_ELEMENT!");
  
      // EXTRACT_ELEMENT of BUILD_PAIR is often formed while legalize is expanding
@@ -2865,11 +2903,30 @@ SDValue SelectionDAG::getNode(unsigned Opcode, DebugLoc DL, EVT VT,
        return getConstant(ShiftedVal.trunc(ElementSize), VT);
      }
      break;
-  case ISD::EXTRACT_SUBVECTOR:
-    if (N1.getValueType() == VT) // Trivial extraction.
-      return N1;
+  case ISD::EXTRACT_SUBVECTOR: {
+    SDValue Index = N2;
+    if (VT.isSimple() && N1.getValueType().isSimple()) {
+      assert(VT.isVector() && N1.getValueType().isVector() &&
+             "Extract subvector VTs must be a vectors!");
+      assert(VT.getVectorElementType() == N1.getValueType().getVectorElementType() &&
+             "Extract subvector VTs must have the same element type!");
+      assert(VT.getSimpleVT() <= N1.getValueType().getSimpleVT() &&
+             "Extract subvector must be from larger vector to smaller vector!");
+
+      if (isa<ConstantSDNode>(Index.getNode())) {
+        assert((VT.getVectorNumElements() +
+                cast<ConstantSDNode>(Index.getNode())->getZExtValue()
+                <= N1.getValueType().getVectorNumElements())
+               && "Extract subvector overflow!");
+      }
+
+      // Trivial extraction.
+      if (VT.getSimpleVT() == N1.getValueType().getSimpleVT())
+        return N1;
+    }
      break;
    }
+  }
  
    if (N1C) {
      if (N2C) {
@@ -3006,7 +3063,7 @@ SDValue SelectionDAG::getNode(unsigned Opcode, DebugLoc DL, EVT VT,
    // Memoize this node if possible.
    SDNode *N;
    SDVTList VTs = getVTList(VT);
-  if (VT != MVT::Flag) {
+  if (VT != MVT::Glue) {
      SDValue Ops[] = { N1, N2 };
      FoldingSetNodeID ID;
      AddNodeIDNode(ID, Opcode, VTs, Ops, 2);
@@ -3064,6 +3121,30 @@ SDValue SelectionDAG::getNode(unsigned Opcode, DebugLoc DL, EVT VT,
    case ISD::VECTOR_SHUFFLE:
      llvm_unreachable("should use getVectorShuffle constructor!");
      break;
+  case ISD::INSERT_SUBVECTOR: {
+    SDValue Index = N3;
+    if (VT.isSimple() && N1.getValueType().isSimple()
+        && N2.getValueType().isSimple()) {
+      assert(VT.isVector() && N1.getValueType().isVector() &&
+             N2.getValueType().isVector() &&
+             "Insert subvector VTs must be a vectors");
+      assert(VT == N1.getValueType() &&
+             "Dest and insert subvector source types must match!");
+      assert(N2.getValueType().getSimpleVT() <= N1.getValueType().getSimpleVT() &&
+             "Insert subvector must be from smaller vector to larger vector!");
+      if (isa<ConstantSDNode>(Index.getNode())) {
+        assert((N2.getValueType().getVectorNumElements() +
+                cast<ConstantSDNode>(Index.getNode())->getZExtValue()
+                <= VT.getVectorNumElements())
+               && "Insert subvector overflow!");
+      }
+
+      // Trivial insertion.
+      if (VT.getSimpleVT() == N2.getValueType().getSimpleVT())
+        return N2;
+    }
+    break;
+  }
    case ISD::BITCAST:
      // Fold bit_convert nodes from a type to themselves.
      if (N1.getValueType() == VT)
@@ -3074,7 +3155,7 @@ SDValue SelectionDAG::getNode(unsigned Opcode, DebugLoc DL, EVT VT,
    // Memoize node if it doesn't produce a flag.
    SDNode *N;
    SDVTList VTs = getVTList(VT);
-  if (VT != MVT::Flag) {
+  if (VT != MVT::Glue) {
      SDValue Ops[] = { N1, N2, N3 };
      FoldingSetNodeID ID;
      AddNodeIDNode(ID, Opcode, VTs, Ops, 3);
@@ -3132,6 +3213,17 @@ SDValue SelectionDAG::getStackArgumentTokenFactor(SDValue Chain) {
                   &ArgChains[0], ArgChains.size());
  }
  
+/// SplatByte - Distribute ByteVal over NumBits bits.
+static APInt SplatByte(unsigned NumBits, uint8_t ByteVal) {
+  APInt Val = APInt(NumBits, ByteVal);
+  unsigned Shift = 8;
+  for (unsigned i = NumBits; i > 8; i >>= 1) {
+    Val = (Val << Shift) | Val;
+    Shift <<= 1;
+  }
+  return Val;
+}
+
  /// getMemsetValue - Vectorized representation of the memset value
  /// operand.
  static SDValue getMemsetValue(SDValue Value, EVT VT, SelectionDAG &DAG,
@@ -3140,27 +3232,18 @@ static SDValue getMemsetValue(SDValue Value, EVT VT, SelectionDAG &DAG,
  
    unsigned NumBits = VT.getScalarType().getSizeInBits();
    if (ConstantSDNode *C = dyn_cast<ConstantSDNode>(Value)) {
-    APInt Val = APInt(NumBits, C->getZExtValue() & 255);
-    unsigned Shift = 8;
-    for (unsigned i = NumBits; i > 8; i >>= 1) {
-      Val = (Val << Shift) | Val;
-      Shift <<= 1;
-    }
+    APInt Val = SplatByte(NumBits, C->getZExtValue() & 255);
      if (VT.isInteger())
        return DAG.getConstant(Val, VT);
      return DAG.getConstantFP(APFloat(Val), VT);
    }
  
-  const TargetLowering &TLI = DAG.getTargetLoweringInfo();
    Value = DAG.getNode(ISD::ZERO_EXTEND, dl, VT, Value);
-  unsigned Shift = 8;
-  for (unsigned i = NumBits; i > 8; i >>= 1) {
-    Value = DAG.getNode(ISD::OR, dl, VT,
-                        DAG.getNode(ISD::SHL, dl, VT, Value,
-                                    DAG.getConstant(Shift,
-                                                    TLI.getShiftAmountTy())),
-                        Value);
-    Shift <<= 1;
+  if (NumBits > 8) {
+    // Use a multiplication with 0x010101... to extend the input to the
+    // required length.
+    APInt Magic = SplatByte(NumBits, 0x01);
+    Value = DAG.getNode(ISD::MUL, dl, VT, Value, DAG.getConstant(Magic, VT));
    }
  
    return Value;
@@ -3246,13 +3329,13 @@ static bool FindOptimalMemOpLowering(std::vector<EVT> &MemOps,
                                       const TargetLowering &TLI) {
    assert((SrcAlign == 0 || SrcAlign >= DstAlign) &&
           "Expecting memcpy / memset source to meet alignment requirement!");
-  // If 'SrcAlign' is zero, that means the memory operation does not need load
-  // the value, i.e. memset or memcpy from constant string. Otherwise, it's
-  // the inferred alignment of the source. 'DstAlign', on the other hand, is the
-  // specified alignment of the memory operation. If it is zero, that means
-  // it's possible to change the alignment of the destination. 'MemcpyStrSrc'
-  // indicates whether the memcpy source is constant so it does not need to be
-  // loaded.
+  // If 'SrcAlign' is zero, that means the memory operation does not need to
+  // load the value, i.e. memset or memcpy from constant string. Otherwise,
+  // it's the inferred alignment of the source. 'DstAlign', on the other hand,
+  // is the specified alignment of the memory operation. If it is zero, that
+  // means it's possible to change the alignment of the destination.
+  // 'MemcpyStrSrc' indicates whether the memcpy source is constant so it does
+  // not need to be loaded.
    EVT VT = TLI.getOptimalMemOpType(Size, DstAlign, SrcAlign,
                                     NonScalarIntSafe, MemcpyStrSrc,
                                     DAG.getMachineFunction());
@@ -3279,15 +3362,6 @@ static bool FindOptimalMemOpLowering(std::vector<EVT> &MemOps,
        VT = LVT;
    }
  
-  // If we're optimizing for size, and there is a limit, bump the maximum number
-  // of operations inserted down to 4.  This is a wild guess that approximates
-  // the size of a call to memcpy or memset (3 arguments + call).
-  if (Limit != ~0U) {
-    const Function *F = DAG.getMachineFunction().getFunction();
-    if (F->hasFnAttr(Attribute::OptimizeForSize))
-      Limit = 4;
-  }
-
    unsigned NumMemOps = 0;
    while (Size != 0) {
      unsigned VTSize = VT.getSizeInBits() / 8;
@@ -3333,7 +3407,9 @@ static SDValue getMemcpyLoadsAndStores(SelectionDAG &DAG, DebugLoc dl,
    const TargetLowering &TLI = DAG.getTargetLoweringInfo();
    std::vector<EVT> MemOps;
    bool DstAlignCanChange = false;
-  MachineFrameInfo *MFI = DAG.getMachineFunction().getFrameInfo();
+  MachineFunction &MF = DAG.getMachineFunction();
+  MachineFrameInfo *MFI = MF.getFrameInfo();
+  bool OptSize = MF.getFunction()->hasFnAttr(Attribute::OptimizeForSize);
    FrameIndexSDNode *FI = dyn_cast<FrameIndexSDNode>(Dst);
    if (FI && !MFI->isFixedObjectIndex(FI->getIndex()))
      DstAlignCanChange = true;
@@ -3343,7 +3419,7 @@ static SDValue getMemcpyLoadsAndStores(SelectionDAG &DAG, DebugLoc dl,
    std::string Str;
    bool CopyFromStr = isMemSrcFromString(Src, Str);
    bool isZeroStr = CopyFromStr && Str.empty();
-  unsigned Limit = AlwaysInline ? ~0U : TLI.getMaxStoresPerMemcpy();
+  unsigned Limit = AlwaysInline ? ~0U : TLI.getMaxStoresPerMemcpy(OptSize);
  
    if (!FindOptimalMemOpLowering(MemOps, Limit, Size,
                                  (DstAlignCanChange ? 0 : Align),
@@ -3352,7 +3428,7 @@ static SDValue getMemcpyLoadsAndStores(SelectionDAG &DAG, DebugLoc dl,
      return SDValue();
  
    if (DstAlignCanChange) {
-    const Type *Ty = MemOps[0].getTypeForEVT(*DAG.getContext());
+    Type *Ty = MemOps[0].getTypeForEVT(*DAG.getContext());
      unsigned NewAlign = (unsigned) TLI.getTargetData()->getABITypeAlignment(Ty);
      if (NewAlign > Align) {
        // Give the stack frame object a larger alignment if needed.
@@ -3390,7 +3466,7 @@ static SDValue getMemcpyLoadsAndStores(SelectionDAG &DAG, DebugLoc dl,
        // FIXME does the case above also need this?
        EVT NVT = TLI.getTypeToTransformTo(*DAG.getContext(), VT);
        assert(NVT.bitsGE(VT));
-      Value = DAG.getExtLoad(ISD::EXTLOAD, NVT, dl, Chain,
+      Value = DAG.getExtLoad(ISD::EXTLOAD, dl, NVT, Chain,
                               getMemBasePlusOffset(Src, SrcOff, DAG),
                               SrcPtrInfo.getWithOffset(SrcOff), VT, isVol, false,
                               MinAlign(SrcAlign, SrcOff));
@@ -3424,14 +3500,16 @@ static SDValue getMemmoveLoadsAndStores(SelectionDAG &DAG, DebugLoc dl,
    const TargetLowering &TLI = DAG.getTargetLoweringInfo();
    std::vector<EVT> MemOps;
    bool DstAlignCanChange = false;
-  MachineFrameInfo *MFI = DAG.getMachineFunction().getFrameInfo();
+  MachineFunction &MF = DAG.getMachineFunction();
+  MachineFrameInfo *MFI = MF.getFrameInfo();
+  bool OptSize = MF.getFunction()->hasFnAttr(Attribute::OptimizeForSize);
    FrameIndexSDNode *FI = dyn_cast<FrameIndexSDNode>(Dst);
    if (FI && !MFI->isFixedObjectIndex(FI->getIndex()))
      DstAlignCanChange = true;
    unsigned SrcAlign = DAG.InferPtrAlignment(Src);
    if (Align > SrcAlign)
      SrcAlign = Align;
-  unsigned Limit = AlwaysInline ? ~0U : TLI.getMaxStoresPerMemmove();
+  unsigned Limit = AlwaysInline ? ~0U : TLI.getMaxStoresPerMemmove(OptSize);
  
    if (!FindOptimalMemOpLowering(MemOps, Limit, Size,
                                  (DstAlignCanChange ? 0 : Align),
@@ -3439,7 +3517,7 @@ static SDValue getMemmoveLoadsAndStores(SelectionDAG &DAG, DebugLoc dl,
      return SDValue();
  
    if (DstAlignCanChange) {
-    const Type *Ty = MemOps[0].getTypeForEVT(*DAG.getContext());
+    Type *Ty = MemOps[0].getTypeForEVT(*DAG.getContext());
      unsigned NewAlign = (unsigned) TLI.getTargetData()->getABITypeAlignment(Ty);
      if (NewAlign > Align) {
        // Give the stack frame object a larger alignment if needed.
@@ -3500,19 +3578,21 @@ static SDValue getMemsetStores(SelectionDAG &DAG, DebugLoc dl,
    const TargetLowering &TLI = DAG.getTargetLoweringInfo();
    std::vector<EVT> MemOps;
    bool DstAlignCanChange = false;
-  MachineFrameInfo *MFI = DAG.getMachineFunction().getFrameInfo();
+  MachineFunction &MF = DAG.getMachineFunction();
+  MachineFrameInfo *MFI = MF.getFrameInfo();
+  bool OptSize = MF.getFunction()->hasFnAttr(Attribute::OptimizeForSize);
    FrameIndexSDNode *FI = dyn_cast<FrameIndexSDNode>(Dst);
    if (FI && !MFI->isFixedObjectIndex(FI->getIndex()))
      DstAlignCanChange = true;
    bool NonScalarIntSafe =
      isa<ConstantSDNode>(Src) && cast<ConstantSDNode>(Src)->isNullValue();
-  if (!FindOptimalMemOpLowering(MemOps, TLI.getMaxStoresPerMemset(),
+  if (!FindOptimalMemOpLowering(MemOps, TLI.getMaxStoresPerMemset(OptSize),
                                  Size, (DstAlignCanChange ? 0 : Align), 0,
                                  NonScalarIntSafe, false, DAG, TLI))
      return SDValue();
  
    if (DstAlignCanChange) {
-    const Type *Ty = MemOps[0].getTypeForEVT(*DAG.getContext());
+    Type *Ty = MemOps[0].getTypeForEVT(*DAG.getContext());
      unsigned NewAlign = (unsigned) TLI.getTargetData()->getABITypeAlignment(Ty);
      if (NewAlign > Align) {
        // Give the stack frame object a larger alignment if needed.
@@ -3525,16 +3605,34 @@ static SDValue getMemsetStores(SelectionDAG &DAG, DebugLoc dl,
    SmallVector<SDValue, 8> OutChains;
    uint64_t DstOff = 0;
    unsigned NumMemOps = MemOps.size();
+
+  // Find the largest store and generate the bit pattern for it.
+  EVT LargestVT = MemOps[0];
+  for (unsigned i = 1; i < NumMemOps; i++)
+    if (MemOps[i].bitsGT(LargestVT))
+      LargestVT = MemOps[i];
+  SDValue MemSetValue = getMemsetValue(Src, LargestVT, DAG, dl);
+
    for (unsigned i = 0; i < NumMemOps; i++) {
      EVT VT = MemOps[i];
-    unsigned VTSize = VT.getSizeInBits() / 8;
-    SDValue Value = getMemsetValue(Src, VT, DAG, dl);
+
+    // If this store is smaller than the largest store see whether we can get
+    // the smaller value for free with a truncate.
+    SDValue Value = MemSetValue;
+    if (VT.bitsLT(LargestVT)) {
+      if (!LargestVT.isVector() && !VT.isVector() &&
+          TLI.isTruncateFree(LargestVT, VT))
+        Value = DAG.getNode(ISD::TRUNCATE, dl, VT, MemSetValue);
+      else
+        Value = getMemsetValue(Src, VT, DAG, dl);
+    }
+    assert(Value.getValueType() == VT && "Value with wrong type.");
      SDValue Store = DAG.getStore(Chain, dl, Value,
                                   getMemBasePlusOffset(Dst, DstOff, DAG),
                                   DstPtrInfo.getWithOffset(DstOff),
                                   isVol, false, Align);
      OutChains.push_back(Store);
-    DstOff += VTSize;
+    DstOff += VT.getSizeInBits() / 8;
    }
  
    return DAG.getNode(ISD::TokenFactor, dl, MVT::Other,
@@ -3687,7 +3785,7 @@ SDValue SelectionDAG::getMemset(SDValue Chain, DebugLoc dl, SDValue Dst,
      return Result;
  
    // Emit a library call.
-  const Type *IntPtrTy = TLI.getTargetData()->getIntPtrType(*getContext());
+  Type *IntPtrTy = TLI.getTargetData()->getIntPtrType(*getContext());
    TargetLowering::ArgListTy Args;
    TargetLowering::ArgListEntry Entry;
    Entry.Node = Dst; Entry.Ty = IntPtrTy;
@@ -3720,7 +3818,9 @@ SDValue SelectionDAG::getMemset(SDValue Chain, DebugLoc dl, SDValue Dst,
  SDValue SelectionDAG::getAtomic(unsigned Opcode, DebugLoc dl, EVT MemVT,
                                  SDValue Chain, SDValue Ptr, SDValue Cmp,
                                  SDValue Swp, MachinePointerInfo PtrInfo,
-                                unsigned Alignment) {
+                                unsigned Alignment,
+                                AtomicOrdering Ordering,
+                                SynchronizationScope SynchScope) {                                
    if (Alignment == 0)  // Ensure that codegen never sees alignment 0
      Alignment = getEVTAlignment(MemVT);
  
@@ -3733,13 +3833,16 @@ SDValue SelectionDAG::getAtomic(unsigned Opcode, DebugLoc dl, EVT MemVT,
    MachineMemOperand *MMO =
      MF.getMachineMemOperand(PtrInfo, Flags, MemVT.getStoreSize(), Alignment);
  
-  return getAtomic(Opcode, dl, MemVT, Chain, Ptr, Cmp, Swp, MMO);
+  return getAtomic(Opcode, dl, MemVT, Chain, Ptr, Cmp, Swp, MMO,
+                   Ordering, SynchScope);
  }
  
  SDValue SelectionDAG::getAtomic(unsigned Opcode, DebugLoc dl, EVT MemVT,
                                  SDValue Chain,
                                  SDValue Ptr, SDValue Cmp,
-                                SDValue Swp, MachineMemOperand *MMO) {
+                                SDValue Swp, MachineMemOperand *MMO,
+                                AtomicOrdering Ordering,
+                                SynchronizationScope SynchScope) {
    assert(Opcode == ISD::ATOMIC_CMP_SWAP && "Invalid Atomic Op");
    assert(Cmp.getValueType() == Swp.getValueType() && "Invalid Atomic Op Types");
  
@@ -3756,7 +3859,8 @@ SDValue SelectionDAG::getAtomic(unsigned Opcode, DebugLoc dl, EVT MemVT,
      return SDValue(E, 0);
    }
    SDNode *N = new (NodeAllocator) AtomicSDNode(Opcode, dl, VTs, MemVT, Chain,
-                                               Ptr, Cmp, Swp, MMO);
+                                               Ptr, Cmp, Swp, MMO, Ordering,
+                                               SynchScope);
    CSEMap.InsertNode(N, IP);
    AllNodes.push_back(N);
    return SDValue(N, 0);
@@ -3766,7 +3870,9 @@ SDValue SelectionDAG::getAtomic(unsigned Opcode, DebugLoc dl, EVT MemVT,
                                  SDValue Chain,
                                  SDValue Ptr, SDValue Val,
                                  const Value* PtrVal,
-                                unsigned Alignment) {
+                                unsigned Alignment,
+                                AtomicOrdering Ordering,
+                                SynchronizationScope SynchScope) {
    if (Alignment == 0)  // Ensure that codegen never sees alignment 0
      Alignment = getEVTAlignment(MemVT);
  
@@ -3780,13 +3886,16 @@ SDValue SelectionDAG::getAtomic(unsigned Opcode, DebugLoc dl, EVT MemVT,
      MF.getMachineMemOperand(MachinePointerInfo(PtrVal), Flags,
                              MemVT.getStoreSize(), Alignment);
  
-  return getAtomic(Opcode, dl, MemVT, Chain, Ptr, Val, MMO);
+  return getAtomic(Opcode, dl, MemVT, Chain, Ptr, Val, MMO,
+                   Ordering, SynchScope);
  }
  
  SDValue SelectionDAG::getAtomic(unsigned Opcode, DebugLoc dl, EVT MemVT,
                                  SDValue Chain,
                                  SDValue Ptr, SDValue Val,
-                                MachineMemOperand *MMO) {
+                                MachineMemOperand *MMO,
+                                AtomicOrdering Ordering,
+                                SynchronizationScope SynchScope) {
    assert((Opcode == ISD::ATOMIC_LOAD_ADD ||
            Opcode == ISD::ATOMIC_LOAD_SUB ||
            Opcode == ISD::ATOMIC_LOAD_AND ||
@@ -3797,12 +3906,14 @@ SDValue SelectionDAG::getAtomic(unsigned Opcode, DebugLoc dl, EVT MemVT,
            Opcode == ISD::ATOMIC_LOAD_MAX ||
            Opcode == ISD::ATOMIC_LOAD_UMIN ||
            Opcode == ISD::ATOMIC_LOAD_UMAX ||
-          Opcode == ISD::ATOMIC_SWAP) &&
+          Opcode == ISD::ATOMIC_SWAP ||
+          Opcode == ISD::ATOMIC_STORE) &&
           "Invalid Atomic Op");
  
    EVT VT = Val.getValueType();
  
-  SDVTList VTs = getVTList(VT, MVT::Other);
+  SDVTList VTs = Opcode == ISD::ATOMIC_STORE ? getVTList(MVT::Other) :
+                                               getVTList(VT, MVT::Other);
    FoldingSetNodeID ID;
    ID.AddInteger(MemVT.getRawBits());
    SDValue Ops[] = {Chain, Ptr, Val};
@@ -3813,14 +3924,63 @@ SDValue SelectionDAG::getAtomic(unsigned Opcode, DebugLoc dl, EVT MemVT,
      return SDValue(E, 0);
    }
    SDNode *N = new (NodeAllocator) AtomicSDNode(Opcode, dl, VTs, MemVT, Chain,
-                                               Ptr, Val, MMO);
+                                               Ptr, Val, MMO,
+                                               Ordering, SynchScope);
+  CSEMap.InsertNode(N, IP);
+  AllNodes.push_back(N);
+  return SDValue(N, 0);
+}
+
+SDValue SelectionDAG::getAtomic(unsigned Opcode, DebugLoc dl, EVT MemVT,
+                                EVT VT, SDValue Chain,
+                                SDValue Ptr,
+                                const Value* PtrVal,
+                                unsigned Alignment,
+                                AtomicOrdering Ordering,
+                                SynchronizationScope SynchScope) {
+  if (Alignment == 0)  // Ensure that codegen never sees alignment 0
+    Alignment = getEVTAlignment(MemVT);
+
+  MachineFunction &MF = getMachineFunction();
+  unsigned Flags = MachineMemOperand::MOLoad | MachineMemOperand::MOStore;
+
+  // For now, atomics are considered to be volatile always.
+  Flags |= MachineMemOperand::MOVolatile;
+
+  MachineMemOperand *MMO =
+    MF.getMachineMemOperand(MachinePointerInfo(PtrVal), Flags,
+                            MemVT.getStoreSize(), Alignment);
+
+  return getAtomic(Opcode, dl, MemVT, VT, Chain, Ptr, MMO,
+                   Ordering, SynchScope);
+}
+
+SDValue SelectionDAG::getAtomic(unsigned Opcode, DebugLoc dl, EVT MemVT,
+                                EVT VT, SDValue Chain,
+                                SDValue Ptr,
+                                MachineMemOperand *MMO,
+                                AtomicOrdering Ordering,
+                                SynchronizationScope SynchScope) {
+  assert(Opcode == ISD::ATOMIC_LOAD && "Invalid Atomic Op");
+
+  SDVTList VTs = getVTList(VT, MVT::Other);
+  FoldingSetNodeID ID;
+  ID.AddInteger(MemVT.getRawBits());
+  SDValue Ops[] = {Chain, Ptr};
+  AddNodeIDNode(ID, Opcode, VTs, Ops, 2);
+  void* IP = 0;
+  if (SDNode *E = CSEMap.FindNodeOrInsertPos(ID, IP)) {
+    cast<AtomicSDNode>(E)->refineAlignment(MMO);
+    return SDValue(E, 0);
+  }
+  SDNode *N = new (NodeAllocator) AtomicSDNode(Opcode, dl, VTs, MemVT, Chain,
+                                               Ptr, MMO, Ordering, SynchScope);
    CSEMap.InsertNode(N, IP);
    AllNodes.push_back(N);
    return SDValue(N, 0);
  }
  
  /// getMergeValues - Create a MERGE_VALUES node from the given operands.
-/// Allowed to return something different (and simpler) if Simplify is true.
  SDValue SelectionDAG::getMergeValues(const SDValue *Ops, unsigned NumOps,
                                       DebugLoc dl) {
    if (NumOps == 1)
@@ -3882,7 +4042,7 @@ SelectionDAG::getMemIntrinsicNode(unsigned Opcode, DebugLoc dl, SDVTList VTList,
  
    // Memoize the node unless it returns a flag.
    MemIntrinsicSDNode *N;
-  if (VTList.VTs[VTList.NumVTs-1] != MVT::Flag) {
+  if (VTList.VTs[VTList.NumVTs-1] != MVT::Glue) {
      FoldingSetNodeID ID;
      AddNodeIDNode(ID, Opcode, VTList, Ops, NumOps);
      void *IP = 0;
@@ -3943,6 +4103,8 @@ SelectionDAG::getLoad(ISD::MemIndexedMode AM, ISD::LoadExtType ExtType,
                        MachinePointerInfo PtrInfo, EVT MemVT,
                        bool isVolatile, bool isNonTemporal,
                        unsigned Alignment, const MDNode *TBAAInfo) {
+  assert(Chain.getValueType() == MVT::Other && 
+        "Invalid chain type");
    if (Alignment == 0)  // Ensure that codegen never sees alignment 0
      Alignment = getEVTAlignment(VT);
  
@@ -4020,7 +4182,7 @@ SDValue SelectionDAG::getLoad(EVT VT, DebugLoc dl,
                   PtrInfo, VT, isVolatile, isNonTemporal, Alignment, TBAAInfo);
  }
  
-SDValue SelectionDAG::getExtLoad(ISD::LoadExtType ExtType, EVT VT, DebugLoc dl,
+SDValue SelectionDAG::getExtLoad(ISD::LoadExtType ExtType, DebugLoc dl, EVT VT,
                                   SDValue Chain, SDValue Ptr,
                                   MachinePointerInfo PtrInfo, EVT MemVT,
                                   bool isVolatile, bool isNonTemporal,
@@ -4048,6 +4210,8 @@ SDValue SelectionDAG::getStore(SDValue Chain, DebugLoc dl, SDValue Val,
                                 SDValue Ptr, MachinePointerInfo PtrInfo,
                                 bool isVolatile, bool isNonTemporal,
                                 unsigned Alignment, const MDNode *TBAAInfo) {
+  assert(Chain.getValueType() == MVT::Other && 
+        "Invalid chain type");
    if (Alignment == 0)  // Ensure that codegen never sees alignment 0
      Alignment = getEVTAlignment(Val.getValueType());
  
@@ -4071,6 +4235,8 @@ SDValue SelectionDAG::getStore(SDValue Chain, DebugLoc dl, SDValue Val,
  
  SDValue SelectionDAG::getStore(SDValue Chain, DebugLoc dl, SDValue Val,
                                 SDValue Ptr, MachineMemOperand *MMO) {
+  assert(Chain.getValueType() == MVT::Other && 
+        "Invalid chain type");
    EVT VT = Val.getValueType();
    SDVTList VTs = getVTList(MVT::Other);
    SDValue Undef = getUNDEF(Ptr.getValueType());
@@ -4097,6 +4263,8 @@ SDValue SelectionDAG::getTruncStore(SDValue Chain, DebugLoc dl, SDValue Val,
                                      EVT SVT,bool isVolatile, bool isNonTemporal,
                                      unsigned Alignment,
                                      const MDNode *TBAAInfo) {
+  assert(Chain.getValueType() == MVT::Other && 
+        "Invalid chain type");
    if (Alignment == 0)  // Ensure that codegen never sees alignment 0
      Alignment = getEVTAlignment(SVT);
  
@@ -4122,6 +4290,8 @@ SDValue SelectionDAG::getTruncStore(SDValue Chain, DebugLoc dl, SDValue Val,
                                      MachineMemOperand *MMO) {
    EVT VT = Val.getValueType();
  
+  assert(Chain.getValueType() == MVT::Other && 
+        "Invalid chain type");
    if (VT == SVT)
      return getStore(Chain, dl, Val, Ptr, MMO);
  
@@ -4238,7 +4408,7 @@ SDValue SelectionDAG::getNode(unsigned Opcode, DebugLoc DL, EVT VT,
    SDNode *N;
    SDVTList VTs = getVTList(VT);
  
-  if (VT != MVT::Flag) {
+  if (VT != MVT::Glue) {
      FoldingSetNodeID ID;
      AddNodeIDNode(ID, Opcode, VTs, Ops, NumOps);
      void *IP = 0;
@@ -4304,7 +4474,7 @@ SDValue SelectionDAG::getNode(unsigned Opcode, DebugLoc DL, SDVTList VTList,
  
    // Memoize the node unless it returns a flag.
    SDNode *N;
-  if (VTList.VTs[VTList.NumVTs-1] != MVT::Flag) {
+  if (VTList.VTs[VTList.NumVTs-1] != MVT::Glue) {
      FoldingSetNodeID ID;
      AddNodeIDNode(ID, Opcode, VTList, Ops, NumOps);
      void *IP = 0;
@@ -4713,7 +4883,7 @@ SDNode *SelectionDAG::MorphNodeTo(SDNode *N, unsigned Opc,
                                    unsigned NumOps) {
    // If an identical node already exists, use it.
    void *IP = 0;
-  if (VTs.VTs[VTs.NumVTs-1] != MVT::Flag) {
+  if (VTs.VTs[VTs.NumVTs-1] != MVT::Glue) {
      FoldingSetNodeID ID;
      AddNodeIDNode(ID, Opc, VTs, Ops, NumOps);
      if (SDNode *ON = CSEMap.FindNodeOrInsertPos(ID, IP))
@@ -4913,9 +5083,9 @@ SelectionDAG::getMachineNode(unsigned Opcode, DebugLoc dl,
  MachineSDNode *
  SelectionDAG::getMachineNode(unsigned Opcode, DebugLoc DL, SDVTList VTs,
                               const SDValue *Ops, unsigned NumOps) {
-  bool DoCSE = VTs.VTs[VTs.NumVTs-1] != MVT::Flag;
+  bool DoCSE = VTs.VTs[VTs.NumVTs-1] != MVT::Glue;
    MachineSDNode *N;
-  void *IP;
+  void *IP = 0;
  
    if (DoCSE) {
      FoldingSetNodeID ID;
@@ -4975,7 +5145,7 @@ SelectionDAG::getTargetInsertSubreg(int SRIdx, DebugLoc DL, EVT VT,
  /// else return NULL.
  SDNode *SelectionDAG::getNodeIfExists(unsigned Opcode, SDVTList VTList,
                                        const SDValue *Ops, unsigned NumOps) {
-  if (VTList.VTs[VTList.NumVTs-1] != MVT::Flag) {
+  if (VTList.VTs[VTList.NumVTs-1] != MVT::Glue) {
      FoldingSetNodeID ID;
      AddNodeIDNode(ID, Opcode, VTList, Ops, NumOps);
      void *IP = 0;
@@ -5408,6 +5578,29 @@ void SelectionDAG::AddDbgValue(SDDbgValue *DB, SDNode *SD, bool isParameter) {
      SD->setHasDebugValue(true);
  }
  
+/// TransferDbgValues - Transfer SDDbgValues.
+void SelectionDAG::TransferDbgValues(SDValue From, SDValue To) {
+  if (From == To || !From.getNode()->getHasDebugValue())
+    return;
+  SDNode *FromNode = From.getNode();
+  SDNode *ToNode = To.getNode();
+  ArrayRef<SDDbgValue *> DVs = GetDbgValues(FromNode);
+  SmallVector<SDDbgValue *, 2> ClonedDVs;
+  for (ArrayRef<SDDbgValue *>::iterator I = DVs.begin(), E = DVs.end();
+       I != E; ++I) {
+    SDDbgValue *Dbg = *I;
+    if (Dbg->getKind() == SDDbgValue::SDNODE) {
+      SDDbgValue *Clone = getDbgValue(Dbg->getMDPtr(), ToNode, To.getResNo(),
+                                      Dbg->getOffset(), Dbg->getDebugLoc(),
+                                      Dbg->getOrder());
+      ClonedDVs.push_back(Clone);
+    }
+  }
+  for (SmallVector<SDDbgValue *, 2>::iterator I = ClonedDVs.begin(),
+         E = ClonedDVs.end(); I != E; ++I)
+    AddDbgValue(*I, ToNode, false);
+}
+
  //===----------------------------------------------------------------------===//
  //                              SDNode Class
  //===----------------------------------------------------------------------===//
@@ -5574,24 +5767,39 @@ bool SDValue::reachesChainWithoutSideEffects(SDValue Dest,
    return false;
  }
  
-/// isPredecessorOf - Return true if this node is a predecessor of N. This node
-/// is either an operand of N or it can be reached by traversing up the operands.
-/// NOTE: this is an expensive method. Use it carefully.
-bool SDNode::isPredecessorOf(SDNode *N) const {
-  SmallPtrSet<SDNode *, 32> Visited;
-  SmallVector<SDNode *, 16> Worklist;
-  Worklist.push_back(N);
+/// hasPredecessor - Return true if N is a predecessor of this node.
+/// N is either an operand of this node, or can be reached by recursively
+/// traversing up the operands.
+/// NOTE: This is an expensive method. Use it carefully.
+bool SDNode::hasPredecessor(const SDNode *N) const {
+  SmallPtrSet<const SDNode *, 32> Visited;
+  SmallVector<const SDNode *, 16> Worklist;
+  return hasPredecessorHelper(N, Visited, Worklist);
+}
+
+bool SDNode::hasPredecessorHelper(const SDNode *N,
+                                  SmallPtrSet<const SDNode *, 32> &Visited,
+                                  SmallVector<const SDNode *, 16> &Worklist) const {
+  if (Visited.empty()) {
+    Worklist.push_back(this);
+  } else {
+    // Take a look in the visited set. If we've already encountered this node
+    // we needn't search further.
+    if (Visited.count(N))
+      return true;
+  }
  
-  do {
-    N = Worklist.pop_back_val();
-    for (unsigned i = 0, e = N->getNumOperands(); i != e; ++i) {
-      SDNode *Op = N->getOperand(i).getNode();
-      if (Op == this)
-        return true;
+  // Haven't visited N yet. Continue the search.
+  while (!Worklist.empty()) {
+    const SDNode *M = Worklist.pop_back_val();
+    for (unsigned i = 0, e = M->getNumOperands(); i != e; ++i) {
+      SDNode *Op = M->getOperand(i).getNode();
        if (Visited.insert(Op))
          Worklist.push_back(Op);
+      if (Op == N)
+        return true;
      }
-  } while (!Worklist.empty());
+  }
  
    return false;
  }
@@ -5627,6 +5835,7 @@ std::string SDNode::getOperationName(const SelectionDAG *G) const {
  #endif
    case ISD::PREFETCH:      return "Prefetch";
    case ISD::MEMBARRIER:    return "MemBarrier";
+  case ISD::ATOMIC_FENCE:    return "AtomicFence";
    case ISD::ATOMIC_CMP_SWAP:    return "AtomicCmpSwap";
    case ISD::ATOMIC_SWAP:        return "AtomicSwap";
    case ISD::ATOMIC_LOAD_ADD:    return "AtomicLoadAdd";
@@ -5639,6 +5848,8 @@ std::string SDNode::getOperationName(const SelectionDAG *G) const {
    case ISD::ATOMIC_LOAD_MAX:    return "AtomicLoadMax";
    case ISD::ATOMIC_LOAD_UMIN:   return "AtomicLoadUMin";
    case ISD::ATOMIC_LOAD_UMAX:   return "AtomicLoadUMax";
+  case ISD::ATOMIC_LOAD:        return "AtomicLoad";
+  case ISD::ATOMIC_STORE:       return "AtomicStore";
    case ISD::PCMARKER:      return "PCMarker";
    case ISD::READCYCLECOUNTER: return "ReadCycleCounter";
    case ISD::SRCVALUE:      return "SrcValue";
@@ -5746,6 +5957,7 @@ std::string SDNode::getOperationName(const SelectionDAG *G) const {
    case ISD::FSUB:   return "fsub";
    case ISD::FMUL:   return "fmul";
    case ISD::FDIV:   return "fdiv";
+  case ISD::FMA:    return "fma";
    case ISD::FREM:   return "frem";
    case ISD::FCOPYSIGN: return "fcopysign";
    case ISD::FGETSIGN:  return "fgetsign";
@@ -5759,6 +5971,7 @@ std::string SDNode::getOperationName(const SelectionDAG *G) const {
    case ISD::INSERT_VECTOR_ELT:   return "insert_vector_elt";
    case ISD::EXTRACT_VECTOR_ELT:  return "extract_vector_elt";
    case ISD::CONCAT_VECTORS:      return "concat_vectors";
+  case ISD::INSERT_SUBVECTOR:    return "insert_subvector";
    case ISD::EXTRACT_SUBVECTOR:   return "extract_subvector";
    case ISD::SCALAR_TO_VECTOR:    return "scalar_to_vector";
    case ISD::VECTOR_SHUFFLE:      return "vector_shuffle";
@@ -5792,7 +6005,7 @@ std::string SDNode::getOperationName(const SelectionDAG *G) const {
    case ISD::UINT_TO_FP:  return "uint_to_fp";
    case ISD::FP_TO_SINT:  return "fp_to_sint";
    case ISD::FP_TO_UINT:  return "fp_to_uint";
-  case ISD::BITCAST:     return "bit_convert";
+  case ISD::BITCAST:     return "bitcast";
    case ISD::FP16_TO_FP32: return "fp16_to_fp32";
    case ISD::FP32_TO_FP16: return "fp32_to_fp16";
  
@@ -5841,7 +6054,8 @@ std::string SDNode::getOperationName(const SelectionDAG *G) const {
    case ISD::CTLZ:    return "ctlz";
  
    // Trampolines
-  case ISD::TRAMPOLINE: return "trampoline";
+  case ISD::INIT_TRAMPOLINE: return "init_trampoline";
+  case ISD::ADJUST_TRAMPOLINE: return "adjust_trampoline";
  
    case ISD::CONDCODE:
      switch (cast<CondCodeSDNode>(this)->get()) {
@@ -6004,12 +6218,7 @@ void SDNode::print_details(raw_ostream &OS, const SelectionDAG *G) const {
        OS << LBB->getName() << " ";
      OS << (const void*)BBDN->getBasicBlock() << ">";
    } else if (const RegisterSDNode *R = dyn_cast<RegisterSDNode>(this)) {
-    if (G && R->getReg() &&
-        TargetRegisterInfo::isPhysicalRegister(R->getReg())) {
-      OS << " %" << G->getTarget().getRegisterInfo()->getName(R->getReg());
-    } else {
-      OS << " %reg" << R->getReg();
-    }
+    OS << ' ' << PrintReg(R->getReg(), G ? G->getTarget().getRegisterInfo() :0);
    } else if (const ExternalSymbolSDNode *ES =
               dyn_cast<ExternalSymbolSDNode>(this)) {
      OS << "'" << ES->getSymbol() << "'";
@@ -6119,6 +6328,9 @@ static void printrWithDepthHelper(raw_ostream &OS, const SDNode *N,
      return;
  
    for (unsigned i = 0, e = N->getNumOperands(); i != e; ++i) {
+    // Don't follow chain operands.
+    if (N->getOperand(i).getValueType() == MVT::Other)
+      continue;
      OS << '\n';
      printrWithDepthHelper(OS, N->getOperand(i).getNode(), G, depth-1, indent+2);
    }
@@ -6131,7 +6343,7 @@ void SDNode::printrWithDepth(raw_ostream &OS, const SelectionDAG *G,
  
  void SDNode::printrFull(raw_ostream &OS, const SelectionDAG *G) const {
    // Don't print impossibly deep things.
-  printrWithDepth(OS, G, 100);
+  printrWithDepth(OS, G, 10);
  }
  
  void SDNode::dumprWithDepth(const SelectionDAG *G, unsigned depth) const {
@@ -6140,7 +6352,7 @@ void SDNode::dumprWithDepth(const SelectionDAG *G, unsigned depth) const {
  
  void SDNode::dumprFull(const SelectionDAG *G) const {
    // Don't print impossibly deep things.
-  dumprWithDepth(G, 100);
+  dumprWithDepth(G, 10);
  }
  
  static void DumpNodes(const SDNode *N, unsigned indent, const SelectionDAG *G) {
@@ -6186,7 +6398,7 @@ SDValue SelectionDAG::UnrollVectorOp(SDNode *N, unsigned ResNE) {
          Operands[j] = getNode(ISD::EXTRACT_VECTOR_ELT, dl,
                                OperandEltVT,
                                Operand,
-                              getConstant(i, MVT::i32));
+                              getConstant(i, TLI.getPointerTy()));
        } else {
          // A scalar operand; just use it as is.
          Operands[j] = Operand;
@@ -6204,7 +6416,8 @@ SDValue SelectionDAG::UnrollVectorOp(SDNode *N, unsigned ResNE) {
      case ISD::ROTL:
      case ISD::ROTR:
        Scalars.push_back(getNode(N->getOpcode(), dl, EltVT, Operands[0],
-                                getShiftAmountOperand(Operands[1])));
+                                getShiftAmountOperand(Operands[0].getValueType(),
+                                                      Operands[1])));
        break;
      case ISD::SIGN_EXTEND_INREG:
      case ISD::FP_ROUND_INREG: {
@@ -6249,11 +6462,11 @@ bool SelectionDAG::isConsecutiveLoad(LoadSDNode *LD, LoadSDNode *Base,
      if (FS != BFS || FS != (int)Bytes) return false;
      return MFI->getObjectOffset(FI) == (MFI->getObjectOffset(BFI) + Dist*Bytes);
    }
-  if (Loc.getOpcode() == ISD::ADD && Loc.getOperand(0) == BaseLoc) {
-    ConstantSDNode *V = dyn_cast<ConstantSDNode>(Loc.getOperand(1));
-    if (V && (V->getSExtValue() == Dist*Bytes))
-      return true;
-  }
+
+  // Handle X+C
+  if (isBaseWithConstantOffset(Loc) && Loc.getOperand(0) == BaseLoc &&
+      cast<ConstantSDNode>(Loc.getOperand(1))->getSExtValue() == Dist*Bytes)
+    return true;
  
    const GlobalValue *GV1 = NULL;
    const GlobalValue *GV2 = NULL;
@@ -6294,15 +6507,14 @@ unsigned SelectionDAG::InferPtrAlignment(SDValue Ptr) const {
    int64_t FrameOffset = 0;
    if (FrameIndexSDNode *FI = dyn_cast<FrameIndexSDNode>(Ptr)) {
      FrameIdx = FI->getIndex();
-  } else if (Ptr.getOpcode() == ISD::ADD &&
-             isa<ConstantSDNode>(Ptr.getOperand(1)) &&
+  } else if (isBaseWithConstantOffset(Ptr) &&
               isa<FrameIndexSDNode>(Ptr.getOperand(0))) {
+    // Handle FI+Cst
      FrameIdx = cast<FrameIndexSDNode>(Ptr.getOperand(0))->getIndex();
      FrameOffset = Ptr.getConstantOperandVal(1);
    }
  
    if (FrameIdx != (1 << 31)) {
-    // FIXME: Handle FI+CST.
      const MachineFrameInfo &MFI = *getMachineFunction().getFrameInfo();
      unsigned FIInfoAlign = MinAlign(MFI.getObjectAlignment(FrameIdx),
                                      FrameOffset);
@@ -6386,7 +6598,7 @@ unsigned GlobalAddressSDNode::getAddressSpace() const {
  }
  
  
-const Type *ConstantPoolSDNode::getType() const {
+Type *ConstantPoolSDNode::getType() const {
    if (isMachineConstantPoolEntry())
      return Val.MachineCPVal->getType();
    return Val.ConstVal->getType();