#include "llvm/Instructions.h"
#include "llvm/Intrinsics.h"
#include "llvm/IntrinsicInst.h"
-#include "llvm/ParameterAttributes.h"
+#include "llvm/Module.h"
#include "llvm/CodeGen/FastISel.h"
#include "llvm/CodeGen/GCStrategy.h"
#include "llvm/CodeGen/GCMetadata.h"
#include "llvm/CodeGen/MachineJumpTableInfo.h"
#include "llvm/CodeGen/MachineModuleInfo.h"
#include "llvm/CodeGen/MachineRegisterInfo.h"
+#include "llvm/CodeGen/PseudoSourceValue.h"
#include "llvm/CodeGen/SelectionDAG.h"
#include "llvm/Target/TargetRegisterInfo.h"
#include "llvm/Target/TargetData.h"
static bool isOnlyUsedInEntryBlock(Argument *A, bool EnableFastISel) {
// With FastISel active, we may be splitting blocks, so force creation
// of virtual registers for all non-dead arguments.
- if (EnableFastISel)
+ // Don't force virtual registers for byval arguments though, because
+ // fast-isel can't handle those in all cases.
+ if (EnableFastISel && !A->hasByValAttr())
return A->use_empty();
BasicBlock *Entry = A->getParent()->begin();
ValueVT : MVT::getIntegerVT(RoundBits);
SDValue Lo, Hi;
+ MVT HalfVT = ValueVT.isInteger() ?
+ MVT::getIntegerVT(RoundBits/2) :
+ MVT::getFloatingPointVT(RoundBits/2);
+
if (RoundParts > 2) {
- MVT HalfVT = MVT::getIntegerVT(RoundBits/2);
Lo = getCopyFromParts(DAG, Parts, RoundParts/2, PartVT, HalfVT);
Hi = getCopyFromParts(DAG, Parts+RoundParts/2, RoundParts/2,
PartVT, HalfVT);
} else {
- Lo = Parts[0];
- Hi = Parts[1];
+ Lo = DAG.getNode(ISD::BIT_CONVERT, HalfVT, Parts[0]);
+ Hi = DAG.getNode(ISD::BIT_CONVERT, HalfVT, Parts[1]);
}
if (TLI.isBigEndian())
std::swap(Lo, Hi);
/// getCopyToParts - Create a series of nodes that contain the specified value
/// split into legal parts. If the parts contain more bits than Val, then, for
/// integers, ExtendKind can be used to specify how to generate the extra bits.
-static void getCopyToParts(SelectionDAG &DAG,
- SDValue Val,
- SDValue *Parts,
- unsigned NumParts,
- MVT PartVT,
+static void getCopyToParts(SelectionDAG &DAG, SDValue Val,
+ SDValue *Parts, unsigned NumParts, MVT PartVT,
ISD::NodeType ExtendKind = ISD::ANY_EXTEND) {
TargetLowering &TLI = DAG.getTargetLoweringInfo();
MVT PtrVT = TLI.getPointerTy();
MVT VT = TLI.getValueType(V->getType(), true);
if (ConstantInt *CI = dyn_cast<ConstantInt>(C))
- return N = DAG.getConstant(CI->getValue(), VT);
+ return N = DAG.getConstant(*CI, VT);
if (GlobalValue *GV = dyn_cast<GlobalValue>(C))
return N = DAG.getGlobalAddress(GV, VT);
return N = DAG.getConstant(0, TLI.getPointerTy());
if (ConstantFP *CFP = dyn_cast<ConstantFP>(C))
- return N = DAG.getConstantFP(CFP->getValueAPF(), VT);
+ return N = DAG.getConstantFP(*CFP, VT);
if (isa<UndefValue>(C) && !isa<VectorType>(V->getType()) &&
!V->getType()->isAggregateType())
SmallVector<SDValue, 8> NewValues;
NewValues.push_back(getControlRoot());
for (unsigned i = 0, e = I.getNumOperands(); i != e; ++i) {
- SDValue RetOp = getValue(I.getOperand(i));
-
SmallVector<MVT, 4> ValueVTs;
ComputeValueVTs(TLI, I.getOperand(i)->getType(), ValueVTs);
- for (unsigned j = 0, f = ValueVTs.size(); j != f; ++j) {
+ unsigned NumValues = ValueVTs.size();
+ if (NumValues == 0) continue;
+
+ SDValue RetOp = getValue(I.getOperand(i));
+ for (unsigned j = 0, f = NumValues; j != f; ++j) {
MVT VT = ValueVTs[j];
// FIXME: C calling convention requires the return type to be promoted to
- // at least 32-bit. But this is not necessary for non-C calling conventions.
+ // at least 32-bit. But this is not necessary for non-C calling
+ // conventions.
if (VT.isInteger()) {
MVT MinVT = TLI.getRegisterType(MVT::i32);
if (VT.bitsLT(MinVT))
ISD::NodeType ExtendKind = ISD::ANY_EXTEND;
const Function *F = I.getParent()->getParent();
- if (F->paramHasAttr(0, ParamAttr::SExt))
+ if (F->paramHasAttr(0, Attribute::SExt))
ExtendKind = ISD::SIGN_EXTEND;
- else if (F->paramHasAttr(0, ParamAttr::ZExt))
+ else if (F->paramHasAttr(0, Attribute::ZExt))
ExtendKind = ISD::ZERO_EXTEND;
getCopyToParts(DAG, SDValue(RetOp.getNode(), RetOp.getResNo() + j),
&Parts[0], NumParts, PartVT, ExtendKind);
+ // 'inreg' on function refers to return value
+ ISD::ArgFlagsTy Flags = ISD::ArgFlagsTy();
+ if (F->paramHasAttr(0, Attribute::InReg))
+ Flags.setInReg();
for (unsigned i = 0; i < NumParts; ++i) {
NewValues.push_back(Parts[i]);
- NewValues.push_back(DAG.getArgFlags(ISD::ArgFlagsTy()));
+ NewValues.push_back(DAG.getArgFlags(Flags));
}
}
}
return true;
}
+/// getFCmpCondCode - Return the ISD condition code corresponding to
+/// the given LLVM IR floating-point condition code. This includes
+/// consideration of global floating-point math flags.
+///
+static ISD::CondCode getFCmpCondCode(FCmpInst::Predicate Pred) {
+ ISD::CondCode FPC, FOC;
+ switch (Pred) {
+ case FCmpInst::FCMP_FALSE: FOC = FPC = ISD::SETFALSE; break;
+ case FCmpInst::FCMP_OEQ: FOC = ISD::SETEQ; FPC = ISD::SETOEQ; break;
+ case FCmpInst::FCMP_OGT: FOC = ISD::SETGT; FPC = ISD::SETOGT; break;
+ case FCmpInst::FCMP_OGE: FOC = ISD::SETGE; FPC = ISD::SETOGE; break;
+ case FCmpInst::FCMP_OLT: FOC = ISD::SETLT; FPC = ISD::SETOLT; break;
+ case FCmpInst::FCMP_OLE: FOC = ISD::SETLE; FPC = ISD::SETOLE; break;
+ case FCmpInst::FCMP_ONE: FOC = ISD::SETNE; FPC = ISD::SETONE; break;
+ case FCmpInst::FCMP_ORD: FOC = FPC = ISD::SETO; break;
+ case FCmpInst::FCMP_UNO: FOC = FPC = ISD::SETUO; break;
+ case FCmpInst::FCMP_UEQ: FOC = ISD::SETEQ; FPC = ISD::SETUEQ; break;
+ case FCmpInst::FCMP_UGT: FOC = ISD::SETGT; FPC = ISD::SETUGT; break;
+ case FCmpInst::FCMP_UGE: FOC = ISD::SETGE; FPC = ISD::SETUGE; break;
+ case FCmpInst::FCMP_ULT: FOC = ISD::SETLT; FPC = ISD::SETULT; break;
+ case FCmpInst::FCMP_ULE: FOC = ISD::SETLE; FPC = ISD::SETULE; break;
+ case FCmpInst::FCMP_UNE: FOC = ISD::SETNE; FPC = ISD::SETUNE; break;
+ case FCmpInst::FCMP_TRUE: FOC = FPC = ISD::SETTRUE; break;
+ default:
+ assert(0 && "Invalid FCmp predicate opcode!");
+ FOC = FPC = ISD::SETFALSE;
+ break;
+ }
+ if (FiniteOnlyFPMath())
+ return FOC;
+ else
+ return FPC;
+}
+
+/// getICmpCondCode - Return the ISD condition code corresponding to
+/// the given LLVM IR integer condition code.
+///
+static ISD::CondCode getICmpCondCode(ICmpInst::Predicate Pred) {
+ switch (Pred) {
+ case ICmpInst::ICMP_EQ: return ISD::SETEQ;
+ case ICmpInst::ICMP_NE: return ISD::SETNE;
+ case ICmpInst::ICMP_SLE: return ISD::SETLE;
+ case ICmpInst::ICMP_ULE: return ISD::SETULE;
+ case ICmpInst::ICMP_SGE: return ISD::SETGE;
+ case ICmpInst::ICMP_UGE: return ISD::SETUGE;
+ case ICmpInst::ICMP_SLT: return ISD::SETLT;
+ case ICmpInst::ICMP_ULT: return ISD::SETULT;
+ case ICmpInst::ICMP_SGT: return ISD::SETGT;
+ case ICmpInst::ICMP_UGT: return ISD::SETUGT;
+ default:
+ assert(0 && "Invalid ICmp predicate opcode!");
+ return ISD::SETNE;
+ }
+}
+
+/// EmitBranchForMergedCondition - Helper method for FindMergedConditions.
+/// This function emits a branch and is used at the leaves of an OR or an
+/// AND operator tree.
+///
+void
+SelectionDAGLowering::EmitBranchForMergedCondition(Value *Cond,
+ MachineBasicBlock *TBB,
+ MachineBasicBlock *FBB,
+ MachineBasicBlock *CurBB) {
+ const BasicBlock *BB = CurBB->getBasicBlock();
+
+ // If the leaf of the tree is a comparison, merge the condition into
+ // the caseblock.
+ if (CmpInst *BOp = dyn_cast<CmpInst>(Cond)) {
+ // The operands of the cmp have to be in this block. We don't know
+ // how to export them from some other block. If this is the first block
+ // of the sequence, no exporting is needed.
+ if (CurBB == CurMBB ||
+ (isExportableFromCurrentBlock(BOp->getOperand(0), BB) &&
+ isExportableFromCurrentBlock(BOp->getOperand(1), BB))) {
+ ISD::CondCode Condition;
+ if (ICmpInst *IC = dyn_cast<ICmpInst>(Cond)) {
+ Condition = getICmpCondCode(IC->getPredicate());
+ } else if (FCmpInst *FC = dyn_cast<FCmpInst>(Cond)) {
+ Condition = getFCmpCondCode(FC->getPredicate());
+ } else {
+ Condition = ISD::SETEQ; // silence warning.
+ assert(0 && "Unknown compare instruction");
+ }
+
+ CaseBlock CB(Condition, BOp->getOperand(0),
+ BOp->getOperand(1), NULL, TBB, FBB, CurBB);
+ SwitchCases.push_back(CB);
+ return;
+ }
+ }
+
+ // Create a CaseBlock record representing this branch.
+ CaseBlock CB(ISD::SETEQ, Cond, ConstantInt::getTrue(),
+ NULL, TBB, FBB, CurBB);
+ SwitchCases.push_back(CB);
+}
+
/// FindMergedConditions - If Cond is an expression like
void SelectionDAGLowering::FindMergedConditions(Value *Cond,
MachineBasicBlock *TBB,
unsigned Opc) {
// If this node is not part of the or/and tree, emit it as a branch.
Instruction *BOp = dyn_cast<Instruction>(Cond);
-
if (!BOp || !(isa<BinaryOperator>(BOp) || isa<CmpInst>(BOp)) ||
(unsigned)BOp->getOpcode() != Opc || !BOp->hasOneUse() ||
BOp->getParent() != CurBB->getBasicBlock() ||
!InBlock(BOp->getOperand(0), CurBB->getBasicBlock()) ||
!InBlock(BOp->getOperand(1), CurBB->getBasicBlock())) {
- const BasicBlock *BB = CurBB->getBasicBlock();
-
- // If the leaf of the tree is a comparison, merge the condition into
- // the caseblock.
- if ((isa<ICmpInst>(Cond) || isa<FCmpInst>(Cond)) &&
- // The operands of the cmp have to be in this block. We don't know
- // how to export them from some other block. If this is the first block
- // of the sequence, no exporting is needed.
- (CurBB == CurMBB ||
- (isExportableFromCurrentBlock(BOp->getOperand(0), BB) &&
- isExportableFromCurrentBlock(BOp->getOperand(1), BB)))) {
- BOp = cast<Instruction>(Cond);
- ISD::CondCode Condition;
- if (ICmpInst *IC = dyn_cast<ICmpInst>(Cond)) {
- switch (IC->getPredicate()) {
- default: assert(0 && "Unknown icmp predicate opcode!");
- case ICmpInst::ICMP_EQ: Condition = ISD::SETEQ; break;
- case ICmpInst::ICMP_NE: Condition = ISD::SETNE; break;
- case ICmpInst::ICMP_SLE: Condition = ISD::SETLE; break;
- case ICmpInst::ICMP_ULE: Condition = ISD::SETULE; break;
- case ICmpInst::ICMP_SGE: Condition = ISD::SETGE; break;
- case ICmpInst::ICMP_UGE: Condition = ISD::SETUGE; break;
- case ICmpInst::ICMP_SLT: Condition = ISD::SETLT; break;
- case ICmpInst::ICMP_ULT: Condition = ISD::SETULT; break;
- case ICmpInst::ICMP_SGT: Condition = ISD::SETGT; break;
- case ICmpInst::ICMP_UGT: Condition = ISD::SETUGT; break;
- }
- } else if (FCmpInst *FC = dyn_cast<FCmpInst>(Cond)) {
- ISD::CondCode FPC, FOC;
- switch (FC->getPredicate()) {
- default: assert(0 && "Unknown fcmp predicate opcode!");
- case FCmpInst::FCMP_FALSE: FOC = FPC = ISD::SETFALSE; break;
- case FCmpInst::FCMP_OEQ: FOC = ISD::SETEQ; FPC = ISD::SETOEQ; break;
- case FCmpInst::FCMP_OGT: FOC = ISD::SETGT; FPC = ISD::SETOGT; break;
- case FCmpInst::FCMP_OGE: FOC = ISD::SETGE; FPC = ISD::SETOGE; break;
- case FCmpInst::FCMP_OLT: FOC = ISD::SETLT; FPC = ISD::SETOLT; break;
- case FCmpInst::FCMP_OLE: FOC = ISD::SETLE; FPC = ISD::SETOLE; break;
- case FCmpInst::FCMP_ONE: FOC = ISD::SETNE; FPC = ISD::SETONE; break;
- case FCmpInst::FCMP_ORD: FOC = FPC = ISD::SETO; break;
- case FCmpInst::FCMP_UNO: FOC = FPC = ISD::SETUO; break;
- case FCmpInst::FCMP_UEQ: FOC = ISD::SETEQ; FPC = ISD::SETUEQ; break;
- case FCmpInst::FCMP_UGT: FOC = ISD::SETGT; FPC = ISD::SETUGT; break;
- case FCmpInst::FCMP_UGE: FOC = ISD::SETGE; FPC = ISD::SETUGE; break;
- case FCmpInst::FCMP_ULT: FOC = ISD::SETLT; FPC = ISD::SETULT; break;
- case FCmpInst::FCMP_ULE: FOC = ISD::SETLE; FPC = ISD::SETULE; break;
- case FCmpInst::FCMP_UNE: FOC = ISD::SETNE; FPC = ISD::SETUNE; break;
- case FCmpInst::FCMP_TRUE: FOC = FPC = ISD::SETTRUE; break;
- }
- if (FiniteOnlyFPMath())
- Condition = FOC;
- else
- Condition = FPC;
- } else {
- Condition = ISD::SETEQ; // silence warning.
- assert(0 && "Unknown compare instruction");
- }
-
- CaseBlock CB(Condition, BOp->getOperand(0),
- BOp->getOperand(1), NULL, TBB, FBB, CurBB);
- SwitchCases.push_back(CB);
- return;
- }
-
- // Create a CaseBlock record representing this branch.
- CaseBlock CB(ISD::SETEQ, Cond, ConstantInt::getTrue(),
- NULL, TBB, FBB, CurBB);
- SwitchCases.push_back(CB);
+ EmitBranchForMergedCondition(Cond, TBB, FBB, CurBB);
return;
}
-
// Create TmpBB after CurBB.
MachineFunction::iterator BBI = CurBB;
MachineFunction &MF = DAG.getMachineFunction();
predicate = ICmpInst::Predicate(IC->getPredicate());
SDValue Op1 = getValue(I.getOperand(0));
SDValue Op2 = getValue(I.getOperand(1));
- ISD::CondCode Opcode;
- switch (predicate) {
- case ICmpInst::ICMP_EQ : Opcode = ISD::SETEQ; break;
- case ICmpInst::ICMP_NE : Opcode = ISD::SETNE; break;
- case ICmpInst::ICMP_UGT : Opcode = ISD::SETUGT; break;
- case ICmpInst::ICMP_UGE : Opcode = ISD::SETUGE; break;
- case ICmpInst::ICMP_ULT : Opcode = ISD::SETULT; break;
- case ICmpInst::ICMP_ULE : Opcode = ISD::SETULE; break;
- case ICmpInst::ICMP_SGT : Opcode = ISD::SETGT; break;
- case ICmpInst::ICMP_SGE : Opcode = ISD::SETGE; break;
- case ICmpInst::ICMP_SLT : Opcode = ISD::SETLT; break;
- case ICmpInst::ICMP_SLE : Opcode = ISD::SETLE; break;
- default:
- assert(!"Invalid ICmp predicate value");
- Opcode = ISD::SETEQ;
- break;
- }
+ ISD::CondCode Opcode = getICmpCondCode(predicate);
setValue(&I, DAG.getSetCC(MVT::i1, Op1, Op2, Opcode));
}
predicate = FCmpInst::Predicate(FC->getPredicate());
SDValue Op1 = getValue(I.getOperand(0));
SDValue Op2 = getValue(I.getOperand(1));
- ISD::CondCode Condition, FOC, FPC;
- switch (predicate) {
- case FCmpInst::FCMP_FALSE: FOC = FPC = ISD::SETFALSE; break;
- case FCmpInst::FCMP_OEQ: FOC = ISD::SETEQ; FPC = ISD::SETOEQ; break;
- case FCmpInst::FCMP_OGT: FOC = ISD::SETGT; FPC = ISD::SETOGT; break;
- case FCmpInst::FCMP_OGE: FOC = ISD::SETGE; FPC = ISD::SETOGE; break;
- case FCmpInst::FCMP_OLT: FOC = ISD::SETLT; FPC = ISD::SETOLT; break;
- case FCmpInst::FCMP_OLE: FOC = ISD::SETLE; FPC = ISD::SETOLE; break;
- case FCmpInst::FCMP_ONE: FOC = ISD::SETNE; FPC = ISD::SETONE; break;
- case FCmpInst::FCMP_ORD: FOC = FPC = ISD::SETO; break;
- case FCmpInst::FCMP_UNO: FOC = FPC = ISD::SETUO; break;
- case FCmpInst::FCMP_UEQ: FOC = ISD::SETEQ; FPC = ISD::SETUEQ; break;
- case FCmpInst::FCMP_UGT: FOC = ISD::SETGT; FPC = ISD::SETUGT; break;
- case FCmpInst::FCMP_UGE: FOC = ISD::SETGE; FPC = ISD::SETUGE; break;
- case FCmpInst::FCMP_ULT: FOC = ISD::SETLT; FPC = ISD::SETULT; break;
- case FCmpInst::FCMP_ULE: FOC = ISD::SETLE; FPC = ISD::SETULE; break;
- case FCmpInst::FCMP_UNE: FOC = ISD::SETNE; FPC = ISD::SETUNE; break;
- case FCmpInst::FCMP_TRUE: FOC = FPC = ISD::SETTRUE; break;
- default:
- assert(!"Invalid FCmp predicate value");
- FOC = FPC = ISD::SETFALSE;
- break;
- }
- if (FiniteOnlyFPMath())
- Condition = FOC;
- else
- Condition = FPC;
+ ISD::CondCode Condition = getFCmpCondCode(predicate);
setValue(&I, DAG.getSetCC(MVT::i1, Op1, Op2, Condition));
}
predicate = ICmpInst::Predicate(IC->getPredicate());
SDValue Op1 = getValue(I.getOperand(0));
SDValue Op2 = getValue(I.getOperand(1));
- ISD::CondCode Opcode;
- switch (predicate) {
- case ICmpInst::ICMP_EQ : Opcode = ISD::SETEQ; break;
- case ICmpInst::ICMP_NE : Opcode = ISD::SETNE; break;
- case ICmpInst::ICMP_UGT : Opcode = ISD::SETUGT; break;
- case ICmpInst::ICMP_UGE : Opcode = ISD::SETUGE; break;
- case ICmpInst::ICMP_ULT : Opcode = ISD::SETULT; break;
- case ICmpInst::ICMP_ULE : Opcode = ISD::SETULE; break;
- case ICmpInst::ICMP_SGT : Opcode = ISD::SETGT; break;
- case ICmpInst::ICMP_SGE : Opcode = ISD::SETGE; break;
- case ICmpInst::ICMP_SLT : Opcode = ISD::SETLT; break;
- case ICmpInst::ICMP_SLE : Opcode = ISD::SETLE; break;
- default:
- assert(!"Invalid ICmp predicate value");
- Opcode = ISD::SETEQ;
- break;
- }
+ ISD::CondCode Opcode = getICmpCondCode(predicate);
setValue(&I, DAG.getVSetCC(Op1.getValueType(), Op1, Op2, Opcode));
}
predicate = FCmpInst::Predicate(FC->getPredicate());
SDValue Op1 = getValue(I.getOperand(0));
SDValue Op2 = getValue(I.getOperand(1));
- ISD::CondCode Condition, FOC, FPC;
- switch (predicate) {
- case FCmpInst::FCMP_FALSE: FOC = FPC = ISD::SETFALSE; break;
- case FCmpInst::FCMP_OEQ: FOC = ISD::SETEQ; FPC = ISD::SETOEQ; break;
- case FCmpInst::FCMP_OGT: FOC = ISD::SETGT; FPC = ISD::SETOGT; break;
- case FCmpInst::FCMP_OGE: FOC = ISD::SETGE; FPC = ISD::SETOGE; break;
- case FCmpInst::FCMP_OLT: FOC = ISD::SETLT; FPC = ISD::SETOLT; break;
- case FCmpInst::FCMP_OLE: FOC = ISD::SETLE; FPC = ISD::SETOLE; break;
- case FCmpInst::FCMP_ONE: FOC = ISD::SETNE; FPC = ISD::SETONE; break;
- case FCmpInst::FCMP_ORD: FOC = FPC = ISD::SETO; break;
- case FCmpInst::FCMP_UNO: FOC = FPC = ISD::SETUO; break;
- case FCmpInst::FCMP_UEQ: FOC = ISD::SETEQ; FPC = ISD::SETUEQ; break;
- case FCmpInst::FCMP_UGT: FOC = ISD::SETGT; FPC = ISD::SETUGT; break;
- case FCmpInst::FCMP_UGE: FOC = ISD::SETGE; FPC = ISD::SETUGE; break;
- case FCmpInst::FCMP_ULT: FOC = ISD::SETLT; FPC = ISD::SETULT; break;
- case FCmpInst::FCMP_ULE: FOC = ISD::SETLE; FPC = ISD::SETULE; break;
- case FCmpInst::FCMP_UNE: FOC = ISD::SETNE; FPC = ISD::SETUNE; break;
- case FCmpInst::FCMP_TRUE: FOC = FPC = ISD::SETTRUE; break;
- default:
- assert(!"Invalid VFCmp predicate value");
- FOC = FPC = ISD::SETFALSE;
- break;
- }
- if (FiniteOnlyFPMath())
- Condition = FOC;
- else
- Condition = FPC;
-
+ ISD::CondCode Condition = getFCmpCondCode(predicate);
MVT DestVT = TLI.getValueType(I.getType());
setValue(&I, DAG.getVSetCC(DestVT, Op1, Op2, Condition));
}
/// visitSelect - Lower a select instruction.  Aggregate-typed selects are
/// expanded into one ISD::SELECT per member value and re-merged with
/// ISD::MERGE_VALUES.
void SelectionDAGLowering::visitSelect(User &I) {
  SmallVector<MVT, 4> ValueVTs;
  ComputeValueVTs(TLI, I.getType(), ValueVTs);
  unsigned NumValues = ValueVTs.size();
  if (NumValues != 0) {
    SmallVector<SDValue, 4> Values(NumValues);
    SDValue Cond     = getValue(I.getOperand(0));
    SDValue TrueVal  = getValue(I.getOperand(1));
    SDValue FalseVal = getValue(I.getOperand(2));

    for (unsigned i = 0; i != NumValues; ++i)
      // Bug fix: use the type of the i-th result, not TrueVal.getValueType()
      // (the type of result 0), which is wrong for aggregates whose members
      // have different types.
      Values[i] = DAG.getNode(ISD::SELECT,
                     TrueVal.getNode()->getValueType(TrueVal.getResNo() + i),
                     Cond,
                     SDValue(TrueVal.getNode(), TrueVal.getResNo() + i),
                     SDValue(FalseVal.getNode(), FalseVal.getResNo() + i));

    setValue(&I, DAG.getNode(ISD::MERGE_VALUES,
                             DAG.getVTList(&ValueVTs[0], NumValues),
                             &Values[0], NumValues));
  }
}
}
void SelectionDAGLowering::visitSIToFP(User &I){
- // UIToFP is never a no-op cast, no need to check
+ // SIToFP is never a no-op cast, no need to check
SDValue N = getValue(I.getOperand(0));
MVT DestVT = TLI.getValueType(I.getType());
setValue(&I, DAG.getNode(ISD::SINT_TO_FP, DestVT, N));
TLI.getValueType(I.getType()), InVec, InIdx));
}
+
+// Utility for visitShuffleVector - Returns true if the mask is mask starting
+// from SIndx and increasing to the element length (undefs are allowed).
+static bool SequentialMask(SDValue Mask, unsigned SIndx) {
+ unsigned MaskNumElts = Mask.getNumOperands();
+ for (unsigned i = 0; i != MaskNumElts; ++i) {
+ if (Mask.getOperand(i).getOpcode() != ISD::UNDEF) {
+ unsigned Idx = cast<ConstantSDNode>(Mask.getOperand(i))->getZExtValue();
+ if (Idx != i + SIndx)
+ return false;
+ }
+ }
+ return true;
+}
+
/// visitShuffleVector - Lower a shufflevector instruction.  The mask length
/// may differ from the source vector length; in that case the shuffle is
/// normalized by concatenating with undef, extracting subvectors, or, as a
/// last resort, rebuilding the result element by element.
void SelectionDAGLowering::visitShuffleVector(User &I) {
  SDValue Src1 = getValue(I.getOperand(0));
  SDValue Src2 = getValue(I.getOperand(1));
  SDValue Mask = getValue(I.getOperand(2));

  MVT VT = TLI.getValueType(I.getType());
  MVT SrcVT = Src1.getValueType();
  int MaskNumElts = Mask.getNumOperands();
  int SrcNumElts = SrcVT.getVectorNumElements();

  if (SrcNumElts == MaskNumElts) {
    // Mask and vector lengths agree; emit the shuffle directly.
    setValue(&I, DAG.getNode(ISD::VECTOR_SHUFFLE, VT, Src1, Src2, Mask));
    return;
  }

  // Normalize the shuffle vector since mask and vector length don't match.
  MVT MaskEltVT = Mask.getValueType().getVectorElementType();

  if (SrcNumElts < MaskNumElts && MaskNumElts % SrcNumElts == 0) {
    // Mask is longer than the source vectors and is a multiple of the source
    // vectors.  We can use concatenate vector to make the mask and vectors
    // lengths match.
    if (SrcNumElts*2 == MaskNumElts && SequentialMask(Mask, 0)) {
      // The shuffle is concatenating two vectors together.
      setValue(&I, DAG.getNode(ISD::CONCAT_VECTORS, VT, Src1, Src2));
      return;
    }

    // Pad both vectors with undefs to make them the same length as the mask.
    unsigned NumConcat = MaskNumElts / SrcNumElts;
    SDValue UndefVal = DAG.getNode(ISD::UNDEF, SrcVT);

    // Use SmallVectors instead of raw new[]/delete[]: cannot leak on any
    // path and avoids heap traffic in the common small cases.
    SmallVector<SDValue, 8> MOps1(NumConcat, UndefVal);
    SmallVector<SDValue, 8> MOps2(NumConcat, UndefVal);
    MOps1[0] = Src1;
    MOps2[0] = Src2;
    Src1 = DAG.getNode(ISD::CONCAT_VECTORS, VT, &MOps1[0], NumConcat);
    Src2 = DAG.getNode(ISD::CONCAT_VECTORS, VT, &MOps2[0], NumConcat);

    // Readjust mask for new input vector length: elements selecting from
    // Src2 shift up, since Src2 now begins at element MaskNumElts instead
    // of SrcNumElts.
    SmallVector<SDValue, 8> MappedOps;
    for (int i = 0; i != MaskNumElts; ++i) {
      if (Mask.getOperand(i).getOpcode() == ISD::UNDEF) {
        MappedOps.push_back(Mask.getOperand(i));
      } else {
        int Idx = cast<ConstantSDNode>(Mask.getOperand(i))->getZExtValue();
        if (Idx < SrcNumElts)
          MappedOps.push_back(DAG.getConstant(Idx, MaskEltVT));
        else
          MappedOps.push_back(DAG.getConstant(Idx + MaskNumElts - SrcNumElts,
                                              MaskEltVT));
      }
    }
    Mask = DAG.getNode(ISD::BUILD_VECTOR, Mask.getValueType(),
                       &MappedOps[0], MappedOps.size());

    setValue(&I, DAG.getNode(ISD::VECTOR_SHUFFLE, VT, Src1, Src2, Mask));
    return;
  }

  if (SrcNumElts > MaskNumElts) {
    // Resulting vector is shorter than the incoming vector.
    // (Dead code removed: the original also tested SrcNumElts == MaskNumElts
    // here to recognize whole-source extraction, but that can never hold
    // inside this branch.)

    // Analyze the access pattern of the vector to see if we can extract
    // two subvectors and do the shuffle.  The analysis is done by calculating
    // the range of elements the mask accesses on both vectors.
    int MinRange[2] = { SrcNumElts+1, SrcNumElts+1};
    int MaxRange[2] = {-1, -1};

    for (int i = 0; i != MaskNumElts; ++i) {
      SDValue Arg = Mask.getOperand(i);
      if (Arg.getOpcode() != ISD::UNDEF) {
        assert(isa<ConstantSDNode>(Arg) && "Invalid VECTOR_SHUFFLE mask!");
        int Idx = cast<ConstantSDNode>(Arg)->getZExtValue();
        int Input = 0;
        if (Idx >= SrcNumElts) {
          Input = 1;
          Idx -= SrcNumElts;
        }
        if (Idx > MaxRange[Input])
          MaxRange[Input] = Idx;
        if (Idx < MinRange[Input])
          MinRange[Input] = Idx;
      }
    }

    // Check if the access is smaller than the vector size and can we find
    // a reasonable extract index.
    int RangeUse[2] = { 2, 2 }; // 0 = Unused, 1 = Extract, 2 = Can not Extract.
    int StartIdx[2]; // StartIdx to extract from
    for (int Input=0; Input < 2; ++Input) {
      if (MinRange[Input] == SrcNumElts+1 && MaxRange[Input] == -1) {
        RangeUse[Input] = 0; // Unused
        StartIdx[Input] = 0;
      } else if (MaxRange[Input] - MinRange[Input] < MaskNumElts) {
        // Fits within range but we should see if we can find a good
        // start index that is a multiple of the mask length.
        if (MaxRange[Input] < MaskNumElts) {
          RangeUse[Input] = 1; // Extract from beginning of the vector
          StartIdx[Input] = 0;
        } else {
          StartIdx[Input] = (MinRange[Input]/MaskNumElts)*MaskNumElts;
          // NOTE(review): "< SrcNumElts" looks off-by-one ("<=" would also
          // permit extracting the final subvector); kept conservatively.
          if (MaxRange[Input] - StartIdx[Input] < MaskNumElts &&
              StartIdx[Input] + MaskNumElts < SrcNumElts)
            RangeUse[Input] = 1; // Extract from a multiple of the mask length.
        }
      }
    }

    // Bug fix: the original tested RangeUse[0] twice, so any shuffle that
    // used only Src2 was miscompiled into UNDEF.  The second operand must
    // be RangeUse[1].
    if (RangeUse[0] == 0 && RangeUse[1] == 0) {
      setValue(&I, DAG.getNode(ISD::UNDEF, VT)); // Vectors are not used.
      return;
    }
    else if (RangeUse[0] < 2 && RangeUse[1] < 2) {
      // Extract appropriate subvector and generate a vector shuffle
      for (int Input=0; Input < 2; ++Input) {
        SDValue& Src = Input == 0 ? Src1 : Src2;
        if (RangeUse[Input] == 0) {
          Src = DAG.getNode(ISD::UNDEF, VT);
        } else {
          Src = DAG.getNode(ISD::EXTRACT_SUBVECTOR, VT, Src,
                            DAG.getIntPtrConstant(StartIdx[Input]));
        }
      }
      // Calculate new mask relative to the extracted subvectors.
      SmallVector<SDValue, 8> MappedOps;
      for (int i = 0; i != MaskNumElts; ++i) {
        SDValue Arg = Mask.getOperand(i);
        if (Arg.getOpcode() == ISD::UNDEF) {
          MappedOps.push_back(Arg);
        } else {
          int Idx = cast<ConstantSDNode>(Arg)->getZExtValue();
          if (Idx < SrcNumElts)
            MappedOps.push_back(DAG.getConstant(Idx - StartIdx[0], MaskEltVT));
          else {
            Idx = Idx - SrcNumElts - StartIdx[1] + MaskNumElts;
            MappedOps.push_back(DAG.getConstant(Idx, MaskEltVT));
          }
        }
      }
      Mask = DAG.getNode(ISD::BUILD_VECTOR, Mask.getValueType(),
                         &MappedOps[0], MappedOps.size());
      setValue(&I, DAG.getNode(ISD::VECTOR_SHUFFLE, VT, Src1, Src2, Mask));
      return;
    }
  }

  // We can't use either concat vectors or extract subvectors, so fall back
  // to replacing the shuffle with extract and build vector.
  MVT EltVT = VT.getVectorElementType();
  MVT PtrVT = TLI.getPointerTy();
  SmallVector<SDValue,8> Ops;
  for (int i = 0; i != MaskNumElts; ++i) {
    SDValue Arg = Mask.getOperand(i);
    if (Arg.getOpcode() == ISD::UNDEF) {
      Ops.push_back(DAG.getNode(ISD::UNDEF, EltVT));
    } else {
      assert(isa<ConstantSDNode>(Arg) && "Invalid VECTOR_SHUFFLE mask!");
      int Idx = cast<ConstantSDNode>(Arg)->getZExtValue();
      if (Idx < SrcNumElts)
        Ops.push_back(DAG.getNode(ISD::EXTRACT_VECTOR_ELT, EltVT, Src1,
                                  DAG.getConstant(Idx, PtrVT)));
      else
        Ops.push_back(DAG.getNode(ISD::EXTRACT_VECTOR_ELT, EltVT, Src2,
                                  DAG.getConstant(Idx - SrcNumElts, PtrVT)));
    }
  }
  setValue(&I, DAG.getNode(ISD::BUILD_VECTOR, VT, &Ops[0], Ops.size()));
}
void SelectionDAGLowering::visitInsertValue(InsertValueInst &I) {
Values[i] = IntoUndef ? DAG.getNode(ISD::UNDEF, AggValueVTs[i]) :
SDValue(Agg.getNode(), Agg.getResNo() + i);
- setValue(&I, DAG.getMergeValues(DAG.getVTList(&AggValueVTs[0], NumAggValues),
- &Values[0], NumAggValues));
+ setValue(&I, DAG.getNode(ISD::MERGE_VALUES,
+ DAG.getVTList(&AggValueVTs[0], NumAggValues),
+ &Values[0], NumAggValues));
}
void SelectionDAGLowering::visitExtractValue(ExtractValueInst &I) {
// Copy out the selected value(s).
for (unsigned i = LinearIndex; i != LinearIndex + NumValValues; ++i)
Values[i - LinearIndex] =
- OutOfUndef ? DAG.getNode(ISD::UNDEF, Agg.getNode()->getValueType(Agg.getResNo() + i)) :
- SDValue(Agg.getNode(), Agg.getResNo() + i);
-
- setValue(&I, DAG.getMergeValues(DAG.getVTList(&ValValueVTs[0], NumValValues),
- &Values[0], NumValValues));
+ OutOfUndef ?
+ DAG.getNode(ISD::UNDEF,
+ Agg.getNode()->getValueType(Agg.getResNo() + i)) :
+ SDValue(Agg.getNode(), Agg.getResNo() + i);
+
+ setValue(&I, DAG.getNode(ISD::MERGE_VALUES,
+ DAG.getVTList(&ValValueVTs[0], NumValValues),
+ &Values[0], NumValValues));
}
PendingLoads.push_back(Chain);
}
- setValue(&I, DAG.getMergeValues(DAG.getVTList(&ValueVTs[0], NumValues),
- &Values[0], NumValues));
+ setValue(&I, DAG.getNode(ISD::MERGE_VALUES,
+ DAG.getVTList(&ValueVTs[0], NumValues),
+ &Values[0], NumValues));
}
Ops.push_back(getRoot());
}
}
-
- // Add the intrinsic ID as an integer operand.
- Ops.push_back(DAG.getConstant(Intrinsic, TLI.getPointerTy()));
+
+  // Info is set by getTgtMemIntrinsic.
+ TargetLowering::IntrinsicInfo Info;
+ bool IsTgtIntrinsic = TLI.getTgtMemIntrinsic(Info, I, Intrinsic);
+
+ // Add the intrinsic ID as an integer operand if it's not a target intrinsic.
+ if (!IsTgtIntrinsic)
+ Ops.push_back(DAG.getConstant(Intrinsic, TLI.getPointerTy()));
// Add all operands of the call to the operand list.
for (unsigned i = 1, e = I.getNumOperands(); i != e; ++i) {
// Create the node.
SDValue Result;
- if (!HasChain)
+ if (IsTgtIntrinsic) {
+ // This is target intrinsic that touches memory
+ Result = DAG.getMemIntrinsicNode(Info.opc, VTList, VTs.size(),
+ &Ops[0], Ops.size(),
+ Info.memVT, Info.ptrVal, Info.offset,
+ Info.align, Info.vol,
+ Info.readMem, Info.writeMem);
+ }
+ else if (!HasChain)
Result = DAG.getNode(ISD::INTRINSIC_WO_CHAIN, VTList, VTs.size(),
&Ops[0], Ops.size());
else if (I.getType() != Type::VoidTy)
}
-// GetSignificand - Get the significand and build it into a floating-point
-// number with exponent of 1:
-//
-// Op = (Op & 0x007fffff) | 0x3f800000;
-//
-// where Op is the hexidecimal representation of floating point value.
+/// GetSignificand - Get the significand and build it into a floating-point
+/// number with exponent of 1:
+///
+/// Op = (Op & 0x007fffff) | 0x3f800000;
+///
+/// where Op is the hexidecimal representation of floating point value.
static SDValue
GetSignificand(SelectionDAG &DAG, SDValue Op) {
SDValue t1 = DAG.getNode(ISD::AND, MVT::i32, Op,
return DAG.getNode(ISD::BIT_CONVERT, MVT::f32, t2);
}
-// GetExponent - Get the exponent:
-//
-// (float)((Op1 >> 23) - 127);
-//
-// where Op is the hexidecimal representation of floating point value.
+/// GetExponent - Get the exponent:
+///
+/// (float)((Op1 >> 23) - 127);
+///
+/// where Op is the hexidecimal representation of floating point value.
static SDValue
GetExponent(SelectionDAG &DAG, SDValue Op) {
SDValue t1 = DAG.getNode(ISD::SRL, MVT::i32, Op,
return DAG.getNode(ISD::UINT_TO_FP, MVT::f32, t2);
}
+/// getF32Constant - Get 32-bit floating point constant.
+static SDValue
+getF32Constant(SelectionDAG &DAG, unsigned Flt) {
+ return DAG.getConstantFP(APFloat(APInt(32, Flt)), MVT::f32);
+}
+
/// Inlined utility function to implement binary input atomic intrinsics for
/// visitIntrinsicCall: I is a call instruction
/// Op is the associated NodeType for I
return 0;
}
+// implVisitAluOverflow - Lower an overflow instrinsics
+const char *
+SelectionDAGLowering::implVisitAluOverflow(CallInst &I, ISD::NodeType Op) {
+ SDValue Op1 = getValue(I.getOperand(1));
+ SDValue Op2 = getValue(I.getOperand(2));
+
+ MVT ValueVTs[] = { Op1.getValueType(), MVT::i1 };
+ SDValue Ops[] = { Op1, Op2 };
+
+ SDValue Result =
+ DAG.getNode(Op,
+ DAG.getVTList(&ValueVTs[0], 2), &Ops[0], 2);
+
+ setValue(&I, Result);
+ return 0;
+ }
+
/// visitExp - Lower an exp intrinsic. Handles the special sequences for
/// limited-precision mode.
void
// #define LOG2OFe 1.4426950f
// IntegerPartOfX = ((int32_t)(X * LOG2OFe));
SDValue t0 = DAG.getNode(ISD::FMUL, MVT::f32, Op,
- DAG.getConstantFP(APFloat(
- APInt(32, 0x3fb8aa3b)), MVT::f32));
+ getF32Constant(DAG, 0x3fb8aa3b));
SDValue IntegerPartOfX = DAG.getNode(ISD::FP_TO_SINT, MVT::i32, t0);
// FractionalPartOfX = (X * LOG2OFe) - (float)IntegerPartOfX;
//
// error 0.0144103317, which is 6 bits
SDValue t2 = DAG.getNode(ISD::FMUL, MVT::f32, X,
- DAG.getConstantFP(APFloat(
- APInt(32, 0x3e814304)), MVT::f32));
+ getF32Constant(DAG, 0x3e814304));
SDValue t3 = DAG.getNode(ISD::FADD, MVT::f32, t2,
- DAG.getConstantFP(APFloat(
- APInt(32, 0x3f3c50c8)), MVT::f32));
+ getF32Constant(DAG, 0x3f3c50c8));
SDValue t4 = DAG.getNode(ISD::FMUL, MVT::f32, t3, X);
SDValue t5 = DAG.getNode(ISD::FADD, MVT::f32, t4,
- DAG.getConstantFP(APFloat(
- APInt(32, 0x3f7f5e7e)), MVT::f32));
+ getF32Constant(DAG, 0x3f7f5e7e));
SDValue TwoToFracPartOfX = DAG.getNode(ISD::BIT_CONVERT, MVT::i32, t5);
// Add the exponent into the result in integer domain.
//
// 0.000107046256 error, which is 13 to 14 bits
SDValue t2 = DAG.getNode(ISD::FMUL, MVT::f32, X,
- DAG.getConstantFP(APFloat(
- APInt(32, 0x3da235e3)), MVT::f32));
+ getF32Constant(DAG, 0x3da235e3));
SDValue t3 = DAG.getNode(ISD::FADD, MVT::f32, t2,
- DAG.getConstantFP(APFloat(
- APInt(32, 0x3e65b8f3)), MVT::f32));
+ getF32Constant(DAG, 0x3e65b8f3));
SDValue t4 = DAG.getNode(ISD::FMUL, MVT::f32, t3, X);
SDValue t5 = DAG.getNode(ISD::FADD, MVT::f32, t4,
- DAG.getConstantFP(APFloat(
- APInt(32, 0x3f324b07)), MVT::f32));
+ getF32Constant(DAG, 0x3f324b07));
SDValue t6 = DAG.getNode(ISD::FMUL, MVT::f32, t5, X);
SDValue t7 = DAG.getNode(ISD::FADD, MVT::f32, t6,
- DAG.getConstantFP(APFloat(
- APInt(32, 0x3f7ff8fd)), MVT::f32));
+ getF32Constant(DAG, 0x3f7ff8fd));
SDValue TwoToFracPartOfX = DAG.getNode(ISD::BIT_CONVERT, MVT::i32, t7);
// Add the exponent into the result in integer domain.
//
// error 2.47208000*10^(-7), which is better than 18 bits
SDValue t2 = DAG.getNode(ISD::FMUL, MVT::f32, X,
- DAG.getConstantFP(APFloat(
- APInt(32, 0x3924b03e)), MVT::f32));
+ getF32Constant(DAG, 0x3924b03e));
SDValue t3 = DAG.getNode(ISD::FADD, MVT::f32, t2,
- DAG.getConstantFP(APFloat(
- APInt(32, 0x3ab24b87)), MVT::f32));
+ getF32Constant(DAG, 0x3ab24b87));
SDValue t4 = DAG.getNode(ISD::FMUL, MVT::f32, t3, X);
SDValue t5 = DAG.getNode(ISD::FADD, MVT::f32, t4,
- DAG.getConstantFP(APFloat(
- APInt(32, 0x3c1d8c17)), MVT::f32));
+ getF32Constant(DAG, 0x3c1d8c17));
SDValue t6 = DAG.getNode(ISD::FMUL, MVT::f32, t5, X);
SDValue t7 = DAG.getNode(ISD::FADD, MVT::f32, t6,
- DAG.getConstantFP(APFloat(
- APInt(32, 0x3d634a1d)), MVT::f32));
+ getF32Constant(DAG, 0x3d634a1d));
SDValue t8 = DAG.getNode(ISD::FMUL, MVT::f32, t7, X);
SDValue t9 = DAG.getNode(ISD::FADD, MVT::f32, t8,
- DAG.getConstantFP(APFloat(
- APInt(32, 0x3e75fe14)), MVT::f32));
+ getF32Constant(DAG, 0x3e75fe14));
SDValue t10 = DAG.getNode(ISD::FMUL, MVT::f32, t9, X);
SDValue t11 = DAG.getNode(ISD::FADD, MVT::f32, t10,
- DAG.getConstantFP(APFloat(
- APInt(32, 0x3f317234)), MVT::f32));
+ getF32Constant(DAG, 0x3f317234));
SDValue t12 = DAG.getNode(ISD::FMUL, MVT::f32, t11, X);
SDValue t13 = DAG.getNode(ISD::FADD, MVT::f32, t12,
- DAG.getConstantFP(APFloat(
- APInt(32, 0x3f800000)), MVT::f32));
+ getF32Constant(DAG, 0x3f800000));
SDValue TwoToFracPartOfX = DAG.getNode(ISD::BIT_CONVERT, MVT::i32, t13);
// Add the exponent into the result in integer domain.
// Scale the exponent by log(2) [0.69314718f].
SDValue Exp = GetExponent(DAG, Op1);
SDValue LogOfExponent = DAG.getNode(ISD::FMUL, MVT::f32, Exp,
- DAG.getConstantFP(APFloat(
- APInt(32, 0x3f317218)), MVT::f32));
+ getF32Constant(DAG, 0x3f317218));
// Get the significand and build it into a floating-point number with
// exponent of 1.
//
// error 0.0034276066, which is better than 8 bits
SDValue t0 = DAG.getNode(ISD::FMUL, MVT::f32, X,
- DAG.getConstantFP(APFloat(
- APInt(32, 0xbe74c456)), MVT::f32));
+ getF32Constant(DAG, 0xbe74c456));
SDValue t1 = DAG.getNode(ISD::FADD, MVT::f32, t0,
- DAG.getConstantFP(APFloat(
- APInt(32, 0x3fb3a2b1)), MVT::f32));
+ getF32Constant(DAG, 0x3fb3a2b1));
SDValue t2 = DAG.getNode(ISD::FMUL, MVT::f32, t1, X);
SDValue LogOfMantissa = DAG.getNode(ISD::FSUB, MVT::f32, t2,
- DAG.getConstantFP(APFloat(
- APInt(32, 0x3f949a29)), MVT::f32));
+ getF32Constant(DAG, 0x3f949a29));
result = DAG.getNode(ISD::FADD, MVT::f32, LogOfExponent, LogOfMantissa);
} else if (LimitFloatPrecision > 6 && LimitFloatPrecision <= 12) {
//
// error 0.000061011436, which is 14 bits
SDValue t0 = DAG.getNode(ISD::FMUL, MVT::f32, X,
- DAG.getConstantFP(APFloat(
- APInt(32, 0xbd67b6d6)), MVT::f32));
+ getF32Constant(DAG, 0xbd67b6d6));
SDValue t1 = DAG.getNode(ISD::FADD, MVT::f32, t0,
- DAG.getConstantFP(APFloat(
- APInt(32, 0x3ee4f4b8)), MVT::f32));
+ getF32Constant(DAG, 0x3ee4f4b8));
SDValue t2 = DAG.getNode(ISD::FMUL, MVT::f32, t1, X);
SDValue t3 = DAG.getNode(ISD::FSUB, MVT::f32, t2,
- DAG.getConstantFP(APFloat(
- APInt(32, 0x3fbc278b)), MVT::f32));
+ getF32Constant(DAG, 0x3fbc278b));
SDValue t4 = DAG.getNode(ISD::FMUL, MVT::f32, t3, X);
SDValue t5 = DAG.getNode(ISD::FADD, MVT::f32, t4,
- DAG.getConstantFP(APFloat(
- APInt(32, 0x40348e95)), MVT::f32));
+ getF32Constant(DAG, 0x40348e95));
SDValue t6 = DAG.getNode(ISD::FMUL, MVT::f32, t5, X);
SDValue LogOfMantissa = DAG.getNode(ISD::FSUB, MVT::f32, t6,
- DAG.getConstantFP(APFloat(
- APInt(32, 0x3fdef31a)), MVT::f32));
+ getF32Constant(DAG, 0x3fdef31a));
result = DAG.getNode(ISD::FADD, MVT::f32, LogOfExponent, LogOfMantissa);
} else { // LimitFloatPrecision > 12 && LimitFloatPrecision <= 18
//
// error 0.0000023660568, which is better than 18 bits
SDValue t0 = DAG.getNode(ISD::FMUL, MVT::f32, X,
- DAG.getConstantFP(APFloat(
- APInt(32, 0xbc91e5ac)), MVT::f32));
+ getF32Constant(DAG, 0xbc91e5ac));
SDValue t1 = DAG.getNode(ISD::FADD, MVT::f32, t0,
- DAG.getConstantFP(APFloat(
- APInt(32, 0x3e4350aa)), MVT::f32));
+ getF32Constant(DAG, 0x3e4350aa));
SDValue t2 = DAG.getNode(ISD::FMUL, MVT::f32, t1, X);
SDValue t3 = DAG.getNode(ISD::FSUB, MVT::f32, t2,
- DAG.getConstantFP(APFloat(
- APInt(32, 0x3f60d3e3)), MVT::f32));
+ getF32Constant(DAG, 0x3f60d3e3));
SDValue t4 = DAG.getNode(ISD::FMUL, MVT::f32, t3, X);
SDValue t5 = DAG.getNode(ISD::FADD, MVT::f32, t4,
- DAG.getConstantFP(APFloat(
- APInt(32, 0x4011cdf0)), MVT::f32));
+ getF32Constant(DAG, 0x4011cdf0));
SDValue t6 = DAG.getNode(ISD::FMUL, MVT::f32, t5, X);
SDValue t7 = DAG.getNode(ISD::FSUB, MVT::f32, t6,
- DAG.getConstantFP(APFloat(
- APInt(32, 0x406cfd1c)), MVT::f32));
+ getF32Constant(DAG, 0x406cfd1c));
SDValue t8 = DAG.getNode(ISD::FMUL, MVT::f32, t7, X);
SDValue t9 = DAG.getNode(ISD::FADD, MVT::f32, t8,
- DAG.getConstantFP(APFloat(
- APInt(32, 0x408797cb)), MVT::f32));
+ getF32Constant(DAG, 0x408797cb));
SDValue t10 = DAG.getNode(ISD::FMUL, MVT::f32, t9, X);
SDValue LogOfMantissa = DAG.getNode(ISD::FSUB, MVT::f32, t10,
- DAG.getConstantFP(APFloat(
- APInt(32, 0x4006dcab)), MVT::f32));
+ getF32Constant(DAG, 0x4006dcab));
result = DAG.getNode(ISD::FADD, MVT::f32, LogOfExponent, LogOfMantissa);
}
//
// error 0.0049451742, which is more than 7 bits
SDValue t0 = DAG.getNode(ISD::FMUL, MVT::f32, X,
- DAG.getConstantFP(APFloat(
- APInt(32, 0xbeb08fe0)), MVT::f32));
+ getF32Constant(DAG, 0xbeb08fe0));
SDValue t1 = DAG.getNode(ISD::FADD, MVT::f32, t0,
- DAG.getConstantFP(APFloat(
- APInt(32, 0x40019463)), MVT::f32));
+ getF32Constant(DAG, 0x40019463));
SDValue t2 = DAG.getNode(ISD::FMUL, MVT::f32, t1, X);
SDValue Log2ofMantissa = DAG.getNode(ISD::FSUB, MVT::f32, t2,
- DAG.getConstantFP(APFloat(
- APInt(32, 0x3fd6633d)), MVT::f32));
+ getF32Constant(DAG, 0x3fd6633d));
result = DAG.getNode(ISD::FADD, MVT::f32, LogOfExponent, Log2ofMantissa);
} else if (LimitFloatPrecision > 6 && LimitFloatPrecision <= 12) {
//
// error 0.0000876136000, which is better than 13 bits
SDValue t0 = DAG.getNode(ISD::FMUL, MVT::f32, X,
- DAG.getConstantFP(APFloat(
- APInt(32, 0xbda7262e)), MVT::f32));
+ getF32Constant(DAG, 0xbda7262e));
SDValue t1 = DAG.getNode(ISD::FADD, MVT::f32, t0,
- DAG.getConstantFP(APFloat(
- APInt(32, 0x3f25280b)), MVT::f32));
+ getF32Constant(DAG, 0x3f25280b));
SDValue t2 = DAG.getNode(ISD::FMUL, MVT::f32, t1, X);
SDValue t3 = DAG.getNode(ISD::FSUB, MVT::f32, t2,
- DAG.getConstantFP(APFloat(
- APInt(32, 0x4007b923)), MVT::f32));
+ getF32Constant(DAG, 0x4007b923));
SDValue t4 = DAG.getNode(ISD::FMUL, MVT::f32, t3, X);
SDValue t5 = DAG.getNode(ISD::FADD, MVT::f32, t4,
- DAG.getConstantFP(APFloat(
- APInt(32, 0x40823e2f)), MVT::f32));
+ getF32Constant(DAG, 0x40823e2f));
SDValue t6 = DAG.getNode(ISD::FMUL, MVT::f32, t5, X);
SDValue Log2ofMantissa = DAG.getNode(ISD::FSUB, MVT::f32, t6,
- DAG.getConstantFP(APFloat(
- APInt(32, 0x4020d29c)), MVT::f32));
+ getF32Constant(DAG, 0x4020d29c));
result = DAG.getNode(ISD::FADD, MVT::f32, LogOfExponent, Log2ofMantissa);
} else { // LimitFloatPrecision > 12 && LimitFloatPrecision <= 18
//
// error 0.0000018516, which is better than 18 bits
SDValue t0 = DAG.getNode(ISD::FMUL, MVT::f32, X,
- DAG.getConstantFP(APFloat(
- APInt(32, 0xbcd2769e)), MVT::f32));
+ getF32Constant(DAG, 0xbcd2769e));
SDValue t1 = DAG.getNode(ISD::FADD, MVT::f32, t0,
- DAG.getConstantFP(APFloat(
- APInt(32, 0x3e8ce0b9)), MVT::f32));
+ getF32Constant(DAG, 0x3e8ce0b9));
SDValue t2 = DAG.getNode(ISD::FMUL, MVT::f32, t1, X);
SDValue t3 = DAG.getNode(ISD::FSUB, MVT::f32, t2,
- DAG.getConstantFP(APFloat(
- APInt(32, 0x3fa22ae7)), MVT::f32));
+ getF32Constant(DAG, 0x3fa22ae7));
SDValue t4 = DAG.getNode(ISD::FMUL, MVT::f32, t3, X);
SDValue t5 = DAG.getNode(ISD::FADD, MVT::f32, t4,
- DAG.getConstantFP(APFloat(
- APInt(32, 0x40525723)), MVT::f32));
+ getF32Constant(DAG, 0x40525723));
SDValue t6 = DAG.getNode(ISD::FMUL, MVT::f32, t5, X);
SDValue t7 = DAG.getNode(ISD::FSUB, MVT::f32, t6,
- DAG.getConstantFP(APFloat(
- APInt(32, 0x40aaf200)), MVT::f32));
+ getF32Constant(DAG, 0x40aaf200));
SDValue t8 = DAG.getNode(ISD::FMUL, MVT::f32, t7, X);
SDValue t9 = DAG.getNode(ISD::FADD, MVT::f32, t8,
- DAG.getConstantFP(APFloat(
- APInt(32, 0x40c39dad)), MVT::f32));
+ getF32Constant(DAG, 0x40c39dad));
SDValue t10 = DAG.getNode(ISD::FMUL, MVT::f32, t9, X);
SDValue Log2ofMantissa = DAG.getNode(ISD::FSUB, MVT::f32, t10,
- DAG.getConstantFP(APFloat(
- APInt(32, 0x4042902c)), MVT::f32));
+ getF32Constant(DAG, 0x4042902c));
result = DAG.getNode(ISD::FADD, MVT::f32, LogOfExponent, Log2ofMantissa);
}
void
SelectionDAGLowering::visitLog10(CallInst &I) {
SDValue result;
+
if (getValue(I.getOperand(1)).getValueType() == MVT::f32 &&
LimitFloatPrecision > 0 && LimitFloatPrecision <= 18) {
SDValue Op = getValue(I.getOperand(1));
// Scale the exponent by log10(2) [0.30102999f].
SDValue Exp = GetExponent(DAG, Op1);
SDValue LogOfExponent = DAG.getNode(ISD::FMUL, MVT::f32, Exp,
- DAG.getConstantFP(APFloat(
- APInt(32, 0x3e9a209a)), MVT::f32));
+ getF32Constant(DAG, 0x3e9a209a));
// Get the significand and build it into a floating-point number with
// exponent of 1.
//
// error 0.0014886165, which is 6 bits
SDValue t0 = DAG.getNode(ISD::FMUL, MVT::f32, X,
- DAG.getConstantFP(APFloat(
- APInt(32, 0xbdd49a13)), MVT::f32));
+ getF32Constant(DAG, 0xbdd49a13));
SDValue t1 = DAG.getNode(ISD::FADD, MVT::f32, t0,
- DAG.getConstantFP(APFloat(
- APInt(32, 0x3f1c0789)), MVT::f32));
+ getF32Constant(DAG, 0x3f1c0789));
SDValue t2 = DAG.getNode(ISD::FMUL, MVT::f32, t1, X);
SDValue Log10ofMantissa = DAG.getNode(ISD::FSUB, MVT::f32, t2,
- DAG.getConstantFP(APFloat(
- APInt(32, 0x3f011300)), MVT::f32));
+ getF32Constant(DAG, 0x3f011300));
result = DAG.getNode(ISD::FADD, MVT::f32, LogOfExponent, Log10ofMantissa);
} else if (LimitFloatPrecision > 6 && LimitFloatPrecision <= 12) {
//
// error 0.00019228036, which is better than 12 bits
SDValue t0 = DAG.getNode(ISD::FMUL, MVT::f32, X,
- DAG.getConstantFP(APFloat(
- APInt(32, 0x3d431f31)), MVT::f32));
+ getF32Constant(DAG, 0x3d431f31));
SDValue t1 = DAG.getNode(ISD::FSUB, MVT::f32, t0,
- DAG.getConstantFP(APFloat(
- APInt(32, 0x3ea21fb2)), MVT::f32));
+ getF32Constant(DAG, 0x3ea21fb2));
SDValue t2 = DAG.getNode(ISD::FMUL, MVT::f32, t1, X);
SDValue t3 = DAG.getNode(ISD::FADD, MVT::f32, t2,
- DAG.getConstantFP(APFloat(
- APInt(32, 0x3f6ae232)), MVT::f32));
+ getF32Constant(DAG, 0x3f6ae232));
SDValue t4 = DAG.getNode(ISD::FMUL, MVT::f32, t3, X);
SDValue Log10ofMantissa = DAG.getNode(ISD::FSUB, MVT::f32, t4,
- DAG.getConstantFP(APFloat(
- APInt(32, 0x3f25f7c3)), MVT::f32));
+ getF32Constant(DAG, 0x3f25f7c3));
result = DAG.getNode(ISD::FADD, MVT::f32, LogOfExponent, Log10ofMantissa);
} else { // LimitFloatPrecision > 12 && LimitFloatPrecision <= 18
//
// error 0.0000037995730, which is better than 18 bits
SDValue t0 = DAG.getNode(ISD::FMUL, MVT::f32, X,
- DAG.getConstantFP(APFloat(
- APInt(32, 0x3c5d51ce)), MVT::f32));
+ getF32Constant(DAG, 0x3c5d51ce));
SDValue t1 = DAG.getNode(ISD::FSUB, MVT::f32, t0,
- DAG.getConstantFP(APFloat(
- APInt(32, 0x3e00685a)), MVT::f32));
+ getF32Constant(DAG, 0x3e00685a));
SDValue t2 = DAG.getNode(ISD::FMUL, MVT::f32, t1, X);
SDValue t3 = DAG.getNode(ISD::FADD, MVT::f32, t2,
- DAG.getConstantFP(APFloat(
- APInt(32, 0x3efb6798)), MVT::f32));
+ getF32Constant(DAG, 0x3efb6798));
SDValue t4 = DAG.getNode(ISD::FMUL, MVT::f32, t3, X);
SDValue t5 = DAG.getNode(ISD::FSUB, MVT::f32, t4,
- DAG.getConstantFP(APFloat(
- APInt(32, 0x3f88d192)), MVT::f32));
+ getF32Constant(DAG, 0x3f88d192));
SDValue t6 = DAG.getNode(ISD::FMUL, MVT::f32, t5, X);
SDValue t7 = DAG.getNode(ISD::FADD, MVT::f32, t6,
- DAG.getConstantFP(APFloat(
- APInt(32, 0x3fc4316c)), MVT::f32));
+ getF32Constant(DAG, 0x3fc4316c));
SDValue t8 = DAG.getNode(ISD::FMUL, MVT::f32, t7, X);
SDValue Log10ofMantissa = DAG.getNode(ISD::FSUB, MVT::f32, t8,
- DAG.getConstantFP(APFloat(
- APInt(32, 0x3f57ce70)), MVT::f32));
+ getF32Constant(DAG, 0x3f57ce70));
result = DAG.getNode(ISD::FADD, MVT::f32, LogOfExponent, Log10ofMantissa);
}
//
// error 0.0144103317, which is 6 bits
SDValue t2 = DAG.getNode(ISD::FMUL, MVT::f32, X,
- DAG.getConstantFP(APFloat(
- APInt(32, 0x3e814304)), MVT::f32));
+ getF32Constant(DAG, 0x3e814304));
SDValue t3 = DAG.getNode(ISD::FADD, MVT::f32, t2,
- DAG.getConstantFP(APFloat(
- APInt(32, 0x3f3c50c8)), MVT::f32));
+ getF32Constant(DAG, 0x3f3c50c8));
SDValue t4 = DAG.getNode(ISD::FMUL, MVT::f32, t3, X);
SDValue t5 = DAG.getNode(ISD::FADD, MVT::f32, t4,
- DAG.getConstantFP(APFloat(
- APInt(32, 0x3f7f5e7e)), MVT::f32));
+ getF32Constant(DAG, 0x3f7f5e7e));
SDValue t6 = DAG.getNode(ISD::BIT_CONVERT, MVT::i32, t5);
SDValue TwoToFractionalPartOfX =
DAG.getNode(ISD::ADD, MVT::i32, t6, IntegerPartOfX);
//
// error 0.000107046256, which is 13 to 14 bits
SDValue t2 = DAG.getNode(ISD::FMUL, MVT::f32, X,
- DAG.getConstantFP(APFloat(
- APInt(32, 0x3da235e3)), MVT::f32));
+ getF32Constant(DAG, 0x3da235e3));
SDValue t3 = DAG.getNode(ISD::FADD, MVT::f32, t2,
- DAG.getConstantFP(APFloat(
- APInt(32, 0x3e65b8f3)), MVT::f32));
+ getF32Constant(DAG, 0x3e65b8f3));
SDValue t4 = DAG.getNode(ISD::FMUL, MVT::f32, t3, X);
SDValue t5 = DAG.getNode(ISD::FADD, MVT::f32, t4,
- DAG.getConstantFP(APFloat(
- APInt(32, 0x3f324b07)), MVT::f32));
+ getF32Constant(DAG, 0x3f324b07));
SDValue t6 = DAG.getNode(ISD::FMUL, MVT::f32, t5, X);
SDValue t7 = DAG.getNode(ISD::FADD, MVT::f32, t6,
- DAG.getConstantFP(APFloat(
- APInt(32, 0x3f7ff8fd)), MVT::f32));
+ getF32Constant(DAG, 0x3f7ff8fd));
SDValue t8 = DAG.getNode(ISD::BIT_CONVERT, MVT::i32, t7);
SDValue TwoToFractionalPartOfX =
DAG.getNode(ISD::ADD, MVT::i32, t8, IntegerPartOfX);
// (0.136028312e-2f + 0.157059148e-3f *x)*x)*x)*x)*x)*x;
// error 2.47208000*10^(-7), which is better than 18 bits
SDValue t2 = DAG.getNode(ISD::FMUL, MVT::f32, X,
- DAG.getConstantFP(APFloat(
- APInt(32, 0x3924b03e)), MVT::f32));
+ getF32Constant(DAG, 0x3924b03e));
SDValue t3 = DAG.getNode(ISD::FADD, MVT::f32, t2,
- DAG.getConstantFP(APFloat(
- APInt(32, 0x3ab24b87)), MVT::f32));
+ getF32Constant(DAG, 0x3ab24b87));
SDValue t4 = DAG.getNode(ISD::FMUL, MVT::f32, t3, X);
SDValue t5 = DAG.getNode(ISD::FADD, MVT::f32, t4,
- DAG.getConstantFP(APFloat(
- APInt(32, 0x3c1d8c17)), MVT::f32));
+ getF32Constant(DAG, 0x3c1d8c17));
SDValue t6 = DAG.getNode(ISD::FMUL, MVT::f32, t5, X);
SDValue t7 = DAG.getNode(ISD::FADD, MVT::f32, t6,
- DAG.getConstantFP(APFloat(
- APInt(32, 0x3d634a1d)), MVT::f32));
+ getF32Constant(DAG, 0x3d634a1d));
SDValue t8 = DAG.getNode(ISD::FMUL, MVT::f32, t7, X);
SDValue t9 = DAG.getNode(ISD::FADD, MVT::f32, t8,
- DAG.getConstantFP(APFloat(
- APInt(32, 0x3e75fe14)), MVT::f32));
+ getF32Constant(DAG, 0x3e75fe14));
SDValue t10 = DAG.getNode(ISD::FMUL, MVT::f32, t9, X);
SDValue t11 = DAG.getNode(ISD::FADD, MVT::f32, t10,
- DAG.getConstantFP(APFloat(
- APInt(32, 0x3f317234)), MVT::f32));
+ getF32Constant(DAG, 0x3f317234));
SDValue t12 = DAG.getNode(ISD::FMUL, MVT::f32, t11, X);
SDValue t13 = DAG.getNode(ISD::FADD, MVT::f32, t12,
- DAG.getConstantFP(APFloat(
- APInt(32, 0x3f800000)), MVT::f32));
+ getF32Constant(DAG, 0x3f800000));
SDValue t14 = DAG.getNode(ISD::BIT_CONVERT, MVT::i32, t13);
SDValue TwoToFractionalPartOfX =
DAG.getNode(ISD::ADD, MVT::i32, t14, IntegerPartOfX);
// #define LOG2OF10 3.3219281f
// IntegerPartOfX = (int32_t)(x * LOG2OF10);
SDValue t0 = DAG.getNode(ISD::FMUL, MVT::f32, Op,
- DAG.getConstantFP(APFloat(
- APInt(32, 0x40549a78)), MVT::f32));
+ getF32Constant(DAG, 0x40549a78));
SDValue IntegerPartOfX = DAG.getNode(ISD::FP_TO_SINT, MVT::i32, t0);
// FractionalPartOfX = x - (float)IntegerPartOfX;
//
// error 0.0144103317, which is 6 bits
SDValue t2 = DAG.getNode(ISD::FMUL, MVT::f32, X,
- DAG.getConstantFP(APFloat(
- APInt(32, 0x3e814304)), MVT::f32));
+ getF32Constant(DAG, 0x3e814304));
SDValue t3 = DAG.getNode(ISD::FADD, MVT::f32, t2,
- DAG.getConstantFP(APFloat(
- APInt(32, 0x3f3c50c8)), MVT::f32));
+ getF32Constant(DAG, 0x3f3c50c8));
SDValue t4 = DAG.getNode(ISD::FMUL, MVT::f32, t3, X);
SDValue t5 = DAG.getNode(ISD::FADD, MVT::f32, t4,
- DAG.getConstantFP(APFloat(
- APInt(32, 0x3f7f5e7e)), MVT::f32));
+ getF32Constant(DAG, 0x3f7f5e7e));
SDValue t6 = DAG.getNode(ISD::BIT_CONVERT, MVT::i32, t5);
SDValue TwoToFractionalPartOfX =
DAG.getNode(ISD::ADD, MVT::i32, t6, IntegerPartOfX);
//
// error 0.000107046256, which is 13 to 14 bits
SDValue t2 = DAG.getNode(ISD::FMUL, MVT::f32, X,
- DAG.getConstantFP(APFloat(
- APInt(32, 0x3da235e3)), MVT::f32));
+ getF32Constant(DAG, 0x3da235e3));
SDValue t3 = DAG.getNode(ISD::FADD, MVT::f32, t2,
- DAG.getConstantFP(APFloat(
- APInt(32, 0x3e65b8f3)), MVT::f32));
+ getF32Constant(DAG, 0x3e65b8f3));
SDValue t4 = DAG.getNode(ISD::FMUL, MVT::f32, t3, X);
SDValue t5 = DAG.getNode(ISD::FADD, MVT::f32, t4,
- DAG.getConstantFP(APFloat(
- APInt(32, 0x3f324b07)), MVT::f32));
+ getF32Constant(DAG, 0x3f324b07));
SDValue t6 = DAG.getNode(ISD::FMUL, MVT::f32, t5, X);
SDValue t7 = DAG.getNode(ISD::FADD, MVT::f32, t6,
- DAG.getConstantFP(APFloat(
- APInt(32, 0x3f7ff8fd)), MVT::f32));
+ getF32Constant(DAG, 0x3f7ff8fd));
SDValue t8 = DAG.getNode(ISD::BIT_CONVERT, MVT::i32, t7);
SDValue TwoToFractionalPartOfX =
DAG.getNode(ISD::ADD, MVT::i32, t8, IntegerPartOfX);
// (0.136028312e-2f + 0.157059148e-3f *x)*x)*x)*x)*x)*x;
// error 2.47208000*10^(-7), which is better than 18 bits
SDValue t2 = DAG.getNode(ISD::FMUL, MVT::f32, X,
- DAG.getConstantFP(APFloat(
- APInt(32, 0x3924b03e)), MVT::f32));
+ getF32Constant(DAG, 0x3924b03e));
SDValue t3 = DAG.getNode(ISD::FADD, MVT::f32, t2,
- DAG.getConstantFP(APFloat(
- APInt(32, 0x3ab24b87)), MVT::f32));
+ getF32Constant(DAG, 0x3ab24b87));
SDValue t4 = DAG.getNode(ISD::FMUL, MVT::f32, t3, X);
SDValue t5 = DAG.getNode(ISD::FADD, MVT::f32, t4,
- DAG.getConstantFP(APFloat(
- APInt(32, 0x3c1d8c17)), MVT::f32));
+ getF32Constant(DAG, 0x3c1d8c17));
SDValue t6 = DAG.getNode(ISD::FMUL, MVT::f32, t5, X);
SDValue t7 = DAG.getNode(ISD::FADD, MVT::f32, t6,
- DAG.getConstantFP(APFloat(
- APInt(32, 0x3d634a1d)), MVT::f32));
+ getF32Constant(DAG, 0x3d634a1d));
SDValue t8 = DAG.getNode(ISD::FMUL, MVT::f32, t7, X);
SDValue t9 = DAG.getNode(ISD::FADD, MVT::f32, t8,
- DAG.getConstantFP(APFloat(
- APInt(32, 0x3e75fe14)), MVT::f32));
+ getF32Constant(DAG, 0x3e75fe14));
SDValue t10 = DAG.getNode(ISD::FMUL, MVT::f32, t9, X);
SDValue t11 = DAG.getNode(ISD::FADD, MVT::f32, t10,
- DAG.getConstantFP(APFloat(
- APInt(32, 0x3f317234)), MVT::f32));
+ getF32Constant(DAG, 0x3f317234));
SDValue t12 = DAG.getNode(ISD::FMUL, MVT::f32, t11, X);
SDValue t13 = DAG.getNode(ISD::FADD, MVT::f32, t12,
- DAG.getConstantFP(APFloat(
- APInt(32, 0x3f800000)), MVT::f32));
+ getF32Constant(DAG, 0x3f800000));
SDValue t14 = DAG.getNode(ISD::BIT_CONVERT, MVT::i32, t13);
SDValue TwoToFractionalPartOfX =
DAG.getNode(ISD::ADD, MVT::i32, t14, IntegerPartOfX);
case Intrinsic::longjmp:
return "_longjmp"+!TLI.usesUnderscoreLongJmp();
break;
- case Intrinsic::memcpy_i32:
- case Intrinsic::memcpy_i64: {
+ case Intrinsic::memcpy: {
SDValue Op1 = getValue(I.getOperand(1));
SDValue Op2 = getValue(I.getOperand(2));
SDValue Op3 = getValue(I.getOperand(3));
I.getOperand(1), 0, I.getOperand(2), 0));
return 0;
}
- case Intrinsic::memset_i32:
- case Intrinsic::memset_i64: {
+ case Intrinsic::memset: {
SDValue Op1 = getValue(I.getOperand(1));
SDValue Op2 = getValue(I.getOperand(2));
SDValue Op3 = getValue(I.getOperand(3));
I.getOperand(1), 0));
return 0;
}
- case Intrinsic::memmove_i32:
- case Intrinsic::memmove_i64: {
+ case Intrinsic::memmove: {
SDValue Op1 = getValue(I.getOperand(1));
SDValue Op2 = getValue(I.getOperand(2));
SDValue Op3 = getValue(I.getOperand(3));
// lower memmove as memcpy.
uint64_t Size = -1ULL;
if (ConstantSDNode *C = dyn_cast<ConstantSDNode>(Op3))
- Size = C->getValue();
+ Size = C->getZExtValue();
if (AA->alias(I.getOperand(1), Size, I.getOperand(2), Size) ==
AliasAnalysis::NoAlias) {
DAG.setRoot(DAG.getMemcpy(getRoot(), Op1, Op2, Op3, Align, false,
SubprogramDesc *Subprogram = cast<SubprogramDesc>(DD);
const CompileUnitDesc *CompileUnit = Subprogram->getFile();
unsigned SrcFile = MMI->RecordSource(CompileUnit);
- // Record the source line but does create a label. It will be emitted
- // at asm emission time.
- MMI->RecordSourceLine(Subprogram->getLine(), 0, SrcFile);
+ // Record the source line but does not create a label for the normal
+ // function start. It will be emitted at asm emission time. However,
+ // create a label if this is a beginning of inlined function.
+ unsigned LabelID = MMI->RecordSourceLine(Subprogram->getLine(), 0, SrcFile);
+ if (MMI->getSourceLines().size() != 1)
+ DAG.setRoot(DAG.getLabel(ISD::DBG_LABEL, getRoot(), LabelID));
}
return 0;
return 0;
}
+ case Intrinsic::convertff:
+ case Intrinsic::convertfsi:
+ case Intrinsic::convertfui:
+ case Intrinsic::convertsif:
+ case Intrinsic::convertuif:
+ case Intrinsic::convertss:
+ case Intrinsic::convertsu:
+ case Intrinsic::convertus:
+ case Intrinsic::convertuu: {
+ ISD::CvtCode Code = ISD::CVT_INVALID;
+ switch (Intrinsic) {
+ case Intrinsic::convertff: Code = ISD::CVT_FF; break;
+ case Intrinsic::convertfsi: Code = ISD::CVT_FS; break;
+ case Intrinsic::convertfui: Code = ISD::CVT_FU; break;
+ case Intrinsic::convertsif: Code = ISD::CVT_SF; break;
+ case Intrinsic::convertuif: Code = ISD::CVT_UF; break;
+ case Intrinsic::convertss: Code = ISD::CVT_SS; break;
+ case Intrinsic::convertsu: Code = ISD::CVT_SU; break;
+ case Intrinsic::convertus: Code = ISD::CVT_US; break;
+ case Intrinsic::convertuu: Code = ISD::CVT_UU; break;
+ }
+ MVT DestVT = TLI.getValueType(I.getType());
+ Value* Op1 = I.getOperand(1);
+ setValue(&I, DAG.getConvertRndSat(DestVT, getValue(Op1),
+ DAG.getValueType(DestVT),
+ DAG.getValueType(getValue(Op1).getValueType()),
+ getValue(I.getOperand(2)),
+ getValue(I.getOperand(3)),
+ Code));
+ return 0;
+ }
+
case Intrinsic::sqrt:
setValue(&I, DAG.getNode(ISD::FSQRT,
getValue(I.getOperand(1)).getValueType(),
DAG.setRoot(DAG.getNode(ISD::STACKRESTORE, MVT::Other, getRoot(), Tmp));
return 0;
}
+ case Intrinsic::stackprotector: {
+ // Emit code into the DAG to store the stack guard onto the stack.
+ MachineFunction &MF = DAG.getMachineFunction();
+ MachineFrameInfo *MFI = MF.getFrameInfo();
+ MVT PtrTy = TLI.getPointerTy();
+
+ SDValue Src = getValue(I.getOperand(1)); // The guard's value.
+ AllocaInst *Slot = cast<AllocaInst>(I.getOperand(2));
+
+ int FI = FuncInfo.StaticAllocaMap[Slot];
+ MFI->setStackProtectorIndex(FI);
+
+ SDValue FIN = DAG.getFrameIndex(FI, PtrTy);
+
+ // Store the stack protector onto the stack.
+ SDValue Result = DAG.getStore(getRoot(), Src, FIN,
+ PseudoSourceValue::getFixedStack(FI),
+ 0, true);
+ setValue(&I, Result);
+ DAG.setRoot(Result);
+ return 0;
+ }
case Intrinsic::var_annotation:
// Discard annotate attributes
return 0;
DAG.setRoot(DAG.getNode(ISD::TRAP, MVT::Other, getRoot()));
return 0;
}
+
+ case Intrinsic::uadd_with_overflow:
+ return implVisitAluOverflow(I, ISD::UADDO);
+ case Intrinsic::sadd_with_overflow:
+ return implVisitAluOverflow(I, ISD::SADDO);
+ case Intrinsic::usub_with_overflow:
+ return implVisitAluOverflow(I, ISD::USUBO);
+ case Intrinsic::ssub_with_overflow:
+ return implVisitAluOverflow(I, ISD::SSUBO);
+ case Intrinsic::umul_with_overflow:
+ return implVisitAluOverflow(I, ISD::UMULO);
+ case Intrinsic::smul_with_overflow:
+ return implVisitAluOverflow(I, ISD::SMULO);
+
case Intrinsic::prefetch: {
SDValue Ops[4];
Ops[0] = getRoot();
Entry.Node = ArgNode; Entry.Ty = (*i)->getType();
unsigned attrInd = i - CS.arg_begin() + 1;
- Entry.isSExt = CS.paramHasAttr(attrInd, ParamAttr::SExt);
- Entry.isZExt = CS.paramHasAttr(attrInd, ParamAttr::ZExt);
- Entry.isInReg = CS.paramHasAttr(attrInd, ParamAttr::InReg);
- Entry.isSRet = CS.paramHasAttr(attrInd, ParamAttr::StructRet);
- Entry.isNest = CS.paramHasAttr(attrInd, ParamAttr::Nest);
- Entry.isByVal = CS.paramHasAttr(attrInd, ParamAttr::ByVal);
+ Entry.isSExt = CS.paramHasAttr(attrInd, Attribute::SExt);
+ Entry.isZExt = CS.paramHasAttr(attrInd, Attribute::ZExt);
+ Entry.isInReg = CS.paramHasAttr(attrInd, Attribute::InReg);
+ Entry.isSRet = CS.paramHasAttr(attrInd, Attribute::StructRet);
+ Entry.isNest = CS.paramHasAttr(attrInd, Attribute::Nest);
+ Entry.isByVal = CS.paramHasAttr(attrInd, Attribute::ByVal);
Entry.Alignment = CS.getParamAlignment(attrInd);
Args.push_back(Entry);
}
std::pair<SDValue,SDValue> Result =
TLI.LowerCallTo(getRoot(), CS.getType(),
- CS.paramHasAttr(0, ParamAttr::SExt),
- CS.paramHasAttr(0, ParamAttr::ZExt),
- FTy->isVarArg(), CS.getCallingConv(), IsTailCall,
+ CS.paramHasAttr(0, Attribute::SExt),
+ CS.paramHasAttr(0, Attribute::ZExt), FTy->isVarArg(),
+ CS.paramHasAttr(0, Attribute::InReg),
+ CS.getCallingConv(),
+ IsTailCall && PerformTailCallOpt,
Callee, Args, DAG);
if (CS.getType() != Type::VoidTy)
setValue(CS.getInstruction(), Result.first);
else if (NumZeroBits >= RegSize-9)
isSExt = false, FromVT = MVT::i8; // ASSERT ZEXT 8
else if (NumSignBits > RegSize-16)
- isSExt = true, FromVT = MVT::i16; // ASSERT SEXT 16
+ isSExt = true, FromVT = MVT::i16; // ASSERT SEXT 16
else if (NumZeroBits >= RegSize-17)
- isSExt = false, FromVT = MVT::i16; // ASSERT ZEXT 16
+ isSExt = false, FromVT = MVT::i16; // ASSERT ZEXT 16
else if (NumSignBits > RegSize-32)
- isSExt = true, FromVT = MVT::i32; // ASSERT SEXT 32
+ isSExt = true, FromVT = MVT::i32; // ASSERT SEXT 32
else if (NumZeroBits >= RegSize-33)
- isSExt = false, FromVT = MVT::i32; // ASSERT ZEXT 32
+ isSExt = false, FromVT = MVT::i32; // ASSERT ZEXT 32
if (FromVT != MVT::Other) {
P = DAG.getNode(isSExt ? ISD::AssertSext : ISD::AssertZext,
Parts.clear();
}
- return DAG.getMergeValues(DAG.getVTList(&ValueVTs[0], ValueVTs.size()),
- &Values[0], ValueVTs.size());
+ return DAG.getNode(ISD::MERGE_VALUES,
+ DAG.getVTList(&ValueVTs[0], ValueVTs.size()),
+ &Values[0], ValueVTs.size());
}
/// getCopyToRegs - Emit a series of CopyToReg nodes that copies the
for (unsigned Value = 0, Reg = 0, e = ValueVTs.size(); Value != e; ++Value) {
unsigned NumRegs = TLI->getNumRegisters(ValueVTs[Value]);
MVT RegisterVT = RegVTs[Value];
- for (unsigned i = 0; i != NumRegs; ++i)
+ for (unsigned i = 0; i != NumRegs; ++i) {
+ assert(Reg < Regs.size() && "Mismatch in # registers expected");
Ops.push_back(DAG.getRegister(Regs[Reg++], RegisterVT));
+ }
}
}
MarkRegAndAliases(AssignedRegs.Regs[i], InputRegs, TRI);
}
}
+
+ /// getCallOperandValMVT - Return the MVT of the Value* that this operand
+ /// corresponds to. If there is no Value* for this operand, it returns
+ /// MVT::Other.
+ MVT getCallOperandValMVT(const TargetLowering &TLI,
+ const TargetData *TD) const {
+ if (CallOperandVal == 0) return MVT::Other;
+
+ // BasicBlock operands appear only in asm's, as labels; a label is
+ // pointer-sized.
+ if (isa<BasicBlock>(CallOperandVal))
+ return TLI.getPointerTy();
+
+ const llvm::Type *OpTy = CallOperandVal->getType();
+
+ // If this is an indirect operand, the operand is a pointer to the
+ // accessed type.
+ if (isIndirect)
+ OpTy = cast<PointerType>(OpTy)->getElementType();
+
+ // If OpTy is not a single value, it may be a struct/union that we
+ // can tile with integers.
+ if (!OpTy->isSingleValueType() && OpTy->isSized()) {
+ unsigned BitSize = TD->getTypeSizeInBits(OpTy);
+ switch (BitSize) {
+ // Any other width: leave the aggregate type alone and let
+ // getValueType below decide what to do with it.
+ default: break;
+ case 1:
+ case 8:
+ case 16:
+ case 32:
+ case 64:
+ case 128:
+ OpTy = IntegerType::get(BitSize);
+ break;
+ }
+ }
+
+ // NOTE(review): the 'true' flag presumably allows non-simple/unknown
+ // types through instead of asserting — confirm against
+ // TargetLowering::getValueType.
+ return TLI.getValueType(OpTy, true);
+ }
private:
/// MarkRegAndAliases - Mark the specified register and all aliases in the
/// allocation. This produces generally horrible, but correct, code.
///
/// OpInfo describes the operand.
-/// HasEarlyClobber is true if there are any early clobber constraints (=&r)
-/// or any explicitly clobbered registers.
/// Input and OutputRegs are the set of already allocated physical registers.
///
void SelectionDAGLowering::
-GetRegistersForValue(SDISelAsmOperandInfo &OpInfo, bool HasEarlyClobber,
+GetRegistersForValue(SDISelAsmOperandInfo &OpInfo,
std::set<unsigned> &OutputRegs,
std::set<unsigned> &InputRegs) {
// Compute whether this value requires an input register, an output register,
case InlineAsm::isOutput:
isOutReg = true;
- // If this is an early-clobber output, or if there is an input
- // constraint that matches this, we need to reserve the input register
- // so no other inputs allocate to it.
- isInReg = OpInfo.isEarlyClobber || OpInfo.hasMatchingInput;
+ // If there is an input constraint that matches this, we need to reserve
+ // the input register so no other inputs allocate to it.
+ isInReg = OpInfo.hasMatchingInput();
break;
case InlineAsm::isInput:
isInReg = true;
OpInfo.ConstraintVT);
unsigned NumRegs = 1;
- if (OpInfo.ConstraintVT != MVT::Other)
+ if (OpInfo.ConstraintVT != MVT::Other) {
+ // If this is a FP input in an integer register (or vice versa) insert a bit
+ // cast of the input value. More generally, handle any case where the input
+ // value disagrees with the register class we plan to stick this in.
+ if (OpInfo.Type == InlineAsm::isInput &&
+ PhysReg.second && !PhysReg.second->hasType(OpInfo.ConstraintVT)) {
+ // Try to convert to the first MVT that the reg class contains. If the
+ // types are identical size, use a bitcast to convert (e.g. two differing
+ // vector types).
+ MVT RegVT = *PhysReg.second->vt_begin();
+ if (RegVT.getSizeInBits() == OpInfo.ConstraintVT.getSizeInBits()) {
+ OpInfo.CallOperand = DAG.getNode(ISD::BIT_CONVERT, RegVT,
+ OpInfo.CallOperand);
+ OpInfo.ConstraintVT = RegVT;
+ } else if (RegVT.isInteger() && OpInfo.ConstraintVT.isFloatingPoint()) {
+ // If the input is a FP value and we want it in FP registers, do a
+ // bitcast to the corresponding integer type. This turns an f64 value
+ // into i64, which can be passed with two i32 values on a 32-bit
+ // machine.
+ RegVT = MVT::getIntegerVT(OpInfo.ConstraintVT.getSizeInBits());
+ OpInfo.CallOperand = DAG.getNode(ISD::BIT_CONVERT, RegVT,
+ OpInfo.CallOperand);
+ OpInfo.ConstraintVT = RegVT;
+ }
+ }
+
NumRegs = TLI.getNumRegisters(OpInfo.ConstraintVT);
+ }
+
MVT RegVT;
MVT ValueVT = OpInfo.ConstraintVT;
-
// If this is a constraint for a specific physical register, like {r17},
// assign it now.
std::vector<unsigned> RegClassRegs;
const TargetRegisterClass *RC = PhysReg.second;
if (RC) {
- // If this is an early clobber or tied register, our regalloc doesn't know
- // how to maintain the constraint. If it isn't, go ahead and create vreg
- // and let the regalloc do the right thing.
- if (!OpInfo.hasMatchingInput && !OpInfo.isEarlyClobber &&
- // If there is some other early clobber and this is an input register,
- // then we are forced to pre-allocate the input reg so it doesn't
- // conflict with the earlyclobber.
- !(OpInfo.Type == InlineAsm::isInput && HasEarlyClobber)) {
+ // If this is a tied register, our regalloc doesn't know how to maintain
+ // the constraint, so we have to pick a register to pin the input/output to.
+ // If it isn't a matched constraint, go ahead and create vreg and let the
+ // regalloc do its thing.
+ if (!OpInfo.hasMatchingInput()) {
RegVT = *PhysReg.second->vt_begin();
-
if (OpInfo.ConstraintVT == MVT::Other)
ValueVT = RegVT;
// Otherwise, we couldn't allocate enough registers for this.
}
+/// hasInlineAsmMemConstraint - Return true if the inline asm instruction being
+/// processed uses a memory 'm' constraint.
+///
+/// Walks every alternative constraint code of every operand and asks the
+/// target to classify it; a single TargetLowering::C_Memory classification
+/// anywhere is enough to answer true.
+static bool
+hasInlineAsmMemConstraint(std::vector<InlineAsm::ConstraintInfo> &CInfos,
+ TargetLowering &TLI) {
+ for (unsigned i = 0, e = CInfos.size(); i != e; ++i) {
+ InlineAsm::ConstraintInfo &CI = CInfos[i];
+ for (unsigned j = 0, ee = CI.Codes.size(); j != ee; ++j) {
+ // The target decides what each constraint letter means; only the
+ // C_Memory classification matters here.
+ TargetLowering::ConstraintType CType = TLI.getConstraintType(CI.Codes[j]);
+ if (CType == TargetLowering::C_Memory)
+ return true;
+ }
+ }
+
+ return false;
+}
/// visitInlineAsm - Handle a call to an InlineAsm object.
///
std::vector<InlineAsm::ConstraintInfo>
ConstraintInfos = IA->ParseConstraints();
- // SawEarlyClobber - Keep track of whether we saw an earlyclobber output
- // constraint. If so, we can't let the register allocator allocate any input
- // registers, because it will not know to avoid the earlyclobbered output reg.
- bool SawEarlyClobber = false;
+ bool hasMemory = hasInlineAsmMemConstraint(ConstraintInfos, TLI);
unsigned ArgNo = 0; // ArgNo - The argument of the CallInst.
unsigned ResNo = 0; // ResNo - The result number of the next output.
OpInfo.CallOperandVal = CS.getArgument(ArgNo++);
break;
}
+
// The return value of the call is this value. As such, there is no
// corresponding argument.
assert(CS.getType() != Type::VoidTy && "Bad inline asm!");
// If this is an input or an indirect output, process the call argument.
// BasicBlocks are labels, currently appearing only in asm's.
if (OpInfo.CallOperandVal) {
- if (BasicBlock *BB = dyn_cast<BasicBlock>(OpInfo.CallOperandVal))
+ if (BasicBlock *BB = dyn_cast<BasicBlock>(OpInfo.CallOperandVal)) {
OpInfo.CallOperand = DAG.getBasicBlock(FuncInfo.MBBMap[BB]);
- else {
+ } else {
OpInfo.CallOperand = getValue(OpInfo.CallOperandVal);
- const Type *OpTy = OpInfo.CallOperandVal->getType();
- // If this is an indirect operand, the operand is a pointer to the
- // accessed type.
- if (OpInfo.isIndirect)
- OpTy = cast<PointerType>(OpTy)->getElementType();
-
- // If OpTy is not a single value, it may be a struct/union that we
- // can tile with integers.
- if (!OpTy->isSingleValueType() && OpTy->isSized()) {
- unsigned BitSize = TD->getTypeSizeInBits(OpTy);
- switch (BitSize) {
- default: break;
- case 1:
- case 8:
- case 16:
- case 32:
- case 64:
- OpTy = IntegerType::get(BitSize);
- break;
- }
- }
-
- OpVT = TLI.getValueType(OpTy, true);
}
+
+ OpVT = OpInfo.getCallOperandValMVT(TLI, TD);
}
OpInfo.ConstraintVT = OpVT;
+ }
+
+ // Second pass over the constraints: compute which constraint option to use
+ // and assign registers to constraints that want a specific physreg.
+ for (unsigned i = 0, e = ConstraintInfos.size(); i != e; ++i) {
+ SDISelAsmOperandInfo &OpInfo = ConstraintOperands[i];
- // Compute the constraint code and ConstraintType to use.
- TLI.ComputeConstraintToUse(OpInfo, OpInfo.CallOperand, &DAG);
-
- // Keep track of whether we see an earlyclobber.
- SawEarlyClobber |= OpInfo.isEarlyClobber;
-
- // If we see a clobber of a register, it is an early clobber.
- if (!SawEarlyClobber &&
- OpInfo.Type == InlineAsm::isClobber &&
- OpInfo.ConstraintType == TargetLowering::C_Register) {
- // Note that we want to ignore things that we don't track here, like
- // dirflag, fpsr, flags, etc.
- std::pair<unsigned, const TargetRegisterClass*> PhysReg =
- TLI.getRegForInlineAsmConstraint(OpInfo.ConstraintCode,
- OpInfo.ConstraintVT);
- if (PhysReg.first || PhysReg.second) {
- // This is a register we know of.
- SawEarlyClobber = true;
+ // If this is an output operand with a matching input operand, look up the
+ // matching input. It might have a different type (e.g. the output might be
+ // i32 and the input i64) and we need to pick the larger width to ensure we
+ // reserve the right number of registers.
+ if (OpInfo.hasMatchingInput()) {
+ SDISelAsmOperandInfo &Input = ConstraintOperands[OpInfo.MatchingInput];
+ if (OpInfo.ConstraintVT != Input.ConstraintVT) {
+ assert(OpInfo.ConstraintVT.isInteger() &&
+ Input.ConstraintVT.isInteger() &&
+ "Asm constraints must be the same or different sized integers");
+ if (OpInfo.ConstraintVT.getSizeInBits() <
+ Input.ConstraintVT.getSizeInBits())
+ OpInfo.ConstraintVT = Input.ConstraintVT;
+ else
+ Input.ConstraintVT = OpInfo.ConstraintVT;
}
}
+ // Compute the constraint code and ConstraintType to use.
+ TLI.ComputeConstraintToUse(OpInfo, OpInfo.CallOperand, hasMemory, &DAG);
+
// If this is a memory input, and if the operand is not indirect, do what we
// need to to provide an address for the memory input.
if (OpInfo.ConstraintType == TargetLowering::C_Memory &&
// If this constraint is for a specific register, allocate it before
// anything else.
if (OpInfo.ConstraintType == TargetLowering::C_Register)
- GetRegistersForValue(OpInfo, SawEarlyClobber, OutputRegs, InputRegs);
+ GetRegistersForValue(OpInfo, OutputRegs, InputRegs);
}
ConstraintInfos.clear();
// Second pass - Loop over all of the operands, assigning virtual or physregs
- // to registerclass operands.
+ // to register class operands.
for (unsigned i = 0, e = ConstraintOperands.size(); i != e; ++i) {
SDISelAsmOperandInfo &OpInfo = ConstraintOperands[i];
// C_Register operands have already been allocated, Other/Memory don't need
// to be.
if (OpInfo.ConstraintType == TargetLowering::C_RegisterClass)
- GetRegistersForValue(OpInfo, SawEarlyClobber, OutputRegs, InputRegs);
+ GetRegistersForValue(OpInfo, OutputRegs, InputRegs);
}
// AsmNodeOperands - The operands for the ISD::INLINEASM node.
assert(OpInfo.isIndirect && "Memory output must be indirect operand");
// Add information to the INLINEASM node to know about this output.
- unsigned ResOpType = 4/*MEM*/ | (1 << 3);
- AsmNodeOperands.push_back(DAG.getTargetConstant(ResOpType,
+ unsigned ResOpType = 4/*MEM*/ | (1<<3);
+ AsmNodeOperands.push_back(DAG.getTargetConstant(ResOpType,
TLI.getPointerTy()));
AsmNodeOperands.push_back(OpInfo.CallOperand);
break;
// Add information to the INLINEASM node to know that this register is
// set.
- OpInfo.AssignedRegs.AddInlineAsmOperands(2 /*REGDEF*/, DAG,
- AsmNodeOperands);
+ OpInfo.AssignedRegs.AddInlineAsmOperands(OpInfo.isEarlyClobber ?
+ 6 /* EARLYCLOBBER REGDEF */ :
+ 2 /* REGDEF */ ,
+ DAG, AsmNodeOperands);
break;
}
case InlineAsm::isInput: {
SDValue InOperandVal = OpInfo.CallOperand;
- if (isdigit(OpInfo.ConstraintCode[0])) { // Matching constraint?
+ if (OpInfo.isMatchingInputConstraint()) { // Matching constraint?
// If this is required to match an output register we have already set,
// just use its register.
- unsigned OperandNo = atoi(OpInfo.ConstraintCode.c_str());
+ unsigned OperandNo = OpInfo.getMatchedOperand();
// Scan until we find the definition we already emitted of this operand.
// When we find it, create a RegsForValue operand.
for (; OperandNo; --OperandNo) {
// Advance to the next operand.
unsigned NumOps =
- cast<ConstantSDNode>(AsmNodeOperands[CurOp])->getValue();
+ cast<ConstantSDNode>(AsmNodeOperands[CurOp])->getZExtValue();
assert(((NumOps & 7) == 2 /*REGDEF*/ ||
+ (NumOps & 7) == 6 /*EARLYCLOBBER REGDEF*/ ||
(NumOps & 7) == 4 /*MEM*/) &&
"Skipped past definitions?");
CurOp += (NumOps>>3)+1;
}
unsigned NumOps =
- cast<ConstantSDNode>(AsmNodeOperands[CurOp])->getValue();
- if ((NumOps & 7) == 2 /*REGDEF*/) {
+ cast<ConstantSDNode>(AsmNodeOperands[CurOp])->getZExtValue();
+ if ((NumOps & 7) == 2 /*REGDEF*/
+ || (NumOps & 7) == 6 /* EARLYCLOBBER REGDEF */) {
// Add NumOps>>3 registers to MatchedRegs.
RegsForValue MatchedRegs;
MatchedRegs.TLI = &TLI;
MatchedRegs.AddInlineAsmOperands(1 /*REGUSE*/, DAG, AsmNodeOperands);
break;
} else {
- assert((NumOps & 7) == 4/*MEM*/ && "Unknown matching constraint!");
+ assert(((NumOps & 7) == 4) && "Unknown matching constraint!");
assert((NumOps >> 3) == 1 && "Unexpected number of operands");
// Add information to the INLINEASM node to know about this input.
- unsigned ResOpType = 4/*MEM*/ | (1 << 3);
- AsmNodeOperands.push_back(DAG.getTargetConstant(ResOpType,
+ AsmNodeOperands.push_back(DAG.getTargetConstant(NumOps,
TLI.getPointerTy()));
AsmNodeOperands.push_back(AsmNodeOperands[CurOp+1]);
break;
std::vector<SDValue> Ops;
TLI.LowerAsmOperandForConstraint(InOperandVal, OpInfo.ConstraintCode[0],
- Ops, DAG);
+ hasMemory, Ops, DAG);
if (Ops.empty()) {
cerr << "Invalid operand for inline asm constraint '"
<< OpInfo.ConstraintCode << "'!\n";
"Memory operands expect pointer values");
// Add information to the INLINEASM node to know about this input.
- unsigned ResOpType = 4/*MEM*/ | (1 << 3);
+ unsigned ResOpType = 4/*MEM*/ | (1<<3);
AsmNodeOperands.push_back(DAG.getTargetConstant(ResOpType,
TLI.getPointerTy()));
AsmNodeOperands.push_back(InOperandVal);
"Don't know how to handle indirect register inputs yet!");
// Copy the input into the appropriate registers.
- assert(!OpInfo.AssignedRegs.Regs.empty() &&
- "Couldn't allocate input reg!");
+ if (OpInfo.AssignedRegs.Regs.empty()) {
+ cerr << "Couldn't allocate output reg for constraint '"
+ << OpInfo.ConstraintCode << "'!\n";
+ exit(1);
+ }
OpInfo.AssignedRegs.getCopyToRegs(InOperandVal, DAG, Chain, &Flag);
- OpInfo.AssignedRegs.AddInlineAsmOperands(1/*REGUSE*/, DAG,
- AsmNodeOperands);
+ OpInfo.AssignedRegs.AddInlineAsmOperands(1/*REGUSE*/,
+ DAG, AsmNodeOperands);
break;
}
case InlineAsm::isClobber: {
// Add the clobbered value to the operand list, so that the register
// allocator is aware that the physreg got clobbered.
if (!OpInfo.AssignedRegs.Regs.empty())
- OpInfo.AssignedRegs.AddInlineAsmOperands(2/*REGDEF*/, DAG,
- AsmNodeOperands);
+ OpInfo.AssignedRegs.AddInlineAsmOperands(6 /* EARLYCLOBBER REGDEF */,
+ DAG, AsmNodeOperands);
break;
}
}
// and set it as the value of the call.
if (!RetValRegs.Regs.empty()) {
SDValue Val = RetValRegs.getCopyFromRegs(DAG, Chain, &Flag);
-
- // If any of the results of the inline asm is a vector, it may have the
- // wrong width/num elts. This can happen for register classes that can
- // contain multiple different value types. The preg or vreg allocated may
- // not have the same VT as was expected. Convert it to the right type with
- // bit_convert.
- if (const StructType *ResSTy = dyn_cast<StructType>(CS.getType())) {
- for (unsigned i = 0, e = ResSTy->getNumElements(); i != e; ++i) {
- if (Val.getNode()->getValueType(i).isVector())
- Val = DAG.getNode(ISD::BIT_CONVERT,
- TLI.getValueType(ResSTy->getElementType(i)), Val);
+
+ // FIXME: Why don't we do this for inline asms with MRVs?
+ if (CS.getType()->isSingleValueType() && CS.getType()->isSized()) {
+ MVT ResultType = TLI.getValueType(CS.getType());
+
+ // If any of the results of the inline asm is a vector, it may have the
+ // wrong width/num elts. This can happen for register classes that can
+ // contain multiple different value types. The preg or vreg allocated may
+ // not have the same VT as was expected. Convert it to the right type
+ // with bit_convert.
+ if (ResultType != Val.getValueType() && Val.getValueType().isVector()) {
+ Val = DAG.getNode(ISD::BIT_CONVERT, ResultType, Val);
+
+ } else if (ResultType != Val.getValueType() &&
+ ResultType.isInteger() && Val.getValueType().isInteger()) {
+ // If a result value was tied to an input value, the computed result may
+ // have a wider width than the expected result. Extract the relevant
+ // portion.
+ Val = DAG.getNode(ISD::TRUNCATE, ResultType, Val);
}
- } else {
- if (Val.getValueType().isVector())
- Val = DAG.getNode(ISD::BIT_CONVERT, TLI.getValueType(CS.getType()),
- Val);
+
+ assert(ResultType == Val.getValueType() && "Asm result value mismatch!");
}
setValue(CS.getInstruction(), Val);
Args.push_back(Entry);
std::pair<SDValue,SDValue> Result =
- TLI.LowerCallTo(getRoot(), I.getType(), false, false, false, CallingConv::C,
- true, DAG.getExternalSymbol("malloc", IntPtr), Args, DAG);
+ TLI.LowerCallTo(getRoot(), I.getType(), false, false, false, false,
+ CallingConv::C, PerformTailCallOpt,
+ DAG.getExternalSymbol("malloc", IntPtr),
+ Args, DAG);
setValue(&I, Result.first); // Pointers always fit in registers
DAG.setRoot(Result.second);
}
Args.push_back(Entry);
MVT IntPtr = TLI.getPointerTy();
std::pair<SDValue,SDValue> Result =
- TLI.LowerCallTo(getRoot(), Type::VoidTy, false, false, false,
- CallingConv::C, true,
+ TLI.LowerCallTo(getRoot(), Type::VoidTy, false, false, false, false,
+ CallingConv::C, PerformTailCallOpt,
DAG.getExternalSymbol("free", IntPtr), Args, DAG);
DAG.setRoot(Result.second);
}
unsigned OriginalAlignment =
getTargetData()->getABITypeAlignment(ArgTy);
- if (F.paramHasAttr(j, ParamAttr::ZExt))
+ if (F.paramHasAttr(j, Attribute::ZExt))
Flags.setZExt();
- if (F.paramHasAttr(j, ParamAttr::SExt))
+ if (F.paramHasAttr(j, Attribute::SExt))
Flags.setSExt();
- if (F.paramHasAttr(j, ParamAttr::InReg))
+ if (F.paramHasAttr(j, Attribute::InReg))
Flags.setInReg();
- if (F.paramHasAttr(j, ParamAttr::StructRet))
+ if (F.paramHasAttr(j, Attribute::StructRet))
Flags.setSRet();
- if (F.paramHasAttr(j, ParamAttr::ByVal)) {
+ if (F.paramHasAttr(j, Attribute::ByVal)) {
Flags.setByVal();
const PointerType *Ty = cast<PointerType>(I->getType());
const Type *ElementTy = Ty->getElementType();
Flags.setByValAlign(FrameAlign);
Flags.setByValSize(FrameSize);
}
- if (F.paramHasAttr(j, ParamAttr::Nest))
+ if (F.paramHasAttr(j, Attribute::Nest))
Flags.setNest();
Flags.setOrigAlign(OriginalAlignment);
Parts[j] = SDValue(Result, i++);
ISD::NodeType AssertOp = ISD::DELETED_NODE;
- if (F.paramHasAttr(Idx, ParamAttr::SExt))
+ if (F.paramHasAttr(Idx, Attribute::SExt))
AssertOp = ISD::AssertSext;
- else if (F.paramHasAttr(Idx, ParamAttr::ZExt))
+ else if (F.paramHasAttr(Idx, Attribute::ZExt))
AssertOp = ISD::AssertZext;
ArgValues.push_back(getCopyFromParts(DAG, &Parts[0], NumParts, PartVT, VT,
std::pair<SDValue, SDValue>
TargetLowering::LowerCallTo(SDValue Chain, const Type *RetTy,
bool RetSExt, bool RetZExt, bool isVarArg,
+ bool isInreg,
unsigned CallingConv, bool isTailCall,
SDValue Callee,
ArgListTy &Args, SelectionDAG &DAG) {
+ assert((!isTailCall || PerformTailCallOpt) &&
+ "isTailCall set when tail-call optimizations are disabled!");
+
SmallVector<SDValue, 32> Ops;
Ops.push_back(Chain); // Op#0 - Chain
- Ops.push_back(DAG.getConstant(CallingConv, getPointerTy())); // Op#1 - CC
- Ops.push_back(DAG.getConstant(isVarArg, getPointerTy())); // Op#2 - VarArg
- Ops.push_back(DAG.getConstant(isTailCall, getPointerTy())); // Op#3 - Tail
Ops.push_back(Callee);
// Handle all of the outgoing arguments.
Value != NumValues; ++Value) {
MVT VT = ValueVTs[Value];
const Type *ArgTy = VT.getTypeForMVT();
- SDValue Op = SDValue(Args[i].Node.getNode(), Args[i].Node.getResNo() + Value);
+ SDValue Op = SDValue(Args[i].Node.getNode(),
+ Args[i].Node.getResNo() + Value);
ISD::ArgFlagsTy Flags;
unsigned OriginalAlignment =
getTargetData()->getABITypeAlignment(ArgTy);
LoweredRetTys.push_back(MVT::Other); // Always has a chain.
// Create the CALL node.
- SDValue Res = DAG.getNode(ISD::CALL,
- DAG.getVTList(&LoweredRetTys[0],
- LoweredRetTys.size()),
- &Ops[0], Ops.size());
+ SDValue Res = DAG.getCall(CallingConv, isVarArg, isTailCall, isInreg,
+ DAG.getVTList(&LoweredRetTys[0],
+ LoweredRetTys.size()),
+ &Ops[0], Ops.size()
+ );
Chain = Res.getValue(LoweredRetTys.size() - 1);
// Gather up the call result into a single value.
- if (RetTy != Type::VoidTy) {
+ if (RetTy != Type::VoidTy && !RetTys.empty()) {
ISD::NodeType AssertOp = ISD::DELETED_NODE;
if (RetSExt)
AssertOp);
ReturnValues.push_back(ReturnValue);
}
- Res = DAG.getMergeValues(DAG.getVTList(&RetTys[0], RetTys.size()),
- &ReturnValues[0], ReturnValues.size());
+ Res = DAG.getNode(ISD::MERGE_VALUES,
+ DAG.getVTList(&RetTys[0], RetTys.size()),
+ &ReturnValues[0], ReturnValues.size());
}
return std::make_pair(Res, Chain);
// exactly one register for each non-void instruction.
MVT VT = TLI.getValueType(PN->getType(), /*AllowUnknown=*/true);
if (VT == MVT::Other || !TLI.isTypeLegal(VT)) {
- SDL->PHINodesToUpdate.resize(OrigNumPHINodesToUpdate);
- return false;
+ // Promote MVT::i1.
+ if (VT == MVT::i1)
+ VT = TLI.getTypeToTransformTo(VT);
+ else {
+ SDL->PHINodesToUpdate.resize(OrigNumPHINodesToUpdate);
+ return false;
+ }
}
Value *PHIOp = PN->getIncomingValueForBlock(LLVMBB);