Replace Count{Leading,Trailing}Zeros_{32,64} with count{Leading,Trailing}Zeros.

[oota-llvm.git] / lib / CodeGen / SelectionDAG / SelectionDAGBuilder.cpp
diff --git a/lib/CodeGen/SelectionDAG/SelectionDAGBuilder.cpp b/lib/CodeGen/SelectionDAG/SelectionDAGBuilder.cpp

index 9c5148f0cd6446c5007157e3ff505d4ce0817815..9799568e03d01e3cbdc9feb38d90030dae83cc53 100644 (file)
--- a/lib/CodeGen/SelectionDAG/SelectionDAGBuilder.cpp
+++ b/lib/CodeGen/SelectionDAG/SelectionDAGBuilder.cpp
@@ -12,51 +12,51 @@
  //===----------------------------------------------------------------------===//
  
  #define DEBUG_TYPE "isel"
-#include "SDNodeDbgValue.h"
  #include "SelectionDAGBuilder.h"
+#include "SDNodeDbgValue.h"
  #include "llvm/ADT/BitVector.h"
-#include "llvm/ADT/PostOrderIterator.h"
  #include "llvm/ADT/SmallSet.h"
  #include "llvm/Analysis/AliasAnalysis.h"
+#include "llvm/Analysis/BranchProbabilityInfo.h"
  #include "llvm/Analysis/ConstantFolding.h"
  #include "llvm/Analysis/ValueTracking.h"
-#include "llvm/Constants.h"
-#include "llvm/CallingConv.h"
-#include "llvm/DebugInfo.h"
-#include "llvm/DerivedTypes.h"
-#include "llvm/Function.h"
-#include "llvm/GlobalVariable.h"
-#include "llvm/InlineAsm.h"
-#include "llvm/Instructions.h"
-#include "llvm/Intrinsics.h"
-#include "llvm/IntrinsicInst.h"
-#include "llvm/LLVMContext.h"
-#include "llvm/Module.h"
  #include "llvm/CodeGen/Analysis.h"
  #include "llvm/CodeGen/FastISel.h"
  #include "llvm/CodeGen/FunctionLoweringInfo.h"
-#include "llvm/CodeGen/GCStrategy.h"
  #include "llvm/CodeGen/GCMetadata.h"
-#include "llvm/CodeGen/MachineFunction.h"
+#include "llvm/CodeGen/GCStrategy.h"
  #include "llvm/CodeGen/MachineFrameInfo.h"
+#include "llvm/CodeGen/MachineFunction.h"
  #include "llvm/CodeGen/MachineInstrBuilder.h"
  #include "llvm/CodeGen/MachineJumpTableInfo.h"
  #include "llvm/CodeGen/MachineModuleInfo.h"
  #include "llvm/CodeGen/MachineRegisterInfo.h"
  #include "llvm/CodeGen/SelectionDAG.h"
-#include "llvm/DataLayout.h"
+#include "llvm/DebugInfo.h"
+#include "llvm/IR/CallingConv.h"
+#include "llvm/IR/Constants.h"
+#include "llvm/IR/DataLayout.h"
+#include "llvm/IR/DerivedTypes.h"
+#include "llvm/IR/Function.h"
+#include "llvm/IR/GlobalVariable.h"
+#include "llvm/IR/InlineAsm.h"
+#include "llvm/IR/Instructions.h"
+#include "llvm/IR/IntrinsicInst.h"
+#include "llvm/IR/Intrinsics.h"
+#include "llvm/IR/LLVMContext.h"
+#include "llvm/IR/Module.h"
+#include "llvm/Support/CommandLine.h"
+#include "llvm/Support/Debug.h"
+#include "llvm/Support/ErrorHandling.h"
+#include "llvm/Support/IntegersSubsetMapping.h"
+#include "llvm/Support/MathExtras.h"
+#include "llvm/Support/raw_ostream.h"
  #include "llvm/Target/TargetFrameLowering.h"
  #include "llvm/Target/TargetInstrInfo.h"
  #include "llvm/Target/TargetIntrinsicInfo.h"
  #include "llvm/Target/TargetLibraryInfo.h"
  #include "llvm/Target/TargetLowering.h"
  #include "llvm/Target/TargetOptions.h"
-#include "llvm/Support/CommandLine.h"
-#include "llvm/Support/IntegersSubsetMapping.h"
-#include "llvm/Support/Debug.h"
-#include "llvm/Support/ErrorHandling.h"
-#include "llvm/Support/MathExtras.h"
-#include "llvm/Support/raw_ostream.h"
  #include <algorithm>
  using namespace llvm;
  
@@ -89,7 +89,7 @@ static const unsigned MaxParallelChains = 64;
  
  static SDValue getCopyFromPartsVector(SelectionDAG &DAG, DebugLoc DL,
                                        const SDValue *Parts, unsigned NumParts,
-                                      EVT PartVT, EVT ValueVT, const Value *V);
+                                      MVT PartVT, EVT ValueVT, const Value *V);
  
  /// getCopyFromParts - Create a value that contains the specified legal parts
  /// combined into the value they represent.  If the parts combine to a type
@@ -98,7 +98,7 @@ static SDValue getCopyFromPartsVector(SelectionDAG &DAG, DebugLoc DL,
  /// (ISD::AssertSext).
  static SDValue getCopyFromParts(SelectionDAG &DAG, DebugLoc DL,
                                  const SDValue *Parts,
-                                unsigned NumParts, EVT PartVT, EVT ValueVT,
+                                unsigned NumParts, MVT PartVT, EVT ValueVT,
                                  const Value *V,
                                  ISD::NodeType AssertOp = ISD::DELETED_NODE) {
    if (ValueVT.isVector())
@@ -161,7 +161,7 @@ static SDValue getCopyFromParts(SelectionDAG &DAG, DebugLoc DL,
        }
      } else if (PartVT.isFloatingPoint()) {
        // FP split into multiple FP parts (for ppcf128)
-      assert(ValueVT == EVT(MVT::ppcf128) && PartVT == EVT(MVT::f64) &&
+      assert(ValueVT == EVT(MVT::ppcf128) && PartVT == MVT::f64 &&
               "Unexpected split");
        SDValue Lo, Hi;
        Lo = DAG.getNode(ISD::BITCAST, DL, EVT(MVT::f64), Parts[0]);
@@ -179,25 +179,25 @@ static SDValue getCopyFromParts(SelectionDAG &DAG, DebugLoc DL,
    }
  
    // There is now one part, held in Val.  Correct it to match ValueVT.
-  PartVT = Val.getValueType();
+  EVT PartEVT = Val.getValueType();
  
-  if (PartVT == ValueVT)
+  if (PartEVT == ValueVT)
      return Val;
  
-  if (PartVT.isInteger() && ValueVT.isInteger()) {
-    if (ValueVT.bitsLT(PartVT)) {
+  if (PartEVT.isInteger() && ValueVT.isInteger()) {
+    if (ValueVT.bitsLT(PartEVT)) {
        // For a truncate, see if we have any information to
        // indicate whether the truncated bits will always be
        // zero or sign-extension.
        if (AssertOp != ISD::DELETED_NODE)
-        Val = DAG.getNode(AssertOp, DL, PartVT, Val,
+        Val = DAG.getNode(AssertOp, DL, PartEVT, Val,
                            DAG.getValueType(ValueVT));
        return DAG.getNode(ISD::TRUNCATE, DL, ValueVT, Val);
      }
      return DAG.getNode(ISD::ANY_EXTEND, DL, ValueVT, Val);
    }
  
-  if (PartVT.isFloatingPoint() && ValueVT.isFloatingPoint()) {
+  if (PartEVT.isFloatingPoint() && ValueVT.isFloatingPoint()) {
      // FP_ROUND's are always exact here.
      if (ValueVT.bitsLT(Val.getValueType()))
        return DAG.getNode(ISD::FP_ROUND, DL, ValueVT, Val,
@@ -206,7 +206,7 @@ static SDValue getCopyFromParts(SelectionDAG &DAG, DebugLoc DL,
      return DAG.getNode(ISD::FP_EXTEND, DL, ValueVT, Val);
    }
  
-  if (PartVT.getSizeInBits() == ValueVT.getSizeInBits())
+  if (PartEVT.getSizeInBits() == ValueVT.getSizeInBits())
      return DAG.getNode(ISD::BITCAST, DL, ValueVT, Val);
  
    llvm_unreachable("Unknown mismatch!");
@@ -219,7 +219,7 @@ static SDValue getCopyFromParts(SelectionDAG &DAG, DebugLoc DL,
  /// ValueVT (ISD::AssertSext).
  static SDValue getCopyFromPartsVector(SelectionDAG &DAG, DebugLoc DL,
                                        const SDValue *Parts, unsigned NumParts,
-                                      EVT PartVT, EVT ValueVT, const Value *V) {
+                                      MVT PartVT, EVT ValueVT, const Value *V) {
    assert(ValueVT.isVector() && "Not a vector value");
    assert(NumParts > 0 && "No parts to assemble!");
    const TargetLowering &TLI = DAG.getTargetLoweringInfo();
@@ -227,7 +227,8 @@ static SDValue getCopyFromPartsVector(SelectionDAG &DAG, DebugLoc DL,
  
    // Handle a multi-element vector.
    if (NumParts > 1) {
-    EVT IntermediateVT, RegisterVT;
+    EVT IntermediateVT;
+    MVT RegisterVT;
      unsigned NumIntermediates;
      unsigned NumRegs =
      TLI.getVectorTypeBreakdown(*DAG.getContext(), ValueVT, IntermediateVT,
@@ -235,7 +236,7 @@ static SDValue getCopyFromPartsVector(SelectionDAG &DAG, DebugLoc DL,
      assert(NumRegs == NumParts && "Part count doesn't match vector breakdown!");
      NumParts = NumRegs; // Silence a compiler warning.
      assert(RegisterVT == PartVT && "Part type doesn't match vector breakdown!");
-    assert(RegisterVT == Parts[0].getValueType() &&
+    assert(RegisterVT == Parts[0].getSimpleValueType() &&
             "Part type doesn't match part!");
  
      // Assemble the parts into intermediate operands.
@@ -265,31 +266,31 @@ static SDValue getCopyFromPartsVector(SelectionDAG &DAG, DebugLoc DL,
    }
  
    // There is now one part, held in Val.  Correct it to match ValueVT.
-  PartVT = Val.getValueType();
+  EVT PartEVT = Val.getValueType();
  
-  if (PartVT == ValueVT)
+  if (PartEVT == ValueVT)
      return Val;
  
-  if (PartVT.isVector()) {
+  if (PartEVT.isVector()) {
      // If the element type of the source/dest vectors are the same, but the
      // parts vector has more elements than the value vector, then we have a
      // vector widening case (e.g. <2 x float> -> <4 x float>).  Extract the
      // elements we want.
-    if (PartVT.getVectorElementType() == ValueVT.getVectorElementType()) {
-      assert(PartVT.getVectorNumElements() > ValueVT.getVectorNumElements() &&
+    if (PartEVT.getVectorElementType() == ValueVT.getVectorElementType()) {
+      assert(PartEVT.getVectorNumElements() > ValueVT.getVectorNumElements() &&
               "Cannot narrow, it would be a lossy transformation");
        return DAG.getNode(ISD::EXTRACT_SUBVECTOR, DL, ValueVT, Val,
                           DAG.getIntPtrConstant(0));
      }
  
      // Vector/Vector bitcast.
-    if (ValueVT.getSizeInBits() == PartVT.getSizeInBits())
+    if (ValueVT.getSizeInBits() == PartEVT.getSizeInBits())
        return DAG.getNode(ISD::BITCAST, DL, ValueVT, Val);
  
-    assert(PartVT.getVectorNumElements() == ValueVT.getVectorNumElements() &&
+    assert(PartEVT.getVectorNumElements() == ValueVT.getVectorNumElements() &&
        "Cannot handle this kind of promotion");
      // Promoted vector extract
-    bool Smaller = ValueVT.bitsLE(PartVT);
+    bool Smaller = ValueVT.bitsLE(PartEVT);
      return DAG.getNode((Smaller ? ISD::TRUNCATE : ISD::ANY_EXTEND),
                         DL, ValueVT, Val);
  
@@ -297,7 +298,7 @@ static SDValue getCopyFromPartsVector(SelectionDAG &DAG, DebugLoc DL,
  
    // Trivial bitcast if the types are the same size and the destination
    // vector type is legal.
-  if (PartVT.getSizeInBits() == ValueVT.getSizeInBits() &&
+  if (PartEVT.getSizeInBits() == ValueVT.getSizeInBits() &&
        TLI.isTypeLegal(ValueVT))
      return DAG.getNode(ISD::BITCAST, DL, ValueVT, Val);
  
@@ -313,12 +314,12 @@ static SDValue getCopyFromPartsVector(SelectionDAG &DAG, DebugLoc DL,
      } else {
        Ctx.emitError(ErrMsg);
      }
-    report_fatal_error("Cannot handle scalar-to-vector conversion!");
+    return DAG.getUNDEF(ValueVT);
    }
  
    if (ValueVT.getVectorNumElements() == 1 &&
-      ValueVT.getVectorElementType() != PartVT) {
-    bool Smaller = ValueVT.bitsLE(PartVT);
+      ValueVT.getVectorElementType() != PartEVT) {
+    bool Smaller = ValueVT.bitsLE(PartEVT);
      Val = DAG.getNode((Smaller ? ISD::TRUNCATE : ISD::ANY_EXTEND),
                         DL, ValueVT.getScalarType(), Val);
    }
@@ -328,14 +329,14 @@ static SDValue getCopyFromPartsVector(SelectionDAG &DAG, DebugLoc DL,
  
  static void getCopyToPartsVector(SelectionDAG &DAG, DebugLoc dl,
                                   SDValue Val, SDValue *Parts, unsigned NumParts,
-                                 EVT PartVT, const Value *V);
+                                 MVT PartVT, const Value *V);
  
  /// getCopyToParts - Create a series of nodes that contain the specified value
  /// split into legal parts.  If the parts contain more bits than Val, then, for
  /// integers, ExtendKind can be used to specify how to generate the extra bits.
  static void getCopyToParts(SelectionDAG &DAG, DebugLoc DL,
                             SDValue Val, SDValue *Parts, unsigned NumParts,
-                           EVT PartVT, const Value *V,
+                           MVT PartVT, const Value *V,
                             ISD::NodeType ExtendKind = ISD::ANY_EXTEND) {
    EVT ValueVT = Val.getValueType();
  
@@ -352,7 +353,8 @@ static void getCopyToParts(SelectionDAG &DAG, DebugLoc DL,
      return;
  
    assert(!ValueVT.isVector() && "Vector case handled elsewhere");
-  if (PartVT == ValueVT) {
+  EVT PartEVT = PartVT;
+  if (PartEVT == ValueVT) {
      assert(NumParts == 1 && "No-op copy with multiple parts!");
      Parts[0] = Val;
      return;
@@ -374,7 +376,7 @@ static void getCopyToParts(SelectionDAG &DAG, DebugLoc DL,
      }
    } else if (PartBits == ValueVT.getSizeInBits()) {
      // Different types of the same size.
-    assert(NumParts == 1 && PartVT != ValueVT);
+    assert(NumParts == 1 && PartEVT != ValueVT);
      Val = DAG.getNode(ISD::BITCAST, DL, PartVT, Val);
    } else if (NumParts * PartBits < ValueVT.getSizeInBits()) {
      // If the parts cover less bits than value has, truncate the value.
@@ -393,7 +395,7 @@ static void getCopyToParts(SelectionDAG &DAG, DebugLoc DL,
           "Failed to tile the value with PartVT!");
  
    if (NumParts == 1) {
-    if (PartVT != ValueVT) {
+    if (PartEVT != ValueVT) {
        LLVMContext &Ctx = *DAG.getContext();
        Twine ErrMsg("scalar-to-vector conversion failed");
        if (const Instruction *I = dyn_cast_or_null<Instruction>(V)) {
@@ -466,20 +468,21 @@ static void getCopyToParts(SelectionDAG &DAG, DebugLoc DL,
  /// value split into legal parts.
  static void getCopyToPartsVector(SelectionDAG &DAG, DebugLoc DL,
                                   SDValue Val, SDValue *Parts, unsigned NumParts,
-                                 EVT PartVT, const Value *V) {
+                                 MVT PartVT, const Value *V) {
    EVT ValueVT = Val.getValueType();
    assert(ValueVT.isVector() && "Not a vector");
    const TargetLowering &TLI = DAG.getTargetLoweringInfo();
  
    if (NumParts == 1) {
-    if (PartVT == ValueVT) {
+    EVT PartEVT = PartVT;
+    if (PartEVT == ValueVT) {
        // Nothing to do.
      } else if (PartVT.getSizeInBits() == ValueVT.getSizeInBits()) {
        // Bitconvert vector->vector case.
        Val = DAG.getNode(ISD::BITCAST, DL, PartVT, Val);
      } else if (PartVT.isVector() &&
-               PartVT.getVectorElementType() == ValueVT.getVectorElementType() &&
-               PartVT.getVectorNumElements() > ValueVT.getVectorNumElements()) {
+               PartEVT.getVectorElementType() == ValueVT.getVectorElementType() &&
+               PartEVT.getVectorNumElements() > ValueVT.getVectorNumElements()) {
        EVT ElementVT = PartVT.getVectorElementType();
        // Vector widening case, e.g. <2 x float> -> <4 x float>.  Shuffle in
        // undef elements.
@@ -499,12 +502,12 @@ static void getCopyToPartsVector(SelectionDAG &DAG, DebugLoc DL,
        //SDValue UndefElts = DAG.getUNDEF(VectorTy);
        //Val = DAG.getNode(ISD::CONCAT_VECTORS, DL, PartVT, Val, UndefElts);
      } else if (PartVT.isVector() &&
-               PartVT.getVectorElementType().bitsGE(
+               PartEVT.getVectorElementType().bitsGE(
                   ValueVT.getVectorElementType()) &&
-               PartVT.getVectorNumElements() == ValueVT.getVectorNumElements()) {
+               PartEVT.getVectorNumElements() == ValueVT.getVectorNumElements()) {
  
        // Promoted vector extract
-      bool Smaller = PartVT.bitsLE(ValueVT);
+      bool Smaller = PartEVT.bitsLE(ValueVT);
        Val = DAG.getNode((Smaller ? ISD::TRUNCATE : ISD::ANY_EXTEND),
                          DL, PartVT, Val);
      } else{
@@ -524,7 +527,8 @@ static void getCopyToPartsVector(SelectionDAG &DAG, DebugLoc DL,
    }
  
    // Handle a multi-element vector.
-  EVT IntermediateVT, RegisterVT;
+  EVT IntermediateVT;
+  MVT RegisterVT;
    unsigned NumIntermediates;
    unsigned NumRegs = TLI.getVectorTypeBreakdown(*DAG.getContext(), ValueVT,
                                                  IntermediateVT,
@@ -589,7 +593,7 @@ namespace {
      /// getRegisterType member function, however when with physical registers
      /// it is necessary to have a separate record of the types.
      ///
-    SmallVector<EVT, 4> RegVTs;
+    SmallVector<MVT, 4> RegVTs;
  
      /// Regs - This list holds the registers assigned to the values.
      /// Each legal or promoted value requires one register, and each
@@ -600,7 +604,7 @@ namespace {
      RegsForValue() {}
  
      RegsForValue(const SmallVector<unsigned, 4> &regs,
-                 EVT regvt, EVT valuevt)
+                 MVT regvt, EVT valuevt)
        : ValueVTs(1, valuevt), RegVTs(1, regvt), Regs(regs) {}
  
      RegsForValue(LLVMContext &Context, const TargetLowering &tli,
@@ -610,7 +614,7 @@ namespace {
        for (unsigned Value = 0, e = ValueVTs.size(); Value != e; ++Value) {
          EVT ValueVT = ValueVTs[Value];
          unsigned NumRegs = tli.getNumRegisters(Context, ValueVT);
-        EVT RegisterVT = tli.getRegisterType(Context, ValueVT);
+        MVT RegisterVT = tli.getRegisterType(Context, ValueVT);
          for (unsigned i = 0; i != NumRegs; ++i)
            Regs.push_back(Reg + i);
          RegVTs.push_back(RegisterVT);
@@ -621,7 +625,7 @@ namespace {
      /// areValueTypesLegal - Return true if types of all the values are legal.
      bool areValueTypesLegal(const TargetLowering &TLI) {
        for (unsigned Value = 0, e = ValueVTs.size(); Value != e; ++Value) {
-        EVT RegisterVT = RegVTs[Value];
+        MVT RegisterVT = RegVTs[Value];
          if (!TLI.isTypeLegal(RegisterVT))
            return false;
        }
@@ -683,7 +687,7 @@ SDValue RegsForValue::getCopyFromRegs(SelectionDAG &DAG,
      // Copy the legal parts from the registers.
      EVT ValueVT = ValueVTs[Value];
      unsigned NumRegs = TLI.getNumRegisters(*DAG.getContext(), ValueVT);
-    EVT RegisterVT = RegVTs[Value];
+    MVT RegisterVT = RegVTs[Value];
  
      Parts.resize(NumRegs);
      for (unsigned i = 0; i != NumRegs; ++i) {
@@ -768,10 +772,12 @@ void RegsForValue::getCopyToRegs(SDValue Val, SelectionDAG &DAG, DebugLoc dl,
    for (unsigned Value = 0, Part = 0, e = ValueVTs.size(); Value != e; ++Value) {
      EVT ValueVT = ValueVTs[Value];
      unsigned NumParts = TLI.getNumRegisters(*DAG.getContext(), ValueVT);
-    EVT RegisterVT = RegVTs[Value];
+    MVT RegisterVT = RegVTs[Value];
+    ISD::NodeType ExtendKind =
+      TLI.isZExtFree(Val, RegisterVT)? ISD::ZERO_EXTEND: ISD::ANY_EXTEND;
  
      getCopyToParts(DAG, dl, Val.getValue(Val.getResNo() + Value),
-                   &Parts[Part], NumParts, RegisterVT, V);
+                   &Parts[Part], NumParts, RegisterVT, V, ExtendKind);
      Part += NumParts;
    }
  
@@ -834,7 +840,7 @@ void RegsForValue::AddInlineAsmOperands(unsigned Code, bool HasMatching,
  
    for (unsigned Value = 0, Reg = 0, e = ValueVTs.size(); Value != e; ++Value) {
      unsigned NumRegs = TLI.getNumRegisters(*DAG.getContext(), ValueVTs[Value]);
-    EVT RegisterVT = RegVTs[Value];
+    MVT RegisterVT = RegVTs[Value];
      for (unsigned i = 0; i != NumRegs; ++i) {
        assert(Reg < Regs.size() && "Mismatch in # registers expected");
        Ops.push_back(DAG.getRegister(Regs[Reg++], RegisterVT));
@@ -967,7 +973,7 @@ void SelectionDAGBuilder::visit(unsigned Opcode, const User &I) {
      // Build the switch statement using the Instruction.def file.
  #define HANDLE_INST(NUM, OPCODE, CLASS) \
      case Instruction::OPCODE: visit##OPCODE((const CLASS&)I); break;
-#include "llvm/Instruction.def"
+#include "llvm/IR/Instruction.def"
    }
  
    // Assign the ordering to the freshly created DAG nodes.
@@ -996,7 +1002,7 @@ void SelectionDAGBuilder::resolveDanglingDebugInfo(const Value *V,
          DAG.AddDbgValue(SDV, Val.getNode(), false);
        }
      } else
-      DEBUG(dbgs() << "Dropping debug info for " << DI << "\n");
+      DEBUG(dbgs() << "Dropping debug info for " << *DI << "\n");
      DanglingDebugInfoMap[V] = DanglingDebugInfo();
    }
  }
@@ -1227,16 +1233,18 @@ void SelectionDAGBuilder::visitRet(const ReturnInst &I) {
          ISD::NodeType ExtendKind = ISD::ANY_EXTEND;
  
          const Function *F = I.getParent()->getParent();
-        if (F->getRetAttributes().hasSExtAttr())
+        if (F->getAttributes().hasAttribute(AttributeSet::ReturnIndex,
+                                            Attribute::SExt))
            ExtendKind = ISD::SIGN_EXTEND;
-        else if (F->getRetAttributes().hasZExtAttr())
+        else if (F->getAttributes().hasAttribute(AttributeSet::ReturnIndex,
+                                                 Attribute::ZExt))
            ExtendKind = ISD::ZERO_EXTEND;
  
          if (ExtendKind != ISD::ANY_EXTEND && VT.isInteger())
-          VT = TLI.getTypeForExtArgOrReturn(*DAG.getContext(), VT, ExtendKind);
+          VT = TLI.getTypeForExtArgOrReturn(VT.getSimpleVT(), ExtendKind);
  
          unsigned NumParts = TLI.getNumRegisters(*DAG.getContext(), VT);
-        EVT PartVT = TLI.getRegisterType(*DAG.getContext(), VT);
+        MVT PartVT = TLI.getRegisterType(*DAG.getContext(), VT);
          SmallVector<SDValue, 4> Parts(NumParts);
          getCopyToParts(DAG, getCurDebugLoc(),
                         SDValue(RetOp.getNode(), RetOp.getResNo() + j),
@@ -1244,7 +1252,8 @@ void SelectionDAGBuilder::visitRet(const ReturnInst &I) {
  
          // 'inreg' on function refers to return value
          ISD::ArgFlagsTy Flags = ISD::ArgFlagsTy();
-        if (F->getRetAttributes().hasInRegAttr())
+        if (F->getAttributes().hasAttribute(AttributeSet::ReturnIndex,
+                                            Attribute::InReg))
            Flags.setInReg();
  
          // Propagate extension type if any
@@ -1255,7 +1264,7 @@ void SelectionDAGBuilder::visitRet(const ReturnInst &I) {
  
          for (unsigned i = 0; i < NumParts; ++i) {
            Outs.push_back(ISD::OutputArg(Flags, Parts[i].getValueType(),
-                                        /*isfixed=*/true));
+                                        /*isfixed=*/true, 0, 0));
            OutVals.push_back(Parts[i]);
          }
        }
@@ -1701,8 +1710,10 @@ void SelectionDAGBuilder::visitJumpTableHeader(JumpTable &JT,
    // for the switch statement if the value being switched on exceeds the largest
    // case in the switch.
    SDValue CMP = DAG.getSetCC(getCurDebugLoc(),
-                             TLI.getSetCCResultType(Sub.getValueType()), Sub,
-                             DAG.getConstant(JTH.Last-JTH.First,VT),
+                             TLI.getSetCCResultType(*DAG.getContext(),
+                                                    Sub.getValueType()),
+                             Sub,
+                             DAG.getConstant(JTH.Last - JTH.First,VT),
                               ISD::SETUGT);
  
    // Set NextBlock to be the MBB immediately after the current one, if any.
@@ -1736,7 +1747,8 @@ void SelectionDAGBuilder::visitBitTestHeader(BitTestBlock &B,
  
    // Check range
    SDValue RangeCmp = DAG.getSetCC(getCurDebugLoc(),
-                                  TLI.getSetCCResultType(Sub.getValueType()),
+                                  TLI.getSetCCResultType(*DAG.getContext(),
+                                                         Sub.getValueType()),
                                    Sub, DAG.getConstant(B.Range, VT),
                                    ISD::SETUGT);
  
@@ -1758,8 +1770,8 @@ void SelectionDAGBuilder::visitBitTestHeader(BitTestBlock &B,
      Sub = DAG.getZExtOrTrunc(Sub, getCurDebugLoc(), VT);
    }
  
-  B.RegVT = VT;
-  B.Reg = FuncInfo.CreateReg(VT);
+  B.RegVT = VT.getSimpleVT();
+  B.Reg = FuncInfo.CreateReg(B.RegVT);
    SDValue CopyTo = DAG.getCopyToReg(getControlRoot(), getCurDebugLoc(),
                                      B.Reg, Sub);
  
@@ -1793,7 +1805,7 @@ void SelectionDAGBuilder::visitBitTestCase(BitTestBlock &BB,
                                             unsigned Reg,
                                             BitTestCase &B,
                                             MachineBasicBlock *SwitchBB) {
-  EVT VT = BB.RegVT;
+  MVT VT = BB.RegVT;
    SDValue ShiftOp = DAG.getCopyFromReg(getControlRoot(), getCurDebugLoc(),
                                         Reg, VT);
    SDValue Cmp;
@@ -1802,14 +1814,14 @@ void SelectionDAGBuilder::visitBitTestCase(BitTestBlock &BB,
      // Testing for a single bit; just compare the shift count with what it
      // would need to be to shift a 1 bit in that position.
      Cmp = DAG.getSetCC(getCurDebugLoc(),
-                       TLI.getSetCCResultType(VT),
+                       TLI.getSetCCResultType(*DAG.getContext(), VT),
                         ShiftOp,
-                       DAG.getConstant(CountTrailingZeros_64(B.Mask), VT),
+                       DAG.getConstant(countTrailingZeros(B.Mask), VT),
                         ISD::SETEQ);
    } else if (PopCount == BB.Range) {
      // There is only one zero bit in the range, test for it directly.
      Cmp = DAG.getSetCC(getCurDebugLoc(),
-                       TLI.getSetCCResultType(VT),
+                       TLI.getSetCCResultType(*DAG.getContext(), VT),
                         ShiftOp,
                         DAG.getConstant(CountTrailingOnes_64(B.Mask), VT),
                         ISD::SETNE);
@@ -1822,7 +1834,7 @@ void SelectionDAGBuilder::visitBitTestCase(BitTestBlock &BB,
      SDValue AndOp = DAG.getNode(ISD::AND, getCurDebugLoc(),
                                  VT, SwitchVal, DAG.getConstant(B.Mask, VT));
      Cmp = DAG.getSetCC(getCurDebugLoc(),
-                       TLI.getSetCCResultType(VT),
+                       TLI.getSetCCResultType(*DAG.getContext(), VT),
                         AndOp, DAG.getConstant(0, VT),
                         ISD::SETNE);
    }
@@ -2604,14 +2616,14 @@ void SelectionDAGBuilder::visitIndirectBr(const IndirectBrInst &I) {
    MachineBasicBlock *IndirectBrMBB = FuncInfo.MBB;
  
    // Update machine-CFG edges with unique successors.
-  SmallVector<BasicBlock*, 32> succs;
-  succs.reserve(I.getNumSuccessors());
-  for (unsigned i = 0, e = I.getNumSuccessors(); i != e; ++i)
-    succs.push_back(I.getSuccessor(i));
-  array_pod_sort(succs.begin(), succs.end());
-  succs.erase(std::unique(succs.begin(), succs.end()), succs.end());
-  for (unsigned i = 0, e = succs.size(); i != e; ++i) {
-    MachineBasicBlock *Succ = FuncInfo.MBBMap[succs[i]];
+  SmallSet<BasicBlock*, 32> Done;
+  for (unsigned i = 0, e = I.getNumSuccessors(); i != e; ++i) {
+    BasicBlock *BB = I.getSuccessor(i);
+    bool Inserted = Done.insert(BB);
+    if (!Inserted)
+        continue;
+
+    MachineBasicBlock *Succ = FuncInfo.MBBMap[BB];
      addSuccessorWithWeight(IndirectBrMBB, Succ);
    }
  
@@ -2645,7 +2657,7 @@ void SelectionDAGBuilder::visitShift(const User &I, unsigned Opcode) {
    SDValue Op1 = getValue(I.getOperand(0));
    SDValue Op2 = getValue(I.getOperand(1));
  
-  MVT ShiftTy = TLI.getShiftAmountTy(Op2.getValueType());
+  EVT ShiftTy = TLI.getShiftAmountTy(Op2.getValueType());
  
    // Coerce the shift amount to the right type if we can.
    if (!I.getType()->isVectorTy() && Op2.getValueType() != ShiftTy) {
@@ -3137,12 +3149,12 @@ void SelectionDAGBuilder::visitGetElementPtr(const User &I) {
         OI != E; ++OI) {
      const Value *Idx = *OI;
      if (StructType *StTy = dyn_cast<StructType>(Ty)) {
-      unsigned Field = cast<ConstantInt>(Idx)->getZExtValue();
+      unsigned Field = cast<Constant>(Idx)->getUniqueInteger().getZExtValue();
        if (Field) {
          // N = N + Offset
          uint64_t Offset = TD->getStructLayout(StTy)->getElementOffset(Field);
          N = DAG.getNode(ISD::ADD, getCurDebugLoc(), N.getValueType(), N,
-                        DAG.getIntPtrConstant(Offset));
+                        DAG.getConstant(Offset, N.getValueType()));
        }
  
        Ty = StTy->getElementType(Field);
@@ -3187,7 +3199,7 @@ void SelectionDAGBuilder::visitGetElementPtr(const User &I) {
                               N.getValueType(), IdxN,
                               DAG.getConstant(Amt, IdxN.getValueType()));
          } else {
-          SDValue Scale = DAG.getConstant(ElementSize, TLI.getPointerTy());
+          SDValue Scale = DAG.getConstant(ElementSize, IdxN.getValueType());
            IdxN = DAG.getNode(ISD::MUL, getCurDebugLoc(),
                               N.getValueType(), IdxN, Scale);
          }
@@ -3510,7 +3522,7 @@ void SelectionDAGBuilder::visitAtomicLoad(const LoadInst &I) {
  
    EVT VT = TLI.getValueType(I.getType());
  
-  if (I.getAlignment() * 8 < VT.getSizeInBits())
+  if (I.getAlignment() < VT.getSizeInBits() / 8)
      report_fatal_error("Cannot generate unaligned atomic load");
  
    SDValue L =
@@ -3540,7 +3552,7 @@ void SelectionDAGBuilder::visitAtomicStore(const StoreInst &I) {
  
    EVT VT = TLI.getValueType(I.getValueOperand()->getType());
  
-  if (I.getAlignment() * 8 < VT.getSizeInBits())
+  if (I.getAlignment() < VT.getSizeInBits() / 8)
      report_fatal_error("Cannot generate unaligned atomic store");
  
    if (TLI.getInsertFencesForAtomic())
@@ -3654,7 +3666,7 @@ void SelectionDAGBuilder::visitTargetIntrinsic(const CallInst &I,
  ///
  ///   Op = (Op & 0x007fffff) | 0x3f800000;
  ///
-/// where Op is the hexidecimal representation of floating point value.
+/// where Op is the hexadecimal representation of a floating-point value.
  static SDValue
  GetSignificand(SelectionDAG &DAG, SDValue Op, DebugLoc dl) {
    SDValue t1 = DAG.getNode(ISD::AND, dl, MVT::i32, Op,
@@ -3668,7 +3680,7 @@ GetSignificand(SelectionDAG &DAG, SDValue Op, DebugLoc dl) {
  ///
  ///   (float)(int)(((Op & 0x7f800000) >> 23) - 127);
  ///
-/// where Op is the hexidecimal representation of floating point value.
+/// where Op is the hexadecimal representation of a floating-point value.
  static SDValue
  GetExponent(SelectionDAG &DAG, SDValue Op, const TargetLowering &TLI,
              DebugLoc dl) {
@@ -3684,19 +3696,16 @@ GetExponent(SelectionDAG &DAG, SDValue Op, const TargetLowering &TLI,
  /// getF32Constant - Get 32-bit floating point constant.
  static SDValue
  getF32Constant(SelectionDAG &DAG, unsigned Flt) {
-  return DAG.getConstantFP(APFloat(APInt(32, Flt)), MVT::f32);
+  return DAG.getConstantFP(APFloat(APFloat::IEEEsingle, APInt(32, Flt)),
+                           MVT::f32);
  }
  
-/// visitExp - Lower an exp intrinsic. Handles the special sequences for
+/// expandExp - Lower an exp intrinsic. Handles the special sequences for
  /// limited-precision mode.
-void
-SelectionDAGBuilder::visitExp(const CallInst &I) {
-  SDValue result;
-  DebugLoc dl = getCurDebugLoc();
-
-  if (getValue(I.getArgOperand(0)).getValueType() == MVT::f32 &&
+static SDValue expandExp(DebugLoc dl, SDValue Op, SelectionDAG &DAG,
+                         const TargetLowering &TLI) {
+  if (Op.getValueType() == MVT::f32 &&
        LimitFloatPrecision > 0 && LimitFloatPrecision <= 18) {
-    SDValue Op = getValue(I.getArgOperand(0));
  
      // Put the exponent in the right bit position for later addition to the
      // final result:
@@ -3715,6 +3724,7 @@ SelectionDAGBuilder::visitExp(const CallInst &I) {
      IntegerPartOfX = DAG.getNode(ISD::SHL, dl, MVT::i32, IntegerPartOfX,
                                   DAG.getConstant(23, TLI.getPointerTy()));
  
+    SDValue TwoToFracPartOfX;
      if (LimitFloatPrecision <= 6) {
        // For floating-point precision of 6:
        //
@@ -3728,16 +3738,9 @@ SelectionDAGBuilder::visitExp(const CallInst &I) {
        SDValue t3 = DAG.getNode(ISD::FADD, dl, MVT::f32, t2,
                                 getF32Constant(DAG, 0x3f3c50c8));
        SDValue t4 = DAG.getNode(ISD::FMUL, dl, MVT::f32, t3, X);
-      SDValue t5 = DAG.getNode(ISD::FADD, dl, MVT::f32, t4,
-                               getF32Constant(DAG, 0x3f7f5e7e));
-      SDValue TwoToFracPartOfX = DAG.getNode(ISD::BITCAST, dl,MVT::i32, t5);
-
-      // Add the exponent into the result in integer domain.
-      SDValue t6 = DAG.getNode(ISD::ADD, dl, MVT::i32,
-                               TwoToFracPartOfX, IntegerPartOfX);
-
-      result = DAG.getNode(ISD::BITCAST, dl, MVT::f32, t6);
-    } else if (LimitFloatPrecision > 6 && LimitFloatPrecision <= 12) {
+      TwoToFracPartOfX = DAG.getNode(ISD::FADD, dl, MVT::f32, t4,
+                                     getF32Constant(DAG, 0x3f7f5e7e));
+    } else if (LimitFloatPrecision <= 12) {
        // For floating-point precision of 12:
        //
        //   TwoToFractionalPartOfX =
@@ -3754,16 +3757,9 @@ SelectionDAGBuilder::visitExp(const CallInst &I) {
        SDValue t5 = DAG.getNode(ISD::FADD, dl, MVT::f32, t4,
                                 getF32Constant(DAG, 0x3f324b07));
        SDValue t6 = DAG.getNode(ISD::FMUL, dl, MVT::f32, t5, X);
-      SDValue t7 = DAG.getNode(ISD::FADD, dl, MVT::f32, t6,
-                               getF32Constant(DAG, 0x3f7ff8fd));
-      SDValue TwoToFracPartOfX = DAG.getNode(ISD::BITCAST, dl,MVT::i32, t7);
-
-      // Add the exponent into the result in integer domain.
-      SDValue t8 = DAG.getNode(ISD::ADD, dl, MVT::i32,
-                               TwoToFracPartOfX, IntegerPartOfX);
-
-      result = DAG.getNode(ISD::BITCAST, dl, MVT::f32, t8);
-    } else { // LimitFloatPrecision > 12 && LimitFloatPrecision <= 18
+      TwoToFracPartOfX = DAG.getNode(ISD::FADD, dl, MVT::f32, t6,
+                                     getF32Constant(DAG, 0x3f7ff8fd));
+    } else { // LimitFloatPrecision <= 18
        // For floating-point precision of 18:
        //
        //   TwoToFractionalPartOfX =
@@ -3792,37 +3788,27 @@ SelectionDAGBuilder::visitExp(const CallInst &I) {
        SDValue t11 = DAG.getNode(ISD::FADD, dl, MVT::f32, t10,
                                  getF32Constant(DAG, 0x3f317234));
        SDValue t12 = DAG.getNode(ISD::FMUL, dl, MVT::f32, t11, X);
-      SDValue t13 = DAG.getNode(ISD::FADD, dl, MVT::f32, t12,
-                                getF32Constant(DAG, 0x3f800000));
-      SDValue TwoToFracPartOfX = DAG.getNode(ISD::BITCAST, dl,
-                                             MVT::i32, t13);
-
-      // Add the exponent into the result in integer domain.
-      SDValue t14 = DAG.getNode(ISD::ADD, dl, MVT::i32,
-                                TwoToFracPartOfX, IntegerPartOfX);
-
-      result = DAG.getNode(ISD::BITCAST, dl, MVT::f32, t14);
+      TwoToFracPartOfX = DAG.getNode(ISD::FADD, dl, MVT::f32, t12,
+                                     getF32Constant(DAG, 0x3f800000));
      }
-  } else {
-    // No special expansion.
-    result = DAG.getNode(ISD::FEXP, dl,
-                         getValue(I.getArgOperand(0)).getValueType(),
-                         getValue(I.getArgOperand(0)));
+
+    // Add the exponent into the result in integer domain.
+    SDValue t13 = DAG.getNode(ISD::BITCAST, dl, MVT::i32, TwoToFracPartOfX);
+    return DAG.getNode(ISD::BITCAST, dl, MVT::f32,
+                       DAG.getNode(ISD::ADD, dl, MVT::i32,
+                                   t13, IntegerPartOfX));
    }
  
-  setValue(&I, result);
+  // No special expansion.
+  return DAG.getNode(ISD::FEXP, dl, Op.getValueType(), Op);
  }
  
-/// visitLog - Lower a log intrinsic. Handles the special sequences for
+/// expandLog - Lower a log intrinsic. Handles the special sequences for
  /// limited-precision mode.
-void
-SelectionDAGBuilder::visitLog(const CallInst &I) {
-  SDValue result;
-  DebugLoc dl = getCurDebugLoc();
-
-  if (getValue(I.getArgOperand(0)).getValueType() == MVT::f32 &&
+static SDValue expandLog(DebugLoc dl, SDValue Op, SelectionDAG &DAG,
+                         const TargetLowering &TLI) {
+  if (Op.getValueType() == MVT::f32 &&
        LimitFloatPrecision > 0 && LimitFloatPrecision <= 18) {
-    SDValue Op = getValue(I.getArgOperand(0));
      SDValue Op1 = DAG.getNode(ISD::BITCAST, dl, MVT::i32, Op);
  
      // Scale the exponent by log(2) [0.69314718f].
@@ -3834,6 +3820,7 @@ SelectionDAGBuilder::visitLog(const CallInst &I) {
      // exponent of 1.
      SDValue X = GetSignificand(DAG, Op1, dl);
  
+    SDValue LogOfMantissa;
      if (LimitFloatPrecision <= 6) {
        // For floating-point precision of 6:
        //
@@ -3847,12 +3834,9 @@ SelectionDAGBuilder::visitLog(const CallInst &I) {
        SDValue t1 = DAG.getNode(ISD::FADD, dl, MVT::f32, t0,
                                 getF32Constant(DAG, 0x3fb3a2b1));
        SDValue t2 = DAG.getNode(ISD::FMUL, dl, MVT::f32, t1, X);
-      SDValue LogOfMantissa = DAG.getNode(ISD::FSUB, dl, MVT::f32, t2,
-                                          getF32Constant(DAG, 0x3f949a29));
-
-      result = DAG.getNode(ISD::FADD, dl,
-                           MVT::f32, LogOfExponent, LogOfMantissa);
-    } else if (LimitFloatPrecision > 6 && LimitFloatPrecision <= 12) {
+      LogOfMantissa = DAG.getNode(ISD::FSUB, dl, MVT::f32, t2,
+                                  getF32Constant(DAG, 0x3f949a29));
+    } else if (LimitFloatPrecision <= 12) {
        // For floating-point precision of 12:
        //
        //   LogOfMantissa =
@@ -3873,12 +3857,9 @@ SelectionDAGBuilder::visitLog(const CallInst &I) {
        SDValue t5 = DAG.getNode(ISD::FADD, dl, MVT::f32, t4,
                                 getF32Constant(DAG, 0x40348e95));
        SDValue t6 = DAG.getNode(ISD::FMUL, dl, MVT::f32, t5, X);
-      SDValue LogOfMantissa = DAG.getNode(ISD::FSUB, dl, MVT::f32, t6,
-                                          getF32Constant(DAG, 0x3fdef31a));
-
-      result = DAG.getNode(ISD::FADD, dl,
-                           MVT::f32, LogOfExponent, LogOfMantissa);
-    } else { // LimitFloatPrecision > 12 && LimitFloatPrecision <= 18
+      LogOfMantissa = DAG.getNode(ISD::FSUB, dl, MVT::f32, t6,
+                                  getF32Constant(DAG, 0x3fdef31a));
+    } else { // LimitFloatPrecision <= 18
        // For floating-point precision of 18:
        //
        //   LogOfMantissa =
@@ -3907,32 +3888,23 @@ SelectionDAGBuilder::visitLog(const CallInst &I) {
        SDValue t9 = DAG.getNode(ISD::FADD, dl, MVT::f32, t8,
                                 getF32Constant(DAG, 0x408797cb));
        SDValue t10 = DAG.getNode(ISD::FMUL, dl, MVT::f32, t9, X);
-      SDValue LogOfMantissa = DAG.getNode(ISD::FSUB, dl, MVT::f32, t10,
-                                          getF32Constant(DAG, 0x4006dcab));
-
-      result = DAG.getNode(ISD::FADD, dl,
-                           MVT::f32, LogOfExponent, LogOfMantissa);
+      LogOfMantissa = DAG.getNode(ISD::FSUB, dl, MVT::f32, t10,
+                                  getF32Constant(DAG, 0x4006dcab));
      }
-  } else {
-    // No special expansion.
-    result = DAG.getNode(ISD::FLOG, dl,
-                         getValue(I.getArgOperand(0)).getValueType(),
-                         getValue(I.getArgOperand(0)));
+
+    return DAG.getNode(ISD::FADD, dl, MVT::f32, LogOfExponent, LogOfMantissa);
    }
  
-  setValue(&I, result);
+  // No special expansion.
+  return DAG.getNode(ISD::FLOG, dl, Op.getValueType(), Op);
  }
  
-/// visitLog2 - Lower a log2 intrinsic. Handles the special sequences for
+/// expandLog2 - Lower a log2 intrinsic. Handles the special sequences for
  /// limited-precision mode.
-void
-SelectionDAGBuilder::visitLog2(const CallInst &I) {
-  SDValue result;
-  DebugLoc dl = getCurDebugLoc();
-
-  if (getValue(I.getArgOperand(0)).getValueType() == MVT::f32 &&
+static SDValue expandLog2(DebugLoc dl, SDValue Op, SelectionDAG &DAG,
+                          const TargetLowering &TLI) {
+  if (Op.getValueType() == MVT::f32 &&
        LimitFloatPrecision > 0 && LimitFloatPrecision <= 18) {
-    SDValue Op = getValue(I.getArgOperand(0));
      SDValue Op1 = DAG.getNode(ISD::BITCAST, dl, MVT::i32, Op);
  
      // Get the exponent.
@@ -3944,6 +3916,7 @@ SelectionDAGBuilder::visitLog2(const CallInst &I) {
  
      // Different possible minimax approximations of significand in
      // floating-point for various degrees of accuracy over [1,2].
+    SDValue Log2ofMantissa;
      if (LimitFloatPrecision <= 6) {
        // For floating-point precision of 6:
        //
@@ -3955,12 +3928,9 @@ SelectionDAGBuilder::visitLog2(const CallInst &I) {
        SDValue t1 = DAG.getNode(ISD::FADD, dl, MVT::f32, t0,
                                 getF32Constant(DAG, 0x40019463));
        SDValue t2 = DAG.getNode(ISD::FMUL, dl, MVT::f32, t1, X);
-      SDValue Log2ofMantissa = DAG.getNode(ISD::FSUB, dl, MVT::f32, t2,
-                                           getF32Constant(DAG, 0x3fd6633d));
-
-      result = DAG.getNode(ISD::FADD, dl,
-                           MVT::f32, LogOfExponent, Log2ofMantissa);
-    } else if (LimitFloatPrecision > 6 && LimitFloatPrecision <= 12) {
+      Log2ofMantissa = DAG.getNode(ISD::FSUB, dl, MVT::f32, t2,
+                                   getF32Constant(DAG, 0x3fd6633d));
+    } else if (LimitFloatPrecision <= 12) {
        // For floating-point precision of 12:
        //
        //   Log2ofMantissa =
@@ -3981,12 +3951,9 @@ SelectionDAGBuilder::visitLog2(const CallInst &I) {
        SDValue t5 = DAG.getNode(ISD::FADD, dl, MVT::f32, t4,
                                 getF32Constant(DAG, 0x40823e2f));
        SDValue t6 = DAG.getNode(ISD::FMUL, dl, MVT::f32, t5, X);
-      SDValue Log2ofMantissa = DAG.getNode(ISD::FSUB, dl, MVT::f32, t6,
-                                           getF32Constant(DAG, 0x4020d29c));
-
-      result = DAG.getNode(ISD::FADD, dl,
-                           MVT::f32, LogOfExponent, Log2ofMantissa);
-    } else { // LimitFloatPrecision > 12 && LimitFloatPrecision <= 18
+      Log2ofMantissa = DAG.getNode(ISD::FSUB, dl, MVT::f32, t6,
+                                   getF32Constant(DAG, 0x4020d29c));
+    } else { // LimitFloatPrecision <= 18
        // For floating-point precision of 18:
        //
        //   Log2ofMantissa =
@@ -4016,32 +3983,23 @@ SelectionDAGBuilder::visitLog2(const CallInst &I) {
        SDValue t9 = DAG.getNode(ISD::FADD, dl, MVT::f32, t8,
                                 getF32Constant(DAG, 0x40c39dad));
        SDValue t10 = DAG.getNode(ISD::FMUL, dl, MVT::f32, t9, X);
-      SDValue Log2ofMantissa = DAG.getNode(ISD::FSUB, dl, MVT::f32, t10,
-                                           getF32Constant(DAG, 0x4042902c));
-
-      result = DAG.getNode(ISD::FADD, dl,
-                           MVT::f32, LogOfExponent, Log2ofMantissa);
+      Log2ofMantissa = DAG.getNode(ISD::FSUB, dl, MVT::f32, t10,
+                                   getF32Constant(DAG, 0x4042902c));
      }
-  } else {
-    // No special expansion.
-    result = DAG.getNode(ISD::FLOG2, dl,
-                         getValue(I.getArgOperand(0)).getValueType(),
-                         getValue(I.getArgOperand(0)));
+
+    return DAG.getNode(ISD::FADD, dl, MVT::f32, LogOfExponent, Log2ofMantissa);
    }
  
-  setValue(&I, result);
+  // No special expansion.
+  return DAG.getNode(ISD::FLOG2, dl, Op.getValueType(), Op);
  }
  
-/// visitLog10 - Lower a log10 intrinsic. Handles the special sequences for
+/// expandLog10 - Lower a log10 intrinsic. Handles the special sequences for
  /// limited-precision mode.
-void
-SelectionDAGBuilder::visitLog10(const CallInst &I) {
-  SDValue result;
-  DebugLoc dl = getCurDebugLoc();
-
-  if (getValue(I.getArgOperand(0)).getValueType() == MVT::f32 &&
+static SDValue expandLog10(DebugLoc dl, SDValue Op, SelectionDAG &DAG,
+                           const TargetLowering &TLI) {
+  if (Op.getValueType() == MVT::f32 &&
        LimitFloatPrecision > 0 && LimitFloatPrecision <= 18) {
-    SDValue Op = getValue(I.getArgOperand(0));
      SDValue Op1 = DAG.getNode(ISD::BITCAST, dl, MVT::i32, Op);
  
      // Scale the exponent by log10(2) [0.30102999f].
@@ -4053,6 +4011,7 @@ SelectionDAGBuilder::visitLog10(const CallInst &I) {
      // exponent of 1.
      SDValue X = GetSignificand(DAG, Op1, dl);
  
+    SDValue Log10ofMantissa;
      if (LimitFloatPrecision <= 6) {
        // For floating-point precision of 6:
        //
@@ -4066,12 +4025,9 @@ SelectionDAGBuilder::visitLog10(const CallInst &I) {
        SDValue t1 = DAG.getNode(ISD::FADD, dl, MVT::f32, t0,
                                 getF32Constant(DAG, 0x3f1c0789));
        SDValue t2 = DAG.getNode(ISD::FMUL, dl, MVT::f32, t1, X);
-      SDValue Log10ofMantissa = DAG.getNode(ISD::FSUB, dl, MVT::f32, t2,
-                                            getF32Constant(DAG, 0x3f011300));
-
-      result = DAG.getNode(ISD::FADD, dl,
-                           MVT::f32, LogOfExponent, Log10ofMantissa);
-    } else if (LimitFloatPrecision > 6 && LimitFloatPrecision <= 12) {
+      Log10ofMantissa = DAG.getNode(ISD::FSUB, dl, MVT::f32, t2,
+                                    getF32Constant(DAG, 0x3f011300));
+    } else if (LimitFloatPrecision <= 12) {
        // For floating-point precision of 12:
        //
        //   Log10ofMantissa =
@@ -4088,12 +4044,9 @@ SelectionDAGBuilder::visitLog10(const CallInst &I) {
        SDValue t3 = DAG.getNode(ISD::FADD, dl, MVT::f32, t2,
                                 getF32Constant(DAG, 0x3f6ae232));
        SDValue t4 = DAG.getNode(ISD::FMUL, dl, MVT::f32, t3, X);
-      SDValue Log10ofMantissa = DAG.getNode(ISD::FSUB, dl, MVT::f32, t4,
-                                            getF32Constant(DAG, 0x3f25f7c3));
-
-      result = DAG.getNode(ISD::FADD, dl,
-                           MVT::f32, LogOfExponent, Log10ofMantissa);
-    } else { // LimitFloatPrecision > 12 && LimitFloatPrecision <= 18
+      Log10ofMantissa = DAG.getNode(ISD::FSUB, dl, MVT::f32, t4,
+                                    getF32Constant(DAG, 0x3f25f7c3));
+    } else { // LimitFloatPrecision <= 18
        // For floating-point precision of 18:
        //
        //   Log10ofMantissa =
@@ -4118,33 +4071,23 @@ SelectionDAGBuilder::visitLog10(const CallInst &I) {
        SDValue t7 = DAG.getNode(ISD::FADD, dl, MVT::f32, t6,
                                 getF32Constant(DAG, 0x3fc4316c));
        SDValue t8 = DAG.getNode(ISD::FMUL, dl, MVT::f32, t7, X);
-      SDValue Log10ofMantissa = DAG.getNode(ISD::FSUB, dl, MVT::f32, t8,
-                                            getF32Constant(DAG, 0x3f57ce70));
-
-      result = DAG.getNode(ISD::FADD, dl,
-                           MVT::f32, LogOfExponent, Log10ofMantissa);
+      Log10ofMantissa = DAG.getNode(ISD::FSUB, dl, MVT::f32, t8,
+                                    getF32Constant(DAG, 0x3f57ce70));
      }
-  } else {
-    // No special expansion.
-    result = DAG.getNode(ISD::FLOG10, dl,
-                         getValue(I.getArgOperand(0)).getValueType(),
-                         getValue(I.getArgOperand(0)));
+
+    return DAG.getNode(ISD::FADD, dl, MVT::f32, LogOfExponent, Log10ofMantissa);
    }
  
-  setValue(&I, result);
+  // No special expansion.
+  return DAG.getNode(ISD::FLOG10, dl, Op.getValueType(), Op);
  }
  
-/// visitExp2 - Lower an exp2 intrinsic. Handles the special sequences for
+/// expandExp2 - Lower an exp2 intrinsic. Handles the special sequences for
  /// limited-precision mode.
-void
-SelectionDAGBuilder::visitExp2(const CallInst &I) {
-  SDValue result;
-  DebugLoc dl = getCurDebugLoc();
-
-  if (getValue(I.getArgOperand(0)).getValueType() == MVT::f32 &&
+static SDValue expandExp2(DebugLoc dl, SDValue Op, SelectionDAG &DAG,
+                          const TargetLowering &TLI) {
+  if (Op.getValueType() == MVT::f32 &&
        LimitFloatPrecision > 0 && LimitFloatPrecision <= 18) {
-    SDValue Op = getValue(I.getArgOperand(0));
-
      SDValue IntegerPartOfX = DAG.getNode(ISD::FP_TO_SINT, dl, MVT::i32, Op);
  
      //   FractionalPartOfX = x - (float)IntegerPartOfX;
@@ -4155,6 +4098,7 @@ SelectionDAGBuilder::visitExp2(const CallInst &I) {
      IntegerPartOfX = DAG.getNode(ISD::SHL, dl, MVT::i32, IntegerPartOfX,
                                   DAG.getConstant(23, TLI.getPointerTy()));
  
+    SDValue TwoToFractionalPartOfX;
      if (LimitFloatPrecision <= 6) {
        // For floating-point precision of 6:
        //
@@ -4168,15 +4112,9 @@ SelectionDAGBuilder::visitExp2(const CallInst &I) {
        SDValue t3 = DAG.getNode(ISD::FADD, dl, MVT::f32, t2,
                                 getF32Constant(DAG, 0x3f3c50c8));
        SDValue t4 = DAG.getNode(ISD::FMUL, dl, MVT::f32, t3, X);
-      SDValue t5 = DAG.getNode(ISD::FADD, dl, MVT::f32, t4,
-                               getF32Constant(DAG, 0x3f7f5e7e));
-      SDValue t6 = DAG.getNode(ISD::BITCAST, dl, MVT::i32, t5);
-      SDValue TwoToFractionalPartOfX =
-        DAG.getNode(ISD::ADD, dl, MVT::i32, t6, IntegerPartOfX);
-
-      result = DAG.getNode(ISD::BITCAST, dl,
-                           MVT::f32, TwoToFractionalPartOfX);
-    } else if (LimitFloatPrecision > 6 && LimitFloatPrecision <= 12) {
+      TwoToFractionalPartOfX = DAG.getNode(ISD::FADD, dl, MVT::f32, t4,
+                                           getF32Constant(DAG, 0x3f7f5e7e));
+    } else if (LimitFloatPrecision <= 12) {
        // For floating-point precision of 12:
        //
        //   TwoToFractionalPartOfX =
@@ -4193,15 +4131,9 @@ SelectionDAGBuilder::visitExp2(const CallInst &I) {
        SDValue t5 = DAG.getNode(ISD::FADD, dl, MVT::f32, t4,
                                 getF32Constant(DAG, 0x3f324b07));
        SDValue t6 = DAG.getNode(ISD::FMUL, dl, MVT::f32, t5, X);
-      SDValue t7 = DAG.getNode(ISD::FADD, dl, MVT::f32, t6,
-                               getF32Constant(DAG, 0x3f7ff8fd));
-      SDValue t8 = DAG.getNode(ISD::BITCAST, dl, MVT::i32, t7);
-      SDValue TwoToFractionalPartOfX =
-        DAG.getNode(ISD::ADD, dl, MVT::i32, t8, IntegerPartOfX);
-
-      result = DAG.getNode(ISD::BITCAST, dl,
-                           MVT::f32, TwoToFractionalPartOfX);
-    } else { // LimitFloatPrecision > 12 && LimitFloatPrecision <= 18
+      TwoToFractionalPartOfX = DAG.getNode(ISD::FADD, dl, MVT::f32, t6,
+                                           getF32Constant(DAG, 0x3f7ff8fd));
+    } else { // LimitFloatPrecision <= 18
        // For floating-point precision of 18:
        //
        //   TwoToFractionalPartOfX =
@@ -4229,54 +4161,42 @@ SelectionDAGBuilder::visitExp2(const CallInst &I) {
        SDValue t11 = DAG.getNode(ISD::FADD, dl, MVT::f32, t10,
                                  getF32Constant(DAG, 0x3f317234));
        SDValue t12 = DAG.getNode(ISD::FMUL, dl, MVT::f32, t11, X);
-      SDValue t13 = DAG.getNode(ISD::FADD, dl, MVT::f32, t12,
-                                getF32Constant(DAG, 0x3f800000));
-      SDValue t14 = DAG.getNode(ISD::BITCAST, dl, MVT::i32, t13);
-      SDValue TwoToFractionalPartOfX =
-        DAG.getNode(ISD::ADD, dl, MVT::i32, t14, IntegerPartOfX);
-
-      result = DAG.getNode(ISD::BITCAST, dl,
-                           MVT::f32, TwoToFractionalPartOfX);
+      TwoToFractionalPartOfX = DAG.getNode(ISD::FADD, dl, MVT::f32, t12,
+                                           getF32Constant(DAG, 0x3f800000));
      }
-  } else {
-    // No special expansion.
-    result = DAG.getNode(ISD::FEXP2, dl,
-                         getValue(I.getArgOperand(0)).getValueType(),
-                         getValue(I.getArgOperand(0)));
+
+    // Add the exponent into the result in integer domain.
+    SDValue t13 = DAG.getNode(ISD::BITCAST, dl, MVT::i32,
+                              TwoToFractionalPartOfX);
+    return DAG.getNode(ISD::BITCAST, dl, MVT::f32,
+                       DAG.getNode(ISD::ADD, dl, MVT::i32,
+                                   t13, IntegerPartOfX));
    }
  
-  setValue(&I, result);
+  // No special expansion.
+  return DAG.getNode(ISD::FEXP2, dl, Op.getValueType(), Op);
  }
  
-/// visitPow - Lower a pow intrinsic. Handles the special sequences for
+/// expandPow - Lower a pow intrinsic. Handles the special sequences for
  /// limited-precision mode with x == 10.0f.
-void
-SelectionDAGBuilder::visitPow(const CallInst &I) {
-  SDValue result;
-  const Value *Val = I.getArgOperand(0);
-  DebugLoc dl = getCurDebugLoc();
+static SDValue expandPow(DebugLoc dl, SDValue LHS, SDValue RHS,
+                         SelectionDAG &DAG, const TargetLowering &TLI) {
    bool IsExp10 = false;
-
-  if (getValue(Val).getValueType() == MVT::f32 &&
-      getValue(I.getArgOperand(1)).getValueType() == MVT::f32 &&
+  if (LHS.getValueType() == MVT::f32 && RHS.getValueType() == MVT::f32 &&
        LimitFloatPrecision > 0 && LimitFloatPrecision <= 18) {
-    if (Constant *C = const_cast<Constant*>(dyn_cast<Constant>(Val))) {
-      if (ConstantFP *CFP = dyn_cast<ConstantFP>(C)) {
-        APFloat Ten(10.0f);
-        IsExp10 = CFP->getValueAPF().bitwiseIsEqual(Ten);
-      }
+    if (ConstantFPSDNode *LHSC = dyn_cast<ConstantFPSDNode>(LHS)) {
+      APFloat Ten(10.0f);
+      IsExp10 = LHSC->isExactlyValue(Ten);
      }
    }
  
-  if (IsExp10 && LimitFloatPrecision > 0 && LimitFloatPrecision <= 18) {
-    SDValue Op = getValue(I.getArgOperand(1));
-
+  if (IsExp10) {
      // Put the exponent in the right bit position for later addition to the
      // final result:
      //
      //   #define LOG2OF10 3.3219281f
      //   IntegerPartOfX = (int32_t)(x * LOG2OF10);
-    SDValue t0 = DAG.getNode(ISD::FMUL, dl, MVT::f32, Op,
+    SDValue t0 = DAG.getNode(ISD::FMUL, dl, MVT::f32, RHS,
                               getF32Constant(DAG, 0x40549a78));
      SDValue IntegerPartOfX = DAG.getNode(ISD::FP_TO_SINT, dl, MVT::i32, t0);
  
@@ -4288,6 +4208,7 @@ SelectionDAGBuilder::visitPow(const CallInst &I) {
      IntegerPartOfX = DAG.getNode(ISD::SHL, dl, MVT::i32, IntegerPartOfX,
                                   DAG.getConstant(23, TLI.getPointerTy()));
  
+    SDValue TwoToFractionalPartOfX;
      if (LimitFloatPrecision <= 6) {
        // For floating-point precision of 6:
        //
@@ -4301,15 +4222,9 @@ SelectionDAGBuilder::visitPow(const CallInst &I) {
        SDValue t3 = DAG.getNode(ISD::FADD, dl, MVT::f32, t2,
                                 getF32Constant(DAG, 0x3f3c50c8));
        SDValue t4 = DAG.getNode(ISD::FMUL, dl, MVT::f32, t3, X);
-      SDValue t5 = DAG.getNode(ISD::FADD, dl, MVT::f32, t4,
-                               getF32Constant(DAG, 0x3f7f5e7e));
-      SDValue t6 = DAG.getNode(ISD::BITCAST, dl, MVT::i32, t5);
-      SDValue TwoToFractionalPartOfX =
-        DAG.getNode(ISD::ADD, dl, MVT::i32, t6, IntegerPartOfX);
-
-      result = DAG.getNode(ISD::BITCAST, dl,
-                           MVT::f32, TwoToFractionalPartOfX);
-    } else if (LimitFloatPrecision > 6 && LimitFloatPrecision <= 12) {
+      TwoToFractionalPartOfX = DAG.getNode(ISD::FADD, dl, MVT::f32, t4,
+                                           getF32Constant(DAG, 0x3f7f5e7e));
+    } else if (LimitFloatPrecision <= 12) {
        // For floating-point precision of 12:
        //
        //   TwoToFractionalPartOfX =
@@ -4326,15 +4241,9 @@ SelectionDAGBuilder::visitPow(const CallInst &I) {
        SDValue t5 = DAG.getNode(ISD::FADD, dl, MVT::f32, t4,
                                 getF32Constant(DAG, 0x3f324b07));
        SDValue t6 = DAG.getNode(ISD::FMUL, dl, MVT::f32, t5, X);
-      SDValue t7 = DAG.getNode(ISD::FADD, dl, MVT::f32, t6,
-                               getF32Constant(DAG, 0x3f7ff8fd));
-      SDValue t8 = DAG.getNode(ISD::BITCAST, dl, MVT::i32, t7);
-      SDValue TwoToFractionalPartOfX =
-        DAG.getNode(ISD::ADD, dl, MVT::i32, t8, IntegerPartOfX);
-
-      result = DAG.getNode(ISD::BITCAST, dl,
-                           MVT::f32, TwoToFractionalPartOfX);
-    } else { // LimitFloatPrecision > 12 && LimitFloatPrecision <= 18
+      TwoToFractionalPartOfX = DAG.getNode(ISD::FADD, dl, MVT::f32, t6,
+                                           getF32Constant(DAG, 0x3f7ff8fd));
+    } else { // LimitFloatPrecision <= 18
        // For floating-point precision of 18:
        //
        //   TwoToFractionalPartOfX =
@@ -4362,24 +4271,18 @@ SelectionDAGBuilder::visitPow(const CallInst &I) {
        SDValue t11 = DAG.getNode(ISD::FADD, dl, MVT::f32, t10,
                                  getF32Constant(DAG, 0x3f317234));
        SDValue t12 = DAG.getNode(ISD::FMUL, dl, MVT::f32, t11, X);
-      SDValue t13 = DAG.getNode(ISD::FADD, dl, MVT::f32, t12,
-                                getF32Constant(DAG, 0x3f800000));
-      SDValue t14 = DAG.getNode(ISD::BITCAST, dl, MVT::i32, t13);
-      SDValue TwoToFractionalPartOfX =
-        DAG.getNode(ISD::ADD, dl, MVT::i32, t14, IntegerPartOfX);
-
-      result = DAG.getNode(ISD::BITCAST, dl,
-                           MVT::f32, TwoToFractionalPartOfX);
+      TwoToFractionalPartOfX = DAG.getNode(ISD::FADD, dl, MVT::f32, t12,
+                                           getF32Constant(DAG, 0x3f800000));
      }
-  } else {
-    // No special expansion.
-    result = DAG.getNode(ISD::FPOW, dl,
-                         getValue(I.getArgOperand(0)).getValueType(),
-                         getValue(I.getArgOperand(0)),
-                         getValue(I.getArgOperand(1)));
+
+    SDValue t13 = DAG.getNode(ISD::BITCAST, dl,MVT::i32,TwoToFractionalPartOfX);
+    return DAG.getNode(ISD::BITCAST, dl, MVT::f32,
+                       DAG.getNode(ISD::ADD, dl, MVT::i32,
+                                   t13, IntegerPartOfX));
    }
  
-  setValue(&I, result);
+  // No special expansion.
+  return DAG.getNode(ISD::FPOW, dl, LHS.getValueType(), LHS, RHS);
  }
  
  
@@ -4400,7 +4303,8 @@ static SDValue ExpandPowI(DebugLoc DL, SDValue LHS, SDValue RHS,
        return DAG.getConstantFP(1.0, LHS.getValueType());
  
      const Function *F = DAG.getMachineFunction().getFunction();
-    if (!F->getFnAttributes().hasOptimizeForSizeAttr() ||
+    if (!F->getAttributes().hasAttribute(AttributeSet::FunctionIndex,
+                                         Attribute::OptimizeForSize) ||
          // If optimizing for size, don't insert too many multiplies.  This
          // inserts up to 5 multiplies.
          CountPopulation_32(Val)+Log2_32(Val) < 7) {
@@ -4566,6 +4470,8 @@ SelectionDAGBuilder::visitIntrinsicCall(const CallInst &I, unsigned Intrinsic) {
      SDValue Op2 = getValue(I.getArgOperand(1));
      SDValue Op3 = getValue(I.getArgOperand(2));
      unsigned Align = cast<ConstantInt>(I.getArgOperand(3))->getZExtValue();
+    if (!Align)
+      Align = 1; // @llvm.memcpy defines 0 and 1 to both mean no alignment.
      bool isVol = cast<ConstantInt>(I.getArgOperand(4))->getZExtValue();
      DAG.setRoot(DAG.getMemcpy(getRoot(), dl, Op1, Op2, Op3, Align, isVol, false,
                                MachinePointerInfo(I.getArgOperand(0)),
@@ -4582,6 +4488,8 @@ SelectionDAGBuilder::visitIntrinsicCall(const CallInst &I, unsigned Intrinsic) {
      SDValue Op2 = getValue(I.getArgOperand(1));
      SDValue Op3 = getValue(I.getArgOperand(2));
      unsigned Align = cast<ConstantInt>(I.getArgOperand(3))->getZExtValue();
+    if (!Align)
+      Align = 1; // @llvm.memset defines 0 and 1 to both mean no alignment.
      bool isVol = cast<ConstantInt>(I.getArgOperand(4))->getZExtValue();
      DAG.setRoot(DAG.getMemset(getRoot(), dl, Op1, Op2, Op3, Align, isVol,
                                MachinePointerInfo(I.getArgOperand(0))));
@@ -4599,6 +4507,8 @@ SelectionDAGBuilder::visitIntrinsicCall(const CallInst &I, unsigned Intrinsic) {
      SDValue Op2 = getValue(I.getArgOperand(1));
      SDValue Op3 = getValue(I.getArgOperand(2));
      unsigned Align = cast<ConstantInt>(I.getArgOperand(3))->getZExtValue();
+    if (!Align)
+      Align = 1; // @llvm.memmove defines 0 and 1 to both mean no alignment.
      bool isVol = cast<ConstantInt>(I.getArgOperand(4))->getZExtValue();
      DAG.setRoot(DAG.getMemmove(getRoot(), dl, Op1, Op2, Op3, Align, isVol,
                                 MachinePointerInfo(I.getArgOperand(0)),
@@ -4873,7 +4783,6 @@ SelectionDAGBuilder::visitIntrinsicCall(const CallInst &I, unsigned Intrinsic) {
      // the sse2/mmx shift instructions reads 64 bits. Set the upper 32 bits
      // to be zero.
      // We must do this early because v2i32 is not a legal type.
-    DebugLoc dl = getCurDebugLoc();
      SDValue ShOps[2];
      ShOps[0] = ShAmt;
      ShOps[1] = DAG.getConstant(0, MVT::i32);
@@ -4890,7 +4799,6 @@ SelectionDAGBuilder::visitIntrinsicCall(const CallInst &I, unsigned Intrinsic) {
    case Intrinsic::x86_avx_vinsertf128_ps_256:
    case Intrinsic::x86_avx_vinsertf128_si_256:
    case Intrinsic::x86_avx2_vinserti128: {
-    DebugLoc dl = getCurDebugLoc();
      EVT DestVT = TLI.getValueType(I.getType());
      EVT ElVT = TLI.getValueType(I.getArgOperand(1)->getType());
      uint64_t Idx = (cast<ConstantInt>(I.getArgOperand(2))->getZExtValue() & 1) *
@@ -4906,7 +4814,6 @@ SelectionDAGBuilder::visitIntrinsicCall(const CallInst &I, unsigned Intrinsic) {
    case Intrinsic::x86_avx_vextractf128_ps_256:
    case Intrinsic::x86_avx_vextractf128_si_256:
    case Intrinsic::x86_avx2_vextracti128: {
-    DebugLoc dl = getCurDebugLoc();
      EVT DestVT = TLI.getValueType(I.getType());
      uint64_t Idx = (cast<ConstantInt>(I.getArgOperand(1))->getZExtValue() & 1) *
                     DestVT.getVectorNumElements();
@@ -4940,7 +4847,7 @@ SelectionDAGBuilder::visitIntrinsicCall(const CallInst &I, unsigned Intrinsic) {
      }
      EVT DestVT = TLI.getValueType(I.getType());
      const Value *Op1 = I.getArgOperand(0);
-    Res = DAG.getConvertRndSat(DestVT, getCurDebugLoc(), getValue(Op1),
+    Res = DAG.getConvertRndSat(DestVT, dl, getValue(Op1),
                                 DAG.getValueType(DestVT),
                                 DAG.getValueType(getValue(Op1).getValueType()),
                                 getValue(I.getArgOperand(1)),
@@ -4949,53 +4856,57 @@ SelectionDAGBuilder::visitIntrinsicCall(const CallInst &I, unsigned Intrinsic) {
      setValue(&I, Res);
      return 0;
    }
-  case Intrinsic::sqrt:
-    setValue(&I, DAG.getNode(ISD::FSQRT, dl,
-                             getValue(I.getArgOperand(0)).getValueType(),
-                             getValue(I.getArgOperand(0))));
-    return 0;
    case Intrinsic::powi:
      setValue(&I, ExpandPowI(dl, getValue(I.getArgOperand(0)),
                              getValue(I.getArgOperand(1)), DAG));
      return 0;
-  case Intrinsic::sin:
-    setValue(&I, DAG.getNode(ISD::FSIN, dl,
-                             getValue(I.getArgOperand(0)).getValueType(),
-                             getValue(I.getArgOperand(0))));
-    return 0;
-  case Intrinsic::cos:
-    setValue(&I, DAG.getNode(ISD::FCOS, dl,
-                             getValue(I.getArgOperand(0)).getValueType(),
-                             getValue(I.getArgOperand(0))));
-    return 0;
    case Intrinsic::log:
-    visitLog(I);
+    setValue(&I, expandLog(dl, getValue(I.getArgOperand(0)), DAG, TLI));
      return 0;
    case Intrinsic::log2:
-    visitLog2(I);
+    setValue(&I, expandLog2(dl, getValue(I.getArgOperand(0)), DAG, TLI));
      return 0;
    case Intrinsic::log10:
-    visitLog10(I);
+    setValue(&I, expandLog10(dl, getValue(I.getArgOperand(0)), DAG, TLI));
      return 0;
    case Intrinsic::exp:
-    visitExp(I);
+    setValue(&I, expandExp(dl, getValue(I.getArgOperand(0)), DAG, TLI));
      return 0;
    case Intrinsic::exp2:
-    visitExp2(I);
+    setValue(&I, expandExp2(dl, getValue(I.getArgOperand(0)), DAG, TLI));
      return 0;
    case Intrinsic::pow:
-    visitPow(I);
+    setValue(&I, expandPow(dl, getValue(I.getArgOperand(0)),
+                           getValue(I.getArgOperand(1)), DAG, TLI));
      return 0;
+  case Intrinsic::sqrt:
    case Intrinsic::fabs:
-    setValue(&I, DAG.getNode(ISD::FABS, dl,
-                             getValue(I.getArgOperand(0)).getValueType(),
-                             getValue(I.getArgOperand(0))));
-    return 0;
+  case Intrinsic::sin:
+  case Intrinsic::cos:
    case Intrinsic::floor:
-    setValue(&I, DAG.getNode(ISD::FFLOOR, dl,
+  case Intrinsic::ceil:
+  case Intrinsic::trunc:
+  case Intrinsic::rint:
+  case Intrinsic::nearbyint: {
+    unsigned Opcode;
+    switch (Intrinsic) {
+    default: llvm_unreachable("Impossible intrinsic");  // Can't reach here.
+    case Intrinsic::sqrt:      Opcode = ISD::FSQRT;      break;
+    case Intrinsic::fabs:      Opcode = ISD::FABS;       break;
+    case Intrinsic::sin:       Opcode = ISD::FSIN;       break;
+    case Intrinsic::cos:       Opcode = ISD::FCOS;       break;
+    case Intrinsic::floor:     Opcode = ISD::FFLOOR;     break;
+    case Intrinsic::ceil:      Opcode = ISD::FCEIL;      break;
+    case Intrinsic::trunc:     Opcode = ISD::FTRUNC;     break;
+    case Intrinsic::rint:      Opcode = ISD::FRINT;      break;
+    case Intrinsic::nearbyint: Opcode = ISD::FNEARBYINT; break;
+    }
+
+    setValue(&I, DAG.getNode(Opcode, dl,
                               getValue(I.getArgOperand(0)).getValueType(),
                               getValue(I.getArgOperand(0))));
      return 0;
+  }
    case Intrinsic::fma:
      setValue(&I, DAG.getNode(ISD::FMA, dl,
                               getValue(I.getArgOperand(0)).getValueType(),
@@ -5006,7 +4917,6 @@ SelectionDAGBuilder::visitIntrinsicCall(const CallInst &I, unsigned Intrinsic) {
    case Intrinsic::fmuladd: {
      EVT VT = TLI.getValueType(I.getType());
      if (TM.Options.AllowFPOpFusion != FPOpFusion::Strict &&
-        TLI.isOperationLegal(ISD::FMA, VT) &&
          TLI.isFMAFasterThanMulAndAdd(VT)){
        setValue(&I, DAG.getNode(ISD::FMA, dl,
                                 getValue(I.getArgOperand(0)).getValueType(),
@@ -5103,7 +5013,7 @@ SelectionDAGBuilder::visitIntrinsicCall(const CallInst &I, unsigned Intrinsic) {
      SDValue FIN = DAG.getFrameIndex(FI, PtrTy);
  
      // Store the stack protector onto the stack.
-    Res = DAG.getStore(getRoot(), getCurDebugLoc(), Src, FIN,
+    Res = DAG.getStore(getRoot(), dl, Src, FIN,
                         MachinePointerInfo::getFixedStack(FI),
                         true, false, 0);
      setValue(&I, Res);
@@ -5127,6 +5037,11 @@ SelectionDAGBuilder::visitIntrinsicCall(const CallInst &I, unsigned Intrinsic) {
      setValue(&I, Res);
      return 0;
    }
+  case Intrinsic::annotation:
+  case Intrinsic::ptr_annotation:
+    // Drop the intrinsic, but forward the value
+    setValue(&I, getValue(I.getOperand(0)));
+    return 0;
    case Intrinsic::var_annotation:
      // Discard annotate attributes
      return 0;
@@ -5175,10 +5090,13 @@ SelectionDAGBuilder::visitIntrinsicCall(const CallInst &I, unsigned Intrinsic) {
      return 0;
    }
  
+  case Intrinsic::debugtrap:
    case Intrinsic::trap: {
      StringRef TrapFuncName = TM.Options.getTrapFunctionName();
      if (TrapFuncName.empty()) {
-      DAG.setRoot(DAG.getNode(ISD::TRAP, dl,MVT::Other, getRoot()));
+      ISD::NodeType Op = (Intrinsic == Intrinsic::trap) ? 
+        ISD::TRAP : ISD::DEBUGTRAP;
+      DAG.setRoot(DAG.getNode(Op, dl,MVT::Other, getRoot()));
        return 0;
      }
      TargetLowering::ArgListTy Args;
@@ -5188,15 +5106,12 @@ SelectionDAGBuilder::visitIntrinsicCall(const CallInst &I, unsigned Intrinsic) {
                   /*isTailCall=*/false,
                   /*doesNotRet=*/false, /*isReturnValueUsed=*/true,
                   DAG.getExternalSymbol(TrapFuncName.data(), TLI.getPointerTy()),
-                 Args, DAG, getCurDebugLoc());
+                 Args, DAG, dl);
      std::pair<SDValue, SDValue> Result = TLI.LowerCallTo(CLI);
      DAG.setRoot(Result.second);
      return 0;
    }
-  case Intrinsic::debugtrap: {
-    DAG.setRoot(DAG.getNode(ISD::DEBUGTRAP, dl,MVT::Other, getRoot()));
-    return 0;
-  }
+
    case Intrinsic::uadd_with_overflow:
    case Intrinsic::sadd_with_overflow:
    case Intrinsic::usub_with_overflow:
@@ -5217,7 +5132,7 @@ SelectionDAGBuilder::visitIntrinsicCall(const CallInst &I, unsigned Intrinsic) {
      SDValue Op2 = getValue(I.getArgOperand(1));
  
      SDVTList VTs = DAG.getVTList(Op1.getValueType(), MVT::i1);
-    setValue(&I, DAG.getNode(Op, getCurDebugLoc(), VTs, Op1, Op2));
+    setValue(&I, DAG.getNode(Op, dl, VTs, Op1, Op2));
      return 0;
    }
    case Intrinsic::prefetch: {
@@ -5267,6 +5182,7 @@ SelectionDAGBuilder::visitIntrinsicCall(const CallInst &I, unsigned Intrinsic) {
        Res = DAG.getNode(Opcode, dl, MVT::Other, Ops, 2);
        DAG.setRoot(Res);
      }
+    return 0;
    }
    case Intrinsic::invariant_start:
      // Discard region information.
@@ -5296,8 +5212,7 @@ void SelectionDAGBuilder::LowerCallTo(ImmutableCallSite CS, SDValue Callee,
  
    // Check whether the function can return without sret-demotion.
    SmallVector<ISD::OutputArg, 4> Outs;
-  GetReturnInfo(RetTy, CS.getAttributes().getRetAttributes(),
-                Outs, TLI);
+  GetReturnInfo(RetTy, CS.getAttributes(), Outs, TLI);
  
    bool CanLowerReturn = TLI.CanLowerReturn(CS.getCallingConv(),
                                             DAG.getMachineFunction(),
@@ -5325,6 +5240,7 @@ void SelectionDAGBuilder::LowerCallTo(ImmutableCallSite CS, SDValue Callee,
      Entry.isSRet = true;
      Entry.isNest = false;
      Entry.isByVal = false;
+    Entry.isReturned = false;
      Entry.Alignment = Align;
      Args.push_back(Entry);
      RetTy = Type::getVoidTy(FTy->getContext());
@@ -5342,13 +5258,14 @@ void SelectionDAGBuilder::LowerCallTo(ImmutableCallSite CS, SDValue Callee,
      Entry.Node = ArgNode; Entry.Ty = V->getType();
  
      unsigned attrInd = i - CS.arg_begin() + 1;
-    Entry.isSExt  = CS.paramHasSExtAttr(attrInd);
-    Entry.isZExt  = CS.paramHasZExtAttr(attrInd);
-    Entry.isInReg = CS.paramHasInRegAttr(attrInd);
-    Entry.isSRet  = CS.paramHasStructRetAttr(attrInd);
-    Entry.isNest  = CS.paramHasNestAttr(attrInd);
-    Entry.isByVal = CS.paramHasByValAttr(attrInd);
-    Entry.Alignment = CS.getParamAlignment(attrInd);
+    Entry.isSExt     = CS.paramHasAttr(attrInd, Attribute::SExt);
+    Entry.isZExt     = CS.paramHasAttr(attrInd, Attribute::ZExt);
+    Entry.isInReg    = CS.paramHasAttr(attrInd, Attribute::InReg);
+    Entry.isSRet     = CS.paramHasAttr(attrInd, Attribute::StructRet);
+    Entry.isNest     = CS.paramHasAttr(attrInd, Attribute::Nest);
+    Entry.isByVal    = CS.paramHasAttr(attrInd, Attribute::ByVal);
+    Entry.isReturned = CS.paramHasAttr(attrInd, Attribute::Returned);
+    Entry.Alignment  = CS.getParamAlignment(attrInd);
      Args.push_back(Entry);
    }
  
@@ -5376,13 +5293,7 @@ void SelectionDAGBuilder::LowerCallTo(ImmutableCallSite CS, SDValue Callee,
  
    // Check if target-independent constraints permit a tail call here.
    // Target-dependent constraints are checked within TLI.LowerCallTo.
-  if (isTailCall &&
-      !isInTailCallPosition(CS, CS.getAttributes().getRetAttributes(), TLI))
-    isTailCall = false;
-
-  // If there's a possibility that fast-isel has already selected some amount
-  // of the current basic block, don't emit a tail call.
-  if (isTailCall && TM.Options.EnableFastISel)
+  if (isTailCall && !isInTailCallPosition(CS, TLI))
      isTailCall = false;
  
    TargetLowering::
@@ -5856,7 +5767,7 @@ static void GetRegistersForValue(SelectionDAG &DAG,
        // Try to convert to the first EVT that the reg class contains.  If the
        // types are identical size, use a bitcast to convert (e.g. two differing
        // vector types).
-      EVT RegVT = *PhysReg.second->vt_begin();
+      MVT RegVT = *PhysReg.second->vt_begin();
        if (RegVT.getSizeInBits() == OpInfo.ConstraintVT.getSizeInBits()) {
          OpInfo.CallOperand = DAG.getNode(ISD::BITCAST, DL,
                                           RegVT, OpInfo.CallOperand);
@@ -5866,8 +5777,7 @@ static void GetRegistersForValue(SelectionDAG &DAG,
          // bitcast to the corresponding integer type.  This turns an f64 value
          // into i64, which can be passed with two i32 values on a 32-bit
          // machine.
-        RegVT = EVT::getIntegerVT(Context,
-                                  OpInfo.ConstraintVT.getSizeInBits());
+        RegVT = MVT::getIntegerVT(OpInfo.ConstraintVT.getSizeInBits());
          OpInfo.CallOperand = DAG.getNode(ISD::BITCAST, DL,
                                           RegVT, OpInfo.CallOperand);
          OpInfo.ConstraintVT = RegVT;
@@ -5877,7 +5787,7 @@ static void GetRegistersForValue(SelectionDAG &DAG,
      NumRegs = TLI.getNumRegisters(Context, OpInfo.ConstraintVT);
    }
  
-  EVT RegVT;
+  MVT RegVT;
    EVT ValueVT = OpInfo.ConstraintVT;
  
    // If this is a constraint for a specific physical register, like {r17},
@@ -5951,7 +5861,7 @@ void SelectionDAGBuilder::visitInlineAsm(ImmutableCallSite CS) {
      ConstraintOperands.push_back(SDISelAsmOperandInfo(TargetConstraints[i]));
      SDISelAsmOperandInfo &OpInfo = ConstraintOperands.back();
  
-    EVT OpVT = MVT::Other;
+    MVT OpVT = MVT::Other;
  
      // Compute the value type for each operand.
      switch (OpInfo.Type) {
@@ -5966,10 +5876,10 @@ void SelectionDAGBuilder::visitInlineAsm(ImmutableCallSite CS) {
        // corresponding argument.
        assert(!CS.getType()->isVoidTy() && "Bad inline asm!");
        if (StructType *STy = dyn_cast<StructType>(CS.getType())) {
-        OpVT = TLI.getValueType(STy->getElementType(ResNo));
+        OpVT = TLI.getSimpleValueType(STy->getElementType(ResNo));
        } else {
          assert(ResNo == 0 && "Asm only has one result!");
-        OpVT = TLI.getValueType(CS.getType());
+        OpVT = TLI.getSimpleValueType(CS.getType());
        }
        ++ResNo;
        break;
@@ -5990,7 +5900,8 @@ void SelectionDAGBuilder::visitInlineAsm(ImmutableCallSite CS) {
          OpInfo.CallOperand = getValue(OpInfo.CallOperandVal);
        }
  
-      OpVT = OpInfo.getCallOperandValEVT(*DAG.getContext(), TLI, TD);
+      OpVT = OpInfo.getCallOperandValEVT(*DAG.getContext(), TLI, TD).
+        getSimpleVT();
      }
  
      OpInfo.ConstraintVT = OpVT;
@@ -6052,6 +5963,10 @@ void SelectionDAGBuilder::visitInlineAsm(ImmutableCallSite CS) {
      // Compute the constraint code and ConstraintType to use.
      TLI.ComputeConstraintToUse(OpInfo, OpInfo.CallOperand, &DAG);
  
+    if (OpInfo.ConstraintType == TargetLowering::C_Memory &&
+        OpInfo.Type == InlineAsm::isClobber)
+      continue;
+
      // If this is a memory input, and if the operand is not indirect, do what we
      // need to to provide an address for the memory input.
      if (OpInfo.ConstraintType == TargetLowering::C_Memory &&
@@ -6128,7 +6043,8 @@ void SelectionDAGBuilder::visitInlineAsm(ImmutableCallSite CS) {
    const MDNode *SrcLoc = CS.getInstruction()->getMetadata("srcloc");
    AsmNodeOperands.push_back(DAG.getMDNode(SrcLoc));
  
-  // Remember the HasSideEffect, AlignStack and AsmDialect bits as operand 3.
+  // Remember the HasSideEffect, AlignStack, AsmDialect, MayLoad and MayStore
+  // bits as operand 3.
    unsigned ExtraInfo = 0;
    if (IA->hasSideEffects())
      ExtraInfo |= InlineAsm::Extra_HasSideEffects;
@@ -6136,6 +6052,29 @@ void SelectionDAGBuilder::visitInlineAsm(ImmutableCallSite CS) {
      ExtraInfo |= InlineAsm::Extra_IsAlignStack;
    // Set the asm dialect.
    ExtraInfo |= IA->getDialect() * InlineAsm::Extra_AsmDialect;
+
+  // Determine if this InlineAsm MayLoad or MayStore based on the constraints.
+  for (unsigned i = 0, e = TargetConstraints.size(); i != e; ++i) {
+    TargetLowering::AsmOperandInfo &OpInfo = TargetConstraints[i];
+
+    // Compute the constraint code and ConstraintType to use.
+    TLI.ComputeConstraintToUse(OpInfo, SDValue());
+
+    // Ideally, we would only check against memory constraints.  However, the
+    // meaning of an other constraint can be target-specific and we can't easily
+    // reason about it.  Therefore, be conservative and set MayLoad/MayStore
+    // for other constraints as well.
+    if (OpInfo.ConstraintType == TargetLowering::C_Memory ||
+        OpInfo.ConstraintType == TargetLowering::C_Other) {
+      if (OpInfo.Type == InlineAsm::isInput)
+        ExtraInfo |= InlineAsm::Extra_MayLoad;
+      else if (OpInfo.Type == InlineAsm::isOutput)
+        ExtraInfo |= InlineAsm::Extra_MayStore;
+      else if (OpInfo.Type == InlineAsm::isClobber)
+        ExtraInfo |= (InlineAsm::Extra_MayLoad | InlineAsm::Extra_MayStore);
+    }
+  }
+
    AsmNodeOperands.push_back(DAG.getTargetConstant(ExtraInfo,
                                                    TLI.getPointerTy()));
  
@@ -6231,18 +6170,26 @@ void SelectionDAGBuilder::visitInlineAsm(ImmutableCallSite CS) {
              Ctx.emitError(CS.getInstruction(),  "inline asm not supported yet:"
                            " don't know how to handle tied "
                            "indirect register inputs");
+            report_fatal_error("Cannot handle indirect register inputs!");
            }
  
            RegsForValue MatchedRegs;
            MatchedRegs.ValueVTs.push_back(InOperandVal.getValueType());
-          EVT RegVT = AsmNodeOperands[CurOp+1].getValueType();
+          MVT RegVT = AsmNodeOperands[CurOp+1].getSimpleValueType();
            MatchedRegs.RegVTs.push_back(RegVT);
            MachineRegisterInfo &RegInfo = DAG.getMachineFunction().getRegInfo();
            for (unsigned i = 0, e = InlineAsm::getNumOperandRegisters(OpFlag);
-               i != e; ++i)
-            MatchedRegs.Regs.push_back
-              (RegInfo.createVirtualRegister(TLI.getRegClassFor(RegVT)));
-
+               i != e; ++i) {
+            if (const TargetRegisterClass *RC = TLI.getRegClassFor(RegVT))
+              MatchedRegs.Regs.push_back(RegInfo.createVirtualRegister(RC));
+            else {
+              LLVMContext &Ctx = *DAG.getContext();
+              Ctx.emitError(CS.getInstruction(), "inline asm error: This value"
+                            " type register class is not natively supported!");
+              report_fatal_error("inline asm error: This value type register "
+                                 "class is not natively supported!");
+            }
+          }
            // Use the produced MatchedRegs object to
            MatchedRegs.getCopyToRegs(InOperandVal, DAG, getCurDebugLoc(),
                                      Chain, &Flag, CS.getInstruction());
@@ -6459,6 +6406,28 @@ void SelectionDAGBuilder::visitVACopy(const CallInst &I) {
  /// migrated to using LowerCall, this hook should be integrated into SDISel.
  std::pair<SDValue, SDValue>
  TargetLowering::LowerCallTo(TargetLowering::CallLoweringInfo &CLI) const {
+  // Handle the incoming return values from the call.
+  CLI.Ins.clear();
+  SmallVector<EVT, 4> RetTys;
+  ComputeValueVTs(*this, CLI.RetTy, RetTys);
+  for (unsigned I = 0, E = RetTys.size(); I != E; ++I) {
+    EVT VT = RetTys[I];
+    MVT RegisterVT = getRegisterType(CLI.RetTy->getContext(), VT);
+    unsigned NumRegs = getNumRegisters(CLI.RetTy->getContext(), VT);
+    for (unsigned i = 0; i != NumRegs; ++i) {
+      ISD::InputArg MyFlags;
+      MyFlags.VT = RegisterVT;
+      MyFlags.Used = CLI.IsReturnValueUsed;
+      if (CLI.RetSExt)
+        MyFlags.Flags.setSExt();
+      if (CLI.RetZExt)
+        MyFlags.Flags.setZExt();
+      if (CLI.IsInReg)
+        MyFlags.Flags.setInReg();
+      CLI.Ins.push_back(MyFlags);
+    }
+  }
+
    // Handle all of the outgoing arguments.
    CLI.Outs.clear();
    CLI.OutVals.clear();
@@ -6502,7 +6471,7 @@ TargetLowering::LowerCallTo(TargetLowering::CallLoweringInfo &CLI) const {
          Flags.setNest();
        Flags.setOrigAlign(OriginalAlignment);
  
-      EVT PartVT = getRegisterType(CLI.RetTy->getContext(), VT);
+      MVT PartVT = getRegisterType(CLI.RetTy->getContext(), VT);
        unsigned NumParts = getNumRegisters(CLI.RetTy->getContext(), VT);
        SmallVector<SDValue, 4> Parts(NumParts);
        ISD::NodeType ExtendKind = ISD::ANY_EXTEND;
@@ -6512,13 +6481,34 @@ TargetLowering::LowerCallTo(TargetLowering::CallLoweringInfo &CLI) const {
        else if (Args[i].isZExt)
          ExtendKind = ISD::ZERO_EXTEND;
  
+      // Conservatively only handle 'returned' on non-vectors for now
+      if (Args[i].isReturned && !Op.getValueType().isVector()) {
+        assert(CLI.RetTy == Args[i].Ty && RetTys.size() == NumValues &&
+               "unexpected use of 'returned'");
+        // Before passing 'returned' to the target lowering code, ensure that
+        // either the register MVT and the actual EVT are the same size or that
+        // the return value and argument are extended in the same way; in these
+        // cases it's safe to pass the argument register value unchanged as the
+        // return register value (although it's at the target's option whether
+        // to do so)
+        // TODO: allow code generation to take advantage of partially preserved
+        // registers rather than clobbering the entire register when the
+        // parameter extension method is not compatible with the return
+        // extension method
+        if ((NumParts * PartVT.getSizeInBits() == VT.getSizeInBits()) ||
+            (ExtendKind != ISD::ANY_EXTEND &&
+             CLI.RetSExt == Args[i].isSExt && CLI.RetZExt == Args[i].isZExt))
+        Flags.setReturned();
+      }
+
        getCopyToParts(CLI.DAG, CLI.DL, Op, &Parts[0], NumParts,
                       PartVT, CLI.CS ? CLI.CS->getInstruction() : 0, ExtendKind);
  
        for (unsigned j = 0; j != NumParts; ++j) {
          // if it isn't first piece, alignment must be 1
          ISD::OutputArg MyFlags(Flags, Parts[j].getValueType(),
-                               i < CLI.NumFixedArgs);
+                               i < CLI.NumFixedArgs,
+                               i, j*Parts[j].getValueType().getStoreSize());
          if (NumParts > 1 && j == 0)
            MyFlags.Flags.setSplit();
          else if (j != 0)
@@ -6530,28 +6520,6 @@ TargetLowering::LowerCallTo(TargetLowering::CallLoweringInfo &CLI) const {
      }
    }
  
-  // Handle the incoming return values from the call.
-  CLI.Ins.clear();
-  SmallVector<EVT, 4> RetTys;
-  ComputeValueVTs(*this, CLI.RetTy, RetTys);
-  for (unsigned I = 0, E = RetTys.size(); I != E; ++I) {
-    EVT VT = RetTys[I];
-    EVT RegisterVT = getRegisterType(CLI.RetTy->getContext(), VT);
-    unsigned NumRegs = getNumRegisters(CLI.RetTy->getContext(), VT);
-    for (unsigned i = 0; i != NumRegs; ++i) {
-      ISD::InputArg MyFlags;
-      MyFlags.VT = RegisterVT.getSimpleVT();
-      MyFlags.Used = CLI.IsReturnValueUsed;
-      if (CLI.RetSExt)
-        MyFlags.Flags.setSExt();
-      if (CLI.RetZExt)
-        MyFlags.Flags.setZExt();
-      if (CLI.IsInReg)
-        MyFlags.Flags.setInReg();
-      CLI.Ins.push_back(MyFlags);
-    }
-  }
-
    SmallVector<SDValue, 4> InVals;
    CLI.Chain = LowerCall(CLI, InVals);
  
@@ -6590,7 +6558,7 @@ TargetLowering::LowerCallTo(TargetLowering::CallLoweringInfo &CLI) const {
    unsigned CurReg = 0;
    for (unsigned I = 0, E = RetTys.size(); I != E; ++I) {
      EVT VT = RetTys[I];
-    EVT RegisterVT = getRegisterType(CLI.RetTy->getContext(), VT);
+    MVT RegisterVT = getRegisterType(CLI.RetTy->getContext(), VT);
      unsigned NumRegs = getNumRegisters(CLI.RetTy->getContext(), VT);
  
      ReturnValues.push_back(getCopyFromParts(CLI.DAG, CLI.DL, &InVals[CurReg],
@@ -6658,19 +6626,12 @@ static bool isOnlyUsedInEntryBlock(const Argument *A, bool FastISel) {
    return true;
  }
  
-void SelectionDAGISel::LowerArguments(const BasicBlock *LLVMBB) {
-  // If this is the entry block, emit arguments.
-  const Function &F = *LLVMBB->getParent();
+void SelectionDAGISel::LowerArguments(const Function &F) {
    SelectionDAG &DAG = SDB->DAG;
    DebugLoc dl = SDB->getCurDebugLoc();
    const DataLayout *TD = TLI.getDataLayout();
    SmallVector<ISD::InputArg, 16> Ins;
  
-  // Check whether the function can return without sret-demotion.
-  SmallVector<ISD::OutputArg, 4> Outs;
-  GetReturnInfo(F.getReturnType(), F.getAttributes().getRetAttributes(),
-                Outs, TLI);
-
    if (!FuncInfo->CanLowerReturn) {
      // Put in an sret pointer parameter before all the other parameters.
      SmallVector<EVT, 1> ValueVTs;
@@ -6680,8 +6641,8 @@ void SelectionDAGISel::LowerArguments(const BasicBlock *LLVMBB) {
      // or one register.
      ISD::ArgFlagsTy Flags;
      Flags.setSRet();
-    EVT RegisterVT = TLI.getRegisterType(*DAG.getContext(), ValueVTs[0]);
-    ISD::InputArg RetArg(Flags, RegisterVT, true);
+    MVT RegisterVT = TLI.getRegisterType(*DAG.getContext(), ValueVTs[0]);
+    ISD::InputArg RetArg(Flags, RegisterVT, true, 0, 0);
      Ins.push_back(RetArg);
    }
  
@@ -6700,15 +6661,15 @@ void SelectionDAGISel::LowerArguments(const BasicBlock *LLVMBB) {
        unsigned OriginalAlignment =
          TD->getABITypeAlignment(ArgTy);
  
-      if (F.getParamAttributes(Idx).hasZExtAttr())
+      if (F.getAttributes().hasAttribute(Idx, Attribute::ZExt))
          Flags.setZExt();
-      if (F.getParamAttributes(Idx).hasSExtAttr())
+      if (F.getAttributes().hasAttribute(Idx, Attribute::SExt))
          Flags.setSExt();
-      if (F.getParamAttributes(Idx).hasInRegAttr())
+      if (F.getAttributes().hasAttribute(Idx, Attribute::InReg))
          Flags.setInReg();
-      if (F.getParamAttributes(Idx).hasStructRetAttr())
+      if (F.getAttributes().hasAttribute(Idx, Attribute::StructRet))
          Flags.setSRet();
-      if (F.getParamAttributes(Idx).hasByValAttr()) {
+      if (F.getAttributes().hasAttribute(Idx, Attribute::ByVal)) {
          Flags.setByVal();
          PointerType *Ty = cast<PointerType>(I->getType());
          Type *ElementTy = Ty->getElementType();
@@ -6722,14 +6683,15 @@ void SelectionDAGISel::LowerArguments(const BasicBlock *LLVMBB) {
            FrameAlign = TLI.getByValTypeAlignment(ElementTy);
          Flags.setByValAlign(FrameAlign);
        }
-      if (F.getParamAttributes(Idx).hasNestAttr())
+      if (F.getAttributes().hasAttribute(Idx, Attribute::Nest))
          Flags.setNest();
        Flags.setOrigAlign(OriginalAlignment);
  
-      EVT RegisterVT = TLI.getRegisterType(*CurDAG->getContext(), VT);
+      MVT RegisterVT = TLI.getRegisterType(*CurDAG->getContext(), VT);
        unsigned NumRegs = TLI.getNumRegisters(*CurDAG->getContext(), VT);
        for (unsigned i = 0; i != NumRegs; ++i) {
-        ISD::InputArg MyFlags(Flags, RegisterVT, isArgValueUsed);
+        ISD::InputArg MyFlags(Flags, RegisterVT, isArgValueUsed,
+                              Idx-1, i*RegisterVT.getStoreSize());
          if (NumRegs > 1 && i == 0)
            MyFlags.Flags.setSplit();
          // if it isn't first piece, alignment must be 1
@@ -6771,8 +6733,8 @@ void SelectionDAGISel::LowerArguments(const BasicBlock *LLVMBB) {
      // from the sret argument into it.
      SmallVector<EVT, 1> ValueVTs;
      ComputeValueVTs(TLI, PointerType::getUnqual(F.getReturnType()), ValueVTs);
-    EVT VT = ValueVTs[0];
-    EVT RegVT = TLI.getRegisterType(*CurDAG->getContext(), VT);
+    MVT VT = ValueVTs[0].getSimpleVT();
+    MVT RegVT = TLI.getRegisterType(*CurDAG->getContext(), VT);
      ISD::NodeType AssertOp = ISD::DELETED_NODE;
      SDValue ArgValue = getCopyFromParts(DAG, dl, &InVals[0], 1,
                                          RegVT, VT, NULL, AssertOp);
@@ -6799,19 +6761,25 @@ void SelectionDAGISel::LowerArguments(const BasicBlock *LLVMBB) {
  
      // If this argument is unused then remember its value. It is used to generate
      // debugging information.
-    if (I->use_empty() && NumValues)
+    if (I->use_empty() && NumValues) {
        SDB->setUnusedArgValue(I, InVals[i]);
  
+      // Also remember any frame index for use in FastISel.
+      if (FrameIndexSDNode *FI =
+          dyn_cast<FrameIndexSDNode>(InVals[i].getNode()))
+        FuncInfo->setArgumentFrameIndex(I, FI->getIndex());
+    }
+
      for (unsigned Val = 0; Val != NumValues; ++Val) {
        EVT VT = ValueVTs[Val];
-      EVT PartVT = TLI.getRegisterType(*CurDAG->getContext(), VT);
+      MVT PartVT = TLI.getRegisterType(*CurDAG->getContext(), VT);
        unsigned NumParts = TLI.getNumRegisters(*CurDAG->getContext(), VT);
  
        if (!I->use_empty()) {
          ISD::NodeType AssertOp = ISD::DELETED_NODE;
-        if (F.getParamAttributes(Idx).hasSExtAttr())
+        if (F.getAttributes().hasAttribute(Idx, Attribute::SExt))
            AssertOp = ISD::AssertSext;
-        else if (F.getParamAttributes(Idx).hasZExtAttr())
+        else if (F.getAttributes().hasAttribute(Idx, Attribute::ZExt))
            AssertOp = ISD::AssertZext;
  
          ArgValues.push_back(getCopyFromParts(DAG, dl, &InVals[i],