Make isLegalAddressingMode() take DataLayout as an argument

[oota-llvm.git] / lib / Target / PowerPC / PPCISelLowering.cpp
diff --git a/lib/Target/PowerPC/PPCISelLowering.cpp b/lib/Target/PowerPC/PPCISelLowering.cpp

index bb0eb3995299e7ad643bfbdfc4a3bb5aab920153..0fe88258cab5be161d2b1addd07fc0db7e85e875 100644 (file)
--- a/lib/Target/PowerPC/PPCISelLowering.cpp
+++ b/lib/Target/PowerPC/PPCISelLowering.cpp
@@ -39,6 +39,7 @@
  #include "llvm/Support/MathExtras.h"
  #include "llvm/Support/raw_ostream.h"
  #include "llvm/Target/TargetOptions.h"
+
  using namespace llvm;
  
  // FIXME: Remove this once soft-float is supported.
@@ -404,9 +405,9 @@ PPCTargetLowering::PPCTargetLowering(const PPCTargetMachine &TM,
        // add/sub are legal for all supported vector VT's.
        setOperationAction(ISD::ADD , VT, Legal);
        setOperationAction(ISD::SUB , VT, Legal);
-
+      
        // Vector instructions introduced in P8
-      if (Subtarget.hasP8Altivec()) {
+      if (Subtarget.hasP8Altivec() && (VT.SimpleTy != MVT::v1i128)) {
          setOperationAction(ISD::CTPOP, VT, Legal);
          setOperationAction(ISD::CTLZ, VT, Legal);
        }
@@ -516,7 +517,12 @@ PPCTargetLowering::PPCTargetLowering(const PPCTargetMachine &TM,
        setOperationAction(ISD::FSQRT, MVT::v4f32, Legal);
      }
  
-    setOperationAction(ISD::MUL, MVT::v4i32, Custom);
+    
+    if (Subtarget.hasP8Altivec()) 
+      setOperationAction(ISD::MUL, MVT::v4i32, Legal);
+    else
+      setOperationAction(ISD::MUL, MVT::v4i32, Custom);
+      
      setOperationAction(ISD::MUL, MVT::v8i16, Custom);
      setOperationAction(ISD::MUL, MVT::v16i8, Custom);
  
@@ -569,20 +575,32 @@ PPCTargetLowering::PPCTargetLowering(const PPCTargetMachine &TM,
  
        setOperationAction(ISD::VECTOR_SHUFFLE, MVT::v2f64, Legal);
  
+      if (Subtarget.hasP8Vector())
+        addRegisterClass(MVT::f32, &PPC::VSSRCRegClass);
+
        addRegisterClass(MVT::f64, &PPC::VSFRCRegClass);
  
        addRegisterClass(MVT::v4f32, &PPC::VSRCRegClass);
        addRegisterClass(MVT::v2f64, &PPC::VSRCRegClass);
  
-      // VSX v2i64 only supports non-arithmetic operations.
-      setOperationAction(ISD::ADD, MVT::v2i64, Expand);
-      setOperationAction(ISD::SUB, MVT::v2i64, Expand);
+      if (Subtarget.hasP8Altivec()) {
+        setOperationAction(ISD::SHL, MVT::v2i64, Legal);
+        setOperationAction(ISD::SRA, MVT::v2i64, Legal);
+        setOperationAction(ISD::SRL, MVT::v2i64, Legal);
  
-      setOperationAction(ISD::SHL, MVT::v2i64, Expand);
-      setOperationAction(ISD::SRA, MVT::v2i64, Expand);
-      setOperationAction(ISD::SRL, MVT::v2i64, Expand);
+        setOperationAction(ISD::SETCC, MVT::v2i64, Legal);
+      }
+      else {
+        setOperationAction(ISD::SHL, MVT::v2i64, Expand);
+        setOperationAction(ISD::SRA, MVT::v2i64, Expand);
+        setOperationAction(ISD::SRL, MVT::v2i64, Expand);
+
+        setOperationAction(ISD::SETCC, MVT::v2i64, Custom);
  
-      setOperationAction(ISD::SETCC, MVT::v2i64, Custom);
+        // VSX v2i64 only supports non-arithmetic operations.
+        setOperationAction(ISD::ADD, MVT::v2i64, Expand);
+        setOperationAction(ISD::SUB, MVT::v2i64, Expand);
+      }
  
        setOperationAction(ISD::LOAD, MVT::v2i64, Promote);
        AddPromotedToType (ISD::LOAD, MVT::v2i64, MVT::v2f64);
@@ -606,8 +624,10 @@ PPCTargetLowering::PPCTargetLowering(const PPCTargetMachine &TM,
        addRegisterClass(MVT::v2i64, &PPC::VSRCRegClass);
      }
  
-    if (Subtarget.hasP8Altivec()) 
+    if (Subtarget.hasP8Altivec()) {
        addRegisterClass(MVT::v2i64, &PPC::VRRCRegClass);
+      addRegisterClass(MVT::v1i128, &PPC::VRRCRegClass);
+    }
    }
  
    if (Subtarget.hasQPX()) {
@@ -880,7 +900,7 @@ PPCTargetLowering::PPCTargetLowering(const PPCTargetMachine &TM,
    else
      setSchedulingPreference(Sched::Hybrid);
  
-  computeRegisterProperties();
+  computeRegisterProperties(STI.getRegisterInfo());
  
    // The Freescale cores do better with aggressive inlining of memcpy and
    // friends. GCC uses same threshold of 128 bytes (= 32 word stores).
@@ -892,6 +912,13 @@ PPCTargetLowering::PPCTargetLowering(const PPCTargetMachine &TM,
      MaxStoresPerMemcpyOptSize = 8;
      MaxStoresPerMemmove = 32;
      MaxStoresPerMemmoveOptSize = 8;
+  } else if (Subtarget.getDarwinDirective() == PPC::DIR_A2) {
+    // The A2 also benefits from (very) aggressive inlining of memcpy and
+    // friends. The overhead of the function call, even when warm, can be
+    // over one hundred cycles.
+    MaxStoresPerMemset = 128;
+    MaxStoresPerMemcpy = 128;
+    MaxStoresPerMemmove = 128;
    }
  }
  
@@ -925,7 +952,8 @@ static void getMaxByValAlign(Type *Ty, unsigned &MaxAlign,
  
  /// getByValTypeAlignment - Return the desired alignment for ByVal aggregate
  /// function arguments in the caller parameter area.
-unsigned PPCTargetLowering::getByValTypeAlignment(Type *Ty) const {
+unsigned PPCTargetLowering::getByValTypeAlignment(Type *Ty,
+                                                  const DataLayout &DL) const {
    // Darwin passes everything on 4 byte boundary.
    if (Subtarget.isDarwin())
      return 4;
@@ -939,8 +967,8 @@ unsigned PPCTargetLowering::getByValTypeAlignment(Type *Ty) const {
  }
  
  const char *PPCTargetLowering::getTargetNodeName(unsigned Opcode) const {
-  switch (Opcode) {
-  default: return nullptr;
+  switch ((PPCISD::NodeType)Opcode) {
+  case PPCISD::FIRST_NUMBER:    break;
    case PPCISD::FSEL:            return "PPCISD::FSEL";
    case PPCISD::FCFID:           return "PPCISD::FCFID";
    case PPCISD::FCFIDU:          return "PPCISD::FCFIDU";
@@ -965,6 +993,7 @@ const char *PPCTargetLowering::getTargetNodeName(unsigned Opcode) const {
    case PPCISD::SRL:             return "PPCISD::SRL";
    case PPCISD::SRA:             return "PPCISD::SRA";
    case PPCISD::SHL:             return "PPCISD::SHL";
+  case PPCISD::SRA_ADDZE:       return "PPCISD::SRA_ADDZE";
    case PPCISD::CALL:            return "PPCISD::CALL";
    case PPCISD::CALL_NOP:        return "PPCISD::CALL_NOP";
    case PPCISD::MTCTR:           return "PPCISD::MTCTR";
@@ -975,14 +1004,19 @@ const char *PPCTargetLowering::getTargetNodeName(unsigned Opcode) const {
    case PPCISD::EH_SJLJ_SETJMP:  return "PPCISD::EH_SJLJ_SETJMP";
    case PPCISD::EH_SJLJ_LONGJMP: return "PPCISD::EH_SJLJ_LONGJMP";
    case PPCISD::MFOCRF:          return "PPCISD::MFOCRF";
+  case PPCISD::MFVSR:           return "PPCISD::MFVSR";
+  case PPCISD::MTVSRA:          return "PPCISD::MTVSRA";
+  case PPCISD::MTVSRZ:          return "PPCISD::MTVSRZ";
+  case PPCISD::ANDIo_1_EQ_BIT:  return "PPCISD::ANDIo_1_EQ_BIT";
+  case PPCISD::ANDIo_1_GT_BIT:  return "PPCISD::ANDIo_1_GT_BIT";
    case PPCISD::VCMP:            return "PPCISD::VCMP";
    case PPCISD::VCMPo:           return "PPCISD::VCMPo";
    case PPCISD::LBRX:            return "PPCISD::LBRX";
    case PPCISD::STBRX:           return "PPCISD::STBRX";
    case PPCISD::LFIWAX:          return "PPCISD::LFIWAX";
    case PPCISD::LFIWZX:          return "PPCISD::LFIWZX";
-  case PPCISD::LARX:            return "PPCISD::LARX";
-  case PPCISD::STCX:            return "PPCISD::STCX";
+  case PPCISD::LXVD2X:          return "PPCISD::LXVD2X";
+  case PPCISD::STXVD2X:         return "PPCISD::STXVD2X";
    case PPCISD::COND_BRANCH:     return "PPCISD::COND_BRANCH";
    case PPCISD::BDNZ:            return "PPCISD::BDNZ";
    case PPCISD::BDZ:             return "PPCISD::BDZ";
@@ -991,10 +1025,8 @@ const char *PPCTargetLowering::getTargetNodeName(unsigned Opcode) const {
    case PPCISD::TC_RETURN:       return "PPCISD::TC_RETURN";
    case PPCISD::CR6SET:          return "PPCISD::CR6SET";
    case PPCISD::CR6UNSET:        return "PPCISD::CR6UNSET";
-  case PPCISD::ADDIS_TOC_HA:    return "PPCISD::ADDIS_TOC_HA";
-  case PPCISD::LD_TOC_L:        return "PPCISD::LD_TOC_L";
-  case PPCISD::ADDI_TOC_L:      return "PPCISD::ADDI_TOC_L";
    case PPCISD::PPC32_GOT:       return "PPCISD::PPC32_GOT";
+  case PPCISD::PPC32_PICGOT:    return "PPCISD::PPC32_PICGOT";
    case PPCISD::ADDIS_GOT_TPREL_HA: return "PPCISD::ADDIS_GOT_TPREL_HA";
    case PPCISD::LD_GOT_TPREL_L:  return "PPCISD::LD_GOT_TPREL_L";
    case PPCISD::ADD_TLS:         return "PPCISD::ADD_TLS";
@@ -1010,6 +1042,10 @@ const char *PPCTargetLowering::getTargetNodeName(unsigned Opcode) const {
    case PPCISD::ADDI_DTPREL_L:   return "PPCISD::ADDI_DTPREL_L";
    case PPCISD::VADD_SPLAT:      return "PPCISD::VADD_SPLAT";
    case PPCISD::SC:              return "PPCISD::SC";
+  case PPCISD::CLRBHRB:         return "PPCISD::CLRBHRB";
+  case PPCISD::MFBHRBE:         return "PPCISD::MFBHRBE";
+  case PPCISD::RFEBB:           return "PPCISD::RFEBB";
+  case PPCISD::XXSWAPD:         return "PPCISD::XXSWAPD";
    case PPCISD::QVFPERM:         return "PPCISD::QVFPERM";
    case PPCISD::QVGPCI:          return "PPCISD::QVGPCI";
    case PPCISD::QVALIGNI:        return "PPCISD::QVALIGNI";
@@ -1017,9 +1053,11 @@ const char *PPCTargetLowering::getTargetNodeName(unsigned Opcode) const {
    case PPCISD::QBFLT:           return "PPCISD::QBFLT";
    case PPCISD::QVLFSb:          return "PPCISD::QVLFSb";
    }
+  return nullptr;
  }
  
-EVT PPCTargetLowering::getSetCCResultType(LLVMContext &C, EVT VT) const {
+EVT PPCTargetLowering::getSetCCResultType(const DataLayout &DL, LLVMContext &C,
+                                          EVT VT) const {
    if (!VT.isVector())
      return Subtarget.useCRBits() ? MVT::i1 : MVT::i32;
  
@@ -1061,7 +1099,7 @@ static bool isConstantOrUndef(int Op, int Val) {
  /// VPKUHUM instruction.
  /// The ShuffleKind distinguishes between big-endian operations with
  /// two different inputs (0), either-endian operations with two identical
-/// inputs (1), and little-endian operantion with two different inputs (2).
+/// inputs (1), and little-endian operations with two different inputs (2).
  /// For the latter, the input operands are swapped (see PPCInstrAltivec.td).
  bool PPC::isVPKUHUMShuffleMask(ShuffleVectorSDNode *N, unsigned ShuffleKind,
                                 SelectionDAG &DAG) {
@@ -1092,7 +1130,7 @@ bool PPC::isVPKUHUMShuffleMask(ShuffleVectorSDNode *N, unsigned ShuffleKind,
  /// VPKUWUM instruction.
  /// The ShuffleKind distinguishes between big-endian operations with
  /// two different inputs (0), either-endian operations with two identical
-/// inputs (1), and little-endian operantion with two different inputs (2).
+/// inputs (1), and little-endian operations with two different inputs (2).
  /// For the latter, the input operands are swapped (see PPCInstrAltivec.td).
  bool PPC::isVPKUWUMShuffleMask(ShuffleVectorSDNode *N, unsigned ShuffleKind,
                                 SelectionDAG &DAG) {
@@ -1123,6 +1161,56 @@ bool PPC::isVPKUWUMShuffleMask(ShuffleVectorSDNode *N, unsigned ShuffleKind,
    return true;
  }
  
+/// isVPKUDUMShuffleMask - Return true if this is the shuffle mask for a
+/// VPKUDUM instruction, AND the VPKUDUM instruction exists for the
+/// current subtarget.
+///
+/// The ShuffleKind distinguishes between big-endian operations with
+/// two different inputs (0), either-endian operations with two identical
+/// inputs (1), and little-endian operations with two different inputs (2).
+/// For the latter, the input operands are swapped (see PPCInstrAltivec.td).
+bool PPC::isVPKUDUMShuffleMask(ShuffleVectorSDNode *N, unsigned ShuffleKind,
+                               SelectionDAG &DAG) {
+  const PPCSubtarget& Subtarget =
+    static_cast<const PPCSubtarget&>(DAG.getSubtarget());
+  if (!Subtarget.hasP8Vector())
+    return false;
+
+  bool IsLE = DAG.getTarget().getDataLayout()->isLittleEndian();
+  if (ShuffleKind == 0) {
+    if (IsLE)
+      return false;
+    for (unsigned i = 0; i != 16; i += 4)
+      if (!isConstantOrUndef(N->getMaskElt(i  ),  i*2+4) ||
+          !isConstantOrUndef(N->getMaskElt(i+1),  i*2+5) ||
+          !isConstantOrUndef(N->getMaskElt(i+2),  i*2+6) ||
+          !isConstantOrUndef(N->getMaskElt(i+3),  i*2+7))
+        return false;
+  } else if (ShuffleKind == 2) {
+    if (!IsLE)
+      return false;
+    for (unsigned i = 0; i != 16; i += 4)
+      if (!isConstantOrUndef(N->getMaskElt(i  ),  i*2) ||
+          !isConstantOrUndef(N->getMaskElt(i+1),  i*2+1) ||
+          !isConstantOrUndef(N->getMaskElt(i+2),  i*2+2) ||
+          !isConstantOrUndef(N->getMaskElt(i+3),  i*2+3))
+        return false;
+  } else if (ShuffleKind == 1) {
+    unsigned j = IsLE ? 0 : 4;
+    for (unsigned i = 0; i != 8; i += 4)
+      if (!isConstantOrUndef(N->getMaskElt(i  ),  i*2+j)   ||
+          !isConstantOrUndef(N->getMaskElt(i+1),  i*2+j+1) ||
+          !isConstantOrUndef(N->getMaskElt(i+2),  i*2+j+2) ||
+          !isConstantOrUndef(N->getMaskElt(i+3),  i*2+j+3) ||
+          !isConstantOrUndef(N->getMaskElt(i+8),  i*2+j)   ||
+          !isConstantOrUndef(N->getMaskElt(i+9),  i*2+j+1) ||
+          !isConstantOrUndef(N->getMaskElt(i+10), i*2+j+2) ||
+          !isConstantOrUndef(N->getMaskElt(i+11), i*2+j+3))
+        return false;
+  }
+  return true;
+}
+
  /// isVMerge - Common function, used to match vmrg* shuffles.
  ///
  static bool isVMerge(ShuffleVectorSDNode *N, unsigned UnitSize,
@@ -1193,6 +1281,99 @@ bool PPC::isVMRGHShuffleMask(ShuffleVectorSDNode *N, unsigned UnitSize,
    }
  }
  
+/**
+ * \brief Common function used to match vmrgew and vmrgow shuffles
+ *
+ * The indexOffset determines whether to look for even or odd words in
+ * the shuffle mask. This is based on the endianness of the target
+ * machine.
+ *   - Little Endian:
+ *     - Use offset of 0 to check for odd elements
+ *     - Use offset of 4 to check for even elements
+ *   - Big Endian:
+ *     - Use offset of 0 to check for even elements
+ *     - Use offset of 4 to check for odd elements
+ * A detailed description of the vector element ordering for little endian and
+ * big endian can be found at
+ * http://www.ibm.com/developerworks/library/l-ibm-xl-c-cpp-compiler/index.html
+ * Targeting your applications - what little endian and big endian IBM XL C/C++
+ * compiler differences mean to you
+ *
+ * The mask to the shuffle vector instruction specifies the indices of the
+ * elements from the two input vectors to place in the result. The elements are
+ * numbered in array-access order, starting with the first vector. These vectors
+ * are always of type v16i8, thus each vector will contain 16 elements of size
+ * 8 bits. More info on the shuffle vector can be found in the
+ * http://llvm.org/docs/LangRef.html#shufflevector-instruction
+ * Language Reference.
+ *
+ * The RHSStartValue indicates whether the same input vectors are used (unary)
+ * or two different input vectors are used, based on the following:
+ *   - If the instruction uses the same vector for both inputs, the range of the
+ *     indices will be 0 to 15. In this case, the RHSStartValue passed should
+ *     be 0.
+ *   - If the instruction has two different vectors then the range of the
+ *     indices will be 0 to 31. In this case, the RHSStartValue passed should
+ *     be 16 (indices 0-15 specify elements in the first vector while indices 16
+ *     to 31 specify elements in the second vector).
+ *
+ * \param[in] N The shuffle vector SD Node to analyze
+ * \param[in] IndexOffset Specifies whether to look for even or odd elements
+ * \param[in] RHSStartValue Specifies the starting index for the righthand input
+ * vector to the shuffle_vector instruction
+ * \return true iff this shuffle vector represents an even or odd word merge
+ */
+static bool isVMerge(ShuffleVectorSDNode *N, unsigned IndexOffset,
+                     unsigned RHSStartValue) {
+  if (N->getValueType(0) != MVT::v16i8)
+    return false;
+
+  for (unsigned i = 0; i < 2; ++i)
+    for (unsigned j = 0; j < 4; ++j)
+      if (!isConstantOrUndef(N->getMaskElt(i*4+j),
+                             i*RHSStartValue+j+IndexOffset) ||
+          !isConstantOrUndef(N->getMaskElt(i*4+j+8),
+                             i*RHSStartValue+j+IndexOffset+8))
+        return false;
+  return true;
+}
+
+/**
+ * \brief Determine if the specified shuffle mask is suitable for the vmrgew or
+ * vmrgow instructions.
+ *
+ * \param[in] N The shuffle vector SD Node to analyze
+ * \param[in] CheckEven Check for an even merge (true) or an odd merge (false)
+ * \param[in] ShuffleKind Identify the type of merge:
+ *   - 0 = big-endian merge with two different inputs;
+ *   - 1 = either-endian merge with two identical inputs;
+ *   - 2 = little-endian merge with two different inputs (inputs are swapped for
+ *     little-endian merges).
+ * \param[in] DAG The current SelectionDAG
+ * \return true iff this shuffle mask is suitable for the requested merge
+ */
+bool PPC::isVMRGEOShuffleMask(ShuffleVectorSDNode *N, bool CheckEven,
+                              unsigned ShuffleKind, SelectionDAG &DAG) {
+  if (DAG.getTarget().getDataLayout()->isLittleEndian()) {
+    unsigned indexOffset = CheckEven ? 4 : 0;
+    if (ShuffleKind == 1) // Unary
+      return isVMerge(N, indexOffset, 0);
+    else if (ShuffleKind == 2) // swapped
+      return isVMerge(N, indexOffset, 16);
+    else
+      return false;
+  }
+  else {
+    unsigned indexOffset = CheckEven ? 0 : 4;
+    if (ShuffleKind == 1) // Unary
+      return isVMerge(N, indexOffset, 0);
+    else if (ShuffleKind == 0) // Normal
+      return isVMerge(N, indexOffset, 16);
+    else
+      return false;
+  }
+  return false;
+}
  
  /// isVSLDOIShuffleMask - If this is a vsldoi shuffle mask, return the shift
  /// amount, otherwise return -1.
@@ -1271,22 +1452,6 @@ bool PPC::isSplatShuffleMask(ShuffleVectorSDNode *N, unsigned EltSize) {
    return true;
  }
  
-/// isAllNegativeZeroVector - Returns true if all elements of build_vector
-/// are -0.0.
-bool PPC::isAllNegativeZeroVector(SDNode *N) {
-  BuildVectorSDNode *BV = cast<BuildVectorSDNode>(N);
-
-  APInt APVal, APUndef;
-  unsigned BitSize;
-  bool HasAnyUndefs;
-
-  if (BV->isConstantSplat(APVal, APUndef, BitSize, HasAnyUndefs, 32, true))
-    if (ConstantFPSDNode *CFP = dyn_cast<ConstantFPSDNode>(N->getOperand(0)))
-      return CFP->getValueAPF().isNegZero();
-
-  return false;
-}
-
  /// getVSPLTImmediate - Return the appropriate VSPLT* immediate to splat the
  /// specified isSplatShuffleMask VECTOR_SHUFFLE mask.
  unsigned PPC::getVSPLTImmediate(SDNode *N, unsigned EltSize,
@@ -1346,17 +1511,17 @@ SDValue PPC::get_VSPLTI_elt(SDNode *N, unsigned ByteSize, SelectionDAG &DAG) {
      // Finally, check the least significant entry.
      if (LeadingZero) {
        if (!UniquedVals[Multiple-1].getNode())
-        return DAG.getTargetConstant(0, MVT::i32);  // 0,0,0,undef
+        return DAG.getTargetConstant(0, SDLoc(N), MVT::i32);  // 0,0,0,undef
        int Val = cast<ConstantSDNode>(UniquedVals[Multiple-1])->getZExtValue();
-      if (Val < 16)
-        return DAG.getTargetConstant(Val, MVT::i32);  // 0,0,0,4 -> vspltisw(4)
+      if (Val < 16)                                   // 0,0,0,4 -> vspltisw(4)
+        return DAG.getTargetConstant(Val, SDLoc(N), MVT::i32);
      }
      if (LeadingOnes) {
        if (!UniquedVals[Multiple-1].getNode())
-        return DAG.getTargetConstant(~0U, MVT::i32);  // -1,-1,-1,undef
+        return DAG.getTargetConstant(~0U, SDLoc(N), MVT::i32); // -1,-1,-1,undef
        int Val =cast<ConstantSDNode>(UniquedVals[Multiple-1])->getSExtValue();
        if (Val >= -16)                            // -1,-1,-1,-2 -> vspltisw(-2)
-        return DAG.getTargetConstant(Val, MVT::i32);
+        return DAG.getTargetConstant(Val, SDLoc(N), MVT::i32);
      }
  
      return SDValue();
@@ -1387,17 +1552,10 @@ SDValue PPC::get_VSPLTI_elt(SDNode *N, unsigned ByteSize, SelectionDAG &DAG) {
    // immediate field for would be zero, and we prefer to use vxor for it.
    if (ValSizeInBytes < ByteSize) return SDValue();
  
-  // If the element value is larger than the splat value, cut it in half and
-  // check to see if the two halves are equal.  Continue doing this until we
-  // get to ByteSize.  This allows us to handle 0x01010101 as 0x01.
-  while (ValSizeInBytes > ByteSize) {
-    ValSizeInBytes >>= 1;
-
-    // If the top half equals the bottom half, we're still ok.
-    if (((Value >> (ValSizeInBytes*8)) & ((1 << (8*ValSizeInBytes))-1)) !=
-         (Value                        & ((1 << (8*ValSizeInBytes))-1)))
-      return SDValue();
-  }
+  // If the element value is larger than the splat value, check if it consists
+  // of a repeated bit pattern of size ByteSize.
+  if (!APInt(ValSizeInBytes * 8, Value).isSplat(ByteSize * 8))
+    return SDValue();
  
    // Properly sign extend the value.
    int MaskVal = SignExtend32(Value, ByteSize * 8);
@@ -1407,7 +1565,7 @@ SDValue PPC::get_VSPLTI_elt(SDNode *N, unsigned ByteSize, SelectionDAG &DAG) {
  
    // Finally, if this value fits in a 5 bit sext field, return it
    if (SignExtend32<5>(MaskVal) == MaskVal)
-    return DAG.getTargetConstant(MaskVal, MVT::i32);
+    return DAG.getTargetConstant(MaskVal, SDLoc(N), MVT::i32);
    return SDValue();
  }
  
@@ -1566,7 +1724,7 @@ bool PPCTargetLowering::SelectAddressRegImm(SDValue N, SDValue &Disp,
      short imm = 0;
      if (isIntS16Immediate(N.getOperand(1), imm) &&
          (!Aligned || (imm & 3) == 0)) {
-      Disp = DAG.getTargetConstant(imm, N.getValueType());
+      Disp = DAG.getTargetConstant(imm, dl, N.getValueType());
        if (FrameIndexSDNode *FI = dyn_cast<FrameIndexSDNode>(N.getOperand(0))) {
          Base = DAG.getTargetFrameIndex(FI->getIndex(), N.getValueType());
          fixupFuncForFI(DAG, FI->getIndex(), N.getValueType());
@@ -1606,7 +1764,7 @@ bool PPCTargetLowering::SelectAddressRegImm(SDValue N, SDValue &Disp,
          } else {
            Base = N.getOperand(0);
          }
-        Disp = DAG.getTargetConstant(imm, N.getValueType());
+        Disp = DAG.getTargetConstant(imm, dl, N.getValueType());
          return true;
        }
      }
@@ -1617,7 +1775,7 @@ bool PPCTargetLowering::SelectAddressRegImm(SDValue N, SDValue &Disp,
      // this as "d, 0"
      short Imm;
      if (isIntS16Immediate(CN, Imm) && (!Aligned || (Imm & 3) == 0)) {
-      Disp = DAG.getTargetConstant(Imm, CN->getValueType(0));
+      Disp = DAG.getTargetConstant(Imm, dl, CN->getValueType(0));
        Base = DAG.getRegister(Subtarget.isPPC64() ? PPC::ZERO8 : PPC::ZERO,
                               CN->getValueType(0));
        return true;
@@ -1630,16 +1788,17 @@ bool PPCTargetLowering::SelectAddressRegImm(SDValue N, SDValue &Disp,
        int Addr = (int)CN->getZExtValue();
  
        // Otherwise, break this down into an LIS + disp.
-      Disp = DAG.getTargetConstant((short)Addr, MVT::i32);
+      Disp = DAG.getTargetConstant((short)Addr, dl, MVT::i32);
  
-      Base = DAG.getTargetConstant((Addr - (signed short)Addr) >> 16, MVT::i32);
+      Base = DAG.getTargetConstant((Addr - (signed short)Addr) >> 16, dl,
+                                   MVT::i32);
        unsigned Opc = CN->getValueType(0) == MVT::i32 ? PPC::LIS : PPC::LIS8;
        Base = SDValue(DAG.getMachineNode(Opc, dl, CN->getValueType(0), Base), 0);
        return true;
      }
    }
  
-  Disp = DAG.getTargetConstant(0, getPointerTy());
+  Disp = DAG.getTargetConstant(0, dl, getPointerTy(DAG.getDataLayout()));
    if (FrameIndexSDNode *FI = dyn_cast<FrameIndexSDNode>(N)) {
      Base = DAG.getTargetFrameIndex(FI->getIndex(), N.getValueType());
      fixupFuncForFI(DAG, FI->getIndex(), N.getValueType());
@@ -1798,9 +1957,9 @@ static bool GetLabelAccessInfo(const TargetMachine &TM,
  
  static SDValue LowerLabelRef(SDValue HiPart, SDValue LoPart, bool isPIC,
                               SelectionDAG &DAG) {
-  EVT PtrVT = HiPart.getValueType();
-  SDValue Zero = DAG.getConstant(0, PtrVT);
    SDLoc DL(HiPart);
+  EVT PtrVT = HiPart.getValueType();
+  SDValue Zero = DAG.getConstant(0, DL, PtrVT);
  
    SDValue Hi = DAG.getNode(PPCISD::Hi, DL, PtrVT, HiPart, Zero);
    SDValue Lo = DAG.getNode(PPCISD::Lo, DL, PtrVT, LoPart, Zero);
@@ -1824,6 +1983,19 @@ static void setUsesTOCBasePtr(SelectionDAG &DAG) {
    setUsesTOCBasePtr(DAG.getMachineFunction());
  }
  
+static SDValue getTOCEntry(SelectionDAG &DAG, SDLoc dl, bool Is64Bit,
+                           SDValue GA) {
+  EVT VT = Is64Bit ? MVT::i64 : MVT::i32;
+  SDValue Reg = Is64Bit ? DAG.getRegister(PPC::X2, VT) :
+                DAG.getNode(PPCISD::GlobalBaseReg, dl, VT);
+
+  SDValue Ops[] = { GA, Reg };
+  return DAG.getMemIntrinsicNode(PPCISD::TOC_ENTRY, dl,
+                                 DAG.getVTList(VT, MVT::Other), Ops, VT,
+                                 MachinePointerInfo::getGOT(), 0, false, true,
+                                 false, 0);
+}
+
  SDValue PPCTargetLowering::LowerConstantPool(SDValue Op,
                                               SelectionDAG &DAG) const {
    EVT PtrVT = Op.getValueType();
@@ -1835,8 +2007,7 @@ SDValue PPCTargetLowering::LowerConstantPool(SDValue Op,
    if (Subtarget.isSVR4ABI() && Subtarget.isPPC64()) {
      setUsesTOCBasePtr(DAG);
      SDValue GA = DAG.getTargetConstantPool(C, PtrVT, CP->getAlignment(), 0);
-    return DAG.getNode(PPCISD::TOC_ENTRY, SDLoc(CP), MVT::i64, GA,
-                       DAG.getRegister(PPC::X2, MVT::i64));
+    return getTOCEntry(DAG, SDLoc(CP), true, GA);
    }
  
    unsigned MOHiFlag, MOLoFlag;
@@ -1846,9 +2017,7 @@ SDValue PPCTargetLowering::LowerConstantPool(SDValue Op,
    if (isPIC && Subtarget.isSVR4ABI()) {
      SDValue GA = DAG.getTargetConstantPool(C, PtrVT, CP->getAlignment(),
                                             PPCII::MO_PIC_FLAG);
-    SDLoc DL(CP);
-    return DAG.getNode(PPCISD::TOC_ENTRY, DL, MVT::i32, GA,
-                       DAG.getNode(PPCISD::GlobalBaseReg, DL, PtrVT));
+    return getTOCEntry(DAG, SDLoc(CP), false, GA);
    }
  
    SDValue CPIHi =
@@ -1867,8 +2036,7 @@ SDValue PPCTargetLowering::LowerJumpTable(SDValue Op, SelectionDAG &DAG) const {
    if (Subtarget.isSVR4ABI() && Subtarget.isPPC64()) {
      setUsesTOCBasePtr(DAG);
      SDValue GA = DAG.getTargetJumpTable(JT->getIndex(), PtrVT);
-    return DAG.getNode(PPCISD::TOC_ENTRY, SDLoc(JT), MVT::i64, GA,
-                       DAG.getRegister(PPC::X2, MVT::i64));
+    return getTOCEntry(DAG, SDLoc(JT), true, GA);
    }
  
    unsigned MOHiFlag, MOLoFlag;
@@ -1878,9 +2046,7 @@ SDValue PPCTargetLowering::LowerJumpTable(SDValue Op, SelectionDAG &DAG) const {
    if (isPIC && Subtarget.isSVR4ABI()) {
      SDValue GA = DAG.getTargetJumpTable(JT->getIndex(), PtrVT,
                                          PPCII::MO_PIC_FLAG);
-    SDLoc DL(GA);
-    return DAG.getNode(PPCISD::TOC_ENTRY, SDLoc(JT), PtrVT, GA,
-                       DAG.getNode(PPCISD::GlobalBaseReg, DL, PtrVT));
+    return getTOCEntry(DAG, SDLoc(GA), false, GA);
    }
  
    SDValue JTIHi = DAG.getTargetJumpTable(JT->getIndex(), PtrVT, MOHiFlag);
@@ -1899,8 +2065,7 @@ SDValue PPCTargetLowering::LowerBlockAddress(SDValue Op,
    if (Subtarget.isSVR4ABI() && Subtarget.isPPC64()) {
      setUsesTOCBasePtr(DAG);
      SDValue GA = DAG.getTargetBlockAddress(BA, PtrVT, BASDN->getOffset());
-    return DAG.getNode(PPCISD::TOC_ENTRY, SDLoc(BASDN), MVT::i64, GA,
-                       DAG.getRegister(PPC::X2, MVT::i64));
+    return getTOCEntry(DAG, SDLoc(BASDN), true, GA);
    }
  
    unsigned MOHiFlag, MOLoFlag;
@@ -1921,7 +2086,7 @@ SDValue PPCTargetLowering::LowerGlobalTLSAddress(SDValue Op,
    GlobalAddressSDNode *GA = cast<GlobalAddressSDNode>(Op);
    SDLoc dl(GA);
    const GlobalValue *GV = GA->getGlobal();
-  EVT PtrVT = getPointerTy();
+  EVT PtrVT = getPointerTy(DAG.getDataLayout());
    bool is64bit = Subtarget.isPPC64();
    const Module *M = DAG.getMachineFunction().getFunction()->getParent();
    PICLevel::Level picLevel = M->getPICLevel();
@@ -2010,8 +2175,7 @@ SDValue PPCTargetLowering::LowerGlobalAddress(SDValue Op,
    if (Subtarget.isSVR4ABI() && Subtarget.isPPC64()) {
      setUsesTOCBasePtr(DAG);
      SDValue GA = DAG.getTargetGlobalAddress(GV, DL, PtrVT, GSDN->getOffset());
-    return DAG.getNode(PPCISD::TOC_ENTRY, DL, MVT::i64, GA,
-                       DAG.getRegister(PPC::X2, MVT::i64));
+    return getTOCEntry(DAG, DL, true, GA);
    }
  
    unsigned MOHiFlag, MOLoFlag;
@@ -2022,8 +2186,7 @@ SDValue PPCTargetLowering::LowerGlobalAddress(SDValue Op,
      SDValue GA = DAG.getTargetGlobalAddress(GV, DL, PtrVT,
                                              GSDN->getOffset(),
                                              PPCII::MO_PIC_FLAG);
-    return DAG.getNode(PPCISD::TOC_ENTRY, DL, MVT::i32, GA,
-                       DAG.getNode(PPCISD::GlobalBaseReg, DL, MVT::i32));
+    return getTOCEntry(DAG, DL, false, GA);
    }
  
    SDValue GAHi =
@@ -2080,7 +2243,7 @@ SDValue PPCTargetLowering::LowerSETCC(SDValue Op, SelectionDAG &DAG) const {
        unsigned Log2b = Log2_32(VT.getSizeInBits());
        SDValue Clz = DAG.getNode(ISD::CTLZ, dl, VT, Zext);
        SDValue Scc = DAG.getNode(ISD::SRL, dl, VT, Clz,
-                                DAG.getConstant(Log2b, MVT::i32));
+                                DAG.getConstant(Log2b, dl, MVT::i32));
        return DAG.getNode(ISD::TRUNCATE, dl, MVT::i32, Scc);
      }
      // Leave comparisons against 0 and -1 alone for now, since they're usually
@@ -2100,7 +2263,7 @@ SDValue PPCTargetLowering::LowerSETCC(SDValue Op, SelectionDAG &DAG) const {
      EVT VT = Op.getValueType();
      SDValue Sub = DAG.getNode(ISD::XOR, dl, LHSVT, Op.getOperand(0),
                                  Op.getOperand(1));
-    return DAG.getSetCC(dl, VT, Sub, DAG.getConstant(0, LHSVT), CC);
+    return DAG.getSetCC(dl, VT, Sub, DAG.getConstant(0, dl, LHSVT), CC);
    }
    return SDValue();
  }
@@ -2109,7 +2272,7 @@ SDValue PPCTargetLowering::LowerVAARG(SDValue Op, SelectionDAG &DAG,
                                        const PPCSubtarget &Subtarget) const {
    SDNode *Node = Op.getNode();
    EVT VT = Node->getValueType(0);
-  EVT PtrVT = DAG.getTargetLoweringInfo().getPointerTy();
+  EVT PtrVT = DAG.getTargetLoweringInfo().getPointerTy(DAG.getDataLayout());
    SDValue InChain = Node->getOperand(0);
    SDValue VAListPtr = Node->getOperand(1);
    const Value *SV = cast<SrcValueSDNode>(Node->getOperand(2))->getValue();
@@ -2126,11 +2289,11 @@ SDValue PPCTargetLowering::LowerVAARG(SDValue Op, SelectionDAG &DAG,
    if (VT == MVT::i64) {
      // Check if GprIndex is even
      SDValue GprAnd = DAG.getNode(ISD::AND, dl, MVT::i32, GprIndex,
-                                 DAG.getConstant(1, MVT::i32));
+                                 DAG.getConstant(1, dl, MVT::i32));
      SDValue CC64 = DAG.getSetCC(dl, MVT::i32, GprAnd,
-                                DAG.getConstant(0, MVT::i32), ISD::SETNE);
+                                DAG.getConstant(0, dl, MVT::i32), ISD::SETNE);
      SDValue GprIndexPlusOne = DAG.getNode(ISD::ADD, dl, MVT::i32, GprIndex,
-                                          DAG.getConstant(1, MVT::i32));
+                                          DAG.getConstant(1, dl, MVT::i32));
      // Align GprIndex to be even if it isn't
      GprIndex = DAG.getNode(ISD::SELECT, dl, MVT::i32, CC64, GprIndexPlusOne,
                             GprIndex);
@@ -2138,7 +2301,7 @@ SDValue PPCTargetLowering::LowerVAARG(SDValue Op, SelectionDAG &DAG,
  
    // fpr index is 1 byte after gpr
    SDValue FprPtr = DAG.getNode(ISD::ADD, dl, PtrVT, VAListPtr,
-                               DAG.getConstant(1, MVT::i32));
+                               DAG.getConstant(1, dl, MVT::i32));
  
    // fpr
    SDValue FprIndex = DAG.getExtLoad(ISD::ZEXTLOAD, dl, MVT::i32, InChain,
@@ -2147,10 +2310,10 @@ SDValue PPCTargetLowering::LowerVAARG(SDValue Op, SelectionDAG &DAG,
    InChain = FprIndex.getValue(1);
  
    SDValue RegSaveAreaPtr = DAG.getNode(ISD::ADD, dl, PtrVT, VAListPtr,
-                                       DAG.getConstant(8, MVT::i32));
+                                       DAG.getConstant(8, dl, MVT::i32));
  
    SDValue OverflowAreaPtr = DAG.getNode(ISD::ADD, dl, PtrVT, VAListPtr,
-                                        DAG.getConstant(4, MVT::i32));
+                                        DAG.getConstant(4, dl, MVT::i32));
  
    // areas
    SDValue OverflowArea = DAG.getLoad(MVT::i32, dl, InChain, OverflowAreaPtr,
@@ -2165,12 +2328,12 @@ SDValue PPCTargetLowering::LowerVAARG(SDValue Op, SelectionDAG &DAG,
  
    // select overflow_area if index > 8
    SDValue CC = DAG.getSetCC(dl, MVT::i32, VT.isInteger() ? GprIndex : FprIndex,
-                            DAG.getConstant(8, MVT::i32), ISD::SETLT);
+                            DAG.getConstant(8, dl, MVT::i32), ISD::SETLT);
  
    // adjustment constant gpr_index * 4/8
    SDValue RegConstant = DAG.getNode(ISD::MUL, dl, MVT::i32,
                                      VT.isInteger() ? GprIndex : FprIndex,
-                                    DAG.getConstant(VT.isInteger() ? 4 : 8,
+                                    DAG.getConstant(VT.isInteger() ? 4 : 8, dl,
                                                      MVT::i32));
  
    // OurReg = RegSaveArea + RegConstant
@@ -2180,12 +2343,12 @@ SDValue PPCTargetLowering::LowerVAARG(SDValue Op, SelectionDAG &DAG,
    // Floating types are 32 bytes into RegSaveArea
    if (VT.isFloatingPoint())
      OurReg = DAG.getNode(ISD::ADD, dl, PtrVT, OurReg,
-                         DAG.getConstant(32, MVT::i32));
+                         DAG.getConstant(32, dl, MVT::i32));
  
    // increase {f,g}pr_index by 1 (or 2 if VT is i64)
    SDValue IndexPlus1 = DAG.getNode(ISD::ADD, dl, MVT::i32,
                                     VT.isInteger() ? GprIndex : FprIndex,
-                                   DAG.getConstant(VT == MVT::i64 ? 2 : 1,
+                                   DAG.getConstant(VT == MVT::i64 ? 2 : 1, dl,
                                                     MVT::i32));
  
    InChain = DAG.getTruncStore(InChain, dl, IndexPlus1,
@@ -2199,7 +2362,7 @@ SDValue PPCTargetLowering::LowerVAARG(SDValue Op, SelectionDAG &DAG,
    // increase overflow_area by 4/8 if gpr/fpr > 8
    SDValue OverflowAreaPlusN = DAG.getNode(ISD::ADD, dl, PtrVT, OverflowArea,
                                            DAG.getConstant(VT.isInteger() ? 4 : 8,
-                                          MVT::i32));
+                                          dl, MVT::i32));
  
    OverflowArea = DAG.getNode(ISD::SELECT, dl, MVT::i32, CC, OverflowArea,
                               OverflowAreaPlusN);
@@ -2221,8 +2384,8 @@ SDValue PPCTargetLowering::LowerVACOPY(SDValue Op, SelectionDAG &DAG,
    // 2*sizeof(char) + 2 Byte alignment + 2*sizeof(char*) = 12 Byte
    return DAG.getMemcpy(Op.getOperand(0), Op,
                         Op.getOperand(1), Op.getOperand(2),
-                       DAG.getConstant(12, MVT::i32), 8, false, true,
-                       MachinePointerInfo(), MachinePointerInfo());
+                       DAG.getConstant(12, SDLoc(Op), MVT::i32), 8, false, true,
+                       false, MachinePointerInfo(), MachinePointerInfo());
  }
  
  SDValue PPCTargetLowering::LowerADJUST_TRAMPOLINE(SDValue Op,
@@ -2238,7 +2401,7 @@ SDValue PPCTargetLowering::LowerINIT_TRAMPOLINE(SDValue Op,
    SDValue Nest = Op.getOperand(3); // 'nest' parameter value
    SDLoc dl(Op);
  
-  EVT PtrVT = DAG.getTargetLoweringInfo().getPointerTy();
+  EVT PtrVT = DAG.getTargetLoweringInfo().getPointerTy(DAG.getDataLayout());
    bool isPPC64 = (PtrVT == MVT::i64);
    Type *IntPtrTy =
      DAG.getTargetLoweringInfo().getDataLayout()->getIntPtrType(
@@ -2251,7 +2414,7 @@ SDValue PPCTargetLowering::LowerINIT_TRAMPOLINE(SDValue Op,
    Entry.Node = Trmp; Args.push_back(Entry);
  
    // TrampSize == (isPPC64 ? 48 : 40);
-  Entry.Node = DAG.getConstant(isPPC64 ? 48 : 40,
+  Entry.Node = DAG.getConstant(isPPC64 ? 48 : 40, dl,
                                 isPPC64 ? MVT::i64 : MVT::i32);
    Args.push_back(Entry);
  
@@ -2279,7 +2442,7 @@ SDValue PPCTargetLowering::LowerVASTART(SDValue Op, SelectionDAG &DAG,
    if (Subtarget.isDarwinABI() || Subtarget.isPPC64()) {
      // vastart just stores the address of the VarArgsFrameIndex slot into the
      // memory location argument.
-    EVT PtrVT = DAG.getTargetLoweringInfo().getPointerTy();
+    EVT PtrVT = DAG.getTargetLoweringInfo().getPointerTy(MF.getDataLayout());
      SDValue FR = DAG.getFrameIndex(FuncInfo->getVarArgsFrameIndex(), PtrVT);
      const Value *SV = cast<SrcValueSDNode>(Op.getOperand(2))->getValue();
      return DAG.getStore(Op.getOperand(0), dl, FR, Op.getOperand(1),
@@ -2312,11 +2475,10 @@ SDValue PPCTargetLowering::LowerVASTART(SDValue Op, SelectionDAG &DAG,
    // } va_list[1];
  
  
-  SDValue ArgGPR = DAG.getConstant(FuncInfo->getVarArgsNumGPR(), MVT::i32);
-  SDValue ArgFPR = DAG.getConstant(FuncInfo->getVarArgsNumFPR(), MVT::i32);
+  SDValue ArgGPR = DAG.getConstant(FuncInfo->getVarArgsNumGPR(), dl, MVT::i32);
+  SDValue ArgFPR = DAG.getConstant(FuncInfo->getVarArgsNumFPR(), dl, MVT::i32);
  
-
-  EVT PtrVT = DAG.getTargetLoweringInfo().getPointerTy();
+  EVT PtrVT = DAG.getTargetLoweringInfo().getPointerTy(MF.getDataLayout());
  
    SDValue StackOffsetFI = DAG.getFrameIndex(FuncInfo->getVarArgsStackOffset(),
                                              PtrVT);
@@ -2324,13 +2486,13 @@ SDValue PPCTargetLowering::LowerVASTART(SDValue Op, SelectionDAG &DAG,
                                   PtrVT);
  
    uint64_t FrameOffset = PtrVT.getSizeInBits()/8;
-  SDValue ConstFrameOffset = DAG.getConstant(FrameOffset, PtrVT);
+  SDValue ConstFrameOffset = DAG.getConstant(FrameOffset, dl, PtrVT);
  
    uint64_t StackOffset = PtrVT.getSizeInBits()/8 - 1;
-  SDValue ConstStackOffset = DAG.getConstant(StackOffset, PtrVT);
+  SDValue ConstStackOffset = DAG.getConstant(StackOffset, dl, PtrVT);
  
    uint64_t FPROffset = 1;
-  SDValue ConstFPROffset = DAG.getConstant(FPROffset, PtrVT);
+  SDValue ConstFPROffset = DAG.getConstant(FPROffset, dl, PtrVT);
  
    const Value *SV = cast<SrcValueSDNode>(Op.getOperand(2))->getValue();
  
@@ -2435,27 +2597,16 @@ bool llvm::CC_PPC32_SVR4_Custom_AlignFPArgRegs(unsigned &ValNo, MVT &ValVT,
    return false;
  }
  
-/// GetFPR - Get the set of FP registers that should be allocated for arguments,
+/// FPR - The set of FP registers that should be allocated for arguments,
  /// on Darwin.
-static const MCPhysReg *GetFPR() {
-  static const MCPhysReg FPR[] = {
-    PPC::F1, PPC::F2, PPC::F3, PPC::F4, PPC::F5, PPC::F6, PPC::F7,
-    PPC::F8, PPC::F9, PPC::F10, PPC::F11, PPC::F12, PPC::F13
-  };
-
-  return FPR;
-}
-
-/// GetQFPR - Get the set of QPX registers that should be allocated for
-/// arguments.
-static const MCPhysReg *GetQFPR() {
-  static const MCPhysReg QFPR[] = {
-    PPC::QF1, PPC::QF2, PPC::QF3, PPC::QF4, PPC::QF5, PPC::QF6, PPC::QF7,
-    PPC::QF8, PPC::QF9, PPC::QF10, PPC::QF11, PPC::QF12, PPC::QF13
-  };
+static const MCPhysReg FPR[] = {PPC::F1,  PPC::F2,  PPC::F3, PPC::F4, PPC::F5,
+                                PPC::F6,  PPC::F7,  PPC::F8, PPC::F9, PPC::F10,
+                                PPC::F11, PPC::F12, PPC::F13};
  
-  return QFPR;
-}
+/// QFPR - The set of QPX registers that should be allocated for arguments.
+static const MCPhysReg QFPR[] = {
+    PPC::QF1, PPC::QF2, PPC::QF3,  PPC::QF4,  PPC::QF5,  PPC::QF6, PPC::QF7,
+    PPC::QF8, PPC::QF9, PPC::QF10, PPC::QF11, PPC::QF12, PPC::QF13};
  
  /// CalculateStackSlotSize - Calculates the size reserved for this argument on
  /// the stack.
@@ -2483,7 +2634,8 @@ static unsigned CalculateStackSlotAlignment(EVT ArgVT, EVT OrigVT,
    // Altivec parameters are padded to a 16 byte boundary.
    if (ArgVT == MVT::v4f32 || ArgVT == MVT::v4i32 ||
        ArgVT == MVT::v8i16 || ArgVT == MVT::v16i8 ||
-      ArgVT == MVT::v2f64 || ArgVT == MVT::v2i64)
+      ArgVT == MVT::v2f64 || ArgVT == MVT::v2i64 ||
+      ArgVT == MVT::v1i128)
      Align = 16;
    // QPX vector types stored in double-precision are padded to a 32 byte
    // boundary.
@@ -2562,7 +2714,8 @@ static bool CalculateStackSlotUsed(EVT ArgVT, EVT OrigVT,
        }
      if (ArgVT == MVT::v4f32 || ArgVT == MVT::v4i32 ||
          ArgVT == MVT::v8i16 || ArgVT == MVT::v16i8 ||
-        ArgVT == MVT::v2f64 || ArgVT == MVT::v2i64)
+        ArgVT == MVT::v2f64 || ArgVT == MVT::v2i64 ||
+        ArgVT == MVT::v1i128)
        if (AvailableVRs > 0) {
          --AvailableVRs;
          return false;
@@ -2645,7 +2798,7 @@ PPCTargetLowering::LowerFormalArguments_32SVR4(
    MachineFrameInfo *MFI = MF.getFrameInfo();
    PPCFunctionInfo *FuncInfo = MF.getInfo<PPCFunctionInfo>();
  
-  EVT PtrVT = DAG.getTargetLoweringInfo().getPointerTy();
+  EVT PtrVT = DAG.getTargetLoweringInfo().getPointerTy(MF.getDataLayout());
    // Potential tail calls could cause overwriting of argument stack slots.
    bool isImmutable = !(getTargetMachine().Options.GuaranteedTailCallOpt &&
                         (CallConv == CallingConv::Fast));
@@ -2678,7 +2831,10 @@ PPCTargetLowering::LowerFormalArguments_32SVR4(
            RC = &PPC::GPRCRegClass;
            break;
          case MVT::f32:
-          RC = &PPC::F4RCRegClass;
+          if (Subtarget.hasP8Vector())
+            RC = &PPC::VSSRCRegClass;
+          else
+            RC = &PPC::F4RCRegClass;
            break;
          case MVT::f64:
            if (Subtarget.hasVSX())
@@ -2802,7 +2958,7 @@ PPCTargetLowering::LowerFormalArguments_32SVR4(
                                     MachinePointerInfo(), false, false, 0);
        MemOps.push_back(Store);
        // Increment the address by four for the next argument to store
-      SDValue PtrOff = DAG.getConstant(PtrVT.getSizeInBits()/8, PtrVT);
+      SDValue PtrOff = DAG.getConstant(PtrVT.getSizeInBits()/8, dl, PtrVT);
        FIN = DAG.getNode(ISD::ADD, dl, PtrOff.getValueType(), FIN, PtrOff);
      }
  
@@ -2821,7 +2977,7 @@ PPCTargetLowering::LowerFormalArguments_32SVR4(
                                     MachinePointerInfo(), false, false, 0);
        MemOps.push_back(Store);
        // Increment the address by eight for the next argument to store
-      SDValue PtrOff = DAG.getConstant(MVT(MVT::f64).getSizeInBits()/8,
+      SDValue PtrOff = DAG.getConstant(MVT(MVT::f64).getSizeInBits()/8, dl,
                                           PtrVT);
        FIN = DAG.getNode(ISD::ADD, dl, PtrOff.getValueType(), FIN, PtrOff);
      }
@@ -2868,7 +3024,7 @@ PPCTargetLowering::LowerFormalArguments_64SVR4(
    assert(!(CallConv == CallingConv::Fast && isVarArg) &&
           "fastcc not supported on varargs functions");
  
-  EVT PtrVT = DAG.getTargetLoweringInfo().getPointerTy();
+  EVT PtrVT = DAG.getTargetLoweringInfo().getPointerTy(MF.getDataLayout());
    // Potential tail calls could cause overwriting of argument stack slots.
    bool isImmutable = !(getTargetMachine().Options.GuaranteedTailCallOpt &&
                         (CallConv == CallingConv::Fast));
@@ -2879,9 +3035,6 @@ PPCTargetLowering::LowerFormalArguments_64SVR4(
      PPC::X3, PPC::X4, PPC::X5, PPC::X6,
      PPC::X7, PPC::X8, PPC::X9, PPC::X10,
    };
-
-  static const MCPhysReg *FPR = GetFPR();
-
    static const MCPhysReg VR[] = {
      PPC::V2, PPC::V3, PPC::V4, PPC::V5, PPC::V6, PPC::V7, PPC::V8,
      PPC::V9, PPC::V10, PPC::V11, PPC::V12, PPC::V13
@@ -2891,8 +3044,6 @@ PPCTargetLowering::LowerFormalArguments_64SVR4(
      PPC::VSH9, PPC::VSH10, PPC::VSH11, PPC::VSH12, PPC::VSH13
    };
  
-  static const MCPhysReg *QFPR = GetQFPR();
-
    const unsigned Num_GPR_Regs = array_lengthof(GPR);
    const unsigned Num_FPR_Regs = 13;
    const unsigned Num_VR_Regs  = array_lengthof(VR);
@@ -3002,7 +3153,7 @@ PPCTargetLowering::LowerFormalArguments_64SVR4(
          // address of the enclosing doubleword on big-endian systems.
          SDValue Arg = FIN;
          if (!isLittleEndian) {
-          SDValue ArgOff = DAG.getConstant(PtrByteSize - ObjSize, PtrVT);
+          SDValue ArgOff = DAG.getConstant(PtrByteSize - ObjSize, dl, PtrVT);
            Arg = DAG.getNode(ISD::ADD, dl, ArgOff.getValueType(), Arg, ArgOff);
          }
          InVals.push_back(Arg);
@@ -3048,7 +3199,7 @@ PPCTargetLowering::LowerFormalArguments_64SVR4(
          SDValue Val = DAG.getCopyFromReg(Chain, dl, VReg, PtrVT);
          SDValue Addr = FIN;
          if (j) {
-          SDValue Off = DAG.getConstant(j, PtrVT);
+          SDValue Off = DAG.getConstant(j, dl, PtrVT);
            Addr = DAG.getNode(ISD::ADD, dl, Off.getValueType(), Addr, Off);
          }
          SDValue Store = DAG.getStore(Val.getValue(1), dl, Val, Addr,
@@ -3097,7 +3248,10 @@ PPCTargetLowering::LowerFormalArguments_64SVR4(
          unsigned VReg;
  
          if (ObjectVT == MVT::f32)
-          VReg = MF.addLiveIn(FPR[FPR_idx], &PPC::F4RCRegClass);
+          VReg = MF.addLiveIn(FPR[FPR_idx],
+                              Subtarget.hasP8Vector()
+                                  ? &PPC::VSSRCRegClass
+                                  : &PPC::F4RCRegClass);
          else
            VReg = MF.addLiveIn(FPR[FPR_idx], Subtarget.hasVSX()
                                                  ? &PPC::VSFRCRegClass
@@ -3118,7 +3272,7 @@ PPCTargetLowering::LowerFormalArguments_64SVR4(
          if (ObjectVT == MVT::f32) {
            if ((ArgOffset % PtrByteSize) == (isLittleEndian ? 4 : 0))
              ArgVal = DAG.getNode(ISD::SRL, dl, MVT::i64, ArgVal,
-                                 DAG.getConstant(32, MVT::i32));
+                                 DAG.getConstant(32, dl, MVT::i32));
            ArgVal = DAG.getNode(ISD::TRUNCATE, dl, MVT::i32, ArgVal);
          }
  
@@ -3146,6 +3300,7 @@ PPCTargetLowering::LowerFormalArguments_64SVR4(
      case MVT::v16i8:
      case MVT::v2f64:
      case MVT::v2i64:
+    case MVT::v1i128:
        if (!Subtarget.hasQPX()) {
        // These can be scalar arguments or elements of a vector array type
        // passed directly.  The latter are used to implement ELFv2 homogeneous
@@ -3246,7 +3401,7 @@ PPCTargetLowering::LowerFormalArguments_64SVR4(
                                     MachinePointerInfo(), false, false, 0);
        MemOps.push_back(Store);
        // Increment the address by PtrByteSize for the next argument to store
-      SDValue PtrOff = DAG.getConstant(PtrByteSize, PtrVT);
+      SDValue PtrOff = DAG.getConstant(PtrByteSize, dl, PtrVT);
        FIN = DAG.getNode(ISD::ADD, dl, PtrOff.getValueType(), FIN, PtrOff);
      }
    }
@@ -3271,7 +3426,7 @@ PPCTargetLowering::LowerFormalArguments_Darwin(
    MachineFrameInfo *MFI = MF.getFrameInfo();
    PPCFunctionInfo *FuncInfo = MF.getInfo<PPCFunctionInfo>();
  
-  EVT PtrVT = DAG.getTargetLoweringInfo().getPointerTy();
+  EVT PtrVT = DAG.getTargetLoweringInfo().getPointerTy(MF.getDataLayout());
    bool isPPC64 = PtrVT == MVT::i64;
    // Potential tail calls could cause overwriting of argument stack slots.
    bool isImmutable = !(getTargetMachine().Options.GuaranteedTailCallOpt &&
@@ -3290,9 +3445,6 @@ PPCTargetLowering::LowerFormalArguments_Darwin(
      PPC::X3, PPC::X4, PPC::X5, PPC::X6,
      PPC::X7, PPC::X8, PPC::X9, PPC::X10,
    };
-
-  static const MCPhysReg *FPR = GetFPR();
-
    static const MCPhysReg VR[] = {
      PPC::V2, PPC::V3, PPC::V4, PPC::V5, PPC::V6, PPC::V7, PPC::V8,
      PPC::V9, PPC::V10, PPC::V11, PPC::V12, PPC::V13
@@ -3615,7 +3767,7 @@ PPCTargetLowering::LowerFormalArguments_Darwin(
                                     MachinePointerInfo(), false, false, 0);
        MemOps.push_back(Store);
        // Increment the address by the pointer size for the next argument to store
-      SDValue PtrOff = DAG.getConstant(PtrVT.getSizeInBits()/8, PtrVT);
+      SDValue PtrOff = DAG.getConstant(PtrVT.getSizeInBits()/8, dl, PtrVT);
        FIN = DAG.getNode(ISD::ADD, dl, PtrOff.getValueType(), FIN, PtrOff);
      }
    }
@@ -3693,8 +3845,9 @@ static SDNode *isBLACompatibleAddress(SDValue Op, SelectionDAG &DAG) {
        SignExtend32<26>(Addr) != Addr)
      return nullptr;  // Top 6 bits have to be sext of immediate.
  
-  return DAG.getConstant((int)C->getZExtValue() >> 2,
-                         DAG.getTargetLoweringInfo().getPointerTy()).getNode();
+  return DAG.getConstant((int)C->getZExtValue() >> 2, SDLoc(Op),
+                         DAG.getTargetLoweringInfo().getPointerTy(
+                             DAG.getDataLayout())).getNode();
  }
  
  namespace {
@@ -3825,9 +3978,9 @@ static SDValue
  CreateCopyOfByValArgument(SDValue Src, SDValue Dst, SDValue Chain,
                            ISD::ArgFlagsTy Flags, SelectionDAG &DAG,
                            SDLoc dl) {
-  SDValue SizeNode = DAG.getConstant(Flags.getByValSize(), MVT::i32);
+  SDValue SizeNode = DAG.getConstant(Flags.getByValSize(), dl, MVT::i32);
    return DAG.getMemcpy(Chain, dl, Dst, Src, SizeNode, Flags.getByValAlign(),
-                       false, false, MachinePointerInfo(),
+                       false, false, false, MachinePointerInfo(),
                         MachinePointerInfo());
  }
  
@@ -3840,7 +3993,7 @@ LowerMemOpCallTo(SelectionDAG &DAG, MachineFunction &MF, SDValue Chain,
                   bool isVector, SmallVectorImpl<SDValue> &MemOpChains,
                   SmallVectorImpl<TailCallArgumentInfo> &TailCallArguments,
                   SDLoc dl) {
-  EVT PtrVT = DAG.getTargetLoweringInfo().getPointerTy();
+  EVT PtrVT = DAG.getTargetLoweringInfo().getPointerTy(DAG.getDataLayout());
    if (!isTailCall) {
      if (isVector) {
        SDValue StackPtr;
@@ -3849,7 +4002,7 @@ LowerMemOpCallTo(SelectionDAG &DAG, MachineFunction &MF, SDValue Chain,
        else
          StackPtr = DAG.getRegister(PPC::R1, MVT::i32);
        PtrOff = DAG.getNode(ISD::ADD, dl, PtrVT, StackPtr,
-                           DAG.getConstant(ArgOffset, PtrVT));
+                           DAG.getConstant(ArgOffset, dl, PtrVT));
      }
      MemOpChains.push_back(DAG.getStore(Chain, dl, Arg, PtrOff,
                                         MachinePointerInfo(), false, false, 0));
@@ -3880,8 +4033,8 @@ void PrepareTailCall(SelectionDAG &DAG, SDValue &InFlag, SDValue &Chain,
                                          isPPC64, isDarwinABI, dl);
  
    // Emit callseq_end just before tailcall node.
-  Chain = DAG.getCALLSEQ_END(Chain, DAG.getIntPtrConstant(NumBytes, true),
-                             DAG.getIntPtrConstant(0, true), InFlag, dl);
+  Chain = DAG.getCALLSEQ_END(Chain, DAG.getIntPtrConstant(NumBytes, dl, true),
+                             DAG.getIntPtrConstant(0, dl, true), InFlag, dl);
    InFlag = Chain.getValue(1);
  }
  
@@ -3911,7 +4064,7 @@ unsigned PrepareCall(SelectionDAG &DAG, SDValue &Callee, SDValue &InFlag,
    bool isSVR4ABI = Subtarget.isSVR4ABI();
    bool isELFv2ABI = Subtarget.isELFv2ABI();
  
-  EVT PtrVT = DAG.getTargetLoweringInfo().getPointerTy();
+  EVT PtrVT = DAG.getTargetLoweringInfo().getPointerTy(DAG.getDataLayout());
    NodeTys.push_back(MVT::Other);   // Returns a chain
    NodeTys.push_back(MVT::Glue);    // Returns a flag for retval copy to use.
  
@@ -3933,8 +4086,7 @@ unsigned PrepareCall(SelectionDAG &DAG, SDValue &Callee, SDValue &InFlag,
      if ((DAG.getTarget().getRelocationModel() != Reloc::Static &&
           (Subtarget.getTargetTriple().isMacOSX() &&
            Subtarget.getTargetTriple().isMacOSXVersionLT(10, 5)) &&
-         (G->getGlobal()->isDeclaration() ||
-          G->getGlobal()->isWeakForLinker())) ||
+         !G->getGlobal()->isStrongDefinitionForLinker()) ||
          (Subtarget.isTargetELF() && !isPPC64 &&
           !G->getGlobal()->hasLocalLinkage() &&
           DAG.getTarget().getRelocationModel() == Reloc::PIC_)) {
@@ -4027,13 +4179,13 @@ unsigned PrepareCall(SelectionDAG &DAG, SDValue &Callee, SDValue &InFlag,
                                          false, false, LoadsInv, 8);
  
        // Load environment pointer into r11.
-      SDValue PtrOff = DAG.getIntPtrConstant(16);
+      SDValue PtrOff = DAG.getIntPtrConstant(16, dl);
        SDValue AddPtr = DAG.getNode(ISD::ADD, dl, MVT::i64, Callee, PtrOff);
        SDValue LoadEnvPtr = DAG.getLoad(MVT::i64, dl, LDChain, AddPtr,
                                         MPI.getWithOffset(16), false, false,
                                         LoadsInv, 8);
  
-      SDValue TOCOff = DAG.getIntPtrConstant(8);
+      SDValue TOCOff = DAG.getIntPtrConstant(8, dl);
        SDValue AddTOC = DAG.getNode(ISD::ADD, dl, MVT::i64, Callee, TOCOff);
        SDValue TOCPtr = DAG.getLoad(MVT::i64, dl, LDChain, AddTOC,
                                     MPI.getWithOffset(8), false, false,
@@ -4081,7 +4233,7 @@ unsigned PrepareCall(SelectionDAG &DAG, SDValue &Callee, SDValue &InFlag,
    }
    // If this is a tail call add stack pointer delta.
    if (isTailCall)
-    Ops.push_back(DAG.getConstant(SPDiff, MVT::i32));
+    Ops.push_back(DAG.getConstant(SPDiff, dl, MVT::i32));
  
    // Add argument registers to the end of the list so that they are known live
    // into the call.
@@ -4103,8 +4255,7 @@ static
  bool isLocalCall(const SDValue &Callee)
  {
    if (GlobalAddressSDNode *G = dyn_cast<GlobalAddressSDNode>(Callee))
-    return !G->getGlobal()->isDeclaration() &&
-           !G->getGlobal()->isWeakForLinker();
+    return G->getGlobal()->isStrongDefinitionForLinker();
    return false;
  }
  
@@ -4186,7 +4337,8 @@ PPCTargetLowering::FinishCall(CallingConv::ID CallConv, SDLoc dl,
  
    // Add a register mask operand representing the call-preserved registers.
    const TargetRegisterInfo *TRI = Subtarget.getRegisterInfo();
-  const uint32_t *Mask = TRI->getCallPreservedMask(CallConv);
+  const uint32_t *Mask =
+      TRI->getCallPreservedMask(DAG.getMachineFunction(), CallConv);
    assert(Mask && "Missing call preserved mask for calling convention");
    Ops.push_back(DAG.getRegisterMask(Mask));
  
@@ -4202,6 +4354,7 @@ PPCTargetLowering::FinishCall(CallingConv::ID CallConv, SDLoc dl,
              isa<ConstantSDNode>(Callee)) &&
      "Expecting an global address, external symbol, absolute value or register");
  
+    DAG.getMachineFunction().getFrameInfo()->setHasTailCall();
      return DAG.getNode(PPCISD::TC_RETURN, dl, MVT::Other, Ops);
    }
  
@@ -4228,10 +4381,10 @@ PPCTargetLowering::FinishCall(CallingConv::ID CallConv, SDLoc dl,
        // allocated and an unnecessary move instruction being generated.
        CallOpc = PPCISD::BCTRL_LOAD_TOC;
  
-      EVT PtrVT = DAG.getTargetLoweringInfo().getPointerTy();
+      EVT PtrVT = DAG.getTargetLoweringInfo().getPointerTy(DAG.getDataLayout());
        SDValue StackPtr = DAG.getRegister(PPC::X1, PtrVT);
        unsigned TOCSaveOffset = Subtarget.getFrameLowering()->getTOCSaveOffset();
-      SDValue TOCOff = DAG.getIntPtrConstant(TOCSaveOffset);
+      SDValue TOCOff = DAG.getIntPtrConstant(TOCSaveOffset, dl);
        SDValue AddTOC = DAG.getNode(ISD::ADD, dl, MVT::i64, StackPtr, TOCOff);
  
        // The address needs to go after the chain input but before the flag (or
@@ -4247,8 +4400,8 @@ PPCTargetLowering::FinishCall(CallingConv::ID CallConv, SDLoc dl,
    Chain = DAG.getNode(CallOpc, dl, NodeTys, Ops);
    InFlag = Chain.getValue(1);
  
-  Chain = DAG.getCALLSEQ_END(Chain, DAG.getIntPtrConstant(NumBytes, true),
-                             DAG.getIntPtrConstant(BytesCalleePops, true),
+  Chain = DAG.getCALLSEQ_END(Chain, DAG.getIntPtrConstant(NumBytes, dl, true),
+                             DAG.getIntPtrConstant(BytesCalleePops, dl, true),
                               InFlag, dl);
    if (!Ins.empty())
      InFlag = Chain.getValue(1);
@@ -4392,7 +4545,7 @@ PPCTargetLowering::LowerCall_32SVR4(SDValue Chain, SDValue Callee,
  
    // Adjust the stack pointer for the new arguments...
    // These operations are automatically eliminated by the prolog/epilog pass
-  Chain = DAG.getCALLSEQ_START(Chain, DAG.getIntPtrConstant(NumBytes, true),
+  Chain = DAG.getCALLSEQ_START(Chain, DAG.getIntPtrConstant(NumBytes, dl, true),
                                 dl);
    SDValue CallSeqStart = Chain;
  
@@ -4432,8 +4585,9 @@ PPCTargetLowering::LowerCall_32SVR4(SDValue Chain, SDValue Callee,
        // Memory reserved in the local variable space of the callers stack frame.
        unsigned LocMemOffset = ByValVA.getLocMemOffset();
  
-      SDValue PtrOff = DAG.getIntPtrConstant(LocMemOffset);
-      PtrOff = DAG.getNode(ISD::ADD, dl, getPointerTy(), StackPtr, PtrOff);
+      SDValue PtrOff = DAG.getIntPtrConstant(LocMemOffset, dl);
+      PtrOff = DAG.getNode(ISD::ADD, dl, getPointerTy(MF.getDataLayout()),
+                           StackPtr, PtrOff);
  
        // Create a copy of the argument in the local area of the current
        // stack frame.
@@ -4469,8 +4623,9 @@ PPCTargetLowering::LowerCall_32SVR4(SDValue Chain, SDValue Callee,
        unsigned LocMemOffset = VA.getLocMemOffset();
  
        if (!isTailCall) {
-        SDValue PtrOff = DAG.getIntPtrConstant(LocMemOffset);
-        PtrOff = DAG.getNode(ISD::ADD, dl, getPointerTy(), StackPtr, PtrOff);
+        SDValue PtrOff = DAG.getIntPtrConstant(LocMemOffset, dl);
+        PtrOff = DAG.getNode(ISD::ADD, dl, getPointerTy(MF.getDataLayout()),
+                             StackPtr, PtrOff);
  
          MemOpChains.push_back(DAG.getStore(Chain, dl, Arg, PtrOff,
                                             MachinePointerInfo(),
@@ -4551,7 +4706,7 @@ PPCTargetLowering::LowerCall_64SVR4(SDValue Chain, SDValue Callee,
    bool isLittleEndian = Subtarget.isLittleEndian();
    unsigned NumOps = Outs.size();
  
-  EVT PtrVT = DAG.getTargetLoweringInfo().getPointerTy();
+  EVT PtrVT = DAG.getTargetLoweringInfo().getPointerTy(DAG.getDataLayout());
    unsigned PtrByteSize = 8;
  
    MachineFunction &MF = DAG.getMachineFunction();
@@ -4581,8 +4736,6 @@ PPCTargetLowering::LowerCall_64SVR4(SDValue Chain, SDValue Callee,
      PPC::X3, PPC::X4, PPC::X5, PPC::X6,
      PPC::X7, PPC::X8, PPC::X9, PPC::X10,
    };
-  static const MCPhysReg *FPR = GetFPR();
-
    static const MCPhysReg VR[] = {
      PPC::V2, PPC::V3, PPC::V4, PPC::V5, PPC::V6, PPC::V7, PPC::V8,
      PPC::V9, PPC::V10, PPC::V11, PPC::V12, PPC::V13
@@ -4592,8 +4745,6 @@ PPCTargetLowering::LowerCall_64SVR4(SDValue Chain, SDValue Callee,
      PPC::VSH9, PPC::VSH10, PPC::VSH11, PPC::VSH12, PPC::VSH13
    };
  
-  static const MCPhysReg *QFPR = GetQFPR();
-
    const unsigned NumGPRs = array_lengthof(GPR);
    const unsigned NumFPRs = 13;
    const unsigned NumVRs  = array_lengthof(VR);
@@ -4626,6 +4777,7 @@ PPCTargetLowering::LowerCall_64SVR4(SDValue Chain, SDValue Callee,
          case MVT::v16i8:
          case MVT::v2f64:
          case MVT::v2i64:
+        case MVT::v1i128:
            if (++NumVRsUsed <= NumVRs)
              continue;
            break;
@@ -4686,7 +4838,7 @@ PPCTargetLowering::LowerCall_64SVR4(SDValue Chain, SDValue Callee,
  
    // Adjust the stack pointer for the new arguments...
    // These operations are automatically eliminated by the prolog/epilog pass
-  Chain = DAG.getCALLSEQ_START(Chain, DAG.getIntPtrConstant(NumBytes, true),
+  Chain = DAG.getCALLSEQ_START(Chain, DAG.getIntPtrConstant(NumBytes, dl, true),
                                 dl);
    SDValue CallSeqStart = Chain;
  
@@ -4730,7 +4882,7 @@ PPCTargetLowering::LowerCall_64SVR4(SDValue Chain, SDValue Callee,
          CalculateStackSlotAlignment(ArgVT, OrigVT, Flags, PtrByteSize);
        ArgOffset = ((ArgOffset + Align - 1) / Align) * Align;
  
-      PtrOff = DAG.getConstant(ArgOffset, StackPtr.getValueType());
+      PtrOff = DAG.getConstant(ArgOffset, dl, StackPtr.getValueType());
  
        PtrOff = DAG.getNode(ISD::ADD, dl, PtrVT, StackPtr, PtrOff);
      };
@@ -4787,7 +4939,7 @@ PPCTargetLowering::LowerCall_64SVR4(SDValue Chain, SDValue Callee,
        if (GPR_idx == NumGPRs && Size < 8) {
          SDValue AddPtr = PtrOff;
          if (!isLittleEndian) {
-          SDValue Const = DAG.getConstant(PtrByteSize - Size,
+          SDValue Const = DAG.getConstant(PtrByteSize - Size, dl,
                                            PtrOff.getValueType());
            AddPtr = DAG.getNode(ISD::ADD, dl, PtrVT, PtrOff, Const);
          }
@@ -4827,7 +4979,7 @@ PPCTargetLowering::LowerCall_64SVR4(SDValue Chain, SDValue Callee,
          // parameter save area instead of a new local variable.
          SDValue AddPtr = PtrOff;
          if (!isLittleEndian) {
-          SDValue Const = DAG.getConstant(8 - Size, PtrOff.getValueType());
+          SDValue Const = DAG.getConstant(8 - Size, dl, PtrOff.getValueType());
            AddPtr = DAG.getNode(ISD::ADD, dl, PtrVT, PtrOff, Const);
          }
          Chain = CallSeqStart = createMemcpyOutsideCallSeq(Arg, AddPtr,
@@ -4849,7 +5001,7 @@ PPCTargetLowering::LowerCall_64SVR4(SDValue Chain, SDValue Callee,
        // For aggregates larger than PtrByteSize, copy the pieces of the
        // object that fit into registers from the parameter save area.
        for (unsigned j=0; j<Size; j+=PtrByteSize) {
-        SDValue Const = DAG.getConstant(j, PtrOff.getValueType());
+        SDValue Const = DAG.getConstant(j, dl, PtrOff.getValueType());
          SDValue AddArg = DAG.getNode(ISD::ADD, dl, PtrVT, Arg, Const);
          if (GPR_idx != NumGPRs) {
            SDValue Load = DAG.getLoad(PtrVT, dl, Chain, AddArg,
@@ -4944,7 +5096,7 @@ PPCTargetLowering::LowerCall_64SVR4(SDValue Chain, SDValue Callee,
            ArgVal = DAG.getNode(ISD::ANY_EXTEND, dl, MVT::i64, ArgVal);
            if (!isLittleEndian)
              ArgVal = DAG.getNode(ISD::SHL, dl, MVT::i64, ArgVal,
-                                 DAG.getConstant(32, MVT::i32));
+                                 DAG.getConstant(32, dl, MVT::i32));
  
          // Non-final even elements are skipped; they will be handled
          // together with the subsequent argument on the next go-around.
@@ -4961,7 +5113,7 @@ PPCTargetLowering::LowerCall_64SVR4(SDValue Chain, SDValue Callee,
          // second (rightmost) word of the stack doubleword.
          if (Arg.getValueType() == MVT::f32 &&
              !isLittleEndian && !Flags.isInConsecutiveRegs()) {
-          SDValue ConstFour = DAG.getConstant(4, PtrOff.getValueType());
+          SDValue ConstFour = DAG.getConstant(4, dl, PtrOff.getValueType());
            PtrOff = DAG.getNode(ISD::ADD, dl, PtrVT, PtrOff, ConstFour);
          }
  
@@ -4988,6 +5140,7 @@ PPCTargetLowering::LowerCall_64SVR4(SDValue Chain, SDValue Callee,
      case MVT::v16i8:
      case MVT::v2f64:
      case MVT::v2i64:
+    case MVT::v1i128:
        if (!Subtarget.hasQPX()) {
        // These can be scalar arguments or elements of a vector array type
        // passed directly.  The latter are used to implement ELFv2 homogeneous
@@ -5021,7 +5174,7 @@ PPCTargetLowering::LowerCall_64SVR4(SDValue Chain, SDValue Callee,
            if (GPR_idx == NumGPRs)
              break;
            SDValue Ix = DAG.getNode(ISD::ADD, dl, PtrVT, PtrOff,
-                                  DAG.getConstant(i, PtrVT));
+                                   DAG.getConstant(i, dl, PtrVT));
            SDValue Load = DAG.getLoad(PtrVT, dl, Store, Ix, MachinePointerInfo(),
                                       false, false, false, 0);
            MemOpChains.push_back(Load.getValue(1));
@@ -5075,11 +5228,11 @@ PPCTargetLowering::LowerCall_64SVR4(SDValue Chain, SDValue Callee,
            RegsToPass.push_back(std::make_pair(QFPR[QFPR_idx++], Load));
          }
          ArgOffset += (IsF32 ? 16 : 32);
-        for (unsigned i=0; i<(IsF32 ? 16 : 32); i+=PtrByteSize) {
+        for (unsigned i = 0; i < (IsF32 ? 16U : 32U); i += PtrByteSize) {
            if (GPR_idx == NumGPRs)
              break;
            SDValue Ix = DAG.getNode(ISD::ADD, dl, PtrVT, PtrOff,
-                                  DAG.getConstant(i, PtrVT));
+                                   DAG.getConstant(i, dl, PtrVT));
            SDValue Load = DAG.getLoad(PtrVT, dl, Store, Ix, MachinePointerInfo(),
                                       false, false, false, 0);
            MemOpChains.push_back(Load.getValue(1));
@@ -5126,7 +5279,7 @@ PPCTargetLowering::LowerCall_64SVR4(SDValue Chain, SDValue Callee,
      SDValue Val = DAG.getCopyFromReg(Chain, dl, PPC::X2, MVT::i64);
      // TOC save area offset.
      unsigned TOCSaveOffset = Subtarget.getFrameLowering()->getTOCSaveOffset();
-    SDValue PtrOff = DAG.getIntPtrConstant(TOCSaveOffset);
+    SDValue PtrOff = DAG.getIntPtrConstant(TOCSaveOffset, dl);
      SDValue AddPtr = DAG.getNode(ISD::ADD, dl, PtrVT, StackPtr, PtrOff);
      Chain = DAG.getStore(Val.getValue(1), dl, Val, AddPtr,
                           MachinePointerInfo::getStack(TOCSaveOffset),
@@ -5169,7 +5322,7 @@ PPCTargetLowering::LowerCall_Darwin(SDValue Chain, SDValue Callee,
  
    unsigned NumOps = Outs.size();
  
-  EVT PtrVT = DAG.getTargetLoweringInfo().getPointerTy();
+  EVT PtrVT = DAG.getTargetLoweringInfo().getPointerTy(DAG.getDataLayout());
    bool isPPC64 = PtrVT == MVT::i64;
    unsigned PtrByteSize = isPPC64 ? 8 : 4;
  
@@ -5245,7 +5398,7 @@ PPCTargetLowering::LowerCall_Darwin(SDValue Chain, SDValue Callee,
  
    // Adjust the stack pointer for the new arguments...
    // These operations are automatically eliminated by the prolog/epilog pass
-  Chain = DAG.getCALLSEQ_START(Chain, DAG.getIntPtrConstant(NumBytes, true),
+  Chain = DAG.getCALLSEQ_START(Chain, DAG.getIntPtrConstant(NumBytes, dl, true),
                                 dl);
    SDValue CallSeqStart = Chain;
  
@@ -5279,8 +5432,6 @@ PPCTargetLowering::LowerCall_Darwin(SDValue Chain, SDValue Callee,
      PPC::X3, PPC::X4, PPC::X5, PPC::X6,
      PPC::X7, PPC::X8, PPC::X9, PPC::X10,
    };
-  static const MCPhysReg *FPR = GetFPR();
-
    static const MCPhysReg VR[] = {
      PPC::V2, PPC::V3, PPC::V4, PPC::V5, PPC::V6, PPC::V7, PPC::V8,
      PPC::V9, PPC::V10, PPC::V11, PPC::V12, PPC::V13
@@ -5303,7 +5454,7 @@ PPCTargetLowering::LowerCall_Darwin(SDValue Chain, SDValue Callee,
      // register cannot be found for it.
      SDValue PtrOff;
  
-    PtrOff = DAG.getConstant(ArgOffset, StackPtr.getValueType());
+    PtrOff = DAG.getConstant(ArgOffset, dl, StackPtr.getValueType());
  
      PtrOff = DAG.getNode(ISD::ADD, dl, PtrVT, StackPtr, PtrOff);
  
@@ -5332,7 +5483,7 @@ PPCTargetLowering::LowerCall_Darwin(SDValue Chain, SDValue Callee,
  
            ArgOffset += PtrByteSize;
          } else {
-          SDValue Const = DAG.getConstant(PtrByteSize - Size,
+          SDValue Const = DAG.getConstant(PtrByteSize - Size, dl,
                                            PtrOff.getValueType());
            SDValue AddPtr = DAG.getNode(ISD::ADD, dl, PtrVT, PtrOff, Const);
            Chain = CallSeqStart = createMemcpyOutsideCallSeq(Arg, AddPtr,
@@ -5353,7 +5504,7 @@ PPCTargetLowering::LowerCall_Darwin(SDValue Chain, SDValue Callee,
        // copy the pieces of the object that fit into registers from the
        // parameter save area.
        for (unsigned j=0; j<Size; j+=PtrByteSize) {
-        SDValue Const = DAG.getConstant(j, PtrOff.getValueType());
+        SDValue Const = DAG.getConstant(j, dl, PtrOff.getValueType());
          SDValue AddArg = DAG.getNode(ISD::ADD, dl, PtrVT, Arg, Const);
          if (GPR_idx != NumGPRs) {
            SDValue Load = DAG.getLoad(PtrVT, dl, Chain, AddArg,
@@ -5406,7 +5557,7 @@ PPCTargetLowering::LowerCall_Darwin(SDValue Chain, SDValue Callee,
              RegsToPass.push_back(std::make_pair(GPR[GPR_idx++], Load));
            }
            if (GPR_idx != NumGPRs && Arg.getValueType() == MVT::f64 && !isPPC64){
-            SDValue ConstFour = DAG.getConstant(4, PtrOff.getValueType());
+            SDValue ConstFour = DAG.getConstant(4, dl, PtrOff.getValueType());
              PtrOff = DAG.getNode(ISD::ADD, dl, PtrVT, PtrOff, ConstFour);
              SDValue Load = DAG.getLoad(PtrVT, dl, Store, PtrOff,
                                         MachinePointerInfo(),
@@ -5451,7 +5602,7 @@ PPCTargetLowering::LowerCall_Darwin(SDValue Chain, SDValue Callee,
          // We could elide this store in the case where the object fits
          // entirely in R registers.  Maybe later.
          PtrOff = DAG.getNode(ISD::ADD, dl, PtrVT, StackPtr,
-                            DAG.getConstant(ArgOffset, PtrVT));
+                             DAG.getConstant(ArgOffset, dl, PtrVT));
          SDValue Store = DAG.getStore(Chain, dl, Arg, PtrOff,
                                       MachinePointerInfo(), false, false, 0);
          MemOpChains.push_back(Store);
@@ -5467,7 +5618,7 @@ PPCTargetLowering::LowerCall_Darwin(SDValue Chain, SDValue Callee,
            if (GPR_idx == NumGPRs)
              break;
            SDValue Ix = DAG.getNode(ISD::ADD, dl, PtrVT, PtrOff,
-                                  DAG.getConstant(i, PtrVT));
+                                   DAG.getConstant(i, dl, PtrVT));
            SDValue Load = DAG.getLoad(PtrVT, dl, Store, Ix, MachinePointerInfo(),
                                       false, false, false, 0);
            MemOpChains.push_back(Load.getValue(1));
@@ -5615,7 +5766,7 @@ SDValue PPCTargetLowering::LowerSTACKRESTORE(SDValue Op, SelectionDAG &DAG,
    SDLoc dl(Op);
  
    // Get the corect type for pointers.
-  EVT PtrVT = DAG.getTargetLoweringInfo().getPointerTy();
+  EVT PtrVT = DAG.getTargetLoweringInfo().getPointerTy(DAG.getDataLayout());
  
    // Construct the stack pointer operand.
    bool isPPC64 = Subtarget.isPPC64();
@@ -5645,7 +5796,7 @@ SDValue
  PPCTargetLowering::getReturnAddrFrameIndex(SelectionDAG & DAG) const {
    MachineFunction &MF = DAG.getMachineFunction();
    bool isPPC64 = Subtarget.isPPC64();
-  EVT PtrVT = DAG.getTargetLoweringInfo().getPointerTy();
+  EVT PtrVT = DAG.getTargetLoweringInfo().getPointerTy(MF.getDataLayout());
  
    // Get current frame pointer save index.  The users of this index will be
    // primarily DYNALLOC instructions.
@@ -5668,7 +5819,7 @@ SDValue
  PPCTargetLowering::getFramePointerFrameIndex(SelectionDAG & DAG) const {
    MachineFunction &MF = DAG.getMachineFunction();
    bool isPPC64 = Subtarget.isPPC64();
-  EVT PtrVT = DAG.getTargetLoweringInfo().getPointerTy();
+  EVT PtrVT = DAG.getTargetLoweringInfo().getPointerTy(MF.getDataLayout());
  
    // Get current frame pointer save index.  The users of this index will be
    // primarily DYNALLOC instructions.
@@ -5696,10 +5847,10 @@ SDValue PPCTargetLowering::LowerDYNAMIC_STACKALLOC(SDValue Op,
    SDLoc dl(Op);
  
    // Get the corect type for pointers.
-  EVT PtrVT = DAG.getTargetLoweringInfo().getPointerTy();
+  EVT PtrVT = DAG.getTargetLoweringInfo().getPointerTy(DAG.getDataLayout());
    // Negate the size.
    SDValue NegSize = DAG.getNode(ISD::SUB, dl, PtrVT,
-                                  DAG.getConstant(0, PtrVT), Size);
+                                DAG.getConstant(0, dl, PtrVT), Size);
    // Construct a node for the frame pointer save index.
    SDValue FPSIdx = getFramePointerFrameIndex(DAG);
    // Build a DYNALLOC node.
@@ -5739,8 +5890,9 @@ SDValue PPCTargetLowering::LowerLOAD(SDValue Op, SelectionDAG &DAG) const {
    SDValue BasePtr = LD->getBasePtr();
    MachineMemOperand *MMO = LD->getMemOperand();
  
-  SDValue NewLD = DAG.getExtLoad(ISD::EXTLOAD, dl, getPointerTy(), Chain,
-                                 BasePtr, MVT::i8, MMO);
+  SDValue NewLD =
+      DAG.getExtLoad(ISD::EXTLOAD, dl, getPointerTy(DAG.getDataLayout()), Chain,
+                     BasePtr, MVT::i8, MMO);
    SDValue Result = DAG.getNode(ISD::TRUNCATE, dl, MVT::i1, NewLD);
  
    SDValue Ops[] = { Result, SDValue(NewLD.getNode(), 1) };
@@ -5764,7 +5916,8 @@ SDValue PPCTargetLowering::LowerSTORE(SDValue Op, SelectionDAG &DAG) const {
    SDValue Value = ST->getValue();
    MachineMemOperand *MMO = ST->getMemOperand();
  
-  Value = DAG.getNode(ISD::ZERO_EXTEND, dl, getPointerTy(), Value);
+  Value = DAG.getNode(ISD::ZERO_EXTEND, dl, getPointerTy(DAG.getDataLayout()),
+                      Value);
    return DAG.getTruncStore(Chain, dl, Value, BasePtr, MVT::i8, MMO);
  }
  
@@ -5929,7 +6082,7 @@ void PPCTargetLowering::LowerFP_TO_INTForReuse(SDValue Op, ReuseLoadInfo &RLI,
    // add in a bias.
    if (Op.getValueType() == MVT::i32 && !i32Stack) {
      FIPtr = DAG.getNode(ISD::ADD, dl, FIPtr.getValueType(), FIPtr,
-                        DAG.getConstant(4, FIPtr.getValueType()));
+                        DAG.getConstant(4, dl, FIPtr.getValueType()));
      MPI = MPI.getWithOffset(4);
    }
  
@@ -5938,8 +6091,46 @@ void PPCTargetLowering::LowerFP_TO_INTForReuse(SDValue Op, ReuseLoadInfo &RLI,
    RLI.MPI = MPI;
  }
  
+/// \brief Custom lowers floating point to integer conversions (i32 or i64
+/// results) to use the direct move instructions available in ISA 2.07,
+/// avoiding the need for load/store combinations.
+SDValue PPCTargetLowering::LowerFP_TO_INTDirectMove(SDValue Op,
+                                                    SelectionDAG &DAG,
+                                                    SDLoc dl) const {
+  assert(Op.getOperand(0).getValueType().isFloatingPoint());
+  SDValue Src = Op.getOperand(0);
+
+  if (Src.getValueType() == MVT::f32)
+    Src = DAG.getNode(ISD::FP_EXTEND, dl, MVT::f64, Src); // widen f32 to f64
+
+  SDValue Tmp; // FCTI* value first, then the MFVSR result
+  switch (Op.getSimpleValueType().SimpleTy) {
+  default: llvm_unreachable("Unhandled FP_TO_INT type in custom expander!");
+  case MVT::i32:
+    Tmp = DAG.getNode(
+        Op.getOpcode() == ISD::FP_TO_SINT
+            ? PPCISD::FCTIWZ // signed conversion
+            : (Subtarget.hasFPCVT() ? PPCISD::FCTIWUZ : PPCISD::FCTIDZ),
+        dl, MVT::f64, Src);
+    Tmp = DAG.getNode(PPCISD::MFVSR, dl, MVT::i32, Tmp); // f64 node -> i32
+    break;
+  case MVT::i64:
+    assert((Op.getOpcode() == ISD::FP_TO_SINT || Subtarget.hasFPCVT()) &&
+           "i64 FP_TO_UINT is supported only with FPCVT");
+    Tmp = DAG.getNode(Op.getOpcode()==ISD::FP_TO_SINT ? PPCISD::FCTIDZ :
+                                                        PPCISD::FCTIDUZ,
+                      dl, MVT::f64, Src);
+    Tmp = DAG.getNode(PPCISD::MFVSR, dl, MVT::i64, Tmp); // f64 node -> i64
+    break;
+  }
+  return Tmp;
+}
+
  SDValue PPCTargetLowering::LowerFP_TO_INT(SDValue Op, SelectionDAG &DAG,
                                            SDLoc dl) const {
+  if (Subtarget.hasDirectMove() && Subtarget.isPPC64())
+    return LowerFP_TO_INTDirectMove(Op, DAG, dl);
+
    ReuseLoadInfo RLI;
    LowerFP_TO_INTForReuse(Op, RLI, DAG, dl);
  
@@ -6017,6 +6208,38 @@ void PPCTargetLowering::spliceIntoChain(SDValue ResChain,
    DAG.UpdateNodeOperands(TF.getNode(), ResChain, NewResChain);
  }
  
+/// \brief Custom lowers integer to floating point conversions (f32 or f64
+/// results) to use the direct move instructions available in ISA 2.07,
+/// avoiding the need for load/store combinations.  Requires FPCVT.
+SDValue PPCTargetLowering::LowerINT_TO_FPDirectMove(SDValue Op,
+                                                    SelectionDAG &DAG,
+                                                    SDLoc dl) const {
+  assert((Op.getValueType() == MVT::f32 ||
+          Op.getValueType() == MVT::f64) &&
+         "Invalid floating point type as target of conversion");
+  assert(Subtarget.hasFPCVT() &&
+         "Int to FP conversions with direct moves require FPCVT");
+  SDValue FP;
+  SDValue Src = Op.getOperand(0);
+  bool SinglePrec = Op.getValueType() == MVT::f32; // f32 result
+  bool WordInt = Src.getSimpleValueType().SimpleTy == MVT::i32; // i32 source
+  bool Signed = Op.getOpcode() == ISD::SINT_TO_FP;
+  unsigned ConvOp = Signed ? (SinglePrec ? PPCISD::FCFIDS : PPCISD::FCFID) :
+                             (SinglePrec ? PPCISD::FCFIDUS : PPCISD::FCFIDU);
+
+  if (WordInt) { // MTVSRA when signed, MTVSRZ when unsigned
+    FP = DAG.getNode(Signed ? PPCISD::MTVSRA : PPCISD::MTVSRZ,
+                     dl, MVT::f64, Src);
+    FP = DAG.getNode(ConvOp, dl, SinglePrec ? MVT::f32 : MVT::f64, FP);
+  }
+  else { // non-i32 source: always MTVSRA; ConvOp carries signedness
+    FP = DAG.getNode(PPCISD::MTVSRA, dl, MVT::f64, Src);
+    FP = DAG.getNode(ConvOp, dl, SinglePrec ? MVT::f32 : MVT::f64, FP);
+  }
+
+  return FP;
+}
+
  SDValue PPCTargetLowering::LowerINT_TO_FP(SDValue Op,
                                            SelectionDAG &DAG) const {
    SDLoc dl(Op);
@@ -6031,7 +6254,7 @@ SDValue PPCTargetLowering::LowerINT_TO_FP(SDValue Op,
      // This can be done with an fma and the 0.5 constant: (V+1.0)*0.5 = 0.5*V+0.5
      Value = DAG.getNode(PPCISD::QBFLT, dl, MVT::v4f64, Value);
    
-    SDValue FPHalfs = DAG.getConstantFP(0.5, MVT::f64);
+    SDValue FPHalfs = DAG.getConstantFP(0.5, dl, MVT::f64);
      FPHalfs = DAG.getNode(ISD::BUILD_VECTOR, dl, MVT::v4f64,
                            FPHalfs, FPHalfs, FPHalfs, FPHalfs);
    
@@ -6039,7 +6262,8 @@ SDValue PPCTargetLowering::LowerINT_TO_FP(SDValue Op,
  
      if (Op.getValueType() != MVT::v4f64)
        Value = DAG.getNode(ISD::FP_ROUND, dl,
-                          Op.getValueType(), Value, DAG.getIntPtrConstant(1));
+                          Op.getValueType(), Value,
+                          DAG.getIntPtrConstant(1, dl));
      return Value;
    }
  
@@ -6049,8 +6273,13 @@ SDValue PPCTargetLowering::LowerINT_TO_FP(SDValue Op,
  
    if (Op.getOperand(0).getValueType() == MVT::i1)
      return DAG.getNode(ISD::SELECT, dl, Op.getValueType(), Op.getOperand(0),
-                       DAG.getConstantFP(1.0, Op.getValueType()),
-                       DAG.getConstantFP(0.0, Op.getValueType()));
+                       DAG.getConstantFP(1.0, dl, Op.getValueType()),
+                       DAG.getConstantFP(0.0, dl, Op.getValueType()));
+
+  // If we have direct moves, we can do all the conversion, skip the store/load
+  // however, without FPCVT we can't do most conversions.
+  if (Subtarget.hasDirectMove() && Subtarget.isPPC64() && Subtarget.hasFPCVT())
+    return LowerINT_TO_FPDirectMove(Op, DAG, dl);
  
    assert((Op.getOpcode() == ISD::SINT_TO_FP || Subtarget.hasFPCVT()) &&
           "UINT_TO_FP is supported only with FPCVT");
@@ -6089,12 +6318,12 @@ SDValue PPCTargetLowering::LowerINT_TO_FP(SDValue Op,
        // bit 12 (value 2048) is set instead, so that the final rounding
        // to single-precision gets the correct result.
        SDValue Round = DAG.getNode(ISD::AND, dl, MVT::i64,
-                                  SINT, DAG.getConstant(2047, MVT::i64));
+                                  SINT, DAG.getConstant(2047, dl, MVT::i64));
        Round = DAG.getNode(ISD::ADD, dl, MVT::i64,
-                          Round, DAG.getConstant(2047, MVT::i64));
+                          Round, DAG.getConstant(2047, dl, MVT::i64));
        Round = DAG.getNode(ISD::OR, dl, MVT::i64, Round, SINT);
        Round = DAG.getNode(ISD::AND, dl, MVT::i64,
-                          Round, DAG.getConstant(-2048, MVT::i64));
+                          Round, DAG.getConstant(-2048, dl, MVT::i64));
  
        // However, we cannot use that value unconditionally: if the magnitude
        // of the input value is small, the bit-twiddling we did above might
@@ -6105,11 +6334,11 @@ SDValue PPCTargetLowering::LowerINT_TO_FP(SDValue Op,
        // bits are all sign-bit copies, and use the rounded value computed
        // above otherwise.
        SDValue Cond = DAG.getNode(ISD::SRA, dl, MVT::i64,
-                                 SINT, DAG.getConstant(53, MVT::i32));
+                                 SINT, DAG.getConstant(53, dl, MVT::i32));
        Cond = DAG.getNode(ISD::ADD, dl, MVT::i64,
-                         Cond, DAG.getConstant(1, MVT::i64));
+                         Cond, DAG.getConstant(1, dl, MVT::i64));
        Cond = DAG.getSetCC(dl, MVT::i32,
-                          Cond, DAG.getConstant(1, MVT::i64), ISD::SETUGT);
+                          Cond, DAG.getConstant(1, dl, MVT::i64), ISD::SETUGT);
  
        SINT = DAG.getNode(ISD::SELECT, dl, MVT::i64, Cond, Round, SINT);
      }
@@ -6149,7 +6378,7 @@ SDValue PPCTargetLowering::LowerINT_TO_FP(SDValue Op,
                   SINT.getOpcode() == ISD::ZERO_EXTEND)) &&
                 SINT.getOperand(0).getValueType() == MVT::i32) {
        MachineFrameInfo *FrameInfo = MF.getFrameInfo();
-      EVT PtrVT = DAG.getTargetLoweringInfo().getPointerTy();
+      EVT PtrVT = DAG.getTargetLoweringInfo().getPointerTy(DAG.getDataLayout());
  
        int FrameIdx = FrameInfo->CreateStackObject(4, 4, false);
        SDValue FIdx = DAG.getFrameIndex(FrameIdx, PtrVT);
@@ -6182,7 +6411,7 @@ SDValue PPCTargetLowering::LowerINT_TO_FP(SDValue Op,
  
      if (Op.getValueType() == MVT::f32 && !Subtarget.hasFPCVT())
        FP = DAG.getNode(ISD::FP_ROUND, dl,
-                       MVT::f32, FP, DAG.getIntPtrConstant(0));
+                       MVT::f32, FP, DAG.getIntPtrConstant(0, dl));
      return FP;
    }
  
@@ -6194,7 +6423,7 @@ SDValue PPCTargetLowering::LowerINT_TO_FP(SDValue Op,
    // then lfd it and fcfid it.
    MachineFunction &MF = DAG.getMachineFunction();
    MachineFrameInfo *FrameInfo = MF.getFrameInfo();
-  EVT PtrVT = DAG.getTargetLoweringInfo().getPointerTy();
+  EVT PtrVT = DAG.getTargetLoweringInfo().getPointerTy(MF.getDataLayout());
  
    SDValue Ld;
    if (Subtarget.hasLFIWAX() || Subtarget.hasFPCVT()) {
@@ -6252,7 +6481,8 @@ SDValue PPCTargetLowering::LowerINT_TO_FP(SDValue Op,
    // FCFID it and return it.
    SDValue FP = DAG.getNode(FCFOp, dl, FCFTy, Ld);
    if (Op.getValueType() == MVT::f32 && !Subtarget.hasFPCVT())
-    FP = DAG.getNode(ISD::FP_ROUND, dl, MVT::f32, FP, DAG.getIntPtrConstant(0));
+    FP = DAG.getNode(ISD::FP_ROUND, dl, MVT::f32, FP,
+                     DAG.getIntPtrConstant(0, dl));
    return FP;
  }
  
@@ -6280,7 +6510,7 @@ SDValue PPCTargetLowering::LowerFLT_ROUNDS_(SDValue Op,
  
    MachineFunction &MF = DAG.getMachineFunction();
    EVT VT = Op.getValueType();
-  EVT PtrVT = DAG.getTargetLoweringInfo().getPointerTy();
+  EVT PtrVT = DAG.getTargetLoweringInfo().getPointerTy(MF.getDataLayout());
  
    // Save FP Control Word to register
    EVT NodeTys[] = {
@@ -6296,7 +6526,7 @@ SDValue PPCTargetLowering::LowerFLT_ROUNDS_(SDValue Op,
                                 StackSlot, MachinePointerInfo(), false, false,0);
  
    // Load FP Control Word from low 32 bits of stack slot.
-  SDValue Four = DAG.getConstant(4, PtrVT);
+  SDValue Four = DAG.getConstant(4, dl, PtrVT);
    SDValue Addr = DAG.getNode(ISD::ADD, dl, PtrVT, StackSlot, Four);
    SDValue CWD = DAG.getLoad(MVT::i32, dl, Store, Addr, MachinePointerInfo(),
                              false, false, false, 0);
@@ -6304,14 +6534,14 @@ SDValue PPCTargetLowering::LowerFLT_ROUNDS_(SDValue Op,
    // Transform as necessary
    SDValue CWD1 =
      DAG.getNode(ISD::AND, dl, MVT::i32,
-                CWD, DAG.getConstant(3, MVT::i32));
+                CWD, DAG.getConstant(3, dl, MVT::i32));
    SDValue CWD2 =
      DAG.getNode(ISD::SRL, dl, MVT::i32,
                  DAG.getNode(ISD::AND, dl, MVT::i32,
                              DAG.getNode(ISD::XOR, dl, MVT::i32,
-                                        CWD, DAG.getConstant(3, MVT::i32)),
-                            DAG.getConstant(3, MVT::i32)),
-                DAG.getConstant(1, MVT::i32));
+                                        CWD, DAG.getConstant(3, dl, MVT::i32)),
+                            DAG.getConstant(3, dl, MVT::i32)),
+                DAG.getConstant(1, dl, MVT::i32));
  
    SDValue RetVal =
      DAG.getNode(ISD::XOR, dl, MVT::i32, CWD1, CWD2);
@@ -6336,12 +6566,12 @@ SDValue PPCTargetLowering::LowerSHL_PARTS(SDValue Op, SelectionDAG &DAG) const {
    EVT AmtVT = Amt.getValueType();
  
    SDValue Tmp1 = DAG.getNode(ISD::SUB, dl, AmtVT,
-                             DAG.getConstant(BitWidth, AmtVT), Amt);
+                             DAG.getConstant(BitWidth, dl, AmtVT), Amt);
    SDValue Tmp2 = DAG.getNode(PPCISD::SHL, dl, VT, Hi, Amt);
    SDValue Tmp3 = DAG.getNode(PPCISD::SRL, dl, VT, Lo, Tmp1);
    SDValue Tmp4 = DAG.getNode(ISD::OR , dl, VT, Tmp2, Tmp3);
    SDValue Tmp5 = DAG.getNode(ISD::ADD, dl, AmtVT, Amt,
-                             DAG.getConstant(-BitWidth, AmtVT));
+                             DAG.getConstant(-BitWidth, dl, AmtVT));
    SDValue Tmp6 = DAG.getNode(PPCISD::SHL, dl, VT, Lo, Tmp5);
    SDValue OutHi = DAG.getNode(ISD::OR, dl, VT, Tmp4, Tmp6);
    SDValue OutLo = DAG.getNode(PPCISD::SHL, dl, VT, Lo, Amt);
@@ -6365,12 +6595,12 @@ SDValue PPCTargetLowering::LowerSRL_PARTS(SDValue Op, SelectionDAG &DAG) const {
    EVT AmtVT = Amt.getValueType();
  
    SDValue Tmp1 = DAG.getNode(ISD::SUB, dl, AmtVT,
-                             DAG.getConstant(BitWidth, AmtVT), Amt);
+                             DAG.getConstant(BitWidth, dl, AmtVT), Amt);
    SDValue Tmp2 = DAG.getNode(PPCISD::SRL, dl, VT, Lo, Amt);
    SDValue Tmp3 = DAG.getNode(PPCISD::SHL, dl, VT, Hi, Tmp1);
    SDValue Tmp4 = DAG.getNode(ISD::OR, dl, VT, Tmp2, Tmp3);
    SDValue Tmp5 = DAG.getNode(ISD::ADD, dl, AmtVT, Amt,
-                             DAG.getConstant(-BitWidth, AmtVT));
+                             DAG.getConstant(-BitWidth, dl, AmtVT));
    SDValue Tmp6 = DAG.getNode(PPCISD::SRL, dl, VT, Hi, Tmp5);
    SDValue OutLo = DAG.getNode(ISD::OR, dl, VT, Tmp4, Tmp6);
    SDValue OutHi = DAG.getNode(PPCISD::SRL, dl, VT, Hi, Amt);
@@ -6393,15 +6623,15 @@ SDValue PPCTargetLowering::LowerSRA_PARTS(SDValue Op, SelectionDAG &DAG) const {
    EVT AmtVT = Amt.getValueType();
  
    SDValue Tmp1 = DAG.getNode(ISD::SUB, dl, AmtVT,
-                             DAG.getConstant(BitWidth, AmtVT), Amt);
+                             DAG.getConstant(BitWidth, dl, AmtVT), Amt);
    SDValue Tmp2 = DAG.getNode(PPCISD::SRL, dl, VT, Lo, Amt);
    SDValue Tmp3 = DAG.getNode(PPCISD::SHL, dl, VT, Hi, Tmp1);
    SDValue Tmp4 = DAG.getNode(ISD::OR, dl, VT, Tmp2, Tmp3);
    SDValue Tmp5 = DAG.getNode(ISD::ADD, dl, AmtVT, Amt,
-                             DAG.getConstant(-BitWidth, AmtVT));
+                             DAG.getConstant(-BitWidth, dl, AmtVT));
    SDValue Tmp6 = DAG.getNode(PPCISD::SRA, dl, VT, Hi, Tmp5);
    SDValue OutHi = DAG.getNode(PPCISD::SRA, dl, VT, Hi, Amt);
-  SDValue OutLo = DAG.getSelectCC(dl, Tmp5, DAG.getConstant(0, AmtVT),
+  SDValue OutLo = DAG.getSelectCC(dl, Tmp5, DAG.getConstant(0, dl, AmtVT),
                                    Tmp4, Tmp6, ISD::SETLE);
    SDValue OutOps[] = { OutLo, OutHi };
    return DAG.getMergeValues(OutOps, dl);
@@ -6417,7 +6647,7 @@ static SDValue BuildSplatI(int Val, unsigned SplatSize, EVT VT,
                               SelectionDAG &DAG, SDLoc dl) {
    assert(Val >= -16 && Val <= 15 && "vsplti is out of range!");
  
-  static const EVT VTys[] = { // canonical VT to use for each size.
+  static const MVT VTys[] = { // canonical VT to use for each size.
      MVT::v16i8, MVT::v8i16, MVT::Other, MVT::v4i32
    };
  
@@ -6430,7 +6660,7 @@ static SDValue BuildSplatI(int Val, unsigned SplatSize, EVT VT,
    EVT CanonicalVT = VTys[SplatSize-1];
  
    // Build a canonical splat for this value.
-  SDValue Elt = DAG.getConstant(Val, MVT::i32);
+  SDValue Elt = DAG.getConstant(Val, dl, MVT::i32);
    SmallVector<SDValue, 8> Ops;
    Ops.assign(CanonicalVT.getVectorNumElements(), Elt);
    SDValue Res = DAG.getNode(ISD::BUILD_VECTOR, dl, CanonicalVT, Ops);
@@ -6444,7 +6674,7 @@ static SDValue BuildIntrinsicOp(unsigned IID, SDValue Op,
                                  EVT DestVT = MVT::Other) {
    if (DestVT == MVT::Other) DestVT = Op.getValueType();
    return DAG.getNode(ISD::INTRINSIC_WO_CHAIN, dl, DestVT,
-                     DAG.getConstant(IID, MVT::i32), Op);
+                     DAG.getConstant(IID, dl, MVT::i32), Op);
  }
  
  /// BuildIntrinsicOp - Return a binary operator intrinsic node with the
@@ -6454,7 +6684,7 @@ static SDValue BuildIntrinsicOp(unsigned IID, SDValue LHS, SDValue RHS,
                                  EVT DestVT = MVT::Other) {
    if (DestVT == MVT::Other) DestVT = LHS.getValueType();
    return DAG.getNode(ISD::INTRINSIC_WO_CHAIN, dl, DestVT,
-                     DAG.getConstant(IID, MVT::i32), LHS, RHS);
+                     DAG.getConstant(IID, dl, MVT::i32), LHS, RHS);
  }
  
  /// BuildIntrinsicOp - Return a ternary operator intrinsic node with the
@@ -6464,7 +6694,7 @@ static SDValue BuildIntrinsicOp(unsigned IID, SDValue Op0, SDValue Op1,
                                  SDLoc dl, EVT DestVT = MVT::Other) {
    if (DestVT == MVT::Other) DestVT = Op0.getValueType();
    return DAG.getNode(ISD::INTRINSIC_WO_CHAIN, dl, DestVT,
-                     DAG.getConstant(IID, MVT::i32), Op0, Op1, Op2);
+                     DAG.getConstant(IID, dl, MVT::i32), Op0, Op1, Op2);
  }
  
  
@@ -6501,7 +6731,7 @@ SDValue PPCTargetLowering::LowerBUILD_VECTOR(SDValue Op,
      MachineFrameInfo *FrameInfo = DAG.getMachineFunction().getFrameInfo();
      int FrameIdx = FrameInfo->CreateStackObject(16, 16, false);
      MachinePointerInfo PtrInfo = MachinePointerInfo::getFixedStack(FrameIdx);
-    EVT PtrVT = getPointerTy();
+    EVT PtrVT = getPointerTy(DAG.getDataLayout());
      SDValue FIdx = DAG.getFrameIndex(FrameIdx, PtrVT);
  
      assert(BVN->getNumOperands() == 4 &&
@@ -6534,9 +6764,9 @@ SDValue PPCTargetLowering::LowerBUILD_VECTOR(SDValue Op,
        }
  
        Constant *CP = ConstantVector::get(CV);
-      SDValue CPIdx = DAG.getConstantPool(CP, getPointerTy(),
-                      16 /* alignment */);
- 
+      SDValue CPIdx = DAG.getConstantPool(CP, getPointerTy(DAG.getDataLayout()),
+                                          16 /* alignment */);
+
        SmallVector<SDValue, 2> Ops;
        Ops.push_back(DAG.getEntryNode());
        Ops.push_back(CPIdx);
@@ -6556,7 +6786,7 @@ SDValue PPCTargetLowering::LowerBUILD_VECTOR(SDValue Op,
        if (BVN->getOperand(i).getOpcode() == ISD::UNDEF) continue;
  
        unsigned Offset = 4*i;
-      SDValue Idx = DAG.getConstant(Offset, FIdx.getValueType());
+      SDValue Idx = DAG.getConstant(Offset, dl, FIdx.getValueType());
        Idx = DAG.getNode(ISD::ADD, dl, FIdx.getValueType(), FIdx, Idx);
  
        unsigned StoreSize = BVN->getOperand(i).getValueType().getStoreSize();
@@ -6590,7 +6820,7 @@ SDValue PPCTargetLowering::LowerBUILD_VECTOR(SDValue Op,
  
      SmallVector<SDValue, 2> Ops;
      Ops.push_back(StoreChain);
-    Ops.push_back(DAG.getConstant(Intrinsic::ppc_qpx_qvlfiwz, MVT::i32));
+    Ops.push_back(DAG.getConstant(Intrinsic::ppc_qpx_qvlfiwz, dl, MVT::i32));
      Ops.push_back(FIdx);
  
      SmallVector<EVT, 2> ValueVTs;
@@ -6601,10 +6831,10 @@ SDValue PPCTargetLowering::LowerBUILD_VECTOR(SDValue Op,
      SDValue LoadedVect = DAG.getMemIntrinsicNode(ISD::INTRINSIC_W_CHAIN,
        dl, VTs, Ops, MVT::v4i32, PtrInfo);
      LoadedVect = DAG.getNode(ISD::INTRINSIC_WO_CHAIN, dl, MVT::v4f64,
-      DAG.getConstant(Intrinsic::ppc_qpx_qvfcfidu, MVT::i32),
+      DAG.getConstant(Intrinsic::ppc_qpx_qvfcfidu, dl, MVT::i32),
        LoadedVect);
  
-    SDValue FPZeros = DAG.getConstantFP(0.0, MVT::f64);
+    SDValue FPZeros = DAG.getConstantFP(0.0, dl, MVT::f64);
      FPZeros = DAG.getNode(ISD::BUILD_VECTOR, dl, MVT::v4f64,
                            FPZeros, FPZeros, FPZeros, FPZeros);
  
@@ -6620,7 +6850,8 @@ SDValue PPCTargetLowering::LowerBUILD_VECTOR(SDValue Op,
    unsigned SplatBitSize;
    bool HasAnyUndefs;
    if (! BVN->isConstantSplat(APSplatBits, APSplatUndef, SplatBitSize,
-                             HasAnyUndefs, 0, true) || SplatBitSize > 32)
+                             HasAnyUndefs, 0, !Subtarget.isLittleEndian()) ||
+      SplatBitSize > 32)
      return SDValue();
  
    unsigned SplatBits = APSplatBits.getZExtValue();
@@ -6633,7 +6864,7 @@ SDValue PPCTargetLowering::LowerBUILD_VECTOR(SDValue Op,
    if (SplatBits == 0) {
      // Canonicalize all zero vectors to be v4i32.
      if (Op.getValueType() != MVT::v4i32 || HasAnyUndefs) {
-      SDValue Z = DAG.getConstant(0, MVT::i32);
+      SDValue Z = DAG.getConstant(0, dl, MVT::i32);
        Z = DAG.getNode(ISD::BUILD_VECTOR, dl, MVT::v4i32, Z, Z, Z, Z);
        Op = DAG.getNode(ISD::BITCAST, dl, Op.getValueType(), Z);
      }
@@ -6660,10 +6891,10 @@ SDValue PPCTargetLowering::LowerBUILD_VECTOR(SDValue Op,
      // To avoid having these optimizations undone by constant folding,
      // we convert to a pseudo that will be expanded later into one of
      // the above forms.
-    SDValue Elt = DAG.getConstant(SextVal, MVT::i32);
+    SDValue Elt = DAG.getConstant(SextVal, dl, MVT::i32);
      EVT VT = (SplatSize == 1 ? MVT::v16i8 :
                (SplatSize == 2 ? MVT::v8i16 : MVT::v4i32));
-    SDValue EltSize = DAG.getConstant(SplatSize, MVT::i32);
+    SDValue EltSize = DAG.getConstant(SplatSize, dl, MVT::i32);
      SDValue RetVal = DAG.getNode(PPCISD::VADD_SPLAT, dl, VT, Elt, EltSize);
      if (VT == Op.getValueType())
        return RetVal;
@@ -6687,22 +6918,6 @@ SDValue PPCTargetLowering::LowerBUILD_VECTOR(SDValue Op,
      return DAG.getNode(ISD::BITCAST, dl, Op.getValueType(), Res);
    }
  
-  // The remaining cases assume either big endian element order or
-  // a splat-size that equates to the element size of the vector
-  // to be built.  An example that doesn't work for little endian is
-  // {0, -1, 0, -1, 0, -1, 0, -1} which has a splat size of 32 bits
-  // and a vector element size of 16 bits.  The code below will
-  // produce the vector in big endian element order, which for little
-  // endian is {-1, 0, -1, 0, -1, 0, -1, 0}.
-
-  // For now, just avoid these optimizations in that case.
-  // FIXME: Develop correct optimizations for LE with mismatched
-  // splat and element sizes.
-
-  if (Subtarget.isLittleEndian() &&
-      SplatSize != Op.getValueType().getVectorElementType().getSizeInBits())
-    return SDValue();
-
    // Check to see if this is a wide variety of vsplti*, binop self cases.
    static const signed char SplatCsts[] = {
      -1, 1, -2, 2, -3, 3, -4, 4, -5, 5, -6, 6, -7, 7,
@@ -6882,7 +7097,7 @@ SDValue PPCTargetLowering::LowerVECTOR_SHUFFLE(SDValue Op,
      int AlignIdx = PPC::isQVALIGNIShuffleMask(SVOp);
      if (AlignIdx != -1) {
        return DAG.getNode(PPCISD::QVALIGNI, dl, VT, V1, V2,
-                         DAG.getConstant(AlignIdx, MVT::i32));
+                         DAG.getConstant(AlignIdx, dl, MVT::i32));
      } else if (SVOp->isSplat()) {
        int SplatIdx = SVOp->getSplatIndex();
        if (SplatIdx >= 4) {
@@ -6894,7 +7109,7 @@ SDValue PPCTargetLowering::LowerVECTOR_SHUFFLE(SDValue Op,
        // nothing to do.
  
        return DAG.getNode(PPCISD::QVESPLATI, dl, VT, V1,
-                         DAG.getConstant(SplatIdx, MVT::i32));
+                         DAG.getConstant(SplatIdx, dl, MVT::i32));
      }
  
      // Lower this into a qvgpci/qvfperm pair.
@@ -6908,7 +7123,7 @@ SDValue PPCTargetLowering::LowerVECTOR_SHUFFLE(SDValue Op,
      }
  
      SDValue V3 = DAG.getNode(PPCISD::QVGPCI, dl, MVT::v4f64,
-                             DAG.getConstant(idx, MVT::i32));
+                             DAG.getConstant(idx, dl, MVT::i32));
      return DAG.getNode(PPCISD::QVFPERM, dl, VT, V1, V2, V3);
    }
  
@@ -6921,13 +7136,16 @@ SDValue PPCTargetLowering::LowerVECTOR_SHUFFLE(SDValue Op,
          PPC::isSplatShuffleMask(SVOp, 4) ||
          PPC::isVPKUWUMShuffleMask(SVOp, 1, DAG) ||
          PPC::isVPKUHUMShuffleMask(SVOp, 1, DAG) ||
+        PPC::isVPKUDUMShuffleMask(SVOp, 1, DAG) ||
          PPC::isVSLDOIShuffleMask(SVOp, 1, DAG) != -1 ||
          PPC::isVMRGLShuffleMask(SVOp, 1, 1, DAG) ||
          PPC::isVMRGLShuffleMask(SVOp, 2, 1, DAG) ||
          PPC::isVMRGLShuffleMask(SVOp, 4, 1, DAG) ||
          PPC::isVMRGHShuffleMask(SVOp, 1, 1, DAG) ||
          PPC::isVMRGHShuffleMask(SVOp, 2, 1, DAG) ||
-        PPC::isVMRGHShuffleMask(SVOp, 4, 1, DAG)) {
+        PPC::isVMRGHShuffleMask(SVOp, 4, 1, DAG) ||
+        PPC::isVMRGEOShuffleMask(SVOp, true, 1, DAG)   ||
+        PPC::isVMRGEOShuffleMask(SVOp, false, 1, DAG)) {
        return Op;
      }
    }
@@ -6938,13 +7156,16 @@ SDValue PPCTargetLowering::LowerVECTOR_SHUFFLE(SDValue Op,
    unsigned int ShuffleKind = isLittleEndian ? 2 : 0;
    if (PPC::isVPKUWUMShuffleMask(SVOp, ShuffleKind, DAG) ||
        PPC::isVPKUHUMShuffleMask(SVOp, ShuffleKind, DAG) ||
+      PPC::isVPKUDUMShuffleMask(SVOp, ShuffleKind, DAG) ||
        PPC::isVSLDOIShuffleMask(SVOp, ShuffleKind, DAG) != -1 ||
        PPC::isVMRGLShuffleMask(SVOp, 1, ShuffleKind, DAG) ||
        PPC::isVMRGLShuffleMask(SVOp, 2, ShuffleKind, DAG) ||
        PPC::isVMRGLShuffleMask(SVOp, 4, ShuffleKind, DAG) ||
        PPC::isVMRGHShuffleMask(SVOp, 1, ShuffleKind, DAG) ||
        PPC::isVMRGHShuffleMask(SVOp, 2, ShuffleKind, DAG) ||
-      PPC::isVMRGHShuffleMask(SVOp, 4, ShuffleKind, DAG))
+      PPC::isVMRGHShuffleMask(SVOp, 4, ShuffleKind, DAG) ||
+      PPC::isVMRGEOShuffleMask(SVOp, true, ShuffleKind, DAG)             ||
+      PPC::isVMRGEOShuffleMask(SVOp, false, ShuffleKind, DAG))
      return Op;
  
    // Check to see if this is a shuffle of 4-byte values.  If so, we can use our
@@ -7023,10 +7244,10 @@ SDValue PPCTargetLowering::LowerVECTOR_SHUFFLE(SDValue Op,
  
      for (unsigned j = 0; j != BytesPerElement; ++j)
        if (isLittleEndian)
-        ResultMask.push_back(DAG.getConstant(31 - (SrcElt*BytesPerElement+j),
-                                             MVT::i32));
+        ResultMask.push_back(DAG.getConstant(31 - (SrcElt*BytesPerElement + j),
+                                             dl, MVT::i32));
        else
-        ResultMask.push_back(DAG.getConstant(SrcElt*BytesPerElement+j,
+        ResultMask.push_back(DAG.getConstant(SrcElt*BytesPerElement + j, dl,
                                               MVT::i32));
    }
  
@@ -7044,7 +7265,7 @@ SDValue PPCTargetLowering::LowerVECTOR_SHUFFLE(SDValue Op,
  /// altivec comparison.  If it is, return true and fill in Opc/isDot with
  /// information about the intrinsic.
  static bool getAltivecCompareInfo(SDValue Intrin, int &CompareOpc,
-                                  bool &isDot) {
+                                  bool &isDot, const PPCSubtarget &Subtarget) {
    unsigned IntrinsicID =
      cast<ConstantSDNode>(Intrin.getOperand(0))->getZExtValue();
    CompareOpc = -1;
@@ -7057,29 +7278,83 @@ static bool getAltivecCompareInfo(SDValue Intrin, int &CompareOpc,
    case Intrinsic::ppc_altivec_vcmpequb_p: CompareOpc =   6; isDot = 1; break;
    case Intrinsic::ppc_altivec_vcmpequh_p: CompareOpc =  70; isDot = 1; break;
    case Intrinsic::ppc_altivec_vcmpequw_p: CompareOpc = 134; isDot = 1; break;
+  case Intrinsic::ppc_altivec_vcmpequd_p: 
+    if (Subtarget.hasP8Altivec()) {
+      CompareOpc = 199; 
+      isDot = 1; 
+    }
+    else 
+      return false;
+
+    break;
    case Intrinsic::ppc_altivec_vcmpgefp_p: CompareOpc = 454; isDot = 1; break;
    case Intrinsic::ppc_altivec_vcmpgtfp_p: CompareOpc = 710; isDot = 1; break;
    case Intrinsic::ppc_altivec_vcmpgtsb_p: CompareOpc = 774; isDot = 1; break;
    case Intrinsic::ppc_altivec_vcmpgtsh_p: CompareOpc = 838; isDot = 1; break;
    case Intrinsic::ppc_altivec_vcmpgtsw_p: CompareOpc = 902; isDot = 1; break;
+  case Intrinsic::ppc_altivec_vcmpgtsd_p: 
+    if (Subtarget.hasP8Altivec()) {
+      CompareOpc = 967; 
+      isDot = 1; 
+    }
+    else 
+      return false;
+
+    break;
    case Intrinsic::ppc_altivec_vcmpgtub_p: CompareOpc = 518; isDot = 1; break;
    case Intrinsic::ppc_altivec_vcmpgtuh_p: CompareOpc = 582; isDot = 1; break;
    case Intrinsic::ppc_altivec_vcmpgtuw_p: CompareOpc = 646; isDot = 1; break;
+  case Intrinsic::ppc_altivec_vcmpgtud_p: 
+    if (Subtarget.hasP8Altivec()) {
+      CompareOpc = 711; 
+      isDot = 1; 
+    }
+    else 
+      return false;
  
+    break;
+      
      // Normal Comparisons.
    case Intrinsic::ppc_altivec_vcmpbfp:    CompareOpc = 966; isDot = 0; break;
    case Intrinsic::ppc_altivec_vcmpeqfp:   CompareOpc = 198; isDot = 0; break;
    case Intrinsic::ppc_altivec_vcmpequb:   CompareOpc =   6; isDot = 0; break;
    case Intrinsic::ppc_altivec_vcmpequh:   CompareOpc =  70; isDot = 0; break;
    case Intrinsic::ppc_altivec_vcmpequw:   CompareOpc = 134; isDot = 0; break;
+  case Intrinsic::ppc_altivec_vcmpequd:
+    if (Subtarget.hasP8Altivec()) {
+      CompareOpc = 199; 
+      isDot = 0; 
+    }
+    else
+      return false;
+
+    break;
    case Intrinsic::ppc_altivec_vcmpgefp:   CompareOpc = 454; isDot = 0; break;
    case Intrinsic::ppc_altivec_vcmpgtfp:   CompareOpc = 710; isDot = 0; break;
    case Intrinsic::ppc_altivec_vcmpgtsb:   CompareOpc = 774; isDot = 0; break;
    case Intrinsic::ppc_altivec_vcmpgtsh:   CompareOpc = 838; isDot = 0; break;
    case Intrinsic::ppc_altivec_vcmpgtsw:   CompareOpc = 902; isDot = 0; break;
+  case Intrinsic::ppc_altivec_vcmpgtsd:   
+    if (Subtarget.hasP8Altivec()) {
+      CompareOpc = 967; 
+      isDot = 0; 
+    }
+    else
+      return false;
+
+    break;
    case Intrinsic::ppc_altivec_vcmpgtub:   CompareOpc = 518; isDot = 0; break;
    case Intrinsic::ppc_altivec_vcmpgtuh:   CompareOpc = 582; isDot = 0; break;
    case Intrinsic::ppc_altivec_vcmpgtuw:   CompareOpc = 646; isDot = 0; break;
+  case Intrinsic::ppc_altivec_vcmpgtud:   
+    if (Subtarget.hasP8Altivec()) {
+      CompareOpc = 711; 
+      isDot = 0; 
+    }
+    else
+      return false;
+
+    break;
    }
    return true;
  }
@@ -7093,14 +7368,14 @@ SDValue PPCTargetLowering::LowerINTRINSIC_WO_CHAIN(SDValue Op,
    SDLoc dl(Op);
    int CompareOpc;
    bool isDot;
-  if (!getAltivecCompareInfo(Op, CompareOpc, isDot))
+  if (!getAltivecCompareInfo(Op, CompareOpc, isDot, Subtarget))
      return SDValue();    // Don't custom lower most intrinsics.
  
    // If this is a non-dot comparison, make the VCMP node and we are done.
    if (!isDot) {
      SDValue Tmp = DAG.getNode(PPCISD::VCMP, dl, Op.getOperand(2).getValueType(),
                                Op.getOperand(1), Op.getOperand(2),
-                              DAG.getConstant(CompareOpc, MVT::i32));
+                              DAG.getConstant(CompareOpc, dl, MVT::i32));
      return DAG.getNode(ISD::BITCAST, dl, Op.getValueType(), Tmp);
    }
  
@@ -7108,7 +7383,7 @@ SDValue PPCTargetLowering::LowerINTRINSIC_WO_CHAIN(SDValue Op,
    SDValue Ops[] = {
      Op.getOperand(2),  // LHS
      Op.getOperand(3),  // RHS
-    DAG.getConstant(CompareOpc, MVT::i32)
+    DAG.getConstant(CompareOpc, dl, MVT::i32)
    };
    EVT VTs[] = { Op.getOperand(2).getValueType(), MVT::Glue };
    SDValue CompNode = DAG.getNode(PPCISD::VCMPo, dl, VTs, Ops);
@@ -7140,15 +7415,15 @@ SDValue PPCTargetLowering::LowerINTRINSIC_WO_CHAIN(SDValue Op,
  
    // Shift the bit into the low position.
    Flags = DAG.getNode(ISD::SRL, dl, MVT::i32, Flags,
-                      DAG.getConstant(8-(3-BitNo), MVT::i32));
+                      DAG.getConstant(8 - (3 - BitNo), dl, MVT::i32));
    // Isolate the bit.
    Flags = DAG.getNode(ISD::AND, dl, MVT::i32, Flags,
-                      DAG.getConstant(1, MVT::i32));
+                      DAG.getConstant(1, dl, MVT::i32));
  
    // If we are supposed to, toggle the bit.
    if (InvertBit)
      Flags = DAG.getNode(ISD::XOR, dl, MVT::i32, Flags,
-                        DAG.getConstant(1, MVT::i32));
+                        DAG.getConstant(1, dl, MVT::i32));
    return Flags;
  }
  
@@ -7182,7 +7457,7 @@ SDValue PPCTargetLowering::LowerSCALAR_TO_VECTOR(SDValue Op,
    // Create a stack slot that is 16-byte aligned.
    MachineFrameInfo *FrameInfo = DAG.getMachineFunction().getFrameInfo();
    int FrameIdx = FrameInfo->CreateStackObject(16, 16, false);
-  EVT PtrVT = getPointerTy();
+  EVT PtrVT = getPointerTy(DAG.getDataLayout());
    SDValue FIdx = DAG.getFrameIndex(FrameIdx, PtrVT);
  
    // Store the input value into Value#0 of the stack slot.
@@ -7214,7 +7489,7 @@ SDValue PPCTargetLowering::LowerEXTRACT_VECTOR_ELT(SDValue Op,
  
    // FIXME: We can make this an f32 vector, but the BUILD_VECTOR code needs to
    // understand how to form the extending load.
-  SDValue FPHalfs = DAG.getConstantFP(0.5, MVT::f64);
+  SDValue FPHalfs = DAG.getConstantFP(0.5, dl, MVT::f64);
    FPHalfs = DAG.getNode(ISD::BUILD_VECTOR, dl, MVT::v4f64,
                          FPHalfs, FPHalfs, FPHalfs, FPHalfs);
  
@@ -7222,19 +7497,19 @@ SDValue PPCTargetLowering::LowerEXTRACT_VECTOR_ELT(SDValue Op,
  
    // Now convert to an integer and store.
    Value = DAG.getNode(ISD::INTRINSIC_WO_CHAIN, dl, MVT::v4f64,
-    DAG.getConstant(Intrinsic::ppc_qpx_qvfctiwu, MVT::i32),
+    DAG.getConstant(Intrinsic::ppc_qpx_qvfctiwu, dl, MVT::i32),
      Value);
  
    MachineFrameInfo *FrameInfo = DAG.getMachineFunction().getFrameInfo();
    int FrameIdx = FrameInfo->CreateStackObject(16, 16, false);
    MachinePointerInfo PtrInfo = MachinePointerInfo::getFixedStack(FrameIdx);
-  EVT PtrVT = getPointerTy();
+  EVT PtrVT = getPointerTy(DAG.getDataLayout());
    SDValue FIdx = DAG.getFrameIndex(FrameIdx, PtrVT);
  
    SDValue StoreChain = DAG.getEntryNode();
    SmallVector<SDValue, 2> Ops;
    Ops.push_back(StoreChain);
-  Ops.push_back(DAG.getConstant(Intrinsic::ppc_qpx_qvstfiw, MVT::i32));
+  Ops.push_back(DAG.getConstant(Intrinsic::ppc_qpx_qvstfiw, dl, MVT::i32));
    Ops.push_back(Value);
    Ops.push_back(FIdx);
  
@@ -7247,7 +7522,7 @@ SDValue PPCTargetLowering::LowerEXTRACT_VECTOR_ELT(SDValue Op,
  
    // Extract the value requested.
    unsigned Offset = 4*cast<ConstantSDNode>(N->getOperand(1))->getZExtValue();
-  SDValue Idx = DAG.getConstant(Offset, FIdx.getValueType());
+  SDValue Idx = DAG.getConstant(Offset, dl, FIdx.getValueType());
    Idx = DAG.getNode(ISD::ADD, dl, FIdx.getValueType(), FIdx, Idx);
  
    SDValue IntVal = DAG.getLoad(MVT::i32, dl, StoreChain, Idx,
@@ -7311,12 +7586,13 @@ SDValue PPCTargetLowering::LowerVectorLoad(SDValue Op,
        LoadChains.push_back(Load.getValue(1));
  
        BasePtr = DAG.getNode(ISD::ADD, dl, BasePtr.getValueType(), BasePtr,
-                            DAG.getConstant(Stride, BasePtr.getValueType()));
+                            DAG.getConstant(Stride, dl,
+                                            BasePtr.getValueType()));
      }
  
      SDValue TF =  DAG.getNode(ISD::TokenFactor, dl, MVT::Other, LoadChains);
      SDValue Value = DAG.getNode(ISD::BUILD_VECTOR, dl,
-                                   Op.getValueType(), Vals);
+                                Op.getValueType(), Vals);
  
      if (LN->isIndexed()) {
        SDValue RetOps[] = { Value, Vals[0].getValue(1), TF };
@@ -7335,7 +7611,7 @@ SDValue PPCTargetLowering::LowerVectorLoad(SDValue Op,
  
    SmallVector<SDValue, 4> VectElmts, VectElmtChains;
    for (unsigned i = 0; i < 4; ++i) {
-    SDValue Idx = DAG.getConstant(i, BasePtr.getValueType());
+    SDValue Idx = DAG.getConstant(i, dl, BasePtr.getValueType());
      Idx = DAG.getNode(ISD::ADD, dl, BasePtr.getValueType(), BasePtr, Idx);
  
      VectElmts.push_back(DAG.getExtLoad(ISD::EXTLOAD,
@@ -7379,9 +7655,9 @@ SDValue PPCTargetLowering::LowerVectorStore(SDValue Op,
  
      SmallVector<SDValue, 8> Stores;
      for (unsigned Idx = 0; Idx < 4; ++Idx) {
-      SDValue Ex =
-        DAG.getNode(ISD::EXTRACT_VECTOR_ELT, dl, ScalarVT, Value,
-                    DAG.getConstant(Idx, getVectorIdxTy()));
+      SDValue Ex = DAG.getNode(
+          ISD::EXTRACT_VECTOR_ELT, dl, ScalarVT, Value,
+          DAG.getConstant(Idx, dl, getVectorIdxTy(DAG.getDataLayout())));
        SDValue Store;
        if (ScalarVT != ScalarMemVT)
          Store =
@@ -7404,7 +7680,8 @@ SDValue PPCTargetLowering::LowerVectorStore(SDValue Op,
        }
  
        BasePtr = DAG.getNode(ISD::ADD, dl, BasePtr.getValueType(), BasePtr,
-                            DAG.getConstant(Stride, BasePtr.getValueType()));
+                            DAG.getConstant(Stride, dl,
+                                            BasePtr.getValueType()));
        Stores.push_back(Store);
      }
  
@@ -7428,7 +7705,7 @@ SDValue PPCTargetLowering::LowerVectorStore(SDValue Op,
  
    // FIXME: We can make this an f32 vector, but the BUILD_VECTOR code needs to
    // understand how to form the extending load.
-  SDValue FPHalfs = DAG.getConstantFP(0.5, MVT::f64);
+  SDValue FPHalfs = DAG.getConstantFP(0.5, dl, MVT::f64);
    FPHalfs = DAG.getNode(ISD::BUILD_VECTOR, dl, MVT::v4f64,
                          FPHalfs, FPHalfs, FPHalfs, FPHalfs);
  
@@ -7436,18 +7713,18 @@ SDValue PPCTargetLowering::LowerVectorStore(SDValue Op,
  
    // Now convert to an integer and store.
    Value = DAG.getNode(ISD::INTRINSIC_WO_CHAIN, dl, MVT::v4f64,
-    DAG.getConstant(Intrinsic::ppc_qpx_qvfctiwu, MVT::i32),
+    DAG.getConstant(Intrinsic::ppc_qpx_qvfctiwu, dl, MVT::i32),
      Value);
  
    MachineFrameInfo *FrameInfo = DAG.getMachineFunction().getFrameInfo();
    int FrameIdx = FrameInfo->CreateStackObject(16, 16, false);
    MachinePointerInfo PtrInfo = MachinePointerInfo::getFixedStack(FrameIdx);
-  EVT PtrVT = getPointerTy();
+  EVT PtrVT = getPointerTy(DAG.getDataLayout());
    SDValue FIdx = DAG.getFrameIndex(FrameIdx, PtrVT);
  
    SmallVector<SDValue, 2> Ops;
    Ops.push_back(StoreChain);
-  Ops.push_back(DAG.getConstant(Intrinsic::ppc_qpx_qvstfiw, MVT::i32));
+  Ops.push_back(DAG.getConstant(Intrinsic::ppc_qpx_qvstfiw, dl, MVT::i32));
    Ops.push_back(Value);
    Ops.push_back(FIdx);
  
@@ -7462,7 +7739,7 @@ SDValue PPCTargetLowering::LowerVectorStore(SDValue Op,
    SmallVector<SDValue, 4> Loads, LoadChains;
    for (unsigned i = 0; i < 4; ++i) {
      unsigned Offset = 4*i;
-    SDValue Idx = DAG.getConstant(Offset, FIdx.getValueType());
+    SDValue Idx = DAG.getConstant(Offset, dl, FIdx.getValueType());
      Idx = DAG.getNode(ISD::ADD, dl, FIdx.getValueType(), FIdx, Idx);
  
      Loads.push_back(DAG.getLoad(MVT::i32, dl, StoreChain, Idx,
@@ -7475,7 +7752,7 @@ SDValue PPCTargetLowering::LowerVectorStore(SDValue Op,
  
    SmallVector<SDValue, 4> Stores;
    for (unsigned i = 0; i < 4; ++i) {
-    SDValue Idx = DAG.getConstant(i, BasePtr.getValueType());
+    SDValue Idx = DAG.getConstant(i, dl, BasePtr.getValueType());
      Idx = DAG.getNode(ISD::ADD, dl, BasePtr.getValueType(), BasePtr, Idx);
  
      Stores.push_back(DAG.getTruncStore(StoreChain, dl, Loads[i], Idx,
@@ -7647,7 +7924,8 @@ void PPCTargetLowering::ReplaceNodeResults(SDNode *N,
  
      assert(N->getValueType(0) == MVT::i1 &&
             "Unexpected result type for CTR decrement intrinsic");
-    EVT SVT = getSetCCResultType(*DAG.getContext(), N->getValueType(0));
+    EVT SVT = getSetCCResultType(DAG.getDataLayout(), *DAG.getContext(),
+                                 N->getValueType(0));
      SDVTList VTs = DAG.getVTList(SVT, MVT::Other);
      SDValue NewInt = DAG.getNode(N->getOpcode(), dl, VTs, N->getOperand(0),
                                   N->getOperand(1)); 
@@ -7675,10 +7953,10 @@ void PPCTargetLowering::ReplaceNodeResults(SDNode *N,
      assert(N->getOperand(0).getValueType() == MVT::ppcf128);
      SDValue Lo = DAG.getNode(ISD::EXTRACT_ELEMENT, dl,
                               MVT::f64, N->getOperand(0),
-                             DAG.getIntPtrConstant(0));
+                             DAG.getIntPtrConstant(0, dl));
      SDValue Hi = DAG.getNode(ISD::EXTRACT_ELEMENT, dl,
                               MVT::f64, N->getOperand(0),
-                             DAG.getIntPtrConstant(1));
+                             DAG.getIntPtrConstant(1, dl));
  
      // Add the two halves of the long double in round-to-zero mode.
      SDValue FPreg = DAG.getNode(PPCISD::FADDRTZ, dl, MVT::f64, Lo, Hi);
@@ -7690,6 +7968,7 @@ void PPCTargetLowering::ReplaceNodeResults(SDNode *N,
      return;
    }
    case ISD::FP_TO_SINT:
+  case ISD::FP_TO_UINT:
      // LowerFP_TO_INT() can only handle f32 and f64.
      if (N->getOperand(0).getValueType() == MVT::ppcf128)
        return;
@@ -7706,7 +7985,7 @@ void PPCTargetLowering::ReplaceNodeResults(SDNode *N,
  static Instruction* callIntrinsic(IRBuilder<> &Builder, Intrinsic::ID Id) {
    Module *M = Builder.GetInsertBlock()->getParent()->getParent();
    Function *Func = Intrinsic::getDeclaration(M, Id);
-  return Builder.CreateCall(Func);
+  return Builder.CreateCall(Func, {});
  }
  
  // The mappings for emitLeading/TrailingFence is taken from
@@ -7716,10 +7995,9 @@ Instruction* PPCTargetLowering::emitLeadingFence(IRBuilder<> &Builder,
                                           bool IsLoad) const {
    if (Ord == SequentiallyConsistent)
      return callIntrinsic(Builder, Intrinsic::ppc_sync);
-  else if (isAtLeastRelease(Ord))
+  if (isAtLeastRelease(Ord))
      return callIntrinsic(Builder, Intrinsic::ppc_lwsync);
-  else
-    return nullptr;
+  return nullptr;
  }
  
  Instruction* PPCTargetLowering::emitTrailingFence(IRBuilder<> &Builder,
@@ -7731,16 +8009,41 @@ Instruction* PPCTargetLowering::emitTrailingFence(IRBuilder<> &Builder,
    // See http://www.cl.cam.ac.uk/~pes20/cpp/cpp0xmappings.html and
    // http://www.rdrop.com/users/paulmck/scalability/paper/N2745r.2011.03.04a.html
    // and http://www.cl.cam.ac.uk/~pes20/cppppc/ for justification.
-  else
-    return nullptr;
+  return nullptr;
  }
  
  MachineBasicBlock *
  PPCTargetLowering::EmitAtomicBinary(MachineInstr *MI, MachineBasicBlock *BB,
-                                    bool is64bit, unsigned BinOpcode) const {
+                                    unsigned AtomicSize,
+                                    unsigned BinOpcode) const {
    // This also handles ATOMIC_SWAP, indicated by BinOpcode==0.
    const TargetInstrInfo *TII = Subtarget.getInstrInfo();
  
+  auto LoadMnemonic = PPC::LDARX;
+  auto StoreMnemonic = PPC::STDCX;
+  switch (AtomicSize) {
+  default:
+    llvm_unreachable("Unexpected size of atomic entity");
+  case 1:
+    LoadMnemonic = PPC::LBARX;
+    StoreMnemonic = PPC::STBCX;
+    assert(Subtarget.hasPartwordAtomics() && "Call this only with size >=4");
+    break;
+  case 2:
+    LoadMnemonic = PPC::LHARX;
+    StoreMnemonic = PPC::STHCX;
+    assert(Subtarget.hasPartwordAtomics() && "Call this only with size >=4");
+    break;
+  case 4:
+    LoadMnemonic = PPC::LWARX;
+    StoreMnemonic = PPC::STWCX;
+    break;
+  case 8:
+    LoadMnemonic = PPC::LDARX;
+    StoreMnemonic = PPC::STDCX;
+    break;
+  }
+
    const BasicBlock *LLVM_BB = BB->getBasicBlock();
    MachineFunction *F = BB->getParent();
    MachineFunction::iterator It = BB;
@@ -7762,7 +8065,7 @@ PPCTargetLowering::EmitAtomicBinary(MachineInstr *MI, MachineBasicBlock *BB,
  
    MachineRegisterInfo &RegInfo = F->getRegInfo();
    unsigned TmpReg = (!BinOpcode) ? incr :
-    RegInfo.createVirtualRegister( is64bit ? &PPC::G8RCRegClass
+    RegInfo.createVirtualRegister( AtomicSize == 8 ? &PPC::G8RCRegClass
                                             : &PPC::GPRCRegClass);
  
    //  thisMBB:
@@ -7777,11 +8080,11 @@ PPCTargetLowering::EmitAtomicBinary(MachineInstr *MI, MachineBasicBlock *BB,
    //   bne- loopMBB
    //   fallthrough --> exitMBB
    BB = loopMBB;
-  BuildMI(BB, dl, TII->get(is64bit ? PPC::LDARX : PPC::LWARX), dest)
+  BuildMI(BB, dl, TII->get(LoadMnemonic), dest)
      .addReg(ptrA).addReg(ptrB);
    if (BinOpcode)
      BuildMI(BB, dl, TII->get(BinOpcode), TmpReg).addReg(incr).addReg(dest);
-  BuildMI(BB, dl, TII->get(is64bit ? PPC::STDCX : PPC::STWCX))
+  BuildMI(BB, dl, TII->get(StoreMnemonic))
      .addReg(TmpReg).addReg(ptrA).addReg(ptrB);
    BuildMI(BB, dl, TII->get(PPC::BCC))
      .addImm(PPC::PRED_NE).addReg(PPC::CR0).addMBB(loopMBB);
@@ -7799,6 +8102,10 @@ PPCTargetLowering::EmitPartwordAtomicBinary(MachineInstr *MI,
                                              MachineBasicBlock *BB,
                                              bool is8bit,    // operation
                                              unsigned BinOpcode) const {
+  // If we support part-word atomic mnemonics, just use them
+  if (Subtarget.hasPartwordAtomics())
+    return EmitAtomicBinary(MI, BB, is8bit ? 1 : 2, BinOpcode);
+
    // This also handles ATOMIC_SWAP, indicated by BinOpcode==0.
    const TargetInstrInfo *TII = Subtarget.getInstrInfo();
    // In 64 bit mode we have to use 64 bits for addresses, even though the
@@ -7946,7 +8253,7 @@ PPCTargetLowering::emitEHSjLjSetJmp(MachineInstr *MI,
    unsigned mainDstReg = MRI.createVirtualRegister(RC);
    unsigned restoreDstReg = MRI.createVirtualRegister(RC);
  
-  MVT PVT = getPointerTy();
+  MVT PVT = getPointerTy(MF->getDataLayout());
    assert((PVT == MVT::i64 || PVT == MVT::i32) &&
           "Invalid Pointer Size!");
    // For v = setjmp(buf), we generate
@@ -8084,7 +8391,7 @@ PPCTargetLowering::emitEHSjLjLongJmp(MachineInstr *MI,
    MachineInstr::mmo_iterator MMOBegin = MI->memoperands_begin();
    MachineInstr::mmo_iterator MMOEnd = MI->memoperands_end();
  
-  MVT PVT = getPointerTy();
+  MVT PVT = getPointerTy(MF->getDataLayout());
    assert((PVT == MVT::i64 || PVT == MVT::i32) &&
           "Invalid Pointer Size!");
  
@@ -8242,6 +8549,7 @@ PPCTargetLowering::EmitInstrWithCustomInserter(MachineInstr *MI,
               MI->getOpcode() == PPC::SELECT_CC_QBRC ||
               MI->getOpcode() == PPC::SELECT_CC_VRRC ||
               MI->getOpcode() == PPC::SELECT_CC_VSFRC ||
+             MI->getOpcode() == PPC::SELECT_CC_VSSRC ||
               MI->getOpcode() == PPC::SELECT_CC_VSRC ||
               MI->getOpcode() == PPC::SELECT_I4 ||
               MI->getOpcode() == PPC::SELECT_I8 ||
@@ -8252,6 +8560,7 @@ PPCTargetLowering::EmitInstrWithCustomInserter(MachineInstr *MI,
               MI->getOpcode() == PPC::SELECT_QBRC ||
               MI->getOpcode() == PPC::SELECT_VRRC ||
               MI->getOpcode() == PPC::SELECT_VSFRC ||
+             MI->getOpcode() == PPC::SELECT_VSSRC ||
               MI->getOpcode() == PPC::SELECT_VSRC) {
      // The incoming instruction knows the destination vreg to set, the
      // condition code register to branch on, the true/false values to
@@ -8288,6 +8597,7 @@ PPCTargetLowering::EmitInstrWithCustomInserter(MachineInstr *MI,
          MI->getOpcode() == PPC::SELECT_QBRC ||
          MI->getOpcode() == PPC::SELECT_VRRC ||
          MI->getOpcode() == PPC::SELECT_VSFRC ||
+        MI->getOpcode() == PPC::SELECT_VSSRC ||
          MI->getOpcode() == PPC::SELECT_VSRC) {
        BuildMI(BB, dl, TII->get(PPC::BC))
          .addReg(MI->getOperand(1).getReg()).addMBB(sinkMBB);
@@ -8364,68 +8674,96 @@ PPCTargetLowering::EmitInstrWithCustomInserter(MachineInstr *MI,
    else if (MI->getOpcode() == PPC::ATOMIC_LOAD_ADD_I16)
      BB = EmitPartwordAtomicBinary(MI, BB, false, PPC::ADD4);
    else if (MI->getOpcode() == PPC::ATOMIC_LOAD_ADD_I32)
-    BB = EmitAtomicBinary(MI, BB, false, PPC::ADD4);
+    BB = EmitAtomicBinary(MI, BB, 4, PPC::ADD4);
    else if (MI->getOpcode() == PPC::ATOMIC_LOAD_ADD_I64)
-    BB = EmitAtomicBinary(MI, BB, true, PPC::ADD8);
+    BB = EmitAtomicBinary(MI, BB, 8, PPC::ADD8);
  
    else if (MI->getOpcode() == PPC::ATOMIC_LOAD_AND_I8)
      BB = EmitPartwordAtomicBinary(MI, BB, true, PPC::AND);
    else if (MI->getOpcode() == PPC::ATOMIC_LOAD_AND_I16)
      BB = EmitPartwordAtomicBinary(MI, BB, false, PPC::AND);
    else if (MI->getOpcode() == PPC::ATOMIC_LOAD_AND_I32)
-    BB = EmitAtomicBinary(MI, BB, false, PPC::AND);
+    BB = EmitAtomicBinary(MI, BB, 4, PPC::AND);
    else if (MI->getOpcode() == PPC::ATOMIC_LOAD_AND_I64)
-    BB = EmitAtomicBinary(MI, BB, true, PPC::AND8);
+    BB = EmitAtomicBinary(MI, BB, 8, PPC::AND8);
  
    else if (MI->getOpcode() == PPC::ATOMIC_LOAD_OR_I8)
      BB = EmitPartwordAtomicBinary(MI, BB, true, PPC::OR);
    else if (MI->getOpcode() == PPC::ATOMIC_LOAD_OR_I16)
      BB = EmitPartwordAtomicBinary(MI, BB, false, PPC::OR);
    else if (MI->getOpcode() == PPC::ATOMIC_LOAD_OR_I32)
-    BB = EmitAtomicBinary(MI, BB, false, PPC::OR);
+    BB = EmitAtomicBinary(MI, BB, 4, PPC::OR);
    else if (MI->getOpcode() == PPC::ATOMIC_LOAD_OR_I64)
-    BB = EmitAtomicBinary(MI, BB, true, PPC::OR8);
+    BB = EmitAtomicBinary(MI, BB, 8, PPC::OR8);
  
    else if (MI->getOpcode() == PPC::ATOMIC_LOAD_XOR_I8)
      BB = EmitPartwordAtomicBinary(MI, BB, true, PPC::XOR);
    else if (MI->getOpcode() == PPC::ATOMIC_LOAD_XOR_I16)
      BB = EmitPartwordAtomicBinary(MI, BB, false, PPC::XOR);
    else if (MI->getOpcode() == PPC::ATOMIC_LOAD_XOR_I32)
-    BB = EmitAtomicBinary(MI, BB, false, PPC::XOR);
+    BB = EmitAtomicBinary(MI, BB, 4, PPC::XOR);
    else if (MI->getOpcode() == PPC::ATOMIC_LOAD_XOR_I64)
-    BB = EmitAtomicBinary(MI, BB, true, PPC::XOR8);
+    BB = EmitAtomicBinary(MI, BB, 8, PPC::XOR8);
  
    else if (MI->getOpcode() == PPC::ATOMIC_LOAD_NAND_I8)
      BB = EmitPartwordAtomicBinary(MI, BB, true, PPC::NAND);
    else if (MI->getOpcode() == PPC::ATOMIC_LOAD_NAND_I16)
      BB = EmitPartwordAtomicBinary(MI, BB, false, PPC::NAND);
    else if (MI->getOpcode() == PPC::ATOMIC_LOAD_NAND_I32)
-    BB = EmitAtomicBinary(MI, BB, false, PPC::NAND);
+    BB = EmitAtomicBinary(MI, BB, 4, PPC::NAND);
    else if (MI->getOpcode() == PPC::ATOMIC_LOAD_NAND_I64)
-    BB = EmitAtomicBinary(MI, BB, true, PPC::NAND8);
+    BB = EmitAtomicBinary(MI, BB, 8, PPC::NAND8);
  
    else if (MI->getOpcode() == PPC::ATOMIC_LOAD_SUB_I8)
      BB = EmitPartwordAtomicBinary(MI, BB, true, PPC::SUBF);
    else if (MI->getOpcode() == PPC::ATOMIC_LOAD_SUB_I16)
      BB = EmitPartwordAtomicBinary(MI, BB, false, PPC::SUBF);
    else if (MI->getOpcode() == PPC::ATOMIC_LOAD_SUB_I32)
-    BB = EmitAtomicBinary(MI, BB, false, PPC::SUBF);
+    BB = EmitAtomicBinary(MI, BB, 4, PPC::SUBF);
    else if (MI->getOpcode() == PPC::ATOMIC_LOAD_SUB_I64)
-    BB = EmitAtomicBinary(MI, BB, true, PPC::SUBF8);
+    BB = EmitAtomicBinary(MI, BB, 8, PPC::SUBF8);
  
    else if (MI->getOpcode() == PPC::ATOMIC_SWAP_I8)
      BB = EmitPartwordAtomicBinary(MI, BB, true, 0);
    else if (MI->getOpcode() == PPC::ATOMIC_SWAP_I16)
      BB = EmitPartwordAtomicBinary(MI, BB, false, 0);
    else if (MI->getOpcode() == PPC::ATOMIC_SWAP_I32)
-    BB = EmitAtomicBinary(MI, BB, false, 0);
+    BB = EmitAtomicBinary(MI, BB, 4, 0);
    else if (MI->getOpcode() == PPC::ATOMIC_SWAP_I64)
-    BB = EmitAtomicBinary(MI, BB, true, 0);
+    BB = EmitAtomicBinary(MI, BB, 8, 0);
  
    else if (MI->getOpcode() == PPC::ATOMIC_CMP_SWAP_I32 ||
-           MI->getOpcode() == PPC::ATOMIC_CMP_SWAP_I64) {
+           MI->getOpcode() == PPC::ATOMIC_CMP_SWAP_I64 ||
+           (Subtarget.hasPartwordAtomics() &&
+            MI->getOpcode() == PPC::ATOMIC_CMP_SWAP_I8) ||
+           (Subtarget.hasPartwordAtomics() &&
+            MI->getOpcode() == PPC::ATOMIC_CMP_SWAP_I16)) {
      bool is64bit = MI->getOpcode() == PPC::ATOMIC_CMP_SWAP_I64;
  
+    auto LoadMnemonic = PPC::LDARX;
+    auto StoreMnemonic = PPC::STDCX;
+    switch(MI->getOpcode()) {
+    default:
+      llvm_unreachable("Compare and swap of unknown size");
+    case PPC::ATOMIC_CMP_SWAP_I8:
+      LoadMnemonic = PPC::LBARX;
+      StoreMnemonic = PPC::STBCX;
+      assert(Subtarget.hasPartwordAtomics() && "No support partword atomics.");
+      break;
+    case PPC::ATOMIC_CMP_SWAP_I16:
+      LoadMnemonic = PPC::LHARX;
+      StoreMnemonic = PPC::STHCX;
+      assert(Subtarget.hasPartwordAtomics() && "No support partword atomics.");
+      break;
+    case PPC::ATOMIC_CMP_SWAP_I32:
+      LoadMnemonic = PPC::LWARX;
+      StoreMnemonic = PPC::STWCX;
+      break;
+    case PPC::ATOMIC_CMP_SWAP_I64:
+      LoadMnemonic = PPC::LDARX;
+      StoreMnemonic = PPC::STDCX;
+      break;
+    }
      unsigned dest   = MI->getOperand(0).getReg();
      unsigned ptrA   = MI->getOperand(1).getReg();
      unsigned ptrB   = MI->getOperand(2).getReg();
@@ -8451,18 +8789,18 @@ PPCTargetLowering::EmitInstrWithCustomInserter(MachineInstr *MI,
      BB->addSuccessor(loop1MBB);
  
      // loop1MBB:
-    //   l[wd]arx dest, ptr
+    //   l[bhwd]arx dest, ptr
      //   cmp[wd] dest, oldval
      //   bne- midMBB
      // loop2MBB:
-    //   st[wd]cx. newval, ptr
+    //   st[bhwd]cx. newval, ptr
      //   bne- loopMBB
      //   b exitBB
      // midMBB:
-    //   st[wd]cx. dest, ptr
+    //   st[bhwd]cx. dest, ptr
      // exitBB:
      BB = loop1MBB;
-    BuildMI(BB, dl, TII->get(is64bit ? PPC::LDARX : PPC::LWARX), dest)
+    BuildMI(BB, dl, TII->get(LoadMnemonic), dest)
        .addReg(ptrA).addReg(ptrB);
      BuildMI(BB, dl, TII->get(is64bit ? PPC::CMPD : PPC::CMPW), PPC::CR0)
        .addReg(oldval).addReg(dest);
@@ -8472,7 +8810,7 @@ PPCTargetLowering::EmitInstrWithCustomInserter(MachineInstr *MI,
      BB->addSuccessor(midMBB);
  
      BB = loop2MBB;
-    BuildMI(BB, dl, TII->get(is64bit ? PPC::STDCX : PPC::STWCX))
+    BuildMI(BB, dl, TII->get(StoreMnemonic))
        .addReg(newval).addReg(ptrA).addReg(ptrB);
      BuildMI(BB, dl, TII->get(PPC::BCC))
        .addImm(PPC::PRED_NE).addReg(PPC::CR0).addMBB(loop1MBB);
@@ -8481,7 +8819,7 @@ PPCTargetLowering::EmitInstrWithCustomInserter(MachineInstr *MI,
      BB->addSuccessor(exitMBB);
  
      BB = midMBB;
-    BuildMI(BB, dl, TII->get(is64bit ? PPC::STDCX : PPC::STWCX))
+    BuildMI(BB, dl, TII->get(StoreMnemonic))
        .addReg(dest).addReg(ptrA).addReg(ptrB);
      BB->addSuccessor(exitMBB);
  
@@ -8681,6 +9019,12 @@ PPCTargetLowering::EmitInstrWithCustomInserter(MachineInstr *MI,
      BuildMI(*BB, MI, dl, TII->get(TargetOpcode::COPY),
              MI->getOperand(0).getReg())
        .addReg(isEQ ? PPC::CR0EQ : PPC::CR0GT);
+  } else if (MI->getOpcode() == PPC::TCHECK_RET) {
+    DebugLoc Dl = MI->getDebugLoc();
+    MachineRegisterInfo &RegInfo = F->getRegInfo();
+    unsigned CRReg = RegInfo.createVirtualRegister(&PPC::CRRCRegClass);
+    BuildMI(*BB, MI, Dl, TII->get(PPC::TCHECK), CRReg);
+    return BB;
    } else {
      llvm_unreachable("Unexpected instr type to insert");
    }
@@ -9511,13 +9855,13 @@ SDValue PPCTargetLowering::DAGCombineExtBoolTrunc(SDNode *N,
      return DAG.getNode(ISD::AND, dl, N->getValueType(0), N->getOperand(0),
                         DAG.getConstant(APInt::getLowBitsSet(
                                           N->getValueSizeInBits(0), PromBits),
-                                       N->getValueType(0)));
+                                       dl, N->getValueType(0)));
  
    assert(N->getOpcode() == ISD::SIGN_EXTEND &&
           "Invalid extension type");
-  EVT ShiftAmountTy = getShiftAmountTy(N->getValueType(0));
+  EVT ShiftAmountTy = getShiftAmountTy(N->getValueType(0), DAG.getDataLayout());
    SDValue ShiftCst =
-    DAG.getConstant(N->getValueSizeInBits(0)-PromBits, ShiftAmountTy);
+    DAG.getConstant(N->getValueSizeInBits(0) - PromBits, dl, ShiftAmountTy);
    return DAG.getNode(ISD::SRA, dl, N->getValueType(0), 
                       DAG.getNode(ISD::SHL, dl, N->getValueType(0),
                                   N->getOperand(0), ShiftCst), ShiftCst);
@@ -9583,7 +9927,7 @@ SDValue PPCTargetLowering::combineFPToIntToFP(SDNode *N,
  
      if (Op.getValueType() == MVT::f32 && !Subtarget.hasFPCVT()) {
        FP = DAG.getNode(ISD::FP_ROUND, dl,
-                       MVT::f32, FP, DAG.getIntPtrConstant(0));
+                       MVT::f32, FP, DAG.getIntPtrConstant(0, dl));
        DCI.AddToWorklist(FP.getNode());
      }
  
@@ -9621,7 +9965,9 @@ SDValue PPCTargetLowering::expandVSXLoadForLE(SDNode *N,
    case ISD::INTRINSIC_W_CHAIN: {
      MemIntrinsicSDNode *Intrin = cast<MemIntrinsicSDNode>(N);
      Chain = Intrin->getChain();
-    Base = Intrin->getBasePtr();
+    // Similarly to the store case below, Intrin->getBasePtr() doesn't get
+    // us what we want. Get operand 2 instead.
+    Base = Intrin->getOperand(2);
      MMO = Intrin->getMemOperand();
      break;
    }
@@ -9878,7 +10224,8 @@ SDValue PPCTargetLowering::PerformDAGCombine(SDNode *N,
                                  2*MemVT.getStoreSize()-1);
  
        // Create the new base load.
-      SDValue LDXIntID = DAG.getTargetConstant(IntrLD, getPointerTy());
+      SDValue LDXIntID =
+          DAG.getTargetConstant(IntrLD, dl, getPointerTy(MF.getDataLayout()));
        SDValue BaseLoadOps[] = { Chain, LDXIntID, Ptr };
        SDValue BaseLoad =
          DAG.getMemIntrinsicNode(ISD::INTRINSIC_W_CHAIN, dl,
@@ -9902,7 +10249,8 @@ SDValue PPCTargetLowering::PerformDAGCombine(SDNode *N,
        if (!findConsecutiveLoad(LD, DAG))
          --IncValue;
  
-      SDValue Increment = DAG.getConstant(IncValue, getPointerTy());
+      SDValue Increment =
+          DAG.getConstant(IncValue, dl, getPointerTy(MF.getDataLayout()));
        Ptr = DAG.getNode(ISD::ADD, dl, Ptr.getValueType(), Ptr, Increment);
  
        MachineMemOperand *ExtraMMO =
@@ -9934,7 +10282,7 @@ SDValue PPCTargetLowering::PerformDAGCombine(SDNode *N,
          Perm = Subtarget.hasAltivec() ?
                   DAG.getNode(ISD::BITCAST, dl, VT, Perm) :
                   DAG.getNode(ISD::FP_ROUND, dl, VT, Perm, // QPX
-                               DAG.getTargetConstant(1, MVT::i64));
+                               DAG.getTargetConstant(1, dl, MVT::i64));
                                 // second argument is 1 because this rounding
                                 // is always exact.
  
@@ -9987,7 +10335,7 @@ SDValue PPCTargetLowering::PerformDAGCombine(SDNode *N,
                  isa<ConstantSDNode>(UI->getOperand(1)) &&
                  (cast<ConstantSDNode>(Add->getOperand(1))->getZExtValue() -
                   cast<ConstantSDNode>(UI->getOperand(1))->getZExtValue()) %
-                (1 << Bits) == 0) {
+                (1ULL << Bits) == 0) {
                SDNode *OtherAdd = *UI;
                for (SDNode::use_iterator VI = OtherAdd->use_begin(),
                     VE = OtherAdd->use_end(); VI != VE; ++VI) {
@@ -10183,7 +10531,7 @@ SDValue PPCTargetLowering::PerformDAGCombine(SDNode *N,
  
      if (LHS.getOpcode() == ISD::INTRINSIC_WO_CHAIN &&
          isa<ConstantSDNode>(RHS) && (CC == ISD::SETEQ || CC == ISD::SETNE) &&
-        getAltivecCompareInfo(LHS, CompareOpc, isDot)) {
+        getAltivecCompareInfo(LHS, CompareOpc, isDot, Subtarget)) {
        assert(isDot && "Can't compare against a vector result!");
  
        // If this is a comparison against something other than 0/1, then we know
@@ -10203,7 +10551,7 @@ SDValue PPCTargetLowering::PerformDAGCombine(SDNode *N,
        SDValue Ops[] = {
          LHS.getOperand(2),  // LHS of compare
          LHS.getOperand(3),  // RHS of compare
-        DAG.getConstant(CompareOpc, MVT::i32)
+        DAG.getConstant(CompareOpc, dl, MVT::i32)
        };
        EVT VTs[] = { LHS.getOperand(2).getValueType(), MVT::Glue };
        SDValue CompNode = DAG.getNode(PPCISD::VCMPo, dl, VTs, Ops);
@@ -10227,7 +10575,7 @@ SDValue PPCTargetLowering::PerformDAGCombine(SDNode *N,
        }
  
        return DAG.getNode(PPCISD::COND_BRANCH, dl, MVT::Other, N->getOperand(0),
-                         DAG.getConstant(CompOpc, MVT::i32),
+                         DAG.getConstant(CompOpc, dl, MVT::i32),
                           DAG.getRegister(PPC::CR6, MVT::i32),
                           N->getOperand(4), CompNode.getValue(1));
      }
@@ -10255,14 +10603,14 @@ PPCTargetLowering::BuildSDIVPow2(SDNode *N, const APInt &Divisor,
  
    bool IsNegPow2 = (-Divisor).isPowerOf2();
    unsigned Lg2 = (IsNegPow2 ? -Divisor : Divisor).countTrailingZeros();
-  SDValue ShiftAmt = DAG.getConstant(Lg2, VT);
+  SDValue ShiftAmt = DAG.getConstant(Lg2, DL, VT);
  
    SDValue Op = DAG.getNode(PPCISD::SRA_ADDZE, DL, VT, N0, ShiftAmt);
    if (Created)
      Created->push_back(Op.getNode());
  
    if (IsNegPow2) {
-    Op = DAG.getNode(ISD::SUB, DL, VT, DAG.getConstant(0, VT), Op);
+    Op = DAG.getNode(ISD::SUB, DL, VT, DAG.getConstant(0, DL, VT), Op);
      if (Created)
        Created->push_back(Op.getNode());
    }
@@ -10296,14 +10644,17 @@ void PPCTargetLowering::computeKnownBitsForTargetNode(const SDValue Op,
      case Intrinsic::ppc_altivec_vcmpequb_p:
      case Intrinsic::ppc_altivec_vcmpequh_p:
      case Intrinsic::ppc_altivec_vcmpequw_p:
+    case Intrinsic::ppc_altivec_vcmpequd_p:
      case Intrinsic::ppc_altivec_vcmpgefp_p:
      case Intrinsic::ppc_altivec_vcmpgtfp_p:
      case Intrinsic::ppc_altivec_vcmpgtsb_p:
      case Intrinsic::ppc_altivec_vcmpgtsh_p:
      case Intrinsic::ppc_altivec_vcmpgtsw_p:
+    case Intrinsic::ppc_altivec_vcmpgtsd_p:
      case Intrinsic::ppc_altivec_vcmpgtub_p:
      case Intrinsic::ppc_altivec_vcmpgtuh_p:
      case Intrinsic::ppc_altivec_vcmpgtuw_p:
+    case Intrinsic::ppc_altivec_vcmpgtud_p:
        KnownZero = ~1U;  // All bits but the low one are known to be zero.
        break;
      }
@@ -10347,7 +10698,7 @@ unsigned PPCTargetLowering::getPrefLoopAlignment(MachineLoop *ML) const {
  /// getConstraintType - Given a constraint, return the type of
  /// constraint it is for this target.
  PPCTargetLowering::ConstraintType
-PPCTargetLowering::getConstraintType(const std::string &Constraint) const {
+PPCTargetLowering::getConstraintType(StringRef Constraint) const {
    if (Constraint.size() == 1) {
      switch (Constraint[0]) {
      default: break;
@@ -10430,8 +10781,9 @@ PPCTargetLowering::getSingleConstraintMatchWeight(
    return weight;
  }
  
-std::pair<unsigned, const TargetRegisterClass*>
-PPCTargetLowering::getRegForInlineAsmConstraint(const std::string &Constraint,
+std::pair<unsigned, const TargetRegisterClass *>
+PPCTargetLowering::getRegForInlineAsmConstraint(const TargetRegisterInfo *TRI,
+                                                StringRef Constraint,
                                                  MVT VT) const {
    if (Constraint.size() == 1) {
      // GCC RS6000 Constraint Letters
@@ -10469,11 +10821,14 @@ PPCTargetLowering::getRegForInlineAsmConstraint(const std::string &Constraint,
               Constraint == "wf") {
      return std::make_pair(0U, &PPC::VSRCRegClass);
    } else if (Constraint == "ws") {
-    return std::make_pair(0U, &PPC::VSFRCRegClass);
+    if (VT == MVT::f32)
+      return std::make_pair(0U, &PPC::VSSRCRegClass);
+    else
+      return std::make_pair(0U, &PPC::VSFRCRegClass);
    }
  
-  std::pair<unsigned, const TargetRegisterClass*> R =
-    TargetLowering::getRegForInlineAsmConstraint(Constraint, VT);
+  std::pair<unsigned, const TargetRegisterClass *> R =
+      TargetLowering::getRegForInlineAsmConstraint(TRI, Constraint, VT);
  
    // r[0-9]+ are used, on PPC64, to refer to the corresponding 64-bit registers
    // (which we call X[0-9]+). If a 64-bit value has been requested, and a
@@ -10482,12 +10837,10 @@ PPCTargetLowering::getRegForInlineAsmConstraint(const std::string &Constraint,
    // FIXME: If TargetLowering::getRegForInlineAsmConstraint could somehow use
    // the AsmName field from *RegisterInfo.td, then this would not be necessary.
    if (R.first && VT == MVT::i64 && Subtarget.isPPC64() &&
-      PPC::GPRCRegClass.contains(R.first)) {
-    const TargetRegisterInfo *TRI = Subtarget.getRegisterInfo();
+      PPC::GPRCRegClass.contains(R.first))
      return std::make_pair(TRI->getMatchingSuperReg(R.first,
                              PPC::sub_32, &PPC::G8RCRegClass),
                            &PPC::G8RCRegClass);
-  }
  
    // GCC accepts 'cc' as an alias for 'cr0', and we need to do the same.
    if (!R.second && StringRef("{cc}").equals_lower(Constraint)) {
@@ -10523,6 +10876,7 @@ void PPCTargetLowering::LowerAsmOperandForConstraint(SDValue Op,
    case 'P': {
      ConstantSDNode *CST = dyn_cast<ConstantSDNode>(Op);
      if (!CST) return; // Must be an immediate to match.
+    SDLoc dl(Op);
      int64_t Value = CST->getSExtValue();
      EVT TCVT = MVT::i64; // All constants taken to be 64 bits so that negative
                           // numbers are printed as such.
@@ -10530,35 +10884,35 @@ void PPCTargetLowering::LowerAsmOperandForConstraint(SDValue Op,
      default: llvm_unreachable("Unknown constraint letter!");
      case 'I':  // "I" is a signed 16-bit constant.
        if (isInt<16>(Value))
-        Result = DAG.getTargetConstant(Value, TCVT);
+        Result = DAG.getTargetConstant(Value, dl, TCVT);
        break;
      case 'J':  // "J" is a constant with only the high-order 16 bits nonzero.
        if (isShiftedUInt<16, 16>(Value))
-        Result = DAG.getTargetConstant(Value, TCVT);
+        Result = DAG.getTargetConstant(Value, dl, TCVT);
        break;
      case 'L':  // "L" is a signed 16-bit constant shifted left 16 bits.
        if (isShiftedInt<16, 16>(Value))
-        Result = DAG.getTargetConstant(Value, TCVT);
+        Result = DAG.getTargetConstant(Value, dl, TCVT);
        break;
      case 'K':  // "K" is a constant with only the low-order 16 bits nonzero.
        if (isUInt<16>(Value))
-        Result = DAG.getTargetConstant(Value, TCVT);
+        Result = DAG.getTargetConstant(Value, dl, TCVT);
        break;
      case 'M':  // "M" is a constant that is greater than 31.
        if (Value > 31)
-        Result = DAG.getTargetConstant(Value, TCVT);
+        Result = DAG.getTargetConstant(Value, dl, TCVT);
        break;
      case 'N':  // "N" is a positive constant that is an exact power of two.
        if (Value > 0 && isPowerOf2_64(Value))
-        Result = DAG.getTargetConstant(Value, TCVT);
+        Result = DAG.getTargetConstant(Value, dl, TCVT);
        break;
      case 'O':  // "O" is the constant zero.
        if (Value == 0)
-        Result = DAG.getTargetConstant(Value, TCVT);
+        Result = DAG.getTargetConstant(Value, dl, TCVT);
        break;
      case 'P':  // "P" is a constant whose negation is a signed 16-bit constant.
        if (isInt<16>(-Value))
-        Result = DAG.getTargetConstant(Value, TCVT);
+        Result = DAG.getTargetConstant(Value, dl, TCVT);
        break;
      }
      break;
@@ -10576,8 +10930,9 @@ void PPCTargetLowering::LowerAsmOperandForConstraint(SDValue Op,
  
  // isLegalAddressingMode - Return true if the addressing mode represented
  // by AM is legal for this target, for a load/store of the specified type.
-bool PPCTargetLowering::isLegalAddressingMode(const AddrMode &AM,
-                                              Type *Ty) const {
+bool PPCTargetLowering::isLegalAddressingMode(const DataLayout &DL,
+                                              const AddrMode &AM, Type *Ty,
+                                              unsigned AS) const {
    // PPC does not allow r+i addressing modes for vectors!
    if (Ty->isVectorTy() && AM.BaseOffs != 0)
      return false;
@@ -10629,22 +10984,22 @@ SDValue PPCTargetLowering::LowerRETURNADDR(SDValue Op,
    PPCFunctionInfo *FuncInfo = MF.getInfo<PPCFunctionInfo>();
    FuncInfo->setLRStoreRequired();
    bool isPPC64 = Subtarget.isPPC64();
+  auto PtrVT = getPointerTy(MF.getDataLayout());
  
    if (Depth > 0) {
      SDValue FrameAddr = LowerFRAMEADDR(Op, DAG);
      SDValue Offset =
-        DAG.getConstant(Subtarget.getFrameLowering()->getReturnSaveOffset(),
+        DAG.getConstant(Subtarget.getFrameLowering()->getReturnSaveOffset(), dl,
                          isPPC64 ? MVT::i64 : MVT::i32);
-    return DAG.getLoad(getPointerTy(), dl, DAG.getEntryNode(),
-                       DAG.getNode(ISD::ADD, dl, getPointerTy(),
-                                   FrameAddr, Offset),
+    return DAG.getLoad(PtrVT, dl, DAG.getEntryNode(),
+                       DAG.getNode(ISD::ADD, dl, PtrVT, FrameAddr, Offset),
                         MachinePointerInfo(), false, false, false, 0);
    }
  
    // Just load the return address off the stack.
    SDValue RetAddrFI = getReturnAddrFrameIndex(DAG);
-  return DAG.getLoad(getPointerTy(), dl, DAG.getEntryNode(),
-                     RetAddrFI, MachinePointerInfo(), false, false, false, 0);
+  return DAG.getLoad(PtrVT, dl, DAG.getEntryNode(), RetAddrFI,
+                     MachinePointerInfo(), false, false, false, 0);
  }
  
  SDValue PPCTargetLowering::LowerFRAMEADDR(SDValue Op,
@@ -10652,13 +11007,13 @@ SDValue PPCTargetLowering::LowerFRAMEADDR(SDValue Op,
    SDLoc dl(Op);
    unsigned Depth = cast<ConstantSDNode>(Op.getOperand(0))->getZExtValue();
  
-  EVT PtrVT = DAG.getTargetLoweringInfo().getPointerTy();
-  bool isPPC64 = PtrVT == MVT::i64;
-
    MachineFunction &MF = DAG.getMachineFunction();
    MachineFrameInfo *MFI = MF.getFrameInfo();
    MFI->setFrameAddressIsTaken(true);
  
+  EVT PtrVT = DAG.getTargetLoweringInfo().getPointerTy(MF.getDataLayout());
+  bool isPPC64 = PtrVT == MVT::i64;
+
    // Naked functions never have a frame pointer, and so we use r1. For all
    // other functions, this decision must be delayed until during PEI.
    unsigned FrameReg;
@@ -10914,11 +11269,29 @@ EVT PPCTargetLowering::getOptimalMemOpType(uint64_t Size,
                                             bool IsMemset, bool ZeroMemset,
                                             bool MemcpyStrSrc,
                                             MachineFunction &MF) const {
+  if (getTargetMachine().getOptLevel() != CodeGenOpt::None) {
+    const Function *F = MF.getFunction();
+    // When expanding a memset, require at least two QPX instructions to cover
+    // the cost of loading the value to be stored from the constant pool.
+    if (Subtarget.hasQPX() && Size >= 32 && (!IsMemset || Size >= 64) &&
+       (!SrcAlign || SrcAlign >= 32) && (!DstAlign || DstAlign >= 32) &&
+        !F->hasFnAttribute(Attribute::NoImplicitFloat)) {
+      return MVT::v4f64;
+    }
+
+    // We should use Altivec/VSX loads and stores when available. For unaligned
+    // addresses, unaligned VSX loads are only fast starting with the P8.
+    if (Subtarget.hasAltivec() && Size >= 16 &&
+        (((!SrcAlign || SrcAlign >= 16) && (!DstAlign || DstAlign >= 16)) ||
+         ((IsMemset && Subtarget.hasVSX()) || Subtarget.hasP8Vector())))
+      return MVT::v4i32;
+  }
+
    if (Subtarget.isPPC64()) {
      return MVT::i64;
-  } else {
-    return MVT::i32;
    }
+
+  return MVT::i32;
  }
  
  /// \brief Returns true if it is beneficial to convert a load of a constant