Move all of the header files which are involved in modelling the LLVM IR

[oota-llvm.git] / lib / CodeGen / SelectionDAG / TargetLowering.cpp
diff --git a/lib/CodeGen/SelectionDAG/TargetLowering.cpp b/lib/CodeGen/SelectionDAG/TargetLowering.cpp

index c2a58c6357ad0d7b4efed1a902ae104412ba5154..f63e226ff9c76c80d58ffc0b07e1921b8dc41ffb 100644 (file)
--- a/lib/CodeGen/SelectionDAG/TargetLowering.cpp
+++ b/lib/CodeGen/SelectionDAG/TargetLowering.cpp
@@ -12,55 +12,27 @@
  //===----------------------------------------------------------------------===//
  
  #include "llvm/Target/TargetLowering.h"
-#include "llvm/MC/MCAsmInfo.h"
-#include "llvm/MC/MCExpr.h"
-#include "llvm/Target/TargetData.h"
-#include "llvm/Target/TargetLoweringObjectFile.h"
-#include "llvm/Target/TargetMachine.h"
-#include "llvm/Target/TargetRegisterInfo.h"
-#include "llvm/GlobalVariable.h"
-#include "llvm/DerivedTypes.h"
+#include "llvm/ADT/BitVector.h"
+#include "llvm/ADT/STLExtras.h"
  #include "llvm/CodeGen/Analysis.h"
  #include "llvm/CodeGen/MachineFrameInfo.h"
-#include "llvm/CodeGen/MachineJumpTableInfo.h"
  #include "llvm/CodeGen/MachineFunction.h"
+#include "llvm/CodeGen/MachineJumpTableInfo.h"
  #include "llvm/CodeGen/SelectionDAG.h"
-#include "llvm/ADT/STLExtras.h"
+#include "llvm/IR/DataLayout.h"
+#include "llvm/IR/DerivedTypes.h"
+#include "llvm/IR/GlobalVariable.h"
+#include "llvm/MC/MCAsmInfo.h"
+#include "llvm/MC/MCExpr.h"
  #include "llvm/Support/CommandLine.h"
  #include "llvm/Support/ErrorHandling.h"
  #include "llvm/Support/MathExtras.h"
+#include "llvm/Target/TargetLoweringObjectFile.h"
+#include "llvm/Target/TargetMachine.h"
+#include "llvm/Target/TargetRegisterInfo.h"
  #include <cctype>
  using namespace llvm;
  
-/// We are in the process of implementing a new TypeLegalization action
-/// - the promotion of vector elements. This feature is disabled by default
-/// and only enabled using this flag.
-static cl::opt<bool>
-AllowPromoteIntElem("promote-elements", cl::Hidden,
-  cl::desc("Allow promotion of integer vector element types"));
-
-namespace llvm {
-TLSModel::Model getTLSModel(const GlobalValue *GV, Reloc::Model reloc) {
-  bool isLocal = GV->hasLocalLinkage();
-  bool isDeclaration = GV->isDeclaration();
-  // FIXME: what should we do for protected and internal visibility?
-  // For variables, is internal different from hidden?
-  bool isHidden = GV->hasHiddenVisibility();
-
-  if (reloc == Reloc::PIC_) {
-    if (isLocal || isHidden)
-      return TLSModel::LocalDynamic;
-    else
-      return TLSModel::GeneralDynamic;
-  } else {
-    if (!isDeclaration || isHidden)
-      return TLSModel::LocalExec;
-    else
-      return TLSModel::InitialExec;
-  }
-}
-}
-
  /// InitLibcallNames - Set default libcall names.
  ///
  static void InitLibcallNames(const char **Names) {
@@ -317,7 +289,7 @@ static void InitLibcallNames(const char **Names) {
    Names[RTLIB::SYNC_FETCH_AND_OR_8] = "__sync_fetch_and_or_8";
    Names[RTLIB::SYNC_FETCH_AND_XOR_1] = "__sync_fetch_and_xor_1";
    Names[RTLIB::SYNC_FETCH_AND_XOR_2] = "__sync_fetch_and_xor_2";
-  Names[RTLIB::SYNC_FETCH_AND_XOR_4] = "__sync_fetch_and-xor_4";
+  Names[RTLIB::SYNC_FETCH_AND_XOR_4] = "__sync_fetch_and_xor_4";
    Names[RTLIB::SYNC_FETCH_AND_XOR_8] = "__sync_fetch_and_xor_8";
    Names[RTLIB::SYNC_FETCH_AND_NAND_1] = "__sync_fetch_and_nand_1";
    Names[RTLIB::SYNC_FETCH_AND_NAND_2] = "__sync_fetch_and_nand_2";
@@ -456,29 +428,29 @@ RTLIB::Libcall RTLIB::getSINTTOFP(EVT OpVT, EVT RetVT) {
    if (OpVT == MVT::i32) {
      if (RetVT == MVT::f32)
        return SINTTOFP_I32_F32;
-    else if (RetVT == MVT::f64)
+    if (RetVT == MVT::f64)
        return SINTTOFP_I32_F64;
-    else if (RetVT == MVT::f80)
+    if (RetVT == MVT::f80)
        return SINTTOFP_I32_F80;
-    else if (RetVT == MVT::ppcf128)
+    if (RetVT == MVT::ppcf128)
        return SINTTOFP_I32_PPCF128;
    } else if (OpVT == MVT::i64) {
      if (RetVT == MVT::f32)
        return SINTTOFP_I64_F32;
-    else if (RetVT == MVT::f64)
+    if (RetVT == MVT::f64)
        return SINTTOFP_I64_F64;
-    else if (RetVT == MVT::f80)
+    if (RetVT == MVT::f80)
        return SINTTOFP_I64_F80;
-    else if (RetVT == MVT::ppcf128)
+    if (RetVT == MVT::ppcf128)
        return SINTTOFP_I64_PPCF128;
    } else if (OpVT == MVT::i128) {
      if (RetVT == MVT::f32)
        return SINTTOFP_I128_F32;
-    else if (RetVT == MVT::f64)
+    if (RetVT == MVT::f64)
        return SINTTOFP_I128_F64;
-    else if (RetVT == MVT::f80)
+    if (RetVT == MVT::f80)
        return SINTTOFP_I128_F80;
-    else if (RetVT == MVT::ppcf128)
+    if (RetVT == MVT::ppcf128)
        return SINTTOFP_I128_PPCF128;
    }
    return UNKNOWN_LIBCALL;
@@ -490,29 +462,29 @@ RTLIB::Libcall RTLIB::getUINTTOFP(EVT OpVT, EVT RetVT) {
    if (OpVT == MVT::i32) {
      if (RetVT == MVT::f32)
        return UINTTOFP_I32_F32;
-    else if (RetVT == MVT::f64)
+    if (RetVT == MVT::f64)
        return UINTTOFP_I32_F64;
-    else if (RetVT == MVT::f80)
+    if (RetVT == MVT::f80)
        return UINTTOFP_I32_F80;
-    else if (RetVT == MVT::ppcf128)
+    if (RetVT == MVT::ppcf128)
        return UINTTOFP_I32_PPCF128;
    } else if (OpVT == MVT::i64) {
      if (RetVT == MVT::f32)
        return UINTTOFP_I64_F32;
-    else if (RetVT == MVT::f64)
+    if (RetVT == MVT::f64)
        return UINTTOFP_I64_F64;
-    else if (RetVT == MVT::f80)
+    if (RetVT == MVT::f80)
        return UINTTOFP_I64_F80;
-    else if (RetVT == MVT::ppcf128)
+    if (RetVT == MVT::ppcf128)
        return UINTTOFP_I64_PPCF128;
    } else if (OpVT == MVT::i128) {
      if (RetVT == MVT::f32)
        return UINTTOFP_I128_F32;
-    else if (RetVT == MVT::f64)
+    if (RetVT == MVT::f64)
        return UINTTOFP_I128_F64;
-    else if (RetVT == MVT::f80)
+    if (RetVT == MVT::f80)
        return UINTTOFP_I128_F80;
-    else if (RetVT == MVT::ppcf128)
+    if (RetVT == MVT::ppcf128)
        return UINTTOFP_I128_PPCF128;
    }
    return UNKNOWN_LIBCALL;
@@ -543,8 +515,7 @@ static void InitCmpLibcallCCs(ISD::CondCode *CCs) {
  /// NOTE: The constructor takes ownership of TLOF.
  TargetLowering::TargetLowering(const TargetMachine &tm,
                                 const TargetLoweringObjectFile *tlof)
-  : TM(tm), TD(TM.getTargetData()), TLOF(*tlof),
-  mayPromoteElements(AllowPromoteIntElem) {
+  : TM(tm), TD(TM.getDataLayout()), TLOF(*tlof) {
    // All operations default to being supported.
    memset(OpActions, 0, sizeof(OpActions));
    memset(LoadExtActions, 0, sizeof(LoadExtActions));
@@ -572,27 +543,53 @@ TargetLowering::TargetLowering(const TargetMachine &tm,
    // ConstantFP nodes default to expand.  Targets can either change this to
    // Legal, in which case all fp constants are legal, or use isFPImmLegal()
    // to optimize expansions for certain constants.
+  setOperationAction(ISD::ConstantFP, MVT::f16, Expand);
    setOperationAction(ISD::ConstantFP, MVT::f32, Expand);
    setOperationAction(ISD::ConstantFP, MVT::f64, Expand);
    setOperationAction(ISD::ConstantFP, MVT::f80, Expand);
  
    // These library functions default to expand.
-  setOperationAction(ISD::FLOG , MVT::f64, Expand);
-  setOperationAction(ISD::FLOG2, MVT::f64, Expand);
-  setOperationAction(ISD::FLOG10,MVT::f64, Expand);
-  setOperationAction(ISD::FEXP , MVT::f64, Expand);
-  setOperationAction(ISD::FEXP2, MVT::f64, Expand);
-  setOperationAction(ISD::FLOG , MVT::f32, Expand);
-  setOperationAction(ISD::FLOG2, MVT::f32, Expand);
-  setOperationAction(ISD::FLOG10,MVT::f32, Expand);
-  setOperationAction(ISD::FEXP , MVT::f32, Expand);
-  setOperationAction(ISD::FEXP2, MVT::f32, Expand);
+  setOperationAction(ISD::FLOG ,  MVT::f16, Expand);
+  setOperationAction(ISD::FLOG2,  MVT::f16, Expand);
+  setOperationAction(ISD::FLOG10, MVT::f16, Expand);
+  setOperationAction(ISD::FEXP ,  MVT::f16, Expand);
+  setOperationAction(ISD::FEXP2,  MVT::f16, Expand);
+  setOperationAction(ISD::FFLOOR, MVT::f16, Expand);
+  setOperationAction(ISD::FNEARBYINT, MVT::f16, Expand);
+  setOperationAction(ISD::FCEIL,  MVT::f16, Expand);
+  setOperationAction(ISD::FRINT,  MVT::f16, Expand);
+  setOperationAction(ISD::FTRUNC, MVT::f16, Expand);
+  setOperationAction(ISD::FLOG ,  MVT::f32, Expand);
+  setOperationAction(ISD::FLOG2,  MVT::f32, Expand);
+  setOperationAction(ISD::FLOG10, MVT::f32, Expand);
+  setOperationAction(ISD::FEXP ,  MVT::f32, Expand);
+  setOperationAction(ISD::FEXP2,  MVT::f32, Expand);
+  setOperationAction(ISD::FFLOOR, MVT::f32, Expand);
+  setOperationAction(ISD::FNEARBYINT, MVT::f32, Expand);
+  setOperationAction(ISD::FCEIL,  MVT::f32, Expand);
+  setOperationAction(ISD::FRINT,  MVT::f32, Expand);
+  setOperationAction(ISD::FTRUNC, MVT::f32, Expand);
+  setOperationAction(ISD::FLOG ,  MVT::f64, Expand);
+  setOperationAction(ISD::FLOG2,  MVT::f64, Expand);
+  setOperationAction(ISD::FLOG10, MVT::f64, Expand);
+  setOperationAction(ISD::FEXP ,  MVT::f64, Expand);
+  setOperationAction(ISD::FEXP2,  MVT::f64, Expand);
+  setOperationAction(ISD::FFLOOR, MVT::f64, Expand);
+  setOperationAction(ISD::FNEARBYINT, MVT::f64, Expand);
+  setOperationAction(ISD::FCEIL,  MVT::f64, Expand);
+  setOperationAction(ISD::FRINT,  MVT::f64, Expand);
+  setOperationAction(ISD::FTRUNC, MVT::f64, Expand);
  
    // Default ISD::TRAP to expand (which turns it into abort).
    setOperationAction(ISD::TRAP, MVT::Other, Expand);
  
+  // On most systems, DEBUGTRAP and TRAP have no difference. The "Expand"
+  // here is to inform DAG Legalizer to replace DEBUGTRAP with TRAP.
+  //
+  setOperationAction(ISD::DEBUGTRAP, MVT::Other, Expand);
+
    IsLittleEndian = TD->isLittleEndian();
-  PointerTy = MVT::getIntegerVT(8*TD->getPointerSize());
+  PointerTy = MVT::getIntegerVT(8*TD->getPointerSize(0));
    memset(RegClassForVT, 0,MVT::LAST_VALUETYPE*sizeof(TargetRegisterClass*));
    memset(TargetDAGCombineArray, 0, array_lengthof(TargetDAGCombineArray));
    maxStoresPerMemset = maxStoresPerMemcpy = maxStoresPerMemmove = 8;
@@ -605,12 +602,13 @@ TargetLowering::TargetLowering(const TargetMachine &tm,
    IntDivIsCheap = false;
    Pow2DivIsCheap = false;
    JumpIsExpensive = false;
+  predictableSelectIsExpensive = false;
    StackPointerRegisterToSaveRestore = 0;
    ExceptionPointerRegister = 0;
    ExceptionSelectorRegister = 0;
    BooleanContents = UndefinedBooleanContent;
    BooleanVectorContents = UndefinedBooleanContent;
-  SchedPreferenceInfo = Sched::Latency;
+  SchedPreferenceInfo = Sched::ILP;
    JumpBufSize = 0;
    JumpBufAlignment = 0;
    MinFunctionAlignment = 0;
@@ -619,6 +617,8 @@ TargetLowering::TargetLowering(const TargetMachine &tm,
    MinStackArgumentAlignment = 1;
    ShouldFoldAtomicFences = false;
    InsertFencesForAtomic = false;
+  SupportJumpTables = true;
+  MinimumJumpTableEntries = 4;
  
    InitLibcallNames(LibcallRoutineNames);
    InitCmpLibcallCCs(CmpLibcallCCs);
@@ -630,7 +630,7 @@ TargetLowering::~TargetLowering() {
  }
  
  MVT TargetLowering::getShiftAmountTy(EVT LHSTy) const {
-  return MVT::getIntegerVT(8*TD->getPointerSize());
+  return MVT::getIntegerVT(8*TD->getPointerSize(0));
  }
  
  /// canOpTrap - Returns true if the operation can trap for the value type.
@@ -653,7 +653,7 @@ bool TargetLowering::canOpTrap(unsigned Op, EVT VT) const {
  
  static unsigned getVectorTypeBreakdownMVT(MVT VT, MVT &IntermediateVT,
                                            unsigned &NumIntermediates,
-                                          EVT &RegisterVT,
+                                          MVT &RegisterVT,
                                            TargetLowering *TLI) {
    // Figure out the right, legal destination reg to copy into.
    unsigned NumElts = VT.getVectorNumElements();
@@ -688,7 +688,7 @@ static unsigned getVectorTypeBreakdownMVT(MVT VT, MVT &IntermediateVT,
    if (!isPowerOf2_32(NewVTSize))
      NewVTSize = NextPowerOf2(NewVTSize);
  
-  EVT DestVT = TLI->getRegisterType(NewVT);
+  MVT DestVT = TLI->getRegisterType(NewVT);
    RegisterVT = DestVT;
    if (EVT(DestVT).bitsLT(NewVT))    // Value is expanded, e.g. i64 -> i16.
      return NumVectorRegs*(NewVTSize/DestVT.getSizeInBits());
@@ -709,42 +709,34 @@ bool TargetLowering::isLegalRC(const TargetRegisterClass *RC) const {
    return false;
  }
  
-/// hasLegalSuperRegRegClasses - Return true if the specified register class
-/// has one or more super-reg register classes that are legal.
-bool
-TargetLowering::hasLegalSuperRegRegClasses(const TargetRegisterClass *RC) const{
-  if (*RC->superregclasses_begin() == 0)
-    return false;
-  for (TargetRegisterInfo::regclass_iterator I = RC->superregclasses_begin(),
-         E = RC->superregclasses_end(); I != E; ++I) {
-    const TargetRegisterClass *RRC = *I;
-    if (isLegalRC(RRC))
-      return true;
-  }
-  return false;
-}
-
  /// findRepresentativeClass - Return the largest legal super-reg register class
  /// of the register class for the specified type and its associated "cost".
  std::pair<const TargetRegisterClass*, uint8_t>
-TargetLowering::findRepresentativeClass(EVT VT) const {
-  const TargetRegisterClass *RC = RegClassForVT[VT.getSimpleVT().SimpleTy];
+TargetLowering::findRepresentativeClass(MVT VT) const {
+  const TargetRegisterInfo *TRI = getTargetMachine().getRegisterInfo();
+  const TargetRegisterClass *RC = RegClassForVT[VT.SimpleTy];
    if (!RC)
      return std::make_pair(RC, 0);
+
+  // Compute the set of all super-register classes.
+  BitVector SuperRegRC(TRI->getNumRegClasses());
+  for (SuperRegClassIterator RCI(RC, TRI); RCI.isValid(); ++RCI)
+    SuperRegRC.setBitsInMask(RCI.getMask());
+
+  // Find the first legal register class with the largest spill size.
    const TargetRegisterClass *BestRC = RC;
-  for (TargetRegisterInfo::regclass_iterator I = RC->superregclasses_begin(),
-         E = RC->superregclasses_end(); I != E; ++I) {
-    const TargetRegisterClass *RRC = *I;
-    if (RRC->isASubClass() || !isLegalRC(RRC))
+  for (int i = SuperRegRC.find_first(); i >= 0; i = SuperRegRC.find_next(i)) {
+    const TargetRegisterClass *SuperRC = TRI->getRegClass(i);
+    // We want the largest possible spill size.
+    if (SuperRC->getSize() <= BestRC->getSize())
        continue;
-    if (!hasLegalSuperRegRegClasses(RRC))
-      return std::make_pair(RRC, 1);
-    BestRC = RRC;
+    if (!isLegalRC(SuperRC))
+      continue;
+    BestRC = SuperRC;
    }
    return std::make_pair(BestRC, 1);
  }
  
-
  /// computeRegisterProperties - Once all of the register classes are added,
  /// this allows us to compute derived properties we expose.
  void TargetLowering::computeRegisterProperties() {
@@ -766,14 +758,13 @@ void TargetLowering::computeRegisterProperties() {
  
    // Every integer value type larger than this largest register takes twice as
    // many registers to represent as the previous ValueType.
-  for (unsigned ExpandedReg = LargestIntReg + 1; ; ++ExpandedReg) {
-    EVT ExpandedVT = (MVT::SimpleValueType)ExpandedReg;
-    if (!ExpandedVT.isInteger())
-      break;
+  for (unsigned ExpandedReg = LargestIntReg + 1;
+       ExpandedReg <= MVT::LAST_INTEGER_VALUETYPE; ++ExpandedReg) {
      NumRegistersForVT[ExpandedReg] = 2*NumRegistersForVT[ExpandedReg-1];
      RegisterTypeForVT[ExpandedReg] = (MVT::SimpleValueType)LargestIntReg;
      TransformToType[ExpandedReg] = (MVT::SimpleValueType)(ExpandedReg - 1);
-    ValueTypeActions.setTypeAction(ExpandedVT, TypeExpandInteger);
+    ValueTypeActions.setTypeAction((MVT::SimpleValueType)ExpandedReg,
+                                   TypeExpandInteger);
    }
  
    // Inspect all of the ValueType's smaller than the largest integer
@@ -781,12 +772,12 @@ void TargetLowering::computeRegisterProperties() {
    unsigned LegalIntReg = LargestIntReg;
    for (unsigned IntReg = LargestIntReg - 1;
         IntReg >= (unsigned)MVT::i1; --IntReg) {
-    EVT IVT = (MVT::SimpleValueType)IntReg;
+    MVT IVT = (MVT::SimpleValueType)IntReg;
      if (isTypeLegal(IVT)) {
        LegalIntReg = IntReg;
      } else {
        RegisterTypeForVT[IntReg] = TransformToType[IntReg] =
-        (MVT::SimpleValueType)LegalIntReg;
+        (const MVT::SimpleValueType)LegalIntReg;
        ValueTypeActions.setTypeAction(IVT, TypePromoteInteger);
      }
    }
@@ -832,17 +823,14 @@ void TargetLowering::computeRegisterProperties() {
  
      // Determine if there is a legal wider type.  If so, we should promote to
      // that wider vector type.
-    EVT EltVT = VT.getVectorElementType();
+    MVT EltVT = VT.getVectorElementType();
      unsigned NElts = VT.getVectorNumElements();
-    if (NElts != 1) {
+    if (NElts != 1 && !shouldSplitVectorElementType(EltVT)) {
        bool IsLegalWiderType = false;
-      // If we allow the promotion of vector elements using a flag,
-      // then return TypePromoteInteger on vector elements.
        // First try to promote the elements of integer vectors. If no legal
        // promotion was found, fallback to the widen-vector method.
-      if (mayPromoteElements)
        for (unsigned nVT = i+1; nVT <= MVT::LAST_VECTOR_VALUETYPE; ++nVT) {
-        EVT SVT = (MVT::SimpleValueType)nVT;
+        MVT SVT = (MVT::SimpleValueType)nVT;
          // Promote vectors of integers to vectors with the same number
          // of elements, with a wider element type.
          if (SVT.getVectorElementType().getSizeInBits() > EltVT.getSizeInBits()
@@ -861,7 +849,7 @@ void TargetLowering::computeRegisterProperties() {
  
        // Try to widen the vector.
        for (unsigned nVT = i+1; nVT <= MVT::LAST_VECTOR_VALUETYPE; ++nVT) {
-        EVT SVT = (MVT::SimpleValueType)nVT;
+        MVT SVT = (MVT::SimpleValueType)nVT;
          if (SVT.getVectorElementType() == EltVT &&
              SVT.getVectorNumElements() > NElts &&
              isTypeLegal(SVT)) {
@@ -877,14 +865,14 @@ void TargetLowering::computeRegisterProperties() {
      }
  
      MVT IntermediateVT;
-    EVT RegisterVT;
+    MVT RegisterVT;
      unsigned NumIntermediates;
      NumRegistersForVT[i] =
        getVectorTypeBreakdownMVT(VT, IntermediateVT, NumIntermediates,
                                  RegisterVT, this);
      RegisterTypeForVT[i] = RegisterVT;
  
-    EVT NVT = VT.getPow2VectorType();
+    MVT NVT = VT.getPow2VectorType();
      if (NVT == VT) {
        // Type is already a power of 2.  The default action is to split.
        TransformToType[i] = MVT::Other;
@@ -915,10 +903,9 @@ const char *TargetLowering::getTargetNodeName(unsigned Opcode) const {
    return NULL;
  }
  
-
  EVT TargetLowering::getSetCCResultType(EVT VT) const {
    assert(!VT.isVector() && "No default SetCC type for vectors!");
-  return PointerTy.SimpleTy;
+  return getPointerTy(0).SimpleTy;
  }
  
  MVT::SimpleValueType TargetLowering::getCmpLibcallReturnType() const {
@@ -937,16 +924,20 @@ MVT::SimpleValueType TargetLowering::getCmpLibcallReturnType() const {
  unsigned TargetLowering::getVectorTypeBreakdown(LLVMContext &Context, EVT VT,
                                                  EVT &IntermediateVT,
                                                  unsigned &NumIntermediates,
-                                                EVT &RegisterVT) const {
+                                                MVT &RegisterVT) const {
    unsigned NumElts = VT.getVectorNumElements();
  
    // If there is a wider vector type with the same element type as this one,
-  // we should widen to that legal vector type.  This handles things like
-  // <2 x float> -> <4 x float>.
-  if (NumElts != 1 && getTypeAction(Context, VT) == TypeWidenVector) {
-    RegisterVT = getTypeToTransformTo(Context, VT);
-    if (isTypeLegal(RegisterVT)) {
-      IntermediateVT = RegisterVT;
+  // or a promoted vector type that has the same number of elements which
+  // are wider, then we should convert to that legal vector type.
+  // This handles things like <2 x float> -> <4 x float> and
+  // <4 x i1> -> <4 x i32>.
+  LegalizeTypeAction TA = getTypeAction(Context, VT);
+  if (NumElts != 1 && (TA == TypeWidenVector || TA == TypePromoteInteger)) {
+    EVT RegisterEVT = getTypeToTransformTo(Context, VT);
+    if (isTypeLegal(RegisterEVT)) {
+      IntermediateVT = RegisterEVT;
+      RegisterVT = RegisterEVT.getSimpleVT();
        NumIntermediates = 1;
        return 1;
      }
@@ -979,7 +970,7 @@ unsigned TargetLowering::getVectorTypeBreakdown(LLVMContext &Context, EVT VT,
      NewVT = EltTy;
    IntermediateVT = NewVT;
  
-  EVT DestVT = getRegisterType(Context, NewVT);
+  MVT DestVT = getRegisterType(Context, NewVT);
    RegisterVT = DestVT;
    unsigned NewVTSize = NewVT.getSizeInBits();
  
@@ -987,7 +978,7 @@ unsigned TargetLowering::getVectorTypeBreakdown(LLVMContext &Context, EVT VT,
    if (!isPowerOf2_32(NewVTSize))
      NewVTSize = NextPowerOf2(NewVTSize);
  
-  if (DestVT.bitsLT(NewVT))   // Value is expanded, e.g. i64 -> i16.
+  if (EVT(DestVT).bitsLT(NewVT))   // Value is expanded, e.g. i64 -> i16.
      return NumVectorRegs*(NewVTSize/DestVT.getSizeInBits());
  
    // Otherwise, promotion or legal types use the same number of registers as
@@ -999,23 +990,21 @@ unsigned TargetLowering::getVectorTypeBreakdown(LLVMContext &Context, EVT VT,
  /// type of the given function.  This does not require a DAG or a return value,
  /// and is suitable for use before any DAGs for the function are constructed.
  /// TODO: Move this out of TargetLowering.cpp.
-void llvm::GetReturnInfo(Type* ReturnType, Attributes attr,
+void llvm::GetReturnInfo(Type* ReturnType, AttributeSet attr,
                           SmallVectorImpl<ISD::OutputArg> &Outs,
-                         const TargetLowering &TLI,
-                         SmallVectorImpl<uint64_t> *Offsets) {
+                         const TargetLowering &TLI) {
    SmallVector<EVT, 4> ValueVTs;
    ComputeValueVTs(TLI, ReturnType, ValueVTs);
    unsigned NumValues = ValueVTs.size();
    if (NumValues == 0) return;
-  unsigned Offset = 0;
  
    for (unsigned j = 0, f = NumValues; j != f; ++j) {
      EVT VT = ValueVTs[j];
      ISD::NodeType ExtendKind = ISD::ANY_EXTEND;
  
-    if (attr & Attribute::SExt)
+    if (attr.hasAttribute(AttributeSet::ReturnIndex, Attribute::SExt))
        ExtendKind = ISD::SIGN_EXTEND;
-    else if (attr & Attribute::ZExt)
+    else if (attr.hasAttribute(AttributeSet::ReturnIndex, Attribute::ZExt))
        ExtendKind = ISD::ZERO_EXTEND;
  
      // FIXME: C calling convention requires the return type to be promoted to
@@ -1023,34 +1012,27 @@ void llvm::GetReturnInfo(Type* ReturnType, Attributes attr,
      // conventions. The frontend should mark functions whose return values
      // require promoting with signext or zeroext attributes.
      if (ExtendKind != ISD::ANY_EXTEND && VT.isInteger()) {
-      EVT MinVT = TLI.getRegisterType(ReturnType->getContext(), MVT::i32);
+      MVT MinVT = TLI.getRegisterType(ReturnType->getContext(), MVT::i32);
        if (VT.bitsLT(MinVT))
          VT = MinVT;
      }
  
      unsigned NumParts = TLI.getNumRegisters(ReturnType->getContext(), VT);
-    EVT PartVT = TLI.getRegisterType(ReturnType->getContext(), VT);
-    unsigned PartSize = TLI.getTargetData()->getTypeAllocSize(
-                        PartVT.getTypeForEVT(ReturnType->getContext()));
+    MVT PartVT = TLI.getRegisterType(ReturnType->getContext(), VT);
  
      // 'inreg' on function refers to return value
      ISD::ArgFlagsTy Flags = ISD::ArgFlagsTy();
-    if (attr & Attribute::InReg)
+    if (attr.hasAttribute(AttributeSet::ReturnIndex, Attribute::InReg))
        Flags.setInReg();
  
      // Propagate extension type if any
-    if (attr & Attribute::SExt)
+    if (attr.hasAttribute(AttributeSet::ReturnIndex, Attribute::SExt))
        Flags.setSExt();
-    else if (attr & Attribute::ZExt)
+    else if (attr.hasAttribute(AttributeSet::ReturnIndex, Attribute::ZExt))
        Flags.setZExt();
  
-    for (unsigned i = 0; i < NumParts; ++i) {
-      Outs.push_back(ISD::OutputArg(Flags, PartVT, /*isFixed=*/true));
-      if (Offsets) {
-        Offsets->push_back(Offset);
-        Offset += PartSize;
-      }
-    }
+    for (unsigned i = 0; i < NumParts; ++i)
+      Outs.push_back(ISD::OutputArg(Flags, PartVT, /*isFixed=*/true, 0, 0));
    }
  }
  
@@ -1080,8 +1062,12 @@ unsigned TargetLowering::getJumpTableEncoding() const {
  SDValue TargetLowering::getPICJumpTableRelocBase(SDValue Table,
                                                   SelectionDAG &DAG) const {
    // If our PIC model is GP relative, use the global offset table as the base.
-  if (getJumpTableEncoding() == MachineJumpTableInfo::EK_GPRel32BlockAddress)
-    return DAG.getGLOBAL_OFFSET_TABLE(getPointerTy());
+  unsigned JTEncoding = getJumpTableEncoding();
+
+  if ((JTEncoding == MachineJumpTableInfo::EK_GPRel64BlockAddress) ||
+      (JTEncoding == MachineJumpTableInfo::EK_GPRel32BlockAddress))
+    return DAG.getGLOBAL_OFFSET_TABLE(getPointerTy(0));
+
    return Table;
  }
  
@@ -1176,7 +1162,8 @@ TargetLowering::TargetLoweringOpt::ShrinkDemandedOp(SDValue Op,
    // Search for the smallest integer type with free casts to and from
    // Op's type. For expedience, just check power-of-2 integer types.
    const TargetLowering &TLI = DAG.getTargetLoweringInfo();
-  unsigned SmallVTBits = BitWidth - Demanded.countLeadingZeros();
+  unsigned DemandedSize = BitWidth - Demanded.countLeadingZeros();
+  unsigned SmallVTBits = DemandedSize;
    if (!isPowerOf2_32(SmallVTBits))
      SmallVTBits = NextPowerOf2(SmallVTBits);
    for (; SmallVTBits < BitWidth; SmallVTBits = NextPowerOf2(SmallVTBits)) {
@@ -1189,7 +1176,9 @@ TargetLowering::TargetLoweringOpt::ShrinkDemandedOp(SDValue Op,
                                            Op.getNode()->getOperand(0)),
                                DAG.getNode(ISD::TRUNCATE, dl, SmallVT,
                                            Op.getNode()->getOperand(1)));
-      SDValue Z = DAG.getNode(ISD::ZERO_EXTEND, dl, Op.getValueType(), X);
+      bool NeedZext = DemandedSize > SmallVTBits;
+      SDValue Z = DAG.getNode(NeedZext ? ISD::ZERO_EXTEND : ISD::ANY_EXTEND,
+                              dl, Op.getValueType(), X);
        return CombineTo(Op, Z);
      }
    }
@@ -1223,7 +1212,7 @@ bool TargetLowering::SimplifyDemandedBits(SDValue Op,
      if (Depth != 0) {
        // If not at the root, Just compute the KnownZero/KnownOne bits to
        // simplify things downstream.
-      TLO.DAG.ComputeMaskedBits(Op, DemandedMask, KnownZero, KnownOne, Depth);
+      TLO.DAG.ComputeMaskedBits(Op, KnownZero, KnownOne, Depth);
        return false;
      }
      // If this is the root being simplified, allow it to have multiple uses,
@@ -1242,8 +1231,8 @@ bool TargetLowering::SimplifyDemandedBits(SDValue Op,
    switch (Op.getOpcode()) {
    case ISD::Constant:
      // We know all of the bits for a constant!
-    KnownOne = cast<ConstantSDNode>(Op)->getAPIntValue() & NewMask;
-    KnownZero = ~KnownOne & NewMask;
+    KnownOne = cast<ConstantSDNode>(Op)->getAPIntValue();
+    KnownZero = ~KnownOne;
      return false;   // Don't fall through, will infinitely loop.
    case ISD::AND:
      // If the RHS is a constant, check to see if the LHS would be zero without
@@ -1253,8 +1242,7 @@ bool TargetLowering::SimplifyDemandedBits(SDValue Op,
      if (ConstantSDNode *RHSC = dyn_cast<ConstantSDNode>(Op.getOperand(1))) {
        APInt LHSZero, LHSOne;
        // Do not increment Depth here; that can cause an infinite loop.
-      TLO.DAG.ComputeMaskedBits(Op.getOperand(0), NewMask,
-                                LHSZero, LHSOne, Depth);
+      TLO.DAG.ComputeMaskedBits(Op.getOperand(0), LHSZero, LHSOne, Depth);
        // If the LHS already has zeros where RHSC does, this and is dead.
        if ((LHSZero & NewMask) == (~RHSC->getAPIntValue() & NewMask))
          return TLO.CombineTo(Op, Op.getOperand(0));
@@ -1365,8 +1353,9 @@ bool TargetLowering::SimplifyDemandedBits(SDValue Op,
      // bits on that side are also known to be set on the other side, turn this
      // into an AND, as we know the bits will be cleared.
      //    e.g. (X | C1) ^ C2 --> (X | C1) & ~C2 iff (C1&C2) == C2
-    if ((NewMask & (KnownZero|KnownOne)) == NewMask) { // all known
-      if ((KnownOne & KnownOne2) == KnownOne) {
+    // NB: it is okay if more bits are known than are requested
+    if ((NewMask & (KnownZero|KnownOne)) == NewMask) { // all known on one side 
+      if (KnownOne == KnownOne2) { // set bits are the same on both sides
          EVT VT = Op.getValueType();
          SDValue ANDC = TLO.DAG.getConstant(~KnownOne & NewMask, VT);
          return TLO.CombineTo(Op, TLO.DAG.getNode(ISD::AND, dl, VT,
@@ -1473,9 +1462,8 @@ bool TargetLowering::SimplifyDemandedBits(SDValue Op,
        if (InOp.getNode()->getOpcode() == ISD::ANY_EXTEND) {
          SDValue InnerOp = InOp.getNode()->getOperand(0);
          EVT InnerVT = InnerOp.getValueType();
-        if ((APInt::getHighBitsSet(BitWidth,
-                                   BitWidth - InnerVT.getSizeInBits()) &
-               DemandedMask) == 0 &&
+        unsigned InnerBits = InnerVT.getSizeInBits();
+        if (ShAmt < InnerBits && NewMask.lshr(InnerBits) == 0 &&
              isTypeDesirableForOp(ISD::SHL, InnerVT)) {
            EVT ShTy = getShiftAmountTy(InnerVT);
            if (!APInt(BitWidth, ShAmt).isIntN(ShTy.getSizeInBits()))
@@ -1545,7 +1533,7 @@ bool TargetLowering::SimplifyDemandedBits(SDValue Op,
      // always convert this into a logical shr, even if the shift amount is
      // variable.  The low bit of the shift cannot be an input sign bit unless
      // the shift amount is >= the size of the datatype, which is undefined.
-    if (DemandedMask == 1)
+    if (NewMask == 1)
        return TLO.CombineTo(Op,
                             TLO.DAG.getNode(ISD::SRL, dl, Op.getValueType(),
                                             Op.getOperand(0), Op.getOperand(1)));
@@ -1588,23 +1576,40 @@ bool TargetLowering::SimplifyDemandedBits(SDValue Op,
      }
      break;
    case ISD::SIGN_EXTEND_INREG: {
-    EVT EVT = cast<VTSDNode>(Op.getOperand(1))->getVT();
+    EVT ExVT = cast<VTSDNode>(Op.getOperand(1))->getVT();
+
+    APInt MsbMask = APInt::getHighBitsSet(BitWidth, 1);
+    // If we only care about the highest bit, don't bother shifting right.
+    if (MsbMask == DemandedMask) {
+      unsigned ShAmt = ExVT.getScalarType().getSizeInBits();
+      SDValue InOp = Op.getOperand(0);
+
+      // Compute the correct shift amount type, which must be getShiftAmountTy
+      // for scalar types after legalization.
+      EVT ShiftAmtTy = Op.getValueType();
+      if (TLO.LegalTypes() && !ShiftAmtTy.isVector())
+        ShiftAmtTy = getShiftAmountTy(ShiftAmtTy);
+
+      SDValue ShiftAmt = TLO.DAG.getConstant(BitWidth - ShAmt, ShiftAmtTy);
+      return TLO.CombineTo(Op, TLO.DAG.getNode(ISD::SHL, dl,
+                                            Op.getValueType(), InOp, ShiftAmt));
+    }
  
      // Sign extension.  Compute the demanded bits in the result that are not
      // present in the input.
      APInt NewBits =
        APInt::getHighBitsSet(BitWidth,
-                            BitWidth - EVT.getScalarType().getSizeInBits());
+                            BitWidth - ExVT.getScalarType().getSizeInBits());
  
      // If none of the extended bits are demanded, eliminate the sextinreg.
      if ((NewBits & NewMask) == 0)
        return TLO.CombineTo(Op, Op.getOperand(0));
  
      APInt InSignBit =
-      APInt::getSignBit(EVT.getScalarType().getSizeInBits()).zext(BitWidth);
+      APInt::getSignBit(ExVT.getScalarType().getSizeInBits()).zext(BitWidth);
      APInt InputDemandedBits =
        APInt::getLowBitsSet(BitWidth,
-                           EVT.getScalarType().getSizeInBits()) &
+                           ExVT.getScalarType().getSizeInBits()) &
        NewMask;
  
      // Since the sign extended bits are demanded, we know that the sign
@@ -1622,7 +1627,7 @@ bool TargetLowering::SimplifyDemandedBits(SDValue Op,
      // If the input sign bit is known zero, convert this into a zero extension.
      if (KnownZero.intersects(InSignBit))
        return TLO.CombineTo(Op,
-                           TLO.DAG.getZeroExtendInReg(Op.getOperand(0),dl,EVT));
+                          TLO.DAG.getZeroExtendInReg(Op.getOperand(0),dl,ExVT));
  
      if (KnownOne.intersects(InSignBit)) {    // Input sign bit known set
        KnownOne |= NewBits;
@@ -1688,11 +1693,11 @@ bool TargetLowering::SimplifyDemandedBits(SDValue Op,
  
      // If the sign bit is known one, the top bits match.
      if (KnownOne.intersects(InSignBit)) {
-      KnownOne  |= NewBits;
-      KnownZero &= ~NewBits;
+      KnownOne |= NewBits;
+      assert((KnownZero & NewBits) == 0);
      } else {   // Otherwise, top bits aren't known.
-      KnownOne  &= ~NewBits;
-      KnownZero &= ~NewBits;
+      assert((KnownOne & NewBits) == 0);
+      assert((KnownZero & NewBits) == 0);
      }
      break;
    }
@@ -1783,7 +1788,9 @@ bool TargetLowering::SimplifyDemandedBits(SDValue Op,
    case ISD::BITCAST:
      // If this is an FP->Int bitcast and if the sign bit is the only
      // thing demanded, turn this into a FGETSIGN.
-    if (!Op.getOperand(0).getValueType().isVector() &&
+    if (!TLO.LegalOperations() &&
+        !Op.getValueType().isVector() &&
+        !Op.getOperand(0).getValueType().isVector() &&
          NewMask == APInt::getSignBit(Op.getValueType().getSizeInBits()) &&
          Op.getOperand(0).getValueType().isFloatingPoint()) {
        bool OpVTLegal = isOperationLegalOrCustom(ISD::FGETSIGN, Op.getValueType());
@@ -1824,7 +1831,7 @@ bool TargetLowering::SimplifyDemandedBits(SDValue Op,
    // FALL THROUGH
    default:
      // Just use ComputeMaskedBits to compute output bits.
-    TLO.DAG.ComputeMaskedBits(Op, NewMask, KnownZero, KnownOne, Depth);
+    TLO.DAG.ComputeMaskedBits(Op, KnownZero, KnownOne, Depth);
      break;
    }
  
@@ -1840,7 +1847,6 @@ bool TargetLowering::SimplifyDemandedBits(SDValue Op,
  /// in Mask are known to be either zero or one and return them in the
  /// KnownZero/KnownOne bitsets.
  void TargetLowering::computeMaskedBitsForTargetNode(const SDValue Op,
-                                                    const APInt &Mask,
                                                      APInt &KnownZero,
                                                      APInt &KnownOne,
                                                      const SelectionDAG &DAG,
@@ -1851,7 +1857,7 @@ void TargetLowering::computeMaskedBitsForTargetNode(const SDValue Op,
            Op.getOpcode() == ISD::INTRINSIC_VOID) &&
           "Should use MaskedValueIsZero if you don't know whether Op"
           " is a target node!");
-  KnownZero = KnownOne = APInt(Mask.getBitWidth(), 0);
+  KnownZero = KnownOne = APInt(KnownOne.getBitWidth(), 0);
  }
  
  /// ComputeNumSignBitsForTargetNode - This method can be implemented by
@@ -1895,9 +1901,8 @@ static bool ValueHasExactlyOneBitSet(SDValue Val, const SelectionDAG &DAG) {
    // Fall back to ComputeMaskedBits to catch other known cases.
    EVT OpVT = Val.getValueType();
    unsigned BitWidth = OpVT.getScalarType().getSizeInBits();
-  APInt Mask = APInt::getAllOnesValue(BitWidth);
    APInt KnownZero, KnownOne;
-  DAG.ComputeMaskedBits(Val, Mask, KnownZero, KnownOne);
+  DAG.ComputeMaskedBits(Val, KnownZero, KnownOne);
    return (KnownZero.countPopulation() == BitWidth - 1) &&
           (KnownOne.countPopulation() == 1);
  }
@@ -2000,7 +2005,7 @@ TargetLowering::SimplifySetCC(EVT VT, SDValue N0, SDValue N1,
          }
        }
  
-      // Make sure we're not loosing bits from the constant.
+      // Make sure we're not losing bits from the constant.
        if (MinBits < C1.getBitWidth() && MinBits > C1.getActiveBits()) {
          EVT MinVT = EVT::getIntegerVT(*DAG.getContext(), MinBits);
          if (isTypeDesirableForOp(ISD::SETCC, MinVT)) {
@@ -2060,7 +2065,7 @@ TargetLowering::SimplifySetCC(EVT VT, SDValue N0, SDValue N1,
            unsigned NewAlign = MinAlign(Lod->getAlignment(), bestOffset);
            SDValue NewLoad = DAG.getLoad(newVT, dl, Lod->getChain(), Ptr,
                                  Lod->getPointerInfo().getWithOffset(bestOffset),
-                                        false, false, NewAlign);
+                                        false, false, false, NewAlign);
            return DAG.getSetCC(dl, VT,
                                DAG.getNode(ISD::AND, dl, newVT, NewLoad,
                                        DAG.getConstant(bestMask.trunc(bestWidth),
@@ -2109,7 +2114,7 @@ TargetLowering::SimplifySetCC(EVT VT, SDValue N0, SDValue N1,
          EVT newVT = N0.getOperand(0).getValueType();
          if (DCI.isBeforeLegalizeOps() ||
              (isOperationLegal(ISD::SETCC, newVT) &&
-              getCondCodeAction(Cond, newVT)==Legal))
+             getCondCodeAction(Cond, newVT.getSimpleVT())==Legal))
            return DAG.getSetCC(dl, VT, N0.getOperand(0),
                                DAG.getConstant(C1.trunc(InSize), newVT),
                                Cond);
@@ -2205,9 +2210,10 @@ TargetLowering::SimplifySetCC(EVT VT, SDValue N0, SDValue N1,
            Cond = (Cond == ISD::SETEQ) ? ISD::SETNE : ISD::SETEQ;
            return DAG.getSetCC(dl, VT, Op0.getOperand(0), Op0.getOperand(1),
                                Cond);
-        } else if (Op0.getOpcode() == ISD::AND &&
-                isa<ConstantSDNode>(Op0.getOperand(1)) &&
-                cast<ConstantSDNode>(Op0.getOperand(1))->getAPIntValue() == 1) {
+        }
+        if (Op0.getOpcode() == ISD::AND &&
+            isa<ConstantSDNode>(Op0.getOperand(1)) &&
+            cast<ConstantSDNode>(Op0.getOperand(1))->getAPIntValue() == 1) {
            // If this is (X&1) == / != 1, normalize it to (X&1) != / == 0.
            if (Op0.getValueType().bitsGT(VT))
              Op0 = DAG.getNode(ISD::AND, dl, VT,
@@ -2222,6 +2228,11 @@ TargetLowering::SimplifySetCC(EVT VT, SDValue N0, SDValue N1,
                                DAG.getConstant(0, Op0.getValueType()),
                                Cond == ISD::SETEQ ? ISD::SETNE : ISD::SETEQ);
          }
+        if (Op0.getOpcode() == ISD::AssertZext &&
+            cast<VTSDNode>(Op0.getOperand(1))->getVT() == MVT::i1)
+          return DAG.getSetCC(dl, VT, Op0,
+                              DAG.getConstant(0, Op0.getValueType()),
+                              Cond == ISD::SETEQ ? ISD::SETNE : ISD::SETEQ);
        }
      }
  
@@ -2274,7 +2285,7 @@ TargetLowering::SimplifySetCC(EVT VT, SDValue N0, SDValue N1,
                            DAG.getConstant(MinVal, N0.getValueType()),
                            ISD::SETEQ);
      // If we have setugt X, Max-1, turn it into seteq X, Max
-    else if ((Cond == ISD::SETGT || Cond == ISD::SETUGT) && C1 == MaxVal-1)
+    if ((Cond == ISD::SETGT || Cond == ISD::SETUGT) && C1 == MaxVal-1)
        return DAG.getSetCC(dl, VT, N0,
                            DAG.getConstant(MaxVal, N0.getValueType()),
                            ISD::SETEQ);
@@ -2305,7 +2316,7 @@ TargetLowering::SimplifySetCC(EVT VT, SDValue N0, SDValue N1,
          N0.getOpcode() == ISD::AND)
        if (ConstantSDNode *AndRHS =
                    dyn_cast<ConstantSDNode>(N0.getOperand(1))) {
-        EVT ShiftTy = DCI.isBeforeLegalize() ?
+        EVT ShiftTy = DCI.isBeforeLegalizeOps() ?
            getPointerTy() : getShiftAmountTy(N0.getValueType());
          if (Cond == ISD::SETNE && C1 == 0) {// (X & 8) != 0  -->  (X & 8) >> 3
            // Perform the xform if the AND RHS is a single bit.
@@ -2324,6 +2335,55 @@ TargetLowering::SimplifySetCC(EVT VT, SDValue N0, SDValue N1,
            }
          }
        }
+
+    if (C1.getMinSignedBits() <= 64 &&
+        !isLegalICmpImmediate(C1.getSExtValue())) {
+      // (X & -256) == 256 -> (X >> 8) == 1
+      if ((Cond == ISD::SETEQ || Cond == ISD::SETNE) &&
+          N0.getOpcode() == ISD::AND && N0.hasOneUse()) {
+        if (ConstantSDNode *AndRHS =
+            dyn_cast<ConstantSDNode>(N0.getOperand(1))) {
+          const APInt &AndRHSC = AndRHS->getAPIntValue();
+          if ((-AndRHSC).isPowerOf2() && (AndRHSC & C1) == C1) {
+            unsigned ShiftBits = AndRHSC.countTrailingZeros();
+            EVT ShiftTy = DCI.isBeforeLegalizeOps() ?
+              getPointerTy() : getShiftAmountTy(N0.getValueType());
+            EVT CmpTy = N0.getValueType();
+            SDValue Shift = DAG.getNode(ISD::SRL, dl, CmpTy, N0.getOperand(0),
+                                        DAG.getConstant(ShiftBits, ShiftTy));
+            SDValue CmpRHS = DAG.getConstant(C1.lshr(ShiftBits), CmpTy);
+            return DAG.getSetCC(dl, VT, Shift, CmpRHS, Cond);
+          }
+        }
+      } else if (Cond == ISD::SETULT || Cond == ISD::SETUGE ||
+                 Cond == ISD::SETULE || Cond == ISD::SETUGT) {
+        bool AdjOne = (Cond == ISD::SETULE || Cond == ISD::SETUGT);
+        // X <  0x100000000 -> (X >> 32) <  1
+        // X >= 0x100000000 -> (X >> 32) >= 1
+        // X <= 0x0ffffffff -> (X >> 32) <  1
+        // X >  0x0ffffffff -> (X >> 32) >= 1
+        unsigned ShiftBits;
+        APInt NewC = C1;
+        ISD::CondCode NewCond = Cond;
+        if (AdjOne) {
+          ShiftBits = C1.countTrailingOnes();
+          NewC = NewC + 1;
+          NewCond = (Cond == ISD::SETULE) ? ISD::SETULT : ISD::SETUGE;
+        } else {
+          ShiftBits = C1.countTrailingZeros();
+        }
+        NewC = NewC.lshr(ShiftBits);
+        if (ShiftBits && isLegalICmpImmediate(NewC.getSExtValue())) {
+          EVT ShiftTy = DCI.isBeforeLegalizeOps() ?
+            getPointerTy() : getShiftAmountTy(N0.getValueType());
+          EVT CmpTy = N0.getValueType();
+          SDValue Shift = DAG.getNode(ISD::SRL, dl, CmpTy, N0,
+                                      DAG.getConstant(ShiftBits, ShiftTy));
+          SDValue CmpRHS = DAG.getConstant(NewC, CmpTy);
+          return DAG.getSetCC(dl, VT, Shift, CmpRHS, NewCond);
+        }
+      }
+    }
    }
  
    if (isa<ConstantFPSDNode>(N0.getNode())) {
@@ -2355,36 +2415,36 @@ TargetLowering::SimplifySetCC(EVT VT, SDValue N0, SDValue N1,
  
      // If the condition is not legal, see if we can find an equivalent one
      // which is legal.
-    if (!isCondCodeLegal(Cond, N0.getValueType())) {
+    if (!isCondCodeLegal(Cond, N0.getSimpleValueType())) {
        // If the comparison was an awkward floating-point == or != and one of
        // the comparison operands is infinity or negative infinity, convert the
        // condition to a less-awkward <= or >=.
        if (CFP->getValueAPF().isInfinity()) {
          if (CFP->getValueAPF().isNegative()) {
            if (Cond == ISD::SETOEQ &&
-              isCondCodeLegal(ISD::SETOLE, N0.getValueType()))
+              isCondCodeLegal(ISD::SETOLE, N0.getSimpleValueType()))
              return DAG.getSetCC(dl, VT, N0, N1, ISD::SETOLE);
            if (Cond == ISD::SETUEQ &&
-              isCondCodeLegal(ISD::SETOLE, N0.getValueType()))
+              isCondCodeLegal(ISD::SETOLE, N0.getSimpleValueType()))
              return DAG.getSetCC(dl, VT, N0, N1, ISD::SETULE);
            if (Cond == ISD::SETUNE &&
-              isCondCodeLegal(ISD::SETUGT, N0.getValueType()))
+              isCondCodeLegal(ISD::SETUGT, N0.getSimpleValueType()))
              return DAG.getSetCC(dl, VT, N0, N1, ISD::SETUGT);
            if (Cond == ISD::SETONE &&
-              isCondCodeLegal(ISD::SETUGT, N0.getValueType()))
+              isCondCodeLegal(ISD::SETUGT, N0.getSimpleValueType()))
              return DAG.getSetCC(dl, VT, N0, N1, ISD::SETOGT);
          } else {
            if (Cond == ISD::SETOEQ &&
-              isCondCodeLegal(ISD::SETOGE, N0.getValueType()))
+              isCondCodeLegal(ISD::SETOGE, N0.getSimpleValueType()))
              return DAG.getSetCC(dl, VT, N0, N1, ISD::SETOGE);
            if (Cond == ISD::SETUEQ &&
-              isCondCodeLegal(ISD::SETOGE, N0.getValueType()))
+              isCondCodeLegal(ISD::SETOGE, N0.getSimpleValueType()))
              return DAG.getSetCC(dl, VT, N0, N1, ISD::SETUGE);
            if (Cond == ISD::SETUNE &&
-              isCondCodeLegal(ISD::SETULT, N0.getValueType()))
+              isCondCodeLegal(ISD::SETULT, N0.getSimpleValueType()))
              return DAG.getSetCC(dl, VT, N0, N1, ISD::SETULT);
            if (Cond == ISD::SETONE &&
-              isCondCodeLegal(ISD::SETULT, N0.getValueType()))
+              isCondCodeLegal(ISD::SETULT, N0.getSimpleValueType()))
              return DAG.getSetCC(dl, VT, N0, N1, ISD::SETOLT);
          }
        }
@@ -2392,18 +2452,33 @@ TargetLowering::SimplifySetCC(EVT VT, SDValue N0, SDValue N1,
    }
  
    if (N0 == N1) {
+    // The sext(setcc()) => setcc() optimization relies on the appropriate
+    // constant being emitted.
+    uint64_t EqVal = 0;
+    switch (getBooleanContents(N0.getValueType().isVector())) {
+    case UndefinedBooleanContent:
+    case ZeroOrOneBooleanContent:
+      EqVal = ISD::isTrueWhenEqual(Cond);
+      break;
+    case ZeroOrNegativeOneBooleanContent:
+      EqVal = ISD::isTrueWhenEqual(Cond) ? -1 : 0;
+      break;
+    }
+
      // We can always fold X == X for integer setcc's.
-    if (N0.getValueType().isInteger())
-      return DAG.getConstant(ISD::isTrueWhenEqual(Cond), VT);
+    if (N0.getValueType().isInteger()) {
+      return DAG.getConstant(EqVal, VT);
+    }
      unsigned UOF = ISD::getUnorderedFlavor(Cond);
      if (UOF == 2)   // FP operators that are undefined on NaNs.
-      return DAG.getConstant(ISD::isTrueWhenEqual(Cond), VT);
+      return DAG.getConstant(EqVal, VT);
      if (UOF == unsigned(ISD::isTrueWhenEqual(Cond)))
-      return DAG.getConstant(UOF, VT);
+      return DAG.getConstant(EqVal, VT);
      // Otherwise, we can't fold it.  However, we can simplify it to SETUO/SETO
      // if it is not already.
      ISD::CondCode NewCond = UOF == 0 ? ISD::SETO : ISD::SETUO;
-    if (NewCond != Cond)
+    if (NewCond != Cond && (DCI.isBeforeLegalizeOps() ||
+          getCondCodeAction(NewCond, N0.getSimpleValueType()) == Legal))
        return DAG.getSetCC(dl, VT, N0, N1, NewCond);
    }
  
@@ -2428,6 +2503,10 @@ TargetLowering::SimplifySetCC(EVT VT, SDValue N0, SDValue N1,
          }
        }
  
+      // If RHS is a legal immediate value for a compare instruction, we need
+      // to be careful about increasing register pressure needlessly.
+      bool LegalRHSImm = false;
+
        if (ConstantSDNode *RHSC = dyn_cast<ConstantSDNode>(N1)) {
          if (ConstantSDNode *LHSR = dyn_cast<ConstantSDNode>(N0.getOperand(1))) {
            // Turn (X+C1) == C2 --> X == C2-C1
@@ -2462,25 +2541,33 @@ TargetLowering::SimplifySetCC(EVT VT, SDValue N0, SDValue N1,
                             Cond);
            }
          }
+
+        // Could RHSC fold directly into a compare?
+        if (RHSC->getValueType(0).getSizeInBits() <= 64)
+          LegalRHSImm = isLegalICmpImmediate(RHSC->getSExtValue());
        }
  
        // Simplify (X+Z) == X -->  Z == 0
-      if (N0.getOperand(0) == N1)
-        return DAG.getSetCC(dl, VT, N0.getOperand(1),
-                        DAG.getConstant(0, N0.getValueType()), Cond);
-      if (N0.getOperand(1) == N1) {
-        if (DAG.isCommutativeBinOp(N0.getOpcode()))
-          return DAG.getSetCC(dl, VT, N0.getOperand(0),
-                          DAG.getConstant(0, N0.getValueType()), Cond);
-        else if (N0.getNode()->hasOneUse()) {
-          assert(N0.getOpcode() == ISD::SUB && "Unexpected operation!");
-          // (Z-X) == X  --> Z == X<<1
-          SDValue SH = DAG.getNode(ISD::SHL, dl, N1.getValueType(),
-                                     N1,
+      // Don't do this if X is an immediate that can fold into a cmp
+      // instruction and X+Z has other uses. It could be an induction variable
+      // chain, and the transform would increase register pressure.
+      if (!LegalRHSImm || N0.getNode()->hasOneUse()) {
+        if (N0.getOperand(0) == N1)
+          return DAG.getSetCC(dl, VT, N0.getOperand(1),
+                              DAG.getConstant(0, N0.getValueType()), Cond);
+        if (N0.getOperand(1) == N1) {
+          if (DAG.isCommutativeBinOp(N0.getOpcode()))
+            return DAG.getSetCC(dl, VT, N0.getOperand(0),
+                                DAG.getConstant(0, N0.getValueType()), Cond);
+          if (N0.getNode()->hasOneUse()) {
+            assert(N0.getOpcode() == ISD::SUB && "Unexpected operation!");
+            // (Z-X) == X  --> Z == X<<1
+            SDValue SH = DAG.getNode(ISD::SHL, dl, N1.getValueType(), N1,
                         DAG.getConstant(1, getShiftAmountTy(N1.getValueType())));
-          if (!DCI.isCalledByLegalizer())
-            DCI.AddToWorklist(SH.getNode());
-          return DAG.getSetCC(dl, VT, N0.getOperand(0), SH, Cond);
+            if (!DCI.isCalledByLegalizer())
+              DCI.AddToWorklist(SH.getNode());
+            return DAG.getSetCC(dl, VT, N0.getOperand(0), SH, Cond);
+          }
          }
        }
      }
@@ -2488,14 +2575,14 @@ TargetLowering::SimplifySetCC(EVT VT, SDValue N0, SDValue N1,
      if (N1.getOpcode() == ISD::ADD || N1.getOpcode() == ISD::SUB ||
          N1.getOpcode() == ISD::XOR) {
        // Simplify  X == (X+Z) -->  Z == 0
-      if (N1.getOperand(0) == N0) {
+      if (N1.getOperand(0) == N0)
          return DAG.getSetCC(dl, VT, N1.getOperand(1),
                          DAG.getConstant(0, N1.getValueType()), Cond);
-      } else if (N1.getOperand(1) == N0) {
-        if (DAG.isCommutativeBinOp(N1.getOpcode())) {
+      if (N1.getOperand(1) == N0) {
+        if (DAG.isCommutativeBinOp(N1.getOpcode()))
            return DAG.getSetCC(dl, VT, N1.getOperand(0),
                            DAG.getConstant(0, N1.getValueType()), Cond);
-        } else if (N1.getNode()->hasOneUse()) {
+        if (N1.getNode()->hasOneUse()) {
            assert(N1.getOpcode() == ISD::SUB && "Unexpected operation!");
            // X == (Z-X)  --> X<<1 == Z
            SDValue SH = DAG.getNode(ISD::SHL, dl, N1.getValueType(), N0,
@@ -2752,6 +2839,9 @@ getRegForInlineAsmConstraint(const std::string &Constraint,
    // Remove the braces from around the name.
    StringRef RegName(Constraint.data()+1, Constraint.size()-2);
  
+  std::pair<unsigned, const TargetRegisterClass*> R =
+    std::make_pair(0u, static_cast<const TargetRegisterClass*>(0));
+
    // Figure out which register class contains this reg.
    const TargetRegisterInfo *RI = TM.getRegisterInfo();
    for (TargetRegisterInfo::regclass_iterator RCI = RI->regclass_begin(),
@@ -2765,12 +2855,22 @@ getRegForInlineAsmConstraint(const std::string &Constraint,
  
      for (TargetRegisterClass::iterator I = RC->begin(), E = RC->end();
           I != E; ++I) {
-      if (RegName.equals_lower(RI->getName(*I)))
-        return std::make_pair(*I, RC);
+      if (RegName.equals_lower(RI->getName(*I))) {
+        std::pair<unsigned, const TargetRegisterClass*> S =
+          std::make_pair(*I, RC);
+
+        // If this register class has the requested value type, return it,
+        // otherwise keep searching and return the first class found
+        // if no other is found which explicitly has the requested type.
+        if (RC->hasType(VT))
+          return S;
+        else if (!R.second)
+          R = S;
+      }
      }
    }
  
-  return std::make_pair(0u, static_cast<const TargetRegisterClass*>(0));
+  return R;
  }
  
  //===----------------------------------------------------------------------===//
@@ -2835,10 +2935,10 @@ TargetLowering::AsmOperandInfoVector TargetLowering::ParseConstraints(
        assert(!CS.getType()->isVoidTy() &&
               "Bad inline asm!");
        if (StructType *STy = dyn_cast<StructType>(CS.getType())) {
-        OpInfo.ConstraintVT = getValueType(STy->getElementType(ResNo));
+        OpInfo.ConstraintVT = getSimpleValueType(STy->getElementType(ResNo));
        } else {
          assert(ResNo == 0 && "Asm only has one result!");
-        OpInfo.ConstraintVT = getValueType(CS.getType());
+        OpInfo.ConstraintVT = getSimpleValueType(CS.getType());
        }
        ++ResNo;
        break;
@@ -2877,13 +2977,14 @@ TargetLowering::AsmOperandInfoVector TargetLowering::ParseConstraints(
          case 64:
          case 128:
            OpInfo.ConstraintVT =
-              EVT::getEVT(IntegerType::get(OpTy->getContext(), BitSize), true);
+            MVT::getVT(IntegerType::get(OpTy->getContext(), BitSize), true);
            break;
          }
-      } else if (dyn_cast<PointerType>(OpTy)) {
-        OpInfo.ConstraintVT = MVT::getIntegerVT(8*TD->getPointerSize());
+      } else if (PointerType *PT = dyn_cast<PointerType>(OpTy)) {
+        OpInfo.ConstraintVT = MVT::getIntegerVT(
+            8*TD->getPointerSize(PT->getAddressSpace()));
        } else {
-        OpInfo.ConstraintVT = EVT::getEVT(OpTy, true);
+        OpInfo.ConstraintVT = MVT::getVT(OpTy, true);
        }
      }
    }
@@ -2960,10 +3061,12 @@ TargetLowering::AsmOperandInfoVector TargetLowering::ParseConstraints(
        AsmOperandInfo &Input = ConstraintOperands[OpInfo.MatchingInput];
  
        if (OpInfo.ConstraintVT != Input.ConstraintVT) {
-       std::pair<unsigned, const TargetRegisterClass*> MatchRC =
-         getRegForInlineAsmConstraint(OpInfo.ConstraintCode, OpInfo.ConstraintVT);
-       std::pair<unsigned, const TargetRegisterClass*> InputRC =
-         getRegForInlineAsmConstraint(Input.ConstraintCode, Input.ConstraintVT);
+        std::pair<unsigned, const TargetRegisterClass*> MatchRC =
+          getRegForInlineAsmConstraint(OpInfo.ConstraintCode,
+                                       OpInfo.ConstraintVT);
+        std::pair<unsigned, const TargetRegisterClass*> InputRC =
+          getRegForInlineAsmConstraint(Input.ConstraintCode,
+                                       Input.ConstraintVT);
          if ((OpInfo.ConstraintVT.isInteger() !=
               Input.ConstraintVT.isInteger()) ||
              (MatchRC.second != InputRC.second)) {
@@ -2984,7 +3087,6 @@ TargetLowering::AsmOperandInfoVector TargetLowering::ParseConstraints(
  /// is.
  static unsigned getConstraintGenerality(TargetLowering::ConstraintType CT) {
    switch (CT) {
-  default: llvm_unreachable("Unknown constraint type!");
    case TargetLowering::C_Other:
    case TargetLowering::C_Unknown:
      return 0;
@@ -2995,6 +3097,7 @@ static unsigned getConstraintGenerality(TargetLowering::ConstraintType CT) {
    case TargetLowering::C_Memory:
      return 3;
    }
+  llvm_unreachable("Invalid constraint type");
  }
  
  /// Examine constraint type and operand type and determine a weight value.
@@ -3242,8 +3345,9 @@ SDValue TargetLowering::BuildExactSDIV(SDValue Op1, SDValue Op2, DebugLoc dl,
  /// return a DAG expression to select that will generate the same value by
  /// multiplying by a magic number.  See:
  /// <http://the.wall.riscom.net/books/proc/ppc/cwg/code2.html>
-SDValue TargetLowering::BuildSDIV(SDNode *N, SelectionDAG &DAG,
-                                  std::vector<SDNode*>* Created) const {
+SDValue TargetLowering::
+BuildSDIV(SDNode *N, SelectionDAG &DAG, bool IsAfterLegalization,
+          std::vector<SDNode*> *Created) const {
    EVT VT = N->getValueType(0);
    DebugLoc dl= N->getDebugLoc();
  
@@ -3258,10 +3362,12 @@ SDValue TargetLowering::BuildSDIV(SDNode *N, SelectionDAG &DAG,
    // Multiply the numerator (operand 0) by the magic value
    // FIXME: We should support doing a MUL in a wider type
    SDValue Q;
-  if (isOperationLegalOrCustom(ISD::MULHS, VT))
+  if (IsAfterLegalization ? isOperationLegal(ISD::MULHS, VT) :
+                            isOperationLegalOrCustom(ISD::MULHS, VT))
      Q = DAG.getNode(ISD::MULHS, dl, VT, N->getOperand(0),
                      DAG.getConstant(magics.m, VT));
-  else if (isOperationLegalOrCustom(ISD::SMUL_LOHI, VT))
+  else if (IsAfterLegalization ? isOperationLegal(ISD::SMUL_LOHI, VT) :
+                                 isOperationLegalOrCustom(ISD::SMUL_LOHI, VT))
      Q = SDValue(DAG.getNode(ISD::SMUL_LOHI, dl, DAG.getVTList(VT, VT),
                                N->getOperand(0),
                                DAG.getConstant(magics.m, VT)).getNode(), 1);
@@ -3299,8 +3405,9 @@ SDValue TargetLowering::BuildSDIV(SDNode *N, SelectionDAG &DAG,
  /// return a DAG expression to select that will generate the same value by
  /// multiplying by a magic number.  See:
  /// <http://the.wall.riscom.net/books/proc/ppc/cwg/code2.html>
-SDValue TargetLowering::BuildUDIV(SDNode *N, SelectionDAG &DAG,
-                                  std::vector<SDNode*>* Created) const {
+SDValue TargetLowering::
+BuildUDIV(SDNode *N, SelectionDAG &DAG, bool IsAfterLegalization,
+          std::vector<SDNode*> *Created) const {
    EVT VT = N->getValueType(0);
    DebugLoc dl = N->getDebugLoc();
  
@@ -3332,9 +3439,11 @@ SDValue TargetLowering::BuildUDIV(SDNode *N, SelectionDAG &DAG,
  
    // Multiply the numerator (operand 0) by the magic value
    // FIXME: We should support doing a MUL in a wider type
-  if (isOperationLegalOrCustom(ISD::MULHU, VT))
+  if (IsAfterLegalization ? isOperationLegal(ISD::MULHU, VT) :
+                            isOperationLegalOrCustom(ISD::MULHU, VT))
      Q = DAG.getNode(ISD::MULHU, dl, VT, Q, DAG.getConstant(magics.m, VT));
-  else if (isOperationLegalOrCustom(ISD::UMUL_LOHI, VT))
+  else if (IsAfterLegalization ? isOperationLegal(ISD::UMUL_LOHI, VT) :
+                                 isOperationLegalOrCustom(ISD::UMUL_LOHI, VT))
      Q = SDValue(DAG.getNode(ISD::UMUL_LOHI, dl, DAG.getVTList(VT, VT), Q,
                              DAG.getConstant(magics.m, VT)).getNode(), 1);
    else