Redirect DataLayout from TargetMachine to Module in SelectionDAG

[oota-llvm.git] / lib / CodeGen / SelectionDAG / SelectionDAGBuilder.cpp
diff --git a/lib/CodeGen/SelectionDAG/SelectionDAGBuilder.cpp b/lib/CodeGen/SelectionDAG/SelectionDAGBuilder.cpp

index 8ba957d6287084a3517097177be9e6765c615213..2cb74fe8a647f2607a69e4b6078cf2049c3dc02a 100644 (file)
--- a/lib/CodeGen/SelectionDAG/SelectionDAGBuilder.cpp
+++ b/lib/CodeGen/SelectionDAG/SelectionDAGBuilder.cpp
@@ -78,12 +78,16 @@ LimitFPPrecision("limit-float-precision",
                   cl::location(LimitFloatPrecision),
                   cl::init(0));
  
+static cl::opt<bool>
+EnableFMFInDAG("enable-fmf-dag", cl::init(false), cl::Hidden,
+                cl::desc("Enable fast-math-flags for DAG nodes"));
+
  // Limit the width of DAG chains. This is important in general to prevent
-// prevent DAG-based analysis from blowing up. For example, alias analysis and
+// DAG-based analysis from blowing up. For example, alias analysis and
  // load clustering may not complete in reasonable time. It is difficult to
  // recognize and avoid this situation within each individual analysis, and
  // future analyses are likely to have the same behavior. Limiting DAG width is
-// the safe approach, and will be especially important with global DAGs.
+// the safe approach and will be especially important with global DAGs.
  //
  // MaxParallelChains default is arbitrarily high to avoid affecting
  // optimization, but could be lowered to improve compile time. Any ld-ld-st-st
@@ -142,7 +146,7 @@ static SDValue getCopyFromParts(SelectionDAG &DAG, SDLoc DL,
          Hi = DAG.getNode(ISD::BITCAST, DL, HalfVT, Parts[1]);
        }
  
-      if (TLI.isBigEndian())
+      if (DAG.getDataLayout().isBigEndian())
          std::swap(Lo, Hi);
  
        Val = DAG.getNode(ISD::BUILD_PAIR, DL, RoundVT, Lo, Hi);
@@ -156,7 +160,7 @@ static SDValue getCopyFromParts(SelectionDAG &DAG, SDLoc DL,
  
          // Combine the round and odd parts.
          Lo = Val;
-        if (TLI.isBigEndian())
+        if (DAG.getDataLayout().isBigEndian())
            std::swap(Lo, Hi);
          EVT TotalVT = EVT::getIntegerVT(*DAG.getContext(), NumParts * PartBits);
          Hi = DAG.getNode(ISD::ANY_EXTEND, DL, TotalVT, Hi);
@@ -257,8 +261,9 @@ static SDValue getCopyFromPartsVector(SelectionDAG &DAG, SDLoc DL,
      assert(NumRegs == NumParts && "Part count doesn't match vector breakdown!");
      NumParts = NumRegs; // Silence a compiler warning.
      assert(RegisterVT == PartVT && "Part type doesn't match vector breakdown!");
-    assert(RegisterVT == Parts[0].getSimpleValueType() &&
-           "Part type doesn't match part!");
+    assert(RegisterVT.getSizeInBits() ==
+           Parts[0].getSimpleValueType().getSizeInBits() &&
+           "Part type sizes don't match!");
  
      // Assemble the parts into intermediate operands.
      SmallVector<SDValue, 8> Ops(NumIntermediates);
@@ -357,10 +362,10 @@ static void getCopyToParts(SelectionDAG &DAG, SDLoc DL,
    if (ValueVT.isVector())
      return getCopyToPartsVector(DAG, DL, Val, Parts, NumParts, PartVT, V);
  
-  const TargetLowering &TLI = DAG.getTargetLoweringInfo();
    unsigned PartBits = PartVT.getSizeInBits();
    unsigned OrigNumParts = NumParts;
-  assert(TLI.isTypeLegal(PartVT) && "Copying to an illegal type!");
+  assert(DAG.getTargetLoweringInfo().isTypeLegal(PartVT) &&
+         "Copying to an illegal type!");
  
    if (NumParts == 0)
      return;
@@ -428,7 +433,7 @@ static void getCopyToParts(SelectionDAG &DAG, SDLoc DL,
                                   DAG.getIntPtrConstant(RoundBits, DL));
      getCopyToParts(DAG, DL, OddVal, Parts + RoundParts, OddParts, PartVT, V);
  
-    if (TLI.isBigEndian())
+    if (DAG.getDataLayout().isBigEndian())
        // The odd parts were reversed by getCopyToParts - unreverse them.
        std::reverse(Parts + RoundParts, Parts + NumParts);
  
@@ -463,7 +468,7 @@ static void getCopyToParts(SelectionDAG &DAG, SDLoc DL,
      }
    }
  
-  if (TLI.isBigEndian())
+  if (DAG.getDataLayout().isBigEndian())
      std::reverse(Parts, Parts + OrigNumParts);
  }
  
@@ -802,7 +807,7 @@ void SelectionDAGBuilder::init(GCFunctionInfo *gfi, AliasAnalysis &aa,
    AA = &aa;
    GFI = gfi;
    LibInfo = li;
-  DL = DAG.getTarget().getDataLayout();
+  DL = &DAG.getDataLayout();
    Context = DAG.getContext();
    LPadToCallSiteMap.clear();
  }
@@ -1441,8 +1446,8 @@ void SelectionDAGBuilder::FindMergedConditions(const Value *Cond,
      // We have flexibility in setting Prob for BB1 and Prob for TmpBB.
      // The requirement is that
      //   TrueProb for BB1 + (FalseProb for BB1 * TrueProb for TmpBB)
-    //     = TrueProb for orignal BB.
-    // Assuming the orignal weights are A and B, one choice is to set BB1's
+    //     = TrueProb for original BB.
+    // Assuming the original weights are A and B, one choice is to set BB1's
      // weights to A and A+2B, and set TmpBB's weights to A and 2B. This choice
      // assumes that
      //   TrueProb for BB1 == FalseProb for BB1 * TrueProb for TmpBB.
@@ -1477,8 +1482,8 @@ void SelectionDAGBuilder::FindMergedConditions(const Value *Cond,
      // We have flexibility in setting Prob for BB1 and Prob for TmpBB.
      // The requirement is that
      //   FalseProb for BB1 + (TrueProb for BB1 * FalseProb for TmpBB)
-    //     = FalseProb for orignal BB.
-    // Assuming the orignal weights are A and B, one choice is to set BB1's
+    //     = FalseProb for original BB.
+    // Assuming the original weights are A and B, one choice is to set BB1's
      // weights to 2A+B and B, and set TmpBB's weights to 2A and B. This choice
      // assumes that
      //   FalseProb for BB1 == TrueProb for BB1 * FalseProb for TmpBB.
@@ -1766,8 +1771,7 @@ void SelectionDAGBuilder::visitSPDescriptorParent(StackProtectorDescriptor &SPD,
    SDValue GuardPtr = getValue(IRGuard);
    SDValue StackSlotPtr = DAG.getFrameIndex(FI, PtrTy);
  
-  unsigned Align =
-    TLI.getDataLayout()->getPrefTypeAlignment(IRGuard->getType());
+  unsigned Align = DL->getPrefTypeAlignment(IRGuard->getType());
  
    SDValue Guard;
    SDLoc dl = getCurSDLoc();
@@ -2148,6 +2152,8 @@ void SelectionDAGBuilder::visitBinary(const User &I, unsigned OpCode) {
    bool nuw = false;
    bool nsw = false;
    bool exact = false;
+  FastMathFlags FMF;
+
    if (const OverflowingBinaryOperator *OFBinOp =
            dyn_cast<const OverflowingBinaryOperator>(&I)) {
      nuw = OFBinOp->hasNoUnsignedWrap();
@@ -2156,9 +2162,22 @@ void SelectionDAGBuilder::visitBinary(const User &I, unsigned OpCode) {
    if (const PossiblyExactOperator *ExactOp =
            dyn_cast<const PossiblyExactOperator>(&I))
      exact = ExactOp->isExact();
-
+  if (const FPMathOperator *FPOp = dyn_cast<const FPMathOperator>(&I))
+    FMF = FPOp->getFastMathFlags();
+
+  SDNodeFlags Flags;
+  Flags.setExact(exact);
+  Flags.setNoSignedWrap(nsw);
+  Flags.setNoUnsignedWrap(nuw);
+  if (EnableFMFInDAG) {
+    Flags.setAllowReciprocal(FMF.allowReciprocal());
+    Flags.setNoInfs(FMF.noInfs());
+    Flags.setNoNaNs(FMF.noNaNs());
+    Flags.setNoSignedZeros(FMF.noSignedZeros());
+    Flags.setUnsafeAlgebra(FMF.unsafeAlgebra());
+  }
    SDValue BinNodeValue = DAG.getNode(OpCode, getCurSDLoc(), Op1.getValueType(),
-                                     Op1, Op2, nuw, nsw, exact);
+                                     Op1, Op2, &Flags);
    setValue(&I, BinNodeValue);
  }
  
@@ -2206,9 +2225,12 @@ void SelectionDAGBuilder::visitShift(const User &I, unsigned Opcode) {
              dyn_cast<const PossiblyExactOperator>(&I))
        exact = ExactOp->isExact();
    }
-
+  SDNodeFlags Flags;
+  Flags.setExact(exact);
+  Flags.setNoSignedWrap(nsw);
+  Flags.setNoUnsignedWrap(nuw);
    SDValue Res = DAG.getNode(Opcode, getCurSDLoc(), Op1.getValueType(), Op1, Op2,
-                            nuw, nsw, exact);
+                            &Flags);
    setValue(&I, Res);
  }
  
@@ -2216,17 +2238,11 @@ void SelectionDAGBuilder::visitSDiv(const User &I) {
    SDValue Op1 = getValue(I.getOperand(0));
    SDValue Op2 = getValue(I.getOperand(1));
  
-  // Turn exact SDivs into multiplications.
-  // FIXME: This should be in DAGCombiner, but it doesn't have access to the
-  // exact bit.
-  if (isa<BinaryOperator>(&I) && cast<BinaryOperator>(&I)->isExact() &&
-      !isa<ConstantSDNode>(Op1) &&
-      isa<ConstantSDNode>(Op2) && !cast<ConstantSDNode>(Op2)->isNullValue())
-    setValue(&I, DAG.getTargetLoweringInfo()
-                     .BuildExactSDIV(Op1, Op2, getCurSDLoc(), DAG));
-  else
-    setValue(&I, DAG.getNode(ISD::SDIV, getCurSDLoc(), Op1.getValueType(),
-                             Op1, Op2));
+  SDNodeFlags Flags;
+  Flags.setExact(isa<PossiblyExactOperator>(&I) &&
+                 cast<PossiblyExactOperator>(&I)->isExact());
+  setValue(&I, DAG.getNode(ISD::SDIV, getCurSDLoc(), Op1.getValueType(), Op1,
+                           Op2, &Flags));
  }
  
  void SelectionDAGBuilder::visitICmp(const User &I) {
@@ -2806,10 +2822,10 @@ void SelectionDAGBuilder::visitAlloca(const AllocaInst &I) {
    SDLoc dl = getCurSDLoc();
    Type *Ty = I.getAllocatedType();
    const TargetLowering &TLI = DAG.getTargetLoweringInfo();
-  uint64_t TySize = TLI.getDataLayout()->getTypeAllocSize(Ty);
+  auto &DL = DAG.getDataLayout();
+  uint64_t TySize = DL.getTypeAllocSize(Ty);
    unsigned Align =
-      std::max((unsigned)TLI.getDataLayout()->getPrefTypeAlignment(Ty),
-               I.getAlignment());
+      std::max((unsigned)DL.getPrefTypeAlignment(Ty), I.getAlignment());
  
    SDValue AllocSize = getValue(I.getArraySize());
  
@@ -2892,7 +2908,7 @@ void SelectionDAGBuilder::visitLoad(const LoadInst &I) {
      // Serialize volatile loads with other side effects.
      Root = getRoot();
    else if (AA->pointsToConstantMemory(
-             AliasAnalysis::Location(SV, AA->getTypeStoreSize(Ty), AAInfo))) {
+               MemoryLocation(SV, AA->getTypeStoreSize(Ty), AAInfo))) {
      // Do not serialize (non-volatile) loads of constant memory with anything.
      Root = DAG.getEntryNode();
      ConstantMemory = true;
@@ -2907,8 +2923,7 @@ void SelectionDAGBuilder::visitLoad(const LoadInst &I) {
      Root = TLI.prepareVolatileOrAtomicLoad(Root, dl, DAG);
  
    SmallVector<SDValue, 4> Values(NumValues);
-  SmallVector<SDValue, 4> Chains(std::min(unsigned(MaxParallelChains),
-                                          NumValues));
+  SmallVector<SDValue, 4> Chains(std::min(MaxParallelChains, NumValues));
    EVT PtrVT = Ptr.getValueType();
    unsigned ChainI = 0;
    for (unsigned i = 0; i != NumValues; ++i, ++ChainI) {
@@ -2972,8 +2987,7 @@ void SelectionDAGBuilder::visitStore(const StoreInst &I) {
    SDValue Ptr = getValue(PtrV);
  
    SDValue Root = getRoot();
-  SmallVector<SDValue, 4> Chains(std::min(unsigned(MaxParallelChains),
-                                          NumValues));
+  SmallVector<SDValue, 4> Chains(std::min(MaxParallelChains, NumValues));
    EVT PtrVT = Ptr.getValueType();
    bool isVolatile = I.isVolatile();
    bool isNonTemporal = I.getMetadata(LLVMContext::MD_nontemporal) != nullptr;
@@ -3141,10 +3155,8 @@ void SelectionDAGBuilder::visitMaskedLoad(const CallInst &I) {
    const MDNode *Ranges = I.getMetadata(LLVMContext::MD_range);
  
    SDValue InChain = DAG.getRoot();
-  if (AA->pointsToConstantMemory(
-      AliasAnalysis::Location(PtrOperand,
-                              AA->getTypeStoreSize(I.getType()),
-                              AAInfo))) {
+  if (AA->pointsToConstantMemory(MemoryLocation(
+          PtrOperand, AA->getTypeStoreSize(I.getType()), AAInfo))) {
      // Do not serialize (non-volatile) loads of constant memory with anything.
      InChain = DAG.getEntryNode();
    }
@@ -3186,10 +3198,9 @@ void SelectionDAGBuilder::visitMaskedGather(const CallInst &I) {
    Value *BasePtr = Ptr;
    bool UniformBase = getUniformBase(BasePtr, Base, Index, this);
    bool ConstantMemory = false;
-  if (UniformBase && AA->pointsToConstantMemory(
-      AliasAnalysis::Location(BasePtr,
-                                   AA->getTypeStoreSize(I.getType()),
-                              AAInfo))) {
+  if (UniformBase &&
+      AA->pointsToConstantMemory(
+          MemoryLocation(BasePtr, AA->getTypeStoreSize(I.getType()), AAInfo))) {
      // Do not serialize (non-volatile) loads of constant memory with anything.
      Root = DAG.getEntryNode();
      ConstantMemory = true;
@@ -4769,7 +4780,10 @@ SelectionDAGBuilder::visitIntrinsicCall(const CallInst &I, unsigned Intrinsic) {
  
    case Intrinsic::debugtrap:
    case Intrinsic::trap: {
-    StringRef TrapFuncName = TM.Options.getTrapFunctionName();
+    StringRef TrapFuncName =
+        I.getAttributes()
+            .getAttribute(AttributeSet::FunctionIndex, "trap-func-name")
+            .getValueAsString();
      if (TrapFuncName.empty()) {
        ISD::NodeType Op = (Intrinsic == Intrinsic::trap) ?
          ISD::TRAP : ISD::DEBUGTRAP;
@@ -4959,11 +4973,9 @@ SelectionDAGBuilder::visitIntrinsicCall(const CallInst &I, unsigned Intrinsic) {
          MF.getMMI().getContext().getOrCreateFrameAllocSymbol(
              GlobalValue::getRealLinkageName(Fn->getName()), IdxVal);
  
-    // Create a TargetExternalSymbol for the label to avoid any target lowering
+    // Create a MCSymbol for the label to avoid any target lowering
      // that would make this PC relative.
-    StringRef Name = FrameAllocSym->getName();
-    assert(Name.data()[Name.size()] == '\0' && "not null terminated");
-    SDValue OffsetSym = DAG.getTargetExternalSymbol(Name.data(), PtrVT);
+    SDValue OffsetSym = DAG.getMCSymbol(FrameAllocSym, PtrVT);
      SDValue OffsetVal =
          DAG.getNode(ISD::FRAME_ALLOC_RECOVER, sdl, PtrVT, OffsetSym);
  
@@ -4983,6 +4995,7 @@ SelectionDAGBuilder::visitIntrinsicCall(const CallInst &I, unsigned Intrinsic) {
      assert(Reg && "cannot get exception code on this platform");
      MVT PtrVT = TLI.getPointerTy();
      const TargetRegisterClass *PtrRC = TLI.getRegClassFor(PtrVT);
+    assert(FuncInfo.MBB->isLandingPad() && "eh.exceptioncode in non-lpad");
      unsigned VReg = FuncInfo.MBB->addLiveIn(Reg, PtrRC);
      SDValue N =
          DAG.getCopyFromReg(DAG.getEntryNode(), getCurSDLoc(), VReg, PtrVT);
@@ -5656,9 +5669,8 @@ public:
    /// getCallOperandValEVT - Return the EVT of the Value* that this operand
    /// corresponds to.  If there is no Value* for this operand, it returns
    /// MVT::Other.
-  EVT getCallOperandValEVT(LLVMContext &Context,
-                           const TargetLowering &TLI,
-                           const DataLayout *DL) const {
+  EVT getCallOperandValEVT(LLVMContext &Context, const TargetLowering &TLI,
+                           const DataLayout &DL) const {
      if (!CallOperandVal) return MVT::Other;
  
      if (isa<BasicBlock>(CallOperandVal))
@@ -5684,7 +5696,7 @@ public:
      // If OpTy is not a single value, it may be a struct/union that we
      // can tile with integers.
      if (!OpTy->isSingleValueType() && OpTy->isSized()) {
-      unsigned BitSize = DL->getTypeSizeInBits(OpTy);
+      unsigned BitSize = DL.getTypeSizeInBits(OpTy);
        switch (BitSize) {
        default: break;
        case 1:
@@ -5824,8 +5836,8 @@ void SelectionDAGBuilder::visitInlineAsm(ImmutableCallSite CS) {
    SDISelAsmOperandInfoVector ConstraintOperands;
  
    const TargetLowering &TLI = DAG.getTargetLoweringInfo();
-  TargetLowering::AsmOperandInfoVector TargetConstraints =
-      TLI.ParseConstraints(DAG.getSubtarget().getRegisterInfo(), CS);
+  TargetLowering::AsmOperandInfoVector TargetConstraints = TLI.ParseConstraints(
+      DAG.getDataLayout(), DAG.getSubtarget().getRegisterInfo(), CS);
  
    bool hasMemory = false;
  
@@ -5874,8 +5886,8 @@ void SelectionDAGBuilder::visitInlineAsm(ImmutableCallSite CS) {
          OpInfo.CallOperand = getValue(OpInfo.CallOperandVal);
        }
  
-      OpVT =
-          OpInfo.getCallOperandValEVT(*DAG.getContext(), TLI, DL).getSimpleVT();
+      OpVT = OpInfo.getCallOperandValEVT(*DAG.getContext(), TLI,
+                                         DAG.getDataLayout()).getSimpleVT();
      }
  
      OpInfo.ConstraintVT = OpVT;
@@ -5969,8 +5981,9 @@ void SelectionDAGBuilder::visitInlineAsm(ImmutableCallSite CS) {
          // Otherwise, create a stack slot and emit a store to it before the
          // asm.
          Type *Ty = OpVal->getType();
-        uint64_t TySize = TLI.getDataLayout()->getTypeAllocSize(Ty);
-        unsigned Align  = TLI.getDataLayout()->getPrefTypeAlignment(Ty);
+        auto &DL = DAG.getDataLayout();
+        uint64_t TySize = DL.getTypeAllocSize(Ty);
+        unsigned Align = DL.getPrefTypeAlignment(Ty);
          MachineFunction &MF = DAG.getMachineFunction();
          int SSFI = MF.getFrameInfo()->CreateStackObject(TySize, Align, false);
          SDValue StackSlot = DAG.getFrameIndex(SSFI, TLI.getPointerTy());
@@ -6366,7 +6379,7 @@ void SelectionDAGBuilder::visitVAStart(const CallInst &I) {
  
  void SelectionDAGBuilder::visitVAArg(const VAArgInst &I) {
    const TargetLowering &TLI = DAG.getTargetLoweringInfo();
-  const DataLayout &DL = *TLI.getDataLayout();
+  const DataLayout &DL = DAG.getDataLayout();
    SDValue V = DAG.getVAArg(TLI.getValueType(I.getType()), getCurSDLoc(),
                             getRoot(), getValue(I.getOperand(0)),
                             DAG.getSrcValue(I.getOperand(0)),
@@ -6704,6 +6717,7 @@ TargetLowering::LowerCallTo(TargetLowering::CallLoweringInfo &CLI) const {
    Type *OrigRetTy = CLI.RetTy;
    SmallVector<EVT, 4> RetTys;
    SmallVector<uint64_t, 4> Offsets;
+  auto &DL = CLI.DAG.getDataLayout();
    ComputeValueVTs(*this, CLI.RetTy, RetTys, &Offsets);
  
    SmallVector<ISD::OutputArg, 4> Outs;
@@ -6719,8 +6733,8 @@ TargetLowering::LowerCallTo(TargetLowering::CallLoweringInfo &CLI) const {
      // FIXME: equivalent assert?
      // assert(!CS.hasInAllocaArgument() &&
      //        "sret demotion is incompatible with inalloca");
-    uint64_t TySize = getDataLayout()->getTypeAllocSize(CLI.RetTy);
-    unsigned Align  = getDataLayout()->getPrefTypeAlignment(CLI.RetTy);
+    uint64_t TySize = DL.getTypeAllocSize(CLI.RetTy);
+    unsigned Align = DL.getPrefTypeAlignment(CLI.RetTy);
      MachineFunction &MF = CLI.DAG.getMachineFunction();
      DemoteStackIdx = MF.getFrameInfo()->CreateStackObject(TySize, Align, false);
      Type *StackSlotPtrType = PointerType::getUnqual(CLI.RetTy);
@@ -6783,7 +6797,7 @@ TargetLowering::LowerCallTo(TargetLowering::CallLoweringInfo &CLI) const {
        SDValue Op = SDValue(Args[i].Node.getNode(),
                             Args[i].Node.getResNo() + Value);
        ISD::ArgFlagsTy Flags;
-      unsigned OriginalAlignment = getDataLayout()->getABITypeAlignment(ArgTy);
+      unsigned OriginalAlignment = DL.getABITypeAlignment(ArgTy);
  
        if (Args[i].isZExt)
          Flags.setZExt();
@@ -6807,7 +6821,7 @@ TargetLowering::LowerCallTo(TargetLowering::CallLoweringInfo &CLI) const {
        if (Args[i].isByVal || Args[i].isInAlloca) {
          PointerType *Ty = cast<PointerType>(Args[i].Ty);
          Type *ElementTy = Ty->getElementType();
-        Flags.setByValSize(getDataLayout()->getTypeAllocSize(ElementTy));
+        Flags.setByValSize(DL.getTypeAllocSize(ElementTy));
          // For ByVal, alignment should come from FE.  BE will guess if this
          // info is not there but there are cases it cannot get right.
          unsigned FrameAlign;
@@ -7016,7 +7030,7 @@ static bool isOnlyUsedInEntryBlock(const Argument *A, bool FastISel) {
  void SelectionDAGISel::LowerArguments(const Function &F) {
    SelectionDAG &DAG = SDB->DAG;
    SDLoc dl = SDB->getCurSDLoc();
-  const DataLayout *DL = TLI->getDataLayout();
+  const DataLayout &DL = DAG.getDataLayout();
    SmallVector<ISD::InputArg, 16> Ins;
  
    if (!FuncInfo->CanLowerReturn) {
@@ -7052,7 +7066,7 @@ void SelectionDAGISel::LowerArguments(const Function &F) {
        EVT VT = ValueVTs[Value];
        Type *ArgTy = VT.getTypeForEVT(*DAG.getContext());
        ISD::ArgFlagsTy Flags;
-      unsigned OriginalAlignment = DL->getABITypeAlignment(ArgTy);
+      unsigned OriginalAlignment = DL.getABITypeAlignment(ArgTy);
  
        if (F.getAttributes().hasAttribute(Idx, Attribute::ZExt))
          Flags.setZExt();
@@ -7076,7 +7090,7 @@ void SelectionDAGISel::LowerArguments(const Function &F) {
        if (Flags.isByVal() || Flags.isInAlloca()) {
          PointerType *Ty = cast<PointerType>(I->getType());
          Type *ElementTy = Ty->getElementType();
-        Flags.setByValSize(DL->getTypeAllocSize(ElementTy));
+        Flags.setByValSize(DL.getTypeAllocSize(ElementTy));
          // For ByVal, alignment should be passed from FE.  BE will guess if
          // this info is not there but there are cases it cannot get right.
          unsigned FrameAlign;
@@ -7486,6 +7500,31 @@ void SelectionDAGBuilder::findJumpTables(CaseClusterVector &Clusters,
    const int64_t N = Clusters.size();
    const unsigned MinJumpTableSize = TLI.getMinimumJumpTableEntries();
  
+  // TotalCases[i]: Total nbr of cases in Clusters[0..i].
+  SmallVector<unsigned, 8> TotalCases(N);
+
+  for (unsigned i = 0; i < N; ++i) {
+    APInt Hi = Clusters[i].High->getValue();
+    APInt Lo = Clusters[i].Low->getValue();
+    TotalCases[i] = (Hi - Lo).getLimitedValue() + 1;
+    if (i != 0)
+      TotalCases[i] += TotalCases[i - 1];
+  }
+
+  if (N >= MinJumpTableSize && isDense(Clusters, &TotalCases[0], 0, N - 1)) {
+    // Cheap case: the whole range might be suitable for jump table.
+    CaseCluster JTCluster;
+    if (buildJumpTable(Clusters, 0, N - 1, SI, DefaultMBB, JTCluster)) {
+      Clusters[0] = JTCluster;
+      Clusters.resize(1);
+      return;
+    }
+  }
+
+  // The algorithm below is not suitable for -O0.
+  if (TM.getOptLevel() == CodeGenOpt::None)
+    return;
+
    // Split Clusters into minimum number of dense partitions. The algorithm uses
    // the same idea as Kannan & Proebsting "Correction to 'Producing Good Code
    // for the Case Statement'" (1994), but builds the MinPartitions array in
@@ -7499,16 +7538,6 @@ void SelectionDAGBuilder::findJumpTables(CaseClusterVector &Clusters,
    SmallVector<unsigned, 8> LastElement(N);
    // NumTables[i]: nbr of >= MinJumpTableSize partitions from Clusters[i..N-1].
    SmallVector<unsigned, 8> NumTables(N);
-  // TotalCases[i]: Total nbr of cases in Clusters[0..i].
-  SmallVector<unsigned, 8> TotalCases(N);
-
-  for (unsigned i = 0; i < N; ++i) {
-    APInt Hi = Clusters[i].High->getValue();
-    APInt Lo = Clusters[i].Low->getValue();
-    TotalCases[i] = (Hi - Lo).getLimitedValue() + 1;
-    if (i != 0)
-      TotalCases[i] += TotalCases[i - 1];
-  }
  
    // Base case: There is only one way to partition Clusters[N-1].
    MinPartitions[N - 1] = 1;
@@ -7566,7 +7595,7 @@ void SelectionDAGBuilder::findJumpTables(CaseClusterVector &Clusters,
  
  bool SelectionDAGBuilder::rangeFitsInWord(const APInt &Low, const APInt &High) {
    // FIXME: Using the pointer type doesn't seem ideal.
-  uint64_t BW = DAG.getTargetLoweringInfo().getPointerTy().getSizeInBits();
+  uint64_t BW = DAG.getDataLayout().getPointerSizeInBits();
    uint64_t Range = (High - Low).getLimitedValue(UINT64_MAX - 1) + 1;
    return Range <= BW;
  }
@@ -7696,6 +7725,10 @@ void SelectionDAGBuilder::findBitTestClusters(CaseClusterVector &Clusters,
      assert(Clusters[i-1].High->getValue().slt(Clusters[i].Low->getValue()));
  #endif
  
+  // The algorithm below is not suitable for -O0.
+  if (TM.getOptLevel() == CodeGenOpt::None)
+    return;
+
    // If target does not have legal shift left, do not emit bit tests at all.
    const TargetLowering &TLI = DAG.getTargetLoweringInfo();
    EVT PTy = TLI.getPointerTy();
@@ -7959,6 +7992,18 @@ void SelectionDAGBuilder::lowerWorkItem(SwitchWorkListItem W, Value *Cond,
    }
  }
  
+unsigned SelectionDAGBuilder::caseClusterRank(const CaseCluster &CC,
+                                              CaseClusterIt First,
+                                              CaseClusterIt Last) {
+  return std::count_if(First, Last + 1, [&](const CaseCluster &X) {
+    if (X.Weight != CC.Weight)
+      return X.Weight > CC.Weight;
+
+    // Ties are broken by comparing the case value.
+    return X.Low->getValue().slt(CC.Low->getValue());
+  });
+}
+
  void SelectionDAGBuilder::splitWorkItem(SwitchWorkList &WorkList,
                                          const SwitchWorkListItem &W,
                                          Value *Cond,
@@ -7988,6 +8033,48 @@ void SelectionDAGBuilder::splitWorkItem(SwitchWorkList &WorkList,
        RightWeight += (--FirstRight)->Weight;
      I++;
    }
+
+  for (;;) {
+    // Our binary search tree differs from a typical BST in that ours can have up
+    // to three values in each leaf. The pivot selection above doesn't take that
+    // into account, which means the tree might require more nodes and be less
+    // efficient. We compensate for this here.
+
+    unsigned NumLeft = LastLeft - W.FirstCluster + 1;
+    unsigned NumRight = W.LastCluster - FirstRight + 1;
+
+    if (std::min(NumLeft, NumRight) < 3 && std::max(NumLeft, NumRight) > 3) {
+      // If one side has less than 3 clusters, and the other has more than 3,
+      // consider taking a cluster from the other side.
+
+      if (NumLeft < NumRight) {
+        // Consider moving the first cluster on the right to the left side.
+        CaseCluster &CC = *FirstRight;
+        unsigned RightSideRank = caseClusterRank(CC, FirstRight, W.LastCluster);
+        unsigned LeftSideRank = caseClusterRank(CC, W.FirstCluster, LastLeft);
+        if (LeftSideRank <= RightSideRank) {
+          // Moving the cluster to the left does not demote it.
+          ++LastLeft;
+          ++FirstRight;
+          continue;
+        }
+      } else {
+        assert(NumRight < NumLeft);
+        // Consider moving the last element on the left to the right side.
+        CaseCluster &CC = *LastLeft;
+        unsigned LeftSideRank = caseClusterRank(CC, W.FirstCluster, LastLeft);
+        unsigned RightSideRank = caseClusterRank(CC, FirstRight, W.LastCluster);
+        if (RightSideRank <= LeftSideRank) {
+          // Moving the cluster to the right does not demot it.
+          --LastLeft;
+          --FirstRight;
+          continue;
+        }
+      }
+    }
+    break;
+  }
+
    assert(LastLeft + 1 == FirstRight);
    assert(LastLeft >= W.FirstCluster);
    assert(FirstRight <= W.LastCluster);
@@ -8111,11 +8198,8 @@ void SelectionDAGBuilder::visitSwitch(const SwitchInst &SI) {
      return;
    }
  
-  if (TM.getOptLevel() != CodeGenOpt::None) {
-    findJumpTables(Clusters, &SI, DefaultMBB);
-    findBitTestClusters(Clusters, &SI);
-  }
-
+  findJumpTables(Clusters, &SI, DefaultMBB);
+  findBitTestClusters(Clusters, &SI);
  
    DEBUG({
      dbgs() << "Case clusters: ";