[fast-isel] SelectInsertValue seems to be causing miscompiles for ARM. Disable while...

[oota-llvm.git] / lib / CodeGen / SelectionDAG / TargetLowering.cpp
diff --git a/lib/CodeGen/SelectionDAG/TargetLowering.cpp b/lib/CodeGen/SelectionDAG/TargetLowering.cpp

index 403d0d9fb2214aac4050f98daf43931cee74595d..ee329dc671ea118e647b359a0aeff33d1c5de018 100644 (file)
--- a/lib/CodeGen/SelectionDAG/TargetLowering.cpp
+++ b/lib/CodeGen/SelectionDAG/TargetLowering.cpp
@@ -36,7 +36,7 @@ using namespace llvm;
  /// - the promotion of vector elements. This feature is disabled by default
  /// and only enabled using this flag.
  static cl::opt<bool>
-AllowPromoteIntElem("promote-elements", cl::Hidden,
+AllowPromoteIntElem("promote-elements", cl::Hidden, cl::init(true),
    cl::desc("Allow promotion of integer vector element types"));
  
  namespace llvm {
@@ -81,6 +81,9 @@ static void InitLibcallNames(const char **Names) {
    Names[RTLIB::MUL_I32] = "__mulsi3";
    Names[RTLIB::MUL_I64] = "__muldi3";
    Names[RTLIB::MUL_I128] = "__multi3";
+  Names[RTLIB::MULO_I32] = "__mulosi4";
+  Names[RTLIB::MULO_I64] = "__mulodi4";
+  Names[RTLIB::MULO_I128] = "__muloti4";
    Names[RTLIB::SDIV_I8] = "__divqi3";
    Names[RTLIB::SDIV_I16] = "__divhi3";
    Names[RTLIB::SDIV_I32] = "__divsi3";
@@ -136,6 +139,10 @@ static void InitLibcallNames(const char **Names) {
    Names[RTLIB::REM_F64] = "fmod";
    Names[RTLIB::REM_F80] = "fmodl";
    Names[RTLIB::REM_PPCF128] = "fmodl";
+  Names[RTLIB::FMA_F32] = "fmaf";
+  Names[RTLIB::FMA_F64] = "fma";
+  Names[RTLIB::FMA_F80] = "fmal";
+  Names[RTLIB::FMA_PPCF128] = "fmal";
    Names[RTLIB::POWI_F32] = "__powisf2";
    Names[RTLIB::POWI_F64] = "__powidf2";
    Names[RTLIB::POWI_F80] = "__powixf2";
@@ -310,7 +317,7 @@ static void InitLibcallNames(const char **Names) {
    Names[RTLIB::SYNC_FETCH_AND_OR_8] = "__sync_fetch_and_or_8";
    Names[RTLIB::SYNC_FETCH_AND_XOR_1] = "__sync_fetch_and_xor_1";
    Names[RTLIB::SYNC_FETCH_AND_XOR_2] = "__sync_fetch_and_xor_2";
-  Names[RTLIB::SYNC_FETCH_AND_XOR_4] = "__sync_fetch_and-xor_4";
+  Names[RTLIB::SYNC_FETCH_AND_XOR_4] = "__sync_fetch_and_xor_4";
    Names[RTLIB::SYNC_FETCH_AND_XOR_8] = "__sync_fetch_and_xor_8";
    Names[RTLIB::SYNC_FETCH_AND_NAND_1] = "__sync_fetch_and_nand_1";
    Names[RTLIB::SYNC_FETCH_AND_NAND_2] = "__sync_fetch_and_nand_2";
@@ -570,16 +577,26 @@ TargetLowering::TargetLowering(const TargetMachine &tm,
    setOperationAction(ISD::ConstantFP, MVT::f80, Expand);
  
    // These library functions default to expand.
-  setOperationAction(ISD::FLOG , MVT::f64, Expand);
-  setOperationAction(ISD::FLOG2, MVT::f64, Expand);
-  setOperationAction(ISD::FLOG10,MVT::f64, Expand);
-  setOperationAction(ISD::FEXP , MVT::f64, Expand);
-  setOperationAction(ISD::FEXP2, MVT::f64, Expand);
-  setOperationAction(ISD::FLOG , MVT::f32, Expand);
-  setOperationAction(ISD::FLOG2, MVT::f32, Expand);
-  setOperationAction(ISD::FLOG10,MVT::f32, Expand);
-  setOperationAction(ISD::FEXP , MVT::f32, Expand);
-  setOperationAction(ISD::FEXP2, MVT::f32, Expand);
+  setOperationAction(ISD::FLOG ,  MVT::f64, Expand);
+  setOperationAction(ISD::FLOG2,  MVT::f64, Expand);
+  setOperationAction(ISD::FLOG10, MVT::f64, Expand);
+  setOperationAction(ISD::FEXP ,  MVT::f64, Expand);
+  setOperationAction(ISD::FEXP2,  MVT::f64, Expand);
+  setOperationAction(ISD::FFLOOR, MVT::f64, Expand);
+  setOperationAction(ISD::FNEARBYINT, MVT::f64, Expand);
+  setOperationAction(ISD::FCEIL,  MVT::f64, Expand);
+  setOperationAction(ISD::FRINT,  MVT::f64, Expand);
+  setOperationAction(ISD::FTRUNC, MVT::f64, Expand);
+  setOperationAction(ISD::FLOG ,  MVT::f32, Expand);
+  setOperationAction(ISD::FLOG2,  MVT::f32, Expand);
+  setOperationAction(ISD::FLOG10, MVT::f32, Expand);
+  setOperationAction(ISD::FEXP ,  MVT::f32, Expand);
+  setOperationAction(ISD::FEXP2,  MVT::f32, Expand);
+  setOperationAction(ISD::FFLOOR, MVT::f32, Expand);
+  setOperationAction(ISD::FNEARBYINT, MVT::f32, Expand);
+  setOperationAction(ISD::FCEIL,  MVT::f32, Expand);
+  setOperationAction(ISD::FRINT,  MVT::f32, Expand);
+  setOperationAction(ISD::FTRUNC, MVT::f32, Expand);
  
    // Default ISD::TRAP to expand (which turns it into abort).
    setOperationAction(ISD::TRAP, MVT::Other, Expand);
@@ -602,7 +619,8 @@ TargetLowering::TargetLowering(const TargetMachine &tm,
    ExceptionPointerRegister = 0;
    ExceptionSelectorRegister = 0;
    BooleanContents = UndefinedBooleanContent;
-  SchedPreferenceInfo = Sched::Latency;
+  BooleanVectorContents = UndefinedBooleanContent;
+  SchedPreferenceInfo = Sched::ILP;
    JumpBufSize = 0;
    JumpBufAlignment = 0;
    MinFunctionAlignment = 0;
@@ -610,6 +628,7 @@ TargetLowering::TargetLowering(const TargetMachine &tm,
    PrefLoopAlignment = 0;
    MinStackArgumentAlignment = 1;
    ShouldFoldAtomicFences = false;
+  InsertFencesForAtomic = false;
  
    InitLibcallNames(LibcallRoutineNames);
    InitCmpLibcallCCs(CmpLibcallCCs);
@@ -673,10 +692,16 @@ static unsigned getVectorTypeBreakdownMVT(MVT VT, MVT &IntermediateVT,
      NewVT = EltTy;
    IntermediateVT = NewVT;
  
+  unsigned NewVTSize = NewVT.getSizeInBits();
+
+  // Convert sizes such as i33 to i64.
+  if (!isPowerOf2_32(NewVTSize))
+    NewVTSize = NextPowerOf2(NewVTSize);
+
    EVT DestVT = TLI->getRegisterType(NewVT);
    RegisterVT = DestVT;
    if (EVT(DestVT).bitsLT(NewVT))    // Value is expanded, e.g. i64 -> i16.
-    return NumVectorRegs*(NewVT.getSizeInBits()/DestVT.getSizeInBits());
+    return NumVectorRegs*(NewVTSize/DestVT.getSizeInBits());
  
    // Otherwise, promotion or legal types use the same number of registers as
    // the vector decimated to the appropriate level.
@@ -901,7 +926,8 @@ const char *TargetLowering::getTargetNodeName(unsigned Opcode) const {
  }
  
  
-MVT::SimpleValueType TargetLowering::getSetCCResultType(EVT VT) const {
+EVT TargetLowering::getSetCCResultType(EVT VT) const {
+  assert(!VT.isVector() && "No default SetCC type for vectors!");
    return PointerTy.SimpleTy;
  }
  
@@ -965,8 +991,14 @@ unsigned TargetLowering::getVectorTypeBreakdown(LLVMContext &Context, EVT VT,
  
    EVT DestVT = getRegisterType(Context, NewVT);
    RegisterVT = DestVT;
+  unsigned NewVTSize = NewVT.getSizeInBits();
+
+  // Convert sizes such as i33 to i64.
+  if (!isPowerOf2_32(NewVTSize))
+    NewVTSize = NextPowerOf2(NewVTSize);
+
    if (DestVT.bitsLT(NewVT))   // Value is expanded, e.g. i64 -> i16.
-    return NumVectorRegs*(NewVT.getSizeInBits()/DestVT.getSizeInBits());
+    return NumVectorRegs*(NewVTSize/DestVT.getSizeInBits());
  
    // Otherwise, promotion or legal types use the same number of registers as
    // the vector decimated to the appropriate level.
@@ -977,7 +1009,7 @@ unsigned TargetLowering::getVectorTypeBreakdown(LLVMContext &Context, EVT VT,
  /// type of the given function.  This does not require a DAG or a return value,
  /// and is suitable for use before any DAGs for the function are constructed.
  /// TODO: Move this out of TargetLowering.cpp.
-void llvm::GetReturnInfo(const Type* ReturnType, Attributes attr,
+void llvm::GetReturnInfo(Type* ReturnType, Attributes attr,
                           SmallVectorImpl<ISD::OutputArg> &Outs,
                           const TargetLowering &TLI,
                           SmallVectorImpl<uint64_t> *Offsets) {
@@ -1035,7 +1067,7 @@ void llvm::GetReturnInfo(const Type* ReturnType, Attributes attr,
  /// getByValTypeAlignment - Return the desired alignment for ByVal aggregate
  /// function arguments in the caller parameter area.  This is the actual
  /// alignment, not its logarithm.
-unsigned TargetLowering::getByValTypeAlignment(const Type *Ty) const {
+unsigned TargetLowering::getByValTypeAlignment(Type *Ty) const {
    return TD->getCallFrameTypeAlignment(Ty);
  }
  
@@ -1451,9 +1483,8 @@ bool TargetLowering::SimplifyDemandedBits(SDValue Op,
        if (InOp.getNode()->getOpcode() == ISD::ANY_EXTEND) {
          SDValue InnerOp = InOp.getNode()->getOperand(0);
          EVT InnerVT = InnerOp.getValueType();
-        if ((APInt::getHighBitsSet(BitWidth,
-                                   BitWidth - InnerVT.getSizeInBits()) &
-               DemandedMask) == 0 &&
+        unsigned InnerBits = InnerVT.getSizeInBits();
+        if (ShAmt < InnerBits && NewMask.lshr(InnerBits) == 0 &&
              isTypeDesirableForOp(ISD::SHL, InnerVT)) {
            EVT ShTy = getShiftAmountTy(InnerVT);
            if (!APInt(BitWidth, ShAmt).isIntN(ShTy.getSizeInBits()))
@@ -1523,7 +1554,7 @@ bool TargetLowering::SimplifyDemandedBits(SDValue Op,
      // always convert this into a logical shr, even if the shift amount is
      // variable.  The low bit of the shift cannot be an input sign bit unless
      // the shift amount is >= the size of the datatype, which is undefined.
-    if (DemandedMask == 1)
+    if (NewMask == 1)
        return TLO.CombineTo(Op,
                             TLO.DAG.getNode(ISD::SRL, dl, Op.getValueType(),
                                             Op.getOperand(0), Op.getOperand(1)));
@@ -1745,33 +1776,35 @@ bool TargetLowering::SimplifyDemandedBits(SDValue Op,
      break;
    }
    case ISD::AssertZext: {
-    // Demand all the bits of the input that are demanded in the output.
-    // The low bits are obvious; the high bits are demanded because we're
-    // asserting that they're zero here.
-    if (SimplifyDemandedBits(Op.getOperand(0), NewMask,
+    // AssertZext demands all of the high bits, plus any of the low bits
+    // demanded by its users.
+    EVT VT = cast<VTSDNode>(Op.getOperand(1))->getVT();
+    APInt InMask = APInt::getLowBitsSet(BitWidth,
+                                        VT.getSizeInBits());
+    if (SimplifyDemandedBits(Op.getOperand(0), ~InMask | NewMask,
                               KnownZero, KnownOne, TLO, Depth+1))
        return true;
      assert((KnownZero & KnownOne) == 0 && "Bits known to be one AND zero?");
  
-    EVT VT = cast<VTSDNode>(Op.getOperand(1))->getVT();
-    APInt InMask = APInt::getLowBitsSet(BitWidth,
-                                        VT.getSizeInBits());
      KnownZero |= ~InMask & NewMask;
      break;
    }
    case ISD::BITCAST:
-    // If this is an FP->Int bitcast and if the sign bit is the only thing that
-    // is demanded, turn this into a FGETSIGN.
-    if (NewMask == APInt::getSignBit(Op.getValueType().getSizeInBits()) &&
-        Op.getOperand(0).getValueType().isFloatingPoint() &&
-        !Op.getOperand(0).getValueType().isVector()) {
-      if (isOperationLegalOrCustom(ISD::FGETSIGN, MVT::i32)) {
-        EVT Ty = (isOperationLegalOrCustom(ISD::FGETSIGN, Op.getValueType())) ?
-          Op.getValueType() : MVT::i32;
+    // If this is an FP->Int bitcast and if the sign bit is the only
+    // thing demanded, turn this into a FGETSIGN.
+    if (!Op.getValueType().isVector() &&
+        !Op.getOperand(0).getValueType().isVector() &&
+        NewMask == APInt::getSignBit(Op.getValueType().getSizeInBits()) &&
+        Op.getOperand(0).getValueType().isFloatingPoint()) {
+      bool OpVTLegal = isOperationLegalOrCustom(ISD::FGETSIGN, Op.getValueType());
+      bool i32Legal  = isOperationLegalOrCustom(ISD::FGETSIGN, MVT::i32);
+      if ((OpVTLegal || i32Legal) && Op.getValueType().isSimple()) {
+        EVT Ty = OpVTLegal ? Op.getValueType() : MVT::i32;
          // Make a FGETSIGN + SHL to move the sign bit into the appropriate
          // place.  We expect the SHL to be eliminated by other optimizations.
          SDValue Sign = TLO.DAG.getNode(ISD::FGETSIGN, dl, Ty, Op.getOperand(0));
-        if (Ty != Op.getValueType())
+        unsigned OpVTSizeInBits = Op.getValueType().getSizeInBits();
+        if (!OpVTLegal && OpVTSizeInBits > 32)
            Sign = TLO.DAG.getNode(ISD::ZERO_EXTEND, dl, Op.getValueType(), Sign);
          unsigned ShVal = Op.getValueType().getSizeInBits()-1;
          SDValue ShAmt = TLO.DAG.getConstant(ShVal, Op.getValueType());
@@ -1900,7 +1933,7 @@ TargetLowering::SimplifySetCC(EVT VT, SDValue N0, SDValue N1,
    // comparisons.
    if (isa<ConstantSDNode>(N0.getNode()))
      return DAG.getSetCC(dl, VT, N1, N0, ISD::getSetCCSwappedOperands(Cond));
-  
+
    if (ConstantSDNode *N1C = dyn_cast<ConstantSDNode>(N1.getNode())) {
      const APInt &C1 = N1C->getAPIntValue();
  
@@ -2037,7 +2070,7 @@ TargetLowering::SimplifySetCC(EVT VT, SDValue N0, SDValue N1,
            unsigned NewAlign = MinAlign(Lod->getAlignment(), bestOffset);
            SDValue NewLoad = DAG.getLoad(newVT, dl, Lod->getChain(), Ptr,
                                  Lod->getPointerInfo().getWithOffset(bestOffset),
-                                        false, false, NewAlign);
+                                        false, false, false, NewAlign);
            return DAG.getSetCC(dl, VT,
                                DAG.getNode(ISD::AND, dl, newVT, NewLoad,
                                        DAG.getConstant(bestMask.trunc(bestWidth),
@@ -2170,7 +2203,7 @@ TargetLowering::SimplifySetCC(EVT VT, SDValue N0, SDValue N1,
          }
        } else if (N1C->getAPIntValue() == 1 &&
                   (VT == MVT::i1 ||
-                  getBooleanContents() == ZeroOrOneBooleanContent)) {
+                  getBooleanContents(false) == ZeroOrOneBooleanContent)) {
          SDValue Op0 = N0;
          if (Op0.getOpcode() == ISD::TRUNCATE)
            Op0 = Op0.getOperand(0);
@@ -2606,7 +2639,6 @@ PerformDAGCombine(SDNode *N, DAGCombinerInfo &DCI) const {
  
  TargetLowering::ConstraintType
  TargetLowering::getConstraintType(const std::string &Constraint) const {
-  // FIXME: lots more standard ones to handle.
    if (Constraint.size() == 1) {
      switch (Constraint[0]) {
      default: break;
@@ -2659,9 +2691,9 @@ void TargetLowering::LowerAsmOperandForConstraint(SDValue Op,
                                                    std::string &Constraint,
                                                    std::vector<SDValue> &Ops,
                                                    SelectionDAG &DAG) const {
-  
+
    if (Constraint.length() > 1) return;
-  
+
    char ConstraintLetter = Constraint[0];
    switch (ConstraintLetter) {
    default: break;
@@ -2720,13 +2752,6 @@ void TargetLowering::LowerAsmOperandForConstraint(SDValue Op,
    }
  }
  
-std::vector<unsigned> TargetLowering::
-getRegClassForInlineAsmConstraint(const std::string &Constraint,
-                                  EVT VT) const {
-  return std::vector<unsigned>();
-}
-
-
  std::pair<unsigned, const TargetRegisterClass*> TargetLowering::
  getRegForInlineAsmConstraint(const std::string &Constraint,
                               EVT VT) const {
@@ -2745,16 +2770,8 @@ getRegForInlineAsmConstraint(const std::string &Constraint,
  
      // If none of the value types for this register class are valid, we
      // can't use it.  For example, 64-bit reg classes on 32-bit targets.
-    bool isLegal = false;
-    for (TargetRegisterClass::vt_iterator I = RC->vt_begin(), E = RC->vt_end();
-         I != E; ++I) {
-      if (isTypeLegal(*I)) {
-        isLegal = true;
-        break;
-      }
-    }
-
-    if (!isLegal) continue;
+    if (!isLegalRC(RC))
+      continue;
  
      for (TargetRegisterClass::iterator I = RC->begin(), E = RC->end();
           I != E; ++I) {
@@ -2827,7 +2844,7 @@ TargetLowering::AsmOperandInfoVector TargetLowering::ParseConstraints(
        // corresponding argument.
        assert(!CS.getType()->isVoidTy() &&
               "Bad inline asm!");
-      if (const StructType *STy = dyn_cast<StructType>(CS.getType())) {
+      if (StructType *STy = dyn_cast<StructType>(CS.getType())) {
          OpInfo.ConstraintVT = getValueType(STy->getElementType(ResNo));
        } else {
          assert(ResNo == 0 && "Asm only has one result!");
@@ -2844,16 +2861,16 @@ TargetLowering::AsmOperandInfoVector TargetLowering::ParseConstraints(
      }
  
      if (OpInfo.CallOperandVal) {
-      const llvm::Type *OpTy = OpInfo.CallOperandVal->getType();
+      llvm::Type *OpTy = OpInfo.CallOperandVal->getType();
        if (OpInfo.isIndirect) {
-        const llvm::PointerType *PtrTy = dyn_cast<PointerType>(OpTy);
+        llvm::PointerType *PtrTy = dyn_cast<PointerType>(OpTy);
          if (!PtrTy)
            report_fatal_error("Indirect operand for inline asm not a pointer!");
          OpTy = PtrTy->getElementType();
        }
-      
+
        // Look for vector wrapped in a struct. e.g. { <16 x i8> }.
-      if (const StructType *STy = dyn_cast<StructType>(OpTy))
+      if (StructType *STy = dyn_cast<StructType>(OpTy))
          if (STy->getNumElements() == 1)
            OpTy = STy->getElementType(0);
  
@@ -2953,10 +2970,13 @@ TargetLowering::AsmOperandInfoVector TargetLowering::ParseConstraints(
        AsmOperandInfo &Input = ConstraintOperands[OpInfo.MatchingInput];
  
        if (OpInfo.ConstraintVT != Input.ConstraintVT) {
+       std::pair<unsigned, const TargetRegisterClass*> MatchRC =
+         getRegForInlineAsmConstraint(OpInfo.ConstraintCode, OpInfo.ConstraintVT);
+       std::pair<unsigned, const TargetRegisterClass*> InputRC =
+         getRegForInlineAsmConstraint(Input.ConstraintCode, Input.ConstraintVT);
          if ((OpInfo.ConstraintVT.isInteger() !=
               Input.ConstraintVT.isInteger()) ||
-            (OpInfo.ConstraintVT.getSizeInBits() !=
-             Input.ConstraintVT.getSizeInBits())) {
+            (MatchRC.second != InputRC.second)) {
            report_fatal_error("Unsupported asm: input constraint"
                               " with a matching output constraint of"
                               " incompatible type!");
@@ -3171,7 +3191,7 @@ void TargetLowering::ComputeConstraintToUse(AsmOperandInfo &OpInfo,
  /// isLegalAddressingMode - Return true if the addressing mode represented
  /// by AM is legal for this target, for a load/store of the specified type.
  bool TargetLowering::isLegalAddressingMode(const AddrMode &AM,
-                                           const Type *Ty) const {
+                                           Type *Ty) const {
    // The default implementation of this implements a conservative RISCy, r+r and
    // r+i addr mode.
  
@@ -3202,12 +3222,39 @@ bool TargetLowering::isLegalAddressingMode(const AddrMode &AM,
    return true;
  }
  
+/// BuildExactSDIV - Given an exact SDIV by a constant, create a
+/// multiplication with the multiplicative inverse of the constant.
+SDValue TargetLowering::BuildExactSDIV(SDValue Op1, SDValue Op2, DebugLoc dl,
+                                       SelectionDAG &DAG) const {
+  ConstantSDNode *C = cast<ConstantSDNode>(Op2);
+  APInt d = C->getAPIntValue();
+  assert(d != 0 && "Division by zero!");
+
+  // Shift the value upfront if it is even, so the LSB is one.
+  unsigned ShAmt = d.countTrailingZeros();
+  if (ShAmt) {
+    // TODO: For UDIV use SRL instead of SRA.
+    SDValue Amt = DAG.getConstant(ShAmt, getShiftAmountTy(Op1.getValueType()));
+    Op1 = DAG.getNode(ISD::SRA, dl, Op1.getValueType(), Op1, Amt);
+    d = d.ashr(ShAmt);
+  }
+
+  // Calculate the multiplicative inverse, using Newton's method.
+  APInt t, xn = d;
+  while ((t = d*xn) != 1)
+    xn *= APInt(d.getBitWidth(), 2) - t;
+
+  Op2 = DAG.getConstant(xn, Op1.getValueType());
+  return DAG.getNode(ISD::MUL, dl, Op1.getValueType(), Op1, Op2);
+}
+
  /// BuildSDIVSequence - Given an ISD::SDIV node expressing a divide by constant,
  /// return a DAG expression to select that will generate the same value by
  /// multiplying by a magic number.  See:
  /// <http://the.wall.riscom.net/books/proc/ppc/cwg/code2.html>
-SDValue TargetLowering::BuildSDIV(SDNode *N, SelectionDAG &DAG,
-                                  std::vector<SDNode*>* Created) const {
+SDValue TargetLowering::
+BuildSDIV(SDNode *N, SelectionDAG &DAG, bool IsAfterLegalization,
+          std::vector<SDNode*>* Created) const {
    EVT VT = N->getValueType(0);
    DebugLoc dl= N->getDebugLoc();
  
@@ -3222,10 +3269,12 @@ SDValue TargetLowering::BuildSDIV(SDNode *N, SelectionDAG &DAG,
    // Multiply the numerator (operand 0) by the magic value
    // FIXME: We should support doing a MUL in a wider type
    SDValue Q;
-  if (isOperationLegalOrCustom(ISD::MULHS, VT))
+  if (IsAfterLegalization ? isOperationLegal(ISD::MULHS, VT) :
+                            isOperationLegalOrCustom(ISD::MULHS, VT))
      Q = DAG.getNode(ISD::MULHS, dl, VT, N->getOperand(0),
                      DAG.getConstant(magics.m, VT));
-  else if (isOperationLegalOrCustom(ISD::SMUL_LOHI, VT))
+  else if (IsAfterLegalization ? isOperationLegal(ISD::SMUL_LOHI, VT) :
+                                 isOperationLegalOrCustom(ISD::SMUL_LOHI, VT))
      Q = SDValue(DAG.getNode(ISD::SMUL_LOHI, dl, DAG.getVTList(VT, VT),
                                N->getOperand(0),
                                DAG.getConstant(magics.m, VT)).getNode(), 1);
@@ -3263,8 +3312,9 @@ SDValue TargetLowering::BuildSDIV(SDNode *N, SelectionDAG &DAG,
  /// return a DAG expression to select that will generate the same value by
  /// multiplying by a magic number.  See:
  /// <http://the.wall.riscom.net/books/proc/ppc/cwg/code2.html>
-SDValue TargetLowering::BuildUDIV(SDNode *N, SelectionDAG &DAG,
-                                  std::vector<SDNode*>* Created) const {
+SDValue TargetLowering::
+BuildUDIV(SDNode *N, SelectionDAG &DAG, bool IsAfterLegalization,
+          std::vector<SDNode*>* Created) const {
    EVT VT = N->getValueType(0);
    DebugLoc dl = N->getDebugLoc();
  
@@ -3296,9 +3346,11 @@ SDValue TargetLowering::BuildUDIV(SDNode *N, SelectionDAG &DAG,
  
    // Multiply the numerator (operand 0) by the magic value
    // FIXME: We should support doing a MUL in a wider type
-  if (isOperationLegalOrCustom(ISD::MULHU, VT))
+  if (IsAfterLegalization ? isOperationLegal(ISD::MULHU, VT) :
+                            isOperationLegalOrCustom(ISD::MULHU, VT))
      Q = DAG.getNode(ISD::MULHU, dl, VT, Q, DAG.getConstant(magics.m, VT));
-  else if (isOperationLegalOrCustom(ISD::UMUL_LOHI, VT))
+  else if (IsAfterLegalization ? isOperationLegal(ISD::UMUL_LOHI, VT) :
+                                 isOperationLegalOrCustom(ISD::UMUL_LOHI, VT))
      Q = SDValue(DAG.getNode(ISD::UMUL_LOHI, dl, DAG.getVTList(VT, VT), Q,
                              DAG.getConstant(magics.m, VT)).getNode(), 1);
    else