[X86] Fold 'if' followed by just an llvm_unreachable into an assert.

[oota-llvm.git] / lib / Target / X86 / X86ISelLowering.cpp
diff --git a/lib/Target/X86/X86ISelLowering.cpp b/lib/Target/X86/X86ISelLowering.cpp

index 63c2b9a21dc15ef186eb965177c81a6e49b835e6..dd085c21f7a74a4362e7622e500fe0bd4a579f42 100644 (file)
--- a/lib/Target/X86/X86ISelLowering.cpp
+++ b/lib/Target/X86/X86ISelLowering.cpp
@@ -75,7 +75,6 @@ X86TargetLowering::X86TargetLowering(const X86TargetMachine &TM,
    MVT PtrVT = MVT::getIntegerVT(8 * TM.getPointerSize());
  
    // Set up the TargetLowering object.
-  static const MVT IntVTs[] = { MVT::i8, MVT::i16, MVT::i32, MVT::i64 };
  
    // X86 is weird. It always uses i8 for shift amounts and setcc results.
    setBooleanContents(ZeroOrOneBooleanContent);
@@ -270,8 +269,7 @@ X86TargetLowering::X86TargetLowering(const X86TargetMachine &TM,
    // (low) operations are left as Legal, as there are single-result
    // instructions for this in x86. Using the two-result multiply instructions
    // when both high and low results are needed must be arranged by dagcombine.
-  for (unsigned i = 0; i != array_lengthof(IntVTs); ++i) {
-    MVT VT = IntVTs[i];
+  for (auto VT : { MVT::i8, MVT::i16, MVT::i32, MVT::i64 }) {
      setOperationAction(ISD::MULHS, VT, Expand);
      setOperationAction(ISD::MULHU, VT, Expand);
      setOperationAction(ISD::SDIV, VT, Expand);
@@ -462,8 +460,7 @@ X86TargetLowering::X86TargetLowering(const X86TargetMachine &TM,
    setOperationAction(ISD::ATOMIC_FENCE  , MVT::Other, Custom);
  
    // Expand certain atomics
-  for (unsigned i = 0; i != array_lengthof(IntVTs); ++i) {
-    MVT VT = IntVTs[i];
+  for (auto VT : { MVT::i8, MVT::i16, MVT::i32, MVT::i64 }) {
      setOperationAction(ISD::ATOMIC_CMP_SWAP_WITH_SUCCESS, VT, Custom);
      setOperationAction(ISD::ATOMIC_LOAD_SUB, VT, Custom);
      setOperationAction(ISD::ATOMIC_STORE, VT, Custom);
@@ -861,14 +858,7 @@ X86TargetLowering::X86TargetLowering(const X86TargetMachine &TM,
      // ISD::CTTZ_ZERO_UNDEF v2i64 - scalarization is faster.
  
      // Custom lower build_vector, vector_shuffle, and extract_vector_elt.
-    for (int i = MVT::v16i8; i != MVT::v2i64; ++i) {
-      MVT VT = (MVT::SimpleValueType)i;
-      // Do not attempt to custom lower non-power-of-2 vectors
-      if (!isPowerOf2_32(VT.getVectorNumElements()))
-        continue;
-      // Do not attempt to custom lower non-128-bit vectors
-      if (!VT.is128BitVector())
-        continue;
+    for (auto VT : { MVT::v16i8, MVT::v8i16, MVT::v4i32 }) {
        setOperationAction(ISD::BUILD_VECTOR,       VT, Custom);
        setOperationAction(ISD::VECTOR_SHUFFLE,     VT, Custom);
        setOperationAction(ISD::VSELECT,            VT, Custom);
@@ -906,13 +896,7 @@ X86TargetLowering::X86TargetLowering(const X86TargetMachine &TM,
      }
  
      // Promote v16i8, v8i16, v4i32 load, select, and, or, xor to v2i64.
-    for (int i = MVT::v16i8; i != MVT::v2i64; ++i) {
-      MVT VT = (MVT::SimpleValueType)i;
-
-      // Do not attempt to promote non-128-bit vectors
-      if (!VT.is128BitVector())
-        continue;
-
+    for (auto VT : { MVT::v16i8, MVT::v8i16, MVT::v4i32 }) {
        setOperationAction(ISD::AND,    VT, Promote);
        AddPromotedToType (ISD::AND,    VT, MVT::v2i64);
        setOperationAction(ISD::OR,     VT, Promote);
@@ -1291,13 +1275,7 @@ X86TargetLowering::X86TargetLowering(const X86TargetMachine &TM,
        setOperationAction(ISD::VSELECT,         MVT::v32i8, Legal);
  
      // Promote v32i8, v16i16, v8i32 select, and, or, xor to v4i64.
-    for (int i = MVT::v32i8; i != MVT::v4i64; ++i) {
-      MVT VT = (MVT::SimpleValueType)i;
-
-      // Do not attempt to promote non-256-bit vectors
-      if (!VT.is256BitVector())
-        continue;
-
+    for (auto VT : { MVT::v32i8, MVT::v16i16, MVT::v8i32 }) {
        setOperationAction(ISD::AND,    VT, Promote);
        AddPromotedToType (ISD::AND,    VT, MVT::v4i64);
        setOperationAction(ISD::OR,     VT, Promote);
@@ -1605,13 +1583,7 @@ X86TargetLowering::X86TargetLowering(const X86TargetMachine &TM,
          setOperationAction(ISD::MSTORE,              VT, Legal);
        }
      }
-    for (int i = MVT::v32i8; i != MVT::v8i64; ++i) {
-      MVT VT = (MVT::SimpleValueType)i;
-
-      // Do not attempt to promote non-512-bit vectors.
-      if (!VT.is512BitVector())
-        continue;
-
+    for (auto VT : { MVT::v64i8, MVT::v32i16, MVT::v16i32 }) {
        setOperationAction(ISD::SELECT, VT, Promote);
        AddPromotedToType (ISD::SELECT, VT, MVT::v8i64);
      }
@@ -1688,19 +1660,9 @@ X86TargetLowering::X86TargetLowering(const X86TargetMachine &TM,
        setOperationAction(ISD::CTLZ_ZERO_UNDEF, MVT::v64i8,  Custom);
      }
  
-    for (int i = MVT::v32i8; i != MVT::v8i64; ++i) {
-      const MVT VT = (MVT::SimpleValueType)i;
-
-      const unsigned EltSize = VT.getVectorElementType().getSizeInBits();
-
-      // Do not attempt to promote non-512-bit vectors.
-      if (!VT.is512BitVector())
-        continue;
-
-      if (EltSize < 32) {
-        setOperationAction(ISD::BUILD_VECTOR,        VT, Custom);
-        setOperationAction(ISD::VSELECT,             VT, Legal);
-      }
+    for (auto VT : { MVT::v64i8, MVT::v32i16 }) {
+      setOperationAction(ISD::BUILD_VECTOR,        VT, Custom);
+      setOperationAction(ISD::VSELECT,             VT, Legal);
      }
    }
  
@@ -1753,9 +1715,10 @@ X86TargetLowering::X86TargetLowering(const X86TargetMachine &TM,
    // FIXME: We really should do custom legalization for addition and
    // subtraction on x86-32 once PR3203 is fixed.  We really can't do much better
    // than generic legalization for 64-bit multiplication-with-overflow, though.
-  for (unsigned i = 0, e = 3+Subtarget->is64Bit(); i != e; ++i) {
+  for (auto VT : { MVT::i8, MVT::i16, MVT::i32, MVT::i64 }) {
+    if (VT == MVT::i64 && !Subtarget->is64Bit())
+      continue;
      // Add/Sub/Mul with overflow operations are custom lowered.
-    MVT VT = IntVTs[i];
      setOperationAction(ISD::SADDO, VT, Custom);
      setOperationAction(ISD::UADDO, VT, Custom);
      setOperationAction(ISD::SSUBO, VT, Custom);
@@ -1862,40 +1825,43 @@ EVT X86TargetLowering::getSetCCResultType(const DataLayout &DL, LLVMContext &,
    if (!VT.isVector())
      return Subtarget->hasAVX512() ? MVT::i1: MVT::i8;
  
-  const unsigned NumElts = VT.getVectorNumElements();
-  const EVT EltVT = VT.getVectorElementType();
-  if (VT.is512BitVector()) {
-    if (Subtarget->hasAVX512())
-      if (EltVT == MVT::i32 || EltVT == MVT::i64 ||
-          EltVT == MVT::f32 || EltVT == MVT::f64)
-        switch(NumElts) {
-        case  8: return MVT::v8i1;
-        case 16: return MVT::v16i1;
-      }
-    if (Subtarget->hasBWI())
-      if (EltVT == MVT::i8 || EltVT == MVT::i16)
-        switch(NumElts) {
-        case 32: return MVT::v32i1;
-        case 64: return MVT::v64i1;
-      }
-  }
+  if (VT.isSimple()) {
+    MVT VVT = VT.getSimpleVT();
+    const unsigned NumElts = VVT.getVectorNumElements();
+    const MVT EltVT = VVT.getVectorElementType();
+    if (VVT.is512BitVector()) {
+      if (Subtarget->hasAVX512())
+        if (EltVT == MVT::i32 || EltVT == MVT::i64 ||
+            EltVT == MVT::f32 || EltVT == MVT::f64)
+          switch(NumElts) {
+          case  8: return MVT::v8i1;
+          case 16: return MVT::v16i1;
+        }
+      if (Subtarget->hasBWI())
+        if (EltVT == MVT::i8 || EltVT == MVT::i16)
+          switch(NumElts) {
+          case 32: return MVT::v32i1;
+          case 64: return MVT::v64i1;
+        }
+    }
  
-  if (VT.is256BitVector() || VT.is128BitVector()) {
-    if (Subtarget->hasVLX())
-      if (EltVT == MVT::i32 || EltVT == MVT::i64 ||
-          EltVT == MVT::f32 || EltVT == MVT::f64)
-        switch(NumElts) {
-        case 2: return MVT::v2i1;
-        case 4: return MVT::v4i1;
-        case 8: return MVT::v8i1;
-      }
-    if (Subtarget->hasBWI() && Subtarget->hasVLX())
-      if (EltVT == MVT::i8 || EltVT == MVT::i16)
-        switch(NumElts) {
-        case  8: return MVT::v8i1;
-        case 16: return MVT::v16i1;
-        case 32: return MVT::v32i1;
-      }
+    if (VVT.is256BitVector() || VVT.is128BitVector()) {
+      if (Subtarget->hasVLX())
+        if (EltVT == MVT::i32 || EltVT == MVT::i64 ||
+            EltVT == MVT::f32 || EltVT == MVT::f64)
+          switch(NumElts) {
+          case 2: return MVT::v2i1;
+          case 4: return MVT::v4i1;
+          case 8: return MVT::v8i1;
+        }
+      if (Subtarget->hasBWI() && Subtarget->hasVLX())
+        if (EltVT == MVT::i8 || EltVT == MVT::i16)
+          switch(NumElts) {
+          case  8: return MVT::v8i1;
+          case 16: return MVT::v16i1;
+          case 32: return MVT::v32i1;
+        }
+    }
    }
  
    return VT.changeVectorElementTypeToInteger();
@@ -2213,7 +2179,7 @@ X86TargetLowering::LowerReturn(SDValue Chain,
      else if (VA.getLocInfo() == CCValAssign::ZExt)
        ValToCopy = DAG.getNode(ISD::ZERO_EXTEND, dl, VA.getLocVT(), ValToCopy);
      else if (VA.getLocInfo() == CCValAssign::AExt) {
-      if (ValVT.isVector() && ValVT.getScalarType() == MVT::i1)
+      if (ValVT.isVector() && ValVT.getVectorElementType() == MVT::i1)
          ValToCopy = DAG.getNode(ISD::SIGN_EXTEND, dl, VA.getLocVT(), ValToCopy);
        else
          ValToCopy = DAG.getNode(ISD::ANY_EXTEND, dl, VA.getLocVT(), ValToCopy);
@@ -2992,7 +2958,7 @@ static SDValue EmitTailCallStoreRetAddr(SelectionDAG &DAG, MachineFunction &MF,
  
  /// Returns a vector_shuffle mask for an movs{s|d}, movd
  /// operation of specified width.
-static SDValue getMOVL(SelectionDAG &DAG, SDLoc dl, EVT VT, SDValue V1,
+static SDValue getMOVL(SelectionDAG &DAG, SDLoc dl, MVT VT, SDValue V1,
                         SDValue V2) {
    unsigned NumElems = VT.getVectorNumElements();
    SmallVector<int, 8> Mask;
@@ -3154,7 +3120,7 @@ X86TargetLowering::LowerCall(TargetLowering::CallLoweringInfo &CLI,
        break;
      case CCValAssign::AExt:
        if (Arg.getValueType().isVector() &&
-          Arg.getValueType().getScalarType() == MVT::i1)
+          Arg.getValueType().getVectorElementType() == MVT::i1)
          Arg = DAG.getNode(ISD::SIGN_EXTEND, dl, RegVT, Arg);
        else if (RegVT.is128BitVector()) {
          // Special case: passing MMX values in XMM registers.
@@ -3878,7 +3844,7 @@ static bool isTargetShuffle(unsigned Opcode) {
    }
  }
  
-static SDValue getTargetShuffleNode(unsigned Opc, SDLoc dl, EVT VT,
+static SDValue getTargetShuffleNode(unsigned Opc, SDLoc dl, MVT VT,
                                      SDValue V1, unsigned TargetMask,
                                      SelectionDAG &DAG) {
    switch(Opc) {
@@ -3893,7 +3859,7 @@ static SDValue getTargetShuffleNode(unsigned Opc, SDLoc dl, EVT VT,
    }
  }
  
-static SDValue getTargetShuffleNode(unsigned Opc, SDLoc dl, EVT VT,
+static SDValue getTargetShuffleNode(unsigned Opc, SDLoc dl, MVT VT,
                                      SDValue V1, SDValue V2, SelectionDAG &DAG) {
    switch(Opc) {
    default: llvm_unreachable("Unknown x86 shuffle node");
@@ -3993,7 +3959,6 @@ static bool isX86CCUnsigned(unsigned X86CC) {
    case X86::COND_BE:    return true;
    case X86::COND_AE:    return true;
    }
-  llvm_unreachable("covered switch fell through?!");
  }
  
  /// Do a one-to-one translation of a ISD::CondCode to the X86-specific
@@ -4241,8 +4206,8 @@ bool X86::isVEXTRACT256Index(SDNode *N) {
  
  static unsigned getExtractVEXTRACTImmediate(SDNode *N, unsigned vecWidth) {
    assert((vecWidth == 128 || vecWidth == 256) && "Unsupported vector width");
-  if (!isa<ConstantSDNode>(N->getOperand(1).getNode()))
-    llvm_unreachable("Illegal extract subvector for VEXTRACT");
+  assert(isa<ConstantSDNode>(N->getOperand(1).getNode()) &&
+         "Illegal extract subvector for VEXTRACT");
  
    uint64_t Index =
      cast<ConstantSDNode>(N->getOperand(1).getNode())->getZExtValue();
@@ -4256,8 +4221,8 @@ static unsigned getExtractVEXTRACTImmediate(SDNode *N, unsigned vecWidth) {
  
  static unsigned getInsertVINSERTImmediate(SDNode *N, unsigned vecWidth) {
    assert((vecWidth == 128 || vecWidth == 256) && "Unsupported vector width");
-  if (!isa<ConstantSDNode>(N->getOperand(2).getNode()))
-    llvm_unreachable("Illegal insert subvector for VINSERT");
+  assert(isa<ConstantSDNode>(N->getOperand(2).getNode()) &&
+         "Illegal insert subvector for VINSERT");
  
    uint64_t Index =
      cast<ConstantSDNode>(N->getOperand(2).getNode())->getZExtValue();
@@ -4311,22 +4276,22 @@ bool X86::isZeroNode(SDValue Elt) {
  // Build a vector of constants
  // Use an UNDEF node if MaskElt == -1.
  // Spilt 64-bit constants in the 32-bit mode.
-static SDValue getConstVector(ArrayRef<int> Values, EVT VT,
+static SDValue getConstVector(ArrayRef<int> Values, MVT VT,
                                SelectionDAG &DAG,
                                SDLoc dl, bool IsMask = false) {
  
    SmallVector<SDValue, 32>  Ops;
    bool Split = false;
  
-  EVT ConstVecVT = VT;
+  MVT ConstVecVT = VT;
    unsigned NumElts = VT.getVectorNumElements();
    bool In64BitMode = DAG.getTargetLoweringInfo().isTypeLegal(MVT::i64);
-  if (!In64BitMode && VT.getScalarType() == MVT::i64) {
+  if (!In64BitMode && VT.getVectorElementType() == MVT::i64) {
      ConstVecVT = MVT::getVectorVT(MVT::i32, NumElts * 2);
      Split = true;
    }
  
-  EVT EltVT = ConstVecVT.getScalarType();
+  MVT EltVT = ConstVecVT.getVectorElementType();
    for (unsigned i = 0; i < NumElts; ++i) {
      bool IsUndef = Values[i] < 0 && IsMask;
      SDValue OpNode = IsUndef ? DAG.getUNDEF(EltVT) :
@@ -4375,7 +4340,7 @@ static SDValue getZeroVector(EVT VT, const X86Subtarget *Subtarget,
        SDValue Ops[] = { Cst, Cst, Cst, Cst, Cst, Cst, Cst, Cst,
                          Cst, Cst, Cst, Cst, Cst, Cst, Cst, Cst };
        Vec = DAG.getNode(ISD::BUILD_VECTOR, dl, MVT::v16i32, Ops);
-  } else if (VT.getScalarType() == MVT::i1) {
+  } else if (VT.getVectorElementType() == MVT::i1) {
  
      assert((Subtarget->hasBWI() || VT.getVectorNumElements() <= 16)
              && "Unexpected vector type");
@@ -4407,19 +4372,18 @@ static SDValue ExtractSubVector(SDValue Vec, unsigned IdxVal,
  
    // Extract the relevant vectorWidth bits.  Generate an EXTRACT_SUBVECTOR
    unsigned ElemsPerChunk = vectorWidth / ElVT.getSizeInBits();
+  assert(isPowerOf2_32(ElemsPerChunk) && "Elements per chunk not power of 2");
  
    // This is the index of the first element of the vectorWidth-bit chunk
-  // we want.
-  unsigned NormalizedIdxVal = (((IdxVal * ElVT.getSizeInBits()) / vectorWidth)
-                               * ElemsPerChunk);
+  // we want. Since ElemsPerChunk is a power of 2 just need to clear bits.
+  IdxVal &= ~(ElemsPerChunk - 1);
  
    // If the input is a buildvector just emit a smaller one.
    if (Vec.getOpcode() == ISD::BUILD_VECTOR)
      return DAG.getNode(ISD::BUILD_VECTOR, dl, ResultVT,
-                       makeArrayRef(Vec->op_begin() + NormalizedIdxVal,
-                                    ElemsPerChunk));
+                       makeArrayRef(Vec->op_begin() + IdxVal, ElemsPerChunk));
  
-  SDValue VecIdx = DAG.getIntPtrConstant(NormalizedIdxVal, dl);
+  SDValue VecIdx = DAG.getIntPtrConstant(IdxVal, dl);
    return DAG.getNode(ISD::EXTRACT_SUBVECTOR, dl, ResultVT, Vec, VecIdx);
  }
  
@@ -4457,13 +4421,13 @@ static SDValue InsertSubVector(SDValue Result, SDValue Vec,
  
    // Insert the relevant vectorWidth bits.
    unsigned ElemsPerChunk = vectorWidth/ElVT.getSizeInBits();
+  assert(isPowerOf2_32(ElemsPerChunk) && "Elements per chunk not power of 2");
  
    // This is the index of the first element of the vectorWidth-bit chunk
-  // we want.
-  unsigned NormalizedIdxVal = (((IdxVal * ElVT.getSizeInBits())/vectorWidth)
-                               * ElemsPerChunk);
+  // we want. Since ElemsPerChunk is a power of 2 just need to clear bits.
+  IdxVal &= ~(ElemsPerChunk - 1);
  
-  SDValue VecIdx = DAG.getIntPtrConstant(NormalizedIdxVal, dl);
+  SDValue VecIdx = DAG.getIntPtrConstant(IdxVal, dl);
    return DAG.getNode(ISD::INSERT_SUBVECTOR, dl, ResultVT, Result, Vec, VecIdx);
  }
  
@@ -4491,7 +4455,7 @@ static SDValue Insert128BitVector(SDValue Result, SDValue Vec, unsigned IdxVal,
                                   Vec, ZeroIndex);
  
      // The blend instruction, and therefore its mask, depend on the data type.
-    MVT ScalarType = ResultVT.getScalarType().getSimpleVT();
+    MVT ScalarType = ResultVT.getVectorElementType().getSimpleVT();
      if (ScalarType.isFloatingPoint()) {
        // Choose either vblendps (float) or vblendpd (double).
        unsigned ScalarSize = ScalarType.getSizeInBits();
@@ -4686,7 +4650,7 @@ static bool getTargetShuffleMask(SDNode *N, MVT VT,
  
      if (MaskNode->getOpcode() == ISD::BUILD_VECTOR) {
        // If we have a build-vector, then things are easy.
-      EVT VT = MaskNode.getValueType();
+      MVT VT = MaskNode.getSimpleValueType();
        assert(VT.isVector() &&
               "Can't produce a non-vector with a build_vector!");
        if (!VT.isInteger())
@@ -4786,8 +4750,8 @@ static bool getTargetShuffleMask(SDNode *N, MVT VT,
      SmallVector<uint64_t, 32> RawMask;
      if (MaskNode->getOpcode() == ISD::BUILD_VECTOR) {
        // If we have a build-vector, then things are easy.
-      assert(MaskNode.getValueType().isInteger() &&
-             MaskNode.getValueType().getVectorNumElements() ==
+      assert(MaskNode.getSimpleValueType().isInteger() &&
+             MaskNode.getSimpleValueType().getVectorNumElements() ==
               VT.getVectorNumElements());
  
        for (unsigned i = 0; i < MaskNode->getNumOperands(); ++i) {
@@ -4847,8 +4811,8 @@ static bool getTargetShuffleMask(SDNode *N, MVT VT,
  
      if (MaskNode->getOpcode() == ISD::BUILD_VECTOR) {
        // If we have a build-vector, then things are easy.
-      assert(MaskNode.getValueType().isInteger() &&
-             MaskNode.getValueType().getVectorNumElements() ==
+      assert(MaskNode.getSimpleValueType().isInteger() &&
+             MaskNode.getSimpleValueType().getVectorNumElements() ==
               VT.getVectorNumElements());
  
        SmallVector<uint64_t, 32> RawMask;
@@ -5918,7 +5882,7 @@ static SDValue ExpandHorizontalBinOp(const SDValue &V0, const SDValue &V1,
  /// node.
  static SDValue LowerToAddSub(const BuildVectorSDNode *BV,
                               const X86Subtarget *Subtarget, SelectionDAG &DAG) {
-  EVT VT = BV->getValueType(0);
+  MVT VT = BV->getSimpleValueType(0);
    if ((!Subtarget->hasSSE3() || (VT != MVT::v4f32 && VT != MVT::v2f64)) &&
        (!Subtarget->hasAVX() || (VT != MVT::v8f32 && VT != MVT::v4f64)))
      return SDValue();
@@ -5980,12 +5944,12 @@ static SDValue LowerToAddSub(const BuildVectorSDNode *BV,
      // Update InVec0 and InVec1.
      if (InVec0.getOpcode() == ISD::UNDEF) {
        InVec0 = Op0.getOperand(0);
-      if (InVec0.getValueType() != VT)
+      if (InVec0.getSimpleValueType() != VT)
          return SDValue();
      }
      if (InVec1.getOpcode() == ISD::UNDEF) {
        InVec1 = Op1.getOperand(0);
-      if (InVec1.getValueType() != VT)
+      if (InVec1.getSimpleValueType() != VT)
          return SDValue();
      }
  
@@ -6021,7 +5985,7 @@ static SDValue LowerToAddSub(const BuildVectorSDNode *BV,
  static SDValue LowerToHorizontalOp(const BuildVectorSDNode *BV,
                                     const X86Subtarget *Subtarget,
                                     SelectionDAG &DAG) {
-  EVT VT = BV->getValueType(0);
+  MVT VT = BV->getSimpleValueType(0);
    unsigned NumElts = VT.getVectorNumElements();
    unsigned NumUndefsLO = 0;
    unsigned NumUndefsHI = 0;
@@ -6163,7 +6127,7 @@ X86TargetLowering::LowerBUILD_VECTOR(SDValue Op, SelectionDAG &DAG) const {
    unsigned NumElems = Op.getNumOperands();
  
    // Generate vectors for predicate vectors.
-  if (VT.getScalarType() == MVT::i1 && Subtarget->hasAVX512())
+  if (VT.getVectorElementType() == MVT::i1 && Subtarget->hasAVX512())
      return LowerBUILD_VECTORvXi1(Op, DAG);
  
    // Vectors containing all zeros can be matched by pxor and xorps later
@@ -6237,7 +6201,7 @@ X86TargetLowering::LowerBUILD_VECTOR(SDValue Op, SelectionDAG &DAG) const {
        if (DAG.MaskedValueIsZero(Item, APInt::getBitsSet(64, 32, 64))) {
          // Handle SSE only.
          assert(VT == MVT::v2i64 && "Expected an SSE value type!");
-        EVT VecVT = MVT::v4i32;
+        MVT VecVT = MVT::v4i32;
  
          // Truncate the value (which may itself be a constant) to i32, and
          // convert it to a vector with movd (S2V+shuffle to zero extend).
@@ -6511,8 +6475,8 @@ static SDValue LowerAVXCONCAT_VECTORS(SDValue Op, SelectionDAG &DAG) {
      return Concat128BitVectors(V1, V2, ResVT, NumElems, DAG, dl);
  
    if (Op.getNumOperands() == 4) {
-    MVT HalfVT = MVT::getVectorVT(ResVT.getScalarType(),
-                                ResVT.getVectorNumElements()/2);
+    MVT HalfVT = MVT::getVectorVT(ResVT.getVectorElementType(),
+                                  ResVT.getVectorNumElements()/2);
      SDValue V3 = Op.getOperand(2);
      SDValue V4 = Op.getOperand(3);
      return Concat256BitVectors(Concat128BitVectors(V1, V2, HalfVT, NumElems/2, DAG, dl),
@@ -6532,7 +6496,7 @@ static SDValue LowerCONCAT_VECTORSvXi1(SDValue Op,
           "Unexpected number of operands in CONCAT_VECTORS");
  
    if (NumOfOperands > 2) {
-    MVT HalfVT = MVT::getVectorVT(ResVT.getScalarType(),
+    MVT HalfVT = MVT::getVectorVT(ResVT.getVectorElementType(),
                                    ResVT.getVectorNumElements()/2);
      SmallVector<SDValue, 2> Ops;
      for (unsigned i = 0; i < NumOfOperands/2; i++)
@@ -6825,7 +6789,7 @@ static SDValue lowerVectorShuffleWithUNPCK(SDLoc DL, MVT VT, ArrayRef<int> Mask,
  static SDValue lowerVectorShuffleAsBitMask(SDLoc DL, MVT VT, SDValue V1,
                                             SDValue V2, ArrayRef<int> Mask,
                                             SelectionDAG &DAG) {
-  MVT EltVT = VT.getScalarType();
+  MVT EltVT = VT.getVectorElementType();
    int NumEltBits = EltVT.getSizeInBits();
    MVT IntEltVT = MVT::getIntegerVT(NumEltBits);
    SDValue Zero = DAG.getConstant(0, DL, IntEltVT);
@@ -6869,7 +6833,7 @@ static SDValue lowerVectorShuffleAsBitBlend(SDLoc DL, MVT VT, SDValue V1,
                                              SDValue V2, ArrayRef<int> Mask,
                                              SelectionDAG &DAG) {
    assert(VT.isInteger() && "Only supports integer vector types!");
-  MVT EltVT = VT.getScalarType();
+  MVT EltVT = VT.getVectorElementType();
    int NumEltBits = EltVT.getSizeInBits();
    SDValue Zero = DAG.getConstant(0, DL, EltVT);
    SDValue AllOnes = DAG.getConstant(APInt::getAllOnesValue(NumEltBits), DL,
@@ -6896,22 +6860,62 @@ static SDValue lowerVectorShuffleAsBitBlend(SDLoc DL, MVT VT, SDValue V1,
  /// This doesn't do any checks for the availability of instructions for blending
  /// these values. It relies on the availability of the X86ISD::BLENDI pattern to
  /// be matched in the backend with the type given. What it does check for is
-/// that the shuffle mask is in fact a blend.
+/// that the shuffle mask is a blend, or convertible into a blend with zero.
  static SDValue lowerVectorShuffleAsBlend(SDLoc DL, MVT VT, SDValue V1,
-                                         SDValue V2, ArrayRef<int> Mask,
+                                         SDValue V2, ArrayRef<int> Original,
                                           const X86Subtarget *Subtarget,
                                           SelectionDAG &DAG) {
+  bool V1IsZero = ISD::isBuildVectorAllZeros(V1.getNode());
+  bool V2IsZero = ISD::isBuildVectorAllZeros(V2.getNode());
+  SmallVector<int, 8> Mask(Original.begin(), Original.end());
+  SmallBitVector Zeroable = computeZeroableShuffleElements(Mask, V1, V2);
+  bool ForceV1Zero = false, ForceV2Zero = false;
+
+  // Attempt to generate the binary blend mask. If an input is zero then
+  // we can use any lane.
+  // TODO: generalize the zero matching to any scalar like isShuffleEquivalent.
    unsigned BlendMask = 0;
    for (int i = 0, Size = Mask.size(); i < Size; ++i) {
-    if (Mask[i] >= Size) {
-      if (Mask[i] != i + Size)
-        return SDValue(); // Shuffled V2 input!
+    int M = Mask[i];
+    if (M < 0)
+      continue;
+    if (M == i)
+      continue;
+    if (M == i + Size) {
        BlendMask |= 1u << i;
        continue;
      }
-    if (Mask[i] >= 0 && Mask[i] != i)
-      return SDValue(); // Shuffled V1 input!
+    if (Zeroable[i]) {
+      if (V1IsZero) {
+        ForceV1Zero = true;
+        Mask[i] = i;
+        continue;
+      }
+      if (V2IsZero) {
+        ForceV2Zero = true;
+        BlendMask |= 1u << i;
+        Mask[i] = i + Size;
+        continue;
+      }
+    }
+    return SDValue(); // Shuffled input!
    }
+
+  // Create a REAL zero vector - ISD::isBuildVectorAllZeros allows UNDEFs.
+  if (ForceV1Zero)
+    V1 = getZeroVector(VT, Subtarget, DAG, DL);
+  if (ForceV2Zero)
+    V2 = getZeroVector(VT, Subtarget, DAG, DL);
+
+  auto ScaleBlendMask = [](unsigned BlendMask, int Size, int Scale) {
+    unsigned ScaledMask = 0;
+    for (int i = 0; i != Size; ++i)
+      if (BlendMask & (1u << i))
+        for (int j = 0; j != Scale; ++j)
+          ScaledMask |= 1u << (i * Scale + j);
+    return ScaledMask;
+  };
+
    switch (VT.SimpleTy) {
    case MVT::v2f64:
    case MVT::v4f32:
@@ -6931,12 +6935,7 @@ static SDValue lowerVectorShuffleAsBlend(SDLoc DL, MVT VT, SDValue V1,
      if (Subtarget->hasAVX2()) {
        // Scale the blend by the number of 32-bit dwords per element.
        int Scale =  VT.getScalarSizeInBits() / 32;
-      BlendMask = 0;
-      for (int i = 0, Size = Mask.size(); i < Size; ++i)
-        if (Mask[i] >= Size)
-          for (int j = 0; j < Scale; ++j)
-            BlendMask |= 1u << (i * Scale + j);
-
+      BlendMask = ScaleBlendMask(BlendMask, Mask.size(), Scale);
        MVT BlendVT = VT.getSizeInBits() > 128 ? MVT::v8i32 : MVT::v4i32;
        V1 = DAG.getBitcast(BlendVT, V1);
        V2 = DAG.getBitcast(BlendVT, V2);
@@ -6949,12 +6948,7 @@ static SDValue lowerVectorShuffleAsBlend(SDLoc DL, MVT VT, SDValue V1,
      // For integer shuffles we need to expand the mask and cast the inputs to
      // v8i16s prior to blending.
      int Scale = 8 / VT.getVectorNumElements();
-    BlendMask = 0;
-    for (int i = 0, Size = Mask.size(); i < Size; ++i)
-      if (Mask[i] >= Size)
-        for (int j = 0; j < Scale; ++j)
-          BlendMask |= 1u << (i * Scale + j);
-
+    BlendMask = ScaleBlendMask(BlendMask, Mask.size(), Scale);
      V1 = DAG.getBitcast(MVT::v8i16, V1);
      V2 = DAG.getBitcast(MVT::v8i16, V2);
      return DAG.getBitcast(VT,
@@ -6979,7 +6973,7 @@ static SDValue lowerVectorShuffleAsBlend(SDLoc DL, MVT VT, SDValue V1,
      // FALLTHROUGH
    case MVT::v16i8:
    case MVT::v32i8: {
-    assert((VT.getSizeInBits() == 128 || Subtarget->hasAVX2()) &&
+    assert((VT.is128BitVector() || Subtarget->hasAVX2()) &&
             "256-bit byte-blends require AVX2 support!");
  
      // Attempt to lower to a bitmask if we can. VPAND is faster than VPBLENDVB.
@@ -7206,7 +7200,7 @@ static SDValue lowerVectorShuffleAsByteRotate(SDLoc DL, MVT VT, SDValue V1,
                          DAG.getConstant(Rotation * Scale, DL, MVT::i8)));
    }
  
-  assert(VT.getSizeInBits() == 128 &&
+  assert(VT.is128BitVector() &&
           "Rotate-based lowering only supports 128-bit lowering!");
    assert(Mask.size() <= 16 &&
           "Can shuffle at most 16 bytes in a 128-bit vector!");
@@ -7494,7 +7488,7 @@ static SDValue lowerVectorShuffleAsSpecificZeroOrAnyExtend(
    if (Subtarget->hasSSE41()) {
      // Not worth offseting 128-bit vectors if scale == 2, a pattern using
      // PUNPCK will catch this in a later shuffle match.
-    if (Offset && Scale == 2 && VT.getSizeInBits() == 128)
+    if (Offset && Scale == 2 && VT.is128BitVector())
        return SDValue();
      MVT ExtVT = MVT::getVectorVT(MVT::getIntegerVT(EltBits * Scale),
                                   NumElements / Scale);
@@ -7502,7 +7496,7 @@ static SDValue lowerVectorShuffleAsSpecificZeroOrAnyExtend(
      return DAG.getBitcast(VT, InputV);
    }
  
-  assert(VT.getSizeInBits() == 128 && "Only 128-bit vectors can be extended.");
+  assert(VT.is128BitVector() && "Only 128-bit vectors can be extended.");
  
    // For any extends we can cheat for larger element sizes and use shuffle
    // instructions that can fold with a load and/or copy.
@@ -7532,7 +7526,7 @@ static SDValue lowerVectorShuffleAsSpecificZeroOrAnyExtend(
    // to 64-bits.
    if ((Scale * EltBits) == 64 && EltBits < 32 && Subtarget->hasSSE4A()) {
      assert(NumElements == (int)Mask.size() && "Unexpected shuffle mask size!");
-    assert(VT.getSizeInBits() == 128 && "Unexpected vector width!");
+    assert(VT.is128BitVector() && "Unexpected vector width!");
  
      int LoIdx = Offset * EltBits;
      SDValue Lo = DAG.getNode(ISD::BITCAST, DL, MVT::v2i64,
@@ -7917,7 +7911,7 @@ static SDValue lowerVectorShuffleAsBroadcast(SDLoc DL, MVT VT, SDValue V,
  
        int BeginIdx = (int)ConstantIdx->getZExtValue();
        int EndIdx =
-          BeginIdx + (int)VInner.getValueType().getVectorNumElements();
+          BeginIdx + (int)VInner.getSimpleValueType().getVectorNumElements();
        if (BroadcastIdx >= BeginIdx && BroadcastIdx < EndIdx) {
          BroadcastIdx -= BeginIdx;
          V = VInner;
@@ -7936,9 +7930,9 @@ static SDValue lowerVectorShuffleAsBroadcast(SDLoc DL, MVT VT, SDValue V,
    // type than the shuffle, the broadcast element is in essence truncated.
    // Make that explicit to ease folding.
    if (V.getOpcode() == ISD::BITCAST && VT.isInteger()) {
-    EVT EltVT = VT.getVectorElementType();
+    MVT EltVT = VT.getVectorElementType();
      SDValue V0 = V.getOperand(0);
-    EVT V0VT = V0.getValueType();
+    MVT V0VT = V0.getSimpleValueType();
  
      if (V0VT.isInteger() && V0VT.getVectorElementType().bitsGT(EltVT) &&
          ((V0.getOpcode() == ISD::BUILD_VECTOR ||
@@ -8665,7 +8659,7 @@ static SDValue lowerV4I32VectorShuffle(SDValue Op, SDValue V1, SDValue V2,
  static SDValue lowerV8I16GeneralSingleInputVectorShuffle(
      SDLoc DL, MVT VT, SDValue V, MutableArrayRef<int> Mask,
      const X86Subtarget *Subtarget, SelectionDAG &DAG) {
-  assert(VT.getScalarType() == MVT::i16 && "Bad input type!");
+  assert(VT.getVectorElementType() == MVT::i16 && "Bad input type!");
    MVT PSHUFDVT = MVT::getVectorVT(MVT::i32, VT.getVectorNumElements() / 2);
  
    assert(Mask.size() == 8 && "Shuffle mask length doen't match!");
@@ -9739,7 +9733,7 @@ static SDValue splitAndLowerVectorShuffle(SDLoc DL, MVT VT, SDValue V1,
  
    int NumElements = VT.getVectorNumElements();
    int SplitNumElements = NumElements / 2;
-  MVT ScalarVT = VT.getScalarType();
+  MVT ScalarVT = VT.getVectorElementType();
    MVT SplitVT = MVT::getVectorVT(ScalarVT, NumElements / 2);
  
    // Rather than splitting build-vectors, just build two narrower build
@@ -9751,7 +9745,7 @@ static SDValue splitAndLowerVectorShuffle(SDLoc DL, MVT VT, SDValue V1,
      MVT OrigVT = V.getSimpleValueType();
      int OrigNumElements = OrigVT.getVectorNumElements();
      int OrigSplitNumElements = OrigNumElements / 2;
-    MVT OrigScalarVT = OrigVT.getScalarType();
+    MVT OrigScalarVT = OrigVT.getVectorElementType();
      MVT OrigSplitVT = MVT::getVectorVT(OrigScalarVT, OrigNumElements / 2);
  
      SDValue LoV, HiV;
@@ -9921,7 +9915,7 @@ static SDValue lowerVectorShuffleAsLanePermuteAndBlend(SDLoc DL, MVT VT,
                                                         ArrayRef<int> Mask,
                                                         SelectionDAG &DAG) {
    // FIXME: This should probably be generalized for 512-bit vectors as well.
-  assert(VT.getSizeInBits() == 256 && "Only for 256-bit vector shuffles!");
+  assert(VT.is256BitVector() && "Only for 256-bit vector shuffles!");
    int LaneSize = Mask.size() / 2;
  
    // If there are only inputs from one 128-bit lane, splitting will in fact be
@@ -10736,16 +10730,15 @@ static SDValue lower256BitVectorShuffle(SDValue Op, SDValue V1, SDValue V2,
  
  /// \brief Try to lower a vector shuffle as a 128-bit shuffles.
  static SDValue lowerV4X128VectorShuffle(SDLoc DL, MVT VT,
-                                             ArrayRef<int> Mask,
-                                             SDValue V1, SDValue V2,
-                                             SelectionDAG &DAG) {
+                                        ArrayRef<int> Mask,
+                                        SDValue V1, SDValue V2,
+                                        SelectionDAG &DAG) {
    assert(VT.getScalarSizeInBits() == 64 &&
           "Unexpected element type size for 128bit shuffle.");
  
    // To handle 256 bit vector requires VLX and most probably
    // function lowerV2X128VectorShuffle() is better solution.
-  assert(VT.getSizeInBits() == 512 &&
-         "Unexpected vector size for 128bit shuffle.");
+  assert(VT.is512BitVector() && "Unexpected vector size for 128bit shuffle.");
  
    SmallVector<int, 4> WidenedMask;
    if (!canWidenShuffleElements(Mask, WidenedMask))
@@ -10810,8 +10803,8 @@ static SDValue lowerV8F64VectorShuffle(SDValue Op, SDValue V1, SDValue V2,
  
  /// \brief Handle lowering of 16-lane 32-bit floating point shuffles.
  static SDValue lowerV16F32VectorShuffle(SDValue Op, SDValue V1, SDValue V2,
-                                       const X86Subtarget *Subtarget,
-                                       SelectionDAG &DAG) {
+                                        const X86Subtarget *Subtarget,
+                                        SelectionDAG &DAG) {
    SDLoc DL(Op);
    assert(V1.getSimpleValueType() == MVT::v16f32 && "Bad operand type!");
    assert(V2.getSimpleValueType() == MVT::v16f32 && "Bad operand type!");
@@ -10850,8 +10843,8 @@ static SDValue lowerV8I64VectorShuffle(SDValue Op, SDValue V1, SDValue V2,
  
  /// \brief Handle lowering of 16-lane 32-bit integer shuffles.
  static SDValue lowerV16I32VectorShuffle(SDValue Op, SDValue V1, SDValue V2,
-                                       const X86Subtarget *Subtarget,
-                                       SelectionDAG &DAG) {
+                                        const X86Subtarget *Subtarget,
+                                        SelectionDAG &DAG) {
    SDLoc DL(Op);
    assert(V1.getSimpleValueType() == MVT::v16i32 && "Bad operand type!");
    assert(V2.getSimpleValueType() == MVT::v16i32 && "Bad operand type!");
@@ -10958,7 +10951,7 @@ static SDValue lower1BitVectorShuffle(SDValue Op, SDValue V1, SDValue V2,
    ArrayRef<int> Mask = SVOp->getMask();
    assert(Subtarget->hasAVX512() &&
           "Cannot lower 512-bit vectors w/o basic ISA!");
-  EVT ExtVT;
+  MVT ExtVT;
    switch (VT.SimpleTy) {
    default:
      llvm_unreachable("Expected a vector of i1 elements");
@@ -11016,7 +11009,7 @@ static SDValue lowerVectorShuffle(SDValue Op, const X86Subtarget *Subtarget,
    MVT VT = Op.getSimpleValueType();
    int NumElements = VT.getVectorNumElements();
    SDLoc dl(Op);
-  bool Is1BitVector = (VT.getScalarType() == MVT::i1);
+  bool Is1BitVector = (VT.getVectorElementType() == MVT::i1);
  
    assert((VT.getSizeInBits() != 64 || Is1BitVector) &&
           "Can't lower MMX shuffles");
@@ -11125,13 +11118,13 @@ static SDValue lowerVectorShuffle(SDValue Op, const X86Subtarget *Subtarget,
    }
  
    // For each vector width, delegate to a specialized lowering routine.
-  if (VT.getSizeInBits() == 128)
+  if (VT.is128BitVector())
      return lower128BitVectorShuffle(Op, V1, V2, VT, Subtarget, DAG);
  
-  if (VT.getSizeInBits() == 256)
+  if (VT.is256BitVector())
      return lower256BitVectorShuffle(Op, V1, V2, VT, Subtarget, DAG);
  
-  if (VT.getSizeInBits() == 512)
+  if (VT.is512BitVector())
      return lower512BitVectorShuffle(Op, V1, V2, VT, Subtarget, DAG);
  
    if (Is1BitVector)
@@ -11395,10 +11388,11 @@ X86TargetLowering::LowerEXTRACT_VECTOR_ELT(SDValue Op,
      MVT EltVT = VecVT.getVectorElementType();
  
      unsigned ElemsPerChunk = 128 / EltVT.getSizeInBits();
+    assert(isPowerOf2_32(ElemsPerChunk) && "Elements per chunk not power of 2");
  
-    //if (IdxVal >= NumElems/2)
-    //  IdxVal -= NumElems/2;
-    IdxVal -= (IdxVal/ElemsPerChunk)*ElemsPerChunk;
+    // Find IdxVal modulo ElemsPerChunk. Since ElemsPerChunk is a power of 2
+    // this can be done with a mask.
+    IdxVal &= ElemsPerChunk - 1;
      return DAG.getNode(ISD::EXTRACT_VECTOR_ELT, dl, Op.getValueType(), Vec,
                         DAG.getConstant(IdxVal, dl, MVT::i32));
    }
@@ -11534,7 +11528,9 @@ SDValue X86TargetLowering::LowerINSERT_VECTOR_ELT(SDValue Op,
  
      // Insert the element into the desired chunk.
      unsigned NumEltsIn128 = 128 / EltVT.getSizeInBits();
-    unsigned IdxIn128 = IdxVal - (IdxVal / NumEltsIn128) * NumEltsIn128;
+    assert(isPowerOf2_32(NumEltsIn128));
+    // Since NumEltsIn128 is a power of 2 we can use mask instead of modulo.
+    unsigned IdxIn128 = IdxVal & (NumEltsIn128 - 1);
  
      V = DAG.getNode(ISD::INSERT_VECTOR_ELT, dl, V.getValueType(), V, N1,
                      DAG.getConstant(IdxIn128, dl, MVT::i32));
@@ -12512,7 +12508,7 @@ SDValue X86TargetLowering::LowerUINT_TO_FP_i32(SDValue Op,
    SDValue Sub = DAG.getNode(ISD::FSUB, dl, MVT::f64, Or, Bias);
  
    // Handle final rounding.
-  EVT DestVT = Op.getValueType();
+  MVT DestVT = Op.getSimpleValueType();
  
    if (DestVT.bitsLT(MVT::f64))
      return DAG.getNode(ISD::FP_ROUND, dl, DestVT, Sub,
@@ -12549,12 +12545,12 @@ static SDValue lowerUINT_TO_FP_vXi32(SDValue Op, SelectionDAG &DAG,
  
    SDLoc DL(Op);
    SDValue V = Op->getOperand(0);
-  EVT VecIntVT = V.getValueType();
+  MVT VecIntVT = V.getSimpleValueType();
    bool Is128 = VecIntVT == MVT::v4i32;
-  EVT VecFloatVT = Is128 ? MVT::v4f32 : MVT::v8f32;
+  MVT VecFloatVT = Is128 ? MVT::v4f32 : MVT::v8f32;
    // If we convert to something else than the supported type, e.g., to v4f64,
    // abort early.
-  if (VecFloatVT != Op->getValueType(0))
+  if (VecFloatVT != Op->getSimpleValueType(0))
      return SDValue();
  
    unsigned NumElts = VecIntVT.getVectorNumElements();
@@ -12592,7 +12588,7 @@ static SDValue lowerUINT_TO_FP_vXi32(SDValue Op, SelectionDAG &DAG,
  
    SDValue Low, High;
    if (Subtarget.hasSSE41()) {
-    EVT VecI16VT = Is128 ? MVT::v8i16 : MVT::v16i16;
+    MVT VecI16VT = Is128 ? MVT::v8i16 : MVT::v16i16;
      //     uint4 lo = _mm_blend_epi16( v, (uint4) 0x4b000000, 0xaa);
      SDValue VecCstLowBitcast = DAG.getBitcast(VecI16VT, VecCstLow);
      SDValue VecBitcast = DAG.getBitcast(VecI16VT, V);
@@ -12660,11 +12656,10 @@ SDValue X86TargetLowering::lowerUINT_TO_FP_vec(SDValue Op,
      return lowerUINT_TO_FP_vXi32(Op, DAG, *Subtarget);
    case MVT::v16i8:
    case MVT::v16i16:
-    if (Subtarget->hasAVX512())
-      return DAG.getNode(ISD::UINT_TO_FP, dl, Op.getValueType(),
-                         DAG.getNode(ISD::ZERO_EXTEND, dl, MVT::v16i32, N0));
+    assert(Subtarget->hasAVX512());
+    return DAG.getNode(ISD::UINT_TO_FP, dl, Op.getValueType(),
+                       DAG.getNode(ISD::ZERO_EXTEND, dl, MVT::v16i32, N0));
    }
-  llvm_unreachable(nullptr);
  }
  
  SDValue X86TargetLowering::LowerUINT_TO_FP(SDValue Op,
@@ -12673,7 +12668,7 @@ SDValue X86TargetLowering::LowerUINT_TO_FP(SDValue Op,
    SDLoc dl(Op);
    auto PtrVT = getPointerTy(DAG.getDataLayout());
  
-  if (Op.getValueType().isVector())
+  if (Op.getSimpleValueType().isVector())
      return lowerUINT_TO_FP_vec(Op, DAG);
  
    // Since UINT_TO_FP is legal (it's marked custom), dag combiner won't
@@ -12960,7 +12955,7 @@ static SDValue LowerAVXExtend(SDValue Op, SelectionDAG &DAG,
    MVT InVT = In.getSimpleValueType();
    SDLoc dl(Op);
  
-  if (VT.is512BitVector() || InVT.getScalarType() == MVT::i1)
+  if (VT.is512BitVector() || InVT.getVectorElementType() == MVT::i1)
      return DAG.getNode(ISD::ZERO_EXTEND, dl, VT, In);
  
    // Optimize vectors in AVX mode:
@@ -13105,10 +13100,13 @@ SDValue X86TargetLowering::LowerTRUNCATE(SDValue Op, SelectionDAG &DAG) const {
    }
  
    // vpmovqb/w/d, vpmovdb/w, vpmovwb
-  if (((!InVT.is512BitVector() && Subtarget->hasVLX()) || InVT.is512BitVector()) &&
-      (InVT.getVectorElementType() != MVT::i16 || Subtarget->hasBWI()))
+  if (Subtarget->hasAVX512()) {
+    // word to byte only under BWI
+    if (InVT == MVT::v16i16 && !Subtarget->hasBWI()) // v16i16 -> v16i8
+      return DAG.getNode(X86ISD::VTRUNC, DL, VT,
+                         DAG.getNode(X86ISD::VSEXT, DL, MVT::v16i32, In));
      return DAG.getNode(X86ISD::VTRUNC, DL, VT, In);
-
+  }
    if ((VT == MVT::v4i32) && (InVT == MVT::v4i64)) {
      // On AVX2, v4i64 -> v4i32 becomes VPERMD.
      if (Subtarget->hasInt256()) {
@@ -13495,7 +13493,7 @@ static SDValue LowerVectorAllZeroTest(SDValue Op, const X86Subtarget *Subtarget,
        return SDValue();
    }
  
-  EVT TestVT = VT.is128BitVector() ? MVT::v2i64 : MVT::v4i64;
+  MVT TestVT = VT.is128BitVector() ? MVT::v2i64 : MVT::v4i64;
  
    // Cast all vectors into TestVT for PTEST.
    for (unsigned i = 0, e = VecIns.size(); i < e; ++i)
@@ -13775,8 +13773,8 @@ SDValue X86TargetLowering::EmitCmp(SDValue Op0, SDValue Op1, unsigned X86CC,
      if (C->getAPIntValue() == 0)
        return EmitTest(Op0, X86CC, dl, DAG);
  
-     if (Op0.getValueType() == MVT::i1)
-       llvm_unreachable("Unexpected comparison operation for MVT::i1 operands");
+     assert(Op0.getValueType() != MVT::i1 &&
+            "Unexpected comparison operation for MVT::i1 operands");
    }
  
    if ((Op0.getValueType() == MVT::i8 || Op0.getValueType() == MVT::i16 ||
@@ -14058,7 +14056,7 @@ static SDValue LowerBoolVSETCC_AVX512(SDValue Op, SelectionDAG &DAG) {
    MVT VT = Op.getSimpleValueType();
    SDLoc dl(Op);
  
-  assert(Op0.getValueType().getVectorElementType() == MVT::i1 &&
+  assert(Op0.getSimpleValueType().getVectorElementType() == MVT::i1 &&
           "Unexpected type for boolean compare operation");
    ISD::CondCode SetCCOpcode = cast<CondCodeSDNode>(CC)->get();
    SDValue NotOp0 = DAG.getNode(ISD::XOR, dl, VT, Op0,
@@ -14102,8 +14100,8 @@ static SDValue LowerIntVSETCC_AVX512(SDValue Op, SelectionDAG &DAG,
    MVT VT = Op.getSimpleValueType();
    SDLoc dl(Op);
  
-  assert(Op0.getValueType().getVectorElementType().getSizeInBits() >= 8 &&
-         Op.getValueType().getScalarType() == MVT::i1 &&
+  assert(Op0.getSimpleValueType().getVectorElementType().getSizeInBits() >= 8 &&
+         Op.getSimpleValueType().getVectorElementType() == MVT::i1 &&
           "Cannot set masked compare for this operation");
  
    ISD::CondCode SetCCOpcode = cast<CondCodeSDNode>(CC)->get();
@@ -14150,7 +14148,7 @@ static SDValue ChangeVSETULTtoVSETULE(SDLoc dl, SDValue Op1, SelectionDAG &DAG)
  
    for (unsigned i = 0; i < n; ++i) {
      ConstantSDNode *Elt = dyn_cast<ConstantSDNode>(BV->getOperand(i));
-    if (!Elt || Elt->isOpaque() || Elt->getValueType(0) != EVT)
+    if (!Elt || Elt->isOpaque() || Elt->getSimpleValueType(0) != EVT)
        return SDValue();
  
      // Avoid underflow.
@@ -14241,13 +14239,13 @@ static SDValue LowerVSETCC(SDValue Op, const X86Subtarget *Subtarget,
    if (VT.is256BitVector() && !Subtarget->hasInt256())
      return Lower256IntVSETCC(Op, DAG);
  
-  EVT OpVT = Op1.getValueType();
+  MVT OpVT = Op1.getSimpleValueType();
    if (OpVT.getVectorElementType() == MVT::i1)
      return LowerBoolVSETCC_AVX512(Op, DAG);
  
    bool MaskResult = (VT.getVectorElementType() == MVT::i1);
    if (Subtarget->hasAVX512()) {
-    if (Op1.getValueType().is512BitVector() ||
+    if (Op1.getSimpleValueType().is512BitVector() ||
          (Subtarget->hasBWI() && Subtarget->hasVLX()) ||
          (MaskResult && OpVT.getVectorElementType().getSizeInBits() >= 32))
        return LowerIntVSETCC_AVX512(Op, DAG, Subtarget);
@@ -14439,7 +14437,7 @@ static SDValue LowerVSETCC(SDValue Op, const X86Subtarget *Subtarget,
    // Since SSE has no unsigned integer comparisons, we need to flip the sign
    // bits of the inputs before performing those operations.
    if (FlipSigns) {
-    EVT EltVT = VT.getVectorElementType();
+    MVT EltVT = VT.getVectorElementType();
      SDValue SB = DAG.getConstant(APInt::getSignBit(EltVT.getSizeInBits()), dl,
                                   VT);
      Op0 = DAG.getNode(ISD::XOR, dl, VT, Op0, SB);
@@ -14580,7 +14578,7 @@ SDValue X86TargetLowering::LowerSELECT(SDValue Op, SelectionDAG &DAG) const {
    SDValue Op1 = Op.getOperand(1);
    SDValue Op2 = Op.getOperand(2);
    SDLoc DL(Op);
-  EVT VT = Op1.getValueType();
+  MVT VT = Op1.getSimpleValueType();
    SDValue CC;
  
    // Lower FP selects into a CMP/AND/ANDN/OR sequence when the necessary SSE ops
@@ -14589,7 +14587,7 @@ SDValue X86TargetLowering::LowerSELECT(SDValue Op, SelectionDAG &DAG) const {
    if (Cond.getOpcode() == ISD::SETCC &&
        ((Subtarget->hasSSE2() && (VT == MVT::f32 || VT == MVT::f64)) ||
         (Subtarget->hasSSE1() && VT == MVT::f32)) &&
-      VT == Cond.getOperand(0).getValueType() && Cond->hasOneUse()) {
+      VT == Cond.getOperand(0).getSimpleValueType() && Cond->hasOneUse()) {
      SDValue CondOp0 = Cond.getOperand(0), CondOp1 = Cond.getOperand(1);
      int SSECC = translateX86FSETCC(
          cast<CondCodeSDNode>(Cond.getOperand(2))->get(), CondOp0, CondOp1);
@@ -14623,12 +14621,12 @@ SDValue X86TargetLowering::LowerSELECT(SDValue Op, SelectionDAG &DAG) const {
          // Convert to vectors, do a VSELECT, and convert back to scalar.
          // All of the conversions should be optimized away.
  
-        EVT VecVT = VT == MVT::f32 ? MVT::v4f32 : MVT::v2f64;
+        MVT VecVT = VT == MVT::f32 ? MVT::v4f32 : MVT::v2f64;
          SDValue VOp1 = DAG.getNode(ISD::SCALAR_TO_VECTOR, DL, VecVT, Op1);
          SDValue VOp2 = DAG.getNode(ISD::SCALAR_TO_VECTOR, DL, VecVT, Op2);
          SDValue VCmp = DAG.getNode(ISD::SCALAR_TO_VECTOR, DL, VecVT, Cmp);
  
-        EVT VCmpVT = VT == MVT::f32 ? MVT::v4i32 : MVT::v2i64;
+        MVT VCmpVT = VT == MVT::f32 ? MVT::v4i32 : MVT::v2i64;
          VCmp = DAG.getBitcast(VCmpVT, VCmp);
  
          SDValue VSel = DAG.getNode(ISD::VSELECT, DL, VecVT, VCmp, VOp1, VOp2);
@@ -14642,7 +14640,7 @@ SDValue X86TargetLowering::LowerSELECT(SDValue Op, SelectionDAG &DAG) const {
      }
    }
  
-  if (VT.isVector() && VT.getScalarType() == MVT::i1) {
+  if (VT.isVector() && VT.getVectorElementType() == MVT::i1) {
      SDValue Op1Scalar;
      if (ISD::isBuildVectorOfConstantSDNodes(Op1.getNode()))
        Op1Scalar = ConvertI1VectorToInteger(Op1, DAG);
@@ -14918,8 +14916,8 @@ static SDValue LowerSIGN_EXTEND_VECTOR_INREG(SDValue Op,
    MVT InVT = In.getSimpleValueType();
    assert(VT.getSizeInBits() == InVT.getSizeInBits());
  
-  MVT InSVT = InVT.getScalarType();
-  assert(VT.getScalarType().getScalarSizeInBits() > InSVT.getScalarSizeInBits());
+  MVT InSVT = InVT.getVectorElementType();
+  assert(VT.getVectorElementType().getSizeInBits() > InSVT.getSizeInBits());
  
    if (VT != MVT::v2i64 && VT != MVT::v4i32 && VT != MVT::v8i16)
      return SDValue();
@@ -14938,7 +14936,7 @@ static SDValue LowerSIGN_EXTEND_VECTOR_INREG(SDValue Op,
  
    // As SRAI is only available on i16/i32 types, we expand only up to i32
    // and handle i64 separately.
-  while (CurrVT != VT && CurrVT.getScalarType() != MVT::i32) {
+  while (CurrVT != VT && CurrVT.getVectorElementType() != MVT::i32) {
      Curr = DAG.getNode(X86ISD::UNPCKL, dl, CurrVT, DAG.getUNDEF(CurrVT), Curr);
      MVT CurrSVT = MVT::getIntegerVT(CurrVT.getScalarSizeInBits() * 2);
      CurrVT = MVT::getVectorVT(CurrSVT, CurrVT.getVectorNumElements() / 2);
@@ -14948,7 +14946,7 @@ static SDValue LowerSIGN_EXTEND_VECTOR_INREG(SDValue Op,
    SDValue SignExt = Curr;
    if (CurrVT != InVT) {
      unsigned SignExtShift =
-        CurrVT.getScalarSizeInBits() - InSVT.getScalarSizeInBits();
+        CurrVT.getVectorElementType().getSizeInBits() - InSVT.getSizeInBits();
      SignExt = DAG.getNode(X86ISD::VSRAI, dl, CurrVT, Curr,
                            DAG.getConstant(SignExtShift, dl, MVT::i8));
    }
@@ -15008,7 +15006,7 @@ static SDValue LowerSIGN_EXTEND(SDValue Op, const X86Subtarget *Subtarget,
  
    SDValue OpHi = DAG.getVectorShuffle(InVT, dl, In, Undef, &ShufMask2[0]);
  
-  MVT HalfVT = MVT::getVectorVT(VT.getScalarType(),
+  MVT HalfVT = MVT::getVectorVT(VT.getVectorElementType(),
                                  VT.getVectorNumElements()/2);
  
    OpLo = DAG.getNode(X86ISD::VSEXT, dl, HalfVT, OpLo);
@@ -15132,7 +15130,7 @@ static SDValue LowerExtendedLoad(SDValue Op, const X86Subtarget *Subtarget,
    // memory. In practice, we ''widen'' MemVT.
    EVT WideVecVT =
        EVT::getVectorVT(*DAG.getContext(), MemVT.getScalarType(),
-                       loadRegZize / MemVT.getScalarType().getSizeInBits());
+                       loadRegZize / MemVT.getScalarSizeInBits());
  
    assert(WideVecVT.getSizeInBits() == LoadUnitVecVT.getSizeInBits() &&
           "Invalid vector type");
@@ -15885,7 +15883,7 @@ static SDValue getTargetVShiftNode(unsigned Opc, SDLoc dl, MVT VT,
    // The return type has to be a 128-bit type with the same element
    // type as the input type.
    MVT EltVT = VT.getVectorElementType();
-  EVT ShVT = MVT::getVectorVT(EltVT, 128/EltVT.getSizeInBits());
+  MVT ShVT = MVT::getVectorVT(EltVT, 128/EltVT.getSizeInBits());
  
    ShAmt = DAG.getBitcast(ShVT, ShAmt);
    return DAG.getNode(Opc, dl, VT, SrcOp, ShAmt);
@@ -15898,26 +15896,22 @@ static SDValue getVectorMaskingNode(SDValue Op, SDValue Mask,
                                      SDValue PreservedSrc,
                                      const X86Subtarget *Subtarget,
                                      SelectionDAG &DAG) {
-    EVT VT = Op.getValueType();
-    EVT MaskVT = EVT::getVectorVT(*DAG.getContext(),
-                                  MVT::i1, VT.getVectorNumElements());
-    SDValue VMask = SDValue();
+    MVT VT = Op.getSimpleValueType();
+    MVT MaskVT = MVT::getVectorVT(MVT::i1, VT.getVectorNumElements());
+    SDValue VMask;
      unsigned OpcodeSelect = ISD::VSELECT;
      SDLoc dl(Op);
  
-    assert(MaskVT.isSimple() && "invalid mask type");
-
      if (isAllOnes(Mask))
        return Op;
  
-    if (MaskVT.bitsGT(Mask.getValueType())) {
-      EVT newMaskVT =  EVT::getIntegerVT(*DAG.getContext(),
-                                         MaskVT.getSizeInBits());
+    if (MaskVT.bitsGT(Mask.getSimpleValueType())) {
+      MVT newMaskVT = MVT::getIntegerVT(MaskVT.getSizeInBits());
        VMask = DAG.getBitcast(MaskVT,
                               DAG.getNode(ISD::ANY_EXTEND, dl, newMaskVT, Mask));
      } else {
-      EVT BitcastVT = EVT::getVectorVT(*DAG.getContext(), MVT::i1,
-                                       Mask.getValueType().getSizeInBits());
+      MVT BitcastVT = MVT::getVectorVT(MVT::i1,
+                                       Mask.getSimpleValueType().getSizeInBits());
        // In case when MaskVT equals v2i1 or v4i1, low 2 or 4 elements
        // are extracted by EXTRACT_SUBVECTOR.
        VMask = DAG.getNode(ISD::EXTRACT_SUBVECTOR, dl, MaskVT,
@@ -15926,22 +15920,22 @@ static SDValue getVectorMaskingNode(SDValue Op, SDValue Mask,
      }
  
      switch (Op.getOpcode()) {
-      default: break;
-      case X86ISD::PCMPEQM:
-      case X86ISD::PCMPGTM:
-      case X86ISD::CMPM:
-      case X86ISD::CMPMU:
-        return DAG.getNode(ISD::AND, dl, VT, Op, VMask);
-      case X86ISD::VFPCLASS:
-        return DAG.getNode(ISD::OR, dl, VT, Op, VMask);
-      case X86ISD::VTRUNC:
-      case X86ISD::VTRUNCS:
-      case X86ISD::VTRUNCUS:
-        // We can't use ISD::VSELECT here because it is not always "Legal"
-        // for the destination type. For example vpmovqb require only AVX512
-        // and vselect that can operate on byte element type require BWI
-        OpcodeSelect = X86ISD::SELECT;
-        break;
+    default: break;
+    case X86ISD::PCMPEQM:
+    case X86ISD::PCMPGTM:
+    case X86ISD::CMPM:
+    case X86ISD::CMPMU:
+      return DAG.getNode(ISD::AND, dl, VT, Op, VMask);
+    case X86ISD::VFPCLASS:
+      return DAG.getNode(ISD::OR, dl, VT, Op, VMask);
+    case X86ISD::VTRUNC:
+    case X86ISD::VTRUNCS:
+    case X86ISD::VTRUNCUS:
+      // We can't use ISD::VSELECT here because it is not always "Legal"
+      // for the destination type. For example vpmovqb require only AVX512
+      // and vselect that can operate on byte element type require BWI
+      OpcodeSelect = X86ISD::SELECT;
+      break;
      }
      if (PreservedSrc.getOpcode() == ISD::UNDEF)
        PreservedSrc = getZeroVector(VT, Subtarget, DAG, dl);
@@ -15962,7 +15956,7 @@ static SDValue getScalarMaskingNode(SDValue Op, SDValue Mask,
    if (isAllOnes(Mask))
      return Op;
  
-  EVT VT = Op.getValueType();
+  MVT VT = Op.getSimpleValueType();
    SDLoc dl(Op);
    // The mask should be of type MVT::i1
    SDValue IMask = DAG.getNode(ISD::TRUNCATE, dl, MVT::i1, Mask);
@@ -16035,7 +16029,7 @@ static SDValue LowerINTRINSIC_WO_CHAIN(SDValue Op, const X86Subtarget *Subtarget
                                         SelectionDAG &DAG) {
    SDLoc dl(Op);
    unsigned IntNo = cast<ConstantSDNode>(Op.getOperand(0))->getZExtValue();
-  EVT VT = Op.getValueType();
+  MVT VT = Op.getSimpleValueType();
    const IntrinsicData* IntrData = getIntrinsicWithoutChain(IntNo);
    if (IntrData) {
      switch(IntrData->Type) {
@@ -16220,7 +16214,7 @@ static SDValue LowerINTRINSIC_WO_CHAIN(SDValue Op, const X86Subtarget *Subtarget
          // imm should be adapted to ISD::INSERT_SUBVECTOR behavior
          assert(isa<ConstantSDNode>(Src3) && "Expected a ConstantSDNode here!");
          unsigned Imm = cast<ConstantSDNode>(Src3)->getZExtValue();
-        Imm *= Src2.getValueType().getVectorNumElements();
+        Imm *= Src2.getSimpleValueType().getVectorNumElements();
          Src3 = DAG.getTargetConstant(Imm, dl, MVT::i32);
        }
  
@@ -16251,7 +16245,7 @@ static SDValue LowerINTRINSIC_WO_CHAIN(SDValue Op, const X86Subtarget *Subtarget
        SDValue Src2 = Op.getOperand(2);
        SDValue Src3 = Op.getOperand(3);
        SDValue Mask = Op.getOperand(4);
-      EVT VT = Op.getValueType();
+      MVT VT = Op.getSimpleValueType();
        SDValue PassThru = SDValue();
  
        // set PassThru element
@@ -16287,7 +16281,7 @@ static SDValue LowerINTRINSIC_WO_CHAIN(SDValue Op, const X86Subtarget *Subtarget
        SDValue Src3 = Op.getOperand(3);
        SDValue Src4 = DAG.getNode(ISD::TRUNCATE, dl, MVT::i8, Op.getOperand(4));
        SDValue Mask = Op.getOperand(5);
-      EVT VT = Op.getValueType();
+      MVT VT = Op.getSimpleValueType();
        SDValue PassThru = Src1;
        // Set PassThru element.
        if (IntrData->Type == TERLOG_OP_MASKZ)
@@ -16300,13 +16294,12 @@ static SDValue LowerINTRINSIC_WO_CHAIN(SDValue Op, const X86Subtarget *Subtarget
      case FPCLASS: {
        // FPclass intrinsics with mask
         SDValue Src1 = Op.getOperand(1);
-       EVT VT = Src1.getValueType();
-       EVT MaskVT = EVT::getVectorVT(*DAG.getContext(), MVT::i1,
-                                      VT.getVectorNumElements());
+       MVT VT = Src1.getSimpleValueType();
+       MVT MaskVT = MVT::getVectorVT(MVT::i1, VT.getVectorNumElements());
         SDValue Imm = Op.getOperand(2);
         SDValue Mask = Op.getOperand(3);
-       EVT BitcastVT = EVT::getVectorVT(*DAG.getContext(), MVT::i1,
-                                        Mask.getValueType().getSizeInBits());
+       MVT BitcastVT = MVT::getVectorVT(MVT::i1,
+                                     Mask.getSimpleValueType().getSizeInBits());
         SDValue FPclass = DAG.getNode(IntrData->Opc0, dl, MaskVT, Src1, Imm);
         SDValue FPclassMask = getVectorMaskingNode(FPclass, Mask,
                                                   DAG.getTargetConstant(0, dl, MaskVT),
@@ -16336,12 +16329,11 @@ static SDValue LowerINTRINSIC_WO_CHAIN(SDValue Op, const X86Subtarget *Subtarget
        //           (v2i1 (and (PCMPEQM %a, %b),
        //                      (extract_subvector
        //                         (v8i1 (bitcast %mask)), 0))), 0))))
-      EVT VT = Op.getOperand(1).getValueType();
-      EVT MaskVT = EVT::getVectorVT(*DAG.getContext(), MVT::i1,
-                                    VT.getVectorNumElements());
+      MVT VT = Op.getOperand(1).getSimpleValueType();
+      MVT MaskVT = MVT::getVectorVT(MVT::i1, VT.getVectorNumElements());
        SDValue Mask = Op.getOperand((IntrData->Type == CMP_MASK_CC) ? 4 : 3);
-      EVT BitcastVT = EVT::getVectorVT(*DAG.getContext(), MVT::i1,
-                                       Mask.getValueType().getSizeInBits());
+      MVT BitcastVT = MVT::getVectorVT(MVT::i1,
+                                       Mask.getSimpleValueType().getSizeInBits());
        SDValue Cmp;
        if (IntrData->Type == CMP_MASK_CC) {
          SDValue CC = Op.getOperand(3);
@@ -16435,11 +16427,10 @@ static SDValue LowerINTRINSIC_WO_CHAIN(SDValue Op, const X86Subtarget *Subtarget
      }
      case BLEND: {
        SDValue Mask = Op.getOperand(3);
-      EVT VT = Op.getValueType();
-      EVT MaskVT = EVT::getVectorVT(*DAG.getContext(), MVT::i1,
-                                    VT.getVectorNumElements());
-      EVT BitcastVT = EVT::getVectorVT(*DAG.getContext(), MVT::i1,
-                                       Mask.getValueType().getSizeInBits());
+      MVT VT = Op.getSimpleValueType();
+      MVT MaskVT = MVT::getVectorVT(MVT::i1, VT.getVectorNumElements());
+      MVT BitcastVT = MVT::getVectorVT(MVT::i1,
+                                       Mask.getSimpleValueType().getSizeInBits());
        SDLoc dl(Op);
        SDValue VMask = DAG.getNode(ISD::EXTRACT_SUBVECTOR, dl, MaskVT,
                                    DAG.getBitcast(BitcastVT, Mask),
@@ -16660,23 +16651,21 @@ static SDValue getGatherNode(unsigned Opc, SDValue Op, SelectionDAG &DAG,
                                SDValue Index, SDValue ScaleOp, SDValue Chain,
                                const X86Subtarget * Subtarget) {
    SDLoc dl(Op);
-  ConstantSDNode *C = dyn_cast<ConstantSDNode>(ScaleOp);
-  if (!C)
-    llvm_unreachable("Invalid scale type");
+  auto *C = cast<ConstantSDNode>(ScaleOp);
    unsigned ScaleVal = C->getZExtValue();
    if (ScaleVal > 2 && ScaleVal != 4 && ScaleVal != 8)
      llvm_unreachable("Valid scale values are 1, 2, 4, 8");
  
    SDValue Scale = DAG.getTargetConstant(C->getZExtValue(), dl, MVT::i8);
-  EVT MaskVT = MVT::getVectorVT(MVT::i1,
+  MVT MaskVT = MVT::getVectorVT(MVT::i1,
                               Index.getSimpleValueType().getVectorNumElements());
    SDValue MaskInReg;
    ConstantSDNode *MaskC = dyn_cast<ConstantSDNode>(Mask);
    if (MaskC)
      MaskInReg = DAG.getTargetConstant(MaskC->getSExtValue(), dl, MaskVT);
    else {
-    EVT BitcastVT = EVT::getVectorVT(*DAG.getContext(), MVT::i1,
-                                     Mask.getValueType().getSizeInBits());
+    MVT BitcastVT = MVT::getVectorVT(MVT::i1,
+                                     Mask.getSimpleValueType().getSizeInBits());
  
      // In case when MaskVT equals v2i1 or v4i1, low 2 or 4 elements
      // are extracted by EXTRACT_SUBVECTOR.
@@ -16699,9 +16688,7 @@ static SDValue getScatterNode(unsigned Opc, SDValue Op, SelectionDAG &DAG,
                                 SDValue Src, SDValue Mask, SDValue Base,
                                 SDValue Index, SDValue ScaleOp, SDValue Chain) {
    SDLoc dl(Op);
-  ConstantSDNode *C = dyn_cast<ConstantSDNode>(ScaleOp);
-  if (!C)
-    llvm_unreachable("Invalid scale type");
+  auto *C = cast<ConstantSDNode>(ScaleOp);
    unsigned ScaleVal = C->getZExtValue();
    if (ScaleVal > 2 && ScaleVal != 4 && ScaleVal != 8)
      llvm_unreachable("Valid scale values are 1, 2, 4, 8");
@@ -16709,15 +16696,15 @@ static SDValue getScatterNode(unsigned Opc, SDValue Op, SelectionDAG &DAG,
    SDValue Scale = DAG.getTargetConstant(C->getZExtValue(), dl, MVT::i8);
    SDValue Disp = DAG.getTargetConstant(0, dl, MVT::i32);
    SDValue Segment = DAG.getRegister(0, MVT::i32);
-  EVT MaskVT = MVT::getVectorVT(MVT::i1,
+  MVT MaskVT = MVT::getVectorVT(MVT::i1,
                               Index.getSimpleValueType().getVectorNumElements());
    SDValue MaskInReg;
    ConstantSDNode *MaskC = dyn_cast<ConstantSDNode>(Mask);
    if (MaskC)
      MaskInReg = DAG.getTargetConstant(MaskC->getSExtValue(), dl, MaskVT);
    else {
-    EVT BitcastVT = EVT::getVectorVT(*DAG.getContext(), MVT::i1,
-                                     Mask.getValueType().getSizeInBits());
+    MVT BitcastVT = MVT::getVectorVT(MVT::i1,
+                                     Mask.getSimpleValueType().getSizeInBits());
  
      // In case when MaskVT equals v2i1 or v4i1, low 2 or 4 elements
      // are extracted by EXTRACT_SUBVECTOR.
@@ -16735,12 +16722,11 @@ static SDValue getPrefetchNode(unsigned Opc, SDValue Op, SelectionDAG &DAG,
                                 SDValue Mask, SDValue Base, SDValue Index,
                                 SDValue ScaleOp, SDValue Chain) {
    SDLoc dl(Op);
-  ConstantSDNode *C = dyn_cast<ConstantSDNode>(ScaleOp);
-  assert(C && "Invalid scale type");
+  auto *C = cast<ConstantSDNode>(ScaleOp);
    SDValue Scale = DAG.getTargetConstant(C->getZExtValue(), dl, MVT::i8);
    SDValue Disp = DAG.getTargetConstant(0, dl, MVT::i32);
    SDValue Segment = DAG.getRegister(0, MVT::i32);
-  EVT MaskVT =
+  MVT MaskVT =
      MVT::getVectorVT(MVT::i1, Index.getSimpleValueType().getVectorNumElements());
    SDValue MaskInReg;
    ConstantSDNode *MaskC = dyn_cast<ConstantSDNode>(Mask);
@@ -16933,19 +16919,17 @@ static SDValue LowerINTRINSIC_TRUNCATE_TO_MEM(const SDValue & Op,
    SDValue Addr = Op.getOperand(2);
    SDValue Chain = Op.getOperand(0);
  
-  EVT VT  = DataToTruncate.getValueType();
-  EVT SVT = EVT::getVectorVT(*DAG.getContext(),
-                             ElementType, VT.getVectorNumElements());
+  MVT VT  = DataToTruncate.getSimpleValueType();
+  MVT SVT = MVT::getVectorVT(ElementType, VT.getVectorNumElements());
  
    if (isAllOnes(Mask)) // return just a truncate store
      return DAG.getTruncStore(Chain, dl, DataToTruncate, Addr,
                               MachinePointerInfo(), SVT, false, false,
                               SVT.getScalarSizeInBits()/8);
  
-  EVT MaskVT = EVT::getVectorVT(*DAG.getContext(),
-                                MVT::i1, VT.getVectorNumElements());
-  EVT BitcastVT = EVT::getVectorVT(*DAG.getContext(), MVT::i1,
-                                   Mask.getValueType().getSizeInBits());
+  MVT MaskVT = MVT::getVectorVT(MVT::i1, VT.getVectorNumElements());
+  MVT BitcastVT = MVT::getVectorVT(MVT::i1,
+                                   Mask.getSimpleValueType().getSizeInBits());
    // In case when MaskVT equals v2i1 or v4i1, low 2 or 4 elements
    // are extracted by EXTRACT_SUBVECTOR.
    SDValue VMask = DAG.getNode(ISD::EXTRACT_SUBVECTOR, dl, MaskVT,
@@ -16974,9 +16958,7 @@ static SDValue LowerINTRINSIC_W_CHAIN(SDValue Op, const X86Subtarget *Subtarget,
  
    SDLoc dl(Op);
    switch(IntrData->Type) {
-  default:
-    llvm_unreachable("Unknown Intrinsic Type");
-    break;
+  default: llvm_unreachable("Unknown Intrinsic Type");
    case RDSEED:
    case RDRAND: {
      // Emit the node with the right value type.
@@ -17081,7 +17063,7 @@ static SDValue LowerINTRINSIC_W_CHAIN(SDValue Op, const X86Subtarget *Subtarget,
      SDValue Addr = Op.getOperand(2);
      SDValue Chain = Op.getOperand(0);
  
-    EVT VT = DataToCompress.getValueType();
+    MVT VT = DataToCompress.getSimpleValueType();
      if (isAllOnes(Mask)) // return just a store
        return DAG.getStore(Chain, dl, DataToCompress, Addr,
                            MachinePointerInfo(), false, false,
@@ -17106,7 +17088,7 @@ static SDValue LowerINTRINSIC_W_CHAIN(SDValue Op, const X86Subtarget *Subtarget,
      SDValue PassThru = Op.getOperand(3);
      SDValue Addr = Op.getOperand(2);
      SDValue Chain = Op.getOperand(0);
-    EVT VT = Op.getValueType();
+    MVT VT = Op.getSimpleValueType();
  
      if (isAllOnes(Mask)) // return just a load
        return DAG.getLoad(VT, dl, Chain, Addr, MachinePointerInfo(), false, false,
@@ -17560,7 +17542,7 @@ static SDValue LowerVectorCTLZ_AVX512(SDValue Op, SelectionDAG &DAG) {
  static SDValue LowerCTLZ(SDValue Op, const X86Subtarget *Subtarget,
                           SelectionDAG &DAG) {
    MVT VT = Op.getSimpleValueType();
-  EVT OpVT = VT;
+  MVT OpVT = VT;
    unsigned NumBits = VT.getSizeInBits();
    SDLoc dl(Op);
  
@@ -17860,7 +17842,7 @@ static SDValue LowerMUL(SDValue Op, const X86Subtarget *Subtarget,
    SDValue AhiBlo = Ahi;
    SDValue AloBhi = Bhi;
    // Bit cast to 32-bit vectors for MULUDQ
-  EVT MulVT = (VT == MVT::v2i64) ? MVT::v4i32 :
+  MVT MulVT = (VT == MVT::v2i64) ? MVT::v4i32 :
                                    (VT == MVT::v4i64) ? MVT::v8i32 : MVT::v16i32;
    A = DAG.getBitcast(MulVT, A);
    B = DAG.getBitcast(MulVT, B);
@@ -17937,7 +17919,7 @@ SDValue X86TargetLowering::LowerWin64_i128OP(SDValue Op, SelectionDAG &DAG) cons
  static SDValue LowerMUL_LOHI(SDValue Op, const X86Subtarget *Subtarget,
                               SelectionDAG &DAG) {
    SDValue Op0 = Op.getOperand(0), Op1 = Op.getOperand(1);
-  EVT VT = Op0.getValueType();
+  MVT VT = Op0.getSimpleValueType();
    SDLoc dl(Op);
  
    assert((VT == MVT::v4i32 && Subtarget->hasSSE2()) ||
@@ -18240,7 +18222,7 @@ static SDValue LowerScalarVariableShift(SDValue Op, SelectionDAG &DAG,
  
    if (SupportedVectorShiftWithBaseAmnt(VT, Subtarget, Op.getOpcode())) {
      SDValue BaseShAmt;
-    EVT EltVT = VT.getVectorElementType();
+    MVT EltVT = VT.getVectorElementType();
  
      if (BuildVectorSDNode *BV = dyn_cast<BuildVectorSDNode>(Amt)) {
        // Check if this build_vector node is doing a splat.
@@ -18257,7 +18239,7 @@ static SDValue LowerScalarVariableShift(SDValue Op, SelectionDAG &DAG,
          unsigned SplatIdx = (unsigned)SVN->getSplatIndex();
          SDValue InVec = Amt.getOperand(0);
          if (InVec.getOpcode() == ISD::BUILD_VECTOR) {
-          assert((SplatIdx < InVec.getValueType().getVectorNumElements()) &&
+          assert((SplatIdx < InVec.getSimpleValueType().getVectorNumElements()) &&
                   "Unexpected shuffle index found!");
            BaseShAmt = InVec.getOperand(SplatIdx);
          } else if (InVec.getOpcode() == ISD::INSERT_VECTOR_ELT) {
@@ -18374,9 +18356,9 @@ static SDValue LowerShift(SDValue Op, const X86Subtarget* Subtarget,
         (Subtarget->hasInt256() && VT == MVT::v16i16)) &&
        ISD::isBuildVectorOfConstantSDNodes(Amt.getNode())) {
      SmallVector<SDValue, 8> Elts;
-    EVT SVT = VT.getScalarType();
+    MVT SVT = VT.getVectorElementType();
      unsigned SVTBits = SVT.getSizeInBits();
-    const APInt &One = APInt(SVTBits, 1);
+    APInt One(SVTBits, 1);
      unsigned NumElems = VT.getVectorNumElements();
  
      for (unsigned i=0; i !=NumElems; ++i) {
@@ -18387,7 +18369,7 @@ static SDValue LowerShift(SDValue Op, const X86Subtarget* Subtarget,
        }
  
        ConstantSDNode *ND = cast<ConstantSDNode>(Op);
-      const APInt &C = APInt(SVTBits, ND->getAPIntValue().getZExtValue());
+      APInt C(SVTBits, ND->getAPIntValue().getZExtValue());
        uint64_t ShAmt = C.getZExtValue();
        if (ShAmt >= SVTBits) {
          Elts.push_back(DAG.getUNDEF(SVT));
@@ -18466,7 +18448,7 @@ static SDValue LowerShift(SDValue Op, const X86Subtarget* Subtarget,
      if (CanBeSimplified && isa<ConstantSDNode>(Amt1) &&
          isa<ConstantSDNode>(Amt2)) {
        // Replace this node with two shifts followed by a MOVSS/MOVSD.
-      EVT CastVT = MVT::v4i32;
+      MVT CastVT = MVT::v4i32;
        SDValue Splat1 =
          DAG.getConstant(cast<ConstantSDNode>(Amt1)->getAPIntValue(), dl, VT);
        SDValue Shift1 = DAG.getNode(Op->getOpcode(), dl, VT, R, Splat1);
@@ -18734,7 +18716,7 @@ static SDValue LowerShift(SDValue Op, const X86Subtarget* Subtarget,
    if (VT.is256BitVector()) {
      unsigned NumElems = VT.getVectorNumElements();
      MVT EltVT = VT.getVectorElementType();
-    EVT NewVT = MVT::getVectorVT(EltVT, NumElems/2);
+    MVT NewVT = MVT::getVectorVT(EltVT, NumElems/2);
  
      // Extract the two vectors
      SDValue V1 = Extract128BitVector(R, 0, DAG, dl);
@@ -18782,10 +18764,10 @@ static SDValue LowerRotate(SDValue Op, const X86Subtarget *Subtarget,
    // +ve/-ve Amt = rotate left/right.
  
    // Split 256-bit integers.
-  if (VT.getSizeInBits() == 256)
+  if (VT.is256BitVector())
      return Lower256IntArith(Op, DAG);
  
-  assert(VT.getSizeInBits() == 128 && "Only rotate 128-bit vectors!");
+  assert(VT.is128BitVector() && "Only rotate 128-bit vectors!");
  
    // Attempt to rotate by immediate.
    if (auto *BVAmt = dyn_cast<BuildVectorSDNode>(Amt)) {
@@ -19103,7 +19085,7 @@ static SDValue LowerBITCAST(SDValue Op, const X86Subtarget *Subtarget,
      SDValue InVec = Op->getOperand(0);
      SDLoc dl(Op);
      unsigned NumElts = SrcVT.getVectorNumElements();
-    EVT SVT = SrcVT.getVectorElementType();
+    MVT SVT = SrcVT.getVectorElementType();
  
      // Widen the vector in input in the case of MVT::v2i32.
      // Example: from MVT::v2i32 to MVT::v4i32.
@@ -19371,7 +19353,7 @@ static SDValue LowerVectorCTPOP(SDValue Op, const X86Subtarget *Subtarget,
  
  static SDValue LowerCTPOP(SDValue Op, const X86Subtarget *Subtarget,
                            SelectionDAG &DAG) {
-  assert(Op.getValueType().isVector() &&
+  assert(Op.getSimpleValueType().isVector() &&
           "We only do custom lowering for vector population count.");
    return LowerVectorCTPOP(Op, Subtarget, DAG);
  }
@@ -19417,7 +19399,7 @@ static SDValue LowerATOMIC_STORE(SDValue Op, SelectionDAG &DAG) {
  }
  
  static SDValue LowerADDC_ADDE_SUBC_SUBE(SDValue Op, SelectionDAG &DAG) {
-  EVT VT = Op.getNode()->getSimpleValueType(0);
+  MVT VT = Op.getNode()->getSimpleValueType(0);
  
    // Let legalize expand this if it isn't a legal type yet.
    if (!DAG.getTargetLoweringInfo().isTypeLegal(VT))
@@ -19501,7 +19483,7 @@ static SDValue LowerMSCATTER(SDValue Op, const X86Subtarget *Subtarget,
           "MGATHER/MSCATTER are supported on AVX-512 arch only");
  
    MaskedScatterSDNode *N = cast<MaskedScatterSDNode>(Op.getNode());
-  EVT VT = N->getValue().getValueType();
+  MVT VT = N->getValue().getSimpleValueType();
    assert(VT.getScalarSizeInBits() >= 32 && "Unsupported scatter op");
    SDLoc dl(Op);
  
@@ -19510,7 +19492,7 @@ static SDValue LowerMSCATTER(SDValue Op, const X86Subtarget *Subtarget,
    if (N->getNumValues() == 1) {
      SDValue Index = N->getIndex();
      if (!Subtarget->hasVLX() && !VT.is512BitVector() &&
-        !Index.getValueType().is512BitVector())
+        !Index.getSimpleValueType().is512BitVector())
        Index = DAG.getNode(ISD::SIGN_EXTEND, dl, MVT::v8i64, Index);
  
      SDVTList VTs = DAG.getVTList(N->getMask().getValueType(), MVT::Other);
@@ -19530,13 +19512,13 @@ static SDValue LowerMGATHER(SDValue Op, const X86Subtarget *Subtarget,
           "MGATHER/MSCATTER are supported on AVX-512 arch only");
  
    MaskedGatherSDNode *N = cast<MaskedGatherSDNode>(Op.getNode());
-  EVT VT = Op.getValueType();
+  MVT VT = Op.getSimpleValueType();
    assert(VT.getScalarSizeInBits() >= 32 && "Unsupported gather op");
    SDLoc dl(Op);
  
    SDValue Index = N->getIndex();
    if (!Subtarget->hasVLX() && !VT.is512BitVector() &&
-      !Index.getValueType().is512BitVector()) {
+      !Index.getSimpleValueType().is512BitVector()) {
      Index = DAG.getNode(ISD::SIGN_EXTEND, dl, MVT::v8i64, Index);
      SDValue Ops[] = { N->getOperand(0), N->getOperand(1),  N->getOperand(2),
                        N->getOperand(3), Index };
@@ -19706,8 +19688,7 @@ void X86TargetLowering::ReplaceNodeResults(SDNode *N,
    case X86ISD::FMAXC:
    case X86ISD::FMAX: {
      EVT VT = N->getValueType(0);
-    if (VT != MVT::v2f32)
-      llvm_unreachable("Unexpected type (!= v2f32) on FMIN/FMAX.");
+    assert(VT == MVT::v2f32 && "Unexpected type (!= v2f32) on FMIN/FMAX.");
      SDValue UNDEF = DAG.getUNDEF(VT);
      SDValue LHS = DAG.getNode(ISD::CONCAT_VECTORS, dl, MVT::v4f32,
                                N->getOperand(0), UNDEF);
@@ -19807,7 +19788,7 @@ void X86TargetLowering::ReplaceNodeResults(SDNode *N,
      EVT T = N->getValueType(0);
      assert((T == MVT::i64 || T == MVT::i128) && "can only expand cmpxchg pair");
      bool Regs64bit = T == MVT::i128;
-    EVT HalfT = Regs64bit ? MVT::i64 : MVT::i32;
+    MVT HalfT = Regs64bit ? MVT::i64 : MVT::i32;
      SDValue cpInL, cpInH;
      cpInL = DAG.getNode(ISD::EXTRACT_ELEMENT, dl, HalfT, N->getOperand(2),
                          DAG.getConstant(0, dl, HalfT));
@@ -20327,11 +20308,11 @@ X86TargetLowering::isShuffleMaskLegal(const SmallVectorImpl<int> &M,
      return false;
  
    // Not for i1 vectors
-  if (VT.getScalarType() == MVT::i1)
+  if (VT.getSimpleVT().getScalarType() == MVT::i1)
      return false;
  
    // Very little shuffling can be done for 64-bit vectors right now.
-  if (VT.getSizeInBits() == 64)
+  if (VT.getSimpleVT().getSizeInBits() == 64)
      return false;
  
    // We only care that the types being shuffled are legal. The lowering can
@@ -22035,7 +22016,7 @@ unsigned X86TargetLowering::ComputeNumSignBitsForTargetNode(
    unsigned Depth) const {
    // SETCC_CARRY sets the dest to ~0 for true or 0 for false.
    if (Op.getOpcode() == X86ISD::SETCC_CARRY)
-    return Op.getValueType().getScalarType().getSizeInBits();
+    return Op.getValueType().getScalarSizeInBits();
  
    // Fallback case.
    return 1;
@@ -22239,7 +22220,7 @@ static bool combineX86ShuffleChain(SDValue Op, SDValue Root, ArrayRef<int> Mask,
    // doesn't preclude something switching to the shorter encoding post-RA.
    //
    // FIXME: Should teach these routines about AVX vector widths.
-  if (FloatDomain && VT.getSizeInBits() == 128) {
+  if (FloatDomain && VT.is128BitVector()) {
      if (Mask.equals({0, 0}) || Mask.equals({1, 1})) {
        bool Lo = Mask.equals({0, 0});
        unsigned Shuffle;
@@ -22303,7 +22284,7 @@ static bool combineX86ShuffleChain(SDValue Op, SDValue Root, ArrayRef<int> Mask,
    // We always canonicalize the 8 x i16 and 16 x i8 shuffles into their UNPCK
    // variants as none of these have single-instruction variants that are
    // superior to the UNPCK formulation.
-  if (!FloatDomain && VT.getSizeInBits() == 128 &&
+  if (!FloatDomain && VT.is128BitVector() &&
        (Mask.equals({0, 0, 1, 1, 2, 2, 3, 3}) ||
         Mask.equals({4, 4, 5, 5, 6, 6, 7, 7}) ||
         Mask.equals({0, 0, 1, 1, 2, 2, 3, 3, 4, 4, 5, 5, 6, 6, 7, 7}) ||
@@ -22616,8 +22597,8 @@ combineRedundantDWordShuffle(SDValue N, MutableArrayRef<int> Mask,
      case X86ISD::UNPCKH:
        // For either i8 -> i16 or i16 -> i32 unpacks, we can combine a dword
        // shuffle into a preceding word shuffle.
-      if (V.getSimpleValueType().getScalarType() != MVT::i8 &&
-          V.getSimpleValueType().getScalarType() != MVT::i16)
+      if (V.getSimpleValueType().getVectorElementType() != MVT::i8 &&
+          V.getSimpleValueType().getVectorElementType() != MVT::i16)
          return SDValue();
  
        // Search for a half-shuffle which we can combine with.
@@ -22792,7 +22773,7 @@ static SDValue PerformTargetShuffleCombine(SDValue N, SelectionDAG &DAG,
      break;
    case X86ISD::PSHUFLW:
    case X86ISD::PSHUFHW:
-    assert(VT.getScalarType() == MVT::i16 && "Bad word shuffle type!");
+    assert(VT.getVectorElementType() == MVT::i16 && "Bad word shuffle type!");
  
      if (combineRedundantHalfShuffle(N, Mask, DAG, DCI))
        return SDValue(); // We combined away this shuffle, so we're done.
@@ -23123,21 +23104,45 @@ static SDValue XFormVExtractWithShuffleIntoLoad(SDNode *N, SelectionDAG &DAG,
                       EltNo);
  }
  
-/// \brief Detect bitcasts between i32 to x86mmx low word. Since MMX types are
-/// special and don't usually play with other vector types, it's better to
-/// handle them early to be sure we emit efficient code by avoiding
-/// store-load conversions.
-static SDValue PerformBITCASTCombine(SDNode *N, SelectionDAG &DAG) {
-  if (N->getValueType(0) != MVT::x86mmx ||
-      N->getOperand(0)->getOpcode() != ISD::BUILD_VECTOR ||
-      N->getOperand(0)->getValueType(0) != MVT::v2i32)
-    return SDValue();
+static SDValue PerformBITCASTCombine(SDNode *N, SelectionDAG &DAG,
+                                     const X86Subtarget *Subtarget) {
+  SDValue N0 = N->getOperand(0);
+  EVT VT = N->getValueType(0);
  
-  SDValue V = N->getOperand(0);
-  ConstantSDNode *C = dyn_cast<ConstantSDNode>(V.getOperand(1));
-  if (C && C->getZExtValue() == 0 && V.getOperand(0).getValueType() == MVT::i32)
-    return DAG.getNode(X86ISD::MMX_MOVW2D, SDLoc(V.getOperand(0)),
-                       N->getValueType(0), V.getOperand(0));
+  // Detect bitcasts between i32 to x86mmx low word. Since MMX types are
+  // special and don't usually play with other vector types, it's better to
+  // handle them early to be sure we emit efficient code by avoiding
+  // store-load conversions.
+  if (VT == MVT::x86mmx && N0.getOpcode() == ISD::BUILD_VECTOR &&
+      N0.getValueType() == MVT::v2i32 &&
+      isa<ConstantSDNode>(N0.getOperand(1))) {
+    SDValue N00 = N0->getOperand(0);
+    if (N0.getConstantOperandVal(1) == 0 && N00.getValueType() == MVT::i32)
+      return DAG.getNode(X86ISD::MMX_MOVW2D, SDLoc(N00), VT, N00);
+  }
+
+  // Convert a bitcasted integer logic operation that has one bitcasted
+  // floating-point operand and one constant operand into a floating-point
+  // logic operation. This may create a load of the constant, but that is
+  // cheaper than materializing the constant in an integer register and
+  // transferring it to an SSE register or transferring the SSE operand to
+  // integer register and back.
+  unsigned FPOpcode;
+  switch (N0.getOpcode()) {
+    case ISD::AND: FPOpcode = X86ISD::FAND; break;
+    case ISD::OR:  FPOpcode = X86ISD::FOR;  break;
+    case ISD::XOR: FPOpcode = X86ISD::FXOR; break;
+    default: return SDValue();
+  }
+  if (((Subtarget->hasSSE1() && VT == MVT::f32) ||
+       (Subtarget->hasSSE2() && VT == MVT::f64)) &&
+      isa<ConstantSDNode>(N0.getOperand(1)) &&
+      N0.getOperand(0).getOpcode() == ISD::BITCAST &&
+      N0.getOperand(0).getOperand(0).getValueType() == VT) {
+    SDValue N000 = N0.getOperand(0).getOperand(0);
+    SDValue FPConst = DAG.getBitcast(VT, N0.getOperand(1));
+    return DAG.getNode(FPOpcode, SDLoc(N0), VT, N000, FPConst);
+  }
  
    return SDValue();
  }
@@ -23180,9 +23185,9 @@ static SDValue PerformEXTRACT_VECTOR_ELTCombine(SDNode *N, SelectionDAG &DAG,
  
    EVT VT = N->getValueType(0);
  
-  if (VT == MVT::i1 && dyn_cast<ConstantSDNode>(N->getOperand(1)) &&
+  if (VT == MVT::i1 && isa<ConstantSDNode>(N->getOperand(1)) &&
        InputVector.getOpcode() == ISD::BITCAST &&
-      dyn_cast<ConstantSDNode>(InputVector.getOperand(0))) {
+      isa<ConstantSDNode>(InputVector.getOperand(0))) {
      uint64_t ExtractedElt =
          cast<ConstantSDNode>(N->getOperand(1))->getZExtValue();
      uint64_t InputValue =
@@ -23776,7 +23781,7 @@ static SDValue PerformSELECTCombine(SDNode *N, SelectionDAG &DAG,
    if (N->getOpcode() == ISD::VSELECT && DCI.isBeforeLegalizeOps() &&
        !DCI.isBeforeLegalize() &&
        !ISD::isBuildVectorOfConstantSDNodes(Cond.getNode())) {
-    unsigned BitWidth = Cond.getValueType().getScalarType().getSizeInBits();
+    unsigned BitWidth = Cond.getValueType().getScalarSizeInBits();
  
      // Don't optimize vector selects that map to mask-registers.
      if (BitWidth == 1)
@@ -23797,14 +23802,13 @@ static SDValue PerformSELECTCombine(SDNode *N, SelectionDAG &DAG,
      // FIXME: We don't support i16-element blends currently. We could and
      // should support them by making *all* the bits in the condition be set
      // rather than just the high bit and using an i8-element blend.
-    if (VT.getScalarType() == MVT::i16)
+    if (VT.getVectorElementType() == MVT::i16)
        return SDValue();
      // Dynamic blending was only available from SSE4.1 onward.
-    if (VT.getSizeInBits() == 128 && !Subtarget->hasSSE41())
+    if (VT.is128BitVector() && !Subtarget->hasSSE41())
        return SDValue();
      // Byte blends are only available in AVX2
-    if (VT.getSizeInBits() == 256 && VT.getScalarType() == MVT::i8 &&
-        !Subtarget->hasAVX2())
+    if (VT == MVT::v32i8 && !Subtarget->hasAVX2())
        return SDValue();
  
      assert(BitWidth >= 8 && BitWidth <= 64 && "Invalid mask size");
@@ -24387,7 +24391,8 @@ static SDValue performShiftToAllZeros(SDNode *N, SelectionDAG &DAG,
    if (auto *AmtBV = dyn_cast<BuildVectorSDNode>(Amt))
      if (auto *AmtSplat = AmtBV->getConstantSplatNode()) {
        APInt ShiftAmt = AmtSplat->getAPIntValue();
-      unsigned MaxAmount = VT.getVectorElementType().getSizeInBits();
+      unsigned MaxAmount =
+        VT.getSimpleVT().getVectorElementType().getSizeInBits();
  
        // SSE2/AVX2 logical shifts always return a vector of 0s
        // if the shift amount is bigger than or equal to
@@ -24603,7 +24608,7 @@ static SDValue WidenMaskArithmetic(SDNode *N, SelectionDAG &DAG,
    // Set N0 and N1 to hold the inputs to the new wide operation.
    N0 = N0->getOperand(0);
    if (RHSConstSplat) {
-    N1 = DAG.getNode(ISD::ZERO_EXTEND, DL, WideVT.getScalarType(),
+    N1 = DAG.getNode(ISD::ZERO_EXTEND, DL, WideVT.getVectorElementType(),
                       SDValue(RHSConstSplat, 0));
      SmallVector<SDValue, 8> C(WideVT.getVectorNumElements(), N1);
      N1 = DAG.getNode(ISD::BUILD_VECTOR, DL, WideVT, C);
@@ -24618,9 +24623,9 @@ static SDValue WidenMaskArithmetic(SDNode *N, SelectionDAG &DAG,
    case ISD::ANY_EXTEND:
      return Op;
    case ISD::ZERO_EXTEND: {
-    unsigned InBits = NarrowVT.getScalarType().getSizeInBits();
+    unsigned InBits = NarrowVT.getScalarSizeInBits();
      APInt Mask = APInt::getAllOnesValue(InBits);
-    Mask = Mask.zext(VT.getScalarType().getSizeInBits());
+    Mask = Mask.zext(VT.getScalarSizeInBits());
      return DAG.getNode(ISD::AND, DL, VT,
                         Op, DAG.getConstant(Mask, DL, VT));
    }
@@ -24906,7 +24911,7 @@ static SDValue PerformOrCombine(SDNode *N, SelectionDAG &DAG,
        if (!Subtarget->hasSSE41())
          return SDValue();
  
-      EVT BlendVT = (VT == MVT::v4i64) ? MVT::v32i8 : MVT::v16i8;
+      MVT BlendVT = (VT == MVT::v4i64) ? MVT::v32i8 : MVT::v16i8;
  
        X = DAG.getBitcast(BlendVT, X);
        Y = DAG.getBitcast(BlendVT, Y);
@@ -25482,7 +25487,7 @@ static SDValue PerformSTORECombine(SDNode *N, SelectionDAG &DAG,
      // Otherwise, if it's legal to use f64 SSE instructions, use f64 load/store
      // pair instead.
      if (Subtarget->is64Bit() || F64IsLegal) {
-      EVT LdVT = Subtarget->is64Bit() ? MVT::i64 : MVT::f64;
+      MVT LdVT = Subtarget->is64Bit() ? MVT::i64 : MVT::f64;
        SDValue NewLd = DAG.getLoad(LdVT, LdDL, Ld->getChain(), Ld->getBasePtr(),
                                    Ld->getPointerInfo(), Ld->isVolatile(),
                                    Ld->isNonTemporal(), Ld->isInvariant(),
@@ -26004,7 +26009,7 @@ static SDValue PerformSExtCombine(SDNode *N, SelectionDAG &DAG,
      }
    }
  
-  if (Subtarget->hasAVX() && VT.isVector() && VT.getSizeInBits() == 256)
+  if (Subtarget->hasAVX() && VT.is256BitVector())
      if (SDValue R = WidenMaskArithmetic(N, DAG, DCI, Subtarget))
        return R;
  
@@ -26635,7 +26640,7 @@ SDValue X86TargetLowering::PerformDAGCombine(SDNode *N,
    case ISD::SELECT:
    case X86ISD::SHRUNKBLEND:
      return PerformSELECTCombine(N, DAG, DCI, Subtarget);
-  case ISD::BITCAST:        return PerformBITCASTCombine(N, DAG);
+  case ISD::BITCAST:        return PerformBITCASTCombine(N, DAG, Subtarget);
    case X86ISD::CMOV:        return PerformCMOVCombine(N, DAG, DCI, Subtarget);
    case ISD::ADD:            return PerformAddCombine(N, DAG, Subtarget);
    case ISD::SUB:            return PerformSubCombine(N, DAG, Subtarget);