lib/CodeGen/SelectionDAG/SelectionDAG.cpp

   1 //===-- SelectionDAG.cpp - Implement the SelectionDAG data structures -----===//
   2 //
   3 //                     The LLVM Compiler Infrastructure
   4 //
   5 // This file is distributed under the University of Illinois Open Source
   6 // License. See LICENSE.TXT for details.
   7 //
   8 //===----------------------------------------------------------------------===//
   9 //
  10 // This implements the SelectionDAG class.
  11 //
  12 //===----------------------------------------------------------------------===//
  13
  14 #include "llvm/CodeGen/SelectionDAG.h"
  15 #include "SDNodeDbgValue.h"
  16 #include "llvm/ADT/APSInt.h"
  17 #include "llvm/ADT/SetVector.h"
  18 #include "llvm/ADT/SmallPtrSet.h"
  19 #include "llvm/ADT/SmallSet.h"
  20 #include "llvm/ADT/SmallVector.h"
  21 #include "llvm/ADT/StringExtras.h"
  22 #include "llvm/Analysis/ValueTracking.h"
  23 #include "llvm/CodeGen/MachineBasicBlock.h"
  24 #include "llvm/CodeGen/MachineConstantPool.h"
  25 #include "llvm/CodeGen/MachineFrameInfo.h"
  26 #include "llvm/CodeGen/MachineModuleInfo.h"
  27 #include "llvm/IR/CallingConv.h"
  28 #include "llvm/IR/Constants.h"
  29 #include "llvm/IR/DataLayout.h"
  30 #include "llvm/IR/DebugInfo.h"
  31 #include "llvm/IR/DerivedTypes.h"
  32 #include "llvm/IR/Function.h"
  33 #include "llvm/IR/GlobalAlias.h"
  34 #include "llvm/IR/GlobalVariable.h"
  35 #include "llvm/IR/Intrinsics.h"
  36 #include "llvm/Support/CommandLine.h"
  37 #include "llvm/Support/Debug.h"
  38 #include "llvm/Support/ErrorHandling.h"
  39 #include "llvm/Support/ManagedStatic.h"
  40 #include "llvm/Support/MathExtras.h"
  41 #include "llvm/Support/Mutex.h"
  42 #include "llvm/Support/raw_ostream.h"
  43 #include "llvm/Target/TargetInstrInfo.h"
  44 #include "llvm/Target/TargetIntrinsicInfo.h"
  45 #include "llvm/Target/TargetLowering.h"
  46 #include "llvm/Target/TargetMachine.h"
  47 #include "llvm/Target/TargetOptions.h"
  48 #include "llvm/Target/TargetRegisterInfo.h"
  49 #include "llvm/Target/TargetSelectionDAGInfo.h"
  50 #include "llvm/Target/TargetSubtargetInfo.h"
  51 #include <algorithm>
  52 #include <cmath>
  53 #include <utility>
  54
  55 using namespace llvm;
  56
  57 /// makeVTList - Return an instance of the SDVTList struct initialized with the
  58 /// specified members.
  59 static SDVTList makeVTList(const EVT *VTs, unsigned NumVTs) {
  60   SDVTList Res = {VTs, NumVTs};
  61   return Res;
  62 }
  63
  64 // Default null implementations of the callbacks.
  65 void SelectionDAG::DAGUpdateListener::NodeDeleted(SDNode*, SDNode*) {}
  66 void SelectionDAG::DAGUpdateListener::NodeUpdated(SDNode*) {}
  67
  68 //===----------------------------------------------------------------------===//
  69 //                              ConstantFPSDNode Class
  70 //===----------------------------------------------------------------------===//
  71
  72 /// isExactlyValue - We don't rely on operator== working on double values, as
  73 /// it returns true for things that are clearly not equal, like -0.0 and 0.0.
  74 /// As such, this method can be used to do an exact bit-for-bit comparison of
  75 /// two floating point values.
  76 bool ConstantFPSDNode::isExactlyValue(const APFloat& V) const {
  77   return getValueAPF().bitwiseIsEqual(V);
  78 }
  79
  80 bool ConstantFPSDNode::isValueValidForType(EVT VT,
  81                                            const APFloat& Val) {
  82   assert(VT.isFloatingPoint() && "Can only convert between FP types");
  83
  84   // convert modifies in place, so make a copy.
  85   APFloat Val2 = APFloat(Val);
  86   bool losesInfo;
  87   (void) Val2.convert(SelectionDAG::EVTToAPFloatSemantics(VT),
  88                       APFloat::rmNearestTiesToEven,
  89                       &losesInfo);
  90   return !losesInfo;
  91 }
  92
  93 //===----------------------------------------------------------------------===//
  94 //                              ISD Namespace
  95 //===----------------------------------------------------------------------===//
  96
  97 /// isBuildVectorAllOnes - Return true if the specified node is a
  98 /// BUILD_VECTOR where all of the elements are ~0 or undef.
  99 bool ISD::isBuildVectorAllOnes(const SDNode *N) {
 100   // Look through a bit convert.
 101   while (N->getOpcode() == ISD::BITCAST)
 102     N = N->getOperand(0).getNode();
 103
 104   if (N->getOpcode() != ISD::BUILD_VECTOR) return false;
 105
 106   unsigned i = 0, e = N->getNumOperands();
 107
 108   // Skip over all of the undef values.
 109   while (i != e && N->getOperand(i).getOpcode() == ISD::UNDEF)
 110     ++i;
 111
 112   // Do not accept an all-undef vector.
 113   if (i == e) return false;
 114
 115   // Do not accept build_vectors that aren't all constants or which have non-~0
 116   // elements. We have to be a bit careful here, as the type of the constant
 117   // may not be the same as the type of the vector elements due to type
 118   // legalization (the elements are promoted to a legal type for the target and
 119   // a vector of a type may be legal when the base element type is not).
 120   // We only want to check enough bits to cover the vector elements, because
 121   // we care if the resultant vector is all ones, not whether the individual
 122   // constants are.
 123   SDValue NotZero = N->getOperand(i);
 124   unsigned EltSize = N->getValueType(0).getVectorElementType().getSizeInBits();
 125   if (ConstantSDNode *CN = dyn_cast<ConstantSDNode>(NotZero)) {
 126     if (CN->getAPIntValue().countTrailingOnes() < EltSize)
 127       return false;
 128   } else if (ConstantFPSDNode *CFPN = dyn_cast<ConstantFPSDNode>(NotZero)) {
 129     if (CFPN->getValueAPF().bitcastToAPInt().countTrailingOnes() < EltSize)
 130       return false;
 131   } else
 132     return false;
 133
 134   // Okay, we have at least one ~0 value, check to see if the rest match or are
 135   // undefs. Even with the above element type twiddling, this should be OK, as
 136   // the same type legalization should have applied to all the elements.
 137   for (++i; i != e; ++i)
 138     if (N->getOperand(i) != NotZero &&
 139         N->getOperand(i).getOpcode() != ISD::UNDEF)
 140       return false;
 141   return true;
 142 }
 143
 144
 145 /// isBuildVectorAllZeros - Return true if the specified node is a
 146 /// BUILD_VECTOR where all of the elements are 0 or undef.
 147 bool ISD::isBuildVectorAllZeros(const SDNode *N) {
 148   // Look through a bit convert.
 149   while (N->getOpcode() == ISD::BITCAST)
 150     N = N->getOperand(0).getNode();
 151
 152   if (N->getOpcode() != ISD::BUILD_VECTOR) return false;
 153
 154   bool IsAllUndef = true;
 155   for (const SDValue &Op : N->op_values()) {
 156     if (Op.getOpcode() == ISD::UNDEF)
 157       continue;
 158     IsAllUndef = false;
 159     // Do not accept build_vectors that aren't all constants or which have non-0
 160     // elements. We have to be a bit careful here, as the type of the constant
 161     // may not be the same as the type of the vector elements due to type
 162     // legalization (the elements are promoted to a legal type for the target
 163     // and a vector of a type may be legal when the base element type is not).
 164     // We only want to check enough bits to cover the vector elements, because
 165     // we care if the resultant vector is all zeros, not whether the individual
 166     // constants are.
 167     unsigned EltSize = N->getValueType(0).getVectorElementType().getSizeInBits();
 168     if (ConstantSDNode *CN = dyn_cast<ConstantSDNode>(Op)) {
 169       if (CN->getAPIntValue().countTrailingZeros() < EltSize)
 170         return false;
 171     } else if (ConstantFPSDNode *CFPN = dyn_cast<ConstantFPSDNode>(Op)) {
 172       if (CFPN->getValueAPF().bitcastToAPInt().countTrailingZeros() < EltSize)
 173         return false;
 174     } else
 175       return false;
 176   }
 177
 178   // Do not accept an all-undef vector.
 179   if (IsAllUndef)
 180     return false;
 181   return true;
 182 }
 183
 184 /// \brief Return true if the specified node is a BUILD_VECTOR node of
 185 /// all ConstantSDNode or undef.
 186 bool ISD::isBuildVectorOfConstantSDNodes(const SDNode *N) {
 187   if (N->getOpcode() != ISD::BUILD_VECTOR)
 188     return false;
 189
 190   for (const SDValue &Op : N->op_values()) {
 191     if (Op.getOpcode() == ISD::UNDEF)
 192       continue;
 193     if (!isa<ConstantSDNode>(Op))
 194       return false;
 195   }
 196   return true;
 197 }
 198
 199 /// \brief Return true if the specified node is a BUILD_VECTOR node of
 200 /// all ConstantFPSDNode or undef.
 201 bool ISD::isBuildVectorOfConstantFPSDNodes(const SDNode *N) {
 202   if (N->getOpcode() != ISD::BUILD_VECTOR)
 203     return false;
 204
 205   for (const SDValue &Op : N->op_values()) {
 206     if (Op.getOpcode() == ISD::UNDEF)
 207       continue;
 208     if (!isa<ConstantFPSDNode>(Op))
 209       return false;
 210   }
 211   return true;
 212 }
 213
 214 /// allOperandsUndef - Return true if the node has at least one operand
 215 /// and all operands of the specified node are ISD::UNDEF.
 216 bool ISD::allOperandsUndef(const SDNode *N) {
 217   // Return false if the node has no operands.
 218   // This is "logically inconsistent" with the definition of "all" but
 219   // is probably the desired behavior.
 220   if (N->getNumOperands() == 0)
 221     return false;
 222
 223   for (const SDValue &Op : N->op_values())
 224     if (Op.getOpcode() != ISD::UNDEF)
 225       return false;
 226
 227   return true;
 228 }
 229
 230 ISD::NodeType ISD::getExtForLoadExtType(bool IsFP, ISD::LoadExtType ExtType) {
 231   switch (ExtType) {
 232   case ISD::EXTLOAD:
 233     return IsFP ? ISD::FP_EXTEND : ISD::ANY_EXTEND;
 234   case ISD::SEXTLOAD:
 235     return ISD::SIGN_EXTEND;
 236   case ISD::ZEXTLOAD:
 237     return ISD::ZERO_EXTEND;
 238   default:
 239     break;
 240   }
 241
 242   llvm_unreachable("Invalid LoadExtType");
 243 }
 244
 245 /// getSetCCSwappedOperands - Return the operation corresponding to (Y op X)
 246 /// when given the operation for (X op Y).
 247 ISD::CondCode ISD::getSetCCSwappedOperands(ISD::CondCode Operation) {
 248   // To perform this operation, we just need to swap the L and G bits of the
 249   // operation.
 250   unsigned OldL = (Operation >> 2) & 1;
 251   unsigned OldG = (Operation >> 1) & 1;
 252   return ISD::CondCode((Operation & ~6) |  // Keep the N, U, E bits
 253                        (OldL << 1) |       // New G bit
 254                        (OldG << 2));       // New L bit.
 255 }
 256
 257 /// getSetCCInverse - Return the operation corresponding to !(X op Y), where
 258 /// 'op' is a valid SetCC operation.
 259 ISD::CondCode ISD::getSetCCInverse(ISD::CondCode Op, bool isInteger) {
 260   unsigned Operation = Op;
 261   if (isInteger)
 262     Operation ^= 7;   // Flip L, G, E bits, but not U.
 263   else
 264     Operation ^= 15;  // Flip all of the condition bits.
 265
 266   if (Operation > ISD::SETTRUE2)
 267     Operation &= ~8;  // Don't let N and U bits get set.
 268
 269   return ISD::CondCode(Operation);
 270 }
 271
 272
 273 /// isSignedOp - For an integer comparison, return 1 if the comparison is a
 274 /// signed operation and 2 if the result is an unsigned comparison.  Return zero
 275 /// if the operation does not depend on the sign of the input (setne and seteq).
 276 static int isSignedOp(ISD::CondCode Opcode) {
 277   switch (Opcode) {
 278   default: llvm_unreachable("Illegal integer setcc operation!");
 279   case ISD::SETEQ:
 280   case ISD::SETNE: return 0;
 281   case ISD::SETLT:
 282   case ISD::SETLE:
 283   case ISD::SETGT:
 284   case ISD::SETGE: return 1;
 285   case ISD::SETULT:
 286   case ISD::SETULE:
 287   case ISD::SETUGT:
 288   case ISD::SETUGE: return 2;
 289   }
 290 }
 291
 292 /// getSetCCOrOperation - Return the result of a logical OR between different
 293 /// comparisons of identical values: ((X op1 Y) | (X op2 Y)).  This function
 294 /// returns SETCC_INVALID if it is not possible to represent the resultant
 295 /// comparison.
 296 ISD::CondCode ISD::getSetCCOrOperation(ISD::CondCode Op1, ISD::CondCode Op2,
 297                                        bool isInteger) {
 298   if (isInteger && (isSignedOp(Op1) | isSignedOp(Op2)) == 3)
 299     // Cannot fold a signed integer setcc with an unsigned integer setcc.
 300     return ISD::SETCC_INVALID;
 301
 302   unsigned Op = Op1 | Op2;  // Combine all of the condition bits.
 303
 304   // If the N and U bits get set then the resultant comparison DOES suddenly
 305   // care about orderedness, and is true when ordered.
 306   if (Op > ISD::SETTRUE2)
 307     Op &= ~16;     // Clear the U bit if the N bit is set.
 308
 309   // Canonicalize illegal integer setcc's.
 310   if (isInteger && Op == ISD::SETUNE)  // e.g. SETUGT | SETULT
 311     Op = ISD::SETNE;
 312
 313   return ISD::CondCode(Op);
 314 }
 315
 316 /// getSetCCAndOperation - Return the result of a logical AND between different
 317 /// comparisons of identical values: ((X op1 Y) & (X op2 Y)).  This
 318 /// function returns zero if it is not possible to represent the resultant
 319 /// comparison.
 320 ISD::CondCode ISD::getSetCCAndOperation(ISD::CondCode Op1, ISD::CondCode Op2,
 321                                         bool isInteger) {
 322   if (isInteger && (isSignedOp(Op1) | isSignedOp(Op2)) == 3)
 323     // Cannot fold a signed setcc with an unsigned setcc.
 324     return ISD::SETCC_INVALID;
 325
 326   // Combine all of the condition bits.
 327   ISD::CondCode Result = ISD::CondCode(Op1 & Op2);
 328
 329   // Canonicalize illegal integer setcc's.
 330   if (isInteger) {
 331     switch (Result) {
 332     default: break;
 333     case ISD::SETUO : Result = ISD::SETFALSE; break;  // SETUGT & SETULT
 334     case ISD::SETOEQ:                                 // SETEQ  & SETU[LG]E
 335     case ISD::SETUEQ: Result = ISD::SETEQ   ; break;  // SETUGE & SETULE
 336     case ISD::SETOLT: Result = ISD::SETULT  ; break;  // SETULT & SETNE
 337     case ISD::SETOGT: Result = ISD::SETUGT  ; break;  // SETUGT & SETNE
 338     }
 339   }
 340
 341   return Result;
 342 }
 343
 344 //===----------------------------------------------------------------------===//
 345 //                           SDNode Profile Support
 346 //===----------------------------------------------------------------------===//
 347
 348 /// AddNodeIDOpcode - Add the node opcode to the NodeID data.
 349 ///
 350 static void AddNodeIDOpcode(FoldingSetNodeID &ID, unsigned OpC)  {
 351   ID.AddInteger(OpC);
 352 }
 353
 354 /// AddNodeIDValueTypes - Value type lists are intern'd so we can represent them
 355 /// solely with their pointer.
 356 static void AddNodeIDValueTypes(FoldingSetNodeID &ID, SDVTList VTList) {
 357   ID.AddPointer(VTList.VTs);
 358 }
 359
 360 /// AddNodeIDOperands - Various routines for adding operands to the NodeID data.
 361 ///
 362 static void AddNodeIDOperands(FoldingSetNodeID &ID,
 363                               ArrayRef<SDValue> Ops) {
 364   for (auto& Op : Ops) {
 365     ID.AddPointer(Op.getNode());
 366     ID.AddInteger(Op.getResNo());
 367   }
 368 }
 369
 370 /// AddNodeIDOperands - Various routines for adding operands to the NodeID data.
 371 ///
 372 static void AddNodeIDOperands(FoldingSetNodeID &ID,
 373                               ArrayRef<SDUse> Ops) {
 374   for (auto& Op : Ops) {
 375     ID.AddPointer(Op.getNode());
 376     ID.AddInteger(Op.getResNo());
 377   }
 378 }
 379
 380 /// Add logical or fast math flag values to FoldingSetNodeID value.
 381 static void AddNodeIDFlags(FoldingSetNodeID &ID, unsigned Opcode,
 382                            const SDNodeFlags *Flags) {
 383   if (!isBinOpWithFlags(Opcode))
 384     return;
 385
 386   unsigned RawFlags = 0;
 387   if (Flags)
 388     RawFlags = Flags->getRawFlags();
 389   ID.AddInteger(RawFlags);
 390 }
 391
 392 static void AddNodeIDFlags(FoldingSetNodeID &ID, const SDNode *N) {
 393   AddNodeIDFlags(ID, N->getOpcode(), N->getFlags());
 394 }
 395
 396 static void AddNodeIDNode(FoldingSetNodeID &ID, unsigned short OpC,
 397                           SDVTList VTList, ArrayRef<SDValue> OpList) {
 398   AddNodeIDOpcode(ID, OpC);
 399   AddNodeIDValueTypes(ID, VTList);
 400   AddNodeIDOperands(ID, OpList);
 401 }
 402
 403 /// If this is an SDNode with special info, add this info to the NodeID data.
 404 static void AddNodeIDCustom(FoldingSetNodeID &ID, const SDNode *N) {
 405   switch (N->getOpcode()) {
 406   case ISD::TargetExternalSymbol:
 407   case ISD::ExternalSymbol:
 408   case ISD::MCSymbol:
 409     llvm_unreachable("Should only be used on nodes with operands");
 410   default: break;  // Normal nodes don't need extra info.
 411   case ISD::TargetConstant:
 412   case ISD::Constant: {
 413     const ConstantSDNode *C = cast<ConstantSDNode>(N);
 414     ID.AddPointer(C->getConstantIntValue());
 415     ID.AddBoolean(C->isOpaque());
 416     break;
 417   }
 418   case ISD::TargetConstantFP:
 419   case ISD::ConstantFP: {
 420     ID.AddPointer(cast<ConstantFPSDNode>(N)->getConstantFPValue());
 421     break;
 422   }
 423   case ISD::TargetGlobalAddress:
 424   case ISD::GlobalAddress:
 425   case ISD::TargetGlobalTLSAddress:
 426   case ISD::GlobalTLSAddress: {
 427     const GlobalAddressSDNode *GA = cast<GlobalAddressSDNode>(N);
 428     ID.AddPointer(GA->getGlobal());
 429     ID.AddInteger(GA->getOffset());
 430     ID.AddInteger(GA->getTargetFlags());
 431     ID.AddInteger(GA->getAddressSpace());
 432     break;
 433   }
 434   case ISD::BasicBlock:
 435     ID.AddPointer(cast<BasicBlockSDNode>(N)->getBasicBlock());
 436     break;
 437   case ISD::Register:
 438     ID.AddInteger(cast<RegisterSDNode>(N)->getReg());
 439     break;
 440   case ISD::RegisterMask:
 441     ID.AddPointer(cast<RegisterMaskSDNode>(N)->getRegMask());
 442     break;
 443   case ISD::SRCVALUE:
 444     ID.AddPointer(cast<SrcValueSDNode>(N)->getValue());
 445     break;
 446   case ISD::FrameIndex:
 447   case ISD::TargetFrameIndex:
 448     ID.AddInteger(cast<FrameIndexSDNode>(N)->getIndex());
 449     break;
 450   case ISD::JumpTable:
 451   case ISD::TargetJumpTable:
 452     ID.AddInteger(cast<JumpTableSDNode>(N)->getIndex());
 453     ID.AddInteger(cast<JumpTableSDNode>(N)->getTargetFlags());
 454     break;
 455   case ISD::ConstantPool:
 456   case ISD::TargetConstantPool: {
 457     const ConstantPoolSDNode *CP = cast<ConstantPoolSDNode>(N);
 458     ID.AddInteger(CP->getAlignment());
 459     ID.AddInteger(CP->getOffset());
 460     if (CP->isMachineConstantPoolEntry())
 461       CP->getMachineCPVal()->addSelectionDAGCSEId(ID);
 462     else
 463       ID.AddPointer(CP->getConstVal());
 464     ID.AddInteger(CP->getTargetFlags());
 465     break;
 466   }
 467   case ISD::TargetIndex: {
 468     const TargetIndexSDNode *TI = cast<TargetIndexSDNode>(N);
 469     ID.AddInteger(TI->getIndex());
 470     ID.AddInteger(TI->getOffset());
 471     ID.AddInteger(TI->getTargetFlags());
 472     break;
 473   }
 474   case ISD::LOAD: {
 475     const LoadSDNode *LD = cast<LoadSDNode>(N);
 476     ID.AddInteger(LD->getMemoryVT().getRawBits());
 477     ID.AddInteger(LD->getRawSubclassData());
 478     ID.AddInteger(LD->getPointerInfo().getAddrSpace());
 479     break;
 480   }
 481   case ISD::STORE: {
 482     const StoreSDNode *ST = cast<StoreSDNode>(N);
 483     ID.AddInteger(ST->getMemoryVT().getRawBits());
 484     ID.AddInteger(ST->getRawSubclassData());
 485     ID.AddInteger(ST->getPointerInfo().getAddrSpace());
 486     break;
 487   }
 488   case ISD::ATOMIC_CMP_SWAP:
 489   case ISD::ATOMIC_CMP_SWAP_WITH_SUCCESS:
 490   case ISD::ATOMIC_SWAP:
 491   case ISD::ATOMIC_LOAD_ADD:
 492   case ISD::ATOMIC_LOAD_SUB:
 493   case ISD::ATOMIC_LOAD_AND:
 494   case ISD::ATOMIC_LOAD_OR:
 495   case ISD::ATOMIC_LOAD_XOR:
 496   case ISD::ATOMIC_LOAD_NAND:
 497   case ISD::ATOMIC_LOAD_MIN:
 498   case ISD::ATOMIC_LOAD_MAX:
 499   case ISD::ATOMIC_LOAD_UMIN:
 500   case ISD::ATOMIC_LOAD_UMAX:
 501   case ISD::ATOMIC_LOAD:
 502   case ISD::ATOMIC_STORE: {
 503     const AtomicSDNode *AT = cast<AtomicSDNode>(N);
 504     ID.AddInteger(AT->getMemoryVT().getRawBits());
 505     ID.AddInteger(AT->getRawSubclassData());
 506     ID.AddInteger(AT->getPointerInfo().getAddrSpace());
 507     break;
 508   }
 509   case ISD::PREFETCH: {
 510     const MemSDNode *PF = cast<MemSDNode>(N);
 511     ID.AddInteger(PF->getPointerInfo().getAddrSpace());
 512     break;
 513   }
 514   case ISD::VECTOR_SHUFFLE: {
 515     const ShuffleVectorSDNode *SVN = cast<ShuffleVectorSDNode>(N);
 516     for (unsigned i = 0, e = N->getValueType(0).getVectorNumElements();
 517          i != e; ++i)
 518       ID.AddInteger(SVN->getMaskElt(i));
 519     break;
 520   }
 521   case ISD::TargetBlockAddress:
 522   case ISD::BlockAddress: {
 523     const BlockAddressSDNode *BA = cast<BlockAddressSDNode>(N);
 524     ID.AddPointer(BA->getBlockAddress());
 525     ID.AddInteger(BA->getOffset());
 526     ID.AddInteger(BA->getTargetFlags());
 527     break;
 528   }
 529   } // end switch (N->getOpcode())
 530
 531   AddNodeIDFlags(ID, N);
 532
 533   // Target specific memory nodes could also have address spaces to check.
 534   if (N->isTargetMemoryOpcode())
 535     ID.AddInteger(cast<MemSDNode>(N)->getPointerInfo().getAddrSpace());
 536 }
 537
 538 /// AddNodeIDNode - Generic routine for adding a nodes info to the NodeID
 539 /// data.
 540 static void AddNodeIDNode(FoldingSetNodeID &ID, const SDNode *N) {
 541   AddNodeIDOpcode(ID, N->getOpcode());
 542   // Add the return value info.
 543   AddNodeIDValueTypes(ID, N->getVTList());
 544   // Add the operand info.
 545   AddNodeIDOperands(ID, N->ops());
 546
 547   // Handle SDNode leafs with special info.
 548   AddNodeIDCustom(ID, N);
 549 }
 550
 551 /// encodeMemSDNodeFlags - Generic routine for computing a value for use in
 552 /// the CSE map that carries volatility, temporalness, indexing mode, and
 553 /// extension/truncation information.
 554 ///
 555 static inline unsigned
 556 encodeMemSDNodeFlags(int ConvType, ISD::MemIndexedMode AM, bool isVolatile,
 557                      bool isNonTemporal, bool isInvariant) {
 558   assert((ConvType & 3) == ConvType &&
 559          "ConvType may not require more than 2 bits!");
 560   assert((AM & 7) == AM &&
 561          "AM may not require more than 3 bits!");
 562   return ConvType |
 563          (AM << 2) |
 564          (isVolatile << 5) |
 565          (isNonTemporal << 6) |
 566          (isInvariant << 7);
 567 }
 568
 569 //===----------------------------------------------------------------------===//
 570 //                              SelectionDAG Class
 571 //===----------------------------------------------------------------------===//
 572
 573 /// doNotCSE - Return true if CSE should not be performed for this node.
 574 static bool doNotCSE(SDNode *N) {
 575   if (N->getValueType(0) == MVT::Glue)
 576     return true; // Never CSE anything that produces a flag.
 577
 578   switch (N->getOpcode()) {
 579   default: break;
 580   case ISD::HANDLENODE:
 581   case ISD::EH_LABEL:
 582     return true;   // Never CSE these nodes.
 583   }
 584
 585   // Check that remaining values produced are not flags.
 586   for (unsigned i = 1, e = N->getNumValues(); i != e; ++i)
 587     if (N->getValueType(i) == MVT::Glue)
 588       return true; // Never CSE anything that produces a flag.
 589
 590   return false;
 591 }
 592
 593 /// RemoveDeadNodes - This method deletes all unreachable nodes in the
 594 /// SelectionDAG.
 595 void SelectionDAG::RemoveDeadNodes() {
 596   // Create a dummy node (which is not added to allnodes), that adds a reference
 597   // to the root node, preventing it from being deleted.
 598   HandleSDNode Dummy(getRoot());
 599
 600   SmallVector<SDNode*, 128> DeadNodes;
 601
 602   // Add all obviously-dead nodes to the DeadNodes worklist.
 603   for (SDNode &Node : allnodes())
 604     if (Node.use_empty())
 605       DeadNodes.push_back(&Node);
 606
 607   RemoveDeadNodes(DeadNodes);
 608
 609   // If the root changed (e.g. it was a dead load, update the root).
 610   setRoot(Dummy.getValue());
 611 }
 612
 613 /// RemoveDeadNodes - This method deletes the unreachable nodes in the
 614 /// given list, and any nodes that become unreachable as a result.
 615 void SelectionDAG::RemoveDeadNodes(SmallVectorImpl<SDNode *> &DeadNodes) {
 616
 617   // Process the worklist, deleting the nodes and adding their uses to the
 618   // worklist.
 619   while (!DeadNodes.empty()) {
 620     SDNode *N = DeadNodes.pop_back_val();
 621
 622     for (DAGUpdateListener *DUL = UpdateListeners; DUL; DUL = DUL->Next)
 623       DUL->NodeDeleted(N, nullptr);
 624
 625     // Take the node out of the appropriate CSE map.
 626     RemoveNodeFromCSEMaps(N);
 627
 628     // Next, brutally remove the operand list.  This is safe to do, as there are
 629     // no cycles in the graph.
 630     for (SDNode::op_iterator I = N->op_begin(), E = N->op_end(); I != E; ) {
 631       SDUse &Use = *I++;
 632       SDNode *Operand = Use.getNode();
 633       Use.set(SDValue());
 634
 635       // Now that we removed this operand, see if there are no uses of it left.
 636       if (Operand->use_empty())
 637         DeadNodes.push_back(Operand);
 638     }
 639
 640     DeallocateNode(N);
 641   }
 642 }
 643
 644 void SelectionDAG::RemoveDeadNode(SDNode *N){
 645   SmallVector<SDNode*, 16> DeadNodes(1, N);
 646
 647   // Create a dummy node that adds a reference to the root node, preventing
 648   // it from being deleted.  (This matters if the root is an operand of the
 649   // dead node.)
 650   HandleSDNode Dummy(getRoot());
 651
 652   RemoveDeadNodes(DeadNodes);
 653 }
 654
 655 void SelectionDAG::DeleteNode(SDNode *N) {
 656   // First take this out of the appropriate CSE map.
 657   RemoveNodeFromCSEMaps(N);
 658
 659   // Finally, remove uses due to operands of this node, remove from the
 660   // AllNodes list, and delete the node.
 661   DeleteNodeNotInCSEMaps(N);
 662 }
 663
 664 void SelectionDAG::DeleteNodeNotInCSEMaps(SDNode *N) {
 665   assert(N != AllNodes.begin() && "Cannot delete the entry node!");
 666   assert(N->use_empty() && "Cannot delete a node that is not dead!");
 667
 668   // Drop all of the operands and decrement used node's use counts.
 669   N->DropOperands();
 670
 671   DeallocateNode(N);
 672 }
 673
 674 void SDDbgInfo::erase(const SDNode *Node) {
 675   DbgValMapType::iterator I = DbgValMap.find(Node);
 676   if (I == DbgValMap.end())
 677     return;
 678   for (auto &Val: I->second)
 679     Val->setIsInvalidated();
 680   DbgValMap.erase(I);
 681 }
 682
 683 void SelectionDAG::DeallocateNode(SDNode *N) {
 684   if (N->OperandsNeedDelete)
 685     delete[] N->OperandList;
 686
 687   // Set the opcode to DELETED_NODE to help catch bugs when node
 688   // memory is reallocated.
 689   N->NodeType = ISD::DELETED_NODE;
 690
 691   NodeAllocator.Deallocate(AllNodes.remove(N));
 692
 693   // If any of the SDDbgValue nodes refer to this SDNode, invalidate
 694   // them and forget about that node.
 695   DbgInfo->erase(N);
 696 }
 697
 698 #ifndef NDEBUG
 699 /// VerifySDNode - Sanity check the given SDNode.  Aborts if it is invalid.
 700 static void VerifySDNode(SDNode *N) {
 701   switch (N->getOpcode()) {
 702   default:
 703     break;
 704   case ISD::BUILD_PAIR: {
 705     EVT VT = N->getValueType(0);
 706     assert(N->getNumValues() == 1 && "Too many results!");
 707     assert(!VT.isVector() && (VT.isInteger() || VT.isFloatingPoint()) &&
 708            "Wrong return type!");
 709     assert(N->getNumOperands() == 2 && "Wrong number of operands!");
 710     assert(N->getOperand(0).getValueType() == N->getOperand(1).getValueType() &&
 711            "Mismatched operand types!");
 712     assert(N->getOperand(0).getValueType().isInteger() == VT.isInteger() &&
 713            "Wrong operand type!");
 714     assert(VT.getSizeInBits() == 2 * N->getOperand(0).getValueSizeInBits() &&
 715            "Wrong return type size");
 716     break;
 717   }
 718   case ISD::BUILD_VECTOR: {
 719     assert(N->getNumValues() == 1 && "Too many results!");
 720     assert(N->getValueType(0).isVector() && "Wrong return type!");
 721     assert(N->getNumOperands() == N->getValueType(0).getVectorNumElements() &&
 722            "Wrong number of operands!");
 723     EVT EltVT = N->getValueType(0).getVectorElementType();
 724     for (SDNode::op_iterator I = N->op_begin(), E = N->op_end(); I != E; ++I) {
 725       assert((I->getValueType() == EltVT ||
 726              (EltVT.isInteger() && I->getValueType().isInteger() &&
 727               EltVT.bitsLE(I->getValueType()))) &&
 728             "Wrong operand type!");
 729       assert(I->getValueType() == N->getOperand(0).getValueType() &&
 730              "Operands must all have the same type");
 731     }
 732     break;
 733   }
 734   }
 735 }
 736 #endif // NDEBUG
 737
 738 /// \brief Insert a newly allocated node into the DAG.
 739 ///
 740 /// Handles insertion into the all nodes list and CSE map, as well as
 741 /// verification and other common operations when a new node is allocated.
 742 void SelectionDAG::InsertNode(SDNode *N) {
 743   AllNodes.push_back(N);
 744 #ifndef NDEBUG
 745   N->PersistentId = NextPersistentId++;
 746   VerifySDNode(N);
 747 #endif
 748 }
 749
 750 /// RemoveNodeFromCSEMaps - Take the specified node out of the CSE map that
 751 /// correspond to it.  This is useful when we're about to delete or repurpose
 752 /// the node.  We don't want future request for structurally identical nodes
 753 /// to return N anymore.
 754 bool SelectionDAG::RemoveNodeFromCSEMaps(SDNode *N) {
 755   bool Erased = false;
 756   switch (N->getOpcode()) {
 757   case ISD::HANDLENODE: return false;  // noop.
 758   case ISD::CONDCODE:
 759     assert(CondCodeNodes[cast<CondCodeSDNode>(N)->get()] &&
 760            "Cond code doesn't exist!");
 761     Erased = CondCodeNodes[cast<CondCodeSDNode>(N)->get()] != nullptr;
 762     CondCodeNodes[cast<CondCodeSDNode>(N)->get()] = nullptr;
 763     break;
 764   case ISD::ExternalSymbol:
 765     Erased = ExternalSymbols.erase(cast<ExternalSymbolSDNode>(N)->getSymbol());
 766     break;
 767   case ISD::TargetExternalSymbol: {
 768     ExternalSymbolSDNode *ESN = cast<ExternalSymbolSDNode>(N);
 769     Erased = TargetExternalSymbols.erase(
 770                std::pair<std::string,unsigned char>(ESN->getSymbol(),
 771                                                     ESN->getTargetFlags()));
 772     break;
 773   }
 774   case ISD::MCSymbol: {
 775     auto *MCSN = cast<MCSymbolSDNode>(N);
 776     Erased = MCSymbols.erase(MCSN->getMCSymbol());
 777     break;
 778   }
 779   case ISD::VALUETYPE: {
 780     EVT VT = cast<VTSDNode>(N)->getVT();
 781     if (VT.isExtended()) {
 782       Erased = ExtendedValueTypeNodes.erase(VT);
 783     } else {
 784       Erased = ValueTypeNodes[VT.getSimpleVT().SimpleTy] != nullptr;
 785       ValueTypeNodes[VT.getSimpleVT().SimpleTy] = nullptr;
 786     }
 787     break;
 788   }
 789   default:
 790     // Remove it from the CSE Map.
 791     assert(N->getOpcode() != ISD::DELETED_NODE && "DELETED_NODE in CSEMap!");
 792     assert(N->getOpcode() != ISD::EntryToken && "EntryToken in CSEMap!");
 793     Erased = CSEMap.RemoveNode(N);
 794     break;
 795   }
 796 #ifndef NDEBUG
 797   // Verify that the node was actually in one of the CSE maps, unless it has a
 798   // flag result (which cannot be CSE'd) or is one of the special cases that are
 799   // not subject to CSE.
 800   if (!Erased && N->getValueType(N->getNumValues()-1) != MVT::Glue &&
 801       !N->isMachineOpcode() && !doNotCSE(N)) {
 802     N->dump(this);
 803     dbgs() << "\n";
 804     llvm_unreachable("Node is not in map!");
 805   }
 806 #endif
 807   return Erased;
 808 }
 809
 810 /// AddModifiedNodeToCSEMaps - The specified node has been removed from the CSE
 811 /// maps and modified in place. Add it back to the CSE maps, unless an identical
 812 /// node already exists, in which case transfer all its users to the existing
 813 /// node. This transfer can potentially trigger recursive merging.
 814 ///
 815 void
 816 SelectionDAG::AddModifiedNodeToCSEMaps(SDNode *N) {
 817   // For node types that aren't CSE'd, just act as if no identical node
 818   // already exists.
 819   if (!doNotCSE(N)) {
 820     SDNode *Existing = CSEMap.GetOrInsertNode(N);
 821     if (Existing != N) {
 822       // If there was already an existing matching node, use ReplaceAllUsesWith
 823       // to replace the dead one with the existing one.  This can cause
 824       // recursive merging of other unrelated nodes down the line.
 825       ReplaceAllUsesWith(N, Existing);
 826
 827       // N is now dead. Inform the listeners and delete it.
 828       for (DAGUpdateListener *DUL = UpdateListeners; DUL; DUL = DUL->Next)
 829         DUL->NodeDeleted(N, Existing);
 830       DeleteNodeNotInCSEMaps(N);
 831       return;
 832     }
 833   }
 834
 835   // If the node doesn't already exist, we updated it.  Inform listeners.
 836   for (DAGUpdateListener *DUL = UpdateListeners; DUL; DUL = DUL->Next)
 837     DUL->NodeUpdated(N);
 838 }
 839
 840 /// FindModifiedNodeSlot - Find a slot for the specified node if its operands
 841 /// were replaced with those specified.  If this node is never memoized,
 842 /// return null, otherwise return a pointer to the slot it would take.  If a
 843 /// node already exists with these operands, the slot will be non-null.
 844 SDNode *SelectionDAG::FindModifiedNodeSlot(SDNode *N, SDValue Op,
 845                                            void *&InsertPos) {
 846   if (doNotCSE(N))
 847     return nullptr;
 848
 849   SDValue Ops[] = { Op };
 850   FoldingSetNodeID ID;
 851   AddNodeIDNode(ID, N->getOpcode(), N->getVTList(), Ops);
 852   AddNodeIDCustom(ID, N);
 853   SDNode *Node = FindNodeOrInsertPos(ID, N->getDebugLoc(), InsertPos);
 854   return Node;
 855 }
 856
 857 /// FindModifiedNodeSlot - Find a slot for the specified node if its operands
 858 /// were replaced with those specified.  If this node is never memoized,
 859 /// return null, otherwise return a pointer to the slot it would take.  If a
 860 /// node already exists with these operands, the slot will be non-null.
 861 SDNode *SelectionDAG::FindModifiedNodeSlot(SDNode *N,
 862                                            SDValue Op1, SDValue Op2,
 863                                            void *&InsertPos) {
 864   if (doNotCSE(N))
 865     return nullptr;
 866
 867   SDValue Ops[] = { Op1, Op2 };
 868   FoldingSetNodeID ID;
 869   AddNodeIDNode(ID, N->getOpcode(), N->getVTList(), Ops);
 870   AddNodeIDCustom(ID, N);
 871   SDNode *Node = FindNodeOrInsertPos(ID, N->getDebugLoc(), InsertPos);
 872   return Node;
 873 }
 874
 875
 876 /// FindModifiedNodeSlot - Find a slot for the specified node if its operands
 877 /// were replaced with those specified.  If this node is never memoized,
 878 /// return null, otherwise return a pointer to the slot it would take.  If a
 879 /// node already exists with these operands, the slot will be non-null.
 880 SDNode *SelectionDAG::FindModifiedNodeSlot(SDNode *N, ArrayRef<SDValue> Ops,
 881                                            void *&InsertPos) {
 882   if (doNotCSE(N))
 883     return nullptr;
 884
 885   FoldingSetNodeID ID;
 886   AddNodeIDNode(ID, N->getOpcode(), N->getVTList(), Ops);
 887   AddNodeIDCustom(ID, N);
 888   SDNode *Node = FindNodeOrInsertPos(ID, N->getDebugLoc(), InsertPos);
 889   return Node;
 890 }
 891
 892 /// getEVTAlignment - Compute the default alignment value for the
 893 /// given type.
 894 ///
 895 unsigned SelectionDAG::getEVTAlignment(EVT VT) const {
 896   Type *Ty = VT == MVT::iPTR ?
 897                    PointerType::get(Type::getInt8Ty(*getContext()), 0) :
 898                    VT.getTypeForEVT(*getContext());
 899
 900   return getDataLayout().getABITypeAlignment(Ty);
 901 }
 902
 903 // EntryNode could meaningfully have debug info if we can find it...
 904 SelectionDAG::SelectionDAG(const TargetMachine &tm, CodeGenOpt::Level OL)
 905     : TM(tm), TSI(nullptr), TLI(nullptr), OptLevel(OL),
 906       EntryNode(ISD::EntryToken, 0, DebugLoc(), getVTList(MVT::Other)),
 907       Root(getEntryNode()), NewNodesMustHaveLegalTypes(false),
 908       UpdateListeners(nullptr) {
 909   InsertNode(&EntryNode);
 910   DbgInfo = new SDDbgInfo();
 911 }
 912
 913 void SelectionDAG::init(MachineFunction &mf) {
 914   MF = &mf;
 915   TLI = getSubtarget().getTargetLowering();
 916   TSI = getSubtarget().getSelectionDAGInfo();
 917   Context = &mf.getFunction()->getContext();
 918 }
 919
 920 SelectionDAG::~SelectionDAG() {
 921   assert(!UpdateListeners && "Dangling registered DAGUpdateListeners");
 922   allnodes_clear();
 923   delete DbgInfo;
 924 }
 925
 926 void SelectionDAG::allnodes_clear() {
 927   assert(&*AllNodes.begin() == &EntryNode);
 928   AllNodes.remove(AllNodes.begin());
 929   while (!AllNodes.empty())
 930     DeallocateNode(&AllNodes.front());
 931 #ifndef NDEBUG
 932   NextPersistentId = 0;
 933 #endif
 934 }
 935
 936 BinarySDNode *SelectionDAG::GetBinarySDNode(unsigned Opcode, SDLoc DL,
 937                                             SDVTList VTs, SDValue N1,
 938                                             SDValue N2,
 939                                             const SDNodeFlags *Flags) {
 940   if (isBinOpWithFlags(Opcode)) {
 941     // If no flags were passed in, use a default flags object.
 942     SDNodeFlags F;
 943     if (Flags == nullptr)
 944       Flags = &F;
 945
 946     BinaryWithFlagsSDNode *FN = new (NodeAllocator) BinaryWithFlagsSDNode(
 947         Opcode, DL.getIROrder(), DL.getDebugLoc(), VTs, N1, N2, *Flags);
 948
 949     return FN;
 950   }
 951
 952   BinarySDNode *N = new (NodeAllocator)
 953       BinarySDNode(Opcode, DL.getIROrder(), DL.getDebugLoc(), VTs, N1, N2);
 954   return N;
 955 }
 956
 957 SDNode *SelectionDAG::FindNodeOrInsertPos(const FoldingSetNodeID &ID,
 958                                           void *&InsertPos) {
 959   SDNode *N = CSEMap.FindNodeOrInsertPos(ID, InsertPos);
 960   if (N) {
 961     switch (N->getOpcode()) {
 962     default: break;
 963     case ISD::Constant:
 964     case ISD::ConstantFP:
 965       llvm_unreachable("Querying for Constant and ConstantFP nodes requires "
 966                        "debug location.  Use another overload.");
 967     }
 968   }
 969   return N;
 970 }
 971
 972 SDNode *SelectionDAG::FindNodeOrInsertPos(const FoldingSetNodeID &ID,
 973                                           DebugLoc DL, void *&InsertPos) {
 974   SDNode *N = CSEMap.FindNodeOrInsertPos(ID, InsertPos);
 975   if (N) {
 976     switch (N->getOpcode()) {
 977     default: break; // Process only regular (non-target) constant nodes.
 978     case ISD::Constant:
 979     case ISD::ConstantFP:
 980       // Erase debug location from the node if the node is used at several
 981       // different places to do not propagate one location to all uses as it
 982       // leads to incorrect debug info.
 983       if (N->getDebugLoc() != DL)
 984         N->setDebugLoc(DebugLoc());
 985       break;
 986     }
 987   }
 988   return N;
 989 }
 990
 991 void SelectionDAG::clear() {
 992   allnodes_clear();
 993   OperandAllocator.Reset();
 994   CSEMap.clear();
 995
 996   ExtendedValueTypeNodes.clear();
 997   ExternalSymbols.clear();
 998   TargetExternalSymbols.clear();
 999   MCSymbols.clear();
1000   std::fill(CondCodeNodes.begin(), CondCodeNodes.end(),
1001             static_cast<CondCodeSDNode*>(nullptr));
1002   std::fill(ValueTypeNodes.begin(), ValueTypeNodes.end(),
1003             static_cast<SDNode*>(nullptr));
1004
1005   EntryNode.UseList = nullptr;
1006   InsertNode(&EntryNode);
1007   Root = getEntryNode();
1008   DbgInfo->clear();
1009 }
1010
1011 SDValue SelectionDAG::getAnyExtOrTrunc(SDValue Op, SDLoc DL, EVT VT) {
1012   return VT.bitsGT(Op.getValueType()) ?
1013     getNode(ISD::ANY_EXTEND, DL, VT, Op) :
1014     getNode(ISD::TRUNCATE, DL, VT, Op);
1015 }
1016
1017 SDValue SelectionDAG::getSExtOrTrunc(SDValue Op, SDLoc DL, EVT VT) {
1018   return VT.bitsGT(Op.getValueType()) ?
1019     getNode(ISD::SIGN_EXTEND, DL, VT, Op) :
1020     getNode(ISD::TRUNCATE, DL, VT, Op);
1021 }
1022
1023 SDValue SelectionDAG::getZExtOrTrunc(SDValue Op, SDLoc DL, EVT VT) {
1024   return VT.bitsGT(Op.getValueType()) ?
1025     getNode(ISD::ZERO_EXTEND, DL, VT, Op) :
1026     getNode(ISD::TRUNCATE, DL, VT, Op);
1027 }
1028
1029 SDValue SelectionDAG::getBoolExtOrTrunc(SDValue Op, SDLoc SL, EVT VT,
1030                                         EVT OpVT) {
1031   if (VT.bitsLE(Op.getValueType()))
1032     return getNode(ISD::TRUNCATE, SL, VT, Op);
1033
1034   TargetLowering::BooleanContent BType = TLI->getBooleanContents(OpVT);
1035   return getNode(TLI->getExtendForContent(BType), SL, VT, Op);
1036 }
1037
1038 SDValue SelectionDAG::getZeroExtendInReg(SDValue Op, SDLoc DL, EVT VT) {
1039   assert(!VT.isVector() &&
1040          "getZeroExtendInReg should use the vector element type instead of "
1041          "the vector type!");
1042   if (Op.getValueType() == VT) return Op;
1043   unsigned BitWidth = Op.getValueType().getScalarType().getSizeInBits();
1044   APInt Imm = APInt::getLowBitsSet(BitWidth,
1045                                    VT.getSizeInBits());
1046   return getNode(ISD::AND, DL, Op.getValueType(), Op,
1047                  getConstant(Imm, DL, Op.getValueType()));
1048 }
1049
1050 SDValue SelectionDAG::getAnyExtendVectorInReg(SDValue Op, SDLoc DL, EVT VT) {
1051   assert(VT.isVector() && "This DAG node is restricted to vector types.");
1052   assert(VT.getSizeInBits() == Op.getValueType().getSizeInBits() &&
1053          "The sizes of the input and result must match in order to perform the "
1054          "extend in-register.");
1055   assert(VT.getVectorNumElements() < Op.getValueType().getVectorNumElements() &&
1056          "The destination vector type must have fewer lanes than the input.");
1057   return getNode(ISD::ANY_EXTEND_VECTOR_INREG, DL, VT, Op);
1058 }
1059
1060 SDValue SelectionDAG::getSignExtendVectorInReg(SDValue Op, SDLoc DL, EVT VT) {
1061   assert(VT.isVector() && "This DAG node is restricted to vector types.");
1062   assert(VT.getSizeInBits() == Op.getValueType().getSizeInBits() &&
1063          "The sizes of the input and result must match in order to perform the "
1064          "extend in-register.");
1065   assert(VT.getVectorNumElements() < Op.getValueType().getVectorNumElements() &&
1066          "The destination vector type must have fewer lanes than the input.");
1067   return getNode(ISD::SIGN_EXTEND_VECTOR_INREG, DL, VT, Op);
1068 }
1069
1070 SDValue SelectionDAG::getZeroExtendVectorInReg(SDValue Op, SDLoc DL, EVT VT) {
1071   assert(VT.isVector() && "This DAG node is restricted to vector types.");
1072   assert(VT.getSizeInBits() == Op.getValueType().getSizeInBits() &&
1073          "The sizes of the input and result must match in order to perform the "
1074          "extend in-register.");
1075   assert(VT.getVectorNumElements() < Op.getValueType().getVectorNumElements() &&
1076          "The destination vector type must have fewer lanes than the input.");
1077   return getNode(ISD::ZERO_EXTEND_VECTOR_INREG, DL, VT, Op);
1078 }
1079
1080 /// getNOT - Create a bitwise NOT operation as (XOR Val, -1).
1081 ///
1082 SDValue SelectionDAG::getNOT(SDLoc DL, SDValue Val, EVT VT) {
1083   EVT EltVT = VT.getScalarType();
1084   SDValue NegOne =
1085     getConstant(APInt::getAllOnesValue(EltVT.getSizeInBits()), DL, VT);
1086   return getNode(ISD::XOR, DL, VT, Val, NegOne);
1087 }
1088
1089 SDValue SelectionDAG::getLogicalNOT(SDLoc DL, SDValue Val, EVT VT) {
1090   EVT EltVT = VT.getScalarType();
1091   SDValue TrueValue;
1092   switch (TLI->getBooleanContents(VT)) {
1093     case TargetLowering::ZeroOrOneBooleanContent:
1094     case TargetLowering::UndefinedBooleanContent:
1095       TrueValue = getConstant(1, DL, VT);
1096       break;
1097     case TargetLowering::ZeroOrNegativeOneBooleanContent:
1098       TrueValue = getConstant(APInt::getAllOnesValue(EltVT.getSizeInBits()), DL,
1099                               VT);
1100       break;
1101   }
1102   return getNode(ISD::XOR, DL, VT, Val, TrueValue);
1103 }
1104
1105 SDValue SelectionDAG::getConstant(uint64_t Val, SDLoc DL, EVT VT, bool isT,
1106                                   bool isO) {
1107   EVT EltVT = VT.getScalarType();
1108   assert((EltVT.getSizeInBits() >= 64 ||
1109          (uint64_t)((int64_t)Val >> EltVT.getSizeInBits()) + 1 < 2) &&
1110          "getConstant with a uint64_t value that doesn't fit in the type!");
1111   return getConstant(APInt(EltVT.getSizeInBits(), Val), DL, VT, isT, isO);
1112 }
1113
1114 SDValue SelectionDAG::getConstant(const APInt &Val, SDLoc DL, EVT VT, bool isT,
1115                                   bool isO)
1116 {
1117   return getConstant(*ConstantInt::get(*Context, Val), DL, VT, isT, isO);
1118 }
1119
1120 SDValue SelectionDAG::getConstant(const ConstantInt &Val, SDLoc DL, EVT VT,
1121                                   bool isT, bool isO) {
1122   assert(VT.isInteger() && "Cannot create FP integer constant!");
1123
1124   EVT EltVT = VT.getScalarType();
1125   const ConstantInt *Elt = &Val;
1126
1127   // In some cases the vector type is legal but the element type is illegal and
1128   // needs to be promoted, for example v8i8 on ARM.  In this case, promote the
1129   // inserted value (the type does not need to match the vector element type).
1130   // Any extra bits introduced will be truncated away.
1131   if (VT.isVector() && TLI->getTypeAction(*getContext(), EltVT) ==
1132       TargetLowering::TypePromoteInteger) {
1133    EltVT = TLI->getTypeToTransformTo(*getContext(), EltVT);
1134    APInt NewVal = Elt->getValue().zext(EltVT.getSizeInBits());
1135    Elt = ConstantInt::get(*getContext(), NewVal);
1136   }
1137   // In other cases the element type is illegal and needs to be expanded, for
1138   // example v2i64 on MIPS32. In this case, find the nearest legal type, split
1139   // the value into n parts and use a vector type with n-times the elements.
1140   // Then bitcast to the type requested.
1141   // Legalizing constants too early makes the DAGCombiner's job harder so we
1142   // only legalize if the DAG tells us we must produce legal types.
1143   else if (NewNodesMustHaveLegalTypes && VT.isVector() &&
1144            TLI->getTypeAction(*getContext(), EltVT) ==
1145            TargetLowering::TypeExpandInteger) {
1146     APInt NewVal = Elt->getValue();
1147     EVT ViaEltVT = TLI->getTypeToTransformTo(*getContext(), EltVT);
1148     unsigned ViaEltSizeInBits = ViaEltVT.getSizeInBits();
1149     unsigned ViaVecNumElts = VT.getSizeInBits() / ViaEltSizeInBits;
1150     EVT ViaVecVT = EVT::getVectorVT(*getContext(), ViaEltVT, ViaVecNumElts);
1151
1152     // Check the temporary vector is the correct size. If this fails then
1153     // getTypeToTransformTo() probably returned a type whose size (in bits)
1154     // isn't a power-of-2 factor of the requested type size.
1155     assert(ViaVecVT.getSizeInBits() == VT.getSizeInBits());
1156
1157     SmallVector<SDValue, 2> EltParts;
1158     for (unsigned i = 0; i < ViaVecNumElts / VT.getVectorNumElements(); ++i) {
1159       EltParts.push_back(getConstant(NewVal.lshr(i * ViaEltSizeInBits)
1160                                            .trunc(ViaEltSizeInBits), DL,
1161                                      ViaEltVT, isT, isO));
1162     }
1163
1164     // EltParts is currently in little endian order. If we actually want
1165     // big-endian order then reverse it now.
1166     if (getDataLayout().isBigEndian())
1167       std::reverse(EltParts.begin(), EltParts.end());
1168
1169     // The elements must be reversed when the element order is different
1170     // to the endianness of the elements (because the BITCAST is itself a
1171     // vector shuffle in this situation). However, we do not need any code to
1172     // perform this reversal because getConstant() is producing a vector
1173     // splat.
1174     // This situation occurs in MIPS MSA.
1175
1176     SmallVector<SDValue, 8> Ops;
1177     for (unsigned i = 0; i < VT.getVectorNumElements(); ++i)
1178       Ops.insert(Ops.end(), EltParts.begin(), EltParts.end());
1179
1180     SDValue Result = getNode(ISD::BITCAST, SDLoc(), VT,
1181                              getNode(ISD::BUILD_VECTOR, SDLoc(), ViaVecVT,
1182                                      Ops));
1183     return Result;
1184   }
1185
1186   assert(Elt->getBitWidth() == EltVT.getSizeInBits() &&
1187          "APInt size does not match type size!");
1188   unsigned Opc = isT ? ISD::TargetConstant : ISD::Constant;
1189   FoldingSetNodeID ID;
1190   AddNodeIDNode(ID, Opc, getVTList(EltVT), None);
1191   ID.AddPointer(Elt);
1192   ID.AddBoolean(isO);
1193   void *IP = nullptr;
1194   SDNode *N = nullptr;
1195   if ((N = FindNodeOrInsertPos(ID, DL.getDebugLoc(), IP)))
1196     if (!VT.isVector())
1197       return SDValue(N, 0);
1198
1199   if (!N) {
1200     N = new (NodeAllocator) ConstantSDNode(isT, isO, Elt, DL.getDebugLoc(),
1201                                            EltVT);
1202     CSEMap.InsertNode(N, IP);
1203     InsertNode(N);
1204   }
1205
1206   SDValue Result(N, 0);
1207   if (VT.isVector()) {
1208     SmallVector<SDValue, 8> Ops;
1209     Ops.assign(VT.getVectorNumElements(), Result);
1210     Result = getNode(ISD::BUILD_VECTOR, SDLoc(), VT, Ops);
1211   }
1212   return Result;
1213 }
1214
1215 SDValue SelectionDAG::getIntPtrConstant(uint64_t Val, SDLoc DL, bool isTarget) {
1216   return getConstant(Val, DL, TLI->getPointerTy(getDataLayout()), isTarget);
1217 }
1218
1219 SDValue SelectionDAG::getConstantFP(const APFloat& V, SDLoc DL, EVT VT,
1220                                     bool isTarget) {
1221   return getConstantFP(*ConstantFP::get(*getContext(), V), DL, VT, isTarget);
1222 }
1223
1224 SDValue SelectionDAG::getConstantFP(const ConstantFP& V, SDLoc DL, EVT VT,
1225                                     bool isTarget){
1226   assert(VT.isFloatingPoint() && "Cannot create integer FP constant!");
1227
1228   EVT EltVT = VT.getScalarType();
1229
1230   // Do the map lookup using the actual bit pattern for the floating point
1231   // value, so that we don't have problems with 0.0 comparing equal to -0.0, and
1232   // we don't have issues with SNANs.
1233   unsigned Opc = isTarget ? ISD::TargetConstantFP : ISD::ConstantFP;
1234   FoldingSetNodeID ID;
1235   AddNodeIDNode(ID, Opc, getVTList(EltVT), None);
1236   ID.AddPointer(&V);
1237   void *IP = nullptr;
1238   SDNode *N = nullptr;
1239   if ((N = FindNodeOrInsertPos(ID, DL.getDebugLoc(), IP)))
1240     if (!VT.isVector())
1241       return SDValue(N, 0);
1242
1243   if (!N) {
1244     N = new (NodeAllocator) ConstantFPSDNode(isTarget, &V, DL.getDebugLoc(),
1245                                              EltVT);
1246     CSEMap.InsertNode(N, IP);
1247     InsertNode(N);
1248   }
1249
1250   SDValue Result(N, 0);
1251   if (VT.isVector()) {
1252     SmallVector<SDValue, 8> Ops;
1253     Ops.assign(VT.getVectorNumElements(), Result);
1254     Result = getNode(ISD::BUILD_VECTOR, SDLoc(), VT, Ops);
1255   }
1256   return Result;
1257 }
1258
1259 SDValue SelectionDAG::getConstantFP(double Val, SDLoc DL, EVT VT,
1260                                     bool isTarget) {
1261   EVT EltVT = VT.getScalarType();
1262   if (EltVT==MVT::f32)
1263     return getConstantFP(APFloat((float)Val), DL, VT, isTarget);
1264   else if (EltVT==MVT::f64)
1265     return getConstantFP(APFloat(Val), DL, VT, isTarget);
1266   else if (EltVT==MVT::f80 || EltVT==MVT::f128 || EltVT==MVT::ppcf128 ||
1267            EltVT==MVT::f16) {
1268     bool ignored;
1269     APFloat apf = APFloat(Val);
1270     apf.convert(EVTToAPFloatSemantics(EltVT), APFloat::rmNearestTiesToEven,
1271                 &ignored);
1272     return getConstantFP(apf, DL, VT, isTarget);
1273   } else
1274     llvm_unreachable("Unsupported type in getConstantFP");
1275 }
1276
1277 SDValue SelectionDAG::getGlobalAddress(const GlobalValue *GV, SDLoc DL,
1278                                        EVT VT, int64_t Offset,
1279                                        bool isTargetGA,
1280                                        unsigned char TargetFlags) {
1281   assert((TargetFlags == 0 || isTargetGA) &&
1282          "Cannot set target flags on target-independent globals");
1283
1284   // Truncate (with sign-extension) the offset value to the pointer size.
1285   unsigned BitWidth = getDataLayout().getPointerTypeSizeInBits(GV->getType());
1286   if (BitWidth < 64)
1287     Offset = SignExtend64(Offset, BitWidth);
1288
1289   unsigned Opc;
1290   if (GV->isThreadLocal())
1291     Opc = isTargetGA ? ISD::TargetGlobalTLSAddress : ISD::GlobalTLSAddress;
1292   else
1293     Opc = isTargetGA ? ISD::TargetGlobalAddress : ISD::GlobalAddress;
1294
1295   FoldingSetNodeID ID;
1296   AddNodeIDNode(ID, Opc, getVTList(VT), None);
1297   ID.AddPointer(GV);
1298   ID.AddInteger(Offset);
1299   ID.AddInteger(TargetFlags);
1300   ID.AddInteger(GV->getType()->getAddressSpace());
1301   void *IP = nullptr;
1302   if (SDNode *E = FindNodeOrInsertPos(ID, DL.getDebugLoc(), IP))
1303     return SDValue(E, 0);
1304
1305   SDNode *N = new (NodeAllocator) GlobalAddressSDNode(Opc, DL.getIROrder(),
1306                                                       DL.getDebugLoc(), GV, VT,
1307                                                       Offset, TargetFlags);
1308   CSEMap.InsertNode(N, IP);
1309     InsertNode(N);
1310   return SDValue(N, 0);
1311 }
1312
1313 SDValue SelectionDAG::getFrameIndex(int FI, EVT VT, bool isTarget) {
1314   unsigned Opc = isTarget ? ISD::TargetFrameIndex : ISD::FrameIndex;
1315   FoldingSetNodeID ID;
1316   AddNodeIDNode(ID, Opc, getVTList(VT), None);
1317   ID.AddInteger(FI);
1318   void *IP = nullptr;
1319   if (SDNode *E = FindNodeOrInsertPos(ID, IP))
1320     return SDValue(E, 0);
1321
1322   SDNode *N = new (NodeAllocator) FrameIndexSDNode(FI, VT, isTarget);
1323   CSEMap.InsertNode(N, IP);
1324   InsertNode(N);
1325   return SDValue(N, 0);
1326 }
1327
1328 SDValue SelectionDAG::getJumpTable(int JTI, EVT VT, bool isTarget,
1329                                    unsigned char TargetFlags) {
1330   assert((TargetFlags == 0 || isTarget) &&
1331          "Cannot set target flags on target-independent jump tables");
1332   unsigned Opc = isTarget ? ISD::TargetJumpTable : ISD::JumpTable;
1333   FoldingSetNodeID ID;
1334   AddNodeIDNode(ID, Opc, getVTList(VT), None);
1335   ID.AddInteger(JTI);
1336   ID.AddInteger(TargetFlags);
1337   void *IP = nullptr;
1338   if (SDNode *E = FindNodeOrInsertPos(ID, IP))
1339     return SDValue(E, 0);
1340
1341   SDNode *N = new (NodeAllocator) JumpTableSDNode(JTI, VT, isTarget,
1342                                                   TargetFlags);
1343   CSEMap.InsertNode(N, IP);
1344   InsertNode(N);
1345   return SDValue(N, 0);
1346 }
1347
1348 SDValue SelectionDAG::getConstantPool(const Constant *C, EVT VT,
1349                                       unsigned Alignment, int Offset,
1350                                       bool isTarget,
1351                                       unsigned char TargetFlags) {
1352   assert((TargetFlags == 0 || isTarget) &&
1353          "Cannot set target flags on target-independent globals");
1354   if (Alignment == 0)
1355     Alignment = getDataLayout().getPrefTypeAlignment(C->getType());
1356   unsigned Opc = isTarget ? ISD::TargetConstantPool : ISD::ConstantPool;
1357   FoldingSetNodeID ID;
1358   AddNodeIDNode(ID, Opc, getVTList(VT), None);
1359   ID.AddInteger(Alignment);
1360   ID.AddInteger(Offset);
1361   ID.AddPointer(C);
1362   ID.AddInteger(TargetFlags);
1363   void *IP = nullptr;
1364   if (SDNode *E = FindNodeOrInsertPos(ID, IP))
1365     return SDValue(E, 0);
1366
1367   SDNode *N = new (NodeAllocator) ConstantPoolSDNode(isTarget, C, VT, Offset,
1368                                                      Alignment, TargetFlags);
1369   CSEMap.InsertNode(N, IP);
1370   InsertNode(N);
1371   return SDValue(N, 0);
1372 }
1373
1374
1375 SDValue SelectionDAG::getConstantPool(MachineConstantPoolValue *C, EVT VT,
1376                                       unsigned Alignment, int Offset,
1377                                       bool isTarget,
1378                                       unsigned char TargetFlags) {
1379   assert((TargetFlags == 0 || isTarget) &&
1380          "Cannot set target flags on target-independent globals");
1381   if (Alignment == 0)
1382     Alignment = getDataLayout().getPrefTypeAlignment(C->getType());
1383   unsigned Opc = isTarget ? ISD::TargetConstantPool : ISD::ConstantPool;
1384   FoldingSetNodeID ID;
1385   AddNodeIDNode(ID, Opc, getVTList(VT), None);
1386   ID.AddInteger(Alignment);
1387   ID.AddInteger(Offset);
1388   C->addSelectionDAGCSEId(ID);
1389   ID.AddInteger(TargetFlags);
1390   void *IP = nullptr;
1391   if (SDNode *E = FindNodeOrInsertPos(ID, IP))
1392     return SDValue(E, 0);
1393
1394   SDNode *N = new (NodeAllocator) ConstantPoolSDNode(isTarget, C, VT, Offset,
1395                                                      Alignment, TargetFlags);
1396   CSEMap.InsertNode(N, IP);
1397   InsertNode(N);
1398   return SDValue(N, 0);
1399 }
1400
1401 SDValue SelectionDAG::getTargetIndex(int Index, EVT VT, int64_t Offset,
1402                                      unsigned char TargetFlags) {
1403   FoldingSetNodeID ID;
1404   AddNodeIDNode(ID, ISD::TargetIndex, getVTList(VT), None);
1405   ID.AddInteger(Index);
1406   ID.AddInteger(Offset);
1407   ID.AddInteger(TargetFlags);
1408   void *IP = nullptr;
1409   if (SDNode *E = FindNodeOrInsertPos(ID, IP))
1410     return SDValue(E, 0);
1411
1412   SDNode *N =
1413       new (NodeAllocator) TargetIndexSDNode(Index, VT, Offset, TargetFlags);
1414   CSEMap.InsertNode(N, IP);
1415   InsertNode(N);
1416   return SDValue(N, 0);
1417 }
1418
1419 SDValue SelectionDAG::getBasicBlock(MachineBasicBlock *MBB) {
1420   FoldingSetNodeID ID;
1421   AddNodeIDNode(ID, ISD::BasicBlock, getVTList(MVT::Other), None);
1422   ID.AddPointer(MBB);
1423   void *IP = nullptr;
1424   if (SDNode *E = FindNodeOrInsertPos(ID, IP))
1425     return SDValue(E, 0);
1426
1427   SDNode *N = new (NodeAllocator) BasicBlockSDNode(MBB);
1428   CSEMap.InsertNode(N, IP);
1429   InsertNode(N);
1430   return SDValue(N, 0);
1431 }
1432
1433 SDValue SelectionDAG::getValueType(EVT VT) {
1434   if (VT.isSimple() && (unsigned)VT.getSimpleVT().SimpleTy >=
1435       ValueTypeNodes.size())
1436     ValueTypeNodes.resize(VT.getSimpleVT().SimpleTy+1);
1437
1438   SDNode *&N = VT.isExtended() ?
1439     ExtendedValueTypeNodes[VT] : ValueTypeNodes[VT.getSimpleVT().SimpleTy];
1440
1441   if (N) return SDValue(N, 0);
1442   N = new (NodeAllocator) VTSDNode(VT);
1443   InsertNode(N);
1444   return SDValue(N, 0);
1445 }
1446
1447 SDValue SelectionDAG::getExternalSymbol(const char *Sym, EVT VT) {
1448   SDNode *&N = ExternalSymbols[Sym];
1449   if (N) return SDValue(N, 0);
1450   N = new (NodeAllocator) ExternalSymbolSDNode(false, Sym, 0, VT);
1451   InsertNode(N);
1452   return SDValue(N, 0);
1453 }
1454
1455 SDValue SelectionDAG::getMCSymbol(MCSymbol *Sym, EVT VT) {
1456   SDNode *&N = MCSymbols[Sym];
1457   if (N)
1458     return SDValue(N, 0);
1459   N = new (NodeAllocator) MCSymbolSDNode(Sym, VT);
1460   InsertNode(N);
1461   return SDValue(N, 0);
1462 }
1463
1464 SDValue SelectionDAG::getTargetExternalSymbol(const char *Sym, EVT VT,
1465                                               unsigned char TargetFlags) {
1466   SDNode *&N =
1467     TargetExternalSymbols[std::pair<std::string,unsigned char>(Sym,
1468                                                                TargetFlags)];
1469   if (N) return SDValue(N, 0);
1470   N = new (NodeAllocator) ExternalSymbolSDNode(true, Sym, TargetFlags, VT);
1471   InsertNode(N);
1472   return SDValue(N, 0);
1473 }
1474
1475 SDValue SelectionDAG::getCondCode(ISD::CondCode Cond) {
1476   if ((unsigned)Cond >= CondCodeNodes.size())
1477     CondCodeNodes.resize(Cond+1);
1478
1479   if (!CondCodeNodes[Cond]) {
1480     CondCodeSDNode *N = new (NodeAllocator) CondCodeSDNode(Cond);
1481     CondCodeNodes[Cond] = N;
1482     InsertNode(N);
1483   }
1484
1485   return SDValue(CondCodeNodes[Cond], 0);
1486 }
1487
1488 // commuteShuffle - swaps the values of N1 and N2, and swaps all indices in
1489 // the shuffle mask M that point at N1 to point at N2, and indices that point
1490 // N2 to point at N1.
1491 static void commuteShuffle(SDValue &N1, SDValue &N2, SmallVectorImpl<int> &M) {
1492   std::swap(N1, N2);
1493   ShuffleVectorSDNode::commuteMask(M);
1494 }
1495
1496 SDValue SelectionDAG::getVectorShuffle(EVT VT, SDLoc dl, SDValue N1,
1497                                        SDValue N2, const int *Mask) {
1498   assert(VT == N1.getValueType() && VT == N2.getValueType() &&
1499          "Invalid VECTOR_SHUFFLE");
1500
1501   // Canonicalize shuffle undef, undef -> undef
1502   if (N1.getOpcode() == ISD::UNDEF && N2.getOpcode() == ISD::UNDEF)
1503     return getUNDEF(VT);
1504
1505   // Validate that all indices in Mask are within the range of the elements
1506   // input to the shuffle.
1507   unsigned NElts = VT.getVectorNumElements();
1508   SmallVector<int, 8> MaskVec;
1509   for (unsigned i = 0; i != NElts; ++i) {
1510     assert(Mask[i] < (int)(NElts * 2) && "Index out of range");
1511     MaskVec.push_back(Mask[i]);
1512   }
1513
1514   // Canonicalize shuffle v, v -> v, undef
1515   if (N1 == N2) {
1516     N2 = getUNDEF(VT);
1517     for (unsigned i = 0; i != NElts; ++i)
1518       if (MaskVec[i] >= (int)NElts) MaskVec[i] -= NElts;
1519   }
1520
1521   // Canonicalize shuffle undef, v -> v, undef.  Commute the shuffle mask.
1522   if (N1.getOpcode() == ISD::UNDEF)
1523     commuteShuffle(N1, N2, MaskVec);
1524
1525   // If shuffling a splat, try to blend the splat instead. We do this here so
1526   // that even when this arises during lowering we don't have to re-handle it.
1527   auto BlendSplat = [&](BuildVectorSDNode *BV, int Offset) {
1528     BitVector UndefElements;
1529     SDValue Splat = BV->getSplatValue(&UndefElements);
1530     if (!Splat)
1531       return;
1532
1533     for (int i = 0; i < (int)NElts; ++i) {
1534       if (MaskVec[i] < Offset || MaskVec[i] >= (Offset + (int)NElts))
1535         continue;
1536
1537       // If this input comes from undef, mark it as such.
1538       if (UndefElements[MaskVec[i] - Offset]) {
1539         MaskVec[i] = -1;
1540         continue;
1541       }
1542
1543       // If we can blend a non-undef lane, use that instead.
1544       if (!UndefElements[i])
1545         MaskVec[i] = i + Offset;
1546     }
1547   };
1548   if (auto *N1BV = dyn_cast<BuildVectorSDNode>(N1))
1549     BlendSplat(N1BV, 0);
1550   if (auto *N2BV = dyn_cast<BuildVectorSDNode>(N2))
1551     BlendSplat(N2BV, NElts);
1552
1553   // Canonicalize all index into lhs, -> shuffle lhs, undef
1554   // Canonicalize all index into rhs, -> shuffle rhs, undef
1555   bool AllLHS = true, AllRHS = true;
1556   bool N2Undef = N2.getOpcode() == ISD::UNDEF;
1557   for (unsigned i = 0; i != NElts; ++i) {
1558     if (MaskVec[i] >= (int)NElts) {
1559       if (N2Undef)
1560         MaskVec[i] = -1;
1561       else
1562         AllLHS = false;
1563     } else if (MaskVec[i] >= 0) {
1564       AllRHS = false;
1565     }
1566   }
1567   if (AllLHS && AllRHS)
1568     return getUNDEF(VT);
1569   if (AllLHS && !N2Undef)
1570     N2 = getUNDEF(VT);
1571   if (AllRHS) {
1572     N1 = getUNDEF(VT);
1573     commuteShuffle(N1, N2, MaskVec);
1574   }
1575   // Reset our undef status after accounting for the mask.
1576   N2Undef = N2.getOpcode() == ISD::UNDEF;
1577   // Re-check whether both sides ended up undef.
1578   if (N1.getOpcode() == ISD::UNDEF && N2Undef)
1579     return getUNDEF(VT);
1580
1581   // If Identity shuffle return that node.
1582   bool Identity = true, AllSame = true;
1583   for (unsigned i = 0; i != NElts; ++i) {
1584     if (MaskVec[i] >= 0 && MaskVec[i] != (int)i) Identity = false;
1585     if (MaskVec[i] != MaskVec[0]) AllSame = false;
1586   }
1587   if (Identity && NElts)
1588     return N1;
1589
1590   // Shuffling a constant splat doesn't change the result.
1591   if (N2Undef) {
1592     SDValue V = N1;
1593
1594     // Look through any bitcasts. We check that these don't change the number
1595     // (and size) of elements and just changes their types.
1596     while (V.getOpcode() == ISD::BITCAST)
1597       V = V->getOperand(0);
1598
1599     // A splat should always show up as a build vector node.
1600     if (auto *BV = dyn_cast<BuildVectorSDNode>(V)) {
1601       BitVector UndefElements;
1602       SDValue Splat = BV->getSplatValue(&UndefElements);
1603       // If this is a splat of an undef, shuffling it is also undef.
1604       if (Splat && Splat.getOpcode() == ISD::UNDEF)
1605         return getUNDEF(VT);
1606
1607       bool SameNumElts =
1608           V.getValueType().getVectorNumElements() == VT.getVectorNumElements();
1609
1610       // We only have a splat which can skip shuffles if there is a splatted
1611       // value and no undef lanes rearranged by the shuffle.
1612       if (Splat && UndefElements.none()) {
1613         // Splat of <x, x, ..., x>, return <x, x, ..., x>, provided that the
1614         // number of elements match or the value splatted is a zero constant.
1615         if (SameNumElts)
1616           return N1;
1617         if (auto *C = dyn_cast<ConstantSDNode>(Splat))
1618           if (C->isNullValue())
1619             return N1;
1620       }
1621
1622       // If the shuffle itself creates a splat, build the vector directly.
1623       if (AllSame && SameNumElts) {
1624         const SDValue &Splatted = BV->getOperand(MaskVec[0]);
1625         SmallVector<SDValue, 8> Ops(NElts, Splatted);
1626
1627         EVT BuildVT = BV->getValueType(0);
1628         SDValue NewBV = getNode(ISD::BUILD_VECTOR, dl, BuildVT, Ops);
1629
1630         // We may have jumped through bitcasts, so the type of the
1631         // BUILD_VECTOR may not match the type of the shuffle.
1632         if (BuildVT != VT)
1633           NewBV = getNode(ISD::BITCAST, dl, VT, NewBV);
1634         return NewBV;
1635       }
1636     }
1637   }
1638
1639   FoldingSetNodeID ID;
1640   SDValue Ops[2] = { N1, N2 };
1641   AddNodeIDNode(ID, ISD::VECTOR_SHUFFLE, getVTList(VT), Ops);
1642   for (unsigned i = 0; i != NElts; ++i)
1643     ID.AddInteger(MaskVec[i]);
1644
1645   void* IP = nullptr;
1646   if (SDNode *E = FindNodeOrInsertPos(ID, dl.getDebugLoc(), IP))
1647     return SDValue(E, 0);
1648
1649   // Allocate the mask array for the node out of the BumpPtrAllocator, since
1650   // SDNode doesn't have access to it.  This memory will be "leaked" when
1651   // the node is deallocated, but recovered when the NodeAllocator is released.
1652   int *MaskAlloc = OperandAllocator.Allocate<int>(NElts);
1653   memcpy(MaskAlloc, &MaskVec[0], NElts * sizeof(int));
1654
1655   ShuffleVectorSDNode *N =
1656     new (NodeAllocator) ShuffleVectorSDNode(VT, dl.getIROrder(),
1657                                             dl.getDebugLoc(), N1, N2,
1658                                             MaskAlloc);
1659   CSEMap.InsertNode(N, IP);
1660   InsertNode(N);
1661   return SDValue(N, 0);
1662 }
1663
1664 SDValue SelectionDAG::getCommutedVectorShuffle(const ShuffleVectorSDNode &SV) {
1665   MVT VT = SV.getSimpleValueType(0);
1666   SmallVector<int, 8> MaskVec(SV.getMask().begin(), SV.getMask().end());
1667   ShuffleVectorSDNode::commuteMask(MaskVec);
1668
1669   SDValue Op0 = SV.getOperand(0);
1670   SDValue Op1 = SV.getOperand(1);
1671   return getVectorShuffle(VT, SDLoc(&SV), Op1, Op0, &MaskVec[0]);
1672 }
1673
1674 SDValue SelectionDAG::getConvertRndSat(EVT VT, SDLoc dl,
1675                                        SDValue Val, SDValue DTy,
1676                                        SDValue STy, SDValue Rnd, SDValue Sat,
1677                                        ISD::CvtCode Code) {
1678   // If the src and dest types are the same and the conversion is between
1679   // integer types of the same sign or two floats, no conversion is necessary.
1680   if (DTy == STy &&
1681       (Code == ISD::CVT_UU || Code == ISD::CVT_SS || Code == ISD::CVT_FF))
1682     return Val;
1683
1684   FoldingSetNodeID ID;
1685   SDValue Ops[] = { Val, DTy, STy, Rnd, Sat };
1686   AddNodeIDNode(ID, ISD::CONVERT_RNDSAT, getVTList(VT), Ops);
1687   void* IP = nullptr;
1688   if (SDNode *E = FindNodeOrInsertPos(ID, dl.getDebugLoc(), IP))
1689     return SDValue(E, 0);
1690
1691   CvtRndSatSDNode *N = new (NodeAllocator) CvtRndSatSDNode(VT, dl.getIROrder(),
1692                                                            dl.getDebugLoc(),
1693                                                            Ops, Code);
1694   CSEMap.InsertNode(N, IP);
1695   InsertNode(N);
1696   return SDValue(N, 0);
1697 }
1698
1699 SDValue SelectionDAG::getRegister(unsigned RegNo, EVT VT) {
1700   FoldingSetNodeID ID;
1701   AddNodeIDNode(ID, ISD::Register, getVTList(VT), None);
1702   ID.AddInteger(RegNo);
1703   void *IP = nullptr;
1704   if (SDNode *E = FindNodeOrInsertPos(ID, IP))
1705     return SDValue(E, 0);
1706
1707   SDNode *N = new (NodeAllocator) RegisterSDNode(RegNo, VT);
1708   CSEMap.InsertNode(N, IP);
1709   InsertNode(N);
1710   return SDValue(N, 0);
1711 }
1712
1713 SDValue SelectionDAG::getRegisterMask(const uint32_t *RegMask) {
1714   FoldingSetNodeID ID;
1715   AddNodeIDNode(ID, ISD::RegisterMask, getVTList(MVT::Untyped), None);
1716   ID.AddPointer(RegMask);
1717   void *IP = nullptr;
1718   if (SDNode *E = FindNodeOrInsertPos(ID, IP))
1719     return SDValue(E, 0);
1720
1721   SDNode *N = new (NodeAllocator) RegisterMaskSDNode(RegMask);
1722   CSEMap.InsertNode(N, IP);
1723   InsertNode(N);
1724   return SDValue(N, 0);
1725 }
1726
1727 SDValue SelectionDAG::getEHLabel(SDLoc dl, SDValue Root, MCSymbol *Label) {
1728   FoldingSetNodeID ID;
1729   SDValue Ops[] = { Root };
1730   AddNodeIDNode(ID, ISD::EH_LABEL, getVTList(MVT::Other), Ops);
1731   ID.AddPointer(Label);
1732   void *IP = nullptr;
1733   if (SDNode *E = FindNodeOrInsertPos(ID, IP))
1734     return SDValue(E, 0);
1735
1736   SDNode *N = new (NodeAllocator) EHLabelSDNode(dl.getIROrder(),
1737                                                 dl.getDebugLoc(), Root, Label);
1738   CSEMap.InsertNode(N, IP);
1739   InsertNode(N);
1740   return SDValue(N, 0);
1741 }
1742
1743
1744 SDValue SelectionDAG::getBlockAddress(const BlockAddress *BA, EVT VT,
1745                                       int64_t Offset,
1746                                       bool isTarget,
1747                                       unsigned char TargetFlags) {
1748   unsigned Opc = isTarget ? ISD::TargetBlockAddress : ISD::BlockAddress;
1749
1750   FoldingSetNodeID ID;
1751   AddNodeIDNode(ID, Opc, getVTList(VT), None);
1752   ID.AddPointer(BA);
1753   ID.AddInteger(Offset);
1754   ID.AddInteger(TargetFlags);
1755   void *IP = nullptr;
1756   if (SDNode *E = FindNodeOrInsertPos(ID, IP))
1757     return SDValue(E, 0);
1758
1759   SDNode *N = new (NodeAllocator) BlockAddressSDNode(Opc, VT, BA, Offset,
1760                                                      TargetFlags);
1761   CSEMap.InsertNode(N, IP);
1762   InsertNode(N);
1763   return SDValue(N, 0);
1764 }
1765
1766 SDValue SelectionDAG::getSrcValue(const Value *V) {
1767   assert((!V || V->getType()->isPointerTy()) &&
1768          "SrcValue is not a pointer?");
1769
1770   FoldingSetNodeID ID;
1771   AddNodeIDNode(ID, ISD::SRCVALUE, getVTList(MVT::Other), None);
1772   ID.AddPointer(V);
1773
1774   void *IP = nullptr;
1775   if (SDNode *E = FindNodeOrInsertPos(ID, IP))
1776     return SDValue(E, 0);
1777
1778   SDNode *N = new (NodeAllocator) SrcValueSDNode(V);
1779   CSEMap.InsertNode(N, IP);
1780   InsertNode(N);
1781   return SDValue(N, 0);
1782 }
1783
1784 /// getMDNode - Return an MDNodeSDNode which holds an MDNode.
1785 SDValue SelectionDAG::getMDNode(const MDNode *MD) {
1786   FoldingSetNodeID ID;
1787   AddNodeIDNode(ID, ISD::MDNODE_SDNODE, getVTList(MVT::Other), None);
1788   ID.AddPointer(MD);
1789
1790   void *IP = nullptr;
1791   if (SDNode *E = FindNodeOrInsertPos(ID, IP))
1792     return SDValue(E, 0);
1793
1794   SDNode *N = new (NodeAllocator) MDNodeSDNode(MD);
1795   CSEMap.InsertNode(N, IP);
1796   InsertNode(N);
1797   return SDValue(N, 0);
1798 }
1799
1800 SDValue SelectionDAG::getBitcast(EVT VT, SDValue V) {
1801   if (VT == V.getValueType())
1802     return V;
1803
1804   return getNode(ISD::BITCAST, SDLoc(V), VT, V);
1805 }
1806
1807 /// getAddrSpaceCast - Return an AddrSpaceCastSDNode.
1808 SDValue SelectionDAG::getAddrSpaceCast(SDLoc dl, EVT VT, SDValue Ptr,
1809                                        unsigned SrcAS, unsigned DestAS) {
1810   SDValue Ops[] = {Ptr};
1811   FoldingSetNodeID ID;
1812   AddNodeIDNode(ID, ISD::ADDRSPACECAST, getVTList(VT), Ops);
1813   ID.AddInteger(SrcAS);
1814   ID.AddInteger(DestAS);
1815
1816   void *IP = nullptr;
1817   if (SDNode *E = FindNodeOrInsertPos(ID, dl.getDebugLoc(), IP))
1818     return SDValue(E, 0);
1819
1820   SDNode *N = new (NodeAllocator) AddrSpaceCastSDNode(dl.getIROrder(),
1821                                                       dl.getDebugLoc(),
1822                                                       VT, Ptr, SrcAS, DestAS);
1823   CSEMap.InsertNode(N, IP);
1824   InsertNode(N);
1825   return SDValue(N, 0);
1826 }
1827
1828 /// getShiftAmountOperand - Return the specified value casted to
1829 /// the target's desired shift amount type.
1830 SDValue SelectionDAG::getShiftAmountOperand(EVT LHSTy, SDValue Op) {
1831   EVT OpTy = Op.getValueType();
1832   EVT ShTy = TLI->getShiftAmountTy(LHSTy, getDataLayout());
1833   if (OpTy == ShTy || OpTy.isVector()) return Op;
1834
1835   return getZExtOrTrunc(Op, SDLoc(Op), ShTy);
1836 }
1837
1838 SDValue SelectionDAG::expandVAArg(SDNode *Node) {
1839   SDLoc dl(Node);
1840   const TargetLowering &TLI = getTargetLoweringInfo();
1841   const Value *V = cast<SrcValueSDNode>(Node->getOperand(2))->getValue();
1842   EVT VT = Node->getValueType(0);
1843   SDValue Tmp1 = Node->getOperand(0);
1844   SDValue Tmp2 = Node->getOperand(1);
1845   unsigned Align = Node->getConstantOperandVal(3);
1846
1847   SDValue VAListLoad =
1848     getLoad(TLI.getPointerTy(getDataLayout()), dl, Tmp1, Tmp2,
1849             MachinePointerInfo(V), false, false, false, 0);
1850   SDValue VAList = VAListLoad;
1851
1852   if (Align > TLI.getMinStackArgumentAlignment()) {
1853     assert(((Align & (Align-1)) == 0) && "Expected Align to be a power of 2");
1854
1855     VAList = getNode(ISD::ADD, dl, VAList.getValueType(), VAList,
1856                      getConstant(Align - 1, dl, VAList.getValueType()));
1857
1858     VAList = getNode(ISD::AND, dl, VAList.getValueType(), VAList,
1859                      getConstant(-(int64_t)Align, dl, VAList.getValueType()));
1860   }
1861
1862   // Increment the pointer, VAList, to the next vaarg
1863   Tmp1 = getNode(ISD::ADD, dl, VAList.getValueType(), VAList,
1864                  getConstant(getDataLayout().getTypeAllocSize(
1865                                                VT.getTypeForEVT(*getContext())),
1866                              dl, VAList.getValueType()));
1867   // Store the incremented VAList to the legalized pointer
1868   Tmp1 = getStore(VAListLoad.getValue(1), dl, Tmp1, Tmp2,
1869                   MachinePointerInfo(V), false, false, 0);
1870   // Load the actual argument out of the pointer VAList
1871   return getLoad(VT, dl, Tmp1, VAList, MachinePointerInfo(),
1872                  false, false, false, 0);
1873 }
1874
1875 SDValue SelectionDAG::expandVACopy(SDNode *Node) {
1876   SDLoc dl(Node);
1877   const TargetLowering &TLI = getTargetLoweringInfo();
1878   // This defaults to loading a pointer from the input and storing it to the
1879   // output, returning the chain.
1880   const Value *VD = cast<SrcValueSDNode>(Node->getOperand(3))->getValue();
1881   const Value *VS = cast<SrcValueSDNode>(Node->getOperand(4))->getValue();
1882   SDValue Tmp1 = getLoad(TLI.getPointerTy(getDataLayout()), dl,
1883                          Node->getOperand(0), Node->getOperand(2),
1884                          MachinePointerInfo(VS), false, false, false, 0);
1885   return getStore(Tmp1.getValue(1), dl, Tmp1, Node->getOperand(1),
1886                   MachinePointerInfo(VD), false, false, 0);
1887 }
1888
1889 /// CreateStackTemporary - Create a stack temporary, suitable for holding the
1890 /// specified value type.
1891 SDValue SelectionDAG::CreateStackTemporary(EVT VT, unsigned minAlign) {
1892   MachineFrameInfo *FrameInfo = getMachineFunction().getFrameInfo();
1893   unsigned ByteSize = VT.getStoreSize();
1894   Type *Ty = VT.getTypeForEVT(*getContext());
1895   unsigned StackAlign =
1896       std::max((unsigned)getDataLayout().getPrefTypeAlignment(Ty), minAlign);
1897
1898   int FrameIdx = FrameInfo->CreateStackObject(ByteSize, StackAlign, false);
1899   return getFrameIndex(FrameIdx, TLI->getPointerTy(getDataLayout()));
1900 }
1901
1902 /// CreateStackTemporary - Create a stack temporary suitable for holding
1903 /// either of the specified value types.
1904 SDValue SelectionDAG::CreateStackTemporary(EVT VT1, EVT VT2) {
1905   unsigned Bytes = std::max(VT1.getStoreSize(), VT2.getStoreSize());
1906   Type *Ty1 = VT1.getTypeForEVT(*getContext());
1907   Type *Ty2 = VT2.getTypeForEVT(*getContext());
1908   const DataLayout &DL = getDataLayout();
1909   unsigned Align =
1910       std::max(DL.getPrefTypeAlignment(Ty1), DL.getPrefTypeAlignment(Ty2));
1911
1912   MachineFrameInfo *FrameInfo = getMachineFunction().getFrameInfo();
1913   int FrameIdx = FrameInfo->CreateStackObject(Bytes, Align, false);
1914   return getFrameIndex(FrameIdx, TLI->getPointerTy(getDataLayout()));
1915 }
1916
1917 SDValue SelectionDAG::FoldSetCC(EVT VT, SDValue N1,
1918                                 SDValue N2, ISD::CondCode Cond, SDLoc dl) {
1919   // These setcc operations always fold.
1920   switch (Cond) {
1921   default: break;
1922   case ISD::SETFALSE:
1923   case ISD::SETFALSE2: return getConstant(0, dl, VT);
1924   case ISD::SETTRUE:
1925   case ISD::SETTRUE2: {
1926     TargetLowering::BooleanContent Cnt =
1927         TLI->getBooleanContents(N1->getValueType(0));
1928     return getConstant(
1929         Cnt == TargetLowering::ZeroOrNegativeOneBooleanContent ? -1ULL : 1, dl,
1930         VT);
1931   }
1932
1933   case ISD::SETOEQ:
1934   case ISD::SETOGT:
1935   case ISD::SETOGE:
1936   case ISD::SETOLT:
1937   case ISD::SETOLE:
1938   case ISD::SETONE:
1939   case ISD::SETO:
1940   case ISD::SETUO:
1941   case ISD::SETUEQ:
1942   case ISD::SETUNE:
1943     assert(!N1.getValueType().isInteger() && "Illegal setcc for integer!");
1944     break;
1945   }
1946
1947   if (ConstantSDNode *N2C = dyn_cast<ConstantSDNode>(N2)) {
1948     const APInt &C2 = N2C->getAPIntValue();
1949     if (ConstantSDNode *N1C = dyn_cast<ConstantSDNode>(N1)) {
1950       const APInt &C1 = N1C->getAPIntValue();
1951
1952       switch (Cond) {
1953       default: llvm_unreachable("Unknown integer setcc!");
1954       case ISD::SETEQ:  return getConstant(C1 == C2, dl, VT);
1955       case ISD::SETNE:  return getConstant(C1 != C2, dl, VT);
1956       case ISD::SETULT: return getConstant(C1.ult(C2), dl, VT);
1957       case ISD::SETUGT: return getConstant(C1.ugt(C2), dl, VT);
1958       case ISD::SETULE: return getConstant(C1.ule(C2), dl, VT);
1959       case ISD::SETUGE: return getConstant(C1.uge(C2), dl, VT);
1960       case ISD::SETLT:  return getConstant(C1.slt(C2), dl, VT);
1961       case ISD::SETGT:  return getConstant(C1.sgt(C2), dl, VT);
1962       case ISD::SETLE:  return getConstant(C1.sle(C2), dl, VT);
1963       case ISD::SETGE:  return getConstant(C1.sge(C2), dl, VT);
1964       }
1965     }
1966   }
1967   if (ConstantFPSDNode *N1C = dyn_cast<ConstantFPSDNode>(N1)) {
1968     if (ConstantFPSDNode *N2C = dyn_cast<ConstantFPSDNode>(N2)) {
1969       APFloat::cmpResult R = N1C->getValueAPF().compare(N2C->getValueAPF());
1970       switch (Cond) {
1971       default: break;
1972       case ISD::SETEQ:  if (R==APFloat::cmpUnordered)
1973                           return getUNDEF(VT);
1974                         // fall through
1975       case ISD::SETOEQ: return getConstant(R==APFloat::cmpEqual, dl, VT);
1976       case ISD::SETNE:  if (R==APFloat::cmpUnordered)
1977                           return getUNDEF(VT);
1978                         // fall through
1979       case ISD::SETONE: return getConstant(R==APFloat::cmpGreaterThan ||
1980                                            R==APFloat::cmpLessThan, dl, VT);
1981       case ISD::SETLT:  if (R==APFloat::cmpUnordered)
1982                           return getUNDEF(VT);
1983                         // fall through
1984       case ISD::SETOLT: return getConstant(R==APFloat::cmpLessThan, dl, VT);
1985       case ISD::SETGT:  if (R==APFloat::cmpUnordered)
1986                           return getUNDEF(VT);
1987                         // fall through
1988       case ISD::SETOGT: return getConstant(R==APFloat::cmpGreaterThan, dl, VT);
1989       case ISD::SETLE:  if (R==APFloat::cmpUnordered)
1990                           return getUNDEF(VT);
1991                         // fall through
1992       case ISD::SETOLE: return getConstant(R==APFloat::cmpLessThan ||
1993                                            R==APFloat::cmpEqual, dl, VT);
1994       case ISD::SETGE:  if (R==APFloat::cmpUnordered)
1995                           return getUNDEF(VT);
1996                         // fall through
1997       case ISD::SETOGE: return getConstant(R==APFloat::cmpGreaterThan ||
1998                                            R==APFloat::cmpEqual, dl, VT);
1999       case ISD::SETO:   return getConstant(R!=APFloat::cmpUnordered, dl, VT);
2000       case ISD::SETUO:  return getConstant(R==APFloat::cmpUnordered, dl, VT);
2001       case ISD::SETUEQ: return getConstant(R==APFloat::cmpUnordered ||
2002                                            R==APFloat::cmpEqual, dl, VT);
2003       case ISD::SETUNE: return getConstant(R!=APFloat::cmpEqual, dl, VT);
2004       case ISD::SETULT: return getConstant(R==APFloat::cmpUnordered ||
2005                                            R==APFloat::cmpLessThan, dl, VT);
2006       case ISD::SETUGT: return getConstant(R==APFloat::cmpGreaterThan ||
2007                                            R==APFloat::cmpUnordered, dl, VT);
2008       case ISD::SETULE: return getConstant(R!=APFloat::cmpGreaterThan, dl, VT);
2009       case ISD::SETUGE: return getConstant(R!=APFloat::cmpLessThan, dl, VT);
2010       }
2011     } else {
2012       // Ensure that the constant occurs on the RHS.
2013       ISD::CondCode SwappedCond = ISD::getSetCCSwappedOperands(Cond);
2014       MVT CompVT = N1.getValueType().getSimpleVT();
2015       if (!TLI->isCondCodeLegal(SwappedCond, CompVT))
2016         return SDValue();
2017
2018       return getSetCC(dl, VT, N2, N1, SwappedCond);
2019     }
2020   }
2021
2022   // Could not fold it.
2023   return SDValue();
2024 }
2025
2026 /// SignBitIsZero - Return true if the sign bit of Op is known to be zero.  We
2027 /// use this predicate to simplify operations downstream.
2028 bool SelectionDAG::SignBitIsZero(SDValue Op, unsigned Depth) const {
2029   // This predicate is not safe for vector operations.
2030   if (Op.getValueType().isVector())
2031     return false;
2032
2033   unsigned BitWidth = Op.getValueType().getScalarType().getSizeInBits();
2034   return MaskedValueIsZero(Op, APInt::getSignBit(BitWidth), Depth);
2035 }
2036
2037 /// MaskedValueIsZero - Return true if 'V & Mask' is known to be zero.  We use
2038 /// this predicate to simplify operations downstream.  Mask is known to be zero
2039 /// for bits that V cannot have.
2040 bool SelectionDAG::MaskedValueIsZero(SDValue Op, const APInt &Mask,
2041                                      unsigned Depth) const {
2042   APInt KnownZero, KnownOne;
2043   computeKnownBits(Op, KnownZero, KnownOne, Depth);
2044   return (KnownZero & Mask) == Mask;
2045 }
2046
2047 /// Determine which bits of Op are known to be either zero or one and return
2048 /// them in the KnownZero/KnownOne bitsets.
2049 void SelectionDAG::computeKnownBits(SDValue Op, APInt &KnownZero,
2050                                     APInt &KnownOne, unsigned Depth) const {
2051   unsigned BitWidth = Op.getValueType().getScalarType().getSizeInBits();
2052
2053   KnownZero = KnownOne = APInt(BitWidth, 0);   // Don't know anything.
2054   if (Depth == 6)
2055     return;  // Limit search depth.
2056
2057   APInt KnownZero2, KnownOne2;
2058
2059   switch (Op.getOpcode()) {
2060   case ISD::Constant:
2061     // We know all of the bits for a constant!
2062     KnownOne = cast<ConstantSDNode>(Op)->getAPIntValue();
2063     KnownZero = ~KnownOne;
2064     break;
2065   case ISD::AND:
2066     // If either the LHS or the RHS are Zero, the result is zero.
2067     computeKnownBits(Op.getOperand(1), KnownZero, KnownOne, Depth+1);
2068     computeKnownBits(Op.getOperand(0), KnownZero2, KnownOne2, Depth+1);
2069
2070     // Output known-1 bits are only known if set in both the LHS & RHS.
2071     KnownOne &= KnownOne2;
2072     // Output known-0 are known to be clear if zero in either the LHS | RHS.
2073     KnownZero |= KnownZero2;
2074     break;
2075   case ISD::OR:
2076     computeKnownBits(Op.getOperand(1), KnownZero, KnownOne, Depth+1);
2077     computeKnownBits(Op.getOperand(0), KnownZero2, KnownOne2, Depth+1);
2078
2079     // Output known-0 bits are only known if clear in both the LHS & RHS.
2080     KnownZero &= KnownZero2;
2081     // Output known-1 are known to be set if set in either the LHS | RHS.
2082     KnownOne |= KnownOne2;
2083     break;
2084   case ISD::XOR: {
2085     computeKnownBits(Op.getOperand(1), KnownZero, KnownOne, Depth+1);
2086     computeKnownBits(Op.getOperand(0), KnownZero2, KnownOne2, Depth+1);
2087
2088     // Output known-0 bits are known if clear or set in both the LHS & RHS.
2089     APInt KnownZeroOut = (KnownZero & KnownZero2) | (KnownOne & KnownOne2);
2090     // Output known-1 are known to be set if set in only one of the LHS, RHS.
2091     KnownOne = (KnownZero & KnownOne2) | (KnownOne & KnownZero2);
2092     KnownZero = KnownZeroOut;
2093     break;
2094   }
2095   case ISD::MUL: {
2096     computeKnownBits(Op.getOperand(1), KnownZero, KnownOne, Depth+1);
2097     computeKnownBits(Op.getOperand(0), KnownZero2, KnownOne2, Depth+1);
2098
2099     // If low bits are zero in either operand, output low known-0 bits.
    // Also compute a conservative estimate for high known-0 bits.
2101     // More trickiness is possible, but this is sufficient for the
2102     // interesting case of alignment computation.
2103     KnownOne.clearAllBits();
2104     unsigned TrailZ = KnownZero.countTrailingOnes() +
2105                       KnownZero2.countTrailingOnes();
2106     unsigned LeadZ =  std::max(KnownZero.countLeadingOnes() +
2107                                KnownZero2.countLeadingOnes(),
2108                                BitWidth) - BitWidth;
2109
2110     TrailZ = std::min(TrailZ, BitWidth);
2111     LeadZ = std::min(LeadZ, BitWidth);
2112     KnownZero = APInt::getLowBitsSet(BitWidth, TrailZ) |
2113                 APInt::getHighBitsSet(BitWidth, LeadZ);
2114     break;
2115   }
2116   case ISD::UDIV: {
2117     // For the purposes of computing leading zeros we can conservatively
2118     // treat a udiv as a logical right shift by the power of 2 known to
2119     // be less than the denominator.
2120     computeKnownBits(Op.getOperand(0), KnownZero2, KnownOne2, Depth+1);
2121     unsigned LeadZ = KnownZero2.countLeadingOnes();
2122
2123     KnownOne2.clearAllBits();
2124     KnownZero2.clearAllBits();
2125     computeKnownBits(Op.getOperand(1), KnownZero2, KnownOne2, Depth+1);
2126     unsigned RHSUnknownLeadingOnes = KnownOne2.countLeadingZeros();
2127     if (RHSUnknownLeadingOnes != BitWidth)
2128       LeadZ = std::min(BitWidth,
2129                        LeadZ + BitWidth - RHSUnknownLeadingOnes - 1);
2130
2131     KnownZero = APInt::getHighBitsSet(BitWidth, LeadZ);
2132     break;
2133   }
2134   case ISD::SELECT:
2135     computeKnownBits(Op.getOperand(2), KnownZero, KnownOne, Depth+1);
2136     computeKnownBits(Op.getOperand(1), KnownZero2, KnownOne2, Depth+1);
2137
2138     // Only known if known in both the LHS and RHS.
2139     KnownOne &= KnownOne2;
2140     KnownZero &= KnownZero2;
2141     break;
2142   case ISD::SELECT_CC:
2143     computeKnownBits(Op.getOperand(3), KnownZero, KnownOne, Depth+1);
2144     computeKnownBits(Op.getOperand(2), KnownZero2, KnownOne2, Depth+1);
2145
2146     // Only known if known in both the LHS and RHS.
2147     KnownOne &= KnownOne2;
2148     KnownZero &= KnownZero2;
2149     break;
2150   case ISD::SADDO:
2151   case ISD::UADDO:
2152   case ISD::SSUBO:
2153   case ISD::USUBO:
2154   case ISD::SMULO:
2155   case ISD::UMULO:
2156     if (Op.getResNo() != 1)
2157       break;
2158     // The boolean result conforms to getBooleanContents.
2159     // If we know the result of a setcc has the top bits zero, use this info.
2160     // We know that we have an integer-based boolean since these operations
2161     // are only available for integer.
2162     if (TLI->getBooleanContents(Op.getValueType().isVector(), false) ==
2163             TargetLowering::ZeroOrOneBooleanContent &&
2164         BitWidth > 1)
2165       KnownZero |= APInt::getHighBitsSet(BitWidth, BitWidth - 1);
2166     break;
2167   case ISD::SETCC:
2168     // If we know the result of a setcc has the top bits zero, use this info.
2169     if (TLI->getBooleanContents(Op.getOperand(0).getValueType()) ==
2170             TargetLowering::ZeroOrOneBooleanContent &&
2171         BitWidth > 1)
2172       KnownZero |= APInt::getHighBitsSet(BitWidth, BitWidth - 1);
2173     break;
2174   case ISD::SHL:
2175     // (shl X, C1) & C2 == 0   iff   (X & C2 >>u C1) == 0
2176     if (ConstantSDNode *SA = dyn_cast<ConstantSDNode>(Op.getOperand(1))) {
2177       unsigned ShAmt = SA->getZExtValue();
2178
2179       // If the shift count is an invalid immediate, don't do anything.
2180       if (ShAmt >= BitWidth)
2181         break;
2182
2183       computeKnownBits(Op.getOperand(0), KnownZero, KnownOne, Depth+1);
2184       KnownZero <<= ShAmt;
2185       KnownOne  <<= ShAmt;
2186       // low bits known zero.
2187       KnownZero |= APInt::getLowBitsSet(BitWidth, ShAmt);
2188     }
2189     break;
2190   case ISD::SRL:
2191     // (ushr X, C1) & C2 == 0   iff  (-1 >> C1) & C2 == 0
2192     if (ConstantSDNode *SA = dyn_cast<ConstantSDNode>(Op.getOperand(1))) {
2193       unsigned ShAmt = SA->getZExtValue();
2194
2195       // If the shift count is an invalid immediate, don't do anything.
2196       if (ShAmt >= BitWidth)
2197         break;
2198
2199       computeKnownBits(Op.getOperand(0), KnownZero, KnownOne, Depth+1);
2200       KnownZero = KnownZero.lshr(ShAmt);
2201       KnownOne  = KnownOne.lshr(ShAmt);
2202
2203       APInt HighBits = APInt::getHighBitsSet(BitWidth, ShAmt);
2204       KnownZero |= HighBits;  // High bits known zero.
2205     }
2206     break;
2207   case ISD::SRA:
2208     if (ConstantSDNode *SA = dyn_cast<ConstantSDNode>(Op.getOperand(1))) {
2209       unsigned ShAmt = SA->getZExtValue();
2210
2211       // If the shift count is an invalid immediate, don't do anything.
2212       if (ShAmt >= BitWidth)
2213         break;
2214
2215       // If any of the demanded bits are produced by the sign extension, we also
2216       // demand the input sign bit.
2217       APInt HighBits = APInt::getHighBitsSet(BitWidth, ShAmt);
2218
2219       computeKnownBits(Op.getOperand(0), KnownZero, KnownOne, Depth+1);
2220       KnownZero = KnownZero.lshr(ShAmt);
2221       KnownOne  = KnownOne.lshr(ShAmt);
2222
2223       // Handle the sign bits.
2224       APInt SignBit = APInt::getSignBit(BitWidth);
2225       SignBit = SignBit.lshr(ShAmt);  // Adjust to where it is now in the mask.
2226
2227       if (KnownZero.intersects(SignBit)) {
2228         KnownZero |= HighBits;  // New bits are known zero.
2229       } else if (KnownOne.intersects(SignBit)) {
2230         KnownOne  |= HighBits;  // New bits are known one.
2231       }
2232     }
2233     break;
2234   case ISD::SIGN_EXTEND_INREG: {
2235     EVT EVT = cast<VTSDNode>(Op.getOperand(1))->getVT();
2236     unsigned EBits = EVT.getScalarType().getSizeInBits();
2237
2238     // Sign extension.  Compute the demanded bits in the result that are not
2239     // present in the input.
2240     APInt NewBits = APInt::getHighBitsSet(BitWidth, BitWidth - EBits);
2241
2242     APInt InSignBit = APInt::getSignBit(EBits);
2243     APInt InputDemandedBits = APInt::getLowBitsSet(BitWidth, EBits);
2244
2245     // If the sign extended bits are demanded, we know that the sign
2246     // bit is demanded.
2247     InSignBit = InSignBit.zext(BitWidth);
2248     if (NewBits.getBoolValue())
2249       InputDemandedBits |= InSignBit;
2250
2251     computeKnownBits(Op.getOperand(0), KnownZero, KnownOne, Depth+1);
2252     KnownOne &= InputDemandedBits;
2253     KnownZero &= InputDemandedBits;
2254
2255     // If the sign bit of the input is known set or clear, then we know the
2256     // top bits of the result.
2257     if (KnownZero.intersects(InSignBit)) {         // Input sign bit known clear
2258       KnownZero |= NewBits;
2259       KnownOne  &= ~NewBits;
2260     } else if (KnownOne.intersects(InSignBit)) {   // Input sign bit known set
2261       KnownOne  |= NewBits;
2262       KnownZero &= ~NewBits;
2263     } else {                              // Input sign bit unknown
2264       KnownZero &= ~NewBits;
2265       KnownOne  &= ~NewBits;
2266     }
2267     break;
2268   }
2269   case ISD::CTTZ:
2270   case ISD::CTTZ_ZERO_UNDEF:
2271   case ISD::CTLZ:
2272   case ISD::CTLZ_ZERO_UNDEF:
2273   case ISD::CTPOP: {
2274     unsigned LowBits = Log2_32(BitWidth)+1;
2275     KnownZero = APInt::getHighBitsSet(BitWidth, BitWidth - LowBits);
2276     KnownOne.clearAllBits();
2277     break;
2278   }
2279   case ISD::LOAD: {
2280     LoadSDNode *LD = cast<LoadSDNode>(Op);
2281     // If this is a ZEXTLoad and we are looking at the loaded value.
2282     if (ISD::isZEXTLoad(Op.getNode()) && Op.getResNo() == 0) {
2283       EVT VT = LD->getMemoryVT();
2284       unsigned MemBits = VT.getScalarType().getSizeInBits();
2285       KnownZero |= APInt::getHighBitsSet(BitWidth, BitWidth - MemBits);
2286     } else if (const MDNode *Ranges = LD->getRanges()) {
2287       if (LD->getExtensionType() == ISD::NON_EXTLOAD)
2288         computeKnownBitsFromRangeMetadata(*Ranges, KnownZero, KnownOne);
2289     }
2290     break;
2291   }
2292   case ISD::ZERO_EXTEND: {
2293     EVT InVT = Op.getOperand(0).getValueType();
2294     unsigned InBits = InVT.getScalarType().getSizeInBits();
2295     APInt NewBits   = APInt::getHighBitsSet(BitWidth, BitWidth - InBits);
2296     KnownZero = KnownZero.trunc(InBits);
2297     KnownOne = KnownOne.trunc(InBits);
2298     computeKnownBits(Op.getOperand(0), KnownZero, KnownOne, Depth+1);
2299     KnownZero = KnownZero.zext(BitWidth);
2300     KnownOne = KnownOne.zext(BitWidth);
2301     KnownZero |= NewBits;
2302     break;
2303   }
2304   case ISD::SIGN_EXTEND: {
2305     EVT InVT = Op.getOperand(0).getValueType();
2306     unsigned InBits = InVT.getScalarType().getSizeInBits();
2307     APInt NewBits   = APInt::getHighBitsSet(BitWidth, BitWidth - InBits);
2308
2309     KnownZero = KnownZero.trunc(InBits);
2310     KnownOne = KnownOne.trunc(InBits);
2311     computeKnownBits(Op.getOperand(0), KnownZero, KnownOne, Depth+1);
2312
2313     // Note if the sign bit is known to be zero or one.
2314     bool SignBitKnownZero = KnownZero.isNegative();
2315     bool SignBitKnownOne  = KnownOne.isNegative();
2316
2317     KnownZero = KnownZero.zext(BitWidth);
2318     KnownOne = KnownOne.zext(BitWidth);
2319
2320     // If the sign bit is known zero or one, the top bits match.
2321     if (SignBitKnownZero)
2322       KnownZero |= NewBits;
2323     else if (SignBitKnownOne)
2324       KnownOne  |= NewBits;
2325     break;
2326   }
2327   case ISD::ANY_EXTEND: {
2328     EVT InVT = Op.getOperand(0).getValueType();
2329     unsigned InBits = InVT.getScalarType().getSizeInBits();
2330     KnownZero = KnownZero.trunc(InBits);
2331     KnownOne = KnownOne.trunc(InBits);
2332     computeKnownBits(Op.getOperand(0), KnownZero, KnownOne, Depth+1);
2333     KnownZero = KnownZero.zext(BitWidth);
2334     KnownOne = KnownOne.zext(BitWidth);
2335     break;
2336   }
2337   case ISD::TRUNCATE: {
2338     EVT InVT = Op.getOperand(0).getValueType();
2339     unsigned InBits = InVT.getScalarType().getSizeInBits();
2340     KnownZero = KnownZero.zext(InBits);
2341     KnownOne = KnownOne.zext(InBits);
2342     computeKnownBits(Op.getOperand(0), KnownZero, KnownOne, Depth+1);
2343     KnownZero = KnownZero.trunc(BitWidth);
2344     KnownOne = KnownOne.trunc(BitWidth);
2345     break;
2346   }
2347   case ISD::AssertZext: {
2348     EVT VT = cast<VTSDNode>(Op.getOperand(1))->getVT();
2349     APInt InMask = APInt::getLowBitsSet(BitWidth, VT.getSizeInBits());
2350     computeKnownBits(Op.getOperand(0), KnownZero, KnownOne, Depth+1);
2351     KnownZero |= (~InMask);
2352     KnownOne  &= (~KnownZero);
2353     break;
2354   }
2355   case ISD::FGETSIGN:
2356     // All bits are zero except the low bit.
2357     KnownZero = APInt::getHighBitsSet(BitWidth, BitWidth - 1);
2358     break;
2359
2360   case ISD::SUB: {
2361     if (ConstantSDNode *CLHS = dyn_cast<ConstantSDNode>(Op.getOperand(0))) {
2362       // We know that the top bits of C-X are clear if X contains less bits
2363       // than C (i.e. no wrap-around can happen).  For example, 20-X is
2364       // positive if we can prove that X is >= 0 and < 16.
2365       if (CLHS->getAPIntValue().isNonNegative()) {
2366         unsigned NLZ = (CLHS->getAPIntValue()+1).countLeadingZeros();
2367         // NLZ can't be BitWidth with no sign bit
2368         APInt MaskV = APInt::getHighBitsSet(BitWidth, NLZ+1);
2369         computeKnownBits(Op.getOperand(1), KnownZero2, KnownOne2, Depth+1);
2370
2371         // If all of the MaskV bits are known to be zero, then we know the
2372         // output top bits are zero, because we now know that the output is
2373         // from [0-C].
2374         if ((KnownZero2 & MaskV) == MaskV) {
2375           unsigned NLZ2 = CLHS->getAPIntValue().countLeadingZeros();
2376           // Top bits known zero.
2377           KnownZero = APInt::getHighBitsSet(BitWidth, NLZ2);
2378         }
2379       }
2380     }
2381   }
2382   // fall through
2383   case ISD::ADD:
2384   case ISD::ADDE: {
2385     // Output known-0 bits are known if clear or set in both the low clear bits
2386     // common to both LHS & RHS.  For example, 8+(X<<3) is known to have the
2387     // low 3 bits clear.
2388     // Output known-0 bits are also known if the top bits of each input are
2389     // known to be clear. For example, if one input has the top 10 bits clear
2390     // and the other has the top 8 bits clear, we know the top 7 bits of the
2391     // output must be clear.
2392     computeKnownBits(Op.getOperand(0), KnownZero2, KnownOne2, Depth+1);
2393     unsigned KnownZeroHigh = KnownZero2.countLeadingOnes();
2394     unsigned KnownZeroLow = KnownZero2.countTrailingOnes();
2395
2396     computeKnownBits(Op.getOperand(1), KnownZero2, KnownOne2, Depth+1);
2397     KnownZeroHigh = std::min(KnownZeroHigh,
2398                              KnownZero2.countLeadingOnes());
2399     KnownZeroLow = std::min(KnownZeroLow,
2400                             KnownZero2.countTrailingOnes());
2401
2402     if (Op.getOpcode() == ISD::ADD) {
2403       KnownZero |= APInt::getLowBitsSet(BitWidth, KnownZeroLow);
2404       if (KnownZeroHigh > 1)
2405         KnownZero |= APInt::getHighBitsSet(BitWidth, KnownZeroHigh - 1);
2406       break;
2407     }
2408
2409     // With ADDE, a carry bit may be added in, so we can only use this
2410     // information if we know (at least) that the low two bits are clear.  We
2411     // then return to the caller that the low bit is unknown but that other bits
2412     // are known zero.
2413     if (KnownZeroLow >= 2) // ADDE
2414       KnownZero |= APInt::getBitsSet(BitWidth, 1, KnownZeroLow);
2415     break;
2416   }
2417   case ISD::SREM:
2418     if (ConstantSDNode *Rem = dyn_cast<ConstantSDNode>(Op.getOperand(1))) {
2419       const APInt &RA = Rem->getAPIntValue().abs();
2420       if (RA.isPowerOf2()) {
2421         APInt LowBits = RA - 1;
2422         computeKnownBits(Op.getOperand(0), KnownZero2,KnownOne2,Depth+1);
2423
2424         // The low bits of the first operand are unchanged by the srem.
2425         KnownZero = KnownZero2 & LowBits;
2426         KnownOne = KnownOne2 & LowBits;
2427
2428         // If the first operand is non-negative or has all low bits zero, then
2429         // the upper bits are all zero.
2430         if (KnownZero2[BitWidth-1] || ((KnownZero2 & LowBits) == LowBits))
2431           KnownZero |= ~LowBits;
2432
2433         // If the first operand is negative and not all low bits are zero, then
2434         // the upper bits are all one.
2435         if (KnownOne2[BitWidth-1] && ((KnownOne2 & LowBits) != 0))
2436           KnownOne |= ~LowBits;
2437         assert((KnownZero & KnownOne) == 0&&"Bits known to be one AND zero?");
2438       }
2439     }
2440     break;
2441   case ISD::UREM: {
2442     if (ConstantSDNode *Rem = dyn_cast<ConstantSDNode>(Op.getOperand(1))) {
2443       const APInt &RA = Rem->getAPIntValue();
2444       if (RA.isPowerOf2()) {
2445         APInt LowBits = (RA - 1);
2446         computeKnownBits(Op.getOperand(0), KnownZero2, KnownOne2, Depth + 1);
2447
2448         // The upper bits are all zero, the lower ones are unchanged.
2449         KnownZero = KnownZero2 | ~LowBits;
2450         KnownOne = KnownOne2 & LowBits;
2451         break;
2452       }
2453     }
2454
2455     // Since the result is less than or equal to either operand, any leading
2456     // zero bits in either operand must also exist in the result.
2457     computeKnownBits(Op.getOperand(0), KnownZero, KnownOne, Depth+1);
2458     computeKnownBits(Op.getOperand(1), KnownZero2, KnownOne2, Depth+1);
2459
2460     uint32_t Leaders = std::max(KnownZero.countLeadingOnes(),
2461                                 KnownZero2.countLeadingOnes());
2462     KnownOne.clearAllBits();
2463     KnownZero = APInt::getHighBitsSet(BitWidth, Leaders);
2464     break;
2465   }
2466   case ISD::EXTRACT_ELEMENT: {
2467     computeKnownBits(Op.getOperand(0), KnownZero, KnownOne, Depth+1);
2468     const unsigned Index =
2469       cast<ConstantSDNode>(Op.getOperand(1))->getZExtValue();
2470     const unsigned BitWidth = Op.getValueType().getSizeInBits();
2471
2472     // Remove low part of known bits mask
2473     KnownZero = KnownZero.getHiBits(KnownZero.getBitWidth() - Index * BitWidth);
2474     KnownOne = KnownOne.getHiBits(KnownOne.getBitWidth() - Index * BitWidth);
2475
2476     // Remove high part of known bit mask
2477     KnownZero = KnownZero.trunc(BitWidth);
2478     KnownOne = KnownOne.trunc(BitWidth);
2479     break;
2480   }
2481   case ISD::SMIN:
2482   case ISD::SMAX:
2483   case ISD::UMIN:
2484   case ISD::UMAX: {
2485     APInt Op0Zero, Op0One;
2486     APInt Op1Zero, Op1One;
2487     computeKnownBits(Op.getOperand(0), Op0Zero, Op0One, Depth);
2488     computeKnownBits(Op.getOperand(1), Op1Zero, Op1One, Depth);
2489
2490     KnownZero = Op0Zero & Op1Zero;
2491     KnownOne = Op0One & Op1One;
2492     break;
2493   }
2494   case ISD::FrameIndex:
2495   case ISD::TargetFrameIndex:
2496     if (unsigned Align = InferPtrAlignment(Op)) {
2497       // The low bits are known zero if the pointer is aligned.
2498       KnownZero = APInt::getLowBitsSet(BitWidth, Log2_32(Align));
2499       break;
2500     }
2501     break;
2502
2503   default:
2504     if (Op.getOpcode() < ISD::BUILTIN_OP_END)
2505       break;
2506     // Fallthrough
2507   case ISD::INTRINSIC_WO_CHAIN:
2508   case ISD::INTRINSIC_W_CHAIN:
2509   case ISD::INTRINSIC_VOID:
2510     // Allow the target to implement this method for its nodes.
2511     TLI->computeKnownBitsForTargetNode(Op, KnownZero, KnownOne, *this, Depth);
2512     break;
2513   }
2514
2515   assert((KnownZero & KnownOne) == 0 && "Bits known to be one AND zero?");
2516 }
2517
2518 /// ComputeNumSignBits - Return the number of times the sign bit of the
2519 /// register is replicated into the other bits.  We know that at least 1 bit
2520 /// is always equal to the sign bit (itself), but other cases can give us
2521 /// information.  For example, immediately after an "SRA X, 2", we know that
2522 /// the top 3 bits are all equal to each other, so we return 3.
2523 unsigned SelectionDAG::ComputeNumSignBits(SDValue Op, unsigned Depth) const{
2524   EVT VT = Op.getValueType();
2525   assert(VT.isInteger() && "Invalid VT!");
2526   unsigned VTBits = VT.getScalarType().getSizeInBits();
2527   unsigned Tmp, Tmp2;
2528   unsigned FirstAnswer = 1;
2529
2530   if (Depth == 6)
2531     return 1;  // Limit search depth.
2532
2533   switch (Op.getOpcode()) {
2534   default: break;
2535   case ISD::AssertSext:
2536     Tmp = cast<VTSDNode>(Op.getOperand(1))->getVT().getSizeInBits();
2537     return VTBits-Tmp+1;
2538   case ISD::AssertZext:
2539     Tmp = cast<VTSDNode>(Op.getOperand(1))->getVT().getSizeInBits();
2540     return VTBits-Tmp;
2541
2542   case ISD::Constant: {
2543     const APInt &Val = cast<ConstantSDNode>(Op)->getAPIntValue();
2544     return Val.getNumSignBits();
2545   }
2546
2547   case ISD::SIGN_EXTEND:
2548     Tmp =
2549         VTBits-Op.getOperand(0).getValueType().getScalarType().getSizeInBits();
2550     return ComputeNumSignBits(Op.getOperand(0), Depth+1) + Tmp;
2551
2552   case ISD::SIGN_EXTEND_INREG:
2553     // Max of the input and what this extends.
2554     Tmp =
2555       cast<VTSDNode>(Op.getOperand(1))->getVT().getScalarType().getSizeInBits();
2556     Tmp = VTBits-Tmp+1;
2557
2558     Tmp2 = ComputeNumSignBits(Op.getOperand(0), Depth+1);
2559     return std::max(Tmp, Tmp2);
2560
2561   case ISD::SRA:
2562     Tmp = ComputeNumSignBits(Op.getOperand(0), Depth+1);
2563     // SRA X, C   -> adds C sign bits.
2564     if (ConstantSDNode *C = dyn_cast<ConstantSDNode>(Op.getOperand(1))) {
2565       Tmp += C->getZExtValue();
2566       if (Tmp > VTBits) Tmp = VTBits;
2567     }
2568     return Tmp;
2569   case ISD::SHL:
2570     if (ConstantSDNode *C = dyn_cast<ConstantSDNode>(Op.getOperand(1))) {
2571       // shl destroys sign bits.
2572       Tmp = ComputeNumSignBits(Op.getOperand(0), Depth+1);
2573       if (C->getZExtValue() >= VTBits ||      // Bad shift.
2574           C->getZExtValue() >= Tmp) break;    // Shifted all sign bits out.
2575       return Tmp - C->getZExtValue();
2576     }
2577     break;
2578   case ISD::AND:
2579   case ISD::OR:
2580   case ISD::XOR:    // NOT is handled here.
2581     // Logical binary ops preserve the number of sign bits at the worst.
2582     Tmp = ComputeNumSignBits(Op.getOperand(0), Depth+1);
2583     if (Tmp != 1) {
2584       Tmp2 = ComputeNumSignBits(Op.getOperand(1), Depth+1);
2585       FirstAnswer = std::min(Tmp, Tmp2);
2586       // We computed what we know about the sign bits as our first
2587       // answer. Now proceed to the generic code that uses
2588       // computeKnownBits, and pick whichever answer is better.
2589     }
2590     break;
2591
2592   case ISD::SELECT:
2593     Tmp = ComputeNumSignBits(Op.getOperand(1), Depth+1);
2594     if (Tmp == 1) return 1;  // Early out.
2595     Tmp2 = ComputeNumSignBits(Op.getOperand(2), Depth+1);
2596     return std::min(Tmp, Tmp2);
2597   case ISD::SELECT_CC:
2598     Tmp = ComputeNumSignBits(Op.getOperand(2), Depth+1);
2599     if (Tmp == 1) return 1;  // Early out.
2600     Tmp2 = ComputeNumSignBits(Op.getOperand(3), Depth+1);
2601     return std::min(Tmp, Tmp2);
2602   case ISD::SMIN:
2603   case ISD::SMAX:
2604   case ISD::UMIN:
2605   case ISD::UMAX:
2606     Tmp = ComputeNumSignBits(Op.getOperand(0), Depth + 1);
2607     if (Tmp == 1)
2608       return 1;  // Early out.
2609     Tmp2 = ComputeNumSignBits(Op.getOperand(1), Depth + 1);
2610     return std::min(Tmp, Tmp2);
2611   case ISD::SADDO:
2612   case ISD::UADDO:
2613   case ISD::SSUBO:
2614   case ISD::USUBO:
2615   case ISD::SMULO:
2616   case ISD::UMULO:
2617     if (Op.getResNo() != 1)
2618       break;
2619     // The boolean result conforms to getBooleanContents.  Fall through.
2620     // If setcc returns 0/-1, all bits are sign bits.
2621     // We know that we have an integer-based boolean since these operations
2622     // are only available for integer.
2623     if (TLI->getBooleanContents(Op.getValueType().isVector(), false) ==
2624         TargetLowering::ZeroOrNegativeOneBooleanContent)
2625       return VTBits;
2626     break;
2627   case ISD::SETCC:
2628     // If setcc returns 0/-1, all bits are sign bits.
2629     if (TLI->getBooleanContents(Op.getOperand(0).getValueType()) ==
2630         TargetLowering::ZeroOrNegativeOneBooleanContent)
2631       return VTBits;
2632     break;
2633   case ISD::ROTL:
2634   case ISD::ROTR:
2635     if (ConstantSDNode *C = dyn_cast<ConstantSDNode>(Op.getOperand(1))) {
2636       unsigned RotAmt = C->getZExtValue() & (VTBits-1);
2637
2638       // Handle rotate right by N like a rotate left by 32-N.
2639       if (Op.getOpcode() == ISD::ROTR)
2640         RotAmt = (VTBits-RotAmt) & (VTBits-1);
2641
2642       // If we aren't rotating out all of the known-in sign bits, return the
2643       // number that are left.  This handles rotl(sext(x), 1) for example.
2644       Tmp = ComputeNumSignBits(Op.getOperand(0), Depth+1);
2645       if (Tmp > RotAmt+1) return Tmp-RotAmt;
2646     }
2647     break;
2648   case ISD::ADD:
2649     // Add can have at most one carry bit.  Thus we know that the output
2650     // is, at worst, one more bit than the inputs.
2651     Tmp = ComputeNumSignBits(Op.getOperand(0), Depth+1);
2652     if (Tmp == 1) return 1;  // Early out.
2653
2654     // Special case decrementing a value (ADD X, -1):
2655     if (ConstantSDNode *CRHS = dyn_cast<ConstantSDNode>(Op.getOperand(1)))
2656       if (CRHS->isAllOnesValue()) {
2657         APInt KnownZero, KnownOne;
2658         computeKnownBits(Op.getOperand(0), KnownZero, KnownOne, Depth+1);
2659
2660         // If the input is known to be 0 or 1, the output is 0/-1, which is all
2661         // sign bits set.
2662         if ((KnownZero | APInt(VTBits, 1)).isAllOnesValue())
2663           return VTBits;
2664
2665         // If we are subtracting one from a positive number, there is no carry
2666         // out of the result.
2667         if (KnownZero.isNegative())
2668           return Tmp;
2669       }
2670
2671     Tmp2 = ComputeNumSignBits(Op.getOperand(1), Depth+1);
2672     if (Tmp2 == 1) return 1;
2673     return std::min(Tmp, Tmp2)-1;
2674
2675   case ISD::SUB:
2676     Tmp2 = ComputeNumSignBits(Op.getOperand(1), Depth+1);
2677     if (Tmp2 == 1) return 1;
2678
2679     // Handle NEG.
2680     if (ConstantSDNode *CLHS = dyn_cast<ConstantSDNode>(Op.getOperand(0)))
2681       if (CLHS->isNullValue()) {
2682         APInt KnownZero, KnownOne;
2683         computeKnownBits(Op.getOperand(1), KnownZero, KnownOne, Depth+1);
2684         // If the input is known to be 0 or 1, the output is 0/-1, which is all
2685         // sign bits set.
2686         if ((KnownZero | APInt(VTBits, 1)).isAllOnesValue())
2687           return VTBits;
2688
2689         // If the input is known to be positive (the sign bit is known clear),
2690         // the output of the NEG has the same number of sign bits as the input.
2691         if (KnownZero.isNegative())
2692           return Tmp2;
2693
2694         // Otherwise, we treat this like a SUB.
2695       }
2696
2697     // Sub can have at most one carry bit.  Thus we know that the output
2698     // is, at worst, one more bit than the inputs.
2699     Tmp = ComputeNumSignBits(Op.getOperand(0), Depth+1);
2700     if (Tmp == 1) return 1;  // Early out.
2701     return std::min(Tmp, Tmp2)-1;
2702   case ISD::TRUNCATE:
2703     // FIXME: it's tricky to do anything useful for this, but it is an important
2704     // case for targets like X86.
2705     break;
2706   case ISD::EXTRACT_ELEMENT: {
2707     const int KnownSign = ComputeNumSignBits(Op.getOperand(0), Depth+1);
2708     const int BitWidth = Op.getValueType().getSizeInBits();
2709     const int Items =
2710       Op.getOperand(0).getValueType().getSizeInBits() / BitWidth;
2711
2712     // Get reverse index (starting from 1), Op1 value indexes elements from
2713     // little end. Sign starts at big end.
2714     const int rIndex = Items - 1 -
2715       cast<ConstantSDNode>(Op.getOperand(1))->getZExtValue();
2716
2717     // If the sign portion ends in our element the subtraction gives correct
2718     // result. Otherwise it gives either negative or > bitwidth result
2719     return std::max(std::min(KnownSign - rIndex * BitWidth, BitWidth), 0);
2720   }
2721   }
2722
2723   // If we are looking at the loaded value of the SDNode.
2724   if (Op.getResNo() == 0) {
2725     // Handle LOADX separately here. EXTLOAD case will fallthrough.
2726     if (LoadSDNode *LD = dyn_cast<LoadSDNode>(Op)) {
2727       unsigned ExtType = LD->getExtensionType();
2728       switch (ExtType) {
2729         default: break;
2730         case ISD::SEXTLOAD:    // '17' bits known
2731           Tmp = LD->getMemoryVT().getScalarType().getSizeInBits();
2732           return VTBits-Tmp+1;
2733         case ISD::ZEXTLOAD:    // '16' bits known
2734           Tmp = LD->getMemoryVT().getScalarType().getSizeInBits();
2735           return VTBits-Tmp;
2736       }
2737     }
2738   }
2739
2740   // Allow the target to implement this method for its nodes.
2741   if (Op.getOpcode() >= ISD::BUILTIN_OP_END ||
2742       Op.getOpcode() == ISD::INTRINSIC_WO_CHAIN ||
2743       Op.getOpcode() == ISD::INTRINSIC_W_CHAIN ||
2744       Op.getOpcode() == ISD::INTRINSIC_VOID) {
2745     unsigned NumBits = TLI->ComputeNumSignBitsForTargetNode(Op, *this, Depth);
2746     if (NumBits > 1) FirstAnswer = std::max(FirstAnswer, NumBits);
2747   }
2748
2749   // Finally, if we can prove that the top bits of the result are 0's or 1's,
2750   // use this information.
2751   APInt KnownZero, KnownOne;
2752   computeKnownBits(Op, KnownZero, KnownOne, Depth);
2753
2754   APInt Mask;
2755   if (KnownZero.isNegative()) {        // sign bit is 0
2756     Mask = KnownZero;
2757   } else if (KnownOne.isNegative()) {  // sign bit is 1;
2758     Mask = KnownOne;
2759   } else {
2760     // Nothing known.
2761     return FirstAnswer;
2762   }
2763
2764   // Okay, we know that the sign bit in Mask is set.  Use CLZ to determine
2765   // the number of identical bits in the top of the input value.
2766   Mask = ~Mask;
2767   Mask <<= Mask.getBitWidth()-VTBits;
2768   // Return # leading zeros.  We use 'min' here in case Val was zero before
2769   // shifting.  We don't want to return '64' as for an i32 "0".
2770   return std::max(FirstAnswer, std::min(VTBits, Mask.countLeadingZeros()));
2771 }
2772
2773 /// isBaseWithConstantOffset - Return true if the specified operand is an
2774 /// ISD::ADD with a ConstantSDNode on the right-hand side, or if it is an
2775 /// ISD::OR with a ConstantSDNode that is guaranteed to have the same
2776 /// semantics as an ADD.  This handles the equivalence:
2777 ///     X|Cst == X+Cst iff X&Cst = 0.
2778 bool SelectionDAG::isBaseWithConstantOffset(SDValue Op) const {
2779   if ((Op.getOpcode() != ISD::ADD && Op.getOpcode() != ISD::OR) ||
2780       !isa<ConstantSDNode>(Op.getOperand(1)))
2781     return false;
2782
2783   if (Op.getOpcode() == ISD::OR &&
2784       !MaskedValueIsZero(Op.getOperand(0),
2785                      cast<ConstantSDNode>(Op.getOperand(1))->getAPIntValue()))
2786     return false;
2787
2788   return true;
2789 }
2790
2791
2792 bool SelectionDAG::isKnownNeverNaN(SDValue Op) const {
2793   // If we're told that NaNs won't happen, assume they won't.
2794   if (getTarget().Options.NoNaNsFPMath)
2795     return true;
2796
2797   // If the value is a constant, we can obviously see if it is a NaN or not.
2798   if (const ConstantFPSDNode *C = dyn_cast<ConstantFPSDNode>(Op))
2799     return !C->getValueAPF().isNaN();
2800
2801   // TODO: Recognize more cases here.
2802
2803   return false;
2804 }
2805
2806 bool SelectionDAG::isKnownNeverZero(SDValue Op) const {
2807   // If the value is a constant, we can obviously see if it is a zero or not.
2808   if (const ConstantFPSDNode *C = dyn_cast<ConstantFPSDNode>(Op))
2809     return !C->isZero();
2810
2811   // TODO: Recognize more cases here.
2812   switch (Op.getOpcode()) {
2813   default: break;
2814   case ISD::OR:
2815     if (const ConstantSDNode *C = dyn_cast<ConstantSDNode>(Op.getOperand(1)))
2816       return !C->isNullValue();
2817     break;
2818   }
2819
2820   return false;
2821 }
2822
2823 bool SelectionDAG::isEqualTo(SDValue A, SDValue B) const {
2824   // Check the obvious case.
2825   if (A == B) return true;
2826
2827   // For for negative and positive zero.
2828   if (const ConstantFPSDNode *CA = dyn_cast<ConstantFPSDNode>(A))
2829     if (const ConstantFPSDNode *CB = dyn_cast<ConstantFPSDNode>(B))
2830       if (CA->isZero() && CB->isZero()) return true;
2831
2832   // Otherwise they may not be equal.
2833   return false;
2834 }
2835
2836 bool SelectionDAG::haveNoCommonBitsSet(SDValue A, SDValue B) const {
2837   assert(A.getValueType() == B.getValueType() &&
2838          "Values must have the same type");
2839   APInt AZero, AOne;
2840   APInt BZero, BOne;
2841   computeKnownBits(A, AZero, AOne);
2842   computeKnownBits(B, BZero, BOne);
2843   return (AZero | BZero).isAllOnesValue();
2844 }
2845
2846 /// getNode - Gets or creates the specified node.
2847 ///
2848 SDValue SelectionDAG::getNode(unsigned Opcode, SDLoc DL, EVT VT) {
2849   FoldingSetNodeID ID;
2850   AddNodeIDNode(ID, Opcode, getVTList(VT), None);
2851   void *IP = nullptr;
2852   if (SDNode *E = FindNodeOrInsertPos(ID, DL.getDebugLoc(), IP))
2853     return SDValue(E, 0);
2854
2855   SDNode *N = new (NodeAllocator) SDNode(Opcode, DL.getIROrder(),
2856                                          DL.getDebugLoc(), getVTList(VT));
2857   CSEMap.InsertNode(N, IP);
2858
2859   InsertNode(N);
2860   return SDValue(N, 0);
2861 }
2862
2863 SDValue SelectionDAG::getNode(unsigned Opcode, SDLoc DL,
2864                               EVT VT, SDValue Operand) {
2865   // Constant fold unary operations with an integer constant operand. Even
2866   // opaque constant will be folded, because the folding of unary operations
2867   // doesn't create new constants with different values. Nevertheless, the
2868   // opaque flag is preserved during folding to prevent future folding with
2869   // other constants.
2870   if (ConstantSDNode *C = dyn_cast<ConstantSDNode>(Operand)) {
2871     const APInt &Val = C->getAPIntValue();
2872     switch (Opcode) {
2873     default: break;
2874     case ISD::SIGN_EXTEND:
2875       return getConstant(Val.sextOrTrunc(VT.getSizeInBits()), DL, VT,
2876                          C->isTargetOpcode(), C->isOpaque());
2877     case ISD::ANY_EXTEND:
2878     case ISD::ZERO_EXTEND:
2879     case ISD::TRUNCATE:
2880       return getConstant(Val.zextOrTrunc(VT.getSizeInBits()), DL, VT,
2881                          C->isTargetOpcode(), C->isOpaque());
2882     case ISD::UINT_TO_FP:
2883     case ISD::SINT_TO_FP: {
2884       APFloat apf(EVTToAPFloatSemantics(VT),
2885                   APInt::getNullValue(VT.getSizeInBits()));
2886       (void)apf.convertFromAPInt(Val,
2887                                  Opcode==ISD::SINT_TO_FP,
2888                                  APFloat::rmNearestTiesToEven);
2889       return getConstantFP(apf, DL, VT);
2890     }
2891     case ISD::BITCAST:
2892       if (VT == MVT::f16 && C->getValueType(0) == MVT::i16)
2893         return getConstantFP(APFloat(APFloat::IEEEhalf, Val), DL, VT);
2894       if (VT == MVT::f32 && C->getValueType(0) == MVT::i32)
2895         return getConstantFP(APFloat(APFloat::IEEEsingle, Val), DL, VT);
2896       if (VT == MVT::f64 && C->getValueType(0) == MVT::i64)
2897         return getConstantFP(APFloat(APFloat::IEEEdouble, Val), DL, VT);
2898       if (VT == MVT::f128 && C->getValueType(0) == MVT::i128)
2899         return getConstantFP(APFloat(APFloat::IEEEquad, Val), DL, VT);
2900       break;
2901     case ISD::BSWAP:
2902       return getConstant(Val.byteSwap(), DL, VT, C->isTargetOpcode(),
2903                          C->isOpaque());
2904     case ISD::CTPOP:
2905       return getConstant(Val.countPopulation(), DL, VT, C->isTargetOpcode(),
2906                          C->isOpaque());
2907     case ISD::CTLZ:
2908     case ISD::CTLZ_ZERO_UNDEF:
2909       return getConstant(Val.countLeadingZeros(), DL, VT, C->isTargetOpcode(),
2910                          C->isOpaque());
2911     case ISD::CTTZ:
2912     case ISD::CTTZ_ZERO_UNDEF:
2913       return getConstant(Val.countTrailingZeros(), DL, VT, C->isTargetOpcode(),
2914                          C->isOpaque());
2915     }
2916   }
2917
2918   // Constant fold unary operations with a floating point constant operand.
2919   if (ConstantFPSDNode *C = dyn_cast<ConstantFPSDNode>(Operand)) {
2920     APFloat V = C->getValueAPF();    // make copy
2921     switch (Opcode) {
2922     case ISD::FNEG:
2923       V.changeSign();
2924       return getConstantFP(V, DL, VT);
2925     case ISD::FABS:
2926       V.clearSign();
2927       return getConstantFP(V, DL, VT);
2928     case ISD::FCEIL: {
2929       APFloat::opStatus fs = V.roundToIntegral(APFloat::rmTowardPositive);
2930       if (fs == APFloat::opOK || fs == APFloat::opInexact)
2931         return getConstantFP(V, DL, VT);
2932       break;
2933     }
2934     case ISD::FTRUNC: {
2935       APFloat::opStatus fs = V.roundToIntegral(APFloat::rmTowardZero);
2936       if (fs == APFloat::opOK || fs == APFloat::opInexact)
2937         return getConstantFP(V, DL, VT);
2938       break;
2939     }
2940     case ISD::FFLOOR: {
2941       APFloat::opStatus fs = V.roundToIntegral(APFloat::rmTowardNegative);
2942       if (fs == APFloat::opOK || fs == APFloat::opInexact)
2943         return getConstantFP(V, DL, VT);
2944       break;
2945     }
2946     case ISD::FP_EXTEND: {
2947       bool ignored;
2948       // This can return overflow, underflow, or inexact; we don't care.
2949       // FIXME need to be more flexible about rounding mode.
2950       (void)V.convert(EVTToAPFloatSemantics(VT),
2951                       APFloat::rmNearestTiesToEven, &ignored);
2952       return getConstantFP(V, DL, VT);
2953     }
2954     case ISD::FP_TO_SINT:
2955     case ISD::FP_TO_UINT: {
2956       integerPart x[2];
2957       bool ignored;
2958       static_assert(integerPartWidth >= 64, "APFloat parts too small!");
2959       // FIXME need to be more flexible about rounding mode.
2960       APFloat::opStatus s = V.convertToInteger(x, VT.getSizeInBits(),
2961                             Opcode==ISD::FP_TO_SINT,
2962                             APFloat::rmTowardZero, &ignored);
2963       if (s==APFloat::opInvalidOp)     // inexact is OK, in fact usual
2964         break;
2965       APInt api(VT.getSizeInBits(), x);
2966       return getConstant(api, DL, VT);
2967     }
2968     case ISD::BITCAST:
2969       if (VT == MVT::i16 && C->getValueType(0) == MVT::f16)
2970         return getConstant((uint16_t)V.bitcastToAPInt().getZExtValue(), DL, VT);
2971       else if (VT == MVT::i32 && C->getValueType(0) == MVT::f32)
2972         return getConstant((uint32_t)V.bitcastToAPInt().getZExtValue(), DL, VT);
2973       else if (VT == MVT::i64 && C->getValueType(0) == MVT::f64)
2974         return getConstant(V.bitcastToAPInt().getZExtValue(), DL, VT);
2975       break;
2976     }
2977   }
2978
2979   // Constant fold unary operations with a vector integer or float operand.
2980   if (BuildVectorSDNode *BV = dyn_cast<BuildVectorSDNode>(Operand)) {
2981     if (BV->isConstant()) {
2982       switch (Opcode) {
2983       default:
2984         // FIXME: Entirely reasonable to perform folding of other unary
2985         // operations here as the need arises.
2986         break;
2987       case ISD::FNEG:
2988       case ISD::FABS:
2989       case ISD::FCEIL:
2990       case ISD::FTRUNC:
2991       case ISD::FFLOOR:
2992       case ISD::FP_EXTEND:
2993       case ISD::FP_TO_SINT:
2994       case ISD::FP_TO_UINT:
2995       case ISD::TRUNCATE:
2996       case ISD::UINT_TO_FP:
2997       case ISD::SINT_TO_FP:
2998       case ISD::BSWAP:
2999       case ISD::CTLZ:
3000       case ISD::CTLZ_ZERO_UNDEF:
3001       case ISD::CTTZ:
3002       case ISD::CTTZ_ZERO_UNDEF:
3003       case ISD::CTPOP: {
3004         SDValue Ops = { Operand };
3005         if (SDValue Fold = FoldConstantVectorArithmetic(Opcode, DL, VT, Ops))
3006           return Fold;
3007       }
3008       }
3009     }
3010   }
3011
3012   unsigned OpOpcode = Operand.getNode()->getOpcode();
3013   switch (Opcode) {
3014   case ISD::TokenFactor:
3015   case ISD::MERGE_VALUES:
3016   case ISD::CONCAT_VECTORS:
3017     return Operand;         // Factor, merge or concat of one node?  No need.
3018   case ISD::FP_ROUND: llvm_unreachable("Invalid method to make FP_ROUND node");
3019   case ISD::FP_EXTEND:
3020     assert(VT.isFloatingPoint() &&
3021            Operand.getValueType().isFloatingPoint() && "Invalid FP cast!");
3022     if (Operand.getValueType() == VT) return Operand;  // noop conversion.
3023     assert((!VT.isVector() ||
3024             VT.getVectorNumElements() ==
3025             Operand.getValueType().getVectorNumElements()) &&
3026            "Vector element count mismatch!");
3027     assert(Operand.getValueType().bitsLT(VT) &&
3028            "Invalid fpext node, dst < src!");
3029     if (Operand.getOpcode() == ISD::UNDEF)
3030       return getUNDEF(VT);
3031     break;
3032   case ISD::SIGN_EXTEND:
3033     assert(VT.isInteger() && Operand.getValueType().isInteger() &&
3034            "Invalid SIGN_EXTEND!");
3035     if (Operand.getValueType() == VT) return Operand;   // noop extension
3036     assert((!VT.isVector() ||
3037             VT.getVectorNumElements() ==
3038             Operand.getValueType().getVectorNumElements()) &&
3039            "Vector element count mismatch!");
3040     assert(Operand.getValueType().bitsLT(VT) &&
3041            "Invalid sext node, dst < src!");
3042     if (OpOpcode == ISD::SIGN_EXTEND || OpOpcode == ISD::ZERO_EXTEND)
3043       return getNode(OpOpcode, DL, VT, Operand.getNode()->getOperand(0));
3044     else if (OpOpcode == ISD::UNDEF)
3045       // sext(undef) = 0, because the top bits will all be the same.
3046       return getConstant(0, DL, VT);
3047     break;
3048   case ISD::ZERO_EXTEND:
3049     assert(VT.isInteger() && Operand.getValueType().isInteger() &&
3050            "Invalid ZERO_EXTEND!");
3051     if (Operand.getValueType() == VT) return Operand;   // noop extension
3052     assert((!VT.isVector() ||
3053             VT.getVectorNumElements() ==
3054             Operand.getValueType().getVectorNumElements()) &&
3055            "Vector element count mismatch!");
3056     assert(Operand.getValueType().bitsLT(VT) &&
3057            "Invalid zext node, dst < src!");
3058     if (OpOpcode == ISD::ZERO_EXTEND)   // (zext (zext x)) -> (zext x)
3059       return getNode(ISD::ZERO_EXTEND, DL, VT,
3060                      Operand.getNode()->getOperand(0));
3061     else if (OpOpcode == ISD::UNDEF)
3062       // zext(undef) = 0, because the top bits will be zero.
3063       return getConstant(0, DL, VT);
3064     break;
3065   case ISD::ANY_EXTEND:
3066     assert(VT.isInteger() && Operand.getValueType().isInteger() &&
3067            "Invalid ANY_EXTEND!");
3068     if (Operand.getValueType() == VT) return Operand;   // noop extension
3069     assert((!VT.isVector() ||
3070             VT.getVectorNumElements() ==
3071             Operand.getValueType().getVectorNumElements()) &&
3072            "Vector element count mismatch!");
3073     assert(Operand.getValueType().bitsLT(VT) &&
3074            "Invalid anyext node, dst < src!");
3075
3076     if (OpOpcode == ISD::ZERO_EXTEND || OpOpcode == ISD::SIGN_EXTEND ||
3077         OpOpcode == ISD::ANY_EXTEND)
3078       // (ext (zext x)) -> (zext x)  and  (ext (sext x)) -> (sext x)
3079       return getNode(OpOpcode, DL, VT, Operand.getNode()->getOperand(0));
3080     else if (OpOpcode == ISD::UNDEF)
3081       return getUNDEF(VT);
3082
3083     // (ext (trunx x)) -> x
3084     if (OpOpcode == ISD::TRUNCATE) {
3085       SDValue OpOp = Operand.getNode()->getOperand(0);
3086       if (OpOp.getValueType() == VT)
3087         return OpOp;
3088     }
3089     break;
3090   case ISD::TRUNCATE:
3091     assert(VT.isInteger() && Operand.getValueType().isInteger() &&
3092            "Invalid TRUNCATE!");
3093     if (Operand.getValueType() == VT) return Operand;   // noop truncate
3094     assert((!VT.isVector() ||
3095             VT.getVectorNumElements() ==
3096             Operand.getValueType().getVectorNumElements()) &&
3097            "Vector element count mismatch!");
3098     assert(Operand.getValueType().bitsGT(VT) &&
3099            "Invalid truncate node, src < dst!");
3100     if (OpOpcode == ISD::TRUNCATE)
3101       return getNode(ISD::TRUNCATE, DL, VT, Operand.getNode()->getOperand(0));
3102     if (OpOpcode == ISD::ZERO_EXTEND || OpOpcode == ISD::SIGN_EXTEND ||
3103         OpOpcode == ISD::ANY_EXTEND) {
3104       // If the source is smaller than the dest, we still need an extend.
3105       if (Operand.getNode()->getOperand(0).getValueType().getScalarType()
3106             .bitsLT(VT.getScalarType()))
3107         return getNode(OpOpcode, DL, VT, Operand.getNode()->getOperand(0));
3108       if (Operand.getNode()->getOperand(0).getValueType().bitsGT(VT))
3109         return getNode(ISD::TRUNCATE, DL, VT, Operand.getNode()->getOperand(0));
3110       return Operand.getNode()->getOperand(0);
3111     }
3112     if (OpOpcode == ISD::UNDEF)
3113       return getUNDEF(VT);
3114     break;
3115   case ISD::BSWAP:
3116     assert(VT.isInteger() && VT == Operand.getValueType() &&
3117            "Invalid BSWAP!");
3118     assert((VT.getScalarSizeInBits() % 16 == 0) &&
3119            "BSWAP types must be a multiple of 16 bits!");
3120     if (OpOpcode == ISD::UNDEF)
3121       return getUNDEF(VT);
3122     break;
3123   case ISD::BITCAST:
3124     // Basic sanity checking.
3125     assert(VT.getSizeInBits() == Operand.getValueType().getSizeInBits()
3126            && "Cannot BITCAST between types of different sizes!");
3127     if (VT == Operand.getValueType()) return Operand;  // noop conversion.
3128     if (OpOpcode == ISD::BITCAST)  // bitconv(bitconv(x)) -> bitconv(x)
3129       return getNode(ISD::BITCAST, DL, VT, Operand.getOperand(0));
3130     if (OpOpcode == ISD::UNDEF)
3131       return getUNDEF(VT);
3132     break;
3133   case ISD::SCALAR_TO_VECTOR:
3134     assert(VT.isVector() && !Operand.getValueType().isVector() &&
3135            (VT.getVectorElementType() == Operand.getValueType() ||
3136             (VT.getVectorElementType().isInteger() &&
3137              Operand.getValueType().isInteger() &&
3138              VT.getVectorElementType().bitsLE(Operand.getValueType()))) &&
3139            "Illegal SCALAR_TO_VECTOR node!");
3140     if (OpOpcode == ISD::UNDEF)
3141       return getUNDEF(VT);
3142     // scalar_to_vector(extract_vector_elt V, 0) -> V, top bits are undefined.
3143     if (OpOpcode == ISD::EXTRACT_VECTOR_ELT &&
3144         isa<ConstantSDNode>(Operand.getOperand(1)) &&
3145         Operand.getConstantOperandVal(1) == 0 &&
3146         Operand.getOperand(0).getValueType() == VT)
3147       return Operand.getOperand(0);
3148     break;
3149   case ISD::FNEG:
3150     // -(X-Y) -> (Y-X) is unsafe because when X==Y, -0.0 != +0.0
3151     if (getTarget().Options.UnsafeFPMath && OpOpcode == ISD::FSUB)
3152       // FIXME: FNEG has no fast-math-flags to propagate; use the FSUB's flags?
3153       return getNode(ISD::FSUB, DL, VT, Operand.getNode()->getOperand(1),
3154                        Operand.getNode()->getOperand(0),
3155                        &cast<BinaryWithFlagsSDNode>(Operand.getNode())->Flags);
3156     if (OpOpcode == ISD::FNEG)  // --X -> X
3157       return Operand.getNode()->getOperand(0);
3158     break;
3159   case ISD::FABS:
3160     if (OpOpcode == ISD::FNEG)  // abs(-X) -> abs(X)
3161       return getNode(ISD::FABS, DL, VT, Operand.getNode()->getOperand(0));
3162     break;
3163   }
3164
3165   SDNode *N;
3166   SDVTList VTs = getVTList(VT);
3167   if (VT != MVT::Glue) { // Don't CSE flag producing nodes
3168     FoldingSetNodeID ID;
3169     SDValue Ops[1] = { Operand };
3170     AddNodeIDNode(ID, Opcode, VTs, Ops);
3171     void *IP = nullptr;
3172     if (SDNode *E = FindNodeOrInsertPos(ID, DL.getDebugLoc(), IP))
3173       return SDValue(E, 0);
3174
3175     N = new (NodeAllocator) UnarySDNode(Opcode, DL.getIROrder(),
3176                                         DL.getDebugLoc(), VTs, Operand);
3177     CSEMap.InsertNode(N, IP);
3178   } else {
3179     N = new (NodeAllocator) UnarySDNode(Opcode, DL.getIROrder(),
3180                                         DL.getDebugLoc(), VTs, Operand);
3181   }
3182
3183   InsertNode(N);
3184   return SDValue(N, 0);
3185 }
3186
3187 static std::pair<APInt, bool> FoldValue(unsigned Opcode, const APInt &C1,
3188                                         const APInt &C2) {
3189   switch (Opcode) {
3190   case ISD::ADD:  return std::make_pair(C1 + C2, true);
3191   case ISD::SUB:  return std::make_pair(C1 - C2, true);
3192   case ISD::MUL:  return std::make_pair(C1 * C2, true);
3193   case ISD::AND:  return std::make_pair(C1 & C2, true);
3194   case ISD::OR:   return std::make_pair(C1 | C2, true);
3195   case ISD::XOR:  return std::make_pair(C1 ^ C2, true);
3196   case ISD::SHL:  return std::make_pair(C1 << C2, true);
3197   case ISD::SRL:  return std::make_pair(C1.lshr(C2), true);
3198   case ISD::SRA:  return std::make_pair(C1.ashr(C2), true);
3199   case ISD::ROTL: return std::make_pair(C1.rotl(C2), true);
3200   case ISD::ROTR: return std::make_pair(C1.rotr(C2), true);
3201   case ISD::SMIN: return std::make_pair(C1.sle(C2) ? C1 : C2, true);
3202   case ISD::SMAX: return std::make_pair(C1.sge(C2) ? C1 : C2, true);
3203   case ISD::UMIN: return std::make_pair(C1.ule(C2) ? C1 : C2, true);
3204   case ISD::UMAX: return std::make_pair(C1.uge(C2) ? C1 : C2, true);
3205   case ISD::UDIV:
3206     if (!C2.getBoolValue())
3207       break;
3208     return std::make_pair(C1.udiv(C2), true);
3209   case ISD::UREM:
3210     if (!C2.getBoolValue())
3211       break;
3212     return std::make_pair(C1.urem(C2), true);
3213   case ISD::SDIV:
3214     if (!C2.getBoolValue())
3215       break;
3216     return std::make_pair(C1.sdiv(C2), true);
3217   case ISD::SREM:
3218     if (!C2.getBoolValue())
3219       break;
3220     return std::make_pair(C1.srem(C2), true);
3221   }
3222   return std::make_pair(APInt(1, 0), false);
3223 }
3224
3225 SDValue SelectionDAG::FoldConstantArithmetic(unsigned Opcode, SDLoc DL, EVT VT,
3226                                              const ConstantSDNode *Cst1,
3227                                              const ConstantSDNode *Cst2) {
3228   if (Cst1->isOpaque() || Cst2->isOpaque())
3229     return SDValue();
3230
3231   std::pair<APInt, bool> Folded = FoldValue(Opcode, Cst1->getAPIntValue(),
3232                                             Cst2->getAPIntValue());
3233   if (!Folded.second)
3234     return SDValue();
3235   return getConstant(Folded.first, DL, VT);
3236 }
3237
3238 SDValue SelectionDAG::FoldConstantArithmetic(unsigned Opcode, SDLoc DL, EVT VT,
3239                                              SDNode *Cst1, SDNode *Cst2) {
3240   // If the opcode is a target-specific ISD node, there's nothing we can
3241   // do here and the operand rules may not line up with the below, so
3242   // bail early.
3243   if (Opcode >= ISD::BUILTIN_OP_END)
3244     return SDValue();
3245
3246   // Handle the case of two scalars.
3247   if (const ConstantSDNode *Scalar1 = dyn_cast<ConstantSDNode>(Cst1)) {
3248     if (const ConstantSDNode *Scalar2 = dyn_cast<ConstantSDNode>(Cst2)) {
3249       if (SDValue Folded =
3250           FoldConstantArithmetic(Opcode, DL, VT, Scalar1, Scalar2)) {
3251         if (!VT.isVector())
3252           return Folded;
3253         SmallVector<SDValue, 4> Outputs;
3254         // We may have a vector type but a scalar result. Create a splat.
3255         Outputs.resize(VT.getVectorNumElements(), Outputs.back());
3256         // Build a big vector out of the scalar elements we generated.
3257         return getNode(ISD::BUILD_VECTOR, SDLoc(), VT, Outputs);
3258       } else {
3259         return SDValue();
3260       }
3261     }
3262   }
3263
3264   // For vectors extract each constant element into Inputs so we can constant
3265   // fold them individually.
3266   BuildVectorSDNode *BV1 = dyn_cast<BuildVectorSDNode>(Cst1);
3267   BuildVectorSDNode *BV2 = dyn_cast<BuildVectorSDNode>(Cst2);
3268   if (!BV1 || !BV2)
3269     return SDValue();
3270
3271   assert(BV1->getNumOperands() == BV2->getNumOperands() && "Out of sync!");
3272
3273   EVT SVT = VT.getScalarType();
3274   SmallVector<SDValue, 4> Outputs;
3275   for (unsigned I = 0, E = BV1->getNumOperands(); I != E; ++I) {
3276     ConstantSDNode *V1 = dyn_cast<ConstantSDNode>(BV1->getOperand(I));
3277     ConstantSDNode *V2 = dyn_cast<ConstantSDNode>(BV2->getOperand(I));
3278     if (!V1 || !V2) // Not a constant, bail.
3279       return SDValue();
3280
3281     if (V1->isOpaque() || V2->isOpaque())
3282       return SDValue();
3283
3284     // Avoid BUILD_VECTOR nodes that perform implicit truncation.
3285     // FIXME: This is valid and could be handled by truncating the APInts.
3286     if (V1->getValueType(0) != SVT || V2->getValueType(0) != SVT)
3287       return SDValue();
3288
3289     // Fold one vector element.
3290     std::pair<APInt, bool> Folded = FoldValue(Opcode, V1->getAPIntValue(),
3291                                               V2->getAPIntValue());
3292     if (!Folded.second)
3293       return SDValue();
3294     Outputs.push_back(getConstant(Folded.first, DL, SVT));
3295   }
3296
3297   assert(VT.getVectorNumElements() == Outputs.size() &&
3298          "Vector size mismatch!");
3299
3300   // We may have a vector type but a scalar result. Create a splat.
3301   Outputs.resize(VT.getVectorNumElements(), Outputs.back());
3302
3303   // Build a big vector out of the scalar elements we generated.
3304   return getNode(ISD::BUILD_VECTOR, SDLoc(), VT, Outputs);
3305 }
3306
3307 SDValue SelectionDAG::FoldConstantVectorArithmetic(unsigned Opcode, SDLoc DL,
3308                                                    EVT VT,
3309                                                    ArrayRef<SDValue> Ops,
3310                                                    const SDNodeFlags *Flags) {
3311   // If the opcode is a target-specific ISD node, there's nothing we can
3312   // do here and the operand rules may not line up with the below, so
3313   // bail early.
3314   if (Opcode >= ISD::BUILTIN_OP_END)
3315     return SDValue();
3316
3317   // We can only fold vectors - maybe merge with FoldConstantArithmetic someday?
3318   if (!VT.isVector())
3319     return SDValue();
3320
3321   unsigned NumElts = VT.getVectorNumElements();
3322
3323   auto IsScalarOrSameVectorSize = [&](const SDValue &Op) {
3324     return !Op.getValueType().isVector() ||
3325            Op.getValueType().getVectorNumElements() == NumElts;
3326   };
3327
3328   auto IsConstantBuildVectorOrUndef = [&](const SDValue &Op) {
3329     BuildVectorSDNode *BV = dyn_cast<BuildVectorSDNode>(Op);
3330     return (Op.getOpcode() == ISD::UNDEF) ||
3331            (Op.getOpcode() == ISD::CONDCODE) || (BV && BV->isConstant());
3332   };
3333
3334   // All operands must be vector types with the same number of elements as
3335   // the result type and must be either UNDEF or a build vector of constant
3336   // or UNDEF scalars.
3337   if (!std::all_of(Ops.begin(), Ops.end(), IsConstantBuildVectorOrUndef) ||
3338       !std::all_of(Ops.begin(), Ops.end(), IsScalarOrSameVectorSize))
3339     return SDValue();
3340
3341   // If we are comparing vectors, then the result needs to be a i1 boolean
3342   // that is then sign-extended back to the legal result type.
3343   EVT SVT = (Opcode == ISD::SETCC ? MVT::i1 : VT.getScalarType());
3344
3345   // Find legal integer scalar type for constant promotion and
3346   // ensure that its scalar size is at least as large as source.
3347   EVT LegalSVT = VT.getScalarType();
3348   if (LegalSVT.isInteger()) {
3349     LegalSVT = TLI->getTypeToTransformTo(*getContext(), LegalSVT);
3350     if (LegalSVT.bitsLT(SVT))
3351       return SDValue();
3352   }
3353
3354   // Constant fold each scalar lane separately.
3355   SmallVector<SDValue, 4> ScalarResults;
3356   for (unsigned i = 0; i != NumElts; i++) {
3357     SmallVector<SDValue, 4> ScalarOps;
3358     for (SDValue Op : Ops) {
3359       EVT InSVT = Op.getValueType().getScalarType();
3360       BuildVectorSDNode *InBV = dyn_cast<BuildVectorSDNode>(Op);
3361       if (!InBV) {
3362         // We've checked that this is UNDEF or a constant of some kind.
3363         if (Op.isUndef())
3364           ScalarOps.push_back(getUNDEF(InSVT));
3365         else
3366           ScalarOps.push_back(Op);
3367         continue;
3368       }
3369
3370       SDValue ScalarOp = InBV->getOperand(i);
3371       EVT ScalarVT = ScalarOp.getValueType();
3372
3373       // Build vector (integer) scalar operands may need implicit
3374       // truncation - do this before constant folding.
3375       if (ScalarVT.isInteger() && ScalarVT.bitsGT(InSVT))
3376         ScalarOp = getNode(ISD::TRUNCATE, DL, InSVT, ScalarOp);
3377
3378       ScalarOps.push_back(ScalarOp);
3379     }
3380
3381     // Constant fold the scalar operands.
3382     SDValue ScalarResult = getNode(Opcode, DL, SVT, ScalarOps, Flags);
3383
3384     // Legalize the (integer) scalar constant if necessary.
3385     if (LegalSVT != SVT)
3386       ScalarResult = getNode(ISD::SIGN_EXTEND, DL, LegalSVT, ScalarResult);
3387
3388     // Scalar folding only succeeded if the result is a constant or UNDEF.
3389     if (ScalarResult.getOpcode() != ISD::UNDEF &&
3390         ScalarResult.getOpcode() != ISD::Constant &&
3391         ScalarResult.getOpcode() != ISD::ConstantFP)
3392       return SDValue();
3393     ScalarResults.push_back(ScalarResult);
3394   }
3395
3396   assert(ScalarResults.size() == NumElts &&
3397          "Unexpected number of scalar results for BUILD_VECTOR");
3398   return getNode(ISD::BUILD_VECTOR, DL, VT, ScalarResults);
3399 }
3400
3401 SDValue SelectionDAG::getNode(unsigned Opcode, SDLoc DL, EVT VT, SDValue N1,
3402                               SDValue N2, const SDNodeFlags *Flags) {
3403   ConstantSDNode *N1C = dyn_cast<ConstantSDNode>(N1);
3404   ConstantSDNode *N2C = dyn_cast<ConstantSDNode>(N2);
3405   ConstantFPSDNode *N1CFP = dyn_cast<ConstantFPSDNode>(N1);
3406   ConstantFPSDNode *N2CFP = dyn_cast<ConstantFPSDNode>(N2);
3407
3408   // Canonicalize constant to RHS if commutative.
3409   if (isCommutativeBinOp(Opcode)) {
3410     if (N1C && !N2C) {
3411       std::swap(N1C, N2C);
3412       std::swap(N1, N2);
3413     } else if (N1CFP && !N2CFP) {
3414       std::swap(N1CFP, N2CFP);
3415       std::swap(N1, N2);
3416     }
3417   }
3418
3419   switch (Opcode) {
3420   default: break;
3421   case ISD::TokenFactor:
3422     assert(VT == MVT::Other && N1.getValueType() == MVT::Other &&
3423            N2.getValueType() == MVT::Other && "Invalid token factor!");
3424     // Fold trivial token factors.
3425     if (N1.getOpcode() == ISD::EntryToken) return N2;
3426     if (N2.getOpcode() == ISD::EntryToken) return N1;
3427     if (N1 == N2) return N1;
3428     break;
3429   case ISD::CONCAT_VECTORS:
3430     // Concat of UNDEFs is UNDEF.
3431     if (N1.getOpcode() == ISD::UNDEF &&
3432         N2.getOpcode() == ISD::UNDEF)
3433       return getUNDEF(VT);
3434
3435     // A CONCAT_VECTOR with all operands BUILD_VECTOR can be simplified to
3436     // one big BUILD_VECTOR.
3437     if (N1.getOpcode() == ISD::BUILD_VECTOR &&
3438         N2.getOpcode() == ISD::BUILD_VECTOR) {
3439       SmallVector<SDValue, 16> Elts(N1.getNode()->op_begin(),
3440                                     N1.getNode()->op_end());
3441       Elts.append(N2.getNode()->op_begin(), N2.getNode()->op_end());
3442
3443       // BUILD_VECTOR requires all inputs to be of the same type, find the
3444       // maximum type and extend them all.
3445       EVT SVT = VT.getScalarType();
3446       for (SDValue Op : Elts)
3447         SVT = (SVT.bitsLT(Op.getValueType()) ? Op.getValueType() : SVT);
3448       if (SVT.bitsGT(VT.getScalarType()))
3449         for (SDValue &Op : Elts)
3450           Op = TLI->isZExtFree(Op.getValueType(), SVT)
3451              ? getZExtOrTrunc(Op, DL, SVT)
3452              : getSExtOrTrunc(Op, DL, SVT);
3453
3454       return getNode(ISD::BUILD_VECTOR, DL, VT, Elts);
3455     }
3456     break;
3457   case ISD::AND:
3458     assert(VT.isInteger() && "This operator does not apply to FP types!");
3459     assert(N1.getValueType() == N2.getValueType() &&
3460            N1.getValueType() == VT && "Binary operator types must match!");
3461     // (X & 0) -> 0.  This commonly occurs when legalizing i64 values, so it's
3462     // worth handling here.
3463     if (N2C && N2C->isNullValue())
3464       return N2;
3465     if (N2C && N2C->isAllOnesValue())  // X & -1 -> X
3466       return N1;
3467     break;
3468   case ISD::OR:
3469   case ISD::XOR:
3470   case ISD::ADD:
3471   case ISD::SUB:
3472     assert(VT.isInteger() && "This operator does not apply to FP types!");
3473     assert(N1.getValueType() == N2.getValueType() &&
3474            N1.getValueType() == VT && "Binary operator types must match!");
3475     // (X ^|+- 0) -> X.  This commonly occurs when legalizing i64 values, so
3476     // it's worth handling here.
3477     if (N2C && N2C->isNullValue())
3478       return N1;
3479     break;
3480   case ISD::UDIV:
3481   case ISD::UREM:
3482   case ISD::MULHU:
3483   case ISD::MULHS:
3484   case ISD::MUL:
3485   case ISD::SDIV:
3486   case ISD::SREM:
3487   case ISD::SMIN:
3488   case ISD::SMAX:
3489   case ISD::UMIN:
3490   case ISD::UMAX:
3491     assert(VT.isInteger() && "This operator does not apply to FP types!");
3492     assert(N1.getValueType() == N2.getValueType() &&
3493            N1.getValueType() == VT && "Binary operator types must match!");
3494     break;
3495   case ISD::FADD:
3496   case ISD::FSUB:
3497   case ISD::FMUL:
3498   case ISD::FDIV:
3499   case ISD::FREM:
3500     if (getTarget().Options.UnsafeFPMath) {
3501       if (Opcode == ISD::FADD) {
3502         // x+0 --> x
3503         if (N2CFP && N2CFP->getValueAPF().isZero())
3504           return N1;
3505       } else if (Opcode == ISD::FSUB) {
3506         // x-0 --> x
3507         if (N2CFP && N2CFP->getValueAPF().isZero())
3508           return N1;
3509       } else if (Opcode == ISD::FMUL) {
3510         // x*0 --> 0
3511         if (N2CFP && N2CFP->isZero())
3512           return N2;
3513         // x*1 --> x
3514         if (N2CFP && N2CFP->isExactlyValue(1.0))
3515           return N1;
3516       }
3517     }
3518     assert(VT.isFloatingPoint() && "This operator only applies to FP types!");
3519     assert(N1.getValueType() == N2.getValueType() &&
3520            N1.getValueType() == VT && "Binary operator types must match!");
3521     break;
3522   case ISD::FCOPYSIGN:   // N1 and result must match.  N1/N2 need not match.
3523     assert(N1.getValueType() == VT &&
3524            N1.getValueType().isFloatingPoint() &&
3525            N2.getValueType().isFloatingPoint() &&
3526            "Invalid FCOPYSIGN!");
3527     break;
3528   case ISD::SHL:
3529   case ISD::SRA:
3530   case ISD::SRL:
3531   case ISD::ROTL:
3532   case ISD::ROTR:
3533     assert(VT == N1.getValueType() &&
3534            "Shift operators return type must be the same as their first arg");
3535     assert(VT.isInteger() && N2.getValueType().isInteger() &&
3536            "Shifts only work on integers");
3537     assert((!VT.isVector() || VT == N2.getValueType()) &&
3538            "Vector shift amounts must be in the same as their first arg");
3539     // Verify that the shift amount VT is bit enough to hold valid shift
3540     // amounts.  This catches things like trying to shift an i1024 value by an
3541     // i8, which is easy to fall into in generic code that uses
3542     // TLI.getShiftAmount().
3543     assert(N2.getValueType().getSizeInBits() >=
3544                    Log2_32_Ceil(N1.getValueType().getSizeInBits()) &&
3545            "Invalid use of small shift amount with oversized value!");
3546
3547     // Always fold shifts of i1 values so the code generator doesn't need to
3548     // handle them.  Since we know the size of the shift has to be less than the
3549     // size of the value, the shift/rotate count is guaranteed to be zero.
3550     if (VT == MVT::i1)
3551       return N1;
3552     if (N2C && N2C->isNullValue())
3553       return N1;
3554     break;
3555   case ISD::FP_ROUND_INREG: {
3556     EVT EVT = cast<VTSDNode>(N2)->getVT();
3557     assert(VT == N1.getValueType() && "Not an inreg round!");
3558     assert(VT.isFloatingPoint() && EVT.isFloatingPoint() &&
3559            "Cannot FP_ROUND_INREG integer types");
3560     assert(EVT.isVector() == VT.isVector() &&
3561            "FP_ROUND_INREG type should be vector iff the operand "
3562            "type is vector!");
3563     assert((!EVT.isVector() ||
3564             EVT.getVectorNumElements() == VT.getVectorNumElements()) &&
3565            "Vector element counts must match in FP_ROUND_INREG");
3566     assert(EVT.bitsLE(VT) && "Not rounding down!");
3567     (void)EVT;
3568     if (cast<VTSDNode>(N2)->getVT() == VT) return N1;  // Not actually rounding.
3569     break;
3570   }
3571   case ISD::FP_ROUND:
3572     assert(VT.isFloatingPoint() &&
3573            N1.getValueType().isFloatingPoint() &&
3574            VT.bitsLE(N1.getValueType()) &&
3575            N2C && "Invalid FP_ROUND!");
3576     if (N1.getValueType() == VT) return N1;  // noop conversion.
3577     break;
3578   case ISD::AssertSext:
3579   case ISD::AssertZext: {
3580     EVT EVT = cast<VTSDNode>(N2)->getVT();
3581     assert(VT == N1.getValueType() && "Not an inreg extend!");
3582     assert(VT.isInteger() && EVT.isInteger() &&
3583            "Cannot *_EXTEND_INREG FP types");
3584     assert(!EVT.isVector() &&
3585            "AssertSExt/AssertZExt type should be the vector element type "
3586            "rather than the vector type!");
3587     assert(EVT.bitsLE(VT) && "Not extending!");
3588     if (VT == EVT) return N1; // noop assertion.
3589     break;
3590   }
3591   case ISD::SIGN_EXTEND_INREG: {
3592     EVT EVT = cast<VTSDNode>(N2)->getVT();
3593     assert(VT == N1.getValueType() && "Not an inreg extend!");
3594     assert(VT.isInteger() && EVT.isInteger() &&
3595            "Cannot *_EXTEND_INREG FP types");
3596     assert(EVT.isVector() == VT.isVector() &&
3597            "SIGN_EXTEND_INREG type should be vector iff the operand "
3598            "type is vector!");
3599     assert((!EVT.isVector() ||
3600             EVT.getVectorNumElements() == VT.getVectorNumElements()) &&
3601            "Vector element counts must match in SIGN_EXTEND_INREG");
3602     assert(EVT.bitsLE(VT) && "Not extending!");
3603     if (EVT == VT) return N1;  // Not actually extending
3604
3605     auto SignExtendInReg = [&](APInt Val) {
3606       unsigned FromBits = EVT.getScalarType().getSizeInBits();
3607       Val <<= Val.getBitWidth() - FromBits;
3608       Val = Val.ashr(Val.getBitWidth() - FromBits);
3609       return getConstant(Val, DL, VT.getScalarType());
3610     };
3611
3612     if (N1C) {
3613       APInt Val = N1C->getAPIntValue();
3614       return SignExtendInReg(Val);
3615     }
3616     if (ISD::isBuildVectorOfConstantSDNodes(N1.getNode())) {
3617       SmallVector<SDValue, 8> Ops;
3618       for (int i = 0, e = VT.getVectorNumElements(); i != e; ++i) {
3619         SDValue Op = N1.getOperand(i);
3620         if (Op.getOpcode() == ISD::UNDEF) {
3621           Ops.push_back(getUNDEF(VT.getScalarType()));
3622           continue;
3623         }
3624         if (ConstantSDNode *C = dyn_cast<ConstantSDNode>(Op)) {
3625           APInt Val = C->getAPIntValue();
3626           Val = Val.zextOrTrunc(VT.getScalarSizeInBits());
3627           Ops.push_back(SignExtendInReg(Val));
3628           continue;
3629         }
3630         break;
3631       }
3632       if (Ops.size() == VT.getVectorNumElements())
3633         return getNode(ISD::BUILD_VECTOR, DL, VT, Ops);
3634     }
3635     break;
3636   }
3637   case ISD::EXTRACT_VECTOR_ELT:
3638     // EXTRACT_VECTOR_ELT of an UNDEF is an UNDEF.
3639     if (N1.getOpcode() == ISD::UNDEF)
3640       return getUNDEF(VT);
3641
3642     // EXTRACT_VECTOR_ELT of out-of-bounds element is an UNDEF
3643     if (N2C && N2C->getZExtValue() >= N1.getValueType().getVectorNumElements())
3644       return getUNDEF(VT);
3645
3646     // EXTRACT_VECTOR_ELT of CONCAT_VECTORS is often formed while lowering is
3647     // expanding copies of large vectors from registers.
3648     if (N2C &&
3649         N1.getOpcode() == ISD::CONCAT_VECTORS &&
3650         N1.getNumOperands() > 0) {
3651       unsigned Factor =
3652         N1.getOperand(0).getValueType().getVectorNumElements();
3653       return getNode(ISD::EXTRACT_VECTOR_ELT, DL, VT,
3654                      N1.getOperand(N2C->getZExtValue() / Factor),
3655                      getConstant(N2C->getZExtValue() % Factor, DL,
3656                                  N2.getValueType()));
3657     }
3658
3659     // EXTRACT_VECTOR_ELT of BUILD_VECTOR is often formed while lowering is
3660     // expanding large vector constants.
3661     if (N2C && N1.getOpcode() == ISD::BUILD_VECTOR) {
3662       SDValue Elt = N1.getOperand(N2C->getZExtValue());
3663
3664       if (VT != Elt.getValueType())
3665         // If the vector element type is not legal, the BUILD_VECTOR operands
3666         // are promoted and implicitly truncated, and the result implicitly
3667         // extended. Make that explicit here.
3668         Elt = getAnyExtOrTrunc(Elt, DL, VT);
3669
3670       return Elt;
3671     }
3672
3673     // EXTRACT_VECTOR_ELT of INSERT_VECTOR_ELT is often formed when vector
3674     // operations are lowered to scalars.
3675     if (N1.getOpcode() == ISD::INSERT_VECTOR_ELT) {
3676       // If the indices are the same, return the inserted element else
3677       // if the indices are known different, extract the element from
3678       // the original vector.
3679       SDValue N1Op2 = N1.getOperand(2);
3680       ConstantSDNode *N1Op2C = dyn_cast<ConstantSDNode>(N1Op2);
3681
3682       if (N1Op2C && N2C) {
3683         if (N1Op2C->getZExtValue() == N2C->getZExtValue()) {
3684           if (VT == N1.getOperand(1).getValueType())
3685             return N1.getOperand(1);
3686           else
3687             return getSExtOrTrunc(N1.getOperand(1), DL, VT);
3688         }
3689
3690         return getNode(ISD::EXTRACT_VECTOR_ELT, DL, VT, N1.getOperand(0), N2);
3691       }
3692     }
3693     break;
3694   case ISD::EXTRACT_ELEMENT:
3695     assert(N2C && (unsigned)N2C->getZExtValue() < 2 && "Bad EXTRACT_ELEMENT!");
3696     assert(!N1.getValueType().isVector() && !VT.isVector() &&
3697            (N1.getValueType().isInteger() == VT.isInteger()) &&
3698            N1.getValueType() != VT &&
3699            "Wrong types for EXTRACT_ELEMENT!");
3700
3701     // EXTRACT_ELEMENT of BUILD_PAIR is often formed while legalize is expanding
3702     // 64-bit integers into 32-bit parts.  Instead of building the extract of
3703     // the BUILD_PAIR, only to have legalize rip it apart, just do it now.
3704     if (N1.getOpcode() == ISD::BUILD_PAIR)
3705       return N1.getOperand(N2C->getZExtValue());
3706
3707     // EXTRACT_ELEMENT of a constant int is also very common.
3708     if (N1C) {
3709       unsigned ElementSize = VT.getSizeInBits();
3710       unsigned Shift = ElementSize * N2C->getZExtValue();
3711       APInt ShiftedVal = N1C->getAPIntValue().lshr(Shift);
3712       return getConstant(ShiftedVal.trunc(ElementSize), DL, VT);
3713     }
3714     break;
3715   case ISD::EXTRACT_SUBVECTOR:
3716     if (VT.isSimple() && N1.getValueType().isSimple()) {
3717       assert(VT.isVector() && N1.getValueType().isVector() &&
3718              "Extract subvector VTs must be a vectors!");
3719       assert(VT.getVectorElementType() ==
3720              N1.getValueType().getVectorElementType() &&
3721              "Extract subvector VTs must have the same element type!");
3722       assert(VT.getSimpleVT() <= N1.getSimpleValueType() &&
3723              "Extract subvector must be from larger vector to smaller vector!");
3724
3725       if (N2C) {
3726         assert((VT.getVectorNumElements() + N2C->getZExtValue()
3727                 <= N1.getValueType().getVectorNumElements())
3728                && "Extract subvector overflow!");
3729       }
3730
3731       // Trivial extraction.
3732       if (VT.getSimpleVT() == N1.getSimpleValueType())
3733         return N1;
3734     }
3735     break;
3736   }
3737
3738   // Perform trivial constant folding.
3739   if (SDValue SV =
3740           FoldConstantArithmetic(Opcode, DL, VT, N1.getNode(), N2.getNode()))
3741     return SV;
3742
3743   // Constant fold FP operations.
3744   bool HasFPExceptions = TLI->hasFloatingPointExceptions();
3745   if (N1CFP) {
3746     if (N2CFP) {
3747       APFloat V1 = N1CFP->getValueAPF(), V2 = N2CFP->getValueAPF();
3748       APFloat::opStatus s;
3749       switch (Opcode) {
3750       case ISD::FADD:
3751         s = V1.add(V2, APFloat::rmNearestTiesToEven);
3752         if (!HasFPExceptions || s != APFloat::opInvalidOp)
3753           return getConstantFP(V1, DL, VT);
3754         break;
3755       case ISD::FSUB:
3756         s = V1.subtract(V2, APFloat::rmNearestTiesToEven);
3757         if (!HasFPExceptions || s!=APFloat::opInvalidOp)
3758           return getConstantFP(V1, DL, VT);
3759         break;
3760       case ISD::FMUL:
3761         s = V1.multiply(V2, APFloat::rmNearestTiesToEven);
3762         if (!HasFPExceptions || s!=APFloat::opInvalidOp)
3763           return getConstantFP(V1, DL, VT);
3764         break;
3765       case ISD::FDIV:
3766         s = V1.divide(V2, APFloat::rmNearestTiesToEven);
3767         if (!HasFPExceptions || (s!=APFloat::opInvalidOp &&
3768                                  s!=APFloat::opDivByZero)) {
3769           return getConstantFP(V1, DL, VT);
3770         }
3771         break;
3772       case ISD::FREM :
3773         s = V1.mod(V2);
3774         if (!HasFPExceptions || (s!=APFloat::opInvalidOp &&
3775                                  s!=APFloat::opDivByZero)) {
3776           return getConstantFP(V1, DL, VT);
3777         }
3778         break;
3779       case ISD::FCOPYSIGN:
3780         V1.copySign(V2);
3781         return getConstantFP(V1, DL, VT);
3782       default: break;
3783       }
3784     }
3785
3786     if (Opcode == ISD::FP_ROUND) {
3787       APFloat V = N1CFP->getValueAPF();    // make copy
3788       bool ignored;
3789       // This can return overflow, underflow, or inexact; we don't care.
3790       // FIXME need to be more flexible about rounding mode.
3791       (void)V.convert(EVTToAPFloatSemantics(VT),
3792                       APFloat::rmNearestTiesToEven, &ignored);
3793       return getConstantFP(V, DL, VT);
3794     }
3795   }
3796
3797   // Canonicalize an UNDEF to the RHS, even over a constant.
3798   if (N1.getOpcode() == ISD::UNDEF) {
3799     if (isCommutativeBinOp(Opcode)) {
3800       std::swap(N1, N2);
3801     } else {
3802       switch (Opcode) {
3803       case ISD::FP_ROUND_INREG:
3804       case ISD::SIGN_EXTEND_INREG:
3805       case ISD::SUB:
3806       case ISD::FSUB:
3807       case ISD::FDIV:
3808       case ISD::FREM:
3809       case ISD::SRA:
3810         return N1;     // fold op(undef, arg2) -> undef
3811       case ISD::UDIV:
3812       case ISD::SDIV:
3813       case ISD::UREM:
3814       case ISD::SREM:
3815       case ISD::SRL:
3816       case ISD::SHL:
3817         if (!VT.isVector())
3818           return getConstant(0, DL, VT);    // fold op(undef, arg2) -> 0
        // For vectors, we can't easily build an all zero vector, just return
        // the RHS.
3821         return N2;
3822       }
3823     }
3824   }
3825
3826   // Fold a bunch of operators when the RHS is undef.
3827   if (N2.getOpcode() == ISD::UNDEF) {
3828     switch (Opcode) {
3829     case ISD::XOR:
3830       if (N1.getOpcode() == ISD::UNDEF)
3831         // Handle undef ^ undef -> 0 special case. This is a common
3832         // idiom (misuse).
3833         return getConstant(0, DL, VT);
3834       // fallthrough
3835     case ISD::ADD:
3836     case ISD::ADDC:
3837     case ISD::ADDE:
3838     case ISD::SUB:
3839     case ISD::UDIV:
3840     case ISD::SDIV:
3841     case ISD::UREM:
3842     case ISD::SREM:
3843       return N2;       // fold op(arg1, undef) -> undef
3844     case ISD::FADD:
3845     case ISD::FSUB:
3846     case ISD::FMUL:
3847     case ISD::FDIV:
3848     case ISD::FREM:
3849       if (getTarget().Options.UnsafeFPMath)
3850         return N2;
3851       break;
3852     case ISD::MUL:
3853     case ISD::AND:
3854     case ISD::SRL:
3855     case ISD::SHL:
3856       if (!VT.isVector())
3857         return getConstant(0, DL, VT);  // fold op(arg1, undef) -> 0
3858       // For vectors, we can't easily build an all zero vector, just return
3859       // the LHS.
3860       return N1;
3861     case ISD::OR:
3862       if (!VT.isVector())
3863         return getConstant(APInt::getAllOnesValue(VT.getSizeInBits()), DL, VT);
3864       // For vectors, we can't easily build an all one vector, just return
3865       // the LHS.
3866       return N1;
3867     case ISD::SRA:
3868       return N1;
3869     }
3870   }
3871
3872   // Memoize this node if possible.
3873   BinarySDNode *N;
3874   SDVTList VTs = getVTList(VT);
3875   if (VT != MVT::Glue) {
3876     SDValue Ops[] = {N1, N2};
3877     FoldingSetNodeID ID;
3878     AddNodeIDNode(ID, Opcode, VTs, Ops);
3879     AddNodeIDFlags(ID, Opcode, Flags);
3880     void *IP = nullptr;
3881     if (SDNode *E = FindNodeOrInsertPos(ID, DL.getDebugLoc(), IP))
3882       return SDValue(E, 0);
3883
3884     N = GetBinarySDNode(Opcode, DL, VTs, N1, N2, Flags);
3885
3886     CSEMap.InsertNode(N, IP);
3887   } else {
3888     N = GetBinarySDNode(Opcode, DL, VTs, N1, N2, Flags);
3889   }
3890
3891   InsertNode(N);
3892   return SDValue(N, 0);
3893 }
3894
3895 SDValue SelectionDAG::getNode(unsigned Opcode, SDLoc DL, EVT VT,
3896                               SDValue N1, SDValue N2, SDValue N3) {
3897   // Perform various simplifications.
3898   switch (Opcode) {
3899   case ISD::FMA: {
3900     ConstantFPSDNode *N1CFP = dyn_cast<ConstantFPSDNode>(N1);
3901     ConstantFPSDNode *N2CFP = dyn_cast<ConstantFPSDNode>(N2);
3902     ConstantFPSDNode *N3CFP = dyn_cast<ConstantFPSDNode>(N3);
3903     if (N1CFP && N2CFP && N3CFP) {
3904       APFloat  V1 = N1CFP->getValueAPF();
3905       const APFloat &V2 = N2CFP->getValueAPF();
3906       const APFloat &V3 = N3CFP->getValueAPF();
3907       APFloat::opStatus s =
3908         V1.fusedMultiplyAdd(V2, V3, APFloat::rmNearestTiesToEven);
3909       if (!TLI->hasFloatingPointExceptions() || s != APFloat::opInvalidOp)
3910         return getConstantFP(V1, DL, VT);
3911     }
3912     break;
3913   }
3914   case ISD::CONCAT_VECTORS:
3915     // A CONCAT_VECTOR with all operands BUILD_VECTOR can be simplified to
3916     // one big BUILD_VECTOR.
3917     if (N1.getOpcode() == ISD::BUILD_VECTOR &&
3918         N2.getOpcode() == ISD::BUILD_VECTOR &&
3919         N3.getOpcode() == ISD::BUILD_VECTOR) {
3920       SmallVector<SDValue, 16> Elts(N1.getNode()->op_begin(),
3921                                     N1.getNode()->op_end());
3922       Elts.append(N2.getNode()->op_begin(), N2.getNode()->op_end());
3923       Elts.append(N3.getNode()->op_begin(), N3.getNode()->op_end());
3924       return getNode(ISD::BUILD_VECTOR, DL, VT, Elts);
3925     }
3926     break;
3927   case ISD::SETCC: {
3928     // Use FoldSetCC to simplify SETCC's.
3929     if (SDValue V = FoldSetCC(VT, N1, N2, cast<CondCodeSDNode>(N3)->get(), DL))
3930       return V;
3931     // Vector constant folding.
3932     SDValue Ops[] = {N1, N2, N3};
3933     if (SDValue V = FoldConstantVectorArithmetic(Opcode, DL, VT, Ops))
3934       return V;
3935     break;
3936   }
3937   case ISD::SELECT:
3938     if (ConstantSDNode *N1C = dyn_cast<ConstantSDNode>(N1)) {
3939      if (N1C->getZExtValue())
3940        return N2;             // select true, X, Y -> X
3941      return N3;             // select false, X, Y -> Y
3942     }
3943
3944     if (N2 == N3) return N2;   // select C, X, X -> X
3945     break;
3946   case ISD::VECTOR_SHUFFLE:
3947     llvm_unreachable("should use getVectorShuffle constructor!");
3948   case ISD::INSERT_SUBVECTOR: {
3949     SDValue Index = N3;
3950     if (VT.isSimple() && N1.getValueType().isSimple()
3951         && N2.getValueType().isSimple()) {
3952       assert(VT.isVector() && N1.getValueType().isVector() &&
3953              N2.getValueType().isVector() &&
3954              "Insert subvector VTs must be a vectors");
3955       assert(VT == N1.getValueType() &&
3956              "Dest and insert subvector source types must match!");
3957       assert(N2.getSimpleValueType() <= N1.getSimpleValueType() &&
3958              "Insert subvector must be from smaller vector to larger vector!");
3959       if (isa<ConstantSDNode>(Index)) {
3960         assert((N2.getValueType().getVectorNumElements() +
3961                 cast<ConstantSDNode>(Index)->getZExtValue()
3962                 <= VT.getVectorNumElements())
3963                && "Insert subvector overflow!");
3964       }
3965
3966       // Trivial insertion.
3967       if (VT.getSimpleVT() == N2.getSimpleValueType())
3968         return N2;
3969     }
3970     break;
3971   }
3972   case ISD::BITCAST:
3973     // Fold bit_convert nodes from a type to themselves.
3974     if (N1.getValueType() == VT)
3975       return N1;
3976     break;
3977   }
3978
3979   // Memoize node if it doesn't produce a flag.
3980   SDNode *N;
3981   SDVTList VTs = getVTList(VT);
3982   if (VT != MVT::Glue) {
3983     SDValue Ops[] = { N1, N2, N3 };
3984     FoldingSetNodeID ID;
3985     AddNodeIDNode(ID, Opcode, VTs, Ops);
3986     void *IP = nullptr;
3987     if (SDNode *E = FindNodeOrInsertPos(ID, DL.getDebugLoc(), IP))
3988       return SDValue(E, 0);
3989
3990     N = new (NodeAllocator) TernarySDNode(Opcode, DL.getIROrder(),
3991                                           DL.getDebugLoc(), VTs, N1, N2, N3);
3992     CSEMap.InsertNode(N, IP);
3993   } else {
3994     N = new (NodeAllocator) TernarySDNode(Opcode, DL.getIROrder(),
3995                                           DL.getDebugLoc(), VTs, N1, N2, N3);
3996   }
3997
3998   InsertNode(N);
3999   return SDValue(N, 0);
4000 }
4001
4002 SDValue SelectionDAG::getNode(unsigned Opcode, SDLoc DL, EVT VT,
4003                               SDValue N1, SDValue N2, SDValue N3,
4004                               SDValue N4) {
4005   SDValue Ops[] = { N1, N2, N3, N4 };
4006   return getNode(Opcode, DL, VT, Ops);
4007 }
4008
4009 SDValue SelectionDAG::getNode(unsigned Opcode, SDLoc DL, EVT VT,
4010                               SDValue N1, SDValue N2, SDValue N3,
4011                               SDValue N4, SDValue N5) {
4012   SDValue Ops[] = { N1, N2, N3, N4, N5 };
4013   return getNode(Opcode, DL, VT, Ops);
4014 }
4015
4016 /// getStackArgumentTokenFactor - Compute a TokenFactor to force all
4017 /// the incoming stack arguments to be loaded from the stack.
4018 SDValue SelectionDAG::getStackArgumentTokenFactor(SDValue Chain) {
4019   SmallVector<SDValue, 8> ArgChains;
4020
4021   // Include the original chain at the beginning of the list. When this is
4022   // used by target LowerCall hooks, this helps legalize find the
4023   // CALLSEQ_BEGIN node.
4024   ArgChains.push_back(Chain);
4025
4026   // Add a chain value for each stack argument.
4027   for (SDNode::use_iterator U = getEntryNode().getNode()->use_begin(),
4028        UE = getEntryNode().getNode()->use_end(); U != UE; ++U)
4029     if (LoadSDNode *L = dyn_cast<LoadSDNode>(*U))
4030       if (FrameIndexSDNode *FI = dyn_cast<FrameIndexSDNode>(L->getBasePtr()))
4031         if (FI->getIndex() < 0)
4032           ArgChains.push_back(SDValue(L, 1));
4033
4034   // Build a tokenfactor for all the chains.
4035   return getNode(ISD::TokenFactor, SDLoc(Chain), MVT::Other, ArgChains);
4036 }
4037
4038 /// getMemsetValue - Vectorized representation of the memset value
4039 /// operand.
4040 static SDValue getMemsetValue(SDValue Value, EVT VT, SelectionDAG &DAG,
4041                               SDLoc dl) {
4042   assert(Value.getOpcode() != ISD::UNDEF);
4043
4044   unsigned NumBits = VT.getScalarType().getSizeInBits();
4045   if (ConstantSDNode *C = dyn_cast<ConstantSDNode>(Value)) {
4046     assert(C->getAPIntValue().getBitWidth() == 8);
4047     APInt Val = APInt::getSplat(NumBits, C->getAPIntValue());
4048     if (VT.isInteger())
4049       return DAG.getConstant(Val, dl, VT);
4050     return DAG.getConstantFP(APFloat(DAG.EVTToAPFloatSemantics(VT), Val), dl,
4051                              VT);
4052   }
4053
4054   assert(Value.getValueType() == MVT::i8 && "memset with non-byte fill value?");
4055   EVT IntVT = VT.getScalarType();
4056   if (!IntVT.isInteger())
4057     IntVT = EVT::getIntegerVT(*DAG.getContext(), IntVT.getSizeInBits());
4058
4059   Value = DAG.getNode(ISD::ZERO_EXTEND, dl, IntVT, Value);
4060   if (NumBits > 8) {
4061     // Use a multiplication with 0x010101... to extend the input to the
4062     // required length.
4063     APInt Magic = APInt::getSplat(NumBits, APInt(8, 0x01));
4064     Value = DAG.getNode(ISD::MUL, dl, IntVT, Value,
4065                         DAG.getConstant(Magic, dl, IntVT));
4066   }
4067
4068   if (VT != Value.getValueType() && !VT.isInteger())
4069     Value = DAG.getNode(ISD::BITCAST, dl, VT.getScalarType(), Value);
4070   if (VT != Value.getValueType()) {
4071     assert(VT.getVectorElementType() == Value.getValueType() &&
4072            "value type should be one vector element here");
4073     SmallVector<SDValue, 8> BVOps(VT.getVectorNumElements(), Value);
4074     Value = DAG.getNode(ISD::BUILD_VECTOR, dl, VT, BVOps);
4075   }
4076
4077   return Value;
4078 }
4079
4080 /// getMemsetStringVal - Similar to getMemsetValue. Except this is only
4081 /// used when a memcpy is turned into a memset when the source is a constant
4082 /// string ptr.
4083 static SDValue getMemsetStringVal(EVT VT, SDLoc dl, SelectionDAG &DAG,
4084                                   const TargetLowering &TLI, StringRef Str) {
4085   // Handle vector with all elements zero.
4086   if (Str.empty()) {
4087     if (VT.isInteger())
4088       return DAG.getConstant(0, dl, VT);
4089     else if (VT == MVT::f32 || VT == MVT::f64 || VT == MVT::f128)
4090       return DAG.getConstantFP(0.0, dl, VT);
4091     else if (VT.isVector()) {
4092       unsigned NumElts = VT.getVectorNumElements();
4093       MVT EltVT = (VT.getVectorElementType() == MVT::f32) ? MVT::i32 : MVT::i64;
4094       return DAG.getNode(ISD::BITCAST, dl, VT,
4095                          DAG.getConstant(0, dl,
4096                                          EVT::getVectorVT(*DAG.getContext(),
4097                                                           EltVT, NumElts)));
4098     } else
4099       llvm_unreachable("Expected type!");
4100   }
4101
4102   assert(!VT.isVector() && "Can't handle vector type here!");
4103   unsigned NumVTBits = VT.getSizeInBits();
4104   unsigned NumVTBytes = NumVTBits / 8;
4105   unsigned NumBytes = std::min(NumVTBytes, unsigned(Str.size()));
4106
4107   APInt Val(NumVTBits, 0);
4108   if (DAG.getDataLayout().isLittleEndian()) {
4109     for (unsigned i = 0; i != NumBytes; ++i)
4110       Val |= (uint64_t)(unsigned char)Str[i] << i*8;
4111   } else {
4112     for (unsigned i = 0; i != NumBytes; ++i)
4113       Val |= (uint64_t)(unsigned char)Str[i] << (NumVTBytes-i-1)*8;
4114   }
4115
4116   // If the "cost" of materializing the integer immediate is less than the cost
4117   // of a load, then it is cost effective to turn the load into the immediate.
4118   Type *Ty = VT.getTypeForEVT(*DAG.getContext());
4119   if (TLI.shouldConvertConstantLoadToIntImm(Val, Ty))
4120     return DAG.getConstant(Val, dl, VT);
4121   return SDValue(nullptr, 0);
4122 }
4123
4124 /// getMemBasePlusOffset - Returns base and offset node for the
4125 ///
4126 static SDValue getMemBasePlusOffset(SDValue Base, unsigned Offset, SDLoc dl,
4127                                       SelectionDAG &DAG) {
4128   EVT VT = Base.getValueType();
4129   return DAG.getNode(ISD::ADD, dl,
4130                      VT, Base, DAG.getConstant(Offset, dl, VT));
4131 }
4132
4133 /// isMemSrcFromString - Returns true if memcpy source is a string constant.
4134 ///
4135 static bool isMemSrcFromString(SDValue Src, StringRef &Str) {
4136   unsigned SrcDelta = 0;
4137   GlobalAddressSDNode *G = nullptr;
4138   if (Src.getOpcode() == ISD::GlobalAddress)
4139     G = cast<GlobalAddressSDNode>(Src);
4140   else if (Src.getOpcode() == ISD::ADD &&
4141            Src.getOperand(0).getOpcode() == ISD::GlobalAddress &&
4142            Src.getOperand(1).getOpcode() == ISD::Constant) {
4143     G = cast<GlobalAddressSDNode>(Src.getOperand(0));
4144     SrcDelta = cast<ConstantSDNode>(Src.getOperand(1))->getZExtValue();
4145   }
4146   if (!G)
4147     return false;
4148
4149   return getConstantStringInfo(G->getGlobal(), Str, SrcDelta, false);
4150 }
4151
4152 /// Determines the optimal series of memory ops to replace the memset / memcpy.
4153 /// Return true if the number of memory ops is below the threshold (Limit).
4154 /// It returns the types of the sequence of memory ops to perform
4155 /// memset / memcpy by reference.
4156 static bool FindOptimalMemOpLowering(std::vector<EVT> &MemOps,
4157                                      unsigned Limit, uint64_t Size,
4158                                      unsigned DstAlign, unsigned SrcAlign,
4159                                      bool IsMemset,
4160                                      bool ZeroMemset,
4161                                      bool MemcpyStrSrc,
4162                                      bool AllowOverlap,
4163                                      SelectionDAG &DAG,
4164                                      const TargetLowering &TLI) {
4165   assert((SrcAlign == 0 || SrcAlign >= DstAlign) &&
4166          "Expecting memcpy / memset source to meet alignment requirement!");
4167   // If 'SrcAlign' is zero, that means the memory operation does not need to
4168   // load the value, i.e. memset or memcpy from constant string. Otherwise,
4169   // it's the inferred alignment of the source. 'DstAlign', on the other hand,
4170   // is the specified alignment of the memory operation. If it is zero, that
4171   // means it's possible to change the alignment of the destination.
4172   // 'MemcpyStrSrc' indicates whether the memcpy source is constant so it does
4173   // not need to be loaded.
4174   EVT VT = TLI.getOptimalMemOpType(Size, DstAlign, SrcAlign,
4175                                    IsMemset, ZeroMemset, MemcpyStrSrc,
4176                                    DAG.getMachineFunction());
4177
4178   if (VT == MVT::Other) {
4179     unsigned AS = 0;
4180     if (DstAlign >= DAG.getDataLayout().getPointerPrefAlignment(AS) ||
4181         TLI.allowsMisalignedMemoryAccesses(VT, AS, DstAlign)) {
4182       VT = TLI.getPointerTy(DAG.getDataLayout());
4183     } else {
4184       switch (DstAlign & 7) {
4185       case 0:  VT = MVT::i64; break;
4186       case 4:  VT = MVT::i32; break;
4187       case 2:  VT = MVT::i16; break;
4188       default: VT = MVT::i8;  break;
4189       }
4190     }
4191
4192     MVT LVT = MVT::i64;
4193     while (!TLI.isTypeLegal(LVT))
4194       LVT = (MVT::SimpleValueType)(LVT.SimpleTy - 1);
4195     assert(LVT.isInteger());
4196
4197     if (VT.bitsGT(LVT))
4198       VT = LVT;
4199   }
4200
4201   unsigned NumMemOps = 0;
4202   while (Size != 0) {
4203     unsigned VTSize = VT.getSizeInBits() / 8;
4204     while (VTSize > Size) {
4205       // For now, only use non-vector load / store's for the left-over pieces.
4206       EVT NewVT = VT;
4207       unsigned NewVTSize;
4208
4209       bool Found = false;
4210       if (VT.isVector() || VT.isFloatingPoint()) {
4211         NewVT = (VT.getSizeInBits() > 64) ? MVT::i64 : MVT::i32;
4212         if (TLI.isOperationLegalOrCustom(ISD::STORE, NewVT) &&
4213             TLI.isSafeMemOpType(NewVT.getSimpleVT()))
4214           Found = true;
4215         else if (NewVT == MVT::i64 &&
4216                  TLI.isOperationLegalOrCustom(ISD::STORE, MVT::f64) &&
4217                  TLI.isSafeMemOpType(MVT::f64)) {
4218           // i64 is usually not legal on 32-bit targets, but f64 may be.
4219           NewVT = MVT::f64;
4220           Found = true;
4221         }
4222       }
4223
4224       if (!Found) {
4225         do {
4226           NewVT = (MVT::SimpleValueType)(NewVT.getSimpleVT().SimpleTy - 1);
4227           if (NewVT == MVT::i8)
4228             break;
4229         } while (!TLI.isSafeMemOpType(NewVT.getSimpleVT()));
4230       }
4231       NewVTSize = NewVT.getSizeInBits() / 8;
4232
4233       // If the new VT cannot cover all of the remaining bits, then consider
4234       // issuing a (or a pair of) unaligned and overlapping load / store.
4235       // FIXME: Only does this for 64-bit or more since we don't have proper
4236       // cost model for unaligned load / store.
4237       bool Fast;
4238       unsigned AS = 0;
4239       if (NumMemOps && AllowOverlap &&
4240           VTSize >= 8 && NewVTSize < Size &&
4241           TLI.allowsMisalignedMemoryAccesses(VT, AS, DstAlign, &Fast) && Fast)
4242         VTSize = Size;
4243       else {
4244         VT = NewVT;
4245         VTSize = NewVTSize;
4246       }
4247     }
4248
4249     if (++NumMemOps > Limit)
4250       return false;
4251
4252     MemOps.push_back(VT);
4253     Size -= VTSize;
4254   }
4255
4256   return true;
4257 }
4258
4259 static bool shouldLowerMemFuncForSize(const MachineFunction &MF) {
4260   // On Darwin, -Os means optimize for size without hurting performance, so
4261   // only really optimize for size when -Oz (MinSize) is used.
4262   if (MF.getTarget().getTargetTriple().isOSDarwin())
4263     return MF.getFunction()->optForMinSize();
4264   return MF.getFunction()->optForSize();
4265 }
4266
4267 static SDValue getMemcpyLoadsAndStores(SelectionDAG &DAG, SDLoc dl,
4268                                        SDValue Chain, SDValue Dst,
4269                                        SDValue Src, uint64_t Size,
4270                                        unsigned Align, bool isVol,
4271                                        bool AlwaysInline,
4272                                        MachinePointerInfo DstPtrInfo,
4273                                        MachinePointerInfo SrcPtrInfo) {
4274   // Turn a memcpy of undef to nop.
4275   if (Src.getOpcode() == ISD::UNDEF)
4276     return Chain;
4277
4278   // Expand memcpy to a series of load and store ops if the size operand falls
4279   // below a certain threshold.
4280   // TODO: In the AlwaysInline case, if the size is big then generate a loop
4281   // rather than maybe a humongous number of loads and stores.
4282   const TargetLowering &TLI = DAG.getTargetLoweringInfo();
4283   std::vector<EVT> MemOps;
4284   bool DstAlignCanChange = false;
4285   MachineFunction &MF = DAG.getMachineFunction();
4286   MachineFrameInfo *MFI = MF.getFrameInfo();
4287   bool OptSize = shouldLowerMemFuncForSize(MF);
4288   FrameIndexSDNode *FI = dyn_cast<FrameIndexSDNode>(Dst);
4289   if (FI && !MFI->isFixedObjectIndex(FI->getIndex()))
4290     DstAlignCanChange = true;
4291   unsigned SrcAlign = DAG.InferPtrAlignment(Src);
4292   if (Align > SrcAlign)
4293     SrcAlign = Align;
4294   StringRef Str;
4295   bool CopyFromStr = isMemSrcFromString(Src, Str);
4296   bool isZeroStr = CopyFromStr && Str.empty();
4297   unsigned Limit = AlwaysInline ? ~0U : TLI.getMaxStoresPerMemcpy(OptSize);
4298
4299   if (!FindOptimalMemOpLowering(MemOps, Limit, Size,
4300                                 (DstAlignCanChange ? 0 : Align),
4301                                 (isZeroStr ? 0 : SrcAlign),
4302                                 false, false, CopyFromStr, true, DAG, TLI))
4303     return SDValue();
4304
4305   if (DstAlignCanChange) {
4306     Type *Ty = MemOps[0].getTypeForEVT(*DAG.getContext());
4307     unsigned NewAlign = (unsigned)DAG.getDataLayout().getABITypeAlignment(Ty);
4308
4309     // Don't promote to an alignment that would require dynamic stack
4310     // realignment.
4311     const TargetRegisterInfo *TRI = MF.getSubtarget().getRegisterInfo();
4312     if (!TRI->needsStackRealignment(MF))
4313       while (NewAlign > Align &&
4314              DAG.getDataLayout().exceedsNaturalStackAlignment(NewAlign))
4315           NewAlign /= 2;
4316
4317     if (NewAlign > Align) {
4318       // Give the stack frame object a larger alignment if needed.
4319       if (MFI->getObjectAlignment(FI->getIndex()) < NewAlign)
4320         MFI->setObjectAlignment(FI->getIndex(), NewAlign);
4321       Align = NewAlign;
4322     }
4323   }
4324
4325   SmallVector<SDValue, 8> OutChains;
4326   unsigned NumMemOps = MemOps.size();
4327   uint64_t SrcOff = 0, DstOff = 0;
4328   for (unsigned i = 0; i != NumMemOps; ++i) {
4329     EVT VT = MemOps[i];
4330     unsigned VTSize = VT.getSizeInBits() / 8;
4331     SDValue Value, Store;
4332
4333     if (VTSize > Size) {
4334       // Issuing an unaligned load / store pair  that overlaps with the previous
4335       // pair. Adjust the offset accordingly.
4336       assert(i == NumMemOps-1 && i != 0);
4337       SrcOff -= VTSize - Size;
4338       DstOff -= VTSize - Size;
4339     }
4340
4341     if (CopyFromStr &&
4342         (isZeroStr || (VT.isInteger() && !VT.isVector()))) {
4343       // It's unlikely a store of a vector immediate can be done in a single
4344       // instruction. It would require a load from a constantpool first.
4345       // We only handle zero vectors here.
4346       // FIXME: Handle other cases where store of vector immediate is done in
4347       // a single instruction.
4348       Value = getMemsetStringVal(VT, dl, DAG, TLI, Str.substr(SrcOff));
4349       if (Value.getNode())
4350         Store = DAG.getStore(Chain, dl, Value,
4351                              getMemBasePlusOffset(Dst, DstOff, dl, DAG),
4352                              DstPtrInfo.getWithOffset(DstOff), isVol,
4353                              false, Align);
4354     }
4355
4356     if (!Store.getNode()) {
4357       // The type might not be legal for the target.  This should only happen
4358       // if the type is smaller than a legal type, as on PPC, so the right
4359       // thing to do is generate a LoadExt/StoreTrunc pair.  These simplify
4360       // to Load/Store if NVT==VT.
4361       // FIXME does the case above also need this?
4362       EVT NVT = TLI.getTypeToTransformTo(*DAG.getContext(), VT);
4363       assert(NVT.bitsGE(VT));
4364       Value = DAG.getExtLoad(ISD::EXTLOAD, dl, NVT, Chain,
4365                              getMemBasePlusOffset(Src, SrcOff, dl, DAG),
4366                              SrcPtrInfo.getWithOffset(SrcOff), VT, isVol, false,
4367                              false, MinAlign(SrcAlign, SrcOff));
4368       Store = DAG.getTruncStore(Chain, dl, Value,
4369                                 getMemBasePlusOffset(Dst, DstOff, dl, DAG),
4370                                 DstPtrInfo.getWithOffset(DstOff), VT, isVol,
4371                                 false, Align);
4372     }
4373     OutChains.push_back(Store);
4374     SrcOff += VTSize;
4375     DstOff += VTSize;
4376     Size -= VTSize;
4377   }
4378
4379   return DAG.getNode(ISD::TokenFactor, dl, MVT::Other, OutChains);
4380 }
4381
4382 static SDValue getMemmoveLoadsAndStores(SelectionDAG &DAG, SDLoc dl,
4383                                         SDValue Chain, SDValue Dst,
4384                                         SDValue Src, uint64_t Size,
4385                                         unsigned Align,  bool isVol,
4386                                         bool AlwaysInline,
4387                                         MachinePointerInfo DstPtrInfo,
4388                                         MachinePointerInfo SrcPtrInfo) {
4389   // Turn a memmove of undef to nop.
4390   if (Src.getOpcode() == ISD::UNDEF)
4391     return Chain;
4392
4393   // Expand memmove to a series of load and store ops if the size operand falls
4394   // below a certain threshold.
4395   const TargetLowering &TLI = DAG.getTargetLoweringInfo();
4396   std::vector<EVT> MemOps;
4397   bool DstAlignCanChange = false;
4398   MachineFunction &MF = DAG.getMachineFunction();
4399   MachineFrameInfo *MFI = MF.getFrameInfo();
4400   bool OptSize = shouldLowerMemFuncForSize(MF);
4401   FrameIndexSDNode *FI = dyn_cast<FrameIndexSDNode>(Dst);
4402   if (FI && !MFI->isFixedObjectIndex(FI->getIndex()))
4403     DstAlignCanChange = true;
4404   unsigned SrcAlign = DAG.InferPtrAlignment(Src);
4405   if (Align > SrcAlign)
4406     SrcAlign = Align;
4407   unsigned Limit = AlwaysInline ? ~0U : TLI.getMaxStoresPerMemmove(OptSize);
4408
4409   if (!FindOptimalMemOpLowering(MemOps, Limit, Size,
4410                                 (DstAlignCanChange ? 0 : Align), SrcAlign,
4411                                 false, false, false, false, DAG, TLI))
4412     return SDValue();
4413
4414   if (DstAlignCanChange) {
4415     Type *Ty = MemOps[0].getTypeForEVT(*DAG.getContext());
4416     unsigned NewAlign = (unsigned)DAG.getDataLayout().getABITypeAlignment(Ty);
4417     if (NewAlign > Align) {
4418       // Give the stack frame object a larger alignment if needed.
4419       if (MFI->getObjectAlignment(FI->getIndex()) < NewAlign)
4420         MFI->setObjectAlignment(FI->getIndex(), NewAlign);
4421       Align = NewAlign;
4422     }
4423   }
4424
4425   uint64_t SrcOff = 0, DstOff = 0;
4426   SmallVector<SDValue, 8> LoadValues;
4427   SmallVector<SDValue, 8> LoadChains;
4428   SmallVector<SDValue, 8> OutChains;
4429   unsigned NumMemOps = MemOps.size();
4430   for (unsigned i = 0; i < NumMemOps; i++) {
4431     EVT VT = MemOps[i];
4432     unsigned VTSize = VT.getSizeInBits() / 8;
4433     SDValue Value;
4434
4435     Value = DAG.getLoad(VT, dl, Chain,
4436                         getMemBasePlusOffset(Src, SrcOff, dl, DAG),
4437                         SrcPtrInfo.getWithOffset(SrcOff), isVol,
4438                         false, false, SrcAlign);
4439     LoadValues.push_back(Value);
4440     LoadChains.push_back(Value.getValue(1));
4441     SrcOff += VTSize;
4442   }
4443   Chain = DAG.getNode(ISD::TokenFactor, dl, MVT::Other, LoadChains);
4444   OutChains.clear();
4445   for (unsigned i = 0; i < NumMemOps; i++) {
4446     EVT VT = MemOps[i];
4447     unsigned VTSize = VT.getSizeInBits() / 8;
4448     SDValue Store;
4449
4450     Store = DAG.getStore(Chain, dl, LoadValues[i],
4451                          getMemBasePlusOffset(Dst, DstOff, dl, DAG),
4452                          DstPtrInfo.getWithOffset(DstOff), isVol, false, Align);
4453     OutChains.push_back(Store);
4454     DstOff += VTSize;
4455   }
4456
4457   return DAG.getNode(ISD::TokenFactor, dl, MVT::Other, OutChains);
4458 }
4459
4460 /// \brief Lower the call to 'memset' intrinsic function into a series of store
4461 /// operations.
4462 ///
4463 /// \param DAG Selection DAG where lowered code is placed.
4464 /// \param dl Link to corresponding IR location.
4465 /// \param Chain Control flow dependency.
4466 /// \param Dst Pointer to destination memory location.
4467 /// \param Src Value of byte to write into the memory.
4468 /// \param Size Number of bytes to write.
4469 /// \param Align Alignment of the destination in bytes.
4470 /// \param isVol True if destination is volatile.
4471 /// \param DstPtrInfo IR information on the memory pointer.
4472 /// \returns New head in the control flow, if lowering was successful, empty
4473 /// SDValue otherwise.
4474 ///
4475 /// The function tries to replace 'llvm.memset' intrinsic with several store
4476 /// operations and value calculation code. This is usually profitable for small
4477 /// memory size.
4478 static SDValue getMemsetStores(SelectionDAG &DAG, SDLoc dl,
4479                                SDValue Chain, SDValue Dst,
4480                                SDValue Src, uint64_t Size,
4481                                unsigned Align, bool isVol,
4482                                MachinePointerInfo DstPtrInfo) {
4483   // Turn a memset of undef to nop.
4484   if (Src.getOpcode() == ISD::UNDEF)
4485     return Chain;
4486
4487   // Expand memset to a series of load/store ops if the size operand
4488   // falls below a certain threshold.
4489   const TargetLowering &TLI = DAG.getTargetLoweringInfo();
4490   std::vector<EVT> MemOps;
4491   bool DstAlignCanChange = false;
4492   MachineFunction &MF = DAG.getMachineFunction();
4493   MachineFrameInfo *MFI = MF.getFrameInfo();
4494   bool OptSize = shouldLowerMemFuncForSize(MF);
4495   FrameIndexSDNode *FI = dyn_cast<FrameIndexSDNode>(Dst);
4496   if (FI && !MFI->isFixedObjectIndex(FI->getIndex()))
4497     DstAlignCanChange = true;
4498   bool IsZeroVal =
4499     isa<ConstantSDNode>(Src) && cast<ConstantSDNode>(Src)->isNullValue();
4500   if (!FindOptimalMemOpLowering(MemOps, TLI.getMaxStoresPerMemset(OptSize),
4501                                 Size, (DstAlignCanChange ? 0 : Align), 0,
4502                                 true, IsZeroVal, false, true, DAG, TLI))
4503     return SDValue();
4504
4505   if (DstAlignCanChange) {
4506     Type *Ty = MemOps[0].getTypeForEVT(*DAG.getContext());
4507     unsigned NewAlign = (unsigned)DAG.getDataLayout().getABITypeAlignment(Ty);
4508     if (NewAlign > Align) {
4509       // Give the stack frame object a larger alignment if needed.
4510       if (MFI->getObjectAlignment(FI->getIndex()) < NewAlign)
4511         MFI->setObjectAlignment(FI->getIndex(), NewAlign);
4512       Align = NewAlign;
4513     }
4514   }
4515
4516   SmallVector<SDValue, 8> OutChains;
4517   uint64_t DstOff = 0;
4518   unsigned NumMemOps = MemOps.size();
4519
4520   // Find the largest store and generate the bit pattern for it.
4521   EVT LargestVT = MemOps[0];
4522   for (unsigned i = 1; i < NumMemOps; i++)
4523     if (MemOps[i].bitsGT(LargestVT))
4524       LargestVT = MemOps[i];
4525   SDValue MemSetValue = getMemsetValue(Src, LargestVT, DAG, dl);
4526
4527   for (unsigned i = 0; i < NumMemOps; i++) {
4528     EVT VT = MemOps[i];
4529     unsigned VTSize = VT.getSizeInBits() / 8;
4530     if (VTSize > Size) {
4531       // Issuing an unaligned load / store pair  that overlaps with the previous
4532       // pair. Adjust the offset accordingly.
4533       assert(i == NumMemOps-1 && i != 0);
4534       DstOff -= VTSize - Size;
4535     }
4536
4537     // If this store is smaller than the largest store see whether we can get
4538     // the smaller value for free with a truncate.
4539     SDValue Value = MemSetValue;
4540     if (VT.bitsLT(LargestVT)) {
4541       if (!LargestVT.isVector() && !VT.isVector() &&
4542           TLI.isTruncateFree(LargestVT, VT))
4543         Value = DAG.getNode(ISD::TRUNCATE, dl, VT, MemSetValue);
4544       else
4545         Value = getMemsetValue(Src, VT, DAG, dl);
4546     }
4547     assert(Value.getValueType() == VT && "Value with wrong type.");
4548     SDValue Store = DAG.getStore(Chain, dl, Value,
4549                                  getMemBasePlusOffset(Dst, DstOff, dl, DAG),
4550                                  DstPtrInfo.getWithOffset(DstOff),
4551                                  isVol, false, Align);
4552     OutChains.push_back(Store);
4553     DstOff += VT.getSizeInBits() / 8;
4554     Size -= VTSize;
4555   }
4556
4557   return DAG.getNode(ISD::TokenFactor, dl, MVT::Other, OutChains);
4558 }
4559
4560 SDValue SelectionDAG::getMemcpy(SDValue Chain, SDLoc dl, SDValue Dst,
4561                                 SDValue Src, SDValue Size,
4562                                 unsigned Align, bool isVol, bool AlwaysInline,
4563                                 bool isTailCall, MachinePointerInfo DstPtrInfo,
4564                                 MachinePointerInfo SrcPtrInfo) {
4565   assert(Align && "The SDAG layer expects explicit alignment and reserves 0");
4566
4567   // Check to see if we should lower the memcpy to loads and stores first.
4568   // For cases within the target-specified limits, this is the best choice.
4569   ConstantSDNode *ConstantSize = dyn_cast<ConstantSDNode>(Size);
4570   if (ConstantSize) {
4571     // Memcpy with size zero? Just return the original chain.
4572     if (ConstantSize->isNullValue())
4573       return Chain;
4574
4575     SDValue Result = getMemcpyLoadsAndStores(*this, dl, Chain, Dst, Src,
4576                                              ConstantSize->getZExtValue(),Align,
4577                                 isVol, false, DstPtrInfo, SrcPtrInfo);
4578     if (Result.getNode())
4579       return Result;
4580   }
4581
4582   // Then check to see if we should lower the memcpy with target-specific
4583   // code. If the target chooses to do this, this is the next best.
4584   if (TSI) {
4585     SDValue Result = TSI->EmitTargetCodeForMemcpy(
4586         *this, dl, Chain, Dst, Src, Size, Align, isVol, AlwaysInline,
4587         DstPtrInfo, SrcPtrInfo);
4588     if (Result.getNode())
4589       return Result;
4590   }
4591
4592   // If we really need inline code and the target declined to provide it,
4593   // use a (potentially long) sequence of loads and stores.
4594   if (AlwaysInline) {
4595     assert(ConstantSize && "AlwaysInline requires a constant size!");
4596     return getMemcpyLoadsAndStores(*this, dl, Chain, Dst, Src,
4597                                    ConstantSize->getZExtValue(), Align, isVol,
4598                                    true, DstPtrInfo, SrcPtrInfo);
4599   }
4600
4601   // FIXME: If the memcpy is volatile (isVol), lowering it to a plain libc
4602   // memcpy is not guaranteed to be safe. libc memcpys aren't required to
4603   // respect volatile, so they may do things like read or write memory
4604   // beyond the given memory regions. But fixing this isn't easy, and most
4605   // people don't care.
4606
4607   // Emit a library call.
4608   TargetLowering::ArgListTy Args;
4609   TargetLowering::ArgListEntry Entry;
4610   Entry.Ty = getDataLayout().getIntPtrType(*getContext());
4611   Entry.Node = Dst; Args.push_back(Entry);
4612   Entry.Node = Src; Args.push_back(Entry);
4613   Entry.Node = Size; Args.push_back(Entry);
4614   // FIXME: pass in SDLoc
4615   TargetLowering::CallLoweringInfo CLI(*this);
4616   CLI.setDebugLoc(dl)
4617       .setChain(Chain)
4618       .setCallee(TLI->getLibcallCallingConv(RTLIB::MEMCPY),
4619                  Type::getVoidTy(*getContext()),
4620                  getExternalSymbol(TLI->getLibcallName(RTLIB::MEMCPY),
4621                                    TLI->getPointerTy(getDataLayout())),
4622                  std::move(Args), 0)
4623       .setDiscardResult()
4624       .setTailCall(isTailCall);
4625
4626   std::pair<SDValue,SDValue> CallResult = TLI->LowerCallTo(CLI);
4627   return CallResult.second;
4628 }
4629
4630 SDValue SelectionDAG::getMemmove(SDValue Chain, SDLoc dl, SDValue Dst,
4631                                  SDValue Src, SDValue Size,
4632                                  unsigned Align, bool isVol, bool isTailCall,
4633                                  MachinePointerInfo DstPtrInfo,
4634                                  MachinePointerInfo SrcPtrInfo) {
4635   assert(Align && "The SDAG layer expects explicit alignment and reserves 0");
4636
4637   // Check to see if we should lower the memmove to loads and stores first.
4638   // For cases within the target-specified limits, this is the best choice.
4639   ConstantSDNode *ConstantSize = dyn_cast<ConstantSDNode>(Size);
4640   if (ConstantSize) {
4641     // Memmove with size zero? Just return the original chain.
4642     if (ConstantSize->isNullValue())
4643       return Chain;
4644
4645     SDValue Result =
4646       getMemmoveLoadsAndStores(*this, dl, Chain, Dst, Src,
4647                                ConstantSize->getZExtValue(), Align, isVol,
4648                                false, DstPtrInfo, SrcPtrInfo);
4649     if (Result.getNode())
4650       return Result;
4651   }
4652
4653   // Then check to see if we should lower the memmove with target-specific
4654   // code. If the target chooses to do this, this is the next best.
4655   if (TSI) {
4656     SDValue Result = TSI->EmitTargetCodeForMemmove(
4657         *this, dl, Chain, Dst, Src, Size, Align, isVol, DstPtrInfo, SrcPtrInfo);
4658     if (Result.getNode())
4659       return Result;
4660   }
4661
4662   // FIXME: If the memmove is volatile, lowering it to plain libc memmove may
4663   // not be safe.  See memcpy above for more details.
4664
4665   // Emit a library call.
4666   TargetLowering::ArgListTy Args;
4667   TargetLowering::ArgListEntry Entry;
4668   Entry.Ty = getDataLayout().getIntPtrType(*getContext());
4669   Entry.Node = Dst; Args.push_back(Entry);
4670   Entry.Node = Src; Args.push_back(Entry);
4671   Entry.Node = Size; Args.push_back(Entry);
4672   // FIXME:  pass in SDLoc
4673   TargetLowering::CallLoweringInfo CLI(*this);
4674   CLI.setDebugLoc(dl)
4675       .setChain(Chain)
4676       .setCallee(TLI->getLibcallCallingConv(RTLIB::MEMMOVE),
4677                  Type::getVoidTy(*getContext()),
4678                  getExternalSymbol(TLI->getLibcallName(RTLIB::MEMMOVE),
4679                                    TLI->getPointerTy(getDataLayout())),
4680                  std::move(Args), 0)
4681       .setDiscardResult()
4682       .setTailCall(isTailCall);
4683
4684   std::pair<SDValue,SDValue> CallResult = TLI->LowerCallTo(CLI);
4685   return CallResult.second;
4686 }
4687
4688 SDValue SelectionDAG::getMemset(SDValue Chain, SDLoc dl, SDValue Dst,
4689                                 SDValue Src, SDValue Size,
4690                                 unsigned Align, bool isVol, bool isTailCall,
4691                                 MachinePointerInfo DstPtrInfo) {
4692   assert(Align && "The SDAG layer expects explicit alignment and reserves 0");
4693
4694   // Check to see if we should lower the memset to stores first.
4695   // For cases within the target-specified limits, this is the best choice.
4696   ConstantSDNode *ConstantSize = dyn_cast<ConstantSDNode>(Size);
4697   if (ConstantSize) {
4698     // Memset with size zero? Just return the original chain.
4699     if (ConstantSize->isNullValue())
4700       return Chain;
4701
4702     SDValue Result =
4703       getMemsetStores(*this, dl, Chain, Dst, Src, ConstantSize->getZExtValue(),
4704                       Align, isVol, DstPtrInfo);
4705
4706     if (Result.getNode())
4707       return Result;
4708   }
4709
4710   // Then check to see if we should lower the memset with target-specific
4711   // code. If the target chooses to do this, this is the next best.
4712   if (TSI) {
4713     SDValue Result = TSI->EmitTargetCodeForMemset(
4714         *this, dl, Chain, Dst, Src, Size, Align, isVol, DstPtrInfo);
4715     if (Result.getNode())
4716       return Result;
4717   }
4718
4719   // Emit a library call.
4720   Type *IntPtrTy = getDataLayout().getIntPtrType(*getContext());
4721   TargetLowering::ArgListTy Args;
4722   TargetLowering::ArgListEntry Entry;
4723   Entry.Node = Dst; Entry.Ty = IntPtrTy;
4724   Args.push_back(Entry);
4725   Entry.Node = Src;
4726   Entry.Ty = Src.getValueType().getTypeForEVT(*getContext());
4727   Args.push_back(Entry);
4728   Entry.Node = Size;
4729   Entry.Ty = IntPtrTy;
4730   Args.push_back(Entry);
4731
4732   // FIXME: pass in SDLoc
4733   TargetLowering::CallLoweringInfo CLI(*this);
4734   CLI.setDebugLoc(dl)
4735       .setChain(Chain)
4736       .setCallee(TLI->getLibcallCallingConv(RTLIB::MEMSET),
4737                  Type::getVoidTy(*getContext()),
4738                  getExternalSymbol(TLI->getLibcallName(RTLIB::MEMSET),
4739                                    TLI->getPointerTy(getDataLayout())),
4740                  std::move(Args), 0)
4741       .setDiscardResult()
4742       .setTailCall(isTailCall);
4743
4744   std::pair<SDValue,SDValue> CallResult = TLI->LowerCallTo(CLI);
4745   return CallResult.second;
4746 }
4747
4748 SDValue SelectionDAG::getAtomic(unsigned Opcode, SDLoc dl, EVT MemVT,
4749                                 SDVTList VTList, ArrayRef<SDValue> Ops,
4750                                 MachineMemOperand *MMO,
4751                                 AtomicOrdering SuccessOrdering,
4752                                 AtomicOrdering FailureOrdering,
4753                                 SynchronizationScope SynchScope) {
4754   FoldingSetNodeID ID;
4755   ID.AddInteger(MemVT.getRawBits());
4756   AddNodeIDNode(ID, Opcode, VTList, Ops);
4757   ID.AddInteger(MMO->getPointerInfo().getAddrSpace());
4758   void* IP = nullptr;
4759   if (SDNode *E = FindNodeOrInsertPos(ID, dl.getDebugLoc(), IP)) {
4760     cast<AtomicSDNode>(E)->refineAlignment(MMO);
4761     return SDValue(E, 0);
4762   }
4763
4764   // Allocate the operands array for the node out of the BumpPtrAllocator, since
4765   // SDNode doesn't have access to it.  This memory will be "leaked" when
4766   // the node is deallocated, but recovered when the allocator is released.
4767   // If the number of operands is less than 5 we use AtomicSDNode's internal
4768   // storage.
4769   unsigned NumOps = Ops.size();
4770   SDUse *DynOps = NumOps > 4 ? OperandAllocator.Allocate<SDUse>(NumOps)
4771                              : nullptr;
4772
4773   SDNode *N = new (NodeAllocator) AtomicSDNode(Opcode, dl.getIROrder(),
4774                                                dl.getDebugLoc(), VTList, MemVT,
4775                                                Ops.data(), DynOps, NumOps, MMO,
4776                                                SuccessOrdering, FailureOrdering,
4777                                                SynchScope);
4778   CSEMap.InsertNode(N, IP);
4779   InsertNode(N);
4780   return SDValue(N, 0);
4781 }
4782
4783 SDValue SelectionDAG::getAtomic(unsigned Opcode, SDLoc dl, EVT MemVT,
4784                                 SDVTList VTList, ArrayRef<SDValue> Ops,
4785                                 MachineMemOperand *MMO,
4786                                 AtomicOrdering Ordering,
4787                                 SynchronizationScope SynchScope) {
4788   return getAtomic(Opcode, dl, MemVT, VTList, Ops, MMO, Ordering,
4789                    Ordering, SynchScope);
4790 }
4791
4792 SDValue SelectionDAG::getAtomicCmpSwap(
4793     unsigned Opcode, SDLoc dl, EVT MemVT, SDVTList VTs, SDValue Chain,
4794     SDValue Ptr, SDValue Cmp, SDValue Swp, MachinePointerInfo PtrInfo,
4795     unsigned Alignment, AtomicOrdering SuccessOrdering,
4796     AtomicOrdering FailureOrdering, SynchronizationScope SynchScope) {
4797   assert(Opcode == ISD::ATOMIC_CMP_SWAP ||
4798          Opcode == ISD::ATOMIC_CMP_SWAP_WITH_SUCCESS);
4799   assert(Cmp.getValueType() == Swp.getValueType() && "Invalid Atomic Op Types");
4800
4801   if (Alignment == 0)  // Ensure that codegen never sees alignment 0
4802     Alignment = getEVTAlignment(MemVT);
4803
4804   MachineFunction &MF = getMachineFunction();
4805
4806   // FIXME: Volatile isn't really correct; we should keep track of atomic
4807   // orderings in the memoperand.
4808   unsigned Flags = MachineMemOperand::MOVolatile;
4809   Flags |= MachineMemOperand::MOLoad;
4810   Flags |= MachineMemOperand::MOStore;
4811
4812   MachineMemOperand *MMO =
4813     MF.getMachineMemOperand(PtrInfo, Flags, MemVT.getStoreSize(), Alignment);
4814
4815   return getAtomicCmpSwap(Opcode, dl, MemVT, VTs, Chain, Ptr, Cmp, Swp, MMO,
4816                           SuccessOrdering, FailureOrdering, SynchScope);
4817 }
4818
4819 SDValue SelectionDAG::getAtomicCmpSwap(unsigned Opcode, SDLoc dl, EVT MemVT,
4820                                        SDVTList VTs, SDValue Chain, SDValue Ptr,
4821                                        SDValue Cmp, SDValue Swp,
4822                                        MachineMemOperand *MMO,
4823                                        AtomicOrdering SuccessOrdering,
4824                                        AtomicOrdering FailureOrdering,
4825                                        SynchronizationScope SynchScope) {
4826   assert(Opcode == ISD::ATOMIC_CMP_SWAP ||
4827          Opcode == ISD::ATOMIC_CMP_SWAP_WITH_SUCCESS);
4828   assert(Cmp.getValueType() == Swp.getValueType() && "Invalid Atomic Op Types");
4829
4830   SDValue Ops[] = {Chain, Ptr, Cmp, Swp};
4831   return getAtomic(Opcode, dl, MemVT, VTs, Ops, MMO,
4832                    SuccessOrdering, FailureOrdering, SynchScope);
4833 }
4834
4835 SDValue SelectionDAG::getAtomic(unsigned Opcode, SDLoc dl, EVT MemVT,
4836                                 SDValue Chain,
4837                                 SDValue Ptr, SDValue Val,
4838                                 const Value* PtrVal,
4839                                 unsigned Alignment,
4840                                 AtomicOrdering Ordering,
4841                                 SynchronizationScope SynchScope) {
4842   if (Alignment == 0)  // Ensure that codegen never sees alignment 0
4843     Alignment = getEVTAlignment(MemVT);
4844
4845   MachineFunction &MF = getMachineFunction();
4846   // An atomic store does not load. An atomic load does not store.
4847   // (An atomicrmw obviously both loads and stores.)
4848   // For now, atomics are considered to be volatile always, and they are
4849   // chained as such.
4850   // FIXME: Volatile isn't really correct; we should keep track of atomic
4851   // orderings in the memoperand.
4852   unsigned Flags = MachineMemOperand::MOVolatile;
4853   if (Opcode != ISD::ATOMIC_STORE)
4854     Flags |= MachineMemOperand::MOLoad;
4855   if (Opcode != ISD::ATOMIC_LOAD)
4856     Flags |= MachineMemOperand::MOStore;
4857
4858   MachineMemOperand *MMO =
4859     MF.getMachineMemOperand(MachinePointerInfo(PtrVal), Flags,
4860                             MemVT.getStoreSize(), Alignment);
4861
4862   return getAtomic(Opcode, dl, MemVT, Chain, Ptr, Val, MMO,
4863                    Ordering, SynchScope);
4864 }
4865
4866 SDValue SelectionDAG::getAtomic(unsigned Opcode, SDLoc dl, EVT MemVT,
4867                                 SDValue Chain,
4868                                 SDValue Ptr, SDValue Val,
4869                                 MachineMemOperand *MMO,
4870                                 AtomicOrdering Ordering,
4871                                 SynchronizationScope SynchScope) {
4872   assert((Opcode == ISD::ATOMIC_LOAD_ADD ||
4873           Opcode == ISD::ATOMIC_LOAD_SUB ||
4874           Opcode == ISD::ATOMIC_LOAD_AND ||
4875           Opcode == ISD::ATOMIC_LOAD_OR ||
4876           Opcode == ISD::ATOMIC_LOAD_XOR ||
4877           Opcode == ISD::ATOMIC_LOAD_NAND ||
4878           Opcode == ISD::ATOMIC_LOAD_MIN ||
4879           Opcode == ISD::ATOMIC_LOAD_MAX ||
4880           Opcode == ISD::ATOMIC_LOAD_UMIN ||
4881           Opcode == ISD::ATOMIC_LOAD_UMAX ||
4882           Opcode == ISD::ATOMIC_SWAP ||
4883           Opcode == ISD::ATOMIC_STORE) &&
4884          "Invalid Atomic Op");
4885
4886   EVT VT = Val.getValueType();
4887
4888   SDVTList VTs = Opcode == ISD::ATOMIC_STORE ? getVTList(MVT::Other) :
4889                                                getVTList(VT, MVT::Other);
4890   SDValue Ops[] = {Chain, Ptr, Val};
4891   return getAtomic(Opcode, dl, MemVT, VTs, Ops, MMO, Ordering, SynchScope);
4892 }
4893
4894 SDValue SelectionDAG::getAtomic(unsigned Opcode, SDLoc dl, EVT MemVT,
4895                                 EVT VT, SDValue Chain,
4896                                 SDValue Ptr,
4897                                 MachineMemOperand *MMO,
4898                                 AtomicOrdering Ordering,
4899                                 SynchronizationScope SynchScope) {
4900   assert(Opcode == ISD::ATOMIC_LOAD && "Invalid Atomic Op");
4901
4902   SDVTList VTs = getVTList(VT, MVT::Other);
4903   SDValue Ops[] = {Chain, Ptr};
4904   return getAtomic(Opcode, dl, MemVT, VTs, Ops, MMO, Ordering, SynchScope);
4905 }
4906
4907 /// getMergeValues - Create a MERGE_VALUES node from the given operands.
4908 SDValue SelectionDAG::getMergeValues(ArrayRef<SDValue> Ops, SDLoc dl) {
4909   if (Ops.size() == 1)
4910     return Ops[0];
4911
4912   SmallVector<EVT, 4> VTs;
4913   VTs.reserve(Ops.size());
4914   for (unsigned i = 0; i < Ops.size(); ++i)
4915     VTs.push_back(Ops[i].getValueType());
4916   return getNode(ISD::MERGE_VALUES, dl, getVTList(VTs), Ops);
4917 }
4918
4919 SDValue
4920 SelectionDAG::getMemIntrinsicNode(unsigned Opcode, SDLoc dl, SDVTList VTList,
4921                                   ArrayRef<SDValue> Ops,
4922                                   EVT MemVT, MachinePointerInfo PtrInfo,
4923                                   unsigned Align, bool Vol,
4924                                   bool ReadMem, bool WriteMem, unsigned Size) {
4925   if (Align == 0)  // Ensure that codegen never sees alignment 0
4926     Align = getEVTAlignment(MemVT);
4927
4928   MachineFunction &MF = getMachineFunction();
4929   unsigned Flags = 0;
4930   if (WriteMem)
4931     Flags |= MachineMemOperand::MOStore;
4932   if (ReadMem)
4933     Flags |= MachineMemOperand::MOLoad;
4934   if (Vol)
4935     Flags |= MachineMemOperand::MOVolatile;
4936   if (!Size)
4937     Size = MemVT.getStoreSize();
4938   MachineMemOperand *MMO =
4939     MF.getMachineMemOperand(PtrInfo, Flags, Size, Align);
4940
4941   return getMemIntrinsicNode(Opcode, dl, VTList, Ops, MemVT, MMO);
4942 }
4943
4944 SDValue
4945 SelectionDAG::getMemIntrinsicNode(unsigned Opcode, SDLoc dl, SDVTList VTList,
4946                                   ArrayRef<SDValue> Ops, EVT MemVT,
4947                                   MachineMemOperand *MMO) {
4948   assert((Opcode == ISD::INTRINSIC_VOID ||
4949           Opcode == ISD::INTRINSIC_W_CHAIN ||
4950           Opcode == ISD::PREFETCH ||
4951           Opcode == ISD::LIFETIME_START ||
4952           Opcode == ISD::LIFETIME_END ||
4953           (Opcode <= INT_MAX &&
4954            (int)Opcode >= ISD::FIRST_TARGET_MEMORY_OPCODE)) &&
4955          "Opcode is not a memory-accessing opcode!");
4956
4957   // Memoize the node unless it returns a flag.
4958   MemIntrinsicSDNode *N;
4959   if (VTList.VTs[VTList.NumVTs-1] != MVT::Glue) {
4960     FoldingSetNodeID ID;
4961     AddNodeIDNode(ID, Opcode, VTList, Ops);
4962     ID.AddInteger(MMO->getPointerInfo().getAddrSpace());
4963     void *IP = nullptr;
4964     if (SDNode *E = FindNodeOrInsertPos(ID, dl.getDebugLoc(), IP)) {
4965       cast<MemIntrinsicSDNode>(E)->refineAlignment(MMO);
4966       return SDValue(E, 0);
4967     }
4968
4969     N = new (NodeAllocator) MemIntrinsicSDNode(Opcode, dl.getIROrder(),
4970                                                dl.getDebugLoc(), VTList, Ops,
4971                                                MemVT, MMO);
4972     CSEMap.InsertNode(N, IP);
4973   } else {
4974     N = new (NodeAllocator) MemIntrinsicSDNode(Opcode, dl.getIROrder(),
4975                                                dl.getDebugLoc(), VTList, Ops,
4976                                                MemVT, MMO);
4977   }
4978   InsertNode(N);
4979   return SDValue(N, 0);
4980 }
4981
4982 /// InferPointerInfo - If the specified ptr/offset is a frame index, infer a
4983 /// MachinePointerInfo record from it.  This is particularly useful because the
4984 /// code generator has many cases where it doesn't bother passing in a
4985 /// MachinePointerInfo to getLoad or getStore when it has "FI+Cst".
4986 static MachinePointerInfo InferPointerInfo(SelectionDAG &DAG, SDValue Ptr,
4987                                            int64_t Offset = 0) {
4988   // If this is FI+Offset, we can model it.
4989   if (const FrameIndexSDNode *FI = dyn_cast<FrameIndexSDNode>(Ptr))
4990     return MachinePointerInfo::getFixedStack(DAG.getMachineFunction(),
4991                                              FI->getIndex(), Offset);
4992
4993   // If this is (FI+Offset1)+Offset2, we can model it.
4994   if (Ptr.getOpcode() != ISD::ADD ||
4995       !isa<ConstantSDNode>(Ptr.getOperand(1)) ||
4996       !isa<FrameIndexSDNode>(Ptr.getOperand(0)))
4997     return MachinePointerInfo();
4998
4999   int FI = cast<FrameIndexSDNode>(Ptr.getOperand(0))->getIndex();
5000   return MachinePointerInfo::getFixedStack(
5001       DAG.getMachineFunction(), FI,
5002       Offset + cast<ConstantSDNode>(Ptr.getOperand(1))->getSExtValue());
5003 }
5004
5005 /// InferPointerInfo - If the specified ptr/offset is a frame index, infer a
5006 /// MachinePointerInfo record from it.  This is particularly useful because the
5007 /// code generator has many cases where it doesn't bother passing in a
5008 /// MachinePointerInfo to getLoad or getStore when it has "FI+Cst".
5009 static MachinePointerInfo InferPointerInfo(SelectionDAG &DAG, SDValue Ptr,
5010                                            SDValue OffsetOp) {
5011   // If the 'Offset' value isn't a constant, we can't handle this.
5012   if (ConstantSDNode *OffsetNode = dyn_cast<ConstantSDNode>(OffsetOp))
5013     return InferPointerInfo(DAG, Ptr, OffsetNode->getSExtValue());
5014   if (OffsetOp.getOpcode() == ISD::UNDEF)
5015     return InferPointerInfo(DAG, Ptr);
5016   return MachinePointerInfo();
5017 }
5018
5019
5020 SDValue
5021 SelectionDAG::getLoad(ISD::MemIndexedMode AM, ISD::LoadExtType ExtType,
5022                       EVT VT, SDLoc dl, SDValue Chain,
5023                       SDValue Ptr, SDValue Offset,
5024                       MachinePointerInfo PtrInfo, EVT MemVT,
5025                       bool isVolatile, bool isNonTemporal, bool isInvariant,
5026                       unsigned Alignment, const AAMDNodes &AAInfo,
5027                       const MDNode *Ranges) {
5028   assert(Chain.getValueType() == MVT::Other &&
5029         "Invalid chain type");
5030   if (Alignment == 0)  // Ensure that codegen never sees alignment 0
5031     Alignment = getEVTAlignment(VT);
5032
5033   unsigned Flags = MachineMemOperand::MOLoad;
5034   if (isVolatile)
5035     Flags |= MachineMemOperand::MOVolatile;
5036   if (isNonTemporal)
5037     Flags |= MachineMemOperand::MONonTemporal;
5038   if (isInvariant)
5039     Flags |= MachineMemOperand::MOInvariant;
5040
5041   // If we don't have a PtrInfo, infer the trivial frame index case to simplify
5042   // clients.
5043   if (PtrInfo.V.isNull())
5044     PtrInfo = InferPointerInfo(*this, Ptr, Offset);
5045
5046   MachineFunction &MF = getMachineFunction();
5047   MachineMemOperand *MMO =
5048     MF.getMachineMemOperand(PtrInfo, Flags, MemVT.getStoreSize(), Alignment,
5049                             AAInfo, Ranges);
5050   return getLoad(AM, ExtType, VT, dl, Chain, Ptr, Offset, MemVT, MMO);
5051 }
5052
5053 SDValue
5054 SelectionDAG::getLoad(ISD::MemIndexedMode AM, ISD::LoadExtType ExtType,
5055                       EVT VT, SDLoc dl, SDValue Chain,
5056                       SDValue Ptr, SDValue Offset, EVT MemVT,
5057                       MachineMemOperand *MMO) {
5058   if (VT == MemVT) {
5059     ExtType = ISD::NON_EXTLOAD;
5060   } else if (ExtType == ISD::NON_EXTLOAD) {
5061     assert(VT == MemVT && "Non-extending load from different memory type!");
5062   } else {
5063     // Extending load.
5064     assert(MemVT.getScalarType().bitsLT(VT.getScalarType()) &&
5065            "Should only be an extending load, not truncating!");
5066     assert(VT.isInteger() == MemVT.isInteger() &&
5067            "Cannot convert from FP to Int or Int -> FP!");
5068     assert(VT.isVector() == MemVT.isVector() &&
5069            "Cannot use an ext load to convert to or from a vector!");
5070     assert((!VT.isVector() ||
5071             VT.getVectorNumElements() == MemVT.getVectorNumElements()) &&
5072            "Cannot use an ext load to change the number of vector elements!");
5073   }
5074
5075   bool Indexed = AM != ISD::UNINDEXED;
5076   assert((Indexed || Offset.getOpcode() == ISD::UNDEF) &&
5077          "Unindexed load with an offset!");
5078
5079   SDVTList VTs = Indexed ?
5080     getVTList(VT, Ptr.getValueType(), MVT::Other) : getVTList(VT, MVT::Other);
5081   SDValue Ops[] = { Chain, Ptr, Offset };
5082   FoldingSetNodeID ID;
5083   AddNodeIDNode(ID, ISD::LOAD, VTs, Ops);
5084   ID.AddInteger(MemVT.getRawBits());
5085   ID.AddInteger(encodeMemSDNodeFlags(ExtType, AM, MMO->isVolatile(),
5086                                      MMO->isNonTemporal(),
5087                                      MMO->isInvariant()));
5088   ID.AddInteger(MMO->getPointerInfo().getAddrSpace());
5089   void *IP = nullptr;
5090   if (SDNode *E = FindNodeOrInsertPos(ID, dl.getDebugLoc(), IP)) {
5091     cast<LoadSDNode>(E)->refineAlignment(MMO);
5092     return SDValue(E, 0);
5093   }
5094   SDNode *N = new (NodeAllocator) LoadSDNode(Ops, dl.getIROrder(),
5095                                              dl.getDebugLoc(), VTs, AM, ExtType,
5096                                              MemVT, MMO);
5097   CSEMap.InsertNode(N, IP);
5098   InsertNode(N);
5099   return SDValue(N, 0);
5100 }
5101
5102 SDValue SelectionDAG::getLoad(EVT VT, SDLoc dl,
5103                               SDValue Chain, SDValue Ptr,
5104                               MachinePointerInfo PtrInfo,
5105                               bool isVolatile, bool isNonTemporal,
5106                               bool isInvariant, unsigned Alignment,
5107                               const AAMDNodes &AAInfo,
5108                               const MDNode *Ranges) {
5109   SDValue Undef = getUNDEF(Ptr.getValueType());
5110   return getLoad(ISD::UNINDEXED, ISD::NON_EXTLOAD, VT, dl, Chain, Ptr, Undef,
5111                  PtrInfo, VT, isVolatile, isNonTemporal, isInvariant, Alignment,
5112                  AAInfo, Ranges);
5113 }
5114
5115 SDValue SelectionDAG::getLoad(EVT VT, SDLoc dl,
5116                               SDValue Chain, SDValue Ptr,
5117                               MachineMemOperand *MMO) {
5118   SDValue Undef = getUNDEF(Ptr.getValueType());
5119   return getLoad(ISD::UNINDEXED, ISD::NON_EXTLOAD, VT, dl, Chain, Ptr, Undef,
5120                  VT, MMO);
5121 }
5122
5123 SDValue SelectionDAG::getExtLoad(ISD::LoadExtType ExtType, SDLoc dl, EVT VT,
5124                                  SDValue Chain, SDValue Ptr,
5125                                  MachinePointerInfo PtrInfo, EVT MemVT,
5126                                  bool isVolatile, bool isNonTemporal,
5127                                  bool isInvariant, unsigned Alignment,
5128                                  const AAMDNodes &AAInfo) {
5129   SDValue Undef = getUNDEF(Ptr.getValueType());
5130   return getLoad(ISD::UNINDEXED, ExtType, VT, dl, Chain, Ptr, Undef,
5131                  PtrInfo, MemVT, isVolatile, isNonTemporal, isInvariant,
5132                  Alignment, AAInfo);
5133 }
5134
5135
5136 SDValue SelectionDAG::getExtLoad(ISD::LoadExtType ExtType, SDLoc dl, EVT VT,
5137                                  SDValue Chain, SDValue Ptr, EVT MemVT,
5138                                  MachineMemOperand *MMO) {
5139   SDValue Undef = getUNDEF(Ptr.getValueType());
5140   return getLoad(ISD::UNINDEXED, ExtType, VT, dl, Chain, Ptr, Undef,
5141                  MemVT, MMO);
5142 }
5143
5144 SDValue
5145 SelectionDAG::getIndexedLoad(SDValue OrigLoad, SDLoc dl, SDValue Base,
5146                              SDValue Offset, ISD::MemIndexedMode AM) {
5147   LoadSDNode *LD = cast<LoadSDNode>(OrigLoad);
5148   assert(LD->getOffset().getOpcode() == ISD::UNDEF &&
5149          "Load is already a indexed load!");
5150   return getLoad(AM, LD->getExtensionType(), OrigLoad.getValueType(), dl,
5151                  LD->getChain(), Base, Offset, LD->getPointerInfo(),
5152                  LD->getMemoryVT(), LD->isVolatile(), LD->isNonTemporal(),
5153                  false, LD->getAlignment());
5154 }
5155
5156 SDValue SelectionDAG::getStore(SDValue Chain, SDLoc dl, SDValue Val,
5157                                SDValue Ptr, MachinePointerInfo PtrInfo,
5158                                bool isVolatile, bool isNonTemporal,
5159                                unsigned Alignment, const AAMDNodes &AAInfo) {
5160   assert(Chain.getValueType() == MVT::Other &&
5161         "Invalid chain type");
5162   if (Alignment == 0)  // Ensure that codegen never sees alignment 0
5163     Alignment = getEVTAlignment(Val.getValueType());
5164
5165   unsigned Flags = MachineMemOperand::MOStore;
5166   if (isVolatile)
5167     Flags |= MachineMemOperand::MOVolatile;
5168   if (isNonTemporal)
5169     Flags |= MachineMemOperand::MONonTemporal;
5170
5171   if (PtrInfo.V.isNull())
5172     PtrInfo = InferPointerInfo(*this, Ptr);
5173
5174   MachineFunction &MF = getMachineFunction();
5175   MachineMemOperand *MMO =
5176     MF.getMachineMemOperand(PtrInfo, Flags,
5177                             Val.getValueType().getStoreSize(), Alignment,
5178                             AAInfo);
5179
5180   return getStore(Chain, dl, Val, Ptr, MMO);
5181 }
5182
5183 SDValue SelectionDAG::getStore(SDValue Chain, SDLoc dl, SDValue Val,
5184                                SDValue Ptr, MachineMemOperand *MMO) {
5185   assert(Chain.getValueType() == MVT::Other &&
5186         "Invalid chain type");
5187   EVT VT = Val.getValueType();
5188   SDVTList VTs = getVTList(MVT::Other);
5189   SDValue Undef = getUNDEF(Ptr.getValueType());
5190   SDValue Ops[] = { Chain, Val, Ptr, Undef };
5191   FoldingSetNodeID ID;
5192   AddNodeIDNode(ID, ISD::STORE, VTs, Ops);
5193   ID.AddInteger(VT.getRawBits());
5194   ID.AddInteger(encodeMemSDNodeFlags(false, ISD::UNINDEXED, MMO->isVolatile(),
5195                                      MMO->isNonTemporal(), MMO->isInvariant()));
5196   ID.AddInteger(MMO->getPointerInfo().getAddrSpace());
5197   void *IP = nullptr;
5198   if (SDNode *E = FindNodeOrInsertPos(ID, dl.getDebugLoc(), IP)) {
5199     cast<StoreSDNode>(E)->refineAlignment(MMO);
5200     return SDValue(E, 0);
5201   }
5202   SDNode *N = new (NodeAllocator) StoreSDNode(Ops, dl.getIROrder(),
5203                                               dl.getDebugLoc(), VTs,
5204                                               ISD::UNINDEXED, false, VT, MMO);
5205   CSEMap.InsertNode(N, IP);
5206   InsertNode(N);
5207   return SDValue(N, 0);
5208 }
5209
5210 SDValue SelectionDAG::getTruncStore(SDValue Chain, SDLoc dl, SDValue Val,
5211                                     SDValue Ptr, MachinePointerInfo PtrInfo,
5212                                     EVT SVT,bool isVolatile, bool isNonTemporal,
5213                                     unsigned Alignment,
5214                                     const AAMDNodes &AAInfo) {
5215   assert(Chain.getValueType() == MVT::Other &&
5216         "Invalid chain type");
5217   if (Alignment == 0)  // Ensure that codegen never sees alignment 0
5218     Alignment = getEVTAlignment(SVT);
5219
5220   unsigned Flags = MachineMemOperand::MOStore;
5221   if (isVolatile)
5222     Flags |= MachineMemOperand::MOVolatile;
5223   if (isNonTemporal)
5224     Flags |= MachineMemOperand::MONonTemporal;
5225
5226   if (PtrInfo.V.isNull())
5227     PtrInfo = InferPointerInfo(*this, Ptr);
5228
5229   MachineFunction &MF = getMachineFunction();
5230   MachineMemOperand *MMO =
5231     MF.getMachineMemOperand(PtrInfo, Flags, SVT.getStoreSize(), Alignment,
5232                             AAInfo);
5233
5234   return getTruncStore(Chain, dl, Val, Ptr, SVT, MMO);
5235 }
5236
5237 SDValue SelectionDAG::getTruncStore(SDValue Chain, SDLoc dl, SDValue Val,
5238                                     SDValue Ptr, EVT SVT,
5239                                     MachineMemOperand *MMO) {
5240   EVT VT = Val.getValueType();
5241
5242   assert(Chain.getValueType() == MVT::Other &&
5243         "Invalid chain type");
5244   if (VT == SVT)
5245     return getStore(Chain, dl, Val, Ptr, MMO);
5246
5247   assert(SVT.getScalarType().bitsLT(VT.getScalarType()) &&
5248          "Should only be a truncating store, not extending!");
5249   assert(VT.isInteger() == SVT.isInteger() &&
5250          "Can't do FP-INT conversion!");
5251   assert(VT.isVector() == SVT.isVector() &&
5252          "Cannot use trunc store to convert to or from a vector!");
5253   assert((!VT.isVector() ||
5254           VT.getVectorNumElements() == SVT.getVectorNumElements()) &&
5255          "Cannot use trunc store to change the number of vector elements!");
5256
5257   SDVTList VTs = getVTList(MVT::Other);
5258   SDValue Undef = getUNDEF(Ptr.getValueType());
5259   SDValue Ops[] = { Chain, Val, Ptr, Undef };
5260   FoldingSetNodeID ID;
5261   AddNodeIDNode(ID, ISD::STORE, VTs, Ops);
5262   ID.AddInteger(SVT.getRawBits());
5263   ID.AddInteger(encodeMemSDNodeFlags(true, ISD::UNINDEXED, MMO->isVolatile(),
5264                                      MMO->isNonTemporal(), MMO->isInvariant()));
5265   ID.AddInteger(MMO->getPointerInfo().getAddrSpace());
5266   void *IP = nullptr;
5267   if (SDNode *E = FindNodeOrInsertPos(ID, dl.getDebugLoc(), IP)) {
5268     cast<StoreSDNode>(E)->refineAlignment(MMO);
5269     return SDValue(E, 0);
5270   }
5271   SDNode *N = new (NodeAllocator) StoreSDNode(Ops, dl.getIROrder(),
5272                                               dl.getDebugLoc(), VTs,
5273                                               ISD::UNINDEXED, true, SVT, MMO);
5274   CSEMap.InsertNode(N, IP);
5275   InsertNode(N);
5276   return SDValue(N, 0);
5277 }
5278
5279 SDValue
5280 SelectionDAG::getIndexedStore(SDValue OrigStore, SDLoc dl, SDValue Base,
5281                               SDValue Offset, ISD::MemIndexedMode AM) {
5282   StoreSDNode *ST = cast<StoreSDNode>(OrigStore);
5283   assert(ST->getOffset().getOpcode() == ISD::UNDEF &&
5284          "Store is already a indexed store!");
5285   SDVTList VTs = getVTList(Base.getValueType(), MVT::Other);
5286   SDValue Ops[] = { ST->getChain(), ST->getValue(), Base, Offset };
5287   FoldingSetNodeID ID;
5288   AddNodeIDNode(ID, ISD::STORE, VTs, Ops);
5289   ID.AddInteger(ST->getMemoryVT().getRawBits());
5290   ID.AddInteger(ST->getRawSubclassData());
5291   ID.AddInteger(ST->getPointerInfo().getAddrSpace());
5292   void *IP = nullptr;
5293   if (SDNode *E = FindNodeOrInsertPos(ID, dl.getDebugLoc(), IP))
5294     return SDValue(E, 0);
5295
5296   SDNode *N = new (NodeAllocator) StoreSDNode(Ops, dl.getIROrder(),
5297                                               dl.getDebugLoc(), VTs, AM,
5298                                               ST->isTruncatingStore(),
5299                                               ST->getMemoryVT(),
5300                                               ST->getMemOperand());
5301   CSEMap.InsertNode(N, IP);
5302   InsertNode(N);
5303   return SDValue(N, 0);
5304 }
5305
5306 SDValue
5307 SelectionDAG::getMaskedLoad(EVT VT, SDLoc dl, SDValue Chain,
5308                             SDValue Ptr, SDValue Mask, SDValue Src0, EVT MemVT,
5309                             MachineMemOperand *MMO, ISD::LoadExtType ExtTy) {
5310
5311   SDVTList VTs = getVTList(VT, MVT::Other);
5312   SDValue Ops[] = { Chain, Ptr, Mask, Src0 };
5313   FoldingSetNodeID ID;
5314   AddNodeIDNode(ID, ISD::MLOAD, VTs, Ops);
5315   ID.AddInteger(VT.getRawBits());
5316   ID.AddInteger(encodeMemSDNodeFlags(ExtTy, ISD::UNINDEXED,
5317                                      MMO->isVolatile(),
5318                                      MMO->isNonTemporal(),
5319                                      MMO->isInvariant()));
5320   ID.AddInteger(MMO->getPointerInfo().getAddrSpace());
5321   void *IP = nullptr;
5322   if (SDNode *E = FindNodeOrInsertPos(ID, dl.getDebugLoc(), IP)) {
5323     cast<MaskedLoadSDNode>(E)->refineAlignment(MMO);
5324     return SDValue(E, 0);
5325   }
5326   SDNode *N = new (NodeAllocator) MaskedLoadSDNode(dl.getIROrder(),
5327                                              dl.getDebugLoc(), Ops, 4, VTs,
5328                                              ExtTy, MemVT, MMO);
5329   CSEMap.InsertNode(N, IP);
5330   InsertNode(N);
5331   return SDValue(N, 0);
5332 }
5333
5334 SDValue SelectionDAG::getMaskedStore(SDValue Chain, SDLoc dl, SDValue Val,
5335                                      SDValue Ptr, SDValue Mask, EVT MemVT,
5336                                      MachineMemOperand *MMO, bool isTrunc) {
5337   assert(Chain.getValueType() == MVT::Other &&
5338         "Invalid chain type");
5339   EVT VT = Val.getValueType();
5340   SDVTList VTs = getVTList(MVT::Other);
5341   SDValue Ops[] = { Chain, Ptr, Mask, Val };
5342   FoldingSetNodeID ID;
5343   AddNodeIDNode(ID, ISD::MSTORE, VTs, Ops);
5344   ID.AddInteger(VT.getRawBits());
5345   ID.AddInteger(encodeMemSDNodeFlags(false, ISD::UNINDEXED, MMO->isVolatile(),
5346                                      MMO->isNonTemporal(), MMO->isInvariant()));
5347   ID.AddInteger(MMO->getPointerInfo().getAddrSpace());
5348   void *IP = nullptr;
5349   if (SDNode *E = FindNodeOrInsertPos(ID, dl.getDebugLoc(), IP)) {
5350     cast<MaskedStoreSDNode>(E)->refineAlignment(MMO);
5351     return SDValue(E, 0);
5352   }
5353   SDNode *N = new (NodeAllocator) MaskedStoreSDNode(dl.getIROrder(),
5354                                                     dl.getDebugLoc(), Ops, 4,
5355                                                     VTs, isTrunc, MemVT, MMO);
5356   CSEMap.InsertNode(N, IP);
5357   InsertNode(N);
5358   return SDValue(N, 0);
5359 }
5360
5361 SDValue
5362 SelectionDAG::getMaskedGather(SDVTList VTs, EVT VT, SDLoc dl,
5363                               ArrayRef<SDValue> Ops,
5364                               MachineMemOperand *MMO) {
5365
5366   FoldingSetNodeID ID;
5367   AddNodeIDNode(ID, ISD::MGATHER, VTs, Ops);
5368   ID.AddInteger(VT.getRawBits());
5369   ID.AddInteger(encodeMemSDNodeFlags(ISD::NON_EXTLOAD, ISD::UNINDEXED,
5370                                      MMO->isVolatile(),
5371                                      MMO->isNonTemporal(),
5372                                      MMO->isInvariant()));
5373   ID.AddInteger(MMO->getPointerInfo().getAddrSpace());
5374   void *IP = nullptr;
5375   if (SDNode *E = FindNodeOrInsertPos(ID, dl.getDebugLoc(), IP)) {
5376     cast<MaskedGatherSDNode>(E)->refineAlignment(MMO);
5377     return SDValue(E, 0);
5378   }
5379   MaskedGatherSDNode *N =
5380     new (NodeAllocator) MaskedGatherSDNode(dl.getIROrder(), dl.getDebugLoc(),
5381                                            Ops, VTs, VT, MMO);
5382   CSEMap.InsertNode(N, IP);
5383   InsertNode(N);
5384   return SDValue(N, 0);
5385 }
5386
5387 SDValue SelectionDAG::getMaskedScatter(SDVTList VTs, EVT VT, SDLoc dl,
5388                                        ArrayRef<SDValue> Ops,
5389                                        MachineMemOperand *MMO) {
5390   FoldingSetNodeID ID;
5391   AddNodeIDNode(ID, ISD::MSCATTER, VTs, Ops);
5392   ID.AddInteger(VT.getRawBits());
5393   ID.AddInteger(encodeMemSDNodeFlags(false, ISD::UNINDEXED, MMO->isVolatile(),
5394                                      MMO->isNonTemporal(),
5395                                      MMO->isInvariant()));
5396   ID.AddInteger(MMO->getPointerInfo().getAddrSpace());
5397   void *IP = nullptr;
5398   if (SDNode *E = FindNodeOrInsertPos(ID, dl.getDebugLoc(), IP)) {
5399     cast<MaskedScatterSDNode>(E)->refineAlignment(MMO);
5400     return SDValue(E, 0);
5401   }
5402   SDNode *N =
5403     new (NodeAllocator) MaskedScatterSDNode(dl.getIROrder(), dl.getDebugLoc(),
5404                                             Ops, VTs, VT, MMO);
5405   CSEMap.InsertNode(N, IP);
5406   InsertNode(N);
5407   return SDValue(N, 0);
5408 }
5409
5410 SDValue SelectionDAG::getVAArg(EVT VT, SDLoc dl,
5411                                SDValue Chain, SDValue Ptr,
5412                                SDValue SV,
5413                                unsigned Align) {
5414   SDValue Ops[] = { Chain, Ptr, SV, getTargetConstant(Align, dl, MVT::i32) };
5415   return getNode(ISD::VAARG, dl, getVTList(VT, MVT::Other), Ops);
5416 }
5417
5418 SDValue SelectionDAG::getNode(unsigned Opcode, SDLoc DL, EVT VT,
5419                               ArrayRef<SDUse> Ops) {
5420   switch (Ops.size()) {
5421   case 0: return getNode(Opcode, DL, VT);
5422   case 1: return getNode(Opcode, DL, VT, static_cast<const SDValue>(Ops[0]));
5423   case 2: return getNode(Opcode, DL, VT, Ops[0], Ops[1]);
5424   case 3: return getNode(Opcode, DL, VT, Ops[0], Ops[1], Ops[2]);
5425   default: break;
5426   }
5427
5428   // Copy from an SDUse array into an SDValue array for use with
5429   // the regular getNode logic.
5430   SmallVector<SDValue, 8> NewOps(Ops.begin(), Ops.end());
5431   return getNode(Opcode, DL, VT, NewOps);
5432 }
5433
5434 SDValue SelectionDAG::getNode(unsigned Opcode, SDLoc DL, EVT VT,
5435                               ArrayRef<SDValue> Ops, const SDNodeFlags *Flags) {
5436   unsigned NumOps = Ops.size();
5437   switch (NumOps) {
5438   case 0: return getNode(Opcode, DL, VT);
5439   case 1: return getNode(Opcode, DL, VT, Ops[0]);
5440   case 2: return getNode(Opcode, DL, VT, Ops[0], Ops[1], Flags);
5441   case 3: return getNode(Opcode, DL, VT, Ops[0], Ops[1], Ops[2]);
5442   default: break;
5443   }
5444
5445   switch (Opcode) {
5446   default: break;
5447   case ISD::SELECT_CC: {
5448     assert(NumOps == 5 && "SELECT_CC takes 5 operands!");
5449     assert(Ops[0].getValueType() == Ops[1].getValueType() &&
5450            "LHS and RHS of condition must have same type!");
5451     assert(Ops[2].getValueType() == Ops[3].getValueType() &&
5452            "True and False arms of SelectCC must have same type!");
5453     assert(Ops[2].getValueType() == VT &&
5454            "select_cc node must be of same type as true and false value!");
5455     break;
5456   }
5457   case ISD::BR_CC: {
5458     assert(NumOps == 5 && "BR_CC takes 5 operands!");
5459     assert(Ops[2].getValueType() == Ops[3].getValueType() &&
5460            "LHS/RHS of comparison should match types!");
5461     break;
5462   }
5463   }
5464
5465   // Memoize nodes.
5466   SDNode *N;
5467   SDVTList VTs = getVTList(VT);
5468
5469   if (VT != MVT::Glue) {
5470     FoldingSetNodeID ID;
5471     AddNodeIDNode(ID, Opcode, VTs, Ops);
5472     void *IP = nullptr;
5473
5474     if (SDNode *E = FindNodeOrInsertPos(ID, DL.getDebugLoc(), IP))
5475       return SDValue(E, 0);
5476
5477     N = new (NodeAllocator) SDNode(Opcode, DL.getIROrder(), DL.getDebugLoc(),
5478                                    VTs, Ops);
5479     CSEMap.InsertNode(N, IP);
5480   } else {
5481     N = new (NodeAllocator) SDNode(Opcode, DL.getIROrder(), DL.getDebugLoc(),
5482                                    VTs, Ops);
5483   }
5484
5485   InsertNode(N);
5486   return SDValue(N, 0);
5487 }
5488
5489 SDValue SelectionDAG::getNode(unsigned Opcode, SDLoc DL,
5490                               ArrayRef<EVT> ResultTys, ArrayRef<SDValue> Ops) {
5491   return getNode(Opcode, DL, getVTList(ResultTys), Ops);
5492 }
5493
5494 SDValue SelectionDAG::getNode(unsigned Opcode, SDLoc DL, SDVTList VTList,
5495                               ArrayRef<SDValue> Ops) {
5496   if (VTList.NumVTs == 1)
5497     return getNode(Opcode, DL, VTList.VTs[0], Ops);
5498
5499 #if 0
5500   switch (Opcode) {
5501   // FIXME: figure out how to safely handle things like
5502   // int foo(int x) { return 1 << (x & 255); }
5503   // int bar() { return foo(256); }
5504   case ISD::SRA_PARTS:
5505   case ISD::SRL_PARTS:
5506   case ISD::SHL_PARTS:
5507     if (N3.getOpcode() == ISD::SIGN_EXTEND_INREG &&
5508         cast<VTSDNode>(N3.getOperand(1))->getVT() != MVT::i1)
5509       return getNode(Opcode, DL, VT, N1, N2, N3.getOperand(0));
5510     else if (N3.getOpcode() == ISD::AND)
5511       if (ConstantSDNode *AndRHS = dyn_cast<ConstantSDNode>(N3.getOperand(1))) {
5512         // If the and is only masking out bits that cannot effect the shift,
5513         // eliminate the and.
5514         unsigned NumBits = VT.getScalarType().getSizeInBits()*2;
5515         if ((AndRHS->getValue() & (NumBits-1)) == NumBits-1)
5516           return getNode(Opcode, DL, VT, N1, N2, N3.getOperand(0));
5517       }
5518     break;
5519   }
5520 #endif
5521
5522   // Memoize the node unless it returns a flag.
5523   SDNode *N;
5524   unsigned NumOps = Ops.size();
5525   if (VTList.VTs[VTList.NumVTs-1] != MVT::Glue) {
5526     FoldingSetNodeID ID;
5527     AddNodeIDNode(ID, Opcode, VTList, Ops);
5528     void *IP = nullptr;
5529     if (SDNode *E = FindNodeOrInsertPos(ID, DL.getDebugLoc(), IP))
5530       return SDValue(E, 0);
5531
5532     if (NumOps == 1) {
5533       N = new (NodeAllocator) UnarySDNode(Opcode, DL.getIROrder(),
5534                                           DL.getDebugLoc(), VTList, Ops[0]);
5535     } else if (NumOps == 2) {
5536       N = new (NodeAllocator) BinarySDNode(Opcode, DL.getIROrder(),
5537                                            DL.getDebugLoc(), VTList, Ops[0],
5538                                            Ops[1]);
5539     } else if (NumOps == 3) {
5540       N = new (NodeAllocator) TernarySDNode(Opcode, DL.getIROrder(),
5541                                             DL.getDebugLoc(), VTList, Ops[0],
5542                                             Ops[1], Ops[2]);
5543     } else {
5544       N = new (NodeAllocator) SDNode(Opcode, DL.getIROrder(), DL.getDebugLoc(),
5545                                      VTList, Ops);
5546     }
5547     CSEMap.InsertNode(N, IP);
5548   } else {
5549     if (NumOps == 1) {
5550       N = new (NodeAllocator) UnarySDNode(Opcode, DL.getIROrder(),
5551                                           DL.getDebugLoc(), VTList, Ops[0]);
5552     } else if (NumOps == 2) {
5553       N = new (NodeAllocator) BinarySDNode(Opcode, DL.getIROrder(),
5554                                            DL.getDebugLoc(), VTList, Ops[0],
5555                                            Ops[1]);
5556     } else if (NumOps == 3) {
5557       N = new (NodeAllocator) TernarySDNode(Opcode, DL.getIROrder(),
5558                                             DL.getDebugLoc(), VTList, Ops[0],
5559                                             Ops[1], Ops[2]);
5560     } else {
5561       N = new (NodeAllocator) SDNode(Opcode, DL.getIROrder(), DL.getDebugLoc(),
5562                                      VTList, Ops);
5563     }
5564   }
5565   InsertNode(N);
5566   return SDValue(N, 0);
5567 }
5568
5569 SDValue SelectionDAG::getNode(unsigned Opcode, SDLoc DL, SDVTList VTList) {
5570   return getNode(Opcode, DL, VTList, None);
5571 }
5572
5573 SDValue SelectionDAG::getNode(unsigned Opcode, SDLoc DL, SDVTList VTList,
5574                               SDValue N1) {
5575   SDValue Ops[] = { N1 };
5576   return getNode(Opcode, DL, VTList, Ops);
5577 }
5578
5579 SDValue SelectionDAG::getNode(unsigned Opcode, SDLoc DL, SDVTList VTList,
5580                               SDValue N1, SDValue N2) {
5581   SDValue Ops[] = { N1, N2 };
5582   return getNode(Opcode, DL, VTList, Ops);
5583 }
5584
5585 SDValue SelectionDAG::getNode(unsigned Opcode, SDLoc DL, SDVTList VTList,
5586                               SDValue N1, SDValue N2, SDValue N3) {
5587   SDValue Ops[] = { N1, N2, N3 };
5588   return getNode(Opcode, DL, VTList, Ops);
5589 }
5590
5591 SDValue SelectionDAG::getNode(unsigned Opcode, SDLoc DL, SDVTList VTList,
5592                               SDValue N1, SDValue N2, SDValue N3,
5593                               SDValue N4) {
5594   SDValue Ops[] = { N1, N2, N3, N4 };
5595   return getNode(Opcode, DL, VTList, Ops);
5596 }
5597
5598 SDValue SelectionDAG::getNode(unsigned Opcode, SDLoc DL, SDVTList VTList,
5599                               SDValue N1, SDValue N2, SDValue N3,
5600                               SDValue N4, SDValue N5) {
5601   SDValue Ops[] = { N1, N2, N3, N4, N5 };
5602   return getNode(Opcode, DL, VTList, Ops);
5603 }
5604
5605 SDVTList SelectionDAG::getVTList(EVT VT) {
5606   return makeVTList(SDNode::getValueTypeList(VT), 1);
5607 }
5608
5609 SDVTList SelectionDAG::getVTList(EVT VT1, EVT VT2) {
5610   FoldingSetNodeID ID;
5611   ID.AddInteger(2U);
5612   ID.AddInteger(VT1.getRawBits());
5613   ID.AddInteger(VT2.getRawBits());
5614
5615   void *IP = nullptr;
5616   SDVTListNode *Result = VTListMap.FindNodeOrInsertPos(ID, IP);
5617   if (!Result) {
5618     EVT *Array = Allocator.Allocate<EVT>(2);
5619     Array[0] = VT1;
5620     Array[1] = VT2;
5621     Result = new (Allocator) SDVTListNode(ID.Intern(Allocator), Array, 2);
5622     VTListMap.InsertNode(Result, IP);
5623   }
5624   return Result->getSDVTList();
5625 }
5626
5627 SDVTList SelectionDAG::getVTList(EVT VT1, EVT VT2, EVT VT3) {
5628   FoldingSetNodeID ID;
5629   ID.AddInteger(3U);
5630   ID.AddInteger(VT1.getRawBits());
5631   ID.AddInteger(VT2.getRawBits());
5632   ID.AddInteger(VT3.getRawBits());
5633
5634   void *IP = nullptr;
5635   SDVTListNode *Result = VTListMap.FindNodeOrInsertPos(ID, IP);
5636   if (!Result) {
5637     EVT *Array = Allocator.Allocate<EVT>(3);
5638     Array[0] = VT1;
5639     Array[1] = VT2;
5640     Array[2] = VT3;
5641     Result = new (Allocator) SDVTListNode(ID.Intern(Allocator), Array, 3);
5642     VTListMap.InsertNode(Result, IP);
5643   }
5644   return Result->getSDVTList();
5645 }
5646
5647 SDVTList SelectionDAG::getVTList(EVT VT1, EVT VT2, EVT VT3, EVT VT4) {
5648   FoldingSetNodeID ID;
5649   ID.AddInteger(4U);
5650   ID.AddInteger(VT1.getRawBits());
5651   ID.AddInteger(VT2.getRawBits());
5652   ID.AddInteger(VT3.getRawBits());
5653   ID.AddInteger(VT4.getRawBits());
5654
5655   void *IP = nullptr;
5656   SDVTListNode *Result = VTListMap.FindNodeOrInsertPos(ID, IP);
5657   if (!Result) {
5658     EVT *Array = Allocator.Allocate<EVT>(4);
5659     Array[0] = VT1;
5660     Array[1] = VT2;
5661     Array[2] = VT3;
5662     Array[3] = VT4;
5663     Result = new (Allocator) SDVTListNode(ID.Intern(Allocator), Array, 4);
5664     VTListMap.InsertNode(Result, IP);
5665   }
5666   return Result->getSDVTList();
5667 }
5668
5669 SDVTList SelectionDAG::getVTList(ArrayRef<EVT> VTs) {
5670   unsigned NumVTs = VTs.size();
5671   FoldingSetNodeID ID;
5672   ID.AddInteger(NumVTs);
5673   for (unsigned index = 0; index < NumVTs; index++) {
5674     ID.AddInteger(VTs[index].getRawBits());
5675   }
5676
5677   void *IP = nullptr;
5678   SDVTListNode *Result = VTListMap.FindNodeOrInsertPos(ID, IP);
5679   if (!Result) {
5680     EVT *Array = Allocator.Allocate<EVT>(NumVTs);
5681     std::copy(VTs.begin(), VTs.end(), Array);
5682     Result = new (Allocator) SDVTListNode(ID.Intern(Allocator), Array, NumVTs);
5683     VTListMap.InsertNode(Result, IP);
5684   }
5685   return Result->getSDVTList();
5686 }
5687
5688
5689 /// UpdateNodeOperands - *Mutate* the specified node in-place to have the
5690 /// specified operands.  If the resultant node already exists in the DAG,
5691 /// this does not modify the specified node, instead it returns the node that
5692 /// already exists.  If the resultant node does not exist in the DAG, the
5693 /// input node is returned.  As a degenerate case, if you specify the same
5694 /// input operands as the node already has, the input node is returned.
5695 SDNode *SelectionDAG::UpdateNodeOperands(SDNode *N, SDValue Op) {
5696   assert(N->getNumOperands() == 1 && "Update with wrong number of operands");
5697
5698   // Check to see if there is no change.
5699   if (Op == N->getOperand(0)) return N;
5700
5701   // See if the modified node already exists.
5702   void *InsertPos = nullptr;
5703   if (SDNode *Existing = FindModifiedNodeSlot(N, Op, InsertPos))
5704     return Existing;
5705
5706   // Nope it doesn't.  Remove the node from its current place in the maps.
5707   if (InsertPos)
5708     if (!RemoveNodeFromCSEMaps(N))
5709       InsertPos = nullptr;
5710
5711   // Now we update the operands.
5712   N->OperandList[0].set(Op);
5713
5714   // If this gets put into a CSE map, add it.
5715   if (InsertPos) CSEMap.InsertNode(N, InsertPos);
5716   return N;
5717 }
5718
5719 SDNode *SelectionDAG::UpdateNodeOperands(SDNode *N, SDValue Op1, SDValue Op2) {
5720   assert(N->getNumOperands() == 2 && "Update with wrong number of operands");
5721
5722   // Check to see if there is no change.
5723   if (Op1 == N->getOperand(0) && Op2 == N->getOperand(1))
5724     return N;   // No operands changed, just return the input node.
5725
5726   // See if the modified node already exists.
5727   void *InsertPos = nullptr;
5728   if (SDNode *Existing = FindModifiedNodeSlot(N, Op1, Op2, InsertPos))
5729     return Existing;
5730
5731   // Nope it doesn't.  Remove the node from its current place in the maps.
5732   if (InsertPos)
5733     if (!RemoveNodeFromCSEMaps(N))
5734       InsertPos = nullptr;
5735
5736   // Now we update the operands.
5737   if (N->OperandList[0] != Op1)
5738     N->OperandList[0].set(Op1);
5739   if (N->OperandList[1] != Op2)
5740     N->OperandList[1].set(Op2);
5741
5742   // If this gets put into a CSE map, add it.
5743   if (InsertPos) CSEMap.InsertNode(N, InsertPos);
5744   return N;
5745 }
5746
5747 SDNode *SelectionDAG::
5748 UpdateNodeOperands(SDNode *N, SDValue Op1, SDValue Op2, SDValue Op3) {
5749   SDValue Ops[] = { Op1, Op2, Op3 };
5750   return UpdateNodeOperands(N, Ops);
5751 }
5752
5753 SDNode *SelectionDAG::
5754 UpdateNodeOperands(SDNode *N, SDValue Op1, SDValue Op2,
5755                    SDValue Op3, SDValue Op4) {
5756   SDValue Ops[] = { Op1, Op2, Op3, Op4 };
5757   return UpdateNodeOperands(N, Ops);
5758 }
5759
5760 SDNode *SelectionDAG::
5761 UpdateNodeOperands(SDNode *N, SDValue Op1, SDValue Op2,
5762                    SDValue Op3, SDValue Op4, SDValue Op5) {
5763   SDValue Ops[] = { Op1, Op2, Op3, Op4, Op5 };
5764   return UpdateNodeOperands(N, Ops);
5765 }
5766
5767 SDNode *SelectionDAG::
5768 UpdateNodeOperands(SDNode *N, ArrayRef<SDValue> Ops) {
5769   unsigned NumOps = Ops.size();
5770   assert(N->getNumOperands() == NumOps &&
5771          "Update with wrong number of operands");
5772
5773   // If no operands changed just return the input node.
5774   if (std::equal(Ops.begin(), Ops.end(), N->op_begin()))
5775     return N;
5776
5777   // See if the modified node already exists.
5778   void *InsertPos = nullptr;
5779   if (SDNode *Existing = FindModifiedNodeSlot(N, Ops, InsertPos))
5780     return Existing;
5781
5782   // Nope it doesn't.  Remove the node from its current place in the maps.
5783   if (InsertPos)
5784     if (!RemoveNodeFromCSEMaps(N))
5785       InsertPos = nullptr;
5786
5787   // Now we update the operands.
5788   for (unsigned i = 0; i != NumOps; ++i)
5789     if (N->OperandList[i] != Ops[i])
5790       N->OperandList[i].set(Ops[i]);
5791
5792   // If this gets put into a CSE map, add it.
5793   if (InsertPos) CSEMap.InsertNode(N, InsertPos);
5794   return N;
5795 }
5796
5797 /// DropOperands - Release the operands and set this node to have
5798 /// zero operands.
5799 void SDNode::DropOperands() {
5800   // Unlike the code in MorphNodeTo that does this, we don't need to
5801   // watch for dead nodes here.
5802   for (op_iterator I = op_begin(), E = op_end(); I != E; ) {
5803     SDUse &Use = *I++;
5804     Use.set(SDValue());
5805   }
5806 }
5807
5808 /// SelectNodeTo - These are wrappers around MorphNodeTo that accept a
5809 /// machine opcode.
5810 ///
5811 SDNode *SelectionDAG::SelectNodeTo(SDNode *N, unsigned MachineOpc,
5812                                    EVT VT) {
5813   SDVTList VTs = getVTList(VT);
5814   return SelectNodeTo(N, MachineOpc, VTs, None);
5815 }
5816
5817 SDNode *SelectionDAG::SelectNodeTo(SDNode *N, unsigned MachineOpc,
5818                                    EVT VT, SDValue Op1) {
5819   SDVTList VTs = getVTList(VT);
5820   SDValue Ops[] = { Op1 };
5821   return SelectNodeTo(N, MachineOpc, VTs, Ops);
5822 }
5823
5824 SDNode *SelectionDAG::SelectNodeTo(SDNode *N, unsigned MachineOpc,
5825                                    EVT VT, SDValue Op1,
5826                                    SDValue Op2) {
5827   SDVTList VTs = getVTList(VT);
5828   SDValue Ops[] = { Op1, Op2 };
5829   return SelectNodeTo(N, MachineOpc, VTs, Ops);
5830 }
5831
5832 SDNode *SelectionDAG::SelectNodeTo(SDNode *N, unsigned MachineOpc,
5833                                    EVT VT, SDValue Op1,
5834                                    SDValue Op2, SDValue Op3) {
5835   SDVTList VTs = getVTList(VT);
5836   SDValue Ops[] = { Op1, Op2, Op3 };
5837   return SelectNodeTo(N, MachineOpc, VTs, Ops);
5838 }
5839
5840 SDNode *SelectionDAG::SelectNodeTo(SDNode *N, unsigned MachineOpc,
5841                                    EVT VT, ArrayRef<SDValue> Ops) {
5842   SDVTList VTs = getVTList(VT);
5843   return SelectNodeTo(N, MachineOpc, VTs, Ops);
5844 }
5845
5846 SDNode *SelectionDAG::SelectNodeTo(SDNode *N, unsigned MachineOpc,
5847                                    EVT VT1, EVT VT2, ArrayRef<SDValue> Ops) {
5848   SDVTList VTs = getVTList(VT1, VT2);
5849   return SelectNodeTo(N, MachineOpc, VTs, Ops);
5850 }
5851
5852 SDNode *SelectionDAG::SelectNodeTo(SDNode *N, unsigned MachineOpc,
5853                                    EVT VT1, EVT VT2) {
5854   SDVTList VTs = getVTList(VT1, VT2);
5855   return SelectNodeTo(N, MachineOpc, VTs, None);
5856 }
5857
5858 SDNode *SelectionDAG::SelectNodeTo(SDNode *N, unsigned MachineOpc,
5859                                    EVT VT1, EVT VT2, EVT VT3,
5860                                    ArrayRef<SDValue> Ops) {
5861   SDVTList VTs = getVTList(VT1, VT2, VT3);
5862   return SelectNodeTo(N, MachineOpc, VTs, Ops);
5863 }
5864
5865 SDNode *SelectionDAG::SelectNodeTo(SDNode *N, unsigned MachineOpc,
5866                                    EVT VT1, EVT VT2, EVT VT3, EVT VT4,
5867                                    ArrayRef<SDValue> Ops) {
5868   SDVTList VTs = getVTList(VT1, VT2, VT3, VT4);
5869   return SelectNodeTo(N, MachineOpc, VTs, Ops);
5870 }
5871
5872 SDNode *SelectionDAG::SelectNodeTo(SDNode *N, unsigned MachineOpc,
5873                                    EVT VT1, EVT VT2,
5874                                    SDValue Op1) {
5875   SDVTList VTs = getVTList(VT1, VT2);
5876   SDValue Ops[] = { Op1 };
5877   return SelectNodeTo(N, MachineOpc, VTs, Ops);
5878 }
5879
5880 SDNode *SelectionDAG::SelectNodeTo(SDNode *N, unsigned MachineOpc,
5881                                    EVT VT1, EVT VT2,
5882                                    SDValue Op1, SDValue Op2) {
5883   SDVTList VTs = getVTList(VT1, VT2);
5884   SDValue Ops[] = { Op1, Op2 };
5885   return SelectNodeTo(N, MachineOpc, VTs, Ops);
5886 }
5887
5888 SDNode *SelectionDAG::SelectNodeTo(SDNode *N, unsigned MachineOpc,
5889                                    EVT VT1, EVT VT2,
5890                                    SDValue Op1, SDValue Op2,
5891                                    SDValue Op3) {
5892   SDVTList VTs = getVTList(VT1, VT2);
5893   SDValue Ops[] = { Op1, Op2, Op3 };
5894   return SelectNodeTo(N, MachineOpc, VTs, Ops);
5895 }
5896
5897 SDNode *SelectionDAG::SelectNodeTo(SDNode *N, unsigned MachineOpc,
5898                                    EVT VT1, EVT VT2, EVT VT3,
5899                                    SDValue Op1, SDValue Op2,
5900                                    SDValue Op3) {
5901   SDVTList VTs = getVTList(VT1, VT2, VT3);
5902   SDValue Ops[] = { Op1, Op2, Op3 };
5903   return SelectNodeTo(N, MachineOpc, VTs, Ops);
5904 }
5905
5906 SDNode *SelectionDAG::SelectNodeTo(SDNode *N, unsigned MachineOpc,
5907                                    SDVTList VTs,ArrayRef<SDValue> Ops) {
5908   N = MorphNodeTo(N, ~MachineOpc, VTs, Ops);
5909   // Reset the NodeID to -1.
5910   N->setNodeId(-1);
5911   return N;
5912 }
5913
5914 /// UpdadeSDLocOnMergedSDNode - If the opt level is -O0 then it throws away
5915 /// the line number information on the merged node since it is not possible to
5916 /// preserve the information that operation is associated with multiple lines.
5917 /// This will make the debugger working better at -O0, were there is a higher
5918 /// probability having other instructions associated with that line.
5919 ///
5920 /// For IROrder, we keep the smaller of the two
5921 SDNode *SelectionDAG::UpdadeSDLocOnMergedSDNode(SDNode *N, SDLoc OLoc) {
5922   DebugLoc NLoc = N->getDebugLoc();
5923   if (NLoc && OptLevel == CodeGenOpt::None && OLoc.getDebugLoc() != NLoc) {
5924     N->setDebugLoc(DebugLoc());
5925   }
5926   unsigned Order = std::min(N->getIROrder(), OLoc.getIROrder());
5927   N->setIROrder(Order);
5928   return N;
5929 }
5930
5931 /// MorphNodeTo - This *mutates* the specified node to have the specified
5932 /// return type, opcode, and operands.
5933 ///
5934 /// Note that MorphNodeTo returns the resultant node.  If there is already a
5935 /// node of the specified opcode and operands, it returns that node instead of
5936 /// the current one.  Note that the SDLoc need not be the same.
5937 ///
5938 /// Using MorphNodeTo is faster than creating a new node and swapping it in
5939 /// with ReplaceAllUsesWith both because it often avoids allocating a new
5940 /// node, and because it doesn't require CSE recalculation for any of
5941 /// the node's users.
5942 ///
5943 /// However, note that MorphNodeTo recursively deletes dead nodes from the DAG.
5944 /// As a consequence it isn't appropriate to use from within the DAG combiner or
5945 /// the legalizer which maintain worklists that would need to be updated when
5946 /// deleting things.
5947 SDNode *SelectionDAG::MorphNodeTo(SDNode *N, unsigned Opc,
5948                                   SDVTList VTs, ArrayRef<SDValue> Ops) {
5949   unsigned NumOps = Ops.size();
5950   // If an identical node already exists, use it.
5951   void *IP = nullptr;
5952   if (VTs.VTs[VTs.NumVTs-1] != MVT::Glue) {
5953     FoldingSetNodeID ID;
5954     AddNodeIDNode(ID, Opc, VTs, Ops);
5955     if (SDNode *ON = FindNodeOrInsertPos(ID, N->getDebugLoc(), IP))
5956       return UpdadeSDLocOnMergedSDNode(ON, SDLoc(N));
5957   }
5958
5959   if (!RemoveNodeFromCSEMaps(N))
5960     IP = nullptr;
5961
5962   // Start the morphing.
5963   N->NodeType = Opc;
5964   N->ValueList = VTs.VTs;
5965   N->NumValues = VTs.NumVTs;
5966
5967   // Clear the operands list, updating used nodes to remove this from their
5968   // use list.  Keep track of any operands that become dead as a result.
5969   SmallPtrSet<SDNode*, 16> DeadNodeSet;
5970   for (SDNode::op_iterator I = N->op_begin(), E = N->op_end(); I != E; ) {
5971     SDUse &Use = *I++;
5972     SDNode *Used = Use.getNode();
5973     Use.set(SDValue());
5974     if (Used->use_empty())
5975       DeadNodeSet.insert(Used);
5976   }
5977
5978   if (MachineSDNode *MN = dyn_cast<MachineSDNode>(N)) {
5979     // Initialize the memory references information.
5980     MN->setMemRefs(nullptr, nullptr);
5981     // If NumOps is larger than the # of operands we can have in a
5982     // MachineSDNode, reallocate the operand list.
5983     if (NumOps > MN->NumOperands || !MN->OperandsNeedDelete) {
5984       if (MN->OperandsNeedDelete)
5985         delete[] MN->OperandList;
5986       if (NumOps > array_lengthof(MN->LocalOperands))
5987         // We're creating a final node that will live unmorphed for the
5988         // remainder of the current SelectionDAG iteration, so we can allocate
5989         // the operands directly out of a pool with no recycling metadata.
5990         MN->InitOperands(OperandAllocator.Allocate<SDUse>(NumOps),
5991                          Ops.data(), NumOps);
5992       else
5993         MN->InitOperands(MN->LocalOperands, Ops.data(), NumOps);
5994       MN->OperandsNeedDelete = false;
5995     } else
5996       MN->InitOperands(MN->OperandList, Ops.data(), NumOps);
5997   } else {
5998     // If NumOps is larger than the # of operands we currently have, reallocate
5999     // the operand list.
6000     if (NumOps > N->NumOperands) {
6001       if (N->OperandsNeedDelete)
6002         delete[] N->OperandList;
6003       N->InitOperands(new SDUse[NumOps], Ops.data(), NumOps);
6004       N->OperandsNeedDelete = true;
6005     } else
6006       N->InitOperands(N->OperandList, Ops.data(), NumOps);
6007   }
6008
6009   // Delete any nodes that are still dead after adding the uses for the
6010   // new operands.
6011   if (!DeadNodeSet.empty()) {
6012     SmallVector<SDNode *, 16> DeadNodes;
6013     for (SDNode *N : DeadNodeSet)
6014       if (N->use_empty())
6015         DeadNodes.push_back(N);
6016     RemoveDeadNodes(DeadNodes);
6017   }
6018
6019   if (IP)
6020     CSEMap.InsertNode(N, IP);   // Memoize the new node.
6021   return N;
6022 }
6023
6024
6025 /// getMachineNode - These are used for target selectors to create a new node
6026 /// with specified return type(s), MachineInstr opcode, and operands.
6027 ///
6028 /// Note that getMachineNode returns the resultant node.  If there is already a
6029 /// node of the specified opcode and operands, it returns that node instead of
6030 /// the current one.
6031 MachineSDNode *
6032 SelectionDAG::getMachineNode(unsigned Opcode, SDLoc dl, EVT VT) {
6033   SDVTList VTs = getVTList(VT);
6034   return getMachineNode(Opcode, dl, VTs, None);
6035 }
6036
6037 MachineSDNode *
6038 SelectionDAG::getMachineNode(unsigned Opcode, SDLoc dl, EVT VT, SDValue Op1) {
6039   SDVTList VTs = getVTList(VT);
6040   SDValue Ops[] = { Op1 };
6041   return getMachineNode(Opcode, dl, VTs, Ops);
6042 }
6043
6044 MachineSDNode *
6045 SelectionDAG::getMachineNode(unsigned Opcode, SDLoc dl, EVT VT,
6046                              SDValue Op1, SDValue Op2) {
6047   SDVTList VTs = getVTList(VT);
6048   SDValue Ops[] = { Op1, Op2 };
6049   return getMachineNode(Opcode, dl, VTs, Ops);
6050 }
6051
6052 MachineSDNode *
6053 SelectionDAG::getMachineNode(unsigned Opcode, SDLoc dl, EVT VT,
6054                              SDValue Op1, SDValue Op2, SDValue Op3) {
6055   SDVTList VTs = getVTList(VT);
6056   SDValue Ops[] = { Op1, Op2, Op3 };
6057   return getMachineNode(Opcode, dl, VTs, Ops);
6058 }
6059
6060 MachineSDNode *
6061 SelectionDAG::getMachineNode(unsigned Opcode, SDLoc dl, EVT VT,
6062                              ArrayRef<SDValue> Ops) {
6063   SDVTList VTs = getVTList(VT);
6064   return getMachineNode(Opcode, dl, VTs, Ops);
6065 }
6066
6067 MachineSDNode *
6068 SelectionDAG::getMachineNode(unsigned Opcode, SDLoc dl, EVT VT1, EVT VT2) {
6069   SDVTList VTs = getVTList(VT1, VT2);
6070   return getMachineNode(Opcode, dl, VTs, None);
6071 }
6072
6073 MachineSDNode *
6074 SelectionDAG::getMachineNode(unsigned Opcode, SDLoc dl,
6075                              EVT VT1, EVT VT2, SDValue Op1) {
6076   SDVTList VTs = getVTList(VT1, VT2);
6077   SDValue Ops[] = { Op1 };
6078   return getMachineNode(Opcode, dl, VTs, Ops);
6079 }
6080
6081 MachineSDNode *
6082 SelectionDAG::getMachineNode(unsigned Opcode, SDLoc dl,
6083                              EVT VT1, EVT VT2, SDValue Op1, SDValue Op2) {
6084   SDVTList VTs = getVTList(VT1, VT2);
6085   SDValue Ops[] = { Op1, Op2 };
6086   return getMachineNode(Opcode, dl, VTs, Ops);
6087 }
6088
6089 MachineSDNode *
6090 SelectionDAG::getMachineNode(unsigned Opcode, SDLoc dl,
6091                              EVT VT1, EVT VT2, SDValue Op1,
6092                              SDValue Op2, SDValue Op3) {
6093   SDVTList VTs = getVTList(VT1, VT2);
6094   SDValue Ops[] = { Op1, Op2, Op3 };
6095   return getMachineNode(Opcode, dl, VTs, Ops);
6096 }
6097
6098 MachineSDNode *
6099 SelectionDAG::getMachineNode(unsigned Opcode, SDLoc dl,
6100                              EVT VT1, EVT VT2,
6101                              ArrayRef<SDValue> Ops) {
6102   SDVTList VTs = getVTList(VT1, VT2);
6103   return getMachineNode(Opcode, dl, VTs, Ops);
6104 }
6105
6106 MachineSDNode *
6107 SelectionDAG::getMachineNode(unsigned Opcode, SDLoc dl,
6108                              EVT VT1, EVT VT2, EVT VT3,
6109                              SDValue Op1, SDValue Op2) {
6110   SDVTList VTs = getVTList(VT1, VT2, VT3);
6111   SDValue Ops[] = { Op1, Op2 };
6112   return getMachineNode(Opcode, dl, VTs, Ops);
6113 }
6114
6115 MachineSDNode *
6116 SelectionDAG::getMachineNode(unsigned Opcode, SDLoc dl,
6117                              EVT VT1, EVT VT2, EVT VT3,
6118                              SDValue Op1, SDValue Op2, SDValue Op3) {
6119   SDVTList VTs = getVTList(VT1, VT2, VT3);
6120   SDValue Ops[] = { Op1, Op2, Op3 };
6121   return getMachineNode(Opcode, dl, VTs, Ops);
6122 }
6123
6124 MachineSDNode *
6125 SelectionDAG::getMachineNode(unsigned Opcode, SDLoc dl,
6126                              EVT VT1, EVT VT2, EVT VT3,
6127                              ArrayRef<SDValue> Ops) {
6128   SDVTList VTs = getVTList(VT1, VT2, VT3);
6129   return getMachineNode(Opcode, dl, VTs, Ops);
6130 }
6131
6132 MachineSDNode *
6133 SelectionDAG::getMachineNode(unsigned Opcode, SDLoc dl, EVT VT1,
6134                              EVT VT2, EVT VT3, EVT VT4,
6135                              ArrayRef<SDValue> Ops) {
6136   SDVTList VTs = getVTList(VT1, VT2, VT3, VT4);
6137   return getMachineNode(Opcode, dl, VTs, Ops);
6138 }
6139
6140 MachineSDNode *
6141 SelectionDAG::getMachineNode(unsigned Opcode, SDLoc dl,
6142                              ArrayRef<EVT> ResultTys,
6143                              ArrayRef<SDValue> Ops) {
6144   SDVTList VTs = getVTList(ResultTys);
6145   return getMachineNode(Opcode, dl, VTs, Ops);
6146 }
6147
6148 MachineSDNode *
6149 SelectionDAG::getMachineNode(unsigned Opcode, SDLoc DL, SDVTList VTs,
6150                              ArrayRef<SDValue> OpsArray) {
6151   bool DoCSE = VTs.VTs[VTs.NumVTs-1] != MVT::Glue;
6152   MachineSDNode *N;
6153   void *IP = nullptr;
6154   const SDValue *Ops = OpsArray.data();
6155   unsigned NumOps = OpsArray.size();
6156
6157   if (DoCSE) {
6158     FoldingSetNodeID ID;
6159     AddNodeIDNode(ID, ~Opcode, VTs, OpsArray);
6160     IP = nullptr;
6161     if (SDNode *E = FindNodeOrInsertPos(ID, DL.getDebugLoc(), IP)) {
6162       return cast<MachineSDNode>(UpdadeSDLocOnMergedSDNode(E, DL));
6163     }
6164   }
6165
6166   // Allocate a new MachineSDNode.
6167   N = new (NodeAllocator) MachineSDNode(~Opcode, DL.getIROrder(),
6168                                         DL.getDebugLoc(), VTs);
6169
6170   // Initialize the operands list.
6171   if (NumOps > array_lengthof(N->LocalOperands))
6172     // We're creating a final node that will live unmorphed for the
6173     // remainder of the current SelectionDAG iteration, so we can allocate
6174     // the operands directly out of a pool with no recycling metadata.
6175     N->InitOperands(OperandAllocator.Allocate<SDUse>(NumOps),
6176                     Ops, NumOps);
6177   else
6178     N->InitOperands(N->LocalOperands, Ops, NumOps);
6179   N->OperandsNeedDelete = false;
6180
6181   if (DoCSE)
6182     CSEMap.InsertNode(N, IP);
6183
6184   InsertNode(N);
6185   return N;
6186 }
6187
6188 /// getTargetExtractSubreg - A convenience function for creating
6189 /// TargetOpcode::EXTRACT_SUBREG nodes.
6190 SDValue
6191 SelectionDAG::getTargetExtractSubreg(int SRIdx, SDLoc DL, EVT VT,
6192                                      SDValue Operand) {
6193   SDValue SRIdxVal = getTargetConstant(SRIdx, DL, MVT::i32);
6194   SDNode *Subreg = getMachineNode(TargetOpcode::EXTRACT_SUBREG, DL,
6195                                   VT, Operand, SRIdxVal);
6196   return SDValue(Subreg, 0);
6197 }
6198
6199 /// getTargetInsertSubreg - A convenience function for creating
6200 /// TargetOpcode::INSERT_SUBREG nodes.
6201 SDValue
6202 SelectionDAG::getTargetInsertSubreg(int SRIdx, SDLoc DL, EVT VT,
6203                                     SDValue Operand, SDValue Subreg) {
6204   SDValue SRIdxVal = getTargetConstant(SRIdx, DL, MVT::i32);
6205   SDNode *Result = getMachineNode(TargetOpcode::INSERT_SUBREG, DL,
6206                                   VT, Operand, Subreg, SRIdxVal);
6207   return SDValue(Result, 0);
6208 }
6209
6210 /// getNodeIfExists - Get the specified node if it's already available, or
6211 /// else return NULL.
6212 SDNode *SelectionDAG::getNodeIfExists(unsigned Opcode, SDVTList VTList,
6213                                       ArrayRef<SDValue> Ops,
6214                                       const SDNodeFlags *Flags) {
6215   if (VTList.VTs[VTList.NumVTs - 1] != MVT::Glue) {
6216     FoldingSetNodeID ID;
6217     AddNodeIDNode(ID, Opcode, VTList, Ops);
6218     AddNodeIDFlags(ID, Opcode, Flags);
6219     void *IP = nullptr;
6220     if (SDNode *E = FindNodeOrInsertPos(ID, DebugLoc(), IP))
6221       return E;
6222   }
6223   return nullptr;
6224 }
6225
6226 /// getDbgValue - Creates a SDDbgValue node.
6227 ///
6228 /// SDNode
6229 SDDbgValue *SelectionDAG::getDbgValue(MDNode *Var, MDNode *Expr, SDNode *N,
6230                                       unsigned R, bool IsIndirect, uint64_t Off,
6231                                       DebugLoc DL, unsigned O) {
6232   assert(cast<DILocalVariable>(Var)->isValidLocationForIntrinsic(DL) &&
6233          "Expected inlined-at fields to agree");
6234   return new (DbgInfo->getAlloc())
6235       SDDbgValue(Var, Expr, N, R, IsIndirect, Off, DL, O);
6236 }
6237
6238 /// Constant
6239 SDDbgValue *SelectionDAG::getConstantDbgValue(MDNode *Var, MDNode *Expr,
6240                                               const Value *C, uint64_t Off,
6241                                               DebugLoc DL, unsigned O) {
6242   assert(cast<DILocalVariable>(Var)->isValidLocationForIntrinsic(DL) &&
6243          "Expected inlined-at fields to agree");
6244   return new (DbgInfo->getAlloc()) SDDbgValue(Var, Expr, C, Off, DL, O);
6245 }
6246
6247 /// FrameIndex
6248 SDDbgValue *SelectionDAG::getFrameIndexDbgValue(MDNode *Var, MDNode *Expr,
6249                                                 unsigned FI, uint64_t Off,
6250                                                 DebugLoc DL, unsigned O) {
6251   assert(cast<DILocalVariable>(Var)->isValidLocationForIntrinsic(DL) &&
6252          "Expected inlined-at fields to agree");
6253   return new (DbgInfo->getAlloc()) SDDbgValue(Var, Expr, FI, Off, DL, O);
6254 }
6255
6256 namespace {
6257
6258 /// RAUWUpdateListener - Helper for ReplaceAllUsesWith - When the node
6259 /// pointed to by a use iterator is deleted, increment the use iterator
6260 /// so that it doesn't dangle.
6261 ///
6262 class RAUWUpdateListener : public SelectionDAG::DAGUpdateListener {
6263   SDNode::use_iterator &UI;
6264   SDNode::use_iterator &UE;
6265
6266   void NodeDeleted(SDNode *N, SDNode *E) override {
6267     // Increment the iterator as needed.
6268     while (UI != UE && N == *UI)
6269       ++UI;
6270   }
6271
6272 public:
6273   RAUWUpdateListener(SelectionDAG &d,
6274                      SDNode::use_iterator &ui,
6275                      SDNode::use_iterator &ue)
6276     : SelectionDAG::DAGUpdateListener(d), UI(ui), UE(ue) {}
6277 };
6278
6279 }
6280
6281 /// ReplaceAllUsesWith - Modify anything using 'From' to use 'To' instead.
6282 /// This can cause recursive merging of nodes in the DAG.
6283 ///
6284 /// This version assumes From has a single result value.
6285 ///
6286 void SelectionDAG::ReplaceAllUsesWith(SDValue FromN, SDValue To) {
6287   SDNode *From = FromN.getNode();
6288   assert(From->getNumValues() == 1 && FromN.getResNo() == 0 &&
6289          "Cannot replace with this method!");
6290   assert(From != To.getNode() && "Cannot replace uses of with self");
6291
6292   // Iterate over all the existing uses of From. New uses will be added
6293   // to the beginning of the use list, which we avoid visiting.
6294   // This specifically avoids visiting uses of From that arise while the
6295   // replacement is happening, because any such uses would be the result
6296   // of CSE: If an existing node looks like From after one of its operands
6297   // is replaced by To, we don't want to replace of all its users with To
6298   // too. See PR3018 for more info.
6299   SDNode::use_iterator UI = From->use_begin(), UE = From->use_end();
6300   RAUWUpdateListener Listener(*this, UI, UE);
6301   while (UI != UE) {
6302     SDNode *User = *UI;
6303
6304     // This node is about to morph, remove its old self from the CSE maps.
6305     RemoveNodeFromCSEMaps(User);
6306
6307     // A user can appear in a use list multiple times, and when this
6308     // happens the uses are usually next to each other in the list.
6309     // To help reduce the number of CSE recomputations, process all
6310     // the uses of this user that we can find this way.
6311     do {
6312       SDUse &Use = UI.getUse();
6313       ++UI;
6314       Use.set(To);
6315     } while (UI != UE && *UI == User);
6316
6317     // Now that we have modified User, add it back to the CSE maps.  If it
6318     // already exists there, recursively merge the results together.
6319     AddModifiedNodeToCSEMaps(User);
6320   }
6321
6322   // If we just RAUW'd the root, take note.
6323   if (FromN == getRoot())
6324     setRoot(To);
6325 }
6326
6327 /// ReplaceAllUsesWith - Modify anything using 'From' to use 'To' instead.
6328 /// This can cause recursive merging of nodes in the DAG.
6329 ///
6330 /// This version assumes that for each value of From, there is a
6331 /// corresponding value in To in the same position with the same type.
6332 ///
6333 void SelectionDAG::ReplaceAllUsesWith(SDNode *From, SDNode *To) {
6334 #ifndef NDEBUG
6335   for (unsigned i = 0, e = From->getNumValues(); i != e; ++i)
6336     assert((!From->hasAnyUseOfValue(i) ||
6337             From->getValueType(i) == To->getValueType(i)) &&
6338            "Cannot use this version of ReplaceAllUsesWith!");
6339 #endif
6340
6341   // Handle the trivial case.
6342   if (From == To)
6343     return;
6344
6345   // Iterate over just the existing users of From. See the comments in
6346   // the ReplaceAllUsesWith above.
6347   SDNode::use_iterator UI = From->use_begin(), UE = From->use_end();
6348   RAUWUpdateListener Listener(*this, UI, UE);
6349   while (UI != UE) {
6350     SDNode *User = *UI;
6351
6352     // This node is about to morph, remove its old self from the CSE maps.
6353     RemoveNodeFromCSEMaps(User);
6354
6355     // A user can appear in a use list multiple times, and when this
6356     // happens the uses are usually next to each other in the list.
6357     // To help reduce the number of CSE recomputations, process all
6358     // the uses of this user that we can find this way.
6359     do {
6360       SDUse &Use = UI.getUse();
6361       ++UI;
6362       Use.setNode(To);
6363     } while (UI != UE && *UI == User);
6364
6365     // Now that we have modified User, add it back to the CSE maps.  If it
6366     // already exists there, recursively merge the results together.
6367     AddModifiedNodeToCSEMaps(User);
6368   }
6369
6370   // If we just RAUW'd the root, take note.
6371   if (From == getRoot().getNode())
6372     setRoot(SDValue(To, getRoot().getResNo()));
6373 }
6374
6375 /// ReplaceAllUsesWith - Modify anything using 'From' to use 'To' instead.
6376 /// This can cause recursive merging of nodes in the DAG.
6377 ///
6378 /// This version can replace From with any result values.  To must match the
6379 /// number and types of values returned by From.
6380 void SelectionDAG::ReplaceAllUsesWith(SDNode *From, const SDValue *To) {
6381   if (From->getNumValues() == 1)  // Handle the simple case efficiently.
6382     return ReplaceAllUsesWith(SDValue(From, 0), To[0]);
6383
6384   // Iterate over just the existing users of From. See the comments in
6385   // the ReplaceAllUsesWith above.
6386   SDNode::use_iterator UI = From->use_begin(), UE = From->use_end();
6387   RAUWUpdateListener Listener(*this, UI, UE);
6388   while (UI != UE) {
6389     SDNode *User = *UI;
6390
6391     // This node is about to morph, remove its old self from the CSE maps.
6392     RemoveNodeFromCSEMaps(User);
6393
6394     // A user can appear in a use list multiple times, and when this
6395     // happens the uses are usually next to each other in the list.
6396     // To help reduce the number of CSE recomputations, process all
6397     // the uses of this user that we can find this way.
6398     do {
6399       SDUse &Use = UI.getUse();
6400       const SDValue &ToOp = To[Use.getResNo()];
6401       ++UI;
6402       Use.set(ToOp);
6403     } while (UI != UE && *UI == User);
6404
6405     // Now that we have modified User, add it back to the CSE maps.  If it
6406     // already exists there, recursively merge the results together.
6407     AddModifiedNodeToCSEMaps(User);
6408   }
6409
6410   // If we just RAUW'd the root, take note.
6411   if (From == getRoot().getNode())
6412     setRoot(SDValue(To[getRoot().getResNo()]));
6413 }
6414
6415 /// ReplaceAllUsesOfValueWith - Replace any uses of From with To, leaving
6416 /// uses of other values produced by From.getNode() alone.  The Deleted
6417 /// vector is handled the same way as for ReplaceAllUsesWith.
6418 void SelectionDAG::ReplaceAllUsesOfValueWith(SDValue From, SDValue To){
6419   // Handle the really simple, really trivial case efficiently.
6420   if (From == To) return;
6421
6422   // Handle the simple, trivial, case efficiently.
6423   if (From.getNode()->getNumValues() == 1) {
6424     ReplaceAllUsesWith(From, To);
6425     return;
6426   }
6427
6428   // Iterate over just the existing users of From. See the comments in
6429   // the ReplaceAllUsesWith above.
6430   SDNode::use_iterator UI = From.getNode()->use_begin(),
6431                        UE = From.getNode()->use_end();
6432   RAUWUpdateListener Listener(*this, UI, UE);
6433   while (UI != UE) {
6434     SDNode *User = *UI;
6435     bool UserRemovedFromCSEMaps = false;
6436
6437     // A user can appear in a use list multiple times, and when this
6438     // happens the uses are usually next to each other in the list.
6439     // To help reduce the number of CSE recomputations, process all
6440     // the uses of this user that we can find this way.
6441     do {
6442       SDUse &Use = UI.getUse();
6443
6444       // Skip uses of different values from the same node.
6445       if (Use.getResNo() != From.getResNo()) {
6446         ++UI;
6447         continue;
6448       }
6449
6450       // If this node hasn't been modified yet, it's still in the CSE maps,
6451       // so remove its old self from the CSE maps.
6452       if (!UserRemovedFromCSEMaps) {
6453         RemoveNodeFromCSEMaps(User);
6454         UserRemovedFromCSEMaps = true;
6455       }
6456
6457       ++UI;
6458       Use.set(To);
6459     } while (UI != UE && *UI == User);
6460
6461     // We are iterating over all uses of the From node, so if a use
6462     // doesn't use the specific value, no changes are made.
6463     if (!UserRemovedFromCSEMaps)
6464       continue;
6465
6466     // Now that we have modified User, add it back to the CSE maps.  If it
6467     // already exists there, recursively merge the results together.
6468     AddModifiedNodeToCSEMaps(User);
6469   }
6470
6471   // If we just RAUW'd the root, take note.
6472   if (From == getRoot())
6473     setRoot(To);
6474 }
6475
6476 namespace {
6477   /// UseMemo - This class is used by SelectionDAG::ReplaceAllUsesOfValuesWith
6478   /// to record information about a use.
6479   struct UseMemo {
6480     SDNode *User;
6481     unsigned Index;
6482     SDUse *Use;
6483   };
6484
6485   /// operator< - Sort Memos by User.
6486   bool operator<(const UseMemo &L, const UseMemo &R) {
6487     return (intptr_t)L.User < (intptr_t)R.User;
6488   }
6489 }
6490
6491 /// ReplaceAllUsesOfValuesWith - Replace any uses of From with To, leaving
6492 /// uses of other values produced by From.getNode() alone.  The same value
6493 /// may appear in both the From and To list.  The Deleted vector is
6494 /// handled the same way as for ReplaceAllUsesWith.
6495 void SelectionDAG::ReplaceAllUsesOfValuesWith(const SDValue *From,
6496                                               const SDValue *To,
6497                                               unsigned Num){
6498   // Handle the simple, trivial case efficiently.
6499   if (Num == 1)
6500     return ReplaceAllUsesOfValueWith(*From, *To);
6501
6502   // Read up all the uses and make records of them. This helps
6503   // processing new uses that are introduced during the
6504   // replacement process.
6505   SmallVector<UseMemo, 4> Uses;
6506   for (unsigned i = 0; i != Num; ++i) {
6507     unsigned FromResNo = From[i].getResNo();
6508     SDNode *FromNode = From[i].getNode();
6509     for (SDNode::use_iterator UI = FromNode->use_begin(),
6510          E = FromNode->use_end(); UI != E; ++UI) {
6511       SDUse &Use = UI.getUse();
6512       if (Use.getResNo() == FromResNo) {
6513         UseMemo Memo = { *UI, i, &Use };
6514         Uses.push_back(Memo);
6515       }
6516     }
6517   }
6518
6519   // Sort the uses, so that all the uses from a given User are together.
6520   std::sort(Uses.begin(), Uses.end());
6521
6522   for (unsigned UseIndex = 0, UseIndexEnd = Uses.size();
6523        UseIndex != UseIndexEnd; ) {
6524     // We know that this user uses some value of From.  If it is the right
6525     // value, update it.
6526     SDNode *User = Uses[UseIndex].User;
6527
6528     // This node is about to morph, remove its old self from the CSE maps.
6529     RemoveNodeFromCSEMaps(User);
6530
6531     // The Uses array is sorted, so all the uses for a given User
6532     // are next to each other in the list.
6533     // To help reduce the number of CSE recomputations, process all
6534     // the uses of this user that we can find this way.
6535     do {
6536       unsigned i = Uses[UseIndex].Index;
6537       SDUse &Use = *Uses[UseIndex].Use;
6538       ++UseIndex;
6539
6540       Use.set(To[i]);
6541     } while (UseIndex != UseIndexEnd && Uses[UseIndex].User == User);
6542
6543     // Now that we have modified User, add it back to the CSE maps.  If it
6544     // already exists there, recursively merge the results together.
6545     AddModifiedNodeToCSEMaps(User);
6546   }
6547 }
6548
6549 /// AssignTopologicalOrder - Assign a unique node id for each node in the DAG
6550 /// based on their topological order. It returns the maximum id and a vector
6551 /// of the SDNodes* in assigned order by reference.
6552 unsigned SelectionDAG::AssignTopologicalOrder() {
6553
6554   unsigned DAGSize = 0;
6555
6556   // SortedPos tracks the progress of the algorithm. Nodes before it are
6557   // sorted, nodes after it are unsorted. When the algorithm completes
6558   // it is at the end of the list.
6559   allnodes_iterator SortedPos = allnodes_begin();
6560
6561   // Visit all the nodes. Move nodes with no operands to the front of
6562   // the list immediately. Annotate nodes that do have operands with their
6563   // operand count. Before we do this, the Node Id fields of the nodes
6564   // may contain arbitrary values. After, the Node Id fields for nodes
6565   // before SortedPos will contain the topological sort index, and the
6566   // Node Id fields for nodes At SortedPos and after will contain the
6567   // count of outstanding operands.
6568   for (allnodes_iterator I = allnodes_begin(),E = allnodes_end(); I != E; ) {
6569     SDNode *N = &*I++;
6570     checkForCycles(N, this);
6571     unsigned Degree = N->getNumOperands();
6572     if (Degree == 0) {
6573       // A node with no uses, add it to the result array immediately.
6574       N->setNodeId(DAGSize++);
6575       allnodes_iterator Q(N);
6576       if (Q != SortedPos)
6577         SortedPos = AllNodes.insert(SortedPos, AllNodes.remove(Q));
6578       assert(SortedPos != AllNodes.end() && "Overran node list");
6579       ++SortedPos;
6580     } else {
6581       // Temporarily use the Node Id as scratch space for the degree count.
6582       N->setNodeId(Degree);
6583     }
6584   }
6585
6586   // Visit all the nodes. As we iterate, move nodes into sorted order,
6587   // such that by the time the end is reached all nodes will be sorted.
6588   for (SDNode &Node : allnodes()) {
6589     SDNode *N = &Node;
6590     checkForCycles(N, this);
6591     // N is in sorted position, so all its uses have one less operand
6592     // that needs to be sorted.
6593     for (SDNode::use_iterator UI = N->use_begin(), UE = N->use_end();
6594          UI != UE; ++UI) {
6595       SDNode *P = *UI;
6596       unsigned Degree = P->getNodeId();
6597       assert(Degree != 0 && "Invalid node degree");
6598       --Degree;
6599       if (Degree == 0) {
6600         // All of P's operands are sorted, so P may sorted now.
6601         P->setNodeId(DAGSize++);
6602         if (P != SortedPos)
6603           SortedPos = AllNodes.insert(SortedPos, AllNodes.remove(P));
6604         assert(SortedPos != AllNodes.end() && "Overran node list");
6605         ++SortedPos;
6606       } else {
6607         // Update P's outstanding operand count.
6608         P->setNodeId(Degree);
6609       }
6610     }
6611     if (&Node == SortedPos) {
6612 #ifndef NDEBUG
6613       allnodes_iterator I(N);
6614       SDNode *S = &*++I;
6615       dbgs() << "Overran sorted position:\n";
6616       S->dumprFull(this); dbgs() << "\n";
6617       dbgs() << "Checking if this is due to cycles\n";
6618       checkForCycles(this, true);
6619 #endif
6620       llvm_unreachable(nullptr);
6621     }
6622   }
6623
6624   assert(SortedPos == AllNodes.end() &&
6625          "Topological sort incomplete!");
6626   assert(AllNodes.front().getOpcode() == ISD::EntryToken &&
6627          "First node in topological sort is not the entry token!");
6628   assert(AllNodes.front().getNodeId() == 0 &&
6629          "First node in topological sort has non-zero id!");
6630   assert(AllNodes.front().getNumOperands() == 0 &&
6631          "First node in topological sort has operands!");
6632   assert(AllNodes.back().getNodeId() == (int)DAGSize-1 &&
6633          "Last node in topologic sort has unexpected id!");
6634   assert(AllNodes.back().use_empty() &&
6635          "Last node in topologic sort has users!");
6636   assert(DAGSize == allnodes_size() && "Node count mismatch!");
6637   return DAGSize;
6638 }
6639
6640 /// AddDbgValue - Add a dbg_value SDNode. If SD is non-null that means the
6641 /// value is produced by SD.
6642 void SelectionDAG::AddDbgValue(SDDbgValue *DB, SDNode *SD, bool isParameter) {
6643   if (SD) {
6644     assert(DbgInfo->getSDDbgValues(SD).empty() || SD->getHasDebugValue());
6645     SD->setHasDebugValue(true);
6646   }
6647   DbgInfo->add(DB, SD, isParameter);
6648 }
6649
6650 /// TransferDbgValues - Transfer SDDbgValues.
6651 void SelectionDAG::TransferDbgValues(SDValue From, SDValue To) {
6652   if (From == To || !From.getNode()->getHasDebugValue())
6653     return;
6654   SDNode *FromNode = From.getNode();
6655   SDNode *ToNode = To.getNode();
6656   ArrayRef<SDDbgValue *> DVs = GetDbgValues(FromNode);
6657   SmallVector<SDDbgValue *, 2> ClonedDVs;
6658   for (ArrayRef<SDDbgValue *>::iterator I = DVs.begin(), E = DVs.end();
6659        I != E; ++I) {
6660     SDDbgValue *Dbg = *I;
6661     if (Dbg->getKind() == SDDbgValue::SDNODE) {
6662       SDDbgValue *Clone =
6663           getDbgValue(Dbg->getVariable(), Dbg->getExpression(), ToNode,
6664                       To.getResNo(), Dbg->isIndirect(), Dbg->getOffset(),
6665                       Dbg->getDebugLoc(), Dbg->getOrder());
6666       ClonedDVs.push_back(Clone);
6667     }
6668   }
6669   for (SmallVectorImpl<SDDbgValue *>::iterator I = ClonedDVs.begin(),
6670          E = ClonedDVs.end(); I != E; ++I)
6671     AddDbgValue(*I, ToNode, false);
6672 }
6673
6674 //===----------------------------------------------------------------------===//
6675 //                              SDNode Class
6676 //===----------------------------------------------------------------------===//
6677
6678 bool llvm::isNullConstant(SDValue V) {
6679   ConstantSDNode *Const = dyn_cast<ConstantSDNode>(V);
6680   return Const != nullptr && Const->isNullValue();
6681 }
6682
6683 bool llvm::isNullFPConstant(SDValue V) {
6684   ConstantFPSDNode *Const = dyn_cast<ConstantFPSDNode>(V);
6685   return Const != nullptr && Const->isZero() && !Const->isNegative();
6686 }
6687
6688 bool llvm::isAllOnesConstant(SDValue V) {
6689   ConstantSDNode *Const = dyn_cast<ConstantSDNode>(V);
6690   return Const != nullptr && Const->isAllOnesValue();
6691 }
6692
6693 bool llvm::isOneConstant(SDValue V) {
6694   ConstantSDNode *Const = dyn_cast<ConstantSDNode>(V);
6695   return Const != nullptr && Const->isOne();
6696 }
6697
6698 HandleSDNode::~HandleSDNode() {
6699   DropOperands();
6700 }
6701
6702 GlobalAddressSDNode::GlobalAddressSDNode(unsigned Opc, unsigned Order,
6703                                          DebugLoc DL, const GlobalValue *GA,
6704                                          EVT VT, int64_t o, unsigned char TF)
6705   : SDNode(Opc, Order, DL, getSDVTList(VT)), Offset(o), TargetFlags(TF) {
6706   TheGlobal = GA;
6707 }
6708
6709 AddrSpaceCastSDNode::AddrSpaceCastSDNode(unsigned Order, DebugLoc dl, EVT VT,
6710                                          SDValue X, unsigned SrcAS,
6711                                          unsigned DestAS)
6712  : UnarySDNode(ISD::ADDRSPACECAST, Order, dl, getSDVTList(VT), X),
6713    SrcAddrSpace(SrcAS), DestAddrSpace(DestAS) {}
6714
6715 MemSDNode::MemSDNode(unsigned Opc, unsigned Order, DebugLoc dl, SDVTList VTs,
6716                      EVT memvt, MachineMemOperand *mmo)
6717  : SDNode(Opc, Order, dl, VTs), MemoryVT(memvt), MMO(mmo) {
6718   SubclassData = encodeMemSDNodeFlags(0, ISD::UNINDEXED, MMO->isVolatile(),
6719                                       MMO->isNonTemporal(), MMO->isInvariant());
6720   assert(isVolatile() == MMO->isVolatile() && "Volatile encoding error!");
6721   assert(isNonTemporal() == MMO->isNonTemporal() &&
6722          "Non-temporal encoding error!");
6723   // We check here that the size of the memory operand fits within the size of
6724   // the MMO. This is because the MMO might indicate only a possible address
6725   // range instead of specifying the affected memory addresses precisely.
6726   assert(memvt.getStoreSize() <= MMO->getSize() && "Size mismatch!");
6727 }
6728
6729 MemSDNode::MemSDNode(unsigned Opc, unsigned Order, DebugLoc dl, SDVTList VTs,
6730                      ArrayRef<SDValue> Ops, EVT memvt, MachineMemOperand *mmo)
6731    : SDNode(Opc, Order, dl, VTs, Ops),
6732      MemoryVT(memvt), MMO(mmo) {
6733   SubclassData = encodeMemSDNodeFlags(0, ISD::UNINDEXED, MMO->isVolatile(),
6734                                       MMO->isNonTemporal(), MMO->isInvariant());
6735   assert(isVolatile() == MMO->isVolatile() && "Volatile encoding error!");
6736   assert(memvt.getStoreSize() <= MMO->getSize() && "Size mismatch!");
6737 }
6738
6739 /// Profile - Gather unique data for the node.
6740 ///
6741 void SDNode::Profile(FoldingSetNodeID &ID) const {
6742   AddNodeIDNode(ID, this);
6743 }
6744
6745 namespace {
6746   struct EVTArray {
6747     std::vector<EVT> VTs;
6748
6749     EVTArray() {
6750       VTs.reserve(MVT::LAST_VALUETYPE);
6751       for (unsigned i = 0; i < MVT::LAST_VALUETYPE; ++i)
6752         VTs.push_back(MVT((MVT::SimpleValueType)i));
6753     }
6754   };
6755 }
6756
6757 static ManagedStatic<std::set<EVT, EVT::compareRawBits> > EVTs;
6758 static ManagedStatic<EVTArray> SimpleVTArray;
6759 static ManagedStatic<sys::SmartMutex<true> > VTMutex;
6760
6761 /// getValueTypeList - Return a pointer to the specified value type.
6762 ///
6763 const EVT *SDNode::getValueTypeList(EVT VT) {
6764   if (VT.isExtended()) {
6765     sys::SmartScopedLock<true> Lock(*VTMutex);
6766     return &(*EVTs->insert(VT).first);
6767   } else {
6768     assert(VT.getSimpleVT() < MVT::LAST_VALUETYPE &&
6769            "Value type out of range!");
6770     return &SimpleVTArray->VTs[VT.getSimpleVT().SimpleTy];
6771   }
6772 }
6773
6774 /// hasNUsesOfValue - Return true if there are exactly NUSES uses of the
6775 /// indicated value.  This method ignores uses of other values defined by this
6776 /// operation.
6777 bool SDNode::hasNUsesOfValue(unsigned NUses, unsigned Value) const {
6778   assert(Value < getNumValues() && "Bad value!");
6779
6780   // TODO: Only iterate over uses of a given value of the node
6781   for (SDNode::use_iterator UI = use_begin(), E = use_end(); UI != E; ++UI) {
6782     if (UI.getUse().getResNo() == Value) {
6783       if (NUses == 0)
6784         return false;
6785       --NUses;
6786     }
6787   }
6788
6789   // Found exactly the right number of uses?
6790   return NUses == 0;
6791 }
6792
6793
6794 /// hasAnyUseOfValue - Return true if there are any use of the indicated
6795 /// value. This method ignores uses of other values defined by this operation.
6796 bool SDNode::hasAnyUseOfValue(unsigned Value) const {
6797   assert(Value < getNumValues() && "Bad value!");
6798
6799   for (SDNode::use_iterator UI = use_begin(), E = use_end(); UI != E; ++UI)
6800     if (UI.getUse().getResNo() == Value)
6801       return true;
6802
6803   return false;
6804 }
6805
6806
6807 /// isOnlyUserOf - Return true if this node is the only use of N.
6808 ///
6809 bool SDNode::isOnlyUserOf(const SDNode *N) const {
6810   bool Seen = false;
6811   for (SDNode::use_iterator I = N->use_begin(), E = N->use_end(); I != E; ++I) {
6812     SDNode *User = *I;
6813     if (User == this)
6814       Seen = true;
6815     else
6816       return false;
6817   }
6818
6819   return Seen;
6820 }
6821
6822 /// isOperand - Return true if this node is an operand of N.
6823 ///
6824 bool SDValue::isOperandOf(const SDNode *N) const {
6825   for (const SDValue &Op : N->op_values())
6826     if (*this == Op)
6827       return true;
6828   return false;
6829 }
6830
6831 bool SDNode::isOperandOf(const SDNode *N) const {
6832   for (const SDValue &Op : N->op_values())
6833     if (this == Op.getNode())
6834       return true;
6835   return false;
6836 }
6837
6838 /// reachesChainWithoutSideEffects - Return true if this operand (which must
6839 /// be a chain) reaches the specified operand without crossing any
6840 /// side-effecting instructions on any chain path.  In practice, this looks
6841 /// through token factors and non-volatile loads.  In order to remain efficient,
6842 /// this only looks a couple of nodes in, it does not do an exhaustive search.
6843 bool SDValue::reachesChainWithoutSideEffects(SDValue Dest,
6844                                                unsigned Depth) const {
6845   if (*this == Dest) return true;
6846
6847   // Don't search too deeply, we just want to be able to see through
6848   // TokenFactor's etc.
6849   if (Depth == 0) return false;
6850
6851   // If this is a token factor, all inputs to the TF happen in parallel.  If any
6852   // of the operands of the TF does not reach dest, then we cannot do the xform.
6853   if (getOpcode() == ISD::TokenFactor) {
6854     for (unsigned i = 0, e = getNumOperands(); i != e; ++i)
6855       if (!getOperand(i).reachesChainWithoutSideEffects(Dest, Depth-1))
6856         return false;
6857     return true;
6858   }
6859
6860   // Loads don't have side effects, look through them.
6861   if (LoadSDNode *Ld = dyn_cast<LoadSDNode>(*this)) {
6862     if (!Ld->isVolatile())
6863       return Ld->getChain().reachesChainWithoutSideEffects(Dest, Depth-1);
6864   }
6865   return false;
6866 }
6867
6868 /// hasPredecessor - Return true if N is a predecessor of this node.
6869 /// N is either an operand of this node, or can be reached by recursively
6870 /// traversing up the operands.
6871 /// NOTE: This is an expensive method. Use it carefully.
6872 bool SDNode::hasPredecessor(const SDNode *N) const {
6873   SmallPtrSet<const SDNode *, 32> Visited;
6874   SmallVector<const SDNode *, 16> Worklist;
6875   return hasPredecessorHelper(N, Visited, Worklist);
6876 }
6877
6878 bool
6879 SDNode::hasPredecessorHelper(const SDNode *N,
6880                              SmallPtrSetImpl<const SDNode *> &Visited,
6881                              SmallVectorImpl<const SDNode *> &Worklist) const {
6882   if (Visited.empty()) {
6883     Worklist.push_back(this);
6884   } else {
6885     // Take a look in the visited set. If we've already encountered this node
6886     // we needn't search further.
6887     if (Visited.count(N))
6888       return true;
6889   }
6890
6891   // Haven't visited N yet. Continue the search.
6892   while (!Worklist.empty()) {
6893     const SDNode *M = Worklist.pop_back_val();
6894     for (const SDValue &OpV : M->op_values()) {
6895       SDNode *Op = OpV.getNode();
6896       if (Visited.insert(Op).second)
6897         Worklist.push_back(Op);
6898       if (Op == N)
6899         return true;
6900     }
6901   }
6902
6903   return false;
6904 }
6905
6906 uint64_t SDNode::getConstantOperandVal(unsigned Num) const {
6907   assert(Num < NumOperands && "Invalid child # of SDNode!");
6908   return cast<ConstantSDNode>(OperandList[Num])->getZExtValue();
6909 }
6910
6911 const SDNodeFlags *SDNode::getFlags() const {
6912   if (auto *FlagsNode = dyn_cast<BinaryWithFlagsSDNode>(this))
6913     return &FlagsNode->Flags;
6914   return nullptr;
6915 }
6916
6917 SDValue SelectionDAG::UnrollVectorOp(SDNode *N, unsigned ResNE) {
6918   assert(N->getNumValues() == 1 &&
6919          "Can't unroll a vector with multiple results!");
6920
6921   EVT VT = N->getValueType(0);
6922   unsigned NE = VT.getVectorNumElements();
6923   EVT EltVT = VT.getVectorElementType();
6924   SDLoc dl(N);
6925
6926   SmallVector<SDValue, 8> Scalars;
6927   SmallVector<SDValue, 4> Operands(N->getNumOperands());
6928
6929   // If ResNE is 0, fully unroll the vector op.
6930   if (ResNE == 0)
6931     ResNE = NE;
6932   else if (NE > ResNE)
6933     NE = ResNE;
6934
6935   unsigned i;
6936   for (i= 0; i != NE; ++i) {
6937     for (unsigned j = 0, e = N->getNumOperands(); j != e; ++j) {
6938       SDValue Operand = N->getOperand(j);
6939       EVT OperandVT = Operand.getValueType();
6940       if (OperandVT.isVector()) {
6941         // A vector operand; extract a single element.
6942         EVT OperandEltVT = OperandVT.getVectorElementType();
6943         Operands[j] =
6944             getNode(ISD::EXTRACT_VECTOR_ELT, dl, OperandEltVT, Operand,
6945                     getConstant(i, dl, TLI->getVectorIdxTy(getDataLayout())));
6946       } else {
6947         // A scalar operand; just use it as is.
6948         Operands[j] = Operand;
6949       }
6950     }
6951
6952     switch (N->getOpcode()) {
6953     default: {
6954       Scalars.push_back(getNode(N->getOpcode(), dl, EltVT, Operands,
6955                                 N->getFlags()));
6956       break;
6957     }
6958     case ISD::VSELECT:
6959       Scalars.push_back(getNode(ISD::SELECT, dl, EltVT, Operands));
6960       break;
6961     case ISD::SHL:
6962     case ISD::SRA:
6963     case ISD::SRL:
6964     case ISD::ROTL:
6965     case ISD::ROTR:
6966       Scalars.push_back(getNode(N->getOpcode(), dl, EltVT, Operands[0],
6967                                getShiftAmountOperand(Operands[0].getValueType(),
6968                                                      Operands[1])));
6969       break;
6970     case ISD::SIGN_EXTEND_INREG:
6971     case ISD::FP_ROUND_INREG: {
6972       EVT ExtVT = cast<VTSDNode>(Operands[1])->getVT().getVectorElementType();
6973       Scalars.push_back(getNode(N->getOpcode(), dl, EltVT,
6974                                 Operands[0],
6975                                 getValueType(ExtVT)));
6976     }
6977     }
6978   }
6979
6980   for (; i < ResNE; ++i)
6981     Scalars.push_back(getUNDEF(EltVT));
6982
6983   return getNode(ISD::BUILD_VECTOR, dl,
6984                  EVT::getVectorVT(*getContext(), EltVT, ResNE), Scalars);
6985 }
6986
6987
6988 /// isConsecutiveLoad - Return true if LD is loading 'Bytes' bytes from a
6989 /// location that is 'Dist' units away from the location that the 'Base' load
6990 /// is loading from.
6991 bool SelectionDAG::isConsecutiveLoad(LoadSDNode *LD, LoadSDNode *Base,
6992                                      unsigned Bytes, int Dist) const {
6993   if (LD->getChain() != Base->getChain())
6994     return false;
6995   EVT VT = LD->getValueType(0);
6996   if (VT.getSizeInBits() / 8 != Bytes)
6997     return false;
6998
6999   SDValue Loc = LD->getOperand(1);
7000   SDValue BaseLoc = Base->getOperand(1);
7001   if (Loc.getOpcode() == ISD::FrameIndex) {
7002     if (BaseLoc.getOpcode() != ISD::FrameIndex)
7003       return false;
7004     const MachineFrameInfo *MFI = getMachineFunction().getFrameInfo();
7005     int FI  = cast<FrameIndexSDNode>(Loc)->getIndex();
7006     int BFI = cast<FrameIndexSDNode>(BaseLoc)->getIndex();
7007     int FS  = MFI->getObjectSize(FI);
7008     int BFS = MFI->getObjectSize(BFI);
7009     if (FS != BFS || FS != (int)Bytes) return false;
7010     return MFI->getObjectOffset(FI) == (MFI->getObjectOffset(BFI) + Dist*Bytes);
7011   }
7012
7013   // Handle X + C.
7014   if (isBaseWithConstantOffset(Loc)) {
7015     int64_t LocOffset = cast<ConstantSDNode>(Loc.getOperand(1))->getSExtValue();
7016     if (Loc.getOperand(0) == BaseLoc) {
7017       // If the base location is a simple address with no offset itself, then
7018       // the second load's first add operand should be the base address.
7019       if (LocOffset == Dist * (int)Bytes)
7020         return true;
7021     } else if (isBaseWithConstantOffset(BaseLoc)) {
7022       // The base location itself has an offset, so subtract that value from the
7023       // second load's offset before comparing to distance * size.
7024       int64_t BOffset =
7025         cast<ConstantSDNode>(BaseLoc.getOperand(1))->getSExtValue();
7026       if (Loc.getOperand(0) == BaseLoc.getOperand(0)) {
7027         if ((LocOffset - BOffset) == Dist * (int)Bytes)
7028           return true;
7029       }
7030     }
7031   }
7032   const GlobalValue *GV1 = nullptr;
7033   const GlobalValue *GV2 = nullptr;
7034   int64_t Offset1 = 0;
7035   int64_t Offset2 = 0;
7036   bool isGA1 = TLI->isGAPlusOffset(Loc.getNode(), GV1, Offset1);
7037   bool isGA2 = TLI->isGAPlusOffset(BaseLoc.getNode(), GV2, Offset2);
7038   if (isGA1 && isGA2 && GV1 == GV2)
7039     return Offset1 == (Offset2 + Dist*Bytes);
7040   return false;
7041 }
7042
7043
7044 /// InferPtrAlignment - Infer alignment of a load / store address. Return 0 if
7045 /// it cannot be inferred.
7046 unsigned SelectionDAG::InferPtrAlignment(SDValue Ptr) const {
7047   // If this is a GlobalAddress + cst, return the alignment.
7048   const GlobalValue *GV;
7049   int64_t GVOffset = 0;
7050   if (TLI->isGAPlusOffset(Ptr.getNode(), GV, GVOffset)) {
7051     unsigned PtrWidth = getDataLayout().getPointerTypeSizeInBits(GV->getType());
7052     APInt KnownZero(PtrWidth, 0), KnownOne(PtrWidth, 0);
7053     llvm::computeKnownBits(const_cast<GlobalValue *>(GV), KnownZero, KnownOne,
7054                            getDataLayout());
7055     unsigned AlignBits = KnownZero.countTrailingOnes();
7056     unsigned Align = AlignBits ? 1 << std::min(31U, AlignBits) : 0;
7057     if (Align)
7058       return MinAlign(Align, GVOffset);
7059   }
7060
7061   // If this is a direct reference to a stack slot, use information about the
7062   // stack slot's alignment.
7063   int FrameIdx = 1 << 31;
7064   int64_t FrameOffset = 0;
7065   if (FrameIndexSDNode *FI = dyn_cast<FrameIndexSDNode>(Ptr)) {
7066     FrameIdx = FI->getIndex();
7067   } else if (isBaseWithConstantOffset(Ptr) &&
7068              isa<FrameIndexSDNode>(Ptr.getOperand(0))) {
7069     // Handle FI+Cst
7070     FrameIdx = cast<FrameIndexSDNode>(Ptr.getOperand(0))->getIndex();
7071     FrameOffset = Ptr.getConstantOperandVal(1);
7072   }
7073
7074   if (FrameIdx != (1 << 31)) {
7075     const MachineFrameInfo &MFI = *getMachineFunction().getFrameInfo();
7076     unsigned FIInfoAlign = MinAlign(MFI.getObjectAlignment(FrameIdx),
7077                                     FrameOffset);
7078     return FIInfoAlign;
7079   }
7080
7081   return 0;
7082 }
7083
7084 /// GetSplitDestVTs - Compute the VTs needed for the low/hi parts of a type
7085 /// which is split (or expanded) into two not necessarily identical pieces.
7086 std::pair<EVT, EVT> SelectionDAG::GetSplitDestVTs(const EVT &VT) const {
7087   // Currently all types are split in half.
7088   EVT LoVT, HiVT;
7089   if (!VT.isVector()) {
7090     LoVT = HiVT = TLI->getTypeToTransformTo(*getContext(), VT);
7091   } else {
7092     unsigned NumElements = VT.getVectorNumElements();
7093     assert(!(NumElements & 1) && "Splitting vector, but not in half!");
7094     LoVT = HiVT = EVT::getVectorVT(*getContext(), VT.getVectorElementType(),
7095                                    NumElements/2);
7096   }
7097   return std::make_pair(LoVT, HiVT);
7098 }
7099
7100 /// SplitVector - Split the vector with EXTRACT_SUBVECTOR and return the
7101 /// low/high part.
7102 std::pair<SDValue, SDValue>
7103 SelectionDAG::SplitVector(const SDValue &N, const SDLoc &DL, const EVT &LoVT,
7104                           const EVT &HiVT) {
7105   assert(LoVT.getVectorNumElements() + HiVT.getVectorNumElements() <=
7106          N.getValueType().getVectorNumElements() &&
7107          "More vector elements requested than available!");
7108   SDValue Lo, Hi;
7109   Lo = getNode(ISD::EXTRACT_SUBVECTOR, DL, LoVT, N,
7110                getConstant(0, DL, TLI->getVectorIdxTy(getDataLayout())));
7111   Hi = getNode(ISD::EXTRACT_SUBVECTOR, DL, HiVT, N,
7112                getConstant(LoVT.getVectorNumElements(), DL,
7113                            TLI->getVectorIdxTy(getDataLayout())));
7114   return std::make_pair(Lo, Hi);
7115 }
7116
7117 void SelectionDAG::ExtractVectorElements(SDValue Op,
7118                                          SmallVectorImpl<SDValue> &Args,
7119                                          unsigned Start, unsigned Count) {
7120   EVT VT = Op.getValueType();
7121   if (Count == 0)
7122     Count = VT.getVectorNumElements();
7123
7124   EVT EltVT = VT.getVectorElementType();
7125   EVT IdxTy = TLI->getVectorIdxTy(getDataLayout());
7126   SDLoc SL(Op);
7127   for (unsigned i = Start, e = Start + Count; i != e; ++i) {
7128     Args.push_back(getNode(ISD::EXTRACT_VECTOR_ELT, SL, EltVT,
7129                            Op, getConstant(i, SL, IdxTy)));
7130   }
7131 }
7132
7133 // getAddressSpace - Return the address space this GlobalAddress belongs to.
7134 unsigned GlobalAddressSDNode::getAddressSpace() const {
7135   return getGlobal()->getType()->getAddressSpace();
7136 }
7137
7138
7139 Type *ConstantPoolSDNode::getType() const {
7140   if (isMachineConstantPoolEntry())
7141     return Val.MachineCPVal->getType();
7142   return Val.ConstVal->getType();
7143 }
7144
7145 bool BuildVectorSDNode::isConstantSplat(APInt &SplatValue,
7146                                         APInt &SplatUndef,
7147                                         unsigned &SplatBitSize,
7148                                         bool &HasAnyUndefs,
7149                                         unsigned MinSplatBits,
7150                                         bool isBigEndian) const {
7151   EVT VT = getValueType(0);
7152   assert(VT.isVector() && "Expected a vector type");
7153   unsigned sz = VT.getSizeInBits();
7154   if (MinSplatBits > sz)
7155     return false;
7156
7157   SplatValue = APInt(sz, 0);
7158   SplatUndef = APInt(sz, 0);
7159
7160   // Get the bits.  Bits with undefined values (when the corresponding element
7161   // of the vector is an ISD::UNDEF value) are set in SplatUndef and cleared
7162   // in SplatValue.  If any of the values are not constant, give up and return
7163   // false.
7164   unsigned int nOps = getNumOperands();
7165   assert(nOps > 0 && "isConstantSplat has 0-size build vector");
7166   unsigned EltBitSize = VT.getVectorElementType().getSizeInBits();
7167
7168   for (unsigned j = 0; j < nOps; ++j) {
7169     unsigned i = isBigEndian ? nOps-1-j : j;
7170     SDValue OpVal = getOperand(i);
7171     unsigned BitPos = j * EltBitSize;
7172
7173     if (OpVal.getOpcode() == ISD::UNDEF)
7174       SplatUndef |= APInt::getBitsSet(sz, BitPos, BitPos + EltBitSize);
7175     else if (ConstantSDNode *CN = dyn_cast<ConstantSDNode>(OpVal))
7176       SplatValue |= CN->getAPIntValue().zextOrTrunc(EltBitSize).
7177                     zextOrTrunc(sz) << BitPos;
7178     else if (ConstantFPSDNode *CN = dyn_cast<ConstantFPSDNode>(OpVal))
7179       SplatValue |= CN->getValueAPF().bitcastToAPInt().zextOrTrunc(sz) <<BitPos;
7180      else
7181       return false;
7182   }
7183
7184   // The build_vector is all constants or undefs.  Find the smallest element
7185   // size that splats the vector.
7186
7187   HasAnyUndefs = (SplatUndef != 0);
7188   while (sz > 8) {
7189
7190     unsigned HalfSize = sz / 2;
7191     APInt HighValue = SplatValue.lshr(HalfSize).trunc(HalfSize);
7192     APInt LowValue = SplatValue.trunc(HalfSize);
7193     APInt HighUndef = SplatUndef.lshr(HalfSize).trunc(HalfSize);
7194     APInt LowUndef = SplatUndef.trunc(HalfSize);
7195
7196     // If the two halves do not match (ignoring undef bits), stop here.
7197     if ((HighValue & ~LowUndef) != (LowValue & ~HighUndef) ||
7198         MinSplatBits > HalfSize)
7199       break;
7200
7201     SplatValue = HighValue | LowValue;
7202     SplatUndef = HighUndef & LowUndef;
7203
7204     sz = HalfSize;
7205   }
7206
7207   SplatBitSize = sz;
7208   return true;
7209 }
7210
7211 SDValue BuildVectorSDNode::getSplatValue(BitVector *UndefElements) const {
7212   if (UndefElements) {
7213     UndefElements->clear();
7214     UndefElements->resize(getNumOperands());
7215   }
7216   SDValue Splatted;
7217   for (unsigned i = 0, e = getNumOperands(); i != e; ++i) {
7218     SDValue Op = getOperand(i);
7219     if (Op.getOpcode() == ISD::UNDEF) {
7220       if (UndefElements)
7221         (*UndefElements)[i] = true;
7222     } else if (!Splatted) {
7223       Splatted = Op;
7224     } else if (Splatted != Op) {
7225       return SDValue();
7226     }
7227   }
7228
7229   if (!Splatted) {
7230     assert(getOperand(0).getOpcode() == ISD::UNDEF &&
7231            "Can only have a splat without a constant for all undefs.");
7232     return getOperand(0);
7233   }
7234
7235   return Splatted;
7236 }
7237
7238 ConstantSDNode *
7239 BuildVectorSDNode::getConstantSplatNode(BitVector *UndefElements) const {
7240   return dyn_cast_or_null<ConstantSDNode>(getSplatValue(UndefElements));
7241 }
7242
7243 ConstantFPSDNode *
7244 BuildVectorSDNode::getConstantFPSplatNode(BitVector *UndefElements) const {
7245   return dyn_cast_or_null<ConstantFPSDNode>(getSplatValue(UndefElements));
7246 }
7247
7248 int32_t
7249 BuildVectorSDNode::getConstantFPSplatPow2ToLog2Int(BitVector *UndefElements,
7250                                                    uint32_t BitWidth) const {
7251   if (ConstantFPSDNode *CN =
7252           dyn_cast_or_null<ConstantFPSDNode>(getSplatValue(UndefElements))) {
7253     bool IsExact;
7254     APSInt IntVal(BitWidth);
7255     APFloat APF = CN->getValueAPF();
7256     if (APF.convertToInteger(IntVal, APFloat::rmTowardZero, &IsExact) !=
7257             APFloat::opOK ||
7258         !IsExact)
7259       return -1;
7260
7261     return IntVal.exactLogBase2();
7262   }
7263   return -1;
7264 }
7265
7266 bool BuildVectorSDNode::isConstant() const {
7267   for (const SDValue &Op : op_values()) {
7268     unsigned Opc = Op.getOpcode();
7269     if (Opc != ISD::UNDEF && Opc != ISD::Constant && Opc != ISD::ConstantFP)
7270       return false;
7271   }
7272   return true;
7273 }
7274
7275 bool ShuffleVectorSDNode::isSplatMask(const int *Mask, EVT VT) {
7276   // Find the first non-undef value in the shuffle mask.
7277   unsigned i, e;
7278   for (i = 0, e = VT.getVectorNumElements(); i != e && Mask[i] < 0; ++i)
7279     /* search */;
7280
7281   assert(i != e && "VECTOR_SHUFFLE node with all undef indices!");
7282
7283   // Make sure all remaining elements are either undef or the same as the first
7284   // non-undef value.
7285   for (int Idx = Mask[i]; i != e; ++i)
7286     if (Mask[i] >= 0 && Mask[i] != Idx)
7287       return false;
7288   return true;
7289 }
7290
7291 #ifndef NDEBUG
7292 static void checkForCyclesHelper(const SDNode *N,
7293                                  SmallPtrSetImpl<const SDNode*> &Visited,
7294                                  SmallPtrSetImpl<const SDNode*> &Checked,
7295                                  const llvm::SelectionDAG *DAG) {
7296   // If this node has already been checked, don't check it again.
7297   if (Checked.count(N))
7298     return;
7299
7300   // If a node has already been visited on this depth-first walk, reject it as
7301   // a cycle.
7302   if (!Visited.insert(N).second) {
7303     errs() << "Detected cycle in SelectionDAG\n";
7304     dbgs() << "Offending node:\n";
7305     N->dumprFull(DAG); dbgs() << "\n";
7306     abort();
7307   }
7308
7309   for (const SDValue &Op : N->op_values())
7310     checkForCyclesHelper(Op.getNode(), Visited, Checked, DAG);
7311
7312   Checked.insert(N);
7313   Visited.erase(N);
7314 }
7315 #endif
7316
7317 void llvm::checkForCycles(const llvm::SDNode *N,
7318                           const llvm::SelectionDAG *DAG,
7319                           bool force) {
7320 #ifndef NDEBUG
7321   bool check = force;
7322 #ifdef XDEBUG
7323   check = true;
7324 #endif  // XDEBUG
7325   if (check) {
7326     assert(N && "Checking nonexistent SDNode");
7327     SmallPtrSet<const SDNode*, 32> visited;
7328     SmallPtrSet<const SDNode*, 32> checked;
7329     checkForCyclesHelper(N, visited, checked, DAG);
7330   }
7331 #endif  // !NDEBUG
7332 }
7333
7334 void llvm::checkForCycles(const llvm::SelectionDAG *DAG, bool force) {
7335   checkForCycles(DAG->getRoot().getNode(), DAG, force);
7336 }