Reapply r143206, with fixes. Disallow physical register lifetimes

[oota-llvm.git] / lib / CodeGen / SelectionDAG / SelectionDAG.cpp
diff --git a/lib/CodeGen/SelectionDAG/SelectionDAG.cpp b/lib/CodeGen/SelectionDAG/SelectionDAG.cpp

index 888d8b4ea397cd25d9faeb5bb665e79fcae5e8be..010a740dc7c4284b4848c47696f4907a4691956a 100644 (file)
--- a/lib/CodeGen/SelectionDAG/SelectionDAG.cpp
+++ b/lib/CodeGen/SelectionDAG/SelectionDAG.cpp
@@ -403,7 +403,7 @@ static void AddNodeIDCustom(FoldingSetNodeID &ID, const SDNode *N) {
      ID.AddInteger(CP->getAlignment());
      ID.AddInteger(CP->getOffset());
      if (CP->isMachineConstantPoolEntry())
-      CP->getMachineCPVal()->AddSelectionDAGCSEId(ID);
+      CP->getMachineCPVal()->addSelectionDAGCSEId(ID);
      else
        ID.AddPointer(CP->getConstVal());
      ID.AddInteger(CP->getTargetFlags());
@@ -432,7 +432,9 @@ static void AddNodeIDCustom(FoldingSetNodeID &ID, const SDNode *N) {
    case ISD::ATOMIC_LOAD_MIN:
    case ISD::ATOMIC_LOAD_MAX:
    case ISD::ATOMIC_LOAD_UMIN:
-  case ISD::ATOMIC_LOAD_UMAX: {
+  case ISD::ATOMIC_LOAD_UMAX:
+  case ISD::ATOMIC_LOAD:
+  case ISD::ATOMIC_STORE: {
      const AtomicSDNode *AT = cast<AtomicSDNode>(N);
      ID.AddInteger(AT->getMemoryVT().getRawBits());
      ID.AddInteger(AT->getRawSubclassData());
@@ -769,11 +771,14 @@ static void VerifyNodeCommon(SDNode *N) {
      assert(N->getNumOperands() == N->getValueType(0).getVectorNumElements() &&
             "Wrong number of operands!");
      EVT EltVT = N->getValueType(0).getVectorElementType();
-    for (SDNode::op_iterator I = N->op_begin(), E = N->op_end(); I != E; ++I)
+    for (SDNode::op_iterator I = N->op_begin(), E = N->op_end(); I != E; ++I) {
        assert((I->getValueType() == EltVT ||
               (EltVT.isInteger() && I->getValueType().isInteger() &&
                EltVT.bitsLE(I->getValueType()))) &&
              "Wrong operand type!");
+      assert(I->getValueType() == N->getOperand(0).getValueType() &&
+             "Operands must all have the same type");
+    }
      break;
    }
    }
@@ -876,6 +881,12 @@ void SelectionDAG::clear() {
    DbgInfo->clear();
  }
  
+SDValue SelectionDAG::getAnyExtOrTrunc(SDValue Op, DebugLoc DL, EVT VT) {
+  return VT.bitsGT(Op.getValueType()) ?
+    getNode(ISD::ANY_EXTEND, DL, VT, Op) :
+    getNode(ISD::TRUNCATE, DL, VT, Op);
+}
+
  SDValue SelectionDAG::getSExtOrTrunc(SDValue Op, DebugLoc DL, EVT VT) {
    return VT.bitsGT(Op.getValueType()) ?
      getNode(ISD::SIGN_EXTEND, DL, VT, Op) :
@@ -925,13 +936,25 @@ SDValue SelectionDAG::getConstant(const ConstantInt &Val, EVT VT, bool isT) {
    assert(VT.isInteger() && "Cannot create FP integer constant!");
  
    EVT EltVT = VT.getScalarType();
-  assert(Val.getBitWidth() == EltVT.getSizeInBits() &&
-         "APInt size does not match type size!");
+  const ConstantInt *Elt = &Val;
+
+  // In some cases the vector type is legal but the element type is illegal and
+  // needs to be promoted, for example v8i8 on ARM.  In this case, promote the
+  // inserted value (the type does not need to match the vector element type).
+  // Any extra bits introduced will be truncated away.
+  if (VT.isVector() && TLI.getTypeAction(*getContext(), EltVT) ==
+      TargetLowering::TypePromoteInteger) {
+   EltVT = TLI.getTypeToTransformTo(*getContext(), EltVT);
+   APInt NewVal = Elt->getValue().zext(EltVT.getSizeInBits());
+   Elt = ConstantInt::get(*getContext(), NewVal);
+  }
  
+  assert(Elt->getBitWidth() == EltVT.getSizeInBits() &&
+         "APInt size does not match type size!");
    unsigned Opc = isT ? ISD::TargetConstant : ISD::Constant;
    FoldingSetNodeID ID;
    AddNodeIDNode(ID, Opc, getVTList(EltVT), 0, 0);
-  ID.AddPointer(&Val);
+  ID.AddPointer(Elt);
    void *IP = 0;
    SDNode *N = NULL;
    if ((N = CSEMap.FindNodeOrInsertPos(ID, IP)))
@@ -939,7 +962,7 @@ SDValue SelectionDAG::getConstant(const ConstantInt &Val, EVT VT, bool isT) {
        return SDValue(N, 0);
  
    if (!N) {
-    N = new (NodeAllocator) ConstantSDNode(isT, &Val, EltVT);
+    N = new (NodeAllocator) ConstantSDNode(isT, Elt, EltVT);
      CSEMap.InsertNode(N, IP);
      AllNodes.push_back(N);
    }
@@ -1131,7 +1154,7 @@ SDValue SelectionDAG::getConstantPool(MachineConstantPoolValue *C, EVT VT,
    AddNodeIDNode(ID, Opc, getVTList(VT), 0, 0);
    ID.AddInteger(Alignment);
    ID.AddInteger(Offset);
-  C->AddSelectionDAGCSEId(ID);
+  C->addSelectionDAGCSEId(ID);
    ID.AddInteger(TargetFlags);
    void *IP = 0;
    if (SDNode *E = CSEMap.FindNodeOrInsertPos(ID, IP))
@@ -1718,8 +1741,8 @@ void SelectionDAG::ComputeMaskedBits(SDValue Op, const APInt &Mask,
      // The boolean result conforms to getBooleanContents.  Fall through.
    case ISD::SETCC:
      // If we know the result of a setcc has the top bits zero, use this info.
-    if (TLI.getBooleanContents() == TargetLowering::ZeroOrOneBooleanContent &&
-        BitWidth > 1)
+    if (TLI.getBooleanContents(Op.getValueType().isVector()) ==
+        TargetLowering::ZeroOrOneBooleanContent && BitWidth > 1)
        KnownZero |= APInt::getHighBitsSet(BitWidth, BitWidth - 1);
      return;
    case ISD::SHL:
@@ -2153,7 +2176,7 @@ unsigned SelectionDAG::ComputeNumSignBits(SDValue Op, unsigned Depth) const{
      // The boolean result conforms to getBooleanContents.  Fall through.
    case ISD::SETCC:
      // If setcc returns 0/-1, all bits are sign bits.
-    if (TLI.getBooleanContents() ==
+    if (TLI.getBooleanContents(Op.getValueType().isVector()) ==
          TargetLowering::ZeroOrNegativeOneBooleanContent)
        return VTBits;
      break;
@@ -2777,6 +2800,7 @@ SDValue SelectionDAG::getNode(unsigned Opcode, DebugLoc DL, EVT VT,
              EVT.getVectorNumElements() == VT.getVectorNumElements()) &&
             "Vector element counts must match in FP_ROUND_INREG");
      assert(EVT.bitsLE(VT) && "Not rounding down!");
+    (void)EVT;
      if (cast<VTSDNode>(N2)->getVT() == VT) return N1;  // Not actually rounding.
      break;
    }
@@ -2884,6 +2908,7 @@ SDValue SelectionDAG::getNode(unsigned Opcode, DebugLoc DL, EVT VT,
      assert(N2C && (unsigned)N2C->getZExtValue() < 2 && "Bad EXTRACT_ELEMENT!");
      assert(!N1.getValueType().isVector() && !VT.isVector() &&
             (N1.getValueType().isInteger() == VT.isInteger()) &&
+           N1.getValueType() != VT &&
             "Wrong types for EXTRACT_ELEMENT!");
  
      // EXTRACT_ELEMENT of BUILD_PAIR is often formed while legalize is expanding
@@ -3320,7 +3345,7 @@ static bool isMemSrcFromString(SDValue Src, std::string &Str) {
  static bool FindOptimalMemOpLowering(std::vector<EVT> &MemOps,
                                       unsigned Limit, uint64_t Size,
                                       unsigned DstAlign, unsigned SrcAlign,
-                                     bool NonScalarIntSafe,
+                                     bool IsZeroVal,
                                       bool MemcpyStrSrc,
                                       SelectionDAG &DAG,
                                       const TargetLowering &TLI) {
@@ -3334,7 +3359,7 @@ static bool FindOptimalMemOpLowering(std::vector<EVT> &MemOps,
    // 'MemcpyStrSrc' indicates whether the memcpy source is constant so it does
    // not need to be loaded.
    EVT VT = TLI.getOptimalMemOpType(Size, DstAlign, SrcAlign,
-                                   NonScalarIntSafe, MemcpyStrSrc,
+                                   IsZeroVal, MemcpyStrSrc,
                                     DAG.getMachineFunction());
  
    if (VT == MVT::Other) {
@@ -3581,11 +3606,11 @@ static SDValue getMemsetStores(SelectionDAG &DAG, DebugLoc dl,
    FrameIndexSDNode *FI = dyn_cast<FrameIndexSDNode>(Dst);
    if (FI && !MFI->isFixedObjectIndex(FI->getIndex()))
      DstAlignCanChange = true;
-  bool NonScalarIntSafe =
+  bool IsZeroVal =
      isa<ConstantSDNode>(Src) && cast<ConstantSDNode>(Src)->isNullValue();
    if (!FindOptimalMemOpLowering(MemOps, TLI.getMaxStoresPerMemset(OptSize),
                                  Size, (DstAlignCanChange ? 0 : Align), 0,
-                                NonScalarIntSafe, false, DAG, TLI))
+                                IsZeroVal, false, DAG, TLI))
      return SDValue();
  
    if (DstAlignCanChange) {
@@ -3825,6 +3850,8 @@ SDValue SelectionDAG::getAtomic(unsigned Opcode, DebugLoc dl, EVT MemVT,
    unsigned Flags = MachineMemOperand::MOLoad | MachineMemOperand::MOStore;
  
    // For now, atomics are considered to be volatile always.
+  // FIXME: Volatile isn't really correct; we should keep track of atomic
+  // orderings in the memoperand.
    Flags |= MachineMemOperand::MOVolatile;
  
    MachineMemOperand *MMO =
@@ -3874,9 +3901,16 @@ SDValue SelectionDAG::getAtomic(unsigned Opcode, DebugLoc dl, EVT MemVT,
      Alignment = getEVTAlignment(MemVT);
  
    MachineFunction &MF = getMachineFunction();
-  unsigned Flags = MachineMemOperand::MOLoad | MachineMemOperand::MOStore;
+  // A monotonic store does not load; a release store "loads" in the sense
+  // that other stores cannot be sunk past it.
+  // (An atomicrmw obviously both loads and stores.)
+  unsigned Flags = MachineMemOperand::MOStore;
+  if (Opcode != ISD::ATOMIC_STORE || Ordering > Monotonic)
+    Flags |= MachineMemOperand::MOLoad;
  
    // For now, atomics are considered to be volatile always.
+  // FIXME: Volatile isn't really correct; we should keep track of atomic
+  // orderings in the memoperand.
    Flags |= MachineMemOperand::MOVolatile;
  
    MachineMemOperand *MMO =
@@ -3903,12 +3937,14 @@ SDValue SelectionDAG::getAtomic(unsigned Opcode, DebugLoc dl, EVT MemVT,
            Opcode == ISD::ATOMIC_LOAD_MAX ||
            Opcode == ISD::ATOMIC_LOAD_UMIN ||
            Opcode == ISD::ATOMIC_LOAD_UMAX ||
-          Opcode == ISD::ATOMIC_SWAP) &&
+          Opcode == ISD::ATOMIC_SWAP ||
+          Opcode == ISD::ATOMIC_STORE) &&
           "Invalid Atomic Op");
  
    EVT VT = Val.getValueType();
  
-  SDVTList VTs = getVTList(VT, MVT::Other);
+  SDVTList VTs = Opcode == ISD::ATOMIC_STORE ? getVTList(MVT::Other) :
+                                               getVTList(VT, MVT::Other);
    FoldingSetNodeID ID;
    ID.AddInteger(MemVT.getRawBits());
    SDValue Ops[] = {Chain, Ptr, Val};
@@ -3926,6 +3962,61 @@ SDValue SelectionDAG::getAtomic(unsigned Opcode, DebugLoc dl, EVT MemVT,
    return SDValue(N, 0);
  }
  
+SDValue SelectionDAG::getAtomic(unsigned Opcode, DebugLoc dl, EVT MemVT,
+                                EVT VT, SDValue Chain,
+                                SDValue Ptr,
+                                const Value* PtrVal,
+                                unsigned Alignment,
+                                AtomicOrdering Ordering,
+                                SynchronizationScope SynchScope) {
+  if (Alignment == 0)  // Ensure that codegen never sees alignment 0
+    Alignment = getEVTAlignment(MemVT);
+
+  MachineFunction &MF = getMachineFunction();
+  // A monotonic load does not store; an acquire load "stores" in the sense
+  // that other loads cannot be hoisted past it.
+  unsigned Flags = MachineMemOperand::MOLoad;
+  if (Ordering > Monotonic)
+    Flags |= MachineMemOperand::MOStore;
+
+  // For now, atomics are considered to be volatile always.
+  // FIXME: Volatile isn't really correct; we should keep track of atomic
+  // orderings in the memoperand.
+  Flags |= MachineMemOperand::MOVolatile;
+
+  MachineMemOperand *MMO =
+    MF.getMachineMemOperand(MachinePointerInfo(PtrVal), Flags,
+                            MemVT.getStoreSize(), Alignment);
+
+  return getAtomic(Opcode, dl, MemVT, VT, Chain, Ptr, MMO,
+                   Ordering, SynchScope);
+}
+
+SDValue SelectionDAG::getAtomic(unsigned Opcode, DebugLoc dl, EVT MemVT,
+                                EVT VT, SDValue Chain,
+                                SDValue Ptr,
+                                MachineMemOperand *MMO,
+                                AtomicOrdering Ordering,
+                                SynchronizationScope SynchScope) {
+  assert(Opcode == ISD::ATOMIC_LOAD && "Invalid Atomic Op");
+
+  SDVTList VTs = getVTList(VT, MVT::Other);
+  FoldingSetNodeID ID;
+  ID.AddInteger(MemVT.getRawBits());
+  SDValue Ops[] = {Chain, Ptr};
+  AddNodeIDNode(ID, Opcode, VTs, Ops, 2);
+  void* IP = 0;
+  if (SDNode *E = CSEMap.FindNodeOrInsertPos(ID, IP)) {
+    cast<AtomicSDNode>(E)->refineAlignment(MMO);
+    return SDValue(E, 0);
+  }
+  SDNode *N = new (NodeAllocator) AtomicSDNode(Opcode, dl, VTs, MemVT, Chain,
+                                               Ptr, MMO, Ordering, SynchScope);
+  CSEMap.InsertNode(N, IP);
+  AllNodes.push_back(N);
+  return SDValue(N, 0);
+}
+
  /// getMergeValues - Create a MERGE_VALUES node from the given operands.
  SDValue SelectionDAG::getMergeValues(const SDValue *Ops, unsigned NumOps,
                                       DebugLoc dl) {
@@ -5199,6 +5290,10 @@ void SelectionDAG::ReplaceAllUsesWith(SDValue FromN, SDValue To,
      // already exists there, recursively merge the results together.
      AddModifiedNodeToCSEMaps(User, &Listener);
    }
+
+  // If we just RAUW'd the root, take note.
+  if (FromN == getRoot())
+    setRoot(To);
  }
  
  /// ReplaceAllUsesWith - Modify anything using 'From' to use 'To' instead.
@@ -5244,6 +5339,10 @@ void SelectionDAG::ReplaceAllUsesWith(SDNode *From, SDNode *To,
      // already exists there, recursively merge the results together.
      AddModifiedNodeToCSEMaps(User, &Listener);
    }
+
+  // If we just RAUW'd the root, take note.
+  if (From == getRoot().getNode())
+    setRoot(SDValue(To, getRoot().getResNo()));
  }
  
  /// ReplaceAllUsesWith - Modify anything using 'From' to use 'To' instead.
@@ -5282,6 +5381,10 @@ void SelectionDAG::ReplaceAllUsesWith(SDNode *From,
      // already exists there, recursively merge the results together.
      AddModifiedNodeToCSEMaps(User, &Listener);
    }
+
+  // If we just RAUW'd the root, take note.
+  if (From == getRoot().getNode())
+    setRoot(SDValue(To[getRoot().getResNo()]));
  }
  
  /// ReplaceAllUsesOfValueWith - Replace any uses of From with To, leaving
@@ -5340,6 +5443,10 @@ void SelectionDAG::ReplaceAllUsesOfValueWith(SDValue From, SDValue To,
      // already exists there, recursively merge the results together.
      AddModifiedNodeToCSEMaps(User, &Listener);
    }
+
+  // If we just RAUW'd the root, take note.
+  if (From == getRoot())
+    setRoot(To);
  }
  
  namespace {
@@ -5794,6 +5901,8 @@ std::string SDNode::getOperationName(const SelectionDAG *G) const {
    case ISD::ATOMIC_LOAD_MAX:    return "AtomicLoadMax";
    case ISD::ATOMIC_LOAD_UMIN:   return "AtomicLoadUMin";
    case ISD::ATOMIC_LOAD_UMAX:   return "AtomicLoadUMax";
+  case ISD::ATOMIC_LOAD:        return "AtomicLoad";
+  case ISD::ATOMIC_STORE:       return "AtomicStore";
    case ISD::PCMARKER:      return "PCMarker";
    case ISD::READCYCLECOUNTER: return "ReadCycleCounter";
    case ISD::SRCVALUE:      return "SrcValue";
@@ -5909,8 +6018,8 @@ std::string SDNode::getOperationName(const SelectionDAG *G) const {
  
    case ISD::FPOWI:  return "fpowi";
    case ISD::SETCC:       return "setcc";
-  case ISD::VSETCC:      return "vsetcc";
    case ISD::SELECT:      return "select";
+  case ISD::VSELECT:     return "vselect";
    case ISD::SELECT_CC:   return "select_cc";
    case ISD::INSERT_VECTOR_ELT:   return "insert_vector_elt";
    case ISD::EXTRACT_VECTOR_ELT:  return "extract_vector_elt";
@@ -5998,7 +6107,8 @@ std::string SDNode::getOperationName(const SelectionDAG *G) const {
    case ISD::CTLZ:    return "ctlz";
  
    // Trampolines
-  case ISD::TRAMPOLINE: return "trampoline";
+  case ISD::INIT_TRAMPOLINE: return "init_trampoline";
+  case ISD::ADJUST_TRAMPOLINE: return "adjust_trampoline";
  
    case ISD::CONDCODE:
      switch (cast<CondCodeSDNode>(this)->get()) {
@@ -6258,8 +6368,7 @@ void SDNode::print(raw_ostream &OS, const SelectionDAG *G) const {
  
  static void printrWithDepthHelper(raw_ostream &OS, const SDNode *N,
                                    const SelectionDAG *G, unsigned depth,
-                                  unsigned indent)
-{
+                                  unsigned indent) {
    if (depth == 0)
      return;
  
@@ -6353,6 +6462,10 @@ SDValue SelectionDAG::UnrollVectorOp(SDNode *N, unsigned ResNE) {
        Scalars.push_back(getNode(N->getOpcode(), dl, EltVT,
                                  &Operands[0], Operands.size()));
        break;
+    case ISD::VSELECT:
+      Scalars.push_back(getNode(ISD::SELECT, dl, EltVT,
+                                &Operands[0], Operands.size()));
+      break;
      case ISD::SHL:
      case ISD::SRA:
      case ISD::SRL:
@@ -6440,6 +6553,8 @@ unsigned SelectionDAG::InferPtrAlignment(SDValue Ptr) const {
            Align = TD->getPreferredAlignment(GVar);
          }
        }
+      if (!Align)
+        Align = TLI.getTargetData()->getABITypeAlignment(GV->getType());
      }
      return MinAlign(Align, GVOffset);
    }
@@ -6494,7 +6609,7 @@ static void DumpNodesr(raw_ostream &OS, const SDNode *N, unsigned indent,
      return;
  
    // Dump the current SDNode, but don't end the line yet.
-  OS << std::string(indent, ' ');
+  OS.indent(indent);
    N->printr(OS, G);
  
    // Having printed this SDNode, walk the children: