DebugInfo: partially revert cleanup committed in r209680

[oota-llvm.git] / lib / CodeGen / Analysis.cpp
diff --git a/lib/CodeGen/Analysis.cpp b/lib/CodeGen/Analysis.cpp

index ca08b5b6e0d52e16aef2caa1f33e6ac10eed0f78..6fc83a26a0d2441b0c31203214fdeaf29ae74e56 100644 (file)
--- a/lib/CodeGen/Analysis.cpp
+++ b/lib/CodeGen/Analysis.cpp
@@ -46,7 +46,7 @@ unsigned llvm::ComputeLinearIndex(Type *Ty,
          EI != EE; ++EI) {
        if (Indices && *Indices == unsigned(EI - EB))
          return ComputeLinearIndex(*EI, Indices+1, IndicesEnd, CurIndex);
-      CurIndex = ComputeLinearIndex(*EI, 0, 0, CurIndex);
+      CurIndex = ComputeLinearIndex(*EI, nullptr, nullptr, CurIndex);
      }
      return CurIndex;
    }
@@ -56,7 +56,7 @@ unsigned llvm::ComputeLinearIndex(Type *Ty,
      for (unsigned i = 0, e = ATy->getNumElements(); i != e; ++i) {
        if (Indices && *Indices == i)
          return ComputeLinearIndex(EltTy, Indices+1, IndicesEnd, CurIndex);
-      CurIndex = ComputeLinearIndex(EltTy, 0, 0, CurIndex);
+      CurIndex = ComputeLinearIndex(EltTy, nullptr, nullptr, CurIndex);
      }
      return CurIndex;
    }
@@ -228,7 +228,7 @@ static const Value *getNoopInput(const Value *V,
      // through.
      const Instruction *I = dyn_cast<Instruction>(V);
      if (!I || I->getNumOperands() == 0) return V;
-    const Value *NoopInput = 0;
+    const Value *NoopInput = nullptr;
  
      Value *Op = I->getOperand(0);
      if (isa<BitCastInst>(I)) {
@@ -320,6 +320,7 @@ static const Value *getNoopInput(const Value *V,
  static bool slotOnlyDiscardsData(const Value *RetVal, const Value *CallVal,
                                   SmallVectorImpl<unsigned> &RetIndices,
                                   SmallVectorImpl<unsigned> &CallIndices,
+                                 bool AllowDifferingSizes,
                                   const TargetLoweringBase &TLI) {
  
    // Trace the sub-value needed by the return value as far back up the graph as
@@ -350,7 +351,8 @@ static bool slotOnlyDiscardsData(const Value *RetVal, const Value *CallVal,
    // all the bits that are needed by the "ret" have been provided by the "tail
    // call". FIXME: with sufficiently cunning bit-tracking, we could look through
    // extensions too.
-  if (BitsProvided < BitsRequired)
+  if (BitsProvided < BitsRequired ||
+      (!AllowDifferingSizes && BitsProvided != BitsRequired))
      return false;
  
    return true;
@@ -382,9 +384,8 @@ static bool indexReallyValid(CompositeType *T, unsigned Idx) {
  /// function again on a finished iterator will repeatedly return
  /// false. SubTypes.back()->getTypeAtIndex(Path.back()) is either an empty
  /// aggregate or a non-aggregate.
-static bool
-advanceToNextLeafType(SmallVectorImpl<CompositeType *> &SubTypes,
-                     SmallVectorImpl<unsigned> &Path) {
+static bool advanceToNextLeafType(SmallVectorImpl<CompositeType *> &SubTypes,
+                                  SmallVectorImpl<unsigned> &Path) {
    // First march back up the tree until we can successfully increment one of the
    // coordinates in Path.
    while (!Path.empty() && !indexReallyValid(SubTypes.back(), Path.back() + 1)) {
@@ -454,8 +455,8 @@ static bool firstRealType(Type *Next,
  
  /// Set the iterator data-structures to the next non-empty, non-aggregate
  /// subtype.
-bool nextRealType(SmallVectorImpl<CompositeType *> &SubTypes,
-                  SmallVectorImpl<unsigned> &Path) {
+static bool nextRealType(SmallVectorImpl<CompositeType *> &SubTypes,
+                         SmallVectorImpl<unsigned> &Path) {
    do {
      if (!advanceToNextLeafType(SubTypes, Path))
        return false;
@@ -497,8 +498,7 @@ bool llvm::isInTailCallPosition(ImmutableCallSite CS,
    // chain interposes between I and the return.
    if (I->mayHaveSideEffects() || I->mayReadFromMemory() ||
        !isSafeToSpeculativelyExecute(I))
-    for (BasicBlock::const_iterator BBI = prior(prior(ExitBB->end())); ;
-         --BBI) {
+    for (BasicBlock::const_iterator BBI = std::prev(ExitBB->end(), 2);; --BBI) {
        if (&*BBI == I)
          break;
        // Debug info intrinsics do not get in the way of tail call optimization.
@@ -509,6 +509,13 @@ bool llvm::isInTailCallPosition(ImmutableCallSite CS,
          return false;
      }
  
+  return returnTypeIsEligibleForTailCall(ExitBB->getParent(), I, Ret, TLI);
+}
+
+bool llvm::returnTypeIsEligibleForTailCall(const Function *F,
+                                           const Instruction *I,
+                                           const ReturnInst *Ret,
+                                           const TargetLoweringBase &TLI) {
    // If the block ends with a void return or unreachable, it doesn't matter
    // what the call's return type is.
    if (!Ret || Ret->getNumOperands() == 0) return true;
@@ -517,19 +524,38 @@ bool llvm::isInTailCallPosition(ImmutableCallSite CS,
    // return type is.
    if (isa<UndefValue>(Ret->getOperand(0))) return true;
  
-  // Conservatively require the attributes of the call to match those of
-  // the return. Ignore noalias because it doesn't affect the call sequence.
-  const Function *F = ExitBB->getParent();
-  AttributeSet CallerAttrs = F->getAttributes();
-  if (AttrBuilder(CallerAttrs, AttributeSet::ReturnIndex).
-        removeAttribute(Attribute::NoAlias) !=
-      AttrBuilder(CallerAttrs, AttributeSet::ReturnIndex).
-        removeAttribute(Attribute::NoAlias))
-    return false;
+  // Make sure the attributes attached to each return are compatible.
+  AttrBuilder CallerAttrs(F->getAttributes(),
+                          AttributeSet::ReturnIndex);
+  AttrBuilder CalleeAttrs(cast<CallInst>(I)->getAttributes(),
+                          AttributeSet::ReturnIndex);
+
+  // Noalias is completely benign as far as calling convention goes, so it
+  // shouldn't affect whether the call is a tail call.
+  CallerAttrs = CallerAttrs.removeAttribute(Attribute::NoAlias);
+  CalleeAttrs = CalleeAttrs.removeAttribute(Attribute::NoAlias);
+
+  bool AllowDifferingSizes = true;
+  if (CallerAttrs.contains(Attribute::ZExt)) {
+    if (!CalleeAttrs.contains(Attribute::ZExt))
+      return false;
+
+    AllowDifferingSizes = false;
+    CallerAttrs.removeAttribute(Attribute::ZExt);
+    CalleeAttrs.removeAttribute(Attribute::ZExt);
+  } else if (CallerAttrs.contains(Attribute::SExt)) {
+    if (!CalleeAttrs.contains(Attribute::SExt))
+      return false;
+
+    AllowDifferingSizes = false;
+    CallerAttrs.removeAttribute(Attribute::SExt);
+    CalleeAttrs.removeAttribute(Attribute::SExt);
+  }
  
-  // It's not safe to eliminate the sign / zero extension of the return value.
-  if (CallerAttrs.hasAttribute(AttributeSet::ReturnIndex, Attribute::ZExt) ||
-      CallerAttrs.hasAttribute(AttributeSet::ReturnIndex, Attribute::SExt))
+  // If they're still different, there's some facet we don't understand
+  // (currently only "inreg", but in future who knows). It may be OK but the
+  // only safe option is to reject the tail call.
+  if (CallerAttrs != CalleeAttrs)
      return false;
  
    const Value *RetVal = Ret->getOperand(0), *CallVal = I;
@@ -571,7 +597,8 @@ bool llvm::isInTailCallPosition(ImmutableCallSite CS,
  
      // Finally, we can check whether the value produced by the tail call at this
      // index is compatible with the value we return.
-    if (!slotOnlyDiscardsData(RetVal, CallVal, TmpRetPath, TmpCallPath, TLI))
+    if (!slotOnlyDiscardsData(RetVal, CallVal, TmpRetPath, TmpCallPath,
+                              AllowDifferingSizes, TLI))
        return false;
  
      CallEmpty  = !nextRealType(CallSubTypes, CallPath);