[RS4GC] Unify two asserts. NFC.

[oota-llvm.git] / lib / Transforms / Scalar / RewriteStatepointsForGC.cpp
diff --git a/lib/Transforms/Scalar/RewriteStatepointsForGC.cpp b/lib/Transforms/Scalar/RewriteStatepointsForGC.cpp

index a9dc8d8eec079f9606af494a15dc565ffbcc2652..277ac8bea5c128c230a5a87ed64926dda2cc8aa9 100644 (file)
--- a/lib/Transforms/Scalar/RewriteStatepointsForGC.cpp
+++ b/lib/Transforms/Scalar/RewriteStatepointsForGC.cpp
@@ -78,6 +78,13 @@ static cl::opt<bool>
      AllowStatepointWithNoDeoptInfo("rs4gc-allow-statepoint-with-no-deopt-info",
                                     cl::Hidden, cl::init(true));
  
+/// Should we split vectors of pointers into their individual elements?  This
+/// is known to be buggy, but the alternate implementation isn't yet ready.
+/// This is purely to provide a debugging and dianostic hook until the vector
+/// split is replaced with vector relocations.
+static cl::opt<bool> UseVectorSplit("rs4gc-split-vector-values", cl::Hidden,
+                                    cl::init(true));
+
  namespace {
  struct RewriteStatepointsForGC : public ModulePass {
    static char ID; // Pass identification, replacement for typeid
@@ -357,10 +364,6 @@ static BaseDefiningValueResult findBaseDefiningValue(Value *I);
  /// particular element in 'I'.  
  static BaseDefiningValueResult
  findBaseDefiningValueOfVector(Value *I) {
-  assert(I->getType()->isVectorTy() &&
-         cast<VectorType>(I->getType())->getElementType()->isPointerTy() &&
-         "Illegal to ask for the base pointer of a non-pointer type");
-
    // Each case parallels findBaseDefiningValue below, see that code for
    // detailed motivation.
  
@@ -417,41 +420,26 @@ findBaseDefiningValueOfVector(Value *I) {
  /// (i.e. a PHI or Select of two derived pointers), or c) involves a change
  /// from pointer to vector type or back.
  static BaseDefiningValueResult findBaseDefiningValue(Value *I) {
+  assert(I->getType()->isPtrOrPtrVectorTy() &&
+         "Illegal to ask for the base pointer of a non-pointer type");
+
    if (I->getType()->isVectorTy())
      return findBaseDefiningValueOfVector(I);
-  
-  assert(I->getType()->isPointerTy() &&
-         "Illegal to ask for the base pointer of a non-pointer type");
  
    if (isa<Argument>(I))
      // An incoming argument to the function is a base pointer
      // We should have never reached here if this argument isn't an gc value
      return BaseDefiningValueResult(I, true);
  
-  if (isa<GlobalVariable>(I))
-    // base case
+  if (isa<Constant>(I))
+    // We assume that objects with a constant base (e.g. a global) can't move
+    // and don't need to be reported to the collector because they are always
+    // live.  All constants have constant bases.  Besides global references, all
+    // kinds of constants (e.g. undef, constant expressions, null pointers) can
+    // be introduced by the inliner or the optimizer, especially on dynamically
+    // dead paths.  See e.g. test4 in constants.ll.
      return BaseDefiningValueResult(I, true);
  
-  // inlining could possibly introduce phi node that contains
-  // undef if callee has multiple returns
-  if (isa<UndefValue>(I))
-    // utterly meaningless, but useful for dealing with
-    // partially optimized code.
-    return BaseDefiningValueResult(I, true);
-
-  // Due to inheritance, this must be _after_ the global variable and undef
-  // checks
-  if (isa<Constant>(I)) {
-    assert(!isa<GlobalVariable>(I) && !isa<UndefValue>(I) &&
-           "order of checks wrong!");
-    // Note: Even for frontends which don't have constant references, we can
-    // see constants appearing after optimizations.  A simple example is
-    // specialization of an address computation on null feeding into a merge
-    // point where the actual use of the now-constant input is protected by
-    // another null check.  (e.g. test4 in constants.ll)
-    return BaseDefiningValueResult(I, true);
-  }
-
    if (CastInst *CI = dyn_cast<CastInst>(I)) {
      Value *Def = CI->stripPointerCasts();
      // If stripping pointer casts changes the address space there is an
@@ -1140,7 +1128,7 @@ static Value *findBasePointer(Value *I, DefiningValueMapTy &cache) {
      }
      cache[BDV] = base;
    }
-  assert(cache.find(def) != cache.end());
+  assert(cache.count(def));
    return cache[def];
  }
  
@@ -1325,18 +1313,29 @@ static void CreateGCRelocates(ArrayRef<Value *> LiveVariables,
      assert(Index < LiveVec.size() && "Bug in std::find?");
      return Index;
    };
-
-  // All gc_relocate are set to i8 addrspace(1)* type. We originally generated
-  // unique declarations for each pointer type, but this proved problematic
-  // because the intrinsic mangling code is incomplete and fragile.  Since
-  // we're moving towards a single unified pointer type anyways, we can just
-  // cast everything to an i8* of the right address space.  A bitcast is added
-  // later to convert gc_relocate to the actual value's type. 
    Module *M = StatepointToken->getModule();
-  auto AS = cast<PointerType>(LiveVariables[0]->getType())->getAddressSpace();
-  Type *Types[] = {Type::getInt8PtrTy(M->getContext(), AS)};
-  Value *GCRelocateDecl =
-    Intrinsic::getDeclaration(M, Intrinsic::experimental_gc_relocate, Types);
+  
+  // All gc_relocate are generated as i8 addrspace(1)* (or a vector type whose
+  // element type is i8 addrspace(1)*). We originally generated unique
+  // declarations for each pointer type, but this proved problematic because
+  // the intrinsic mangling code is incomplete and fragile.  Since we're moving
+  // towards a single unified pointer type anyways, we can just cast everything
+  // to an i8* of the right address space.  A bitcast is added later to convert
+  // gc_relocate to the actual value's type.  
+  auto getGCRelocateDecl = [&] (Type *Ty) {
+    assert(isHandledGCPointerType(Ty));
+    auto AS = Ty->getScalarType()->getPointerAddressSpace();
+    Type *NewTy = Type::getInt8PtrTy(M->getContext(), AS);
+    if (auto *VT = dyn_cast<VectorType>(Ty))
+      NewTy = VectorType::get(NewTy, VT->getNumElements());
+    return Intrinsic::getDeclaration(M, Intrinsic::experimental_gc_relocate,
+                                     {NewTy});
+  };
+
+  // Lazily populated map from input types to the canonicalized form mentioned
+  // in the comment above.  This should probably be cached somewhere more
+  // broadly.
+  DenseMap<Type*, Value*> TypeToDeclMap;
  
    for (unsigned i = 0; i < LiveVariables.size(); i++) {
      // Generate the gc.relocate call and save the result
@@ -1344,6 +1343,11 @@ static void CreateGCRelocates(ArrayRef<Value *> LiveVariables,
        Builder.getInt32(LiveStart + FindIndex(LiveVariables, BasePtrs[i]));
      Value *LiveIdx = Builder.getInt32(LiveStart + i);
  
+    Type *Ty = LiveVariables[i]->getType();
+    if (!TypeToDeclMap.count(Ty))
+      TypeToDeclMap[Ty] = getGCRelocateDecl(Ty);
+    Value *GCRelocateDecl = TypeToDeclMap[Ty];
+
      // only specify a debug name if we can give a useful one
      CallInst *Reloc = Builder.CreateCall(
          GCRelocateDecl, {StatepointToken, BaseIdx, LiveIdx},
@@ -1642,33 +1646,24 @@ insertRelocationStores(iterator_range<Value::user_iterator> GCRelocs,
                         DenseSet<Value *> &VisitedLiveValues) {
  
    for (User *U : GCRelocs) {
-    if (!isa<IntrinsicInst>(U))
-      continue;
-
-    IntrinsicInst *RelocatedValue = cast<IntrinsicInst>(U);
-
-    // We only care about relocates
-    if (RelocatedValue->getIntrinsicID() !=
-        Intrinsic::experimental_gc_relocate) {
+    GCRelocateInst *Relocate = dyn_cast<GCRelocateInst>(U);
+    if (!Relocate)
        continue;
-    }
  
-    GCRelocateOperands RelocateOperands(RelocatedValue);
-    Value *OriginalValue =
-        const_cast<Value *>(RelocateOperands.getDerivedPtr());
+    Value *OriginalValue = const_cast<Value *>(Relocate->getDerivedPtr());
      assert(AllocaMap.count(OriginalValue));
      Value *Alloca = AllocaMap[OriginalValue];
  
      // Emit store into the related alloca
      // All gc_relocates are i8 addrspace(1)* typed, and it must be bitcasted to
      // the correct type according to alloca.
-    assert(RelocatedValue->getNextNode() &&
+    assert(Relocate->getNextNode() &&
             "Should always have one since it's not a terminator");
-    IRBuilder<> Builder(RelocatedValue->getNextNode());
+    IRBuilder<> Builder(Relocate->getNextNode());
      Value *CastedRelocatedValue =
-      Builder.CreateBitCast(RelocatedValue,
+      Builder.CreateBitCast(Relocate,
                              cast<AllocaInst>(Alloca)->getAllocatedType(),
-                            suffixed_name_or(RelocatedValue, ".casted", ""));
+                            suffixed_name_or(Relocate, ".casted", ""));
  
      StoreInst *Store = new StoreInst(CastedRelocatedValue, Alloca);
      Store->insertAfter(cast<Instruction>(CastedRelocatedValue));
@@ -2404,15 +2399,19 @@ static bool insertParsePoints(Function &F, DominatorTree &DT,
  
    // Do a limited scalarization of any live at safepoint vector values which
    // contain pointers.  This enables this pass to run after vectorization at
-  // the cost of some possible performance loss.  TODO: it would be nice to
-  // natively support vectors all the way through the backend so we don't need
-  // to scalarize here.
-  for (size_t i = 0; i < Records.size(); i++) {
-    PartiallyConstructedSafepointRecord &Info = Records[i];
-    Instruction *Statepoint = ToUpdate[i].getInstruction();
-    splitVectorValues(cast<Instruction>(Statepoint), Info.LiveSet,
-                      Info.PointerToBase, DT);
-  }
+  // the cost of some possible performance loss.  Note: This is known to not
+  // handle updating of the side tables correctly which can lead to relocation
+  // bugs when the same vector is live at multiple statepoints.  We're in the
+  // process of implementing the alternate lowering - relocating the
+  // vector-of-pointers as first class item and updating the backend to
+  // understand that - but that's not yet complete.  
+  if (UseVectorSplit)
+    for (size_t i = 0; i < Records.size(); i++) {
+      PartiallyConstructedSafepointRecord &Info = Records[i];
+      Instruction *Statepoint = ToUpdate[i].getInstruction();
+      splitVectorValues(cast<Instruction>(Statepoint), Info.LiveSet,
+                        Info.PointerToBase, DT);
+    }
  
    // In order to reduce live set of statepoint we might choose to rematerialize
    // some values instead of relocating them. This is purely an optimization and
@@ -2491,7 +2490,8 @@ static bool insertParsePoints(Function &F, DominatorTree &DT,
  #ifndef NDEBUG
    // sanity check
    for (auto *Ptr : Live)
-    assert(isGCPointerType(Ptr->getType()) && "must be a gc pointer type");
+    assert(isHandledGCPointerType(Ptr->getType()) &&
+           "must be a gc pointer type");
  #endif
  
    relocationViaAlloca(F, DT, Live, Records);
@@ -2571,7 +2571,7 @@ void RewriteStatepointsForGC::stripNonValidAttributesFromBody(Function &F) {
  static bool shouldRewriteStatepointsIn(Function &F) {
    // TODO: This should check the GCStrategy
    if (F.hasGC()) {
-    const char *FunctionGCName = F.getGC();
+    const auto &FunctionGCName = F.getGC();
      const StringRef StatepointExampleName("statepoint-example");
      const StringRef CoreCLRName("coreclr");
      return (StatepointExampleName == FunctionGCName) ||