uint32_t lookup(Value *V) const;
uint32_t lookup_or_add_cmp(unsigned Opcode, CmpInst::Predicate Pred,
Value *LHS, Value *RHS);
+ bool exists(Value *V) const;
void add(Value *V, uint32_t num);
void clear();
void erase(Value *v);
};
}
+/// Returns true if a value number exists for the specified value.
+bool ValueTable::exists(Value *V) const { return valueNumbering.count(V) != 0; }
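+// (exists() lets callers guard lookup(), which asserts when a value has not
+// been numbered yet; the performScalarPRE change below uses exactly this
+// guard for operands that may belong to newly created instructions.)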
+
/// lookup_or_add - Returns the value number for the specified value, assigning
/// it a new number if it did not have one before.
uint32_t ValueTable::lookup_or_add(Value *V) {
DominatorTree &getDominatorTree() const { return *DT; }
AliasAnalysis *getAliasAnalysis() const { return VN.getAliasAnalysis(); }
MemoryDependenceAnalysis &getMemDep() const { return *MD; }
-
- // Assign VNs for instructions newly created during GVN optimization.
- void addNewInstruction(Value *Val) {
- if (Instruction *I = dyn_cast<Instruction>(Val)) {
- unsigned Num = VN.lookup_or_add(I);
- addToLeaderTable(Num, I, I->getParent());
- }
- }
-
private:
/// Push a new Value onto the LeaderTable's list for its value number.
void addToLeaderTable(uint32_t N, Value *V, const BasicBlock *BB) {
/// before we give up.
static Value *GetStoreValueForLoad(Value *SrcVal, unsigned Offset,
Type *LoadTy,
- Instruction *InsertPt, const DataLayout &DL,
- GVN &gvn){
+                                   Instruction *InsertPt, const DataLayout &DL) {
LLVMContext &Ctx = SrcVal->getType()->getContext();
uint64_t StoreSize = (DL.getTypeSizeInBits(SrcVal->getType()) + 7) / 8;
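+ // (The +7 rounds the bit size up to whole bytes, e.g. an i17 store
+ // occupies (17+7)/8 = 3 bytes.)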
// Compute which bits of the stored value are being used by the load. Convert
// to an integer type to start with.
- if (SrcVal->getType()->getScalarType()->isPointerTy()) {
+ if (SrcVal->getType()->getScalarType()->isPointerTy())
SrcVal = Builder.CreatePtrToInt(SrcVal,
DL.getIntPtrType(SrcVal->getType()));
- gvn.addNewInstruction(SrcVal);
- }
- if (!SrcVal->getType()->isIntegerTy()) {
+ if (!SrcVal->getType()->isIntegerTy())
SrcVal = Builder.CreateBitCast(SrcVal, IntegerType::get(Ctx, StoreSize*8));
- gvn.addNewInstruction(SrcVal);
- }
// Shift the bits to the least significant depending on endianness.
unsigned ShiftAmt;
if (DL.isLittleEndian())
ShiftAmt = Offset*8;
else
ShiftAmt = (StoreSize-LoadSize-Offset)*8;
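+ // (E.g. a 1-byte load at Offset 1 out of a 4-byte store shifts by
+ // 1*8 = 8 bits on little-endian, but by (4-1-1)*8 = 16 on big-endian.)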
- if (ShiftAmt) {
+ if (ShiftAmt)
SrcVal = Builder.CreateLShr(SrcVal, ShiftAmt);
- gvn.addNewInstruction(SrcVal);
- }
- if (LoadSize != StoreSize) {
+ if (LoadSize != StoreSize)
SrcVal = Builder.CreateTrunc(SrcVal, IntegerType::get(Ctx, LoadSize*8));
- gvn.addNewInstruction(SrcVal);
- }
return CoerceAvailableValueToLoadType(SrcVal, LoadTy, Builder, DL);
}
PtrVal->getType()->getPointerAddressSpace());
Builder.SetCurrentDebugLocation(SrcVal->getDebugLoc());
PtrVal = Builder.CreateBitCast(PtrVal, DestPTy);
- gvn.addNewInstruction(PtrVal);
LoadInst *NewLoad = Builder.CreateLoad(PtrVal);
NewLoad->takeName(SrcVal);
NewLoad->setAlignment(SrcVal->getAlignment());
// Replace uses of the original load with the wider load. On a big endian
// system, we need to shift down to get the relevant bits.
Value *RV = NewLoad;
- if (DL.isBigEndian()) {
+ if (DL.isBigEndian())
RV = Builder.CreateLShr(RV,
NewLoadSize*8-SrcVal->getType()->getPrimitiveSizeInBits());
- gvn.addNewInstruction(RV);
- }
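+ // (E.g. after widening an i8 load to i32 on big-endian, the original byte
+ // sits in the top 8 bits, hence the shift right by 32-8 = 24 before the
+ // truncate below.)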
RV = Builder.CreateTrunc(RV, SrcVal->getType());
- gvn.addNewInstruction(RV);
SrcVal->replaceAllUsesWith(RV);
// We would like to use gvn.markInstructionForDeletion here, but we can't
SrcVal = NewLoad;
}
- return GetStoreValueForLoad(SrcVal, Offset, LoadTy, InsertPt, DL, gvn);
+ return GetStoreValueForLoad(SrcVal, Offset, LoadTy, InsertPt, DL);
}
/// memdep query of a load that ends up being a clobbering mem intrinsic.
static Value *GetMemInstValueForLoad(MemIntrinsic *SrcInst, unsigned Offset,
Type *LoadTy, Instruction *InsertPt,
- const DataLayout &DL, GVN &gvn){
+                                     const DataLayout &DL) {
LLVMContext &Ctx = LoadTy->getContext();
uint64_t LoadSize = DL.getTypeSizeInBits(LoadTy)/8;
// memset(P, 'x', 1234) -> splat('x'), even if x is a variable, and
// independently of what the offset is.
Value *Val = MSI->getValue();
- if (LoadSize != 1) {
+ if (LoadSize != 1)
Val = Builder.CreateZExt(Val, IntegerType::get(Ctx, LoadSize*8));
- gvn.addNewInstruction(Val);
- }
Value *OneElt = Val;
// If we can double the number of bytes set, do it.
if (NumBytesSet*2 <= LoadSize) {
Value *ShVal = Builder.CreateShl(Val, NumBytesSet*8);
- gvn.addNewInstruction(ShVal);
Val = Builder.CreateOr(Val, ShVal);
- gvn.addNewInstruction(Val);
NumBytesSet <<= 1;
continue;
}
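+ // (E.g. splatting 0xAB: 0xAB -> 0xABAB -> 0xABABABAB, so the pattern is
+ // built in O(log LoadSize) steps rather than one byte at a time.)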
// Otherwise insert one byte at a time.
Value *ShVal = Builder.CreateShl(Val, 1*8);
- gvn.addNewInstruction(ShVal);
Val = Builder.CreateOr(OneElt, ShVal);
- gvn.addNewInstruction(Val);
++NumBytesSet;
}
SSAUpdater SSAUpdate(&NewPHIs);
SSAUpdate.Initialize(LI->getType(), LI->getName());
- for (unsigned i = 0, e = ValuesPerBlock.size(); i != e; ++i) {
- const AvailableValueInBlock &AV = ValuesPerBlock[i];
+ for (const AvailableValueInBlock &AV : ValuesPerBlock) {
BasicBlock *BB = AV.BB;
if (SSAUpdate.HasValueForBlock(BB))
if (isSimpleValue()) {
Res = getSimpleValue();
if (Res->getType() != LoadTy) {
- Res = GetStoreValueForLoad(Res, Offset, LoadTy, BB->getTerminator(), DL, gvn);
+ Res = GetStoreValueForLoad(Res, Offset, LoadTy, BB->getTerminator(), DL);
DEBUG(dbgs() << "GVN COERCED NONLOCAL VAL:\nOffset: " << Offset << " "
<< *getSimpleValue() << '\n'
}
} else if (isMemIntrinValue()) {
Res = GetMemInstValueForLoad(getMemIntrinValue(), Offset, LoadTy,
- BB->getTerminator(), DL, gvn);
+ BB->getTerminator(), DL);
DEBUG(dbgs() << "GVN COERCED NONLOCAL MEM INTRIN:\nOffset: " << Offset
<< " " << *getMemIntrinValue() << '\n'
<< *Res << '\n' << "\n\n\n");
// that we only have to insert *one* load (which means we're basically moving
// the load, not inserting a new one).
- SmallPtrSet<BasicBlock *, 4> Blockers;
- for (unsigned i = 0, e = UnavailableBlocks.size(); i != e; ++i)
- Blockers.insert(UnavailableBlocks[i]);
+ SmallPtrSet<BasicBlock *, 4> Blockers(UnavailableBlocks.begin(),
+ UnavailableBlocks.end());
// Let's find the first basic block with more than one predecessor. Walk
// backwards through predecessors if needed.
// available.
MapVector<BasicBlock *, Value *> PredLoads;
DenseMap<BasicBlock*, char> FullyAvailableBlocks;
- for (unsigned i = 0, e = ValuesPerBlock.size(); i != e; ++i)
- FullyAvailableBlocks[ValuesPerBlock[i].BB] = true;
- for (unsigned i = 0, e = UnavailableBlocks.size(); i != e; ++i)
- FullyAvailableBlocks[UnavailableBlocks[i]] = false;
+ for (const AvailableValueInBlock &AV : ValuesPerBlock)
+ FullyAvailableBlocks[AV.BB] = true;
+ for (BasicBlock *UnavailableBB : UnavailableBlocks)
+ FullyAvailableBlocks[UnavailableBB] = false;
SmallVector<BasicBlock *, 4> CriticalEdgePred;
- for (pred_iterator PI = pred_begin(LoadBB), E = pred_end(LoadBB);
- PI != E; ++PI) {
- BasicBlock *Pred = *PI;
+ for (BasicBlock *Pred : predecessors(LoadBB)) {
+ // If any predecessor block is an EH pad that does not allow non-PHI
+ // instructions before the terminator, we can't PRE the load.
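+    // (A catchswitch, for instance, both terminates its block and is an EH
+    // pad, leaving no insertion point for a speculated load.)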
+ if (Pred->getTerminator()->isEHPad()) {
+ DEBUG(dbgs()
+ << "COULD NOT PRE LOAD BECAUSE OF AN EH PAD PREDECESSOR '"
+ << Pred->getName() << "': " << *LI << '\n');
+ return false;
+ }
+
if (IsValueFullyAvailableInBlock(Pred, FullyAvailableBlocks, 0)) {
continue;
}
<< *NewInsts.back() << '\n');
// Assign value numbers to the new instructions.
- for (unsigned i = 0, e = NewInsts.size(); i != e; ++i) {
+ for (Instruction *I : NewInsts) {
// FIXME: We really _ought_ to insert these value numbers into their
// parent's availability map. However, in doing so, we risk getting into
// ordering issues. If a block hasn't been processed yet, we would be
// marking a value as AVAIL-IN, which isn't what we intend.
- VN.lookup_or_add(NewInsts[i]);
+ VN.lookup_or_add(I);
}
for (const auto &PredLoad : PredLoads) {
if (Tags)
NewLoad->setAAMetadata(Tags);
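+ // Carry over load metadata that should remain valid on the moved load: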
+ if (auto *MD = LI->getMetadata(LLVMContext::MD_invariant_load))
+ NewLoad->setMetadata(LLVMContext::MD_invariant_load, MD);
if (auto *InvGroupMD = LI->getMetadata(LLVMContext::MD_invariant_group))
NewLoad->setMetadata(LLVMContext::MD_invariant_group, InvGroupMD);
/// Attempt to eliminate a load whose dependencies are
/// non-local by performing PHI construction.
bool GVN::processNonLocalLoad(LoadInst *LI) {
+ // Non-local speculations are not allowed under asan: they can introduce
+ // loads on paths where the original program performed no memory access.
+ if (LI->getParent()->getParent()->hasFnAttribute(Attribute::SanitizeAddress))
+ return false;
+
// Step 1: Find the non-local dependencies of the load.
LoadDepVect Deps;
MD->getNonLocalPointerDependency(LI, Deps);
L->getType(), L->getPointerOperand(), DepSI);
if (Offset != -1)
AvailVal = GetStoreValueForLoad(DepSI->getValueOperand(), Offset,
- L->getType(), L, DL, *this);
+ L->getType(), L, DL);
}
// Check to see if we have something like this:
int Offset = AnalyzeLoadFromClobberingMemInst(
L->getType(), L->getPointerOperand(), DepMI, DL);
if (Offset != -1)
- AvailVal = GetMemInstValueForLoad(DepMI, Offset, L->getType(), L, DL, *this);
+ AvailVal = GetMemInstValueForLoad(DepMI, Offset, L->getType(), L, DL);
}
if (AvailVal) {
Value *Op = Instr->getOperand(i);
if (isa<Argument>(Op) || isa<Constant>(Op) || isa<GlobalValue>(Op))
continue;
-
+ // This could be a newly inserted instruction, in which case, we won't
+ // find a value number, and should give up before we hurt ourselves.
+ // FIXME: Rewrite the infrastructure to make it easier to value number
+ // and process newly inserted instructions.
+ if (!VN.exists(Op)) {
+ success = false;
+ break;
+ }
if (Value *V = findLeader(Pred, VN.lookup(Op))) {
Instr->setOperand(i, V);
} else {
BasicBlock *CurrentBlock = CurInst->getParent();
predMap.clear();
- for (pred_iterator PI = pred_begin(CurrentBlock), PE = pred_end(CurrentBlock);
- PI != PE; ++PI) {
- BasicBlock *P = *PI;
+ for (BasicBlock *P : predecessors(CurrentBlock)) {
// We're not interested in PRE where the block is its
// own predecessor, or in blocks with predecessors
// that are not reachable.
BE = CurrentBlock->end();
BI != BE;) {
Instruction *CurInst = &*BI++;
- Changed = performScalarPRE(CurInst);
+ Changed |= performScalarPRE(CurInst);
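+      // (Accumulate with |= so an iteration that makes no change does not
+      // clear a Changed flag set earlier in the loop.)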
}
}
DeadBlocks.insert(Dom.begin(), Dom.end());
// Figure out the dominance frontier of D.
- for (SmallVectorImpl<BasicBlock *>::iterator I = Dom.begin(),
- E = Dom.end(); I != E; I++) {
- BasicBlock *B = *I;
- for (succ_iterator SI = succ_begin(B), SE = succ_end(B); SI != SE; SI++) {
- BasicBlock *S = *SI;
+ for (BasicBlock *B : Dom) {
+ for (BasicBlock *S : successors(B)) {
if (DeadBlocks.count(S))
continue;
bool AllPredDead = true;
- for (pred_iterator PI = pred_begin(S), PE = pred_end(S); PI != PE; PI++)
- if (!DeadBlocks.count(*PI)) {
+ for (BasicBlock *P : predecessors(S))
+ if (!DeadBlocks.count(P)) {
AllPredDead = false;
break;
}
continue;
SmallVector<BasicBlock *, 4> Preds(pred_begin(B), pred_end(B));
- for (SmallVectorImpl<BasicBlock *>::iterator PI = Preds.begin(),
- PE = Preds.end(); PI != PE; PI++) {
- BasicBlock *P = *PI;
-
+ for (BasicBlock *P : Preds) {
if (!DeadBlocks.count(P))
continue;
// instructions, it makes more sense just to "fabricate" a val-number for the
// dead code than to check whether each instruction involved is dead or not.
void GVN::assignValNumForDeadCode() {
- for (SetVector<BasicBlock *>::iterator I = DeadBlocks.begin(),
- E = DeadBlocks.end(); I != E; I++) {
- BasicBlock *BB = *I;
- for (BasicBlock::iterator II = BB->begin(), EE = BB->end();
- II != EE; II++) {
- Instruction *Inst = &*II;
- unsigned ValNum = VN.lookup_or_add(Inst);
- addToLeaderTable(ValNum, Inst, BB);
+ for (BasicBlock *BB : DeadBlocks) {
+ for (Instruction &Inst : *BB) {
+ unsigned ValNum = VN.lookup_or_add(&Inst);
+ addToLeaderTable(ValNum, &Inst, BB);
}
}
}