Speculatively revert r97010, "Add an argument to PHITranslateValue to specify

[oota-llvm.git] / lib / Transforms / Scalar / GVN.cpp
diff --git a/lib/Transforms/Scalar/GVN.cpp b/lib/Transforms/Scalar/GVN.cpp

index 6e709523af38cbc92ed55d507e3e62193696b42f..164730c3ca06d0f61bef011cc8ea6ade7e28d92c 100644 (file)
--- a/lib/Transforms/Scalar/GVN.cpp
+++ b/lib/Transforms/Scalar/GVN.cpp
@@ -60,6 +60,7 @@ STATISTIC(NumPRELoad,   "Number of loads PRE'd");
  static cl::opt<bool> EnablePRE("enable-pre",
                                 cl::init(true), cl::Hidden);
  static cl::opt<bool> EnableLoadPRE("enable-load-pre", cl::init(true));
+static cl::opt<bool> EnableFullLoadPRE("enable-full-load-pre", cl::init(false));
  
  //===----------------------------------------------------------------------===//
  //                         ValueTable Class
@@ -673,6 +674,9 @@ namespace {
      ValueTable VN;
      DenseMap<BasicBlock*, ValueNumberScope*> localAvail;
  
+    // List of critical edges to be split between iterations.
+    SmallVector<std::pair<TerminatorInst*, unsigned>, 4> toSplit;
+
      // This transformation requires dominator postdominator info
      virtual void getAnalysisUsage(AnalysisUsage &AU) const {
        AU.addRequired<DominatorTree>();
@@ -700,6 +704,7 @@ namespace {
      Value *lookupNumber(BasicBlock *BB, uint32_t num);
      void cleanupGlobalSets();
      void verifyRemoved(const Instruction *I) const;
+    bool splitCriticalEdges();
    };
  
    char GVN::ID = 0;
@@ -835,9 +840,9 @@ static bool CanCoerceMustAliasedValueToLoad(Value *StoredVal,
                                              const TargetData &TD) {
    // If the loaded or stored value is an first class array or struct, don't try
    // to transform them.  We need to be able to bitcast to integer.
-  if (isa<StructType>(LoadTy) || isa<ArrayType>(LoadTy) ||
-      isa<StructType>(StoredVal->getType()) ||
-      isa<ArrayType>(StoredVal->getType()))
+  if (LoadTy->isStructTy() || LoadTy->isArrayTy() ||
+      StoredVal->getType()->isStructTy() ||
+      StoredVal->getType()->isArrayTy())
      return false;
    
    // The store has to be at least as big as the load.
@@ -869,26 +874,26 @@ static Value *CoerceAvailableValueToLoadType(Value *StoredVal,
    
    // If the store and reload are the same size, we can always reuse it.
    if (StoreSize == LoadSize) {
-    if (isa<PointerType>(StoredValTy) && isa<PointerType>(LoadedTy)) {
+    if (StoredValTy->isPointerTy() && LoadedTy->isPointerTy()) {
        // Pointer to Pointer -> use bitcast.
        return new BitCastInst(StoredVal, LoadedTy, "", InsertPt);
      }
      
      // Convert source pointers to integers, which can be bitcast.
-    if (isa<PointerType>(StoredValTy)) {
+    if (StoredValTy->isPointerTy()) {
        StoredValTy = TD.getIntPtrType(StoredValTy->getContext());
        StoredVal = new PtrToIntInst(StoredVal, StoredValTy, "", InsertPt);
      }
      
      const Type *TypeToCastTo = LoadedTy;
-    if (isa<PointerType>(TypeToCastTo))
+    if (TypeToCastTo->isPointerTy())
        TypeToCastTo = TD.getIntPtrType(StoredValTy->getContext());
      
      if (StoredValTy != TypeToCastTo)
        StoredVal = new BitCastInst(StoredVal, TypeToCastTo, "", InsertPt);
      
      // Cast to pointer if the load needs a pointer type.
-    if (isa<PointerType>(LoadedTy))
+    if (LoadedTy->isPointerTy())
        StoredVal = new IntToPtrInst(StoredVal, LoadedTy, "", InsertPt);
      
      return StoredVal;
@@ -900,13 +905,13 @@ static Value *CoerceAvailableValueToLoadType(Value *StoredVal,
    assert(StoreSize >= LoadSize && "CanCoerceMustAliasedValueToLoad fail");
    
    // Convert source pointers to integers, which can be manipulated.
-  if (isa<PointerType>(StoredValTy)) {
+  if (StoredValTy->isPointerTy()) {
      StoredValTy = TD.getIntPtrType(StoredValTy->getContext());
      StoredVal = new PtrToIntInst(StoredVal, StoredValTy, "", InsertPt);
    }
    
    // Convert vectors and fp to integer, which can be manipulated.
-  if (!isa<IntegerType>(StoredValTy)) {
+  if (!StoredValTy->isIntegerTy()) {
      StoredValTy = IntegerType::get(StoredValTy->getContext(), StoreSize);
      StoredVal = new BitCastInst(StoredVal, StoredValTy, "", InsertPt);
    }
@@ -926,7 +931,7 @@ static Value *CoerceAvailableValueToLoadType(Value *StoredVal,
      return StoredVal;
    
    // If the result is a pointer, inttoptr.
-  if (isa<PointerType>(LoadedTy))
+  if (LoadedTy->isPointerTy())
      return new IntToPtrInst(StoredVal, LoadedTy, "inttoptr", InsertPt);
    
    // Otherwise, bitcast.
@@ -988,7 +993,7 @@ static int AnalyzeLoadFromClobberingWrite(const Type *LoadTy, Value *LoadPtr,
                                            const TargetData &TD) {
    // If the loaded or stored value is an first class array or struct, don't try
    // to transform them.  We need to be able to bitcast to integer.
-  if (isa<StructType>(LoadTy) || isa<ArrayType>(LoadTy))
+  if (LoadTy->isStructTy() || LoadTy->isArrayTy())
      return -1;
    
    int64_t StoreOffset = 0, LoadOffset = 0;
@@ -1063,8 +1068,8 @@ static int AnalyzeLoadFromClobberingStore(const Type *LoadTy, Value *LoadPtr,
                                            StoreInst *DepSI,
                                            const TargetData &TD) {
    // Cannot handle reading from store of first-class aggregate yet.
-  if (isa<StructType>(DepSI->getOperand(0)->getType()) ||
-      isa<ArrayType>(DepSI->getOperand(0)->getType()))
+  if (DepSI->getOperand(0)->getType()->isStructTy() ||
+      DepSI->getOperand(0)->getType()->isArrayTy())
      return -1;
  
    Value *StorePtr = DepSI->getPointerOperand();
@@ -1135,9 +1140,9 @@ static Value *GetStoreValueForLoad(Value *SrcVal, unsigned Offset,
    
    // Compute which bits of the stored value are being used by the load.  Convert
    // to an integer type to start with.
-  if (isa<PointerType>(SrcVal->getType()))
+  if (SrcVal->getType()->isPointerTy())
      SrcVal = Builder.CreatePtrToInt(SrcVal, TD.getIntPtrType(Ctx), "tmp");
-  if (!isa<IntegerType>(SrcVal->getType()))
+  if (!SrcVal->getType()->isIntegerTy())
      SrcVal = Builder.CreateBitCast(SrcVal, IntegerType::get(Ctx, StoreSize*8),
                                     "tmp");
    
@@ -1322,7 +1327,7 @@ static Value *ConstructSSAForLoadSet(LoadInst *LI,
    Value *V = SSAUpdate.GetValueInMiddleOfBlock(LI->getParent());
    
    // If new PHI nodes were created, notify alias analysis.
-  if (isa<PointerType>(V->getType()))
+  if (V->getType()->isPointerTy())
      for (unsigned i = 0, e = NewPHIs.size(); i != e; ++i)
        AA->copyValue(LI, NewPHIs[i]);
  
@@ -1490,8 +1495,9 @@ bool GVN::processNonLocalLoad(LoadInst *LI,
  
      if (isa<PHINode>(V))
        V->takeName(LI);
-    if (isa<PointerType>(V->getType()))
+    if (V->getType()->isPointerTy())
        MD->invalidateCachedPointerInfo(V);
+    VN.erase(LI);
      toErase.push_back(LI);
      NumGVNLoad++;
      return true;
@@ -1537,10 +1543,12 @@ bool GVN::processNonLocalLoad(LoadInst *LI,
    // at least one of the values is LI.  Since this means that we won't be able
    // to eliminate LI even if we insert uses in the other predecessors, we will
    // end up increasing code size.  Reject this by scanning for LI.
-  for (unsigned i = 0, e = ValuesPerBlock.size(); i != e; ++i)
-    if (ValuesPerBlock[i].isSimpleValue() &&
-        ValuesPerBlock[i].getSimpleValue() == LI)
-      return false;
+  if (!EnableFullLoadPRE) {
+    for (unsigned i = 0, e = ValuesPerBlock.size(); i != e; ++i)
+      if (ValuesPerBlock[i].isSimpleValue() &&
+          ValuesPerBlock[i].getSimpleValue() == LI)
+        return false;
+  }
  
    // FIXME: It is extremely unclear what this loop is doing, other than
    // artificially restricting loadpre.
@@ -1564,13 +1572,9 @@ bool GVN::processNonLocalLoad(LoadInst *LI,
        return false;
    }
  
-  // Okay, we have some hope :).  Check to see if the loaded value is fully
-  // available in all but one predecessor.
-  // FIXME: If we could restructure the CFG, we could make a common pred with
-  // all the preds that don't have an available LI and insert a new load into
-  // that one block.
-  BasicBlock *UnavailablePred = 0;
-
+  // Check to see how many predecessors have the loaded value fully
+  // available.
+  DenseMap<BasicBlock*, Value*> PredLoads;
    DenseMap<BasicBlock*, char> FullyAvailableBlocks;
    for (unsigned i = 0, e = ValuesPerBlock.size(); i != e; ++i)
      FullyAvailableBlocks[ValuesPerBlock[i].BB] = true;
@@ -1579,81 +1583,98 @@ bool GVN::processNonLocalLoad(LoadInst *LI,
  
    for (pred_iterator PI = pred_begin(LoadBB), E = pred_end(LoadBB);
         PI != E; ++PI) {
-    if (IsValueFullyAvailableInBlock(*PI, FullyAvailableBlocks))
+    BasicBlock *Pred = *PI;
+    if (IsValueFullyAvailableInBlock(Pred, FullyAvailableBlocks)) {
        continue;
+    }
+    PredLoads[Pred] = 0;
  
-    // If this load is not available in multiple predecessors, reject it.
-    if (UnavailablePred && UnavailablePred != *PI)
+    if (Pred->getTerminator()->getNumSuccessors() != 1) {
+      if (isa<IndirectBrInst>(Pred->getTerminator())) {
+        DEBUG(dbgs() << "COULD NOT PRE LOAD BECAUSE OF INDBR CRITICAL EDGE '"
+              << Pred->getName() << "': " << *LI << '\n');
+        return false;
+      }
+      unsigned SuccNum = GetSuccessorNumber(Pred, LoadBB);
+      toSplit.push_back(std::make_pair(Pred->getTerminator(), SuccNum));
        return false;
-    UnavailablePred = *PI;
+    }
    }
  
-  assert(UnavailablePred != 0 &&
+  // Decide whether PRE is profitable for this load.
+  unsigned NumUnavailablePreds = PredLoads.size();
+  assert(NumUnavailablePreds != 0 &&
           "Fully available value should be eliminated above!");
-
-  // We don't currently handle critical edges :(
-  if (UnavailablePred->getTerminator()->getNumSuccessors() != 1) {
-    DEBUG(dbgs() << "COULD NOT PRE LOAD BECAUSE OF CRITICAL EDGE '"
-                 << UnavailablePred->getName() << "': " << *LI << '\n');
-    return false;
+  if (!EnableFullLoadPRE) {
+    // If this load is unavailable in multiple predecessors, reject it.
+    // FIXME: If we could restructure the CFG, we could make a common pred with
+    // all the preds that don't have an available LI and insert a new load into
+    // that one block.
+    if (NumUnavailablePreds != 1)
+      return false;
    }
-  
-  // Do PHI translation to get its value in the predecessor if necessary.  The
-  // returned pointer (if non-null) is guaranteed to dominate UnavailablePred.
-  //
+
+  // Check if the load can safely be moved to all the unavailable predecessors.
+  bool CanDoPRE = true;
    SmallVector<Instruction*, 8> NewInsts;
-  
-  // If all preds have a single successor, then we know it is safe to insert the
-  // load on the pred (?!?), so we can insert code to materialize the pointer if
-  // it is not available.
-  PHITransAddr Address(LI->getOperand(0), TD);
-  Value *LoadPtr = 0;
-  if (allSingleSucc) {
-    LoadPtr = Address.PHITranslateWithInsertion(LoadBB, UnavailablePred,
-                                                *DT, NewInsts);
-  } else {
-    Address.PHITranslateValue(LoadBB, UnavailablePred);
-    LoadPtr = Address.getAddr();
+  for (DenseMap<BasicBlock*, Value*>::iterator I = PredLoads.begin(),
+         E = PredLoads.end(); I != E; ++I) {
+    BasicBlock *UnavailablePred = I->first;
+
+    // Do PHI translation to get its value in the predecessor if necessary.  The
+    // returned pointer (if non-null) is guaranteed to dominate UnavailablePred.
+
+    // If all preds have a single successor, then we know it is safe to insert
+    // the load on the pred (?!?), so we can insert code to materialize the
+    // pointer if it is not available.
+    PHITransAddr Address(LI->getOperand(0), TD);
+    Value *LoadPtr = 0;
+    if (allSingleSucc) {
+      LoadPtr = Address.PHITranslateWithInsertion(LoadBB, UnavailablePred,
+                                                  *DT, NewInsts);
+    } else {
+      Address.PHITranslateValue(LoadBB, UnavailablePred);
+      LoadPtr = Address.getAddr();
      
-    // Make sure the value is live in the predecessor.
-    if (Instruction *Inst = dyn_cast_or_null<Instruction>(LoadPtr))
-      if (!DT->dominates(Inst->getParent(), UnavailablePred))
-        LoadPtr = 0;
-  }
+      // Make sure the value is live in the predecessor.
+      if (Instruction *Inst = dyn_cast_or_null<Instruction>(LoadPtr))
+        if (!DT->dominates(Inst->getParent(), UnavailablePred))
+          LoadPtr = 0;
+    }
  
-  // If we couldn't find or insert a computation of this phi translated value,
-  // we fail PRE.
-  if (LoadPtr == 0) {
-    assert(NewInsts.empty() && "Shouldn't insert insts on failure");
-    DEBUG(dbgs() << "COULDN'T INSERT PHI TRANSLATED VALUE OF: "
-                 << *LI->getOperand(0) << "\n");
-    return false;
-  }
+    // If we couldn't find or insert a computation of this phi translated value,
+    // we fail PRE.
+    if (LoadPtr == 0) {
+      DEBUG(dbgs() << "COULDN'T INSERT PHI TRANSLATED VALUE OF: "
+            << *LI->getOperand(0) << "\n");
+      CanDoPRE = false;
+      break;
+    }
  
-  // Assign value numbers to these new instructions.
-  for (unsigned i = 0, e = NewInsts.size(); i != e; ++i) {
-    // FIXME: We really _ought_ to insert these value numbers into their 
-    // parent's availability map.  However, in doing so, we risk getting into
-    // ordering issues.  If a block hasn't been processed yet, we would be
-    // marking a value as AVAIL-IN, which isn't what we intend.
-    VN.lookup_or_add(NewInsts[i]);
+    // Make sure it is valid to move this load here.  We have to watch out for:
+    //  @1 = getelementptr (i8* p, ...
+    //  test p and branch if == 0
+    //  load @1
+    // It is valid to have the getelementptr before the test, even if p can be 0,
+    // as getelementptr only does address arithmetic.
+    // If we are not pushing the value through any multiple-successor blocks
+    // we do not have this case.  Otherwise, check that the load is safe to
+    // put anywhere; this can be improved, but should be conservatively safe.
+    if (!allSingleSucc &&
+        // FIXME: REEVALUTE THIS.
+        !isSafeToLoadUnconditionally(LoadPtr,
+                                     UnavailablePred->getTerminator(),
+                                     LI->getAlignment(), TD)) {
+      CanDoPRE = false;
+      break;
+    }
+
+    I->second = LoadPtr;
    }
-  
-  // Make sure it is valid to move this load here.  We have to watch out for:
-  //  @1 = getelementptr (i8* p, ...
-  //  test p and branch if == 0
-  //  load @1
-  // It is valid to have the getelementptr before the test, even if p can be 0,
-  // as getelementptr only does address arithmetic.
-  // If we are not pushing the value through any multiple-successor blocks
-  // we do not have this case.  Otherwise, check that the load is safe to
-  // put anywhere; this can be improved, but should be conservatively safe.
-  if (!allSingleSucc &&
-      // FIXME: REEVALUTE THIS.
-      !isSafeToLoadUnconditionally(LoadPtr,
-                                   UnavailablePred->getTerminator(),
-                                   LI->getAlignment(), TD)) {
-    assert(NewInsts.empty() && "Should not have inserted instructions");
+
+  if (!CanDoPRE) {
+    while (!NewInsts.empty())
+      NewInsts.pop_back_val()->eraseFromParent();
      return false;
    }
  
@@ -1665,12 +1686,30 @@ bool GVN::processNonLocalLoad(LoadInst *LI,
            dbgs() << "INSERTED " << NewInsts.size() << " INSTS: "
                   << *NewInsts.back() << '\n');
    
-  Value *NewLoad = new LoadInst(LoadPtr, LI->getName()+".pre", false,
-                                LI->getAlignment(),
-                                UnavailablePred->getTerminator());
+  // Assign value numbers to the new instructions.
+  for (unsigned i = 0, e = NewInsts.size(); i != e; ++i) {
+    // FIXME: We really _ought_ to insert these value numbers into their 
+    // parent's availability map.  However, in doing so, we risk getting into
+    // ordering issues.  If a block hasn't been processed yet, we would be
+    // marking a value as AVAIL-IN, which isn't what we intend.
+    VN.lookup_or_add(NewInsts[i]);
+  }
  
-  // Add the newly created load.
-  ValuesPerBlock.push_back(AvailableValueInBlock::get(UnavailablePred,NewLoad));
+  for (DenseMap<BasicBlock*, Value*>::iterator I = PredLoads.begin(),
+         E = PredLoads.end(); I != E; ++I) {
+    BasicBlock *UnavailablePred = I->first;
+    Value *LoadPtr = I->second;
+
+    Value *NewLoad = new LoadInst(LoadPtr, LI->getName()+".pre", false,
+                                  LI->getAlignment(),
+                                  UnavailablePred->getTerminator());
+
+    // Add the newly created load.
+    ValuesPerBlock.push_back(AvailableValueInBlock::get(UnavailablePred,
+                                                        NewLoad));
+    MD->invalidateCachedPointerInfo(LoadPtr);
+    DEBUG(dbgs() << "GVN INSERTED " << *NewLoad << '\n');
+  }
  
    // Perform PHI construction.
    Value *V = ConstructSSAForLoadSet(LI, ValuesPerBlock, TD, *DT,
@@ -1678,8 +1717,9 @@ bool GVN::processNonLocalLoad(LoadInst *LI,
    LI->replaceAllUsesWith(V);
    if (isa<PHINode>(V))
      V->takeName(LI);
-  if (isa<PointerType>(V->getType()))
+  if (V->getType()->isPointerTy())
      MD->invalidateCachedPointerInfo(V);
+  VN.erase(LI);
    toErase.push_back(LI);
    NumPRELoad++;
    return true;
@@ -1738,8 +1778,9 @@ bool GVN::processLoad(LoadInst *L, SmallVectorImpl<Instruction*> &toErase) {
        
        // Replace the load!
        L->replaceAllUsesWith(AvailVal);
-      if (isa<PointerType>(AvailVal->getType()))
+      if (AvailVal->getType()->isPointerTy())
          MD->invalidateCachedPointerInfo(AvailVal);
+      VN.erase(L);
        toErase.push_back(L);
        NumGVNLoad++;
        return true;
@@ -1783,8 +1824,9 @@ bool GVN::processLoad(LoadInst *L, SmallVectorImpl<Instruction*> &toErase) {
  
      // Remove it!
      L->replaceAllUsesWith(StoredVal);
-    if (isa<PointerType>(StoredVal->getType()))
+    if (StoredVal->getType()->isPointerTy())
        MD->invalidateCachedPointerInfo(StoredVal);
+    VN.erase(L);
      toErase.push_back(L);
      NumGVNLoad++;
      return true;
@@ -1812,8 +1854,9 @@ bool GVN::processLoad(LoadInst *L, SmallVectorImpl<Instruction*> &toErase) {
      
      // Remove it!
      L->replaceAllUsesWith(AvailableVal);
-    if (isa<PointerType>(DepLI->getType()))
+    if (DepLI->getType()->isPointerTy())
        MD->invalidateCachedPointerInfo(DepLI);
+    VN.erase(L);
      toErase.push_back(L);
      NumGVNLoad++;
      return true;
@@ -1824,6 +1867,7 @@ bool GVN::processLoad(LoadInst *L, SmallVectorImpl<Instruction*> &toErase) {
    // intervening stores, for example.
    if (isa<AllocaInst>(DepInst) || isMalloc(DepInst)) {
      L->replaceAllUsesWith(UndefValue::get(L->getType()));
+    VN.erase(L);
      toErase.push_back(L);
      NumGVNLoad++;
      return true;
@@ -1834,6 +1878,7 @@ bool GVN::processLoad(LoadInst *L, SmallVectorImpl<Instruction*> &toErase) {
    if (IntrinsicInst* II = dyn_cast<IntrinsicInst>(DepInst)) {
      if (II->getIntrinsicID() == Intrinsic::lifetime_start) {
        L->replaceAllUsesWith(UndefValue::get(L->getType()));
+      VN.erase(L);
        toErase.push_back(L);
        NumGVNLoad++;
        return true;
@@ -1864,6 +1909,10 @@ Value *GVN::lookupNumber(BasicBlock *BB, uint32_t num) {
  /// by inserting it into the appropriate sets
  bool GVN::processInstruction(Instruction *I,
                               SmallVectorImpl<Instruction*> &toErase) {
+  // Ignore dbg info intrinsics.
+  if (isa<DbgInfoIntrinsic>(I))
+    return false;
+
    if (LoadInst *LI = dyn_cast<LoadInst>(I)) {
      bool Changed = processLoad(LI, toErase);
  
@@ -1912,7 +1961,7 @@ bool GVN::processInstruction(Instruction *I,
  
      if (constVal) {
        p->replaceAllUsesWith(constVal);
-      if (MD && isa<PointerType>(constVal->getType()))
+      if (MD && constVal->getType()->isPointerTy())
          MD->invalidateCachedPointerInfo(constVal);
        VN.erase(p);
  
@@ -1933,7 +1982,7 @@ bool GVN::processInstruction(Instruction *I,
      // Remove it!
      VN.erase(I);
      I->replaceAllUsesWith(repl);
-    if (MD && isa<PointerType>(repl->getType()))
+    if (MD && repl->getType()->isPointerTy())
        MD->invalidateCachedPointerInfo(repl);
      toErase.push_back(I);
      return true;
@@ -1973,6 +2022,8 @@ bool GVN::runOnFunction(Function& F) {
    while (ShouldContinue) {
      DEBUG(dbgs() << "GVN iteration: " << Iteration << "\n");
      ShouldContinue = iterateOnFunction(F);
+    if (splitCriticalEdges())
+      ShouldContinue = true;
      Changed |= ShouldContinue;
      ++Iteration;
    }
@@ -2039,7 +2090,6 @@ bool GVN::processBlock(BasicBlock *BB) {
  /// control flow patterns and attempts to perform simple PRE at the join point.
  bool GVN::performPRE(Function &F) {
    bool Changed = false;
-  SmallVector<std::pair<TerminatorInst*, unsigned>, 4> toSplit;
    DenseMap<BasicBlock*, Value*> predMap;
    for (df_iterator<BasicBlock*> DI = df_begin(&F.getEntryBlock()),
         DE = df_end(&F.getEntryBlock()); DI != DE; ++DI) {
@@ -2075,7 +2125,7 @@ bool GVN::performPRE(Function &F) {
        for (pred_iterator PI = pred_begin(CurrentBlock),
             PE = pred_end(CurrentBlock); PI != PE; ++PI) {
          // We're not interested in PRE where the block is its
-        // own predecessor, on in blocks with predecessors
+        // own predecessor, or in blocks with predecessors
          // that are not reachable.
          if (*PI == CurrentBlock) {
            NumWithout = 2;
@@ -2110,23 +2160,16 @@ bool GVN::performPRE(Function &F) {
        // We can't do PRE safely on a critical edge, so instead we schedule
        // the edge to be split and perform the PRE the next time we iterate
        // on the function.
-      unsigned SuccNum = 0;
-      for (unsigned i = 0, e = PREPred->getTerminator()->getNumSuccessors();
-           i != e; ++i)
-        if (PREPred->getTerminator()->getSuccessor(i) == CurrentBlock) {
-          SuccNum = i;
-          break;
-        }
-
+      unsigned SuccNum = GetSuccessorNumber(PREPred, CurrentBlock);
        if (isCriticalEdge(PREPred->getTerminator(), SuccNum)) {
          toSplit.push_back(std::make_pair(PREPred->getTerminator(), SuccNum));
          continue;
        }
  
-      // Instantiate the expression the in predecessor that lacked it.
+      // Instantiate the expression in the predecessor that lacked it.
        // Because we are going top-down through the block, all value numbers
        // will be available in the predecessor by the time we need them.  Any
-      // that weren't original present will have been instantiated earlier
+      // that weren't originally present will have been instantiated earlier
        // in this loop.
        Instruction *PREInstr = CurInst->clone();
        bool success = true;
@@ -2173,7 +2216,7 @@ bool GVN::performPRE(Function &F) {
        localAvail[CurrentBlock]->table[ValNo] = Phi;
  
        CurInst->replaceAllUsesWith(Phi);
-      if (MD && isa<PointerType>(Phi->getType()))
+      if (MD && Phi->getType()->isPointerTy())
          MD->invalidateCachedPointerInfo(Phi);
        VN.erase(CurInst);
  
@@ -2185,11 +2228,23 @@ bool GVN::performPRE(Function &F) {
      }
    }
  
-  for (SmallVector<std::pair<TerminatorInst*, unsigned>, 4>::iterator
-       I = toSplit.begin(), E = toSplit.end(); I != E; ++I)
-    SplitCriticalEdge(I->first, I->second, this);
+  if (splitCriticalEdges())
+    Changed = true;
+
+  return Changed;
+}
  
-  return Changed || toSplit.size();
+/// splitCriticalEdges - Split critical edges found during the previous
+/// iteration that may enable further optimization.
+bool GVN::splitCriticalEdges() {
+  if (toSplit.empty())
+    return false;
+  do {
+    std::pair<TerminatorInst*, unsigned> Edge = toSplit.pop_back_val();
+    SplitCriticalEdge(Edge.first, Edge.second, this);
+  } while (!toSplit.empty());
+  MD->invalidateCachedPredecessors();
+  return true;
  }
  
  /// iterateOnFunction - Executes one iteration of GVN