Two small cleanups/speedups:

[oota-llvm.git] / lib / Transforms / Utils / PromoteMemoryToRegister.cpp
diff --git a/lib/Transforms/Utils/PromoteMemoryToRegister.cpp b/lib/Transforms/Utils/PromoteMemoryToRegister.cpp

index e0d2c2475fcc5b322f73376a4ab9b42db56abde3..a56420f5b14668da6f3483f9d62030962779a132 100644 (file)
--- a/lib/Transforms/Utils/PromoteMemoryToRegister.cpp
+++ b/lib/Transforms/Utils/PromoteMemoryToRegister.cpp
@@ -1,7 +1,7 @@
  //===- PromoteMemoryToRegister.cpp - Convert memory refs to regs ----------===//
  //
-// This pass is used to promote memory references to be register references.  A
-// simple example of the transformation performed by this pass is:
+// This file is used to promote memory references to be register references.  A
+// simple example of the transformation performed by this function is:
  //
  //        FROM CODE                           TO CODE
  //   %X = alloca int, uint 1                 ret int 42
@@ -9,152 +9,125 @@
  //   %Y = load int* %X
  //   ret int %Y
  //
-// To do this transformation, a simple analysis is done to ensure it is safe.
-// Currently this just loops over all alloca instructions, looking for
-// instructions that are only used in simple load and stores.
-//
-// After this, the code is transformed by...something magical :)
+// The code is transformed by looping over all of the alloca instruction,
+// calculating dominator frontiers, then inserting phi-nodes following the usual
+// SSA construction algorithm.  This code does not modify the CFG of the
+// function.
  //
  //===----------------------------------------------------------------------===//
  
-#include "llvm/Transforms/Scalar/PromoteMemoryToRegister.h"
+#include "llvm/Transforms/Utils/PromoteMemToReg.h"
  #include "llvm/Analysis/Dominators.h"
  #include "llvm/iMemory.h"
  #include "llvm/iPHINode.h"
  #include "llvm/iTerminators.h"
-#include "llvm/Pass.h"
  #include "llvm/Function.h"
-#include "llvm/BasicBlock.h"
  #include "llvm/Constant.h"
+#include "llvm/Type.h"
+#include "llvm/Support/CFG.h"
+#include "Support/StringExtras.h"
+
+/// isAllocaPromotable - Return true if this alloca is legal for promotion.
+/// This is true if there are only loads and stores to the alloca...
+///
+bool isAllocaPromotable(const AllocaInst *AI, const TargetData &TD) {
+  // FIXME: If the memory unit is of pointer or integer type, we can permit
+  // assignments to subsections of the memory unit.
+
+  // Only allow direct loads and stores...
+  for (Value::use_const_iterator UI = AI->use_begin(), UE = AI->use_end();
+       UI != UE; ++UI)     // Loop over all of the uses of the alloca
+    if (!isa<LoadInst>(*UI))
+      if (const StoreInst *SI = dyn_cast<StoreInst>(*UI)) {
+        if (SI->getOperand(0) == AI)
+          return false;   // Don't allow a store of the AI, only INTO the AI.
+      } else {
+        return false;   // Not a load or store?
+      }
+  
+  return true;
+}
  
-using std::vector;
-using std::map;
-using std::set;
  
  namespace {
-  struct PromotePass : public FunctionPass {
-    vector<AllocaInst*>          Allocas;      // the alloca instruction..
-    map<Instruction*, unsigned>  AllocaLookup; // reverse mapping of above
-    
-    vector<vector<BasicBlock*> > PhiNodes;     // index corresponds to Allocas
+  struct PromoteMem2Reg {
+    const std::vector<AllocaInst*> &Allocas;        // the alloca instructions..
+    std::vector<unsigned> VersionNumbers;           // Current version counters
+    DominanceFrontier &DF;
+    const TargetData &TD;
+
+    std::map<Instruction*, unsigned>  AllocaLookup; // reverse mapping of above
      
-    // List of instructions to remove at end of pass
-    vector<Instruction *>        KillList;
+    std::vector<std::vector<BasicBlock*> > PhiNodes;// Idx corresponds 2 Allocas
      
-    map<BasicBlock*,vector<PHINode*> > NewPhiNodes; // the PhiNodes we're adding
+    // NewPhiNodes - The PhiNodes we're adding.
+    std::map<BasicBlock*, std::vector<PHINode*> > NewPhiNodes;
+
+    // Visited - The set of basic blocks the renamer has already visited.
+    std::set<BasicBlock*> Visited;
  
    public:
-    // runOnFunction - To run this pass, first we calculate the alloca
-    // instructions that are safe for promotion, then we promote each one.
-    //
-    virtual bool runOnFunction(Function *F);
+    PromoteMem2Reg(const std::vector<AllocaInst*> &A, DominanceFrontier &df,
+                   const TargetData &td) : Allocas(A), DF(df), TD(td) {}
  
-    // getAnalysisUsage - We need dominance frontiers
-    //
-    virtual void getAnalysisUsage(AnalysisUsage &AU) const {
-      AU.addRequired(DominanceFrontier::ID);
-      AU.preservesCFG();
-    }
+    void run();
  
    private:
-    void Traverse(BasicBlock *BB, BasicBlock *Pred, vector<Value*> &IncVals,
-                  set<BasicBlock*> &Visited);
+    void RenamePass(BasicBlock *BB, BasicBlock *Pred,
+                    std::vector<Value*> &IncVals);
      bool QueuePhiNode(BasicBlock *BB, unsigned AllocaIdx);
-    void FindSafeAllocas(Function *F);
    };
-
  }  // end of anonymous namespace
  
  
-// isSafeAlloca - This predicate controls what types of alloca instructions are
-// allowed to be promoted...
-//
-static inline bool isSafeAlloca(const AllocaInst *AI) {
-  if (AI->isArrayAllocation()) return false;
-
-  for (Value::use_const_iterator UI = AI->use_begin(), UE = AI->use_end();
-       UI != UE; ++UI) {   // Loop over all of the uses of the alloca
-
-    // Only allow nonindexed memory access instructions...
-    if (MemAccessInst *MAI = dyn_cast<MemAccessInst>(*UI)) {
-      if (MAI->hasIndices()) {  // indexed?
-        // Allow the access if there is only one index and the index is
-        // zero.
-        if (*MAI->idx_begin() != Constant::getNullValue(Type::UIntTy) ||
-            MAI->idx_begin()+1 != MAI->idx_end())
-          return false;
-      }
-    } else {
-      return false;   // Not a load or store?
-    }
-  }
-  
-  return true;
-}
-
-// FindSafeAllocas - Find allocas that are safe to promote
-//
-void PromotePass::FindSafeAllocas(Function *F) {
-  BasicBlock *BB = F->getEntryNode();  // Get the entry node for the function
-
-  // Look at all instructions in the entry node
-  for (BasicBlock::iterator I = BB->begin(), E = BB->end(); I != E; ++I)
-    if (AllocaInst *AI = dyn_cast<AllocaInst>(*I))       // Is it an alloca?
-      if (isSafeAlloca(AI)) {   // If safe alloca, add alloca to safe list
-        AllocaLookup[AI] = Allocas.size();  // Keep reverse mapping
-        Allocas.push_back(AI);
-      }
-}
-
-
-
-bool PromotePass::runOnFunction(Function *F) {
-  // Calculate the set of safe allocas
-  FindSafeAllocas(F);
+void PromoteMem2Reg::run() {
+  Function &F = *DF.getRoot()->getParent();
  
-  // If there is nothing to do, bail out...
-  if (Allocas.empty()) return false;
+  VersionNumbers.resize(Allocas.size());
  
-  // Add each alloca to the KillList.  Note: KillList is destroyed MOST recently
-  // added to least recently.
-  KillList.assign(Allocas.begin(), Allocas.end());
+  for (unsigned i = 0, e = Allocas.size(); i != e; ++i) {
+    assert(isAllocaPromotable(Allocas[i], TD) &&
+           "Cannot promote non-promotable alloca!");
+    assert(Allocas[i]->getParent()->getParent() == &F &&
+           "All allocas should be in the same function, which is same as DF!");
+    AllocaLookup[Allocas[i]] = i;
+  }
  
-  // Calculate the set of write-locations for each alloca.  This is analogous to
-  // counting the number of 'redefinitions' of each variable.
-  vector<vector<BasicBlock*> > WriteSets;    // index corresponds to Allocas
-  WriteSets.resize(Allocas.size());
+  PhiNodes.resize(Allocas.size());
    for (unsigned i = 0; i != Allocas.size(); ++i) {
      AllocaInst *AI = Allocas[i];
+
+    // Calculate the set of write-locations for each alloca.  This is analogous
+    // to counting the number of 'redefinitions' of each variable.
+    std::vector<BasicBlock*> WriteSets;
      for (Value::use_iterator U =AI->use_begin(), E = AI->use_end(); U != E; ++U)
        if (StoreInst *SI = dyn_cast<StoreInst>(*U))
          // jot down the basic-block it came from
-        WriteSets[i].push_back(SI->getParent());
-  }
-
-  // Get dominance frontier information...
-  DominanceFrontier &DF = getAnalysis<DominanceFrontier>();
-
-  // Compute the locations where PhiNodes need to be inserted.  Look at the
-  // dominance frontier of EACH basic-block we have a write in
-  //
-  PhiNodes.resize(Allocas.size());
-  for (unsigned i = 0; i != Allocas.size(); ++i) {
-    for (unsigned j = 0; j != WriteSets[i].size(); j++) {
+        WriteSets.push_back(SI->getParent());
+    
+    // Compute the locations where PhiNodes need to be inserted.  Look at the
+    // dominance frontier of EACH basic-block we have a write in.
+    //
+    for (unsigned j = 0; j != WriteSets.size(); j++) {
        // Look up the DF for this write, add it to PhiNodes
-      DominanceFrontier::const_iterator it = DF.find(WriteSets[i][j]);
-      DominanceFrontier::DomSetType     S = it->second;
-      for (DominanceFrontier::DomSetType::iterator P = S.begin(), PE = S.end();
-           P != PE; ++P)
-        QueuePhiNode(*P, i);
+      DominanceFrontier::const_iterator it = DF.find(WriteSets[j]);
+      if (it != DF.end()) {
+        const DominanceFrontier::DomSetType &S = it->second;
+        for (DominanceFrontier::DomSetType::iterator P = S.begin(),PE = S.end();
+             P != PE; ++P)
+          QueuePhiNode(*P, i);
+      }
      }
      
      // Perform iterative step
      for (unsigned k = 0; k != PhiNodes[i].size(); k++) {
        DominanceFrontier::const_iterator it = DF.find(PhiNodes[i][k]);
-      DominanceFrontier::DomSetType     S = it->second;
-      for (DominanceFrontier::DomSetType::iterator P = S.begin(), PE = S.end();
-           P != PE; ++P)
-        QueuePhiNode(*P, i);
+      if (it != DF.end()) {
+        const DominanceFrontier::DomSetType     &S = it->second;
+        for (DominanceFrontier::DomSetType::iterator P = S.begin(),PE = S.end();
+             P != PE; ++P)
+          QueuePhiNode(*P, i);
+      }
      }
    }
  
@@ -162,73 +135,89 @@ bool PromotePass::runOnFunction(Function *F) {
    // the alloca's.  We do this in case there is a load of a value that has not
    // been stored yet.  In this case, it will get this null value.
    //
-  vector<Value *> Values(Allocas.size());
+  std::vector<Value *> Values(Allocas.size());
    for (unsigned i = 0, e = Allocas.size(); i != e; ++i)
-    Values[i] = Constant::getNullValue(Allocas[i]->getType()->getElementType());
+    Values[i] = Constant::getNullValue(Allocas[i]->getAllocatedType());
  
    // Walks all basic blocks in the function performing the SSA rename algorithm
    // and inserting the phi nodes we marked as necessary
    //
-  set<BasicBlock*> Visited;         // The basic blocks we've already visited
-  Traverse(F->front(), 0, Values, Visited);
+  RenamePass(F.begin(), 0, Values);
+  Visited.clear();
  
-  // Remove all instructions marked by being placed in the KillList...
-  //
-  while (!KillList.empty()) {
-    Instruction *I = KillList.back();
-    KillList.pop_back();
+  // Remove the allocas themselves from the function...
+  for (unsigned i = 0, e = Allocas.size(); i != e; ++i) {
+    Instruction *A = Allocas[i];
  
-    I->getParent()->getInstList().remove(I);
-    delete I;
+    // If there are any uses of the alloca instructions left, they must be in
+    // sections of dead code that were not processed on the dominance frontier.
+    // Just delete the users now.
+    //
+    if (!A->use_empty())
+      A->replaceAllUsesWith(Constant::getNullValue(A->getType()));
+    A->getParent()->getInstList().erase(A);
    }
-
-  // Purge data structurse so they are available the next iteration...
-  Allocas.clear();
-  AllocaLookup.clear();
-  PhiNodes.clear();
-  NewPhiNodes.clear();
-  return true;
  }
  
  
  // QueuePhiNode - queues a phi-node to be added to a basic-block for a specific
  // Alloca returns true if there wasn't already a phi-node for that variable
  //
-bool PromotePass::QueuePhiNode(BasicBlock *BB, unsigned AllocaNo) {
+bool PromoteMem2Reg::QueuePhiNode(BasicBlock *BB, unsigned AllocaNo) {
    // Look up the basic-block in question
-  vector<PHINode*> &BBPNs = NewPhiNodes[BB];
+  std::vector<PHINode*> &BBPNs = NewPhiNodes[BB];
    if (BBPNs.empty()) BBPNs.resize(Allocas.size());
  
    // If the BB already has a phi node added for the i'th alloca then we're done!
    if (BBPNs[AllocaNo]) return false;
  
-  // Create a PhiNode using the dereferenced type...
-  PHINode *PN = new PHINode(Allocas[AllocaNo]->getType()->getElementType(),
-                            Allocas[AllocaNo]->getName()+".mem2reg");
-  BBPNs[AllocaNo] = PN;
-
-  // Add the phi-node to the basic-block
-  BB->getInstList().push_front(PN);
+  // Create a PhiNode using the dereferenced type... and add the phi-node to the
+  // BasicBlock.
+  PHINode *PN = new PHINode(Allocas[AllocaNo]->getAllocatedType(),
+                            Allocas[AllocaNo]->getName() + "." +
+                                      utostr(VersionNumbers[AllocaNo]++),
+                            BB->begin());
+
+  // Add null incoming values for all predecessors.  This ensures that if one of
+  // the predecessors is not found in the depth-first traversal of the CFG (ie,
+  // because it is an unreachable predecessor), that all PHI nodes will have the
+  // correct number of entries for their predecessors.
+  Value *NullVal = Constant::getNullValue(PN->getType());
+
+  // This is necessary because adding incoming values to the PHI node adds uses
+  // to the basic blocks being used, which can invalidate the predecessor
+  // iterator!
+  std::vector<BasicBlock*> Preds(pred_begin(BB), pred_end(BB));
+  for (unsigned i = 0, e = Preds.size(); i != e; ++i)
+    PN->addIncoming(NullVal, Preds[i]);
  
+  BBPNs[AllocaNo] = PN;
    PhiNodes[AllocaNo].push_back(BB);
    return true;
  }
  
-void PromotePass::Traverse(BasicBlock *BB, BasicBlock *Pred,
-                           vector<Value*> &IncomingVals,
-                           set<BasicBlock*> &Visited) {
-  // If this is a BB needing a phi node, lookup/create the phinode for each
-  // variable we need phinodes for.
-  vector<PHINode *> &BBPNs = NewPhiNodes[BB];
-  for (unsigned k = 0; k != BBPNs.size(); ++k)
-    if (PHINode *PN = BBPNs[k]) {
-      // at this point we can assume that the array has phi nodes.. let's add
-      // the incoming data
-      PN->addIncoming(IncomingVals[k], Pred);
-
-      // also note that the active variable IS designated by the phi node
-      IncomingVals[k] = PN;
-    }
+void PromoteMem2Reg::RenamePass(BasicBlock *BB, BasicBlock *Pred,
+                                std::vector<Value*> &IncomingVals) {
+  // If this BB needs a PHI node, update the PHI node for each variable we need
+  // PHI nodes for.
+  std::map<BasicBlock*, std::vector<PHINode *> >::iterator
+    BBPNI = NewPhiNodes.find(BB);
+  if (BBPNI != NewPhiNodes.end()) {
+    std::vector<PHINode *> &BBPNs = BBPNI->second;
+    for (unsigned k = 0; k != BBPNs.size(); ++k)
+      if (PHINode *PN = BBPNs[k]) {
+        // The PHI node may have multiple entries for this predecessor.  We must
+        // make sure we update all of them.
+        for (unsigned i = 0, e = PN->getNumOperands(); i != e; i += 2) {
+          if (PN->getOperand(i+1) == Pred)
+            // At this point we can assume that the array has phi nodes.. let's
+            // update the incoming data.
+            PN->setOperand(i, IncomingVals[k]);
+        }
+        // also note that the active variable IS designated by the phi node
+        IncomingVals[k] = PN;
+      }
+  }
  
    // don't revisit nodes
    if (Visited.count(BB)) return;
@@ -236,49 +225,52 @@ void PromotePass::Traverse(BasicBlock *BB, BasicBlock *Pred,
    // mark as visited
    Visited.insert(BB);
  
-  // keep track of the value of each variable we're watching.. how?
-  for (BasicBlock::iterator II = BB->begin(); II != BB->end(); ++II) {
-    Instruction *I = *II; //get the instruction
+  BasicBlock::iterator II = BB->begin();
+  while (1) {
+    Instruction *I = II++; // get the instruction, increment iterator
  
      if (LoadInst *LI = dyn_cast<LoadInst>(I)) {
-      Value *Ptr = LI->getPointerOperand();
-
-      if (AllocaInst *Src = dyn_cast<AllocaInst>(Ptr)) {
-        map<Instruction*, unsigned>::iterator AI = AllocaLookup.find(Src);
+      if (AllocaInst *Src = dyn_cast<AllocaInst>(LI->getPointerOperand())) {
+        std::map<Instruction*, unsigned>::iterator AI = AllocaLookup.find(Src);
          if (AI != AllocaLookup.end()) {
            Value *V = IncomingVals[AI->second];
  
            // walk the use list of this load and replace all uses with r
            LI->replaceAllUsesWith(V);
-          KillList.push_back(LI); // Mark the load to be deleted
+          BB->getInstList().erase(LI);
          }
        }
      } else if (StoreInst *SI = dyn_cast<StoreInst>(I)) {
-      // delete this instruction and mark the name as the current holder of the
+      // Delete this instruction and mark the name as the current holder of the
        // value
-      Value *Ptr = SI->getPointerOperand();
-      if (AllocaInst *Dest = dyn_cast<AllocaInst>(Ptr)) {
-        map<Instruction *, unsigned>::iterator ai = AllocaLookup.find(Dest);
+      if (AllocaInst *Dest = dyn_cast<AllocaInst>(SI->getPointerOperand())) {
+        std::map<Instruction *, unsigned>::iterator ai =AllocaLookup.find(Dest);
          if (ai != AllocaLookup.end()) {
            // what value were we writing?
            IncomingVals[ai->second] = SI->getOperand(0);
-          KillList.push_back(SI);  // Mark the store to be deleted
+          BB->getInstList().erase(SI);
          }
        }
        
      } else if (TerminatorInst *TI = dyn_cast<TerminatorInst>(I)) {
        // Recurse across our successors
        for (unsigned i = 0; i != TI->getNumSuccessors(); i++) {
-        vector<Value*> OutgoingVals(IncomingVals);
-        Traverse(TI->getSuccessor(i), BB, OutgoingVals, Visited);
+        std::vector<Value*> OutgoingVals(IncomingVals);
+        RenamePass(TI->getSuccessor(i), BB, OutgoingVals);
        }
+      break;
      }
    }
  }
  
-
-// createPromoteMemoryToRegister - Provide an entry point to create this pass.
-//
-Pass *createPromoteMemoryToRegister() {
-  return new PromotePass();
+/// PromoteMemToReg - Promote the specified list of alloca instructions into
+/// scalar registers, inserting PHI nodes as appropriate.  This function makes
+/// use of DominanceFrontier information.  This function does not modify the CFG
+/// of the function at all.  All allocas must be from the same function.
+///
+void PromoteMemToReg(const std::vector<AllocaInst*> &Allocas,
+                     DominanceFrontier &DF, const TargetData &TD) {
+  // If there is nothing to do, bail out...
+  if (Allocas.empty()) return;
+  PromoteMem2Reg(Allocas, DF, TD).run();
  }