Add codegen support for NEON vld4 intrinsics with 128-bit vectors.
[oota-llvm.git] / lib / CodeGen / LazyLiveness.cpp
index 85817da2e4f21db05567d92f1ce6864a7b2c0d2c..8352fb23e31c94e75a7c5fa471d9fcd99f0e94d7 100644 (file)
@@ -15,6 +15,7 @@
 #define DEBUG_TYPE "lazyliveness"
 #include "llvm/CodeGen/LazyLiveness.h"
 #include "llvm/CodeGen/MachineDominators.h"
+#include "llvm/CodeGen/MachineFunction.h"
 #include "llvm/CodeGen/MachineRegisterInfo.h"
 #include "llvm/CodeGen/Passes.h"
 #include "llvm/ADT/DepthFirstIterator.h"
@@ -32,10 +33,12 @@ void LazyLiveness::computeBackedgeChain(MachineFunction& mf,
   calculated.set(preorder[MBB]);
   
   for (SparseBitVector<128>::iterator I = tmp.begin(); I != tmp.end(); ++I) {
+    assert(rev_preorder.size() > *I && "Unknown block!");
+    
     MachineBasicBlock* SrcMBB = rev_preorder[*I];
     
-    for (MachineBasicBlock::succ_iterator SI = SrcMBB->succ_begin();
-         SI != SrcMBB->succ_end(); ++SI) {
+    for (MachineBasicBlock::succ_iterator SI = SrcMBB->succ_begin(),
+         SE = SrcMBB->succ_end(); SI != SE; ++SI) {
       MachineBasicBlock* TgtMBB = *SI;
       
       if (backedges.count(std::make_pair(SrcMBB, TgtMBB)) &&
@@ -44,7 +47,8 @@ void LazyLiveness::computeBackedgeChain(MachineFunction& mf,
           computeBackedgeChain(mf, TgtMBB);
         
         tv[MBB].set(preorder[TgtMBB]);
-        tv[MBB] |= tv[TgtMBB];
+        SparseBitVector<128> right = tv[TgtMBB];
+        tv[MBB] |= right;
       }
     }
     
@@ -60,26 +64,33 @@ bool LazyLiveness::runOnMachineFunction(MachineFunction &mf) {
   backedge_target.clear();
   calculated.clear();
   preorder.clear();
+  rev_preorder.clear();
+  
+  rv.resize(mf.size());
+  tv.resize(mf.size());
+  preorder.resize(mf.size());
+  rev_preorder.reserve(mf.size());
   
   MRI = &mf.getRegInfo();
+  MachineDominatorTree& MDT = getAnalysis<MachineDominatorTree>();
   
   // Step 0: Compute preorder numbering for all MBBs.
   unsigned num = 0;
-  for (df_iterator<MachineBasicBlock*> DI = df_begin(&*mf.begin());
-       DI != df_end(&*mf.begin()); ++DI) {
-    preorder[*DI] = num++;
-    rev_preorder.push_back(*DI);
+  for (df_iterator<MachineDomTreeNode*> DI = df_begin(MDT.getRootNode()),
+       DE = df_end(MDT.getRootNode()); DI != DE; ++DI) {
+    preorder[(*DI)->getBlock()] = num++;
+    rev_preorder.push_back((*DI)->getBlock());
   }
   
   // Step 1: Compute the transitive closure of the CFG, ignoring backedges.
-  for (po_iterator<MachineBasicBlock*> POI = po_begin(&*mf.begin());
-       POI != po_end(&*mf.begin()); ++POI) {
+  for (po_iterator<MachineBasicBlock*> POI = po_begin(&*mf.begin()),
+       POE = po_end(&*mf.begin()); POI != POE; ++POI) {
     MachineBasicBlock* MBB = *POI;
     SparseBitVector<128>& entry = rv[MBB];
     entry.set(preorder[MBB]);
     
-    for (MachineBasicBlock::succ_iterator SI = MBB->succ_begin();
-         SI != MBB->succ_end(); ++SI) {
+    for (MachineBasicBlock::succ_iterator SI = MBB->succ_begin(),
+         SE = MBB->succ_end(); SI != SE; ++SI) {
       DenseMap<MachineBasicBlock*, SparseBitVector<128> >::iterator SII = 
                                                          rv.find(*SI);
       
@@ -102,11 +113,11 @@ bool LazyLiveness::runOnMachineFunction(MachineFunction &mf) {
   for (po_iterator<MachineBasicBlock*> POI = po_begin(&*mf.begin()),
        POE = po_end(&*mf.begin()); POI != POE; ++POI)
     if (!backedge_target.test(preorder[*POI]))
-      for (MachineBasicBlock::succ_iterator SI = (*POI)->succ_begin();
-           SI != (*POI)->succ_end(); ++SI)
+      for (MachineBasicBlock::succ_iterator SI = (*POI)->succ_begin(),
+           SE = (*POI)->succ_end(); SI != SE; ++SI)
         if (!backedges.count(std::make_pair(*POI, *SI)) && tv.count(*SI)) {
-          SparseBitVector<128>& PBV = tv[*POI];
-          PBV = tv[*SI];
+          SparseBitVector<128> right = tv[*SI];
+          tv[*POI] |= right;
         }
   
   for (po_iterator<MachineBasicBlock*> POI = po_begin(&*mf.begin()),
@@ -122,11 +133,12 @@ bool LazyLiveness::vregLiveIntoMBB(unsigned vreg, MachineBasicBlock* MBB) {
   MachineBasicBlock* DefMBB = MRI->def_begin(vreg)->getParent();
   unsigned def = preorder[DefMBB];
   unsigned max_dom = 0;
-  for (df_iterator<MachineDomTreeNode*> DI = df_begin(MDT[DefMBB]);
-       DI != df_end(MDT[DefMBB]); ++DI)
+  for (df_iterator<MachineDomTreeNode*> DI = df_begin(MDT[DefMBB]),
+       DE = df_end(MDT[DefMBB]); DI != DE; ++DI) {
     if (preorder[DI->getBlock()] > max_dom) {
       max_dom = preorder[(*DI)->getBlock()];
     }
+  }
   
   if (preorder[MBB] <= def || max_dom < preorder[MBB])
     return false;
@@ -134,16 +146,16 @@ bool LazyLiveness::vregLiveIntoMBB(unsigned vreg, MachineBasicBlock* MBB) {
   SparseBitVector<128>::iterator I = tv[MBB].begin();
   while (I != tv[MBB].end() && *I <= def) ++I;
   while (I != tv[MBB].end() && *I < max_dom) {
-    for (MachineRegisterInfo::use_iterator UI = MRI->use_begin(vreg);
-         UI != MachineRegisterInfo::use_end(); ++UI) {
+    for (MachineRegisterInfo::use_iterator UI = MRI->use_begin(vreg),
+         UE = MachineRegisterInfo::use_end(); UI != UE; ++UI) {
       MachineBasicBlock* UseMBB = UI->getParent();
       if (rv[rev_preorder[*I]].test(preorder[UseMBB]))
         return true;
-        
+      
       unsigned t_dom = 0;
       for (df_iterator<MachineDomTreeNode*> DI =
-           df_begin(MDT[rev_preorder[*I]]);
-           DI != df_end(MDT[rev_preorder[*I]]); ++DI)
+           df_begin(MDT[rev_preorder[*I]]), DE = df_end(MDT[rev_preorder[*I]]); 
+           DI != DE; ++DI)
         if (preorder[DI->getBlock()] > t_dom) {
           max_dom = preorder[(*DI)->getBlock()];
         }
@@ -154,4 +166,3 @@ bool LazyLiveness::vregLiveIntoMBB(unsigned vreg, MachineBasicBlock* MBB) {
   
   return false;
 }
-