[PowerPC] Enable interleaved-access vectorization

[oota-llvm.git] / lib / CodeGen / MachineScheduler.cpp
diff --git a/lib/CodeGen/MachineScheduler.cpp b/lib/CodeGen/MachineScheduler.cpp

index a554254794aafcf8f9495c19a32d5f461a258483..9d7dc46ca9a088f891dfef02cdc38e22dbbf0a50 100644 (file)
--- a/lib/CodeGen/MachineScheduler.cpp
+++ b/lib/CodeGen/MachineScheduler.cpp
@@ -209,6 +209,11 @@ static MachineSchedRegistry
  DefaultSchedRegistry("default", "Use the target's default scheduler choice.",
                       useDefaultMachineSched);
  
+static cl::opt<bool> EnableMachineSched(
+    "enable-misched",
+    cl::desc("Enable the machine instruction scheduling pass."), cl::init(true),
+    cl::Hidden);
+
  /// Forward declare the standard machine scheduler. This will be used as the
  /// default scheduler if the target does not set a default.
  static ScheduleDAGInstrs *createGenericSchedLive(MachineSchedContext *C);
@@ -304,6 +309,12 @@ ScheduleDAGInstrs *PostMachineScheduler::createPostMachineScheduler() {
  /// design would be to split blocks at scheduling boundaries, but LLVM has a
  /// general bias against block splitting purely for implementation simplicity.
  bool MachineScheduler::runOnMachineFunction(MachineFunction &mf) {
+  if (EnableMachineSched.getNumOccurrences()) {
+    if (!EnableMachineSched)
+      return false;
+  } else if (!mf.getSubtarget().enableMachineScheduler())
+    return false;
+
    DEBUG(dbgs() << "Before MISsched:\n"; mf.print(dbgs()));
  
    // Initialize the context of the pass.
@@ -336,9 +347,7 @@ bool PostMachineScheduler::runOnMachineFunction(MachineFunction &mf) {
    if (skipOptnoneFunction(*mf.getFunction()))
      return false;
  
-  const TargetSubtargetInfo &ST =
-    mf.getTarget().getSubtarget<TargetSubtargetInfo>();
-  if (!ST.enablePostMachineScheduler()) {
+  if (!mf.getSubtarget().enablePostRAScheduler()) {
      DEBUG(dbgs() << "Subtarget disables post-MI-sched.\n");
      return false;
    }
@@ -934,8 +943,9 @@ updateScheduledPressure(const SUnit *SU,
      unsigned Limit = RegClassInfo->getRegPressureSetLimit(ID);
      if (NewMaxPressure[ID] >= Limit - 2) {
        DEBUG(dbgs() << "  " << TRI->getRegPressureSetName(ID) << ": "
-            << NewMaxPressure[ID] << " > " << Limit << "(+ "
-            << BotRPTracker.getLiveThru()[ID] << " livethru)\n");
+            << NewMaxPressure[ID]
+            << ((NewMaxPressure[ID] > Limit) ? " > " : " <= ") << Limit
+            << "(+ " << BotRPTracker.getLiveThru()[ID] << " livethru)\n");
      }
    }
  }
@@ -988,7 +998,7 @@ void ScheduleDAGMILive::updatePressureDiffs(ArrayRef<unsigned> LiveUses) {
  /// only includes instructions that have DAG nodes, not scheduling boundaries.
  ///
  /// This is a skeletal driver, with all the functionality pushed into helpers,
-/// so that it can be easilly extended by experimental schedulers. Generally,
+/// so that it can be easily extended by experimental schedulers. Generally,
  /// implementing MachineSchedStrategy should be sufficient to implement a new
  /// scheduling algorithm. However, if a scheduler further subclasses
  /// ScheduleDAGMILive then it will want to override this virtual method in order
@@ -1027,8 +1037,6 @@ void ScheduleDAGMILive::schedule() {
  
      scheduleMI(SU, IsTopNode);
  
-    updateQueues(SU, IsTopNode);
-
      if (DFSResult) {
        unsigned SubtreeID = DFSResult->getSubtreeID(SU);
        if (!ScheduledTrees.test(SubtreeID)) {
@@ -1040,6 +1048,8 @@ void ScheduleDAGMILive::schedule() {
  
      // Notify the scheduling strategy after updating the DAG.
      SchedImpl->schedNode(SU, IsTopNode);
+
+    updateQueues(SU, IsTopNode);
    }
    assert(CurrentTop == CurrentBottom && "Nonempty unscheduled zone.");
  
@@ -1261,7 +1271,7 @@ void LoadClusterMutation::clusterNeighboringLoads(ArrayRef<SUnit*> Loads,
      SUnit *SU = Loads[Idx];
      unsigned BaseReg;
      unsigned Offset;
-    if (TII->getLdStBaseRegImmOfs(SU->getInstr(), BaseReg, Offset, TRI))
+    if (TII->getMemOpBaseRegImmOfs(SU->getInstr(), BaseReg, Offset, TRI))
        LoadRecords.push_back(LoadInfo(SU, BaseReg, Offset));
    }
    if (LoadRecords.size() < 2)
@@ -1339,25 +1349,49 @@ namespace {
  /// \brief Post-process the DAG to create cluster edges between instructions
  /// that may be fused by the processor into a single operation.
  class MacroFusion : public ScheduleDAGMutation {
-  const TargetInstrInfo *TII;
+  const TargetInstrInfo &TII;
+  const TargetRegisterInfo &TRI;
  public:
-  MacroFusion(const TargetInstrInfo *tii): TII(tii) {}
+  MacroFusion(const TargetInstrInfo &TII, const TargetRegisterInfo &TRI)
+    : TII(TII), TRI(TRI) {}
  
    void apply(ScheduleDAGMI *DAG) override;
  };
  } // anonymous
  
+/// Returns true if \p MI reads a register written by \p Other.
+static bool HasDataDep(const TargetRegisterInfo &TRI, const MachineInstr &MI,
+                       const MachineInstr &Other) {
+  for (const MachineOperand &MO : MI.uses()) {
+    if (!MO.isReg() || !MO.readsReg())
+      continue;
+
+    unsigned Reg = MO.getReg();
+    if (Other.modifiesRegister(Reg, &TRI))
+      return true;
+  }
+  return false;
+}
+
  /// \brief Callback from DAG postProcessing to create cluster edges to encourage
  /// fused operations.
  void MacroFusion::apply(ScheduleDAGMI *DAG) {
    // For now, assume targets can only fuse with the branch.
-  MachineInstr *Branch = DAG->ExitSU.getInstr();
+  SUnit &ExitSU = DAG->ExitSU;
+  MachineInstr *Branch = ExitSU.getInstr();
    if (!Branch)
      return;
  
-  for (unsigned Idx = DAG->SUnits.size(); Idx > 0;) {
-    SUnit *SU = &DAG->SUnits[--Idx];
-    if (!TII->shouldScheduleAdjacent(SU->getInstr(), Branch))
+  for (SUnit &SU : DAG->SUnits) {
+    // SUnits with successors can't be schedule in front of the ExitSU.
+    if (!SU.Succs.empty())
+      continue;
+    // We only care if the node writes to a register that the branch reads.
+    MachineInstr *Pred = SU.getInstr();
+    if (!HasDataDep(TRI, *Branch, *Pred))
+      continue;
+
+    if (!TII.shouldScheduleAdjacent(Pred, Branch))
        continue;
  
      // Create a single weak edge from SU to ExitSU. The only effect is to cause
@@ -1366,11 +1400,11 @@ void MacroFusion::apply(ScheduleDAGMI *DAG) {
      // scheduling cannot prioritize ExitSU anyway. To defer top-down scheduling
      // of SU, we could create an artificial edge from the deepest root, but it
      // hasn't been needed yet.
-    bool Success = DAG->addEdge(&DAG->ExitSU, SDep(SU, SDep::Cluster));
+    bool Success = DAG->addEdge(&ExitSU, SDep(&SU, SDep::Cluster));
      (void)Success;
      assert(Success && "No DAG nodes should be reachable from ExitSU");
  
-    DEBUG(dbgs() << "Macro Fuse SU(" << SU->NodeNum << ")\n");
+    DEBUG(dbgs() << "Macro Fuse SU(" << SU.NodeNum << ")\n");
      break;
    }
  }
@@ -2140,7 +2174,7 @@ void GenericSchedulerBase::setPolicy(CandPolicy &Policy,
                                       bool IsPostRA,
                                       SchedBoundary &CurrZone,
                                       SchedBoundary *OtherZone) {
-  // Apply preemptive heuristics based on the the total latency and resources
+  // Apply preemptive heuristics based on the total latency and resources
    // inside and outside this zone. Potential stalls should be considered before
    // following this policy.
  
@@ -2602,8 +2636,7 @@ void GenericScheduler::tryCandidate(SchedCandidate &Cand,
                   TryCand, Cand, PhysRegCopy))
      return;
  
-  // Avoid exceeding the target's limit. If signed PSetID is negative, it is
-  // invalid; convert it to INT_MAX to give it lowest priority.
+  // Avoid exceeding the target's limit.
    if (DAG->isTrackingPressure() && tryPressure(TryCand.RPDelta.Excess,
                                                 Cand.RPDelta.Excess,
                                                 TryCand, Cand, RegExcess))
@@ -2878,7 +2911,7 @@ static ScheduleDAGInstrs *createGenericSchedLive(MachineSchedContext *C) {
    if (EnableLoadCluster && DAG->TII->enableClusterLoads())
      DAG->addMutation(make_unique<LoadClusterMutation>(DAG->TII, DAG->TRI));
    if (EnableMacroFusion)
-    DAG->addMutation(make_unique<MacroFusion>(DAG->TII));
+    DAG->addMutation(make_unique<MacroFusion>(*DAG->TII, *DAG->TRI));
    return DAG;
  }