R600/SI: Simplify debug printing

[oota-llvm.git] / lib / Target / R600 / SIFixSGPRCopies.cpp
diff --git a/lib/Target/R600/SIFixSGPRCopies.cpp b/lib/Target/R600/SIFixSGPRCopies.cpp

index 446a9f7b7914d55f2d3a8d5ae5347800b75b8ec0..086b44433c2ebf04096e3d4a50a8fe4d0d48cbb8 100644 (file)
--- a/lib/Target/R600/SIFixSGPRCopies.cpp
+++ b/lib/Target/R600/SIFixSGPRCopies.cpp
@@ -65,17 +65,20 @@
  /// ultimately led to the creation of an illegal COPY.
  //===----------------------------------------------------------------------===//
  
-#define DEBUG_TYPE "sgpr-copies"
  #include "AMDGPU.h"
+#include "AMDGPUSubtarget.h"
  #include "SIInstrInfo.h"
  #include "llvm/CodeGen/MachineFunctionPass.h"
  #include "llvm/CodeGen/MachineInstrBuilder.h"
  #include "llvm/CodeGen/MachineRegisterInfo.h"
  #include "llvm/Support/Debug.h"
+#include "llvm/Support/raw_ostream.h"
  #include "llvm/Target/TargetMachine.h"
  
  using namespace llvm;
  
+#define DEBUG_TYPE "sgpr-copies"
+
  namespace {
  
  class SIFixSGPRCopies : public MachineFunctionPass {
@@ -96,9 +99,9 @@ private:
  public:
    SIFixSGPRCopies(TargetMachine &tm) : MachineFunctionPass(ID) { }
  
-  virtual bool runOnMachineFunction(MachineFunction &MF);
+  bool runOnMachineFunction(MachineFunction &MF) override;
  
-  const char *getPassName() const {
+  const char *getPassName() const override {
      return "SI Fix SGPR copies";
    }
  
@@ -127,7 +130,7 @@ static bool hasVGPROperands(const MachineInstr &MI, const SIRegisterInfo *TRI) {
  
  /// This functions walks the use list of Reg until it finds an Instruction
  /// that isn't a COPY returns the register class of that instruction.
-/// \param[out] The register defined by the first non-COPY instruction.
+/// \return The register defined by the first non-COPY instruction.
  const TargetRegisterClass *SIFixSGPRCopies::inferRegClassFromUses(
                                                   const SIRegisterInfo *TRI,
                                                   const MachineRegisterInfo &MRI,
@@ -140,8 +143,8 @@ const TargetRegisterClass *SIFixSGPRCopies::inferRegClassFromUses(
  
    const TargetRegisterClass *RC = MRI.getRegClass(Reg);
    RC = TRI->getSubRegClass(RC, SubReg);
-  for (MachineRegisterInfo::use_iterator I = MRI.use_begin(Reg),
-                                         E = MRI.use_end(); I != E; ++I) {
+  for (MachineRegisterInfo::use_instr_iterator
+       I = MRI.use_instr_begin(Reg), E = MRI.use_instr_end(); I != E; ++I) {
      switch (I->getOpcode()) {
      case AMDGPU::COPY:
        RC = TRI->getCommonSubClass(RC, inferRegClassFromUses(TRI, MRI,
@@ -180,24 +183,23 @@ bool SIFixSGPRCopies::isVGPRToSGPRCopy(const MachineInstr &Copy,
    unsigned SrcReg = Copy.getOperand(1).getReg();
    unsigned SrcSubReg = Copy.getOperand(1).getSubReg();
    const TargetRegisterClass *DstRC = MRI.getRegClass(DstReg);
+  const TargetRegisterClass *SrcRC;
  
    if (!TargetRegisterInfo::isVirtualRegister(SrcReg) ||
-      DstRC == &AMDGPU::M0RegRegClass)
+      DstRC == &AMDGPU::M0RegRegClass ||
+      MRI.getRegClass(SrcReg) == &AMDGPU::VReg_1RegClass)
      return false;
  
-  const TargetRegisterClass *SrcRC = TRI->getSubRegClass(
-      MRI.getRegClass(SrcReg), SrcSubReg);
-
-  return TRI->isSGPRClass(DstRC) &&
-         !TRI->getCommonSubClass(DstRC, SrcRC);
+  SrcRC = TRI->getSubRegClass(MRI.getRegClass(SrcReg), SrcSubReg);
+  return TRI->isSGPRClass(DstRC) && TRI->hasVGPRs(SrcRC);
  }
  
  bool SIFixSGPRCopies::runOnMachineFunction(MachineFunction &MF) {
    MachineRegisterInfo &MRI = MF.getRegInfo();
-  const SIRegisterInfo *TRI = static_cast<const SIRegisterInfo *>(
-      MF.getTarget().getRegisterInfo());
-  const SIInstrInfo *TII = static_cast<const SIInstrInfo *>(
-      MF.getTarget().getInstrInfo());
+  const SIRegisterInfo *TRI =
+      static_cast<const SIRegisterInfo *>(MF.getSubtarget().getRegisterInfo());
+  const SIInstrInfo *TII =
+      static_cast<const SIInstrInfo *>(MF.getSubtarget().getInstrInfo());
    for (MachineFunction::iterator BI = MF.begin(), BE = MF.end();
                                                    BI != BE; ++BI) {
  
@@ -236,14 +238,66 @@ bool SIFixSGPRCopies::runOnMachineFunction(MachineFunction &MF) {
  
          // If a PHI node defines an SGPR and any of its operands are VGPRs,
          // then we need to move it to the VALU.
+        //
+        // Also, if a PHI node defines an SGPR and has all SGPR operands
+        // we must move it to the VALU, because the SGPR operands will
+        // all end up being assigned the same register, which means
+        // there is a potential for a conflict if different threads take
+        // different control flow paths.
+        //
+        // For Example:
+        //
+        // sgpr0 = def;
+        // ...
+        // sgpr1 = def;
+        // ...
+        // sgpr2 = PHI sgpr0, sgpr1
+        // use sgpr2;
+        //
+        // Will Become:
+        //
+        // sgpr2 = def;
+        // ...
+        // sgpr2 = def;
+        // ...
+        // use sgpr2
+        //
+        // FIXME: This is OK if the branching decision is made based on an
+        // SGPR value.
+        bool SGPRBranch = false;
+
+        // The one exception to this rule is when one of the operands
+        // is defined by a SI_BREAK, SI_IF_BREAK, or SI_ELSE_BREAK
+        // instruction.  In this case, there we know the program will
+        // never enter the second block (the loop) without entering
+        // the first block (where the condition is computed), so there
+        // is no chance for values to be over-written.
+
+        bool HasBreakDef = false;
          for (unsigned i = 1; i < MI.getNumOperands(); i+=2) {
            unsigned Reg = MI.getOperand(i).getReg();
            if (TRI->hasVGPRs(MRI.getRegClass(Reg))) {
              TII->moveToVALU(MI);
              break;
            }
+          MachineInstr *DefInstr = MRI.getUniqueVRegDef(Reg);
+          assert(DefInstr);
+          switch(DefInstr->getOpcode()) {
+
+          case AMDGPU::SI_BREAK:
+          case AMDGPU::SI_IF_BREAK:
+          case AMDGPU::SI_ELSE_BREAK:
+          // If we see a PHI instruction that defines an SGPR, then that PHI
+          // instruction has already been considered and should have
+          // a *_BREAK as an operand.
+          case AMDGPU::PHI:
+            HasBreakDef = true;
+            break;
+          }
          }
  
+        if (!SGPRBranch && !HasBreakDef)
+          TII->moveToVALU(MI);
          break;
        }
        case AMDGPU::REG_SEQUENCE: {
@@ -251,11 +305,21 @@ bool SIFixSGPRCopies::runOnMachineFunction(MachineFunction &MF) {
              !hasVGPROperands(MI, TRI))
            continue;
  
-        DEBUG(dbgs() << "Fixing REG_SEQUENCE: \n");
-        DEBUG(MI.print(dbgs()));
+        DEBUG(dbgs() << "Fixing REG_SEQUENCE: " << MI);
  
          TII->moveToVALU(MI);
-        TII->legalizeOperands(&MI);
+        break;
+      }
+      case AMDGPU::INSERT_SUBREG: {
+        const TargetRegisterClass *DstRC, *Src0RC, *Src1RC;
+        DstRC = MRI.getRegClass(MI.getOperand(0).getReg());
+        Src0RC = MRI.getRegClass(MI.getOperand(1).getReg());
+        Src1RC = MRI.getRegClass(MI.getOperand(2).getReg());
+        if (TRI->isSGPRClass(DstRC) &&
+            (TRI->hasVGPRs(Src0RC) || TRI->hasVGPRs(Src1RC))) {
+          DEBUG(dbgs() << " Fixing INSERT_SUBREG: " << MI);
+          TII->moveToVALU(MI);
+        }
          break;
        }
        }