R600/SI: Prettier display of input modifiers

author Vincent Lejeune <vljn@ovi.com>

Sat, 10 May 2014 19:18:33 +0000 (19:18 +0000)

committer Vincent Lejeune <vljn@ovi.com>

Sat, 10 May 2014 19:18:33 +0000 (19:18 +0000)
author Vincent Lejeune <vljn@ovi.com>
Sat, 10 May 2014 19:18:33 +0000 (19:18 +0000)
committer Vincent Lejeune <vljn@ovi.com>
Sat, 10 May 2014 19:18:33 +0000 (19:18 +0000)
diff --git a/lib/Target/R600/InstPrinter/AMDGPUInstPrinter.cpp b/lib/Target/R600/InstPrinter/AMDGPUInstPrinter.cpp

index e2753719271b8f0c6ce2bcb1527a545e4782e4bc..11ae09102188c56a44229213ffca273076433d80 100644 (file)
--- a/lib/Target/R600/InstPrinter/AMDGPUInstPrinter.cpp
+++ b/lib/Target/R600/InstPrinter/AMDGPUInstPrinter.cpp
@@ -158,6 +158,18 @@ void AMDGPUInstPrinter::printOperand(const MCInst *MI, unsigned OpNo,
    }
  }
  
+void AMDGPUInstPrinter::printOperandAndMods(const MCInst *MI, unsigned OpNo,
+                                            raw_ostream &O) {
+  unsigned InputModifiers = MI->getOperand(OpNo).getImm();
+  if (InputModifiers & 0x1)
+    O << "-";
+  if (InputModifiers & 0x2)
+    O << "|";
+  printOperand(MI, OpNo + 1, O);
+  if (InputModifiers & 0x2)
+    O << "|";
+}
+
  void AMDGPUInstPrinter::printInterpSlot(const MCInst *MI, unsigned OpNum,
                                          raw_ostream &O) {
    unsigned Imm = MI->getOperand(OpNum).getImm();
diff --git a/lib/Target/R600/InstPrinter/AMDGPUInstPrinter.h b/lib/Target/R600/InstPrinter/AMDGPUInstPrinter.h

index f30fc49ab058e089f9251d57de1e7b9fece02d6d..6ca717076cde2f2f3a11f73608399ceeabc4aad3 100644 (file)
--- a/lib/Target/R600/InstPrinter/AMDGPUInstPrinter.h
+++ b/lib/Target/R600/InstPrinter/AMDGPUInstPrinter.h
@@ -38,6 +38,7 @@ private:
    void printRegOperand(unsigned RegNo, raw_ostream &O);
    void printImmediate(uint32_t Imm, raw_ostream &O);
    void printOperand(const MCInst *MI, unsigned OpNo, raw_ostream &O);
+  void printOperandAndMods(const MCInst *MI, unsigned OpNo, raw_ostream &O);
    static void printInterpSlot(const MCInst *MI, unsigned OpNum, raw_ostream &O);
    void printMemOperand(const MCInst *MI, unsigned OpNo, raw_ostream &O);
    static void printIfSet(const MCInst *MI, unsigned OpNo, raw_ostream &O,
diff --git a/lib/Target/R600/SIISelLowering.cpp b/lib/Target/R600/SIISelLowering.cpp

index 1fae8cd592d53f7652295b89e5498459a77703f4..466d24771ce34036cac39165fb58d59d3111a84f 100644 (file)
--- a/lib/Target/R600/SIISelLowering.cpp
+++ b/lib/Target/R600/SIISelLowering.cpp
@@ -576,12 +576,12 @@ MachineBasicBlock * SITargetLowering::EmitInstrWithCustomInserter(
        static_cast<const SIInstrInfo*>(getTargetMachine().getInstrInfo());
      BuildMI(*BB, I, MI->getDebugLoc(), TII->get(AMDGPU::V_ADD_F32_e64),
              MI->getOperand(0).getReg())
+            .addImm(0) // SRC0 modifiers
              .addOperand(MI->getOperand(1))
+            .addImm(0) // SRC1 modifiers
              .addImm(0) // SRC1
-            .addImm(0) // ABS
              .addImm(1) // CLAMP
-            .addImm(0) // OMOD
-            .addImm(0); // NEG
+            .addImm(0); // OMOD
      MI->eraseFromParent();
    }
    }
@@ -1325,7 +1325,6 @@ SDNode *SITargetLowering::foldOperands(MachineSDNode *Node,
    const MCInstrDesc *DescE64 = OpcodeE64 == -1 ? nullptr : &TII->get(OpcodeE64);
  
    assert(!DescE64 || DescE64->getNumDefs() == NumDefs);
-  assert(!DescE64 || DescE64->getNumOperands() == (NumOps + 4));
  
    int32_t Immediate = Desc->getSize() == 4 ? 0 : -1;
    bool HaveVSrc = false, HaveSSrc = false;
@@ -1422,8 +1421,15 @@ SDNode *SITargetLowering::foldOperands(MachineSDNode *Node,
    }
  
    if (Promote2e64) {
+    std::vector<SDValue> OldOps(Ops);
+    Ops.clear();
+    for (unsigned i = 0; i < OldOps.size(); ++i) {
+      // src_modifier
+      Ops.push_back(DAG.getTargetConstant(0, MVT::i32));
+      Ops.push_back(OldOps[i]);
+    }
      // Add the modifier flags while promoting
-    for (unsigned i = 0; i < 4; ++i)
+    for (unsigned i = 0; i < 2; ++i)
        Ops.push_back(DAG.getTargetConstant(0, MVT::i32));
    }
  
diff --git a/lib/Target/R600/SIInstrFormats.td b/lib/Target/R600/SIInstrFormats.td

index aa2c22c51eb49041264ebe438b23471de5908cb7..4b2194b598e52fdf89236587727b885c40e1504b 100644 (file)
--- a/lib/Target/R600/SIInstrFormats.td
+++ b/lib/Target/R600/SIInstrFormats.td
@@ -210,16 +210,19 @@ class VOP3 <bits<9> op, dag outs, dag ins, string asm, list<dag> pattern> :
      Enc64 <outs, ins, asm, pattern> {
  
    bits<8> dst;
+  bits<2> src0_modifiers;
    bits<9> src0;
+  bits<2> src1_modifiers;
    bits<9> src1;
+  bits<2> src2_modifiers;
    bits<9> src2;
-  bits<3> abs;
    bits<1> clamp;
    bits<2> omod;
-  bits<3> neg;
  
    let Inst{7-0} = dst;
-  let Inst{10-8} = abs;
+  let Inst{8} = src0_modifiers{1};
+  let Inst{9} = src1_modifiers{1};
+  let Inst{10} = src2_modifiers{1};
    let Inst{11} = clamp;
    let Inst{25-17} = op;
    let Inst{31-26} = 0x34; //encoding
@@ -227,7 +230,9 @@ class VOP3 <bits<9> op, dag outs, dag ins, string asm, list<dag> pattern> :
    let Inst{49-41} = src1;
    let Inst{58-50} = src2;
    let Inst{60-59} = omod;
-  let Inst{63-61} = neg;
+  let Inst{61} = src0_modifiers{0};
+  let Inst{62} = src1_modifiers{0};
+  let Inst{63} = src2_modifiers{0};
    
    let mayLoad = 0;
    let mayStore = 0;
@@ -240,12 +245,14 @@ class VOP3b <bits<9> op, dag outs, dag ins, string asm, list<dag> pattern> :
      Enc64 <outs, ins, asm, pattern> {
  
    bits<8> dst;
+  bits<2> src0_modifiers;
    bits<9> src0;
+  bits<2> src1_modifiers;
    bits<9> src1;
+  bits<2> src2_modifiers;
    bits<9> src2;
    bits<7> sdst;
    bits<2> omod;
-  bits<3> neg;
  
    let Inst{7-0} = dst;
    let Inst{14-8} = sdst;
@@ -255,7 +262,9 @@ class VOP3b <bits<9> op, dag outs, dag ins, string asm, list<dag> pattern> :
    let Inst{49-41} = src1;
    let Inst{58-50} = src2;
    let Inst{60-59} = omod;
-  let Inst{63-61} = neg;
+  let Inst{61} = src0_modifiers{0};
+  let Inst{62} = src1_modifiers{0};
+  let Inst{63} = src2_modifiers{0};
  
    let mayLoad = 0;
    let mayStore = 0;
diff --git a/lib/Target/R600/SIInstrInfo.cpp b/lib/Target/R600/SIInstrInfo.cpp

index 029b97ee36a97abffd6ed7a02035912157bcf616..fbea8f966faf6f6ef3eb9e117eacd0e66f96e470 100644 (file)
--- a/lib/Target/R600/SIInstrInfo.cpp
+++ b/lib/Target/R600/SIInstrInfo.cpp
@@ -1188,6 +1188,10 @@ void SIInstrInfo::moveToVALU(MachineInstr &TopInst) const {
        // We are converting these to a BFE, so we need to add the missing
        // operands for the size and offset.
        unsigned Size = (Opcode == AMDGPU::S_SEXT_I32_I8) ? 8 : 16;
+      Inst->addOperand(Inst->getOperand(1));
+      Inst->getOperand(1).ChangeToImmediate(0);
+      Inst->addOperand(MachineOperand::CreateImm(0));
+      Inst->addOperand(MachineOperand::CreateImm(0));
        Inst->addOperand(MachineOperand::CreateImm(0));
        Inst->addOperand(MachineOperand::CreateImm(Size));
  
@@ -1195,8 +1199,6 @@ void SIInstrInfo::moveToVALU(MachineInstr &TopInst) const {
        // 3 to not hit an assertion later in MCInstLower.
        Inst->addOperand(MachineOperand::CreateImm(0));
        Inst->addOperand(MachineOperand::CreateImm(0));
-      Inst->addOperand(MachineOperand::CreateImm(0));
-      Inst->addOperand(MachineOperand::CreateImm(0));
      }
  
      addDescImplicitUseDef(NewDesc, Inst);
@@ -1213,10 +1215,11 @@ void SIInstrInfo::moveToVALU(MachineInstr &TopInst) const {
        uint32_t BitWidth = (Imm & 0x7f0000) >> 16; // Extract bits [22:16].
  
        Inst->RemoveOperand(2); // Remove old immediate.
+      Inst->addOperand(Inst->getOperand(1));
+      Inst->getOperand(1).ChangeToImmediate(0);
        Inst->addOperand(MachineOperand::CreateImm(Offset));
-      Inst->addOperand(MachineOperand::CreateImm(BitWidth));
-
        Inst->addOperand(MachineOperand::CreateImm(0));
+      Inst->addOperand(MachineOperand::CreateImm(BitWidth));
        Inst->addOperand(MachineOperand::CreateImm(0));
        Inst->addOperand(MachineOperand::CreateImm(0));
        Inst->addOperand(MachineOperand::CreateImm(0));
diff --git a/lib/Target/R600/SIInstrInfo.td b/lib/Target/R600/SIInstrInfo.td

index b86d227800130b4c42639fe171601dc4d8b82848..5f18d98195e3aa3ff71d4245a245d8c220d15db3 100644 (file)
--- a/lib/Target/R600/SIInstrInfo.td
+++ b/lib/Target/R600/SIInstrInfo.td
@@ -245,6 +245,11 @@ class VOP2_REV <string revOp, bit isOrig> {
    bit IsOrig = isOrig;
  }
  
+// This must always be right before the operand being input modified.
+def InputMods : OperandWithDefaultOps <i32, (ops (i32 0))> {
+  let PrintMethod = "printOperandAndMods";
+}
+
  multiclass VOP1_Helper <bits<8> op, RegisterClass drc, RegisterClass src,
                          string opName, list<dag> pattern> {
  
@@ -256,10 +261,8 @@ multiclass VOP1_Helper <bits<8> op, RegisterClass drc, RegisterClass src,
    def _e64 : VOP3 <
      {1, 1, op{6}, op{5}, op{4}, op{3}, op{2}, op{1}, op{0}},
      (outs drc:$dst),
-    (ins src:$src0,
-         i32imm:$abs, i32imm:$clamp,
-         i32imm:$omod, i32imm:$neg),
-    opName#"_e64 $dst, $src0, $abs, $clamp, $omod, $neg", []
+    (ins InputMods:$src0_modifiers, src:$src0, i32imm:$clamp, i32imm:$omod),
+    opName#"_e64 $dst, $src0_modifiers, $clamp, $omod", []
    >, VOP <opName> {
      let src1 = SIOperand.ZERO;
      let src2 = SIOperand.ZERO;
@@ -288,10 +291,10 @@ multiclass VOP2_Helper <bits<6> op, RegisterClass vrc, RegisterClass arc,
    def _e64 : VOP3 <
      {1, 0, 0, op{5}, op{4}, op{3}, op{2}, op{1}, op{0}},
      (outs vrc:$dst),
-    (ins arc:$src0, arc:$src1,
-         i32imm:$abs, i32imm:$clamp,
-         i32imm:$omod, i32imm:$neg),
-    opName#"_e64 $dst, $src0, $src1, $abs, $clamp, $omod, $neg", []
+    (ins InputMods:$src0_modifiers, arc:$src0,
+         InputMods:$src1_modifiers, arc:$src1,
+         i32imm:$clamp, i32imm:$omod),
+    opName#"_e64 $dst, $src0_modifiers, $src1_modifiers, $clamp, $omod", []
    >, VOP <opName>, VOP2_REV<revOp#"_e64", !eq(revOp, opName)> {
      let src2 = SIOperand.ZERO;
    }
@@ -316,10 +319,10 @@ multiclass VOP2b_32 <bits<6> op, string opName, list<dag> pattern,
    def _e64 : VOP3b <
      {1, 0, 0, op{5}, op{4}, op{3}, op{2}, op{1}, op{0}},
      (outs VReg_32:$dst),
-    (ins VSrc_32:$src0, VSrc_32:$src1,
-         i32imm:$abs, i32imm:$clamp,
-         i32imm:$omod, i32imm:$neg),
-    opName#"_e64 $dst, $src0, $src1, $abs, $clamp, $omod, $neg", []
+    (ins InputMods: $src0_modifiers, VSrc_32:$src0,
+         InputMods:$src1_modifiers, VSrc_32:$src1,
+         i32imm:$clamp, i32imm:$omod),
+    opName#"_e64 $dst, $src0_modifiers, $src1_modifiers, $clamp, $omod", []
    >, VOP <opName>, VOP2_REV<revOp#"_e64", !eq(revOp, opName)> {
      let src2 = SIOperand.ZERO;
      /* the VOP2 variant puts the carry out into VCC, the VOP3 variant
@@ -340,15 +343,16 @@ multiclass VOPC_Helper <bits<8> op, RegisterClass vrc, RegisterClass arc,
    def _e64 : VOP3 <
      {0, op{7}, op{6}, op{5}, op{4}, op{3}, op{2}, op{1}, op{0}},
      (outs SReg_64:$dst),
-    (ins arc:$src0, arc:$src1,
-         InstFlag:$abs, InstFlag:$clamp,
-         InstFlag:$omod, InstFlag:$neg),
-    opName#"_e64 $dst, $src0, $src1, $abs, $clamp, $omod, $neg",
+    (ins InputMods:$src0_modifiers, arc:$src0,
+         InputMods:$src1_modifiers, arc:$src1,
+         InstFlag:$clamp, InstFlag:$omod),
+    opName#"_e64 $dst, $src0_modifiers, $src1_modifiers, $clamp, $omod",
      !if(!eq(!cast<string>(cond), "COND_NULL"), []<dag>,
        [(set SReg_64:$dst, (i1 (setcc (vt arc:$src0), arc:$src1, cond)))]
      )
    >, VOP <opName> {
      let src2 = SIOperand.ZERO;
+    let src2_modifiers = 0;
    }
  }
  
@@ -362,9 +366,10 @@ multiclass VOPC_64 <bits<8> op, string opName,
  
  class VOP3_32 <bits<9> op, string opName, list<dag> pattern> : VOP3 <
    op, (outs VReg_32:$dst),
-  (ins VSrc_32:$src0, VSrc_32:$src1, VSrc_32:$src2,
-   InstFlag:$abs, InstFlag:$clamp, InstFlag:$omod, InstFlag:$neg),
-  opName#" $dst, $src0, $src1, $src2, $abs, $clamp, $omod, $neg", pattern
+  (ins InputMods: $src0_modifiers, VSrc_32:$src0, InputMods:$src1_modifiers,
+   VSrc_32:$src1, InputMods:$src2_modifiers, VSrc_32:$src2,
+   InstFlag:$clamp, InstFlag:$omod),
+  opName#" $dst, $src0_modifiers, $src1, $src2, $clamp, $omod", pattern
  >, VOP <opName>;
  
  class VOP3_64_Shift <bits <9> op, string opName, list<dag> pattern> : VOP3 <
@@ -374,10 +379,9 @@ class VOP3_64_Shift <bits <9> op, string opName, list<dag> pattern> : VOP3 <
  >, VOP <opName> {
  
    let src2 = SIOperand.ZERO;
-  let abs = 0;
+  let src0_modifiers = 0;
    let clamp = 0;
    let omod = 0;
-  let neg = 0;
  }
  
  class VOP3_64 <bits<9> op, string opName, list<dag> pattern> : VOP3 <
diff --git a/lib/Target/R600/SIInstructions.td b/lib/Target/R600/SIInstructions.td

index 7d6624b0404bff6e105b057cbf94749de8dce435..1ede24fd97626b68d7ffb43d20434fdc991c4b52 100644 (file)
--- a/lib/Target/R600/SIInstructions.td
+++ b/lib/Target/R600/SIInstructions.td
@@ -1115,7 +1115,11 @@ def V_CNDMASK_B32_e64 : VOP3 <0x00000100, (outs VReg_32:$dst),
     InstFlag:$abs, InstFlag:$clamp, InstFlag:$omod, InstFlag:$neg),
    "V_CNDMASK_B32_e64 $dst, $src0, $src1, $src2, $abs, $clamp, $omod, $neg",
    [(set i32:$dst, (select i1:$src2, i32:$src1, i32:$src0))]
->;
+> {
+  let src0_modifiers = 0;
+  let src1_modifiers = 0;
+  let src2_modifiers = 0;
+}
  
  //f32 pattern for V_CNDMASK_B32_e64
  def : Pat <
@@ -2138,7 +2142,7 @@ def : Pat <
  def : Pat <
    (int_SI_tid),
    (V_MBCNT_HI_U32_B32_e32 0xffffffff,
-                          (V_MBCNT_LO_U32_B32_e64 0xffffffff, 0, 0, 0, 0, 0))
+                          (V_MBCNT_LO_U32_B32_e64 0xffffffff, 0, 0, 0))
  >;
  
  /********** ================== **********/
diff --git a/test/CodeGen/R600/fneg.ll b/test/CodeGen/R600/fneg.ll

index f4e6be62467af908f164c496dc0a068af571c908..7ad760cadbb0b35bcd5e43559d81657eb649cdf7 100644 (file)
--- a/test/CodeGen/R600/fneg.ll
+++ b/test/CodeGen/R600/fneg.ll
@@ -51,7 +51,7 @@ entry:
  ; R600-CHECK: -KC0[2].Z
  ; SI-CHECK-LABEL: @fneg_free
  ; XXX: We could use V_ADD_F32_e64 with the negate bit here instead.
-; SI-CHECK: V_SUB_F32_e64 v{{[0-9]}}, 0.000000e+00, s{{[0-9]}}, 0, 0, 0, 0
+; SI-CHECK: V_SUB_F32_e64 v{{[0-9]}}, 0.000000e+00, s{{[0-9]}}, 0, 0
  define void @fneg_free(float addrspace(1)* %out, i32 %in) {
  entry:
    %0 = bitcast i32 %in to float
diff --git a/test/CodeGen/R600/seto.ll b/test/CodeGen/R600/seto.ll

index 8633a4b804af3b6e81fc5a5cf3be4e2e6e15b549..e90e7886a6a67922464fbe4bad7a47f8abec00f2 100644 (file)
--- a/test/CodeGen/R600/seto.ll
+++ b/test/CodeGen/R600/seto.ll
@@ -1,6 +1,7 @@
  ;RUN: llc < %s -march=r600 -mcpu=verde -verify-machineinstrs | FileCheck %s
  
-;CHECK: V_CMP_O_F32_e64 s[0:1], {{[sv][0-9]+, [sv][0-9]+}}, 0, 0, 0, 0
+;CHECK-LABEL: @main
+;CHECK: V_CMP_O_F32_e64 s[0:1], {{[sv][0-9]+, [sv][0-9]+}}, 0, 0
  
  define void @main(float %p) {
  main_body:
diff --git a/test/CodeGen/R600/setuo.ll b/test/CodeGen/R600/setuo.ll

index c77a37e19041872d7e6f9b8e6ae5b4ade08d4737..3b1db8b062bff83da862faded5730001e064d67d 100644 (file)
--- a/test/CodeGen/R600/setuo.ll
+++ b/test/CodeGen/R600/setuo.ll
@@ -1,6 +1,7 @@
  ;RUN: llc < %s -march=r600 -mcpu=verde -verify-machineinstrs | FileCheck %s
  
-;CHECK: V_CMP_U_F32_e64 s[0:1], {{[sv][0-9]+, [sv][0-9]+}}, 0, 0, 0, 0
+;CHECK-LABEL: @main
+;CHECK: V_CMP_U_F32_e64 s[0:1], {{[sv][0-9]+, [sv][0-9]+}}, 0, 0
  
  define void @main(float %p) {
  main_body:
author	Vincent Lejeune <vljn@ovi.com>
	Sat, 10 May 2014 19:18:33 +0000 (19:18 +0000)
committer	Vincent Lejeune <vljn@ovi.com>
	Sat, 10 May 2014 19:18:33 +0000 (19:18 +0000)
lib/Target/R600/InstPrinter/AMDGPUInstPrinter.cpp		patch \| blob \| history
lib/Target/R600/InstPrinter/AMDGPUInstPrinter.h		patch \| blob \| history
lib/Target/R600/SIISelLowering.cpp		patch \| blob \| history
lib/Target/R600/SIInstrFormats.td		patch \| blob \| history
lib/Target/R600/SIInstrInfo.cpp		patch \| blob \| history
lib/Target/R600/SIInstrInfo.td		patch \| blob \| history
lib/Target/R600/SIInstructions.td		patch \| blob \| history
test/CodeGen/R600/fneg.ll		patch \| blob \| history
test/CodeGen/R600/seto.ll		patch \| blob \| history
test/CodeGen/R600/setuo.ll		patch \| blob \| history