Several changes to Mips backend, experimental fp support being the most

[oota-llvm.git] / lib / Target / Mips / MipsInstrInfo.td
diff --git a/lib/Target/Mips/MipsInstrInfo.td b/lib/Target/Mips/MipsInstrInfo.td

index b1f975482aaa93b9f35089b285c3ac8f2f110b4a..f78fd5dae8701cfc2e94310257506638149ea6fa 100644 (file)
--- a/lib/Target/Mips/MipsInstrInfo.td
+++ b/lib/Target/Mips/MipsInstrInfo.td
@@ -2,8 +2,8 @@
  //
  //                     The LLVM Compiler Infrastructure
  //
-// This file was developed by Bruno Cardoso Lopes and is distributed under the 
-// University of Illinois Open Source License. See LICENSE.TXT for details.
+// This file is distributed under the University of Illinois Open Source
+// License. See LICENSE.TXT for details.
  //
  //===----------------------------------------------------------------------===//
  
@@ -17,41 +17,51 @@ include "MipsInstrFormats.td"
  // Mips profiles and nodes
  //===----------------------------------------------------------------------===//
  
+def SDT_MipsRet          : SDTypeProfile<0, 1, [SDTCisInt<0>]>;
+def SDT_MipsJmpLink      : SDTypeProfile<0, 1, [SDTCisVT<0, iPTR>]>;
+def SDT_MipsSelectCC     : SDTypeProfile<1, 3, [SDTCisSameAs<0, 1>, 
+                                         SDTCisSameAs<1, 2>, SDTCisInt<3>]>;
+def SDT_MipsCallSeqStart : SDCallSeqStart<[SDTCisVT<0, i32>]>;
+def SDT_MipsCallSeqEnd   : SDCallSeqEnd<[SDTCisVT<0, i32>, SDTCisVT<1, i32>]>;
+
  // Call
-def SDT_MipsJmpLink : SDTypeProfile<0, 1, [SDTCisVT<0, iPTR>]>;
-def MipsJmpLink     : SDNode<"MipsISD::JmpLink",SDT_MipsJmpLink, [SDNPHasChain,
-                             SDNPOutFlag]>;
-
-// Hi and Lo nodes are created to let easy manipulation of 16-bit when 
-// handling 32-bit immediates. They are used on MipsISelLowering to 
-// lower stuff like GlobalAddress, ExternalSymbol, ...
-// This two nodes have nothing to do with Mips Registers Hi and Lo.
-def MipsHi : SDNode<"MipsISD::Hi", SDTIntUnaryOp, [SDNPOutFlag]>;
-def MipsLo : SDNode<"MipsISD::Lo", SDTIntUnaryOp>; 
-
-// Necessary to generate glued instructions when loading GlobalAddress
-// into registers.
-def MipsAdd : SDNode<"MipsISD::Add", SDTIntBinOp, [SDNPCommutative, 
-                     SDNPAssociative, SDNPOptInFlag]>;
-
-// Return 
-def SDT_MipsRet : SDTypeProfile<0, 1, [SDTCisInt<0>]>; 
-def MipsRet     : SDNode<"MipsISD::Ret", SDT_MipsRet, [SDNPHasChain, 
-                             SDNPOptInFlag]>;
+def MipsJmpLink : SDNode<"MipsISD::JmpLink",SDT_MipsJmpLink, [SDNPHasChain,
+                         SDNPOutFlag]>;
+
+// Hi and Lo nodes are used to handle global addresses. Used on 
+// MipsISelLowering to lower stuff like GlobalAddress, ExternalSymbol 
+// static model. (nothing to do with Mips Registers Hi and Lo)
+def MipsHi  : SDNode<"MipsISD::Hi", SDTIntUnaryOp, [SDNPOutFlag]>;
+def MipsLo  : SDNode<"MipsISD::Lo", SDTIntUnaryOp>;
+
+// Return
+def MipsRet : SDNode<"MipsISD::Ret", SDT_MipsRet, [SDNPHasChain, 
+                     SDNPOptInFlag]>;
  
  // These are target-independent nodes, but have target-specific formats.
-def SDT_MipsCallSeq : SDTypeProfile<0, 1, [SDTCisVT<0, i32>]>;
-def callseq_start   : SDNode<"ISD::CALLSEQ_START", SDT_MipsCallSeq, 
-                             [SDNPHasChain, SDNPOutFlag]>;
-def callseq_end     : SDNode<"ISD::CALLSEQ_END", SDT_MipsCallSeq, 
-                             [SDNPHasChain, SDNPOutFlag]>;
+def callseq_start : SDNode<"ISD::CALLSEQ_START", SDT_MipsCallSeqStart,
+                           [SDNPHasChain, SDNPOutFlag]>;
+def callseq_end   : SDNode<"ISD::CALLSEQ_END", SDT_MipsCallSeqEnd,
+                           [SDNPHasChain, SDNPOptInFlag, SDNPOutFlag]>;
+
+// Select Condition Code
+def MipsSelectCC  : SDNode<"MipsISD::SelectCC", SDT_MipsSelectCC>;
+
+//===----------------------------------------------------------------------===//
+// Mips Instruction Predicate Definitions.
+//===----------------------------------------------------------------------===//
+def IsAllegrex : Predicate<"Subtarget.isAllegrex()">;
+
+//===----------------------------------------------------------------------===//
+// Mips Operand, Complex Patterns and Transformations Definitions.
+//===----------------------------------------------------------------------===//
  
  // Instruction operand types
  def brtarget    : Operand<OtherVT>;
  def calltarget  : Operand<i32>;
  def uimm16      : Operand<i32>;
  def simm16      : Operand<i32>;
-def shamt       : Operand<i32>; 
+def shamt       : Operand<i32>;
  
  // Address operand
  def mem : Operand<i32> {
@@ -59,10 +69,6 @@ def mem : Operand<i32> {
    let MIOperandInfo = (ops simm16, CPURegs);
  }
  
-//===----------------------------------------------------------------------===//
-// Mips Patterns and Transformations
-//===----------------------------------------------------------------------===//
-
  // Transformation Function - get the lower 16 bits.
  def LO16 : SDNodeXForm<imm, [{
    return getI32Imm((unsigned)N->getValue() & 0xFFFF);
@@ -78,7 +84,7 @@ def HI16 : SDNodeXForm<imm, [{
  def immSExt16  : PatLeaf<(imm), [{
    if (N->getValueType(0) == MVT::i32)
      return (int32_t)N->getValue() == (short)N->getValue();
-  else    
+  else
      return (int64_t)N->getValue() == (short)N->getValue();
  }]>;
  
@@ -89,7 +95,7 @@ def immSExt16  : PatLeaf<(imm), [{
  def immZExt16  : PatLeaf<(imm), [{
    if (N->getValueType(0) == MVT::i32)
      return (uint32_t)N->getValue() == (unsigned short)N->getValue();
-  else    
+  else
      return (uint64_t)N->getValue() == (unsigned short)N->getValue();
  }], LO16>;
  
@@ -103,7 +109,7 @@ def immZExt5 : PatLeaf<(imm), [{
    return N->getValue() == ((N->getValue()) & 0x1f) ;
  }]>;
  
-// Mips Address Mode! SDNode frameindex could possibily be a match 
+// Mips Address Mode! SDNode frameindex could possibily be a match
  // since load and store instructions from stack used it.
  def addr : ComplexPattern<i32, 2, "SelectAddr", [frameindex], []>;
  
@@ -112,52 +118,51 @@ def addr : ComplexPattern<i32, 2, "SelectAddr", [frameindex], []>;
  //===----------------------------------------------------------------------===//
  
  // Arithmetic 3 register operands
-let isCommutable = 1 in 
+let isCommutable = 1 in
  class ArithR<bits<6> op, bits<6> func, string instr_asm, SDNode OpNode,
-             InstrItinClass itin>: 
-  FR< op, 
-      func, 
-      (outs CPURegs:$dst), 
-      (ins CPURegs:$b, CPURegs:$c), 
-      !strconcat(instr_asm, " $dst, $b, $c"), 
+             InstrItinClass itin>:
+  FR< op,
+      func,
+      (outs CPURegs:$dst),
+      (ins CPURegs:$b, CPURegs:$c),
+      !strconcat(instr_asm, " $dst, $b, $c"),
        [(set CPURegs:$dst, (OpNode CPURegs:$b, CPURegs:$c))], itin>;
  
-let isCommutable = 1 in 
-class ArithOverflowR<bits<6> op, bits<6> func, string instr_asm>: 
-  FR< op, 
-      func, 
-      (outs CPURegs:$dst), 
-      (ins CPURegs:$b, CPURegs:$c), 
-      !strconcat(instr_asm, " $dst, $b, $c"), 
+let isCommutable = 1 in
+class ArithOverflowR<bits<6> op, bits<6> func, string instr_asm>:
+  FR< op,
+      func,
+      (outs CPURegs:$dst),
+      (ins CPURegs:$b, CPURegs:$c),
+      !strconcat(instr_asm, " $dst, $b, $c"),
        [], IIAlu>;
  
  // Arithmetic 2 register operands
-let isCommutable = 1 in
-class ArithI<bits<6> op, string instr_asm, SDNode OpNode, 
-             Operand Od, PatLeaf imm_type> : 
-  FI< op, 
-      (outs CPURegs:$dst), 
-      (ins CPURegs:$b, Od:$c), 
-      !strconcat(instr_asm, " $dst, $b, $c"), 
+class ArithI<bits<6> op, string instr_asm, SDNode OpNode,
+             Operand Od, PatLeaf imm_type> :
+  FI< op,
+      (outs CPURegs:$dst),
+      (ins CPURegs:$b, Od:$c),
+      !strconcat(instr_asm, " $dst, $b, $c"),
        [(set CPURegs:$dst, (OpNode CPURegs:$b, imm_type:$c))], IIAlu>;
  
  // Arithmetic Multiply ADD/SUB
  let rd=0 in
-class MArithR<bits<6> func, string instr_asm> : 
-  FR< 0x1c, 
+class MArithR<bits<6> func, string instr_asm> :
+  FR< 0x1c,
        func,
-      (outs CPURegs:$rs), 
-      (ins CPURegs:$rt), 
-      !strconcat(instr_asm, " $rs, $rt"), 
+      (outs CPURegs:$rs),
+      (ins CPURegs:$rt),
+      !strconcat(instr_asm, " $rs, $rt"),
        [], IIImul>;
  
  //  Logical
  class LogicR<bits<6> func, string instr_asm, SDNode OpNode>:
-  FR< 0x00, 
-      func, 
-      (outs CPURegs:$dst), 
-      (ins CPURegs:$b, CPURegs:$c), 
-      !strconcat(instr_asm, " $dst, $b, $c"), 
+  FR< 0x00,
+      func,
+      (outs CPURegs:$dst),
+      (ins CPURegs:$b, CPURegs:$c),
+      !strconcat(instr_asm, " $dst, $b, $c"),
        [(set CPURegs:$dst, (OpNode CPURegs:$b, CPURegs:$c))], IIAlu>;
  
  class LogicI<bits<6> op, string instr_asm, SDNode OpNode>:
@@ -165,32 +170,32 @@ class LogicI<bits<6> op, string instr_asm, SDNode OpNode>:
        (outs CPURegs:$dst),
        (ins CPURegs:$b, uimm16:$c),
        !strconcat(instr_asm, " $dst, $b, $c"),
-      [(set CPURegs:$dst, (OpNode CPURegs:$b, immSExt16:$c))], IIAlu>;
+      [(set CPURegs:$dst, (OpNode CPURegs:$b, immZExt16:$c))], IIAlu>;
  
  class LogicNOR<bits<6> op, bits<6> func, string instr_asm>:
-  FR< op, 
-      func, 
-      (outs CPURegs:$dst), 
-      (ins CPURegs:$b, CPURegs:$c), 
-      !strconcat(instr_asm, " $dst, $b, $c"), 
+  FR< op,
+      func,
+      (outs CPURegs:$dst),
+      (ins CPURegs:$b, CPURegs:$c),
+      !strconcat(instr_asm, " $dst, $b, $c"),
        [(set CPURegs:$dst, (not (or CPURegs:$b, CPURegs:$c)))], IIAlu>;
  
  // Shifts
  let rt = 0 in
  class LogicR_shift_imm<bits<6> func, string instr_asm, SDNode OpNode>:
-  FR< 0x00, 
-      func, 
+  FR< 0x00,
+      func,
        (outs CPURegs:$dst),
        (ins CPURegs:$b, shamt:$c),
-      !strconcat(instr_asm, " $dst, $b, $c"), 
+      !strconcat(instr_asm, " $dst, $b, $c"),
        [(set CPURegs:$dst, (OpNode CPURegs:$b, immZExt5:$c))], IIAlu>;
  
  class LogicR_shift_reg<bits<6> func, string instr_asm, SDNode OpNode>:
-  FR< 0x00, 
-      func, 
+  FR< 0x00,
+      func,
        (outs CPURegs:$dst),
        (ins CPURegs:$b, CPURegs:$c),
-      !strconcat(instr_asm, " $dst, $b, $c"), 
+      !strconcat(instr_asm, " $dst, $b, $c"),
        [(set CPURegs:$dst, (OpNode CPURegs:$b, CPURegs:$c))], IIAlu>;
  
  // Load Upper Imediate
@@ -201,8 +206,8 @@ class LoadUpper<bits<6> op, string instr_asm>:
        !strconcat(instr_asm, " $dst, $imm"),
        [], IIAlu>;
  
-// Memory Load/Store 
-let isLoad = 1, hasDelaySlot = 1 in
+// Memory Load/Store
+let isSimpleLoad = 1, hasDelaySlot = 1 in
  class LoadM<bits<6> op, string instr_asm, PatFrag OpNode>:
    FI< op,
        (outs CPURegs:$dst),
@@ -210,7 +215,6 @@ class LoadM<bits<6> op, string instr_asm, PatFrag OpNode>:
        !strconcat(instr_asm, " $dst, $addr"),
        [(set CPURegs:$dst, (OpNode addr:$addr))], IILoad>;
  
-let isStore = 1 in
  class StoreM<bits<6> op, string instr_asm, PatFrag OpNode>:
    FI< op,
        (outs),
@@ -236,9 +240,9 @@ class CBranchZero<bits<6> op, string instr_asm, PatFrag cond_op>:
        !strconcat(instr_asm, " $src, $offset"),
        [(brcond (cond_op CPURegs:$src, 0), bb:$offset)],
        IIBranch>;
-}      
+}
  
-// SetCC 
+// SetCC
  class SetCC_R<bits<6> op, bits<6> func, string instr_asm,
        PatFrag cond_op>:
    FR< op,
@@ -274,14 +278,14 @@ class JumpFR<bits<6> op, bits<6> func, string instr_asm>:
        (outs),
        (ins CPURegs:$target),
        !strconcat(instr_asm, " $target"),
-      [], IIBranch>;
+      [(brind CPURegs:$target)], IIBranch>;
  
  // Jump and Link (Call)
-let isCall=1, hasDelaySlot=1, 
+let isCall=1, hasDelaySlot=1,
    // All calls clobber the non-callee saved registers...
-  Defs = [AT, V0, V1, A0, A1, A2, A3, T0, T1, T2, 
-          T3, T4, T5, T6, T7, T8, T9, K0, K1, GP] in {
-  class JumpLink<bits<6> op, string instr_asm>: 
+  Defs = [AT, V0, V1, A0, A1, A2, A3, T0, T1, T2,
+          T3, T4, T5, T6, T7, T8, T9, K0, K1], Uses = [GP] in {
+  class JumpLink<bits<6> op, string instr_asm>:
      FJ< op,
          (outs),
          (ins calltarget:$target),
@@ -305,54 +309,80 @@ let isCall=1, hasDelaySlot=1,
          [], IIBranch>;
  }
  
-// Mul, Div 
-class MulDiv<bits<6> func, string instr_asm, InstrItinClass itin>: 
-  FR< 0x00, 
-      func, 
+// Mul, Div
+class MulDiv<bits<6> func, string instr_asm, InstrItinClass itin>:
+  FR< 0x00,
+      func,
        (outs),
-      (ins CPURegs:$a, CPURegs:$b), 
-      !strconcat(instr_asm, " $a, $b"), 
+      (ins CPURegs:$a, CPURegs:$b),
+      !strconcat(instr_asm, " $a, $b"),
        [], itin>;
  
-// Move from Hi/Lo 
+// Move from Hi/Lo
  class MoveFromTo<bits<6> func, string instr_asm>:
-  FR< 0x00, 
-      func, 
-      (outs CPURegs:$dst), 
+  FR< 0x00,
+      func,
+      (outs CPURegs:$dst),
        (ins),
-      !strconcat(instr_asm, " $dst"), 
+      !strconcat(instr_asm, " $dst"),
        [], IIHiLo>;
  
  // Count Leading Ones/Zeros in Word
  class CountLeading<bits<6> func, string instr_asm>:
-  FR< 0x1c, 
-      func, 
-      (outs CPURegs:$dst), 
-      (ins CPURegs:$src), 
-      !strconcat(instr_asm, " $dst, $src"), 
+  FR< 0x1c,
+      func,
+      (outs CPURegs:$dst),
+      (ins CPURegs:$src),
+      !strconcat(instr_asm, " $dst, $src"),
        [], IIAlu>;
  
+class EffectiveAddress<string instr_asm> :
+  FI<0x09,
+     (outs CPURegs:$dst),
+     (ins mem:$addr),
+     instr_asm,
+     [(set CPURegs:$dst, addr:$addr)], IIAlu>;
+
+class SignExtInReg<bits<6> func, string instr_asm, ValueType vt>:
+  FR< 0x3f, func, (outs CPURegs:$dst), (ins CPURegs:$src),
+      !strconcat(instr_asm, " $dst, $src"),
+      [(set CPURegs:$dst, (sext_inreg CPURegs:$src, vt))], NoItinerary>;
+
  
  //===----------------------------------------------------------------------===//
  // Pseudo instructions
  //===----------------------------------------------------------------------===//
  
-class Pseudo<dag outs, dag ins, string asmstr, list<dag> pattern>:
-      MipsInst<outs, ins, asmstr, pattern, IIPseudo>;
-
  // As stack alignment is always done with addiu, we need a 16-bit immediate
  let Defs = [SP], Uses = [SP] in {
-def ADJCALLSTACKDOWN : Pseudo<(outs), (ins uimm16:$amt),
-                              "!ADJCALLSTACKDOWN $amt",
-                              [(callseq_start imm:$amt)]>;
-def ADJCALLSTACKUP   : Pseudo<(outs), (ins uimm16:$amt),
-                              "!ADJCALLSTACKUP $amt",
-                              [(callseq_end imm:$amt)]>;
+def ADJCALLSTACKDOWN : MipsPseudo<(outs), (ins uimm16:$amt),
+                                  "!ADJCALLSTACKDOWN $amt",
+                                  [(callseq_start imm:$amt)]>;
+def ADJCALLSTACKUP   : MipsPseudo<(outs), (ins uimm16:$amt1, uimm16:$amt2),
+                                  "!ADJCALLSTACKUP $amt1",
+                                  [(callseq_end imm:$amt1, imm:$amt2)]>;
  }
  
-def IMPLICIT_DEF_CPURegs : Pseudo<(outs CPURegs:$dst), (ins),
-                                  "!IMPLICIT_DEF $dst",
-                                  [(set CPURegs:$dst, (undef))]>;
+// When handling PIC code the assembler needs .cpload and .cprestore
+// directives. If the real instructions corresponding these directives
+// are used, we have the same behavior, but get also a bunch of warnings
+// from the assembler.
+def CPLOAD : MipsPseudo<(outs), (ins CPURegs:$reg),
+                        ".set noreorder\n\t.cpload $reg\n\t.set reorder\n", 
+                        []>;
+def CPRESTORE : MipsPseudo<(outs), (ins uimm16:$loc),
+                           ".cprestore $loc\n", []>;
+
+// The supported Mips ISAs dont have any instruction close to the SELECT_CC 
+// operation. The solution is to create a Mips pseudo SELECT_CC instruction
+// (MipsSelectCC), use LowerSELECT_CC to generate this instruction and finally 
+// replace it for real supported nodes into EmitInstrWithCustomInserter
+let usesCustomDAGSchedInserter = 1 in {
+  def Select_CC : MipsPseudo<(outs CPURegs:$dst), 
+    (ins CPURegs:$CmpRes, CPURegs:$T, CPURegs:$F), "# MipsSelect_CC", 
+    [(set CPURegs:$dst, (MipsSelectCC CPURegs:$CmpRes, 
+                                      CPURegs:$T, CPURegs:$F))]>;
+}
  
  //===----------------------------------------------------------------------===//
  // Instruction definition
@@ -366,17 +396,14 @@ def IMPLICIT_DEF_CPURegs : Pseudo<(outs CPURegs:$dst), (ins),
  
  // ADDiu just accept 16-bit immediates but we handle this on Pat's.
  // immZExt32 is used here so it can match GlobalAddress immediates.
-def ADDiu   : ArithI<0x09, "addiu", MipsAdd, uimm16, immZExt16>;
+// MUL is a assembly macro in the current used ISAs.
+def ADDiu   : ArithI<0x09, "addiu", add, uimm16, immZExt16>;
  def ADDi    : ArithI<0x08, "addi",  add, simm16, immSExt16>;
-def MUL     : ArithR<0x1c, 0x02, "mul", mul, IIImul>;
+//def MUL     : ArithR<0x1c, 0x02, "mul", mul, IIImul>;
  def ADDu    : ArithR<0x00, 0x21, "addu", add, IIAlu>;
  def SUBu    : ArithR<0x00, 0x23, "subu", sub, IIAlu>;
  def ADD     : ArithOverflowR<0x00, 0x20, "add">;
  def SUB     : ArithOverflowR<0x00, 0x22, "sub">;
-def MADD    : MArithR<0x00, "madd">;
-def MADDU   : MArithR<0x01, "maddu">;
-def MSUB    : MArithR<0x04, "msub">;
-def MSUBU   : MArithR<0x05, "msubu">;
  
  // Logical
  def AND     : LogicR<0x24, "and", and>;
@@ -387,7 +414,7 @@ def ORi     : LogicI<0x0d, "ori",  or>;
  def XORi    : LogicI<0x0e, "xori",  xor>;
  def NOR     : LogicNOR<0x00, 0x27, "nor">;
  
-// Shifts 
+// Shifts
  def SLL     : LogicR_shift_imm<0x00, "sll", shl>;
  def SRL     : LogicR_shift_imm<0x02, "srl", srl>;
  def SRA     : LogicR_shift_imm<0x03, "sra", sra>;
@@ -412,7 +439,7 @@ def SW      : StoreM<0x2b, "sw", store>;
  def BEQ     : CBranch<0x04, "beq", seteq>;
  def BNE     : CBranch<0x05, "bne", setne>;
  
-let rt=1 in 
+let rt=1 in
  def BGEZ    : CBranchZero<0x01, "bgez", setge>;
  
  let rt=0 in {
@@ -445,43 +472,74 @@ def MULTu   : MulDiv<0x19, "multu", IIImul>;
  def DIV     : MulDiv<0x1a, "div", IIIdiv>;
  def DIVu    : MulDiv<0x1b, "divu", IIIdiv>;
  
-// Move From Hi/Lo 
+// Move From Hi/Lo
  def MFHI    : MoveFromTo<0x10, "mfhi">;
  def MFLO    : MoveFromTo<0x12, "mflo">;
  def MTHI    : MoveFromTo<0x11, "mthi">;
  def MTLO    : MoveFromTo<0x13, "mtlo">;
  
-// Count Leading
-def CLO     : CountLeading<0x21, "clo">;
-def CLZ     : CountLeading<0x20, "clz">;
-
  // No operation
  let addr=0 in
  def NOP     : FJ<0, (outs), (ins), "nop", [], IIAlu>;
  
-// Ret instruction - as mips does not have "ret" a 
+// Ret instruction - as mips does not have "ret" a
  // jr $ra must be generated.
  let isReturn=1, isTerminator=1, hasDelaySlot=1,
-    isBarrier=1, hasCtrlDep=1, rs=0, rt=0, shamt=0 in 
+    isBarrier=1, hasCtrlDep=1, rs=0, rt=0, shamt=0 in
  {
    def RET : FR <0x00, 0x02, (outs), (ins CPURegs:$target),
                  "jr $target", [(MipsRet CPURegs:$target)], IIBranch>;
  }
  
+// FrameIndexes are legalized when they are operands from load/store
+// instructions. The same not happens for stack address copies, so an
+// add op with mem ComplexPattern is used and the stack address copy
+// can be matched. It's similar to Sparc LEA_ADDRi
+def LEA_ADDiu : EffectiveAddress<"addiu $dst, ${addr:stackloc}">;
+
+// Count Leading
+// CLO/CLZ are part of the newer MIPS32(tm) instruction
+// set and not older Mips I keep this for future use
+// though. 
+//def CLO     : CountLeading<0x21, "clo">;
+//def CLZ     : CountLeading<0x20, "clz">;
+
+// MADD*/MSUB* are not part of MipsI either.
+//def MADD    : MArithR<0x00, "madd">;
+//def MADDU   : MArithR<0x01, "maddu">;
+//def MSUB    : MArithR<0x04, "msub">;
+//def MSUBU   : MArithR<0x05, "msubu">;
+
+let Predicates = [IsAllegrex] in {
+  let shamt = 0x10, rs = 0 in 
+    def SEB : SignExtInReg<0x21, "seb", i8>;
+
+  let shamt = 0x18, rs = 0 in 
+    def SEH : SignExtInReg<0x20, "seh", i16>;
+}
+
  //===----------------------------------------------------------------------===//
  //  Arbitrary patterns that map to one or more instructions
  //===----------------------------------------------------------------------===//
  
  // Small immediates
-def : Pat<(i32 immSExt16:$in), 
+def : Pat<(i32 immSExt16:$in),
            (ADDiu ZERO, imm:$in)>;
-def : Pat<(i32 immZExt16:$in), 
+def : Pat<(i32 immZExt16:$in),
            (ORi ZERO, imm:$in)>;
  
  // Arbitrary immediates
  def : Pat<(i32 imm:$imm),
            (ORi (LUi (HI16 imm:$imm)), (LO16 imm:$imm))>;
  
+// Carry patterns
+def : Pat<(subc CPURegs:$lhs, CPURegs:$rhs),
+          (SUBu CPURegs:$lhs, CPURegs:$rhs)>;
+def : Pat<(addc CPURegs:$lhs, CPURegs:$rhs),
+          (ADDu CPURegs:$lhs, CPURegs:$rhs)>;
+def : Pat<(addc  CPURegs:$src, imm:$imm),
+          (ADDiu CPURegs:$src, imm:$imm)>;
+
  // Call
  def : Pat<(MipsJmpLink (i32 tglobaladdr:$dst)),
            (JAL tglobaladdr:$dst)>;
@@ -493,24 +551,26 @@ def : Pat<(MipsJmpLink CPURegs:$dst),
  // GlobalAddress, Constant Pool, ExternalSymbol, and JumpTable
  def : Pat<(MipsHi tglobaladdr:$in), (LUi tglobaladdr:$in)>;
  def : Pat<(MipsLo tglobaladdr:$in), (ADDiu ZERO, tglobaladdr:$in)>;
-def : Pat<(MipsAdd CPURegs:$hi, (MipsLo tglobaladdr:$lo)),
+def : Pat<(add CPURegs:$hi, (MipsLo tglobaladdr:$lo)),
            (ADDiu CPURegs:$hi, tglobaladdr:$lo)>;
+def : Pat<(MipsHi tjumptable:$in), (LUi tjumptable:$in)>;
+def : Pat<(MipsLo tjumptable:$in), (ADDiu ZERO, tjumptable:$in)>;
+def : Pat<(add CPURegs:$hi, (MipsLo tjumptable:$lo)),
+          (ADDiu CPURegs:$hi, tjumptable:$lo)>;
  
-// Mips does not have not, so we increase the operation  
+// Mips does not have "not", so we expand our way
  def : Pat<(not CPURegs:$in),
            (NOR CPURegs:$in, ZERO)>;
  
-// extended load and stores 
+// extended load and stores
  def : Pat<(i32 (extloadi1  addr:$src)), (LBu addr:$src)>;
  def : Pat<(i32 (extloadi8  addr:$src)), (LBu addr:$src)>;
  def : Pat<(i32 (extloadi16 addr:$src)), (LHu addr:$src)>;
-def : Pat<(truncstorei1 CPURegs:$src, addr:$addr), 
-           (SB CPURegs:$src, addr:$addr)>;
  
-///
-/// brcond patterns
-///
+// peepholes
+def : Pat<(store (i32 0), addr:$dst), (SW ZERO, addr:$dst)>;
  
+// brcond patterns
  // direct match equal/notequal zero branches
  def : Pat<(brcond (setne CPURegs:$lhs, 0), bb:$dst),
            (BNE CPURegs:$lhs, ZERO, bb:$dst)>;
@@ -550,12 +610,8 @@ def : Pat<(brcond (setult CPURegs:$lhs, CPURegs:$rhs), bb:$dst),
  def : Pat<(brcond CPURegs:$cond, bb:$dst),
            (BNE CPURegs:$cond, ZERO, bb:$dst)>;
  
-///
-/// setcc patterns, only matched when there 
+/// setcc patterns, only matched when there
  /// is no brcond following a setcc operation
-///
-
-// setcc 2 register operands
  def : Pat<(setle CPURegs:$lhs, CPURegs:$rhs),
            (XORi (SLT CPURegs:$rhs, CPURegs:$lhs), 1)>;
  def : Pat<(setule CPURegs:$lhs, CPURegs:$rhs),
@@ -572,16 +628,21 @@ def : Pat<(setuge CPURegs:$lhs, CPURegs:$rhs),
            (XORi (SLTu CPURegs:$lhs, CPURegs:$rhs), 1)>;
  
  def : Pat<(setne CPURegs:$lhs, CPURegs:$rhs),
-          (OR (SLT CPURegs:$lhs, CPURegs:$rhs), 
+          (OR (SLT CPURegs:$lhs, CPURegs:$rhs),
                (SLT CPURegs:$rhs, CPURegs:$lhs))>;
  
  def : Pat<(seteq CPURegs:$lhs, CPURegs:$rhs),
-          (XORi (OR (SLT CPURegs:$lhs, CPURegs:$rhs), 
+          (XORi (OR (SLT CPURegs:$lhs, CPURegs:$rhs),
                      (SLT CPURegs:$rhs, CPURegs:$lhs)), 1)>;
-          
-// setcc reg/imm operands
+
  def : Pat<(setge CPURegs:$lhs, immSExt16:$rhs),
            (XORi (SLTi CPURegs:$lhs, immSExt16:$rhs), 1)>;
  def : Pat<(setuge CPURegs:$lhs, immZExt16:$rhs),
            (XORi (SLTiu CPURegs:$lhs, immZExt16:$rhs), 1)>;
  
+//===----------------------------------------------------------------------===//
+// Floating Point Support
+//===----------------------------------------------------------------------===//
+
+include "MipsInstrFPU.td"
+