Avoid a Symbol -> Name -> Symbol conversion.

[oota-llvm.git] / lib / Target / X86 / X86InstrCompiler.td
diff --git a/lib/Target/X86/X86InstrCompiler.td b/lib/Target/X86/X86InstrCompiler.td

index e7de24bca41798bfc9cff0b0a3a4a0afc4d4700a..7f850d6830e1506eddd0ac707bf465e09ce4292d 100644 (file)
--- a/lib/Target/X86/X86InstrCompiler.td
+++ b/lib/Target/X86/X86InstrCompiler.td
@@ -17,12 +17,12 @@
  
  def GetLo32XForm : SDNodeXForm<imm, [{
    // Transformation function: get the low 32 bits.
-  return getI32Imm((unsigned)N->getZExtValue());
+  return getI32Imm((unsigned)N->getZExtValue(), SDLoc(N));
  }]>;
  
  def GetLo8XForm : SDNodeXForm<imm, [{
    // Transformation function: get the low 8 bits.
-  return getI8Imm((uint8_t)N->getZExtValue());
+  return getI8Imm((uint8_t)N->getZExtValue(), SDLoc(N));
  }]>;
  
  
@@ -518,6 +518,10 @@ let usesCustomInserter = 1, Uses = [EFLAGS] in {
    defm _V8I64  : CMOVrr_PSEUDO<VR512, v8i64>;
    defm _V8F64  : CMOVrr_PSEUDO<VR512, v8f64>;
    defm _V16F32 : CMOVrr_PSEUDO<VR512, v16f32>;
+  defm _V8I1   : CMOVrr_PSEUDO<VK8,  v8i1>;
+  defm _V16I1  : CMOVrr_PSEUDO<VK16, v16i1>;
+  defm _V32I1  : CMOVrr_PSEUDO<VK32, v32i1>;
+  defm _V64I1  : CMOVrr_PSEUDO<VK64, v64i1>;
  } // usesCustomInserter = 1, Uses = [EFLAGS]
  
  //===----------------------------------------------------------------------===//
@@ -865,6 +869,7 @@ def : Pat<(i32 (X86Wrapper tjumptable  :$dst)), (MOV32ri tjumptable  :$dst)>;
  def : Pat<(i32 (X86Wrapper tglobaltlsaddr:$dst)),(MOV32ri tglobaltlsaddr:$dst)>;
  def : Pat<(i32 (X86Wrapper tglobaladdr :$dst)), (MOV32ri tglobaladdr :$dst)>;
  def : Pat<(i32 (X86Wrapper texternalsym:$dst)), (MOV32ri texternalsym:$dst)>;
+def : Pat<(i32 (X86Wrapper mcsym:$dst)), (MOV32ri mcsym:$dst)>;
  def : Pat<(i32 (X86Wrapper tblockaddress:$dst)), (MOV32ri tblockaddress:$dst)>;
  
  def : Pat<(add GR32:$src1, (X86Wrapper tconstpool:$src2)),
@@ -875,6 +880,8 @@ def : Pat<(add GR32:$src1, (X86Wrapper tglobaladdr :$src2)),
            (ADD32ri GR32:$src1, tglobaladdr:$src2)>;
  def : Pat<(add GR32:$src1, (X86Wrapper texternalsym:$src2)),
            (ADD32ri GR32:$src1, texternalsym:$src2)>;
+def : Pat<(add GR32:$src1, (X86Wrapper mcsym:$src2)),
+          (ADD32ri GR32:$src1, mcsym:$src2)>;
  def : Pat<(add GR32:$src1, (X86Wrapper tblockaddress:$src2)),
            (ADD32ri GR32:$src1, tblockaddress:$src2)>;
  
@@ -882,6 +889,8 @@ def : Pat<(store (i32 (X86Wrapper tglobaladdr:$src)), addr:$dst),
            (MOV32mi addr:$dst, tglobaladdr:$src)>;
  def : Pat<(store (i32 (X86Wrapper texternalsym:$src)), addr:$dst),
            (MOV32mi addr:$dst, texternalsym:$src)>;
+def : Pat<(store (i32 (X86Wrapper mcsym:$src)), addr:$dst),
+          (MOV32mi addr:$dst, mcsym:$src)>;
  def : Pat<(store (i32 (X86Wrapper tblockaddress:$src)), addr:$dst),
            (MOV32mi addr:$dst, tblockaddress:$src)>;
  
@@ -896,6 +905,8 @@ def : Pat<(i64 (X86Wrapper tglobaladdr :$dst)),
            (MOV64ri tglobaladdr :$dst)>, Requires<[FarData]>;
  def : Pat<(i64 (X86Wrapper texternalsym:$dst)),
            (MOV64ri texternalsym:$dst)>, Requires<[FarData]>;
+def : Pat<(i64 (X86Wrapper mcsym:$dst)),
+          (MOV64ri mcsym:$dst)>, Requires<[FarData]>;
  def : Pat<(i64 (X86Wrapper tblockaddress:$dst)),
            (MOV64ri tblockaddress:$dst)>, Requires<[FarData]>;
  
@@ -910,6 +921,8 @@ def : Pat<(i64 (X86Wrapper tglobaladdr :$dst)),
            (MOV64ri32 tglobaladdr :$dst)>, Requires<[KernelCode]>;
  def : Pat<(i64 (X86Wrapper texternalsym:$dst)),
            (MOV64ri32 texternalsym:$dst)>, Requires<[KernelCode]>;
+def : Pat<(i64 (X86Wrapper mcsym:$dst)),
+          (MOV64ri32 mcsym:$dst)>, Requires<[KernelCode]>;
  def : Pat<(i64 (X86Wrapper tblockaddress:$dst)),
            (MOV64ri32 tblockaddress:$dst)>, Requires<[KernelCode]>;
  
@@ -928,12 +941,15 @@ def : Pat<(store (i64 (X86Wrapper tglobaladdr:$src)), addr:$dst),
  def : Pat<(store (i64 (X86Wrapper texternalsym:$src)), addr:$dst),
            (MOV64mi32 addr:$dst, texternalsym:$src)>,
            Requires<[NearData, IsStatic]>;
+def : Pat<(store (i64 (X86Wrapper mcsym:$src)), addr:$dst),
+          (MOV64mi32 addr:$dst, mcsym:$src)>,
+          Requires<[NearData, IsStatic]>;
  def : Pat<(store (i64 (X86Wrapper tblockaddress:$src)), addr:$dst),
            (MOV64mi32 addr:$dst, tblockaddress:$src)>,
            Requires<[NearData, IsStatic]>;
  
-def : Pat<(i32 (X86RecoverFrameAlloc texternalsym:$dst)), (MOV32ri texternalsym:$dst)>;
-def : Pat<(i64 (X86RecoverFrameAlloc texternalsym:$dst)), (MOV64ri texternalsym:$dst)>;
+def : Pat<(i32 (X86RecoverFrameAlloc mcsym:$dst)), (MOV32ri mcsym:$dst)>;
+def : Pat<(i64 (X86RecoverFrameAlloc mcsym:$dst)), (MOV64ri mcsym:$dst)>;
  
  // Calls
  
@@ -1060,11 +1076,12 @@ defm : CMOVmr<X86_COND_O , CMOVNO16rm, CMOVNO32rm, CMOVNO64rm>;
  defm : CMOVmr<X86_COND_NO, CMOVO16rm , CMOVO32rm , CMOVO64rm>;
  
  // zextload bool -> zextload byte
-def : Pat<(zextloadi8i1  addr:$src), (MOV8rm     addr:$src)>;
-def : Pat<(zextloadi16i1 addr:$src), (MOVZX16rm8 addr:$src)>;
-def : Pat<(zextloadi32i1 addr:$src), (MOVZX32rm8 addr:$src)>;
+def : Pat<(zextloadi8i1  addr:$src), (AND8ri (MOV8rm addr:$src), (i8 1))>;
+def : Pat<(zextloadi16i1 addr:$src), (AND16ri (MOVZX16rm8 addr:$src), (i16 1))>;
+def : Pat<(zextloadi32i1 addr:$src), (AND32ri (MOVZX32rm8 addr:$src), (i32 1))>;
  def : Pat<(zextloadi64i1 addr:$src),
-          (SUBREG_TO_REG (i64 0), (MOVZX32rm8 addr:$src), sub_32bit)>;
+          (SUBREG_TO_REG (i64 0),
+           (AND32ri (MOVZX32rm8 addr:$src), (i32 1)), sub_32bit)>;
  
  // extload bool -> extload byte
  // When extloading from 16-bit and smaller memory locations into 64-bit
@@ -1232,8 +1249,11 @@ def : Pat<(store (add (loadi64 addr:$dst), 0x00000000800000000), addr:$dst),
  // with implicit zero-extension instead of a 64-bit and if the immediate has at
  // least 32 bits of leading zeros. If in addition the last 32 bits can be
  // represented with a sign extension of a 8 bit constant, use that.
+// This can also reduce instruction size by eliminating the need for the REX
+// prefix.
  
-let AddedComplexity = 1 in // Give priority over i64immSExt8.
+// AddedComplexity is needed to give priority over i64immSExt8 and i64immSExt32.
+let AddedComplexity = 1 in {
  def : Pat<(and GR64:$src, i64immZExt32SExt8:$imm),
            (SUBREG_TO_REG
              (i64 0),
@@ -1242,7 +1262,6 @@ def : Pat<(and GR64:$src, i64immZExt32SExt8:$imm),
                (i32 (GetLo8XForm imm:$imm))),
              sub_32bit)>;
  
-let AddedComplexity = 1 in // Give priority over i64immSExt32.
  def : Pat<(and GR64:$src, i64immZExt32:$imm),
            (SUBREG_TO_REG
              (i64 0),
@@ -1250,8 +1269,13 @@ def : Pat<(and GR64:$src, i64immZExt32:$imm),
                (EXTRACT_SUBREG GR64:$src, sub_32bit),
                (i32 (GetLo32XForm imm:$imm))),
              sub_32bit)>;
+} // AddedComplexity = 1
  
  
+// AddedComplexity is needed due to the increased complexity on the
+// i64immZExt32SExt8 and i64immZExt32 patterns above. Applying this to all
+// the MOVZX patterns keeps thems together in DAGIsel tables.
+let AddedComplexity = 1 in {
  // r & (2^16-1) ==> movz
  def : Pat<(and GR32:$src1, 0xffff),
            (MOVZX32rr16 (EXTRACT_SUBREG GR32:$src1, sub_16bit))>;
@@ -1269,7 +1293,6 @@ def : Pat<(and GR16:$src1, 0xff),
        Requires<[Not64BitMode]>;
  
  // r & (2^32-1) ==> movz
-let AddedComplexity = 1 in // Give priority over i64immZExt32.
  def : Pat<(and GR64:$src, 0x00000000FFFFFFFF),
            (SUBREG_TO_REG (i64 0),
                           (MOV32rr (EXTRACT_SUBREG GR64:$src, sub_32bit)),
@@ -1281,7 +1304,6 @@ def : Pat<(and GR64:$src, 0xffff),
                        (MOVZX32rr16 (i16 (EXTRACT_SUBREG GR64:$src, sub_16bit))),
                        sub_32bit)>;
  // r & (2^8-1) ==> movz
-let AddedComplexity = 1 in // Give priority over i64immSExt32.
  def : Pat<(and GR64:$src, 0xff),
            (SUBREG_TO_REG (i64 0),
                           (MOVZX32rr8 (i8 (EXTRACT_SUBREG GR64:$src, sub_8bit))),
@@ -1295,6 +1317,7 @@ def : Pat<(and GR16:$src1, 0xff),
             (EXTRACT_SUBREG (MOVZX32rr8 (i8
              (EXTRACT_SUBREG GR16:$src1, sub_8bit))), sub_16bit)>,
        Requires<[In64BitMode]>;
+} // AddedComplexity = 1
  
  
  // sext_inreg patterns