More missed vdup patterns

author Anton Korobeynikov <asl@math.spbu.ru>

Wed, 2 Sep 2009 21:21:28 +0000 (21:21 +0000)

committer Anton Korobeynikov <asl@math.spbu.ru>

Wed, 2 Sep 2009 21:21:28 +0000 (21:21 +0000)
author Anton Korobeynikov <asl@math.spbu.ru>
Wed, 2 Sep 2009 21:21:28 +0000 (21:21 +0000)
committer Anton Korobeynikov <asl@math.spbu.ru>
Wed, 2 Sep 2009 21:21:28 +0000 (21:21 +0000)
diff --git a/lib/Target/ARM/ARMInstrNEON.td b/lib/Target/ARM/ARMInstrNEON.td

index 0c2f65523b46c556cee60a818ad2102f91d80127..c111668c5b7263d182e43b15442bcab7318cd5d7 100644 (file)
--- a/lib/Target/ARM/ARMInstrNEON.td
+++ b/lib/Target/ARM/ARMInstrNEON.td
@@ -355,6 +355,9 @@ def DSubReg_i32_reg : SDNodeXForm<imm, [{
  def DSubReg_f64_reg : SDNodeXForm<imm, [{
    return CurDAG->getTargetConstant(5 + N->getZExtValue(), MVT::i32);
  }]>;
+def DSubReg_f64_other_reg : SDNodeXForm<imm, [{  // Counterpart of DSubReg_f64_reg: lane 0 -> 6, lane 1 -> 5 (the index DSubReg_f64_reg gives for the opposite lane).
+  return CurDAG->getTargetConstant(5 + (1 - N->getZExtValue()), MVT::i32);  // (1 - lane) flips 0 <-> 1; assumes the lane immediate is 0 or 1.
+}]>;
  
  // Extract S sub-registers of Q/D registers.
  // (arm_ssubreg_0 is 1; arm_ssubreg_1 is 2; etc.)
@@ -1907,6 +1910,15 @@ def VDUPfqf   : N2V<0b11, 0b11, 0b01, 0b00, 0b11000, 1, 0,
                      NoItinerary, "vdup.32\t$dst, ${src:lane}", "",
                      [(set QPR:$dst, (v4f32 (NEONvdup (f32 SPR:$src))))]>;
  
+def : Pat<(v2i64 (NEONvduplane (v2i64 QPR:$src), imm:$lane)),  // v2i64 NEONvduplane of a Q register is rewritten as a sub-register extract + insert on $src:
+          (INSERT_SUBREG QPR:$src, 
+                         (i64 (EXTRACT_SUBREG QPR:$src, (DSubReg_f64_reg imm:$lane))),  // take the i64 sub-register whose index is 5 + $lane ...
+                         (DSubReg_f64_other_reg imm:$lane))>;  // ... and insert it into $src at the complementary index, 5 + (1 - $lane).
+def : Pat<(v2f64 (NEONvduplane (v2f64 QPR:$src), imm:$lane)),  // v2f64 NEONvduplane of a Q register is rewritten as a sub-register extract + insert on $src:
+          (INSERT_SUBREG QPR:$src, 
+                         (f64 (EXTRACT_SUBREG QPR:$src, (DSubReg_f64_reg imm:$lane))),  // take the f64 sub-register whose index is 5 + $lane ...
+                         (DSubReg_f64_other_reg imm:$lane))>;  // ... and insert it into $src at the complementary index, 5 + (1 - $lane).
+
  //   VMOVN    : Vector Narrowing Move
  defm VMOVN    : N2VNInt_HSD<0b11,0b11,0b10,0b00100,0,0, "vmovn.i",
                              int_arm_neon_vmovn>;
diff --git a/test/CodeGen/ARM/vdup_lane.ll b/test/CodeGen/ARM/vdup_lane.ll

index adadc9f5d31bd784c674e3dca867837e38b1b405..c14f864c48e3000ac52549f2ff7e309e716fb781 100644 (file)
--- a/test/CodeGen/ARM/vdup_lane.ll
+++ b/test/CodeGen/ARM/vdup_lane.ll
@@ -50,3 +50,27 @@ define <4 x float> @vduplaneQfloat(<2 x float>* %A) nounwind {
         %tmp2 = shufflevector <2 x float> %tmp1, <2 x float> undef, <4 x i32> < i32 1, i32 1, i32 1, i32 1 >
         ret <4 x float> %tmp2
  }
+
+define arm_apcscc <2 x i64> @foo(<2 x i64> %arg0_int64x1_t) nounwind readnone {  ; <2 x i64> case: both result elements come from element 1 of the argument
+entry:
+  %0 = shufflevector <2 x i64> %arg0_int64x1_t, <2 x i64> undef, <2 x i32> <i32 1, i32 1>  ; mask <1, 1> selects element 1 twice
+  ret <2 x i64> %0
+}
+
+define arm_apcscc <2 x i64> @bar(<2 x i64> %arg0_int64x1_t) nounwind readnone {  ; <2 x i64> case: both result elements come from element 0 of the argument
+entry:
+  %0 = shufflevector <2 x i64> %arg0_int64x1_t, <2 x i64> undef, <2 x i32> <i32 0, i32 0>  ; mask <0, 0> selects element 0 twice
+  ret <2 x i64> %0
+}
+
+define arm_apcscc <2 x double> @baz(<2 x double> %arg0_int64x1_t) nounwind readnone {  ; <2 x double> case: both result elements come from element 1 of the argument
+entry:
+  %0 = shufflevector <2 x double> %arg0_int64x1_t, <2 x double> undef, <2 x i32> <i32 1, i32 1>  ; mask <1, 1> selects element 1 twice
+  ret <2 x double> %0
+}
+
+define arm_apcscc <2 x double> @qux(<2 x double> %arg0_int64x1_t) nounwind readnone {  ; <2 x double> case: both result elements come from element 0 of the argument
+entry:
+  %0 = shufflevector <2 x double> %arg0_int64x1_t, <2 x double> undef, <2 x i32> <i32 0, i32 0>  ; mask <0, 0> selects element 0 twice
+  ret <2 x double> %0
+}
+\ No newline at end of file
author	Anton Korobeynikov <asl@math.spbu.ru>
	Wed, 2 Sep 2009 21:21:28 +0000 (21:21 +0000)
committer	Anton Korobeynikov <asl@math.spbu.ru>
	Wed, 2 Sep 2009 21:21:28 +0000 (21:21 +0000)
lib/Target/ARM/ARMInstrNEON.td		patch \| blob \| history
test/CodeGen/ARM/vdup_lane.ll		patch \| blob \| history