Add ARM patterns to match EXTRACT_SUBVECTOR nodes.

author Bob Wilson <bob.wilson@apple.com>

Fri, 7 Jan 2011 04:59:04 +0000 (04:59 +0000)

committer Bob Wilson <bob.wilson@apple.com>

Fri, 7 Jan 2011 04:59:04 +0000 (04:59 +0000)
author Bob Wilson <bob.wilson@apple.com>
Fri, 7 Jan 2011 04:59:04 +0000 (04:59 +0000)
committer Bob Wilson <bob.wilson@apple.com>
Fri, 7 Jan 2011 04:59:04 +0000 (04:59 +0000)
diff --git a/include/llvm/Target/TargetSelectionDAG.td b/include/llvm/Target/TargetSelectionDAG.td

index 92ceee5bfb573aef217de5d4335d1356d84e8960..37ebc12e5b2cffca97940202ab02271a1cccac9d 100644 (file)
--- a/include/llvm/Target/TargetSelectionDAG.td
+++ b/include/llvm/Target/TargetSelectionDAG.td
@@ -421,6 +421,9 @@ def scalar_to_vector : SDNode<"ISD::SCALAR_TO_VECTOR", SDTypeProfile<1, 1, []>,
                                []>;
  def vector_extract : SDNode<"ISD::EXTRACT_VECTOR_ELT",
      SDTypeProfile<1, 2, [SDTCisPtrTy<2>]>, []>;
+def vector_extract_subvec : SDNode<"ISD::EXTRACT_SUBVECTOR",
+    SDTypeProfile<1, 2, [SDTCisInt<2>, SDTCisVec<1>, SDTCisVec<0>]>, 
+    []>;
  def vector_insert : SDNode<"ISD::INSERT_VECTOR_ELT",
      SDTypeProfile<1, 3, [SDTCisSameAs<0, 1>, SDTCisPtrTy<3>]>, []>;
  
diff --git a/lib/CodeGen/SelectionDAG/SelectionDAGBuilder.cpp b/lib/CodeGen/SelectionDAG/SelectionDAGBuilder.cpp

index 88490b31203c9785a6fc094eb70c79acef42e2f4..2167523f2344ea43808f0fa712301affdfd494fa 100644 (file)
--- a/lib/CodeGen/SelectionDAG/SelectionDAGBuilder.cpp
+++ b/lib/CodeGen/SelectionDAG/SelectionDAGBuilder.cpp
@@ -2745,7 +2745,7 @@ void SelectionDAGBuilder::visitShuffleVector(const User &I) {
          } else {
            StartIdx[Input] = (MinRange[Input]/MaskNumElts)*MaskNumElts;
            if (MaxRange[Input] - StartIdx[Input] < (int)MaskNumElts &&
-              StartIdx[Input] + MaskNumElts < SrcNumElts)
+              StartIdx[Input] + MaskNumElts <= SrcNumElts)
              RangeUse[Input] = 1; // Extract from a multiple of the mask length.
          }
        }
diff --git a/lib/Target/ARM/ARMISelLowering.cpp b/lib/Target/ARM/ARMISelLowering.cpp

index f50eac523f421e4f78223a3aa18f20419880d979..b4432d52369683e34e3a44f41b37324279b4150d 100644 (file)
--- a/lib/Target/ARM/ARMISelLowering.cpp
+++ b/lib/Target/ARM/ARMISelLowering.cpp
@@ -94,7 +94,7 @@ void ARMTargetLowering::addTypeForNEON(EVT VT, EVT PromotedLdStVT,
    setOperationAction(ISD::BUILD_VECTOR, VT.getSimpleVT(), Custom);
    setOperationAction(ISD::VECTOR_SHUFFLE, VT.getSimpleVT(), Custom);
    setOperationAction(ISD::CONCAT_VECTORS, VT.getSimpleVT(), Legal);
-  setOperationAction(ISD::EXTRACT_SUBVECTOR, VT.getSimpleVT(), Expand);
+  setOperationAction(ISD::EXTRACT_SUBVECTOR, VT.getSimpleVT(), Legal);
    setOperationAction(ISD::SELECT, VT.getSimpleVT(), Expand);
    setOperationAction(ISD::SELECT_CC, VT.getSimpleVT(), Expand);
    if (VT.isInteger()) {
diff --git a/lib/Target/ARM/ARMInstrNEON.td b/lib/Target/ARM/ARMInstrNEON.td

index e307105a5cc3662f09afe34f743deca1931d546c..20437963f612b6b7738aa22736b64dcdfd585ff3 100644 (file)
--- a/lib/Target/ARM/ARMInstrNEON.td
+++ b/lib/Target/ARM/ARMInstrNEON.td
@@ -4530,6 +4530,23 @@ def VREV16q8  : VREV16Q<0b00, "vrev16", "8", v16i8>;
  
  // Other Vector Shuffles.
  
+//  Aligned extractions: really just dropping registers
+
+class AlignedVEXTq<ValueType DestTy, ValueType SrcTy, SDNodeXForm LaneCVT>
+      : Pat<(DestTy (vector_extract_subvec (SrcTy QPR:$src), (i32 imm:$start))),
+             (EXTRACT_SUBREG (SrcTy QPR:$src), (LaneCVT imm:$start))>;
+
+def : AlignedVEXTq<v8i8, v16i8, DSubReg_i8_reg>;
+
+def : AlignedVEXTq<v4i16, v8i16, DSubReg_i16_reg>;
+
+def : AlignedVEXTq<v2i32, v4i32, DSubReg_i32_reg>;
+
+def : AlignedVEXTq<v1i64, v2i64, DSubReg_f64_reg>;
+
+def : AlignedVEXTq<v2f32, v4f32, DSubReg_i32_reg>;
+
+
  //   VEXT     : Vector Extract
  
  class VEXTd<string OpcodeStr, string Dt, ValueType Ty>
diff --git a/test/CodeGen/ARM/spill-q.ll b/test/CodeGen/ARM/spill-q.ll

index dc83e25905cf33373161f139ed6f1b4ce9b1304e..bf4e55cb06c4d84b07c58a5c5bc883412caa2cff 100644 (file)
--- a/test/CodeGen/ARM/spill-q.ll
+++ b/test/CodeGen/ARM/spill-q.ll
@@ -15,7 +15,10 @@ define void @aaa(%quuz* %this, i8* %block) {
  ; CHECK: vst1.64 {{.*}}sp, :128
  ; CHECK: vld1.64 {{.*}}sp, :128
  entry:
-  %0 = call <4 x float> @llvm.arm.neon.vld1.v4f32(i8* undef, i32 1) nounwind ; <<4 x float>> [#uses=1]
+  %aligned_vec = alloca <4 x float>, align 16
+  %"alloca point" = bitcast i32 0 to i32
+  %vecptr = bitcast <4 x float>* %aligned_vec to i8*
+  %0 = call <4 x float> @llvm.arm.neon.vld1.v4f32(i8* %vecptr, i32 1) nounwind ; <<4 x float>> [#uses=1]
    store float 6.300000e+01, float* undef, align 4
    %1 = call <4 x float> @llvm.arm.neon.vld1.v4f32(i8* undef, i32 1) nounwind ; <<4 x float>> [#uses=1]
    store float 0.000000e+00, float* undef, align 4
diff --git a/test/CodeGen/Thumb2/thumb2-spill-q.ll b/test/CodeGen/Thumb2/thumb2-spill-q.ll

index 0d73fba93e90017a75e4f889c0a95c0e73e93463..d9a0617f5a460ebed9d2aad1250ca0fe49dd806d 100644 (file)
--- a/test/CodeGen/Thumb2/thumb2-spill-q.ll
+++ b/test/CodeGen/Thumb2/thumb2-spill-q.ll
@@ -15,7 +15,10 @@ define void @aaa(%quuz* %this, i8* %block) {
  ; CHECK: vst1.64 {{.*}}[{{.*}}, :128]
  ; CHECK: vld1.64 {{.*}}[{{.*}}, :128]
  entry:
-  %0 = call <4 x float> @llvm.arm.neon.vld1.v4f32(i8* undef, i32 1) nounwind ; <<4 x float>> [#uses=1]
+  %aligned_vec = alloca <4 x float>, align 16
+  %"alloca point" = bitcast i32 0 to i32
+  %vecptr = bitcast <4 x float>* %aligned_vec to i8*
+  %0 = call <4 x float> @llvm.arm.neon.vld1.v4f32(i8* %vecptr, i32 1) nounwind 
    store float 6.300000e+01, float* undef, align 4
    %1 = call <4 x float> @llvm.arm.neon.vld1.v4f32(i8* undef, i32 1) nounwind ; <<4 x float>> [#uses=1]
    store float 0.000000e+00, float* undef, align 4
author	Bob Wilson <bob.wilson@apple.com>
	Fri, 7 Jan 2011 04:59:04 +0000 (04:59 +0000)
committer	Bob Wilson <bob.wilson@apple.com>
	Fri, 7 Jan 2011 04:59:04 +0000 (04:59 +0000)
include/llvm/Target/TargetSelectionDAG.td		patch \| blob \| history
lib/CodeGen/SelectionDAG/SelectionDAGBuilder.cpp		patch \| blob \| history
lib/Target/ARM/ARMISelLowering.cpp		patch \| blob \| history
lib/Target/ARM/ARMInstrNEON.td		patch \| blob \| history
test/CodeGen/ARM/spill-q.ll		patch \| blob \| history
test/CodeGen/Thumb2/thumb2-spill-q.ll		patch \| blob \| history