[x86] Handle single input shuffles in the SSSE3 case more intelligently.

author Chandler Carruth <chandlerc@gmail.com>

Mon, 4 Aug 2014 01:14:24 +0000 (01:14 +0000)

committer Chandler Carruth <chandlerc@gmail.com>

Mon, 4 Aug 2014 01:14:24 +0000 (01:14 +0000)
author Chandler Carruth <chandlerc@gmail.com>
Mon, 4 Aug 2014 01:14:24 +0000 (01:14 +0000)
committer Chandler Carruth <chandlerc@gmail.com>
Mon, 4 Aug 2014 01:14:24 +0000 (01:14 +0000)
diff --git a/lib/Target/X86/X86ISelLowering.cpp b/lib/Target/X86/X86ISelLowering.cpp

index 5ae752c1da578eb30e7d8ff35b34b19f06698625..94c19fb4c408161d645fe50b9d5731aab87180ed 100644 (file)
--- a/lib/Target/X86/X86ISelLowering.cpp
+++ b/lib/Target/X86/X86ISelLowering.cpp
@@ -7931,6 +7931,10 @@ static SDValue lowerV16I8VectorShuffle(SDValue Op, SDValue V1, SDValue V2,
        }
      V1 = DAG.getNode(X86ISD::PSHUFB, DL, MVT::v16i8, V1,
                       DAG.getNode(ISD::BUILD_VECTOR, DL, MVT::v16i8, V1Mask));
+    if (isSingleInputShuffleMask(Mask))
+      return V1; // Single inputs are easy.
+
+    // Otherwise, blend the two.
      V2 = DAG.getNode(X86ISD::PSHUFB, DL, MVT::v16i8, V2,
                       DAG.getNode(ISD::BUILD_VECTOR, DL, MVT::v16i8, V2Mask));
      return DAG.getNode(ISD::OR, DL, MVT::v16i8, V1, V2);
diff --git a/test/CodeGen/X86/vector-shuffle-128-v16.ll b/test/CodeGen/X86/vector-shuffle-128-v16.ll

index 49620e93d6fe32788a355ce2aa6029b1397c0bfd..693a2764d4336e94c07b045c662ca84fd1cb8617 100644 (file)
--- a/test/CodeGen/X86/vector-shuffle-128-v16.ll
+++ b/test/CodeGen/X86/vector-shuffle-128-v16.ll
@@ -179,9 +179,7 @@ define <16 x i8> @shuffle_v16i8_03_02_01_00_07_06_05_04_11_10_09_08_15_14_13_12(
  ;
  ; SSSE3-LABEL: @shuffle_v16i8_03_02_01_00_07_06_05_04_11_10_09_08_15_14_13_12
  ; SSSE3:       # BB#0:
-; SSSE3-NEXT:    pshufb {{.*}} # xmm1 = zero,zero,zero,zero,zero,zero,zero,zero,zero,zero,zero,zero,zero,zero,zero,zero
  ; SSSE3-NEXT:    pshufb {{.*}} # xmm0 = xmm0[3,2,1,0,7,6,5,4,11,10,9,8,15,14,13,12]
-; SSSE3-NEXT:    por %xmm1, %xmm0
  ; SSSE3-NEXT:    retq
    %shuffle = shufflevector <16 x i8> %a, <16 x i8> %b, <16 x i32> <i32 3, i32 2, i32 1, i32 0, i32 7, i32 6, i32 5, i32 4, i32 11, i32 10, i32 9, i32 8, i32 15, i32 14, i32 13, i32 12>
    ret <16 x i8> %shuffle
@@ -275,9 +273,7 @@ define <16 x i8> @trunc_v4i32_shuffle(<16 x i8> %a) {
  ;
  ; SSSE3-LABEL: @trunc_v4i32_shuffle
  ; SSSE3:       # BB#0:
-; SSSE3-NEXT:    pshufb {{.*}} # xmm1 = zero,zero,zero,zero,zero,zero,zero,zero,zero,zero,zero,zero,zero,zero,zero,zero
  ; SSSE3-NEXT:    pshufb {{.*}} # xmm0 = xmm0[0,4,8,12],zero,zero,zero,zero,zero,zero,zero,zero,zero,zero,zero,zero
-; SSSE3-NEXT:    por %xmm1, %xmm0
  ; SSSE3-NEXT:    retq
    %shuffle = shufflevector <16 x i8> %a, <16 x i8> undef, <16 x i32> <i32 0, i32 4, i32 8, i32 12, i32 undef, i32 undef, i32 undef, i32 undef, i32 undef, i32 undef, i32 undef, i32 undef, i32 undef, i32 undef, i32 undef, i32 undef>
    ret <16 x i8> %shuffle
author	Chandler Carruth <chandlerc@gmail.com>
	Mon, 4 Aug 2014 01:14:24 +0000 (01:14 +0000)
committer	Chandler Carruth <chandlerc@gmail.com>
	Mon, 4 Aug 2014 01:14:24 +0000 (01:14 +0000)
lib/Target/X86/X86ISelLowering.cpp		patch | blob | history
test/CodeGen/X86/vector-shuffle-128-v16.ll		patch | blob | history