[x86] Fix a miscompile in the new shuffle lowering found through the new ... [subject line truncated]

author Chandler Carruth <chandlerc@gmail.com>

Thu, 7 Aug 2014 08:11:31 +0000 (08:11 +0000)

committer Chandler Carruth <chandlerc@gmail.com>

Thu, 7 Aug 2014 08:11:31 +0000 (08:11 +0000)
author Chandler Carruth <chandlerc@gmail.com>
Thu, 7 Aug 2014 08:11:31 +0000 (08:11 +0000)
committer Chandler Carruth <chandlerc@gmail.com>
Thu, 7 Aug 2014 08:11:31 +0000 (08:11 +0000)
diff --git a/lib/Target/X86/X86ISelLowering.cpp b/lib/Target/X86/X86ISelLowering.cpp

index 47e3a5a6dacf601ff625caeab5cc6b3de1e18f80..38cb996b8d77d41b12ffdb356bca084a1b19b45b 100644 (file)
--- a/lib/Target/X86/X86ISelLowering.cpp
+++ b/lib/Target/X86/X86ISelLowering.cpp
@@ -8234,10 +8234,11 @@ static SDValue lower128BitVectorShuffle(SDValue Op, SDValue V1, SDValue V2,
    }
  }
  
-/// \brief Tiny helper function to test whether adjacent masks are sequential.
-static bool areAdjacentMasksSequential(ArrayRef<int> Mask) {
+/// \brief Tiny helper function to test whether a shuffle mask could be
+/// simplified by widening the elements being shuffled.
+static bool canWidenShuffleElements(ArrayRef<int> Mask) {
    for (int i = 0, Size = Mask.size(); i < Size; i += 2)
-    if (Mask[i] + 1 != Mask[i+1])
+    if (Mask[i] % 2 != 0 || Mask[i] + 1 != Mask[i+1])
        return false;
  
    return true;
@@ -8291,7 +8292,7 @@ static SDValue lowerVectorShuffle(SDValue Op, const X86Subtarget *Subtarget,
    // but it might be interesting to form i128 integers to handle flipping the
    // low and high halves of AVX 256-bit vectors.
    if (VT.isInteger() && VT.getScalarSizeInBits() < 64 &&
-      areAdjacentMasksSequential(Mask)) {
+      canWidenShuffleElements(Mask)) {
      SmallVector<int, 8> NewMask;
      for (int i = 0, Size = Mask.size(); i < Size; i += 2)
        NewMask.push_back(Mask[i] / 2);
@@ -19517,8 +19518,7 @@ static SDValue PerformTargetShuffleCombine(SDValue N, SelectionDAG &DAG,
  
      // See if this reduces to a PSHUFD which is no more expensive and can
      // combine with more operations.
-    if (Mask[0] % 2 == 0 && Mask[2] % 2 == 0 &&
-        areAdjacentMasksSequential(Mask)) {
+    if (canWidenShuffleElements(Mask)) {
        int DMask[] = {-1, -1, -1, -1};
        int DOffset = N.getOpcode() == X86ISD::PSHUFLW ? 0 : 2;
        DMask[DOffset + 0] = DOffset + Mask[0] / 2;
diff --git a/test/CodeGen/X86/vector-shuffle-128-v4.ll b/test/CodeGen/X86/vector-shuffle-128-v4.ll

index 7d496fa19f15574b539f3fd3ef794a9bc97c8bab..210d672b5c0fbffa929fc53600ee6d5e48992308 100644 (file)
--- a/test/CodeGen/X86/vector-shuffle-128-v4.ll
+++ b/test/CodeGen/X86/vector-shuffle-128-v4.ll
@@ -17,6 +17,13 @@ define <4 x i32> @shuffle_v4i32_0020(<4 x i32> %a, <4 x i32> %b) {
    %shuffle = shufflevector <4 x i32> %a, <4 x i32> %b, <4 x i32> <i32 0, i32 0, i32 2, i32 0>
    ret <4 x i32> %shuffle
  }
+define <4 x i32> @shuffle_v4i32_0112(<4 x i32> %a, <4 x i32> %b) {
+; CHECK-SSE2-LABEL: @shuffle_v4i32_0112
+; CHECK-SSE2:         pshufd {{.*}} # xmm0 = xmm0[0,1,1,2]
+; CHECK-SSE2-NEXT:    retq
+  %shuffle = shufflevector <4 x i32> %a, <4 x i32> %b, <4 x i32> <i32 0, i32 1, i32 1, i32 2>
+  ret <4 x i32> %shuffle
+}
  define <4 x i32> @shuffle_v4i32_0300(<4 x i32> %a, <4 x i32> %b) {
  ; CHECK-SSE2-LABEL: @shuffle_v4i32_0300
  ; CHECK-SSE2:         pshufd {{.*}} # xmm0 = xmm0[0,3,0,0]
author	Chandler Carruth <chandlerc@gmail.com>
	Thu, 7 Aug 2014 08:11:31 +0000 (08:11 +0000)
committer	Chandler Carruth <chandlerc@gmail.com>
	Thu, 7 Aug 2014 08:11:31 +0000 (08:11 +0000)
lib/Target/X86/X86ISelLowering.cpp		patch | blob | history
test/CodeGen/X86/vector-shuffle-128-v4.ll		patch | blob | history