; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
; RUN: llc < %s -mtriple=x86_64-unknown-linux-gnu -mcpu=corei7 | FileCheck %s

; Test that we correctly fold a shuffle that performs a swizzle of another
; shuffle node according to the rule
;  shuffle (shuffle (x, undef, M0), undef, M1) -> shuffle(x, undef, M2)
;
; We only do this if the resulting mask is legal to avoid introducing an
; illegal shuffle that is expanded into a sub-optimal sequence of instructions
; during lowering stage.
;
; In every function the folded mask is M2[i] = M0[M1[i]], which is the mask
; printed by the single shuffle instruction in the assertions.
;
; NOTE(review): the constant shuffle masks in swizzle_1..swizzle_5 were missing
; from this copy of the file and have been reconstructed so that M0 composed
; with M1 yields the asserted mask -- confirm against the upstream test.

; M0 = [3,2,1,0], M1 = [2,3,0,1]  ->  M2 = [1,0,3,2]
define <4 x i32> @swizzle_1(<4 x i32> %v) {
; CHECK-LABEL: swizzle_1:
; CHECK:       # BB#0:
; CHECK-NEXT:    pshufd {{.*#+}} xmm0 = xmm0[1,0,3,2]
; CHECK-NEXT:    retq
  %1 = shufflevector <4 x i32> %v, <4 x i32> undef, <4 x i32> <i32 3, i32 2, i32 1, i32 0>
  %2 = shufflevector <4 x i32> %1, <4 x i32> undef, <4 x i32> <i32 2, i32 3, i32 0, i32 1>
  ret <4 x i32> %2
}

; M0 = M1 = [3,1,0,2]  ->  M2 = [2,1,3,0]
define <4 x i32> @swizzle_2(<4 x i32> %v) {
; CHECK-LABEL: swizzle_2:
; CHECK:       # BB#0:
; CHECK-NEXT:    pshufd {{.*#+}} xmm0 = xmm0[2,1,3,0]
; CHECK-NEXT:    retq
  %1 = shufflevector <4 x i32> %v, <4 x i32> undef, <4 x i32> <i32 3, i32 1, i32 0, i32 2>
  %2 = shufflevector <4 x i32> %1, <4 x i32> undef, <4 x i32> <i32 3, i32 1, i32 0, i32 2>
  ret <4 x i32> %2
}

; M0 = [2,3,0,1], M1 = [3,2,1,0]  ->  M2 = [1,0,3,2]
define <4 x i32> @swizzle_3(<4 x i32> %v) {
; CHECK-LABEL: swizzle_3:
; CHECK:       # BB#0:
; CHECK-NEXT:    pshufd {{.*#+}} xmm0 = xmm0[1,0,3,2]
; CHECK-NEXT:    retq
  %1 = shufflevector <4 x i32> %v, <4 x i32> undef, <4 x i32> <i32 2, i32 3, i32 0, i32 1>
  %2 = shufflevector <4 x i32> %1, <4 x i32> undef, <4 x i32> <i32 3, i32 2, i32 1, i32 0>
  ret <4 x i32> %2
}

; M0 = M1 = [2,1,3,0]  ->  M2 = [3,1,0,2]
define <4 x i32> @swizzle_4(<4 x i32> %v) {
; CHECK-LABEL: swizzle_4:
; CHECK:       # BB#0:
; CHECK-NEXT:    pshufd {{.*#+}} xmm0 = xmm0[3,1,0,2]
; CHECK-NEXT:    retq
  %1 = shufflevector <4 x i32> %v, <4 x i32> undef, <4 x i32> <i32 2, i32 1, i32 3, i32 0>
  %2 = shufflevector <4 x i32> %1, <4 x i32> undef, <4 x i32> <i32 2, i32 1, i32 3, i32 0>
  ret <4 x i32> %2
}

; M0 = M1 = [3,0,1,2]  ->  M2 = [2,3,0,1]
define <4 x i32> @swizzle_5(<4 x i32> %v) {
; CHECK-LABEL: swizzle_5:
; CHECK:       # BB#0:
; CHECK-NEXT:    pshufd {{.*#+}} xmm0 = xmm0[2,3,0,1]
; CHECK-NEXT:    retq
  %1 = shufflevector <4 x i32> %v, <4 x i32> undef, <4 x i32> <i32 3, i32 0, i32 1, i32 2>
  %2 = shufflevector <4 x i32> %1, <4 x i32> undef, <4 x i32> <i32 3, i32 0, i32 1, i32 2>
  ret <4 x i32> %2
}
; NOTE(review): the constant shuffle masks in swizzle_6..swizzle_29 were
; missing from this copy of the file and have been reconstructed so that the
; composition M2[i] = M0[M1[i]] equals the mask printed in the assertions --
; confirm against the upstream test.

; M0 = M1 = [1,2,0,3]  ->  M2 = [2,0,1,3]
define <4 x i32> @swizzle_6(<4 x i32> %v) {
; CHECK-LABEL: swizzle_6:
; CHECK:       # BB#0:
; CHECK-NEXT:    pshufd {{.*#+}} xmm0 = xmm0[2,0,1,3]
; CHECK-NEXT:    retq
  %1 = shufflevector <4 x i32> %v, <4 x i32> undef, <4 x i32> <i32 1, i32 2, i32 0, i32 3>
  %2 = shufflevector <4 x i32> %1, <4 x i32> undef, <4 x i32> <i32 1, i32 2, i32 0, i32 3>
  ret <4 x i32> %2
}

; M0 = M1 = [0,3,1,2]  ->  M2 = [0,2,3,1]
define <4 x i32> @swizzle_7(<4 x i32> %v) {
; CHECK-LABEL: swizzle_7:
; CHECK:       # BB#0:
; CHECK-NEXT:    pshufd {{.*#+}} xmm0 = xmm0[0,2,3,1]
; CHECK-NEXT:    retq
  %1 = shufflevector <4 x i32> %v, <4 x i32> undef, <4 x i32> <i32 0, i32 3, i32 1, i32 2>
  %2 = shufflevector <4 x i32> %1, <4 x i32> undef, <4 x i32> <i32 0, i32 3, i32 1, i32 2>
  ret <4 x i32> %2
}

; M0 = M1 = [3,0,2,1]  ->  M2 = [1,3,2,0]
define <4 x i32> @swizzle_8(<4 x i32> %v) {
; CHECK-LABEL: swizzle_8:
; CHECK:       # BB#0:
; CHECK-NEXT:    pshufd {{.*#+}} xmm0 = xmm0[1,3,2,0]
; CHECK-NEXT:    retq
  %1 = shufflevector <4 x i32> %v, <4 x i32> undef, <4 x i32> <i32 3, i32 0, i32 2, i32 1>
  %2 = shufflevector <4 x i32> %1, <4 x i32> undef, <4 x i32> <i32 3, i32 0, i32 2, i32 1>
  ret <4 x i32> %2
}

; M0 = M1 = [1,2,3,0]  ->  M2 = [2,3,0,1]
define <4 x i32> @swizzle_9(<4 x i32> %v) {
; CHECK-LABEL: swizzle_9:
; CHECK:       # BB#0:
; CHECK-NEXT:    pshufd {{.*#+}} xmm0 = xmm0[2,3,0,1]
; CHECK-NEXT:    retq
  %1 = shufflevector <4 x i32> %v, <4 x i32> undef, <4 x i32> <i32 1, i32 2, i32 3, i32 0>
  %2 = shufflevector <4 x i32> %1, <4 x i32> undef, <4 x i32> <i32 1, i32 2, i32 3, i32 0>
  ret <4 x i32> %2
}

; M0 = M1 = [2,0,1,3]  ->  M2 = [1,2,0,3]
define <4 x i32> @swizzle_10(<4 x i32> %v) {
; CHECK-LABEL: swizzle_10:
; CHECK:       # BB#0:
; CHECK-NEXT:    pshufd {{.*#+}} xmm0 = xmm0[1,2,0,3]
; CHECK-NEXT:    retq
  %1 = shufflevector <4 x i32> %v, <4 x i32> undef, <4 x i32> <i32 2, i32 0, i32 1, i32 3>
  %2 = shufflevector <4 x i32> %1, <4 x i32> undef, <4 x i32> <i32 2, i32 0, i32 1, i32 3>
  ret <4 x i32> %2
}

; M0 = M1 = [1,3,0,2]  ->  M2 = [3,2,1,0]
define <4 x i32> @swizzle_11(<4 x i32> %v) {
; CHECK-LABEL: swizzle_11:
; CHECK:       # BB#0:
; CHECK-NEXT:    pshufd {{.*#+}} xmm0 = xmm0[3,2,1,0]
; CHECK-NEXT:    retq
  %1 = shufflevector <4 x i32> %v, <4 x i32> undef, <4 x i32> <i32 1, i32 3, i32 0, i32 2>
  %2 = shufflevector <4 x i32> %1, <4 x i32> undef, <4 x i32> <i32 1, i32 3, i32 0, i32 2>
  ret <4 x i32> %2
}

; M0 = M1 = [0,2,3,1]  ->  M2 = [0,3,1,2]
define <4 x i32> @swizzle_12(<4 x i32> %v) {
; CHECK-LABEL: swizzle_12:
; CHECK:       # BB#0:
; CHECK-NEXT:    pshufd {{.*#+}} xmm0 = xmm0[0,3,1,2]
; CHECK-NEXT:    retq
  %1 = shufflevector <4 x i32> %v, <4 x i32> undef, <4 x i32> <i32 0, i32 2, i32 3, i32 1>
  %2 = shufflevector <4 x i32> %1, <4 x i32> undef, <4 x i32> <i32 0, i32 2, i32 3, i32 1>
  ret <4 x i32> %2
}

; M0 = M1 = [2,0,3,1]  ->  M2 = [3,2,1,0]
define <4 x i32> @swizzle_13(<4 x i32> %v) {
; CHECK-LABEL: swizzle_13:
; CHECK:       # BB#0:
; CHECK-NEXT:    pshufd {{.*#+}} xmm0 = xmm0[3,2,1,0]
; CHECK-NEXT:    retq
  %1 = shufflevector <4 x i32> %v, <4 x i32> undef, <4 x i32> <i32 2, i32 0, i32 3, i32 1>
  %2 = shufflevector <4 x i32> %1, <4 x i32> undef, <4 x i32> <i32 2, i32 0, i32 3, i32 1>
  ret <4 x i32> %2
}

; M0 = M1 = [1,3,2,0]  ->  M2 = [3,0,2,1]
define <4 x i32> @swizzle_14(<4 x i32> %v) {
; CHECK-LABEL: swizzle_14:
; CHECK:       # BB#0:
; CHECK-NEXT:    pshufd {{.*#+}} xmm0 = xmm0[3,0,2,1]
; CHECK-NEXT:    retq
  %1 = shufflevector <4 x i32> %v, <4 x i32> undef, <4 x i32> <i32 1, i32 3, i32 2, i32 0>
  %2 = shufflevector <4 x i32> %1, <4 x i32> undef, <4 x i32> <i32 1, i32 3, i32 2, i32 0>
  ret <4 x i32> %2
}

; The <4 x float> functions below repeat the same mask pairs as the <4 x i32>
; functions above; the assertions expect shufps/shufpd instead of pshufd.

; M0 = [3,2,1,0], M1 = [2,3,0,1]  ->  M2 = [1,0,3,2]
define <4 x float> @swizzle_15(<4 x float> %v) {
; CHECK-LABEL: swizzle_15:
; CHECK:       # BB#0:
; CHECK-NEXT:    shufps {{.*#+}} xmm0 = xmm0[1,0,3,2]
; CHECK-NEXT:    retq
  %1 = shufflevector <4 x float> %v, <4 x float> undef, <4 x i32> <i32 3, i32 2, i32 1, i32 0>
  %2 = shufflevector <4 x float> %1, <4 x float> undef, <4 x i32> <i32 2, i32 3, i32 0, i32 1>
  ret <4 x float> %2
}

; M0 = M1 = [3,1,0,2]  ->  M2 = [2,1,3,0]
define <4 x float> @swizzle_16(<4 x float> %v) {
; CHECK-LABEL: swizzle_16:
; CHECK:       # BB#0:
; CHECK-NEXT:    shufps {{.*#+}} xmm0 = xmm0[2,1,3,0]
; CHECK-NEXT:    retq
  %1 = shufflevector <4 x float> %v, <4 x float> undef, <4 x i32> <i32 3, i32 1, i32 0, i32 2>
  %2 = shufflevector <4 x float> %1, <4 x float> undef, <4 x i32> <i32 3, i32 1, i32 0, i32 2>
  ret <4 x float> %2
}

; M0 = [2,3,0,1], M1 = [3,2,1,0]  ->  M2 = [1,0,3,2]
define <4 x float> @swizzle_17(<4 x float> %v) {
; CHECK-LABEL: swizzle_17:
; CHECK:       # BB#0:
; CHECK-NEXT:    shufps {{.*#+}} xmm0 = xmm0[1,0,3,2]
; CHECK-NEXT:    retq
  %1 = shufflevector <4 x float> %v, <4 x float> undef, <4 x i32> <i32 2, i32 3, i32 0, i32 1>
  %2 = shufflevector <4 x float> %1, <4 x float> undef, <4 x i32> <i32 3, i32 2, i32 1, i32 0>
  ret <4 x float> %2
}

; M0 = M1 = [2,1,3,0]  ->  M2 = [3,1,0,2]
define <4 x float> @swizzle_18(<4 x float> %v) {
; CHECK-LABEL: swizzle_18:
; CHECK:       # BB#0:
; CHECK-NEXT:    shufps {{.*#+}} xmm0 = xmm0[3,1,0,2]
; CHECK-NEXT:    retq
  %1 = shufflevector <4 x float> %v, <4 x float> undef, <4 x i32> <i32 2, i32 1, i32 3, i32 0>
  %2 = shufflevector <4 x float> %1, <4 x float> undef, <4 x i32> <i32 2, i32 1, i32 3, i32 0>
  ret <4 x float> %2
}

; M0 = M1 = [3,0,1,2]  ->  M2 = [2,3,0,1]
; The folded mask swaps the two 64-bit halves, hence the shufpd [1,0].
define <4 x float> @swizzle_19(<4 x float> %v) {
; CHECK-LABEL: swizzle_19:
; CHECK:       # BB#0:
; CHECK-NEXT:    shufpd {{.*#+}} xmm0 = xmm0[1,0]
; CHECK-NEXT:    retq
  %1 = shufflevector <4 x float> %v, <4 x float> undef, <4 x i32> <i32 3, i32 0, i32 1, i32 2>
  %2 = shufflevector <4 x float> %1, <4 x float> undef, <4 x i32> <i32 3, i32 0, i32 1, i32 2>
  ret <4 x float> %2
}

; M0 = M1 = [1,2,0,3]  ->  M2 = [2,0,1,3]
define <4 x float> @swizzle_20(<4 x float> %v) {
; CHECK-LABEL: swizzle_20:
; CHECK:       # BB#0:
; CHECK-NEXT:    shufps {{.*#+}} xmm0 = xmm0[2,0,1,3]
; CHECK-NEXT:    retq
  %1 = shufflevector <4 x float> %v, <4 x float> undef, <4 x i32> <i32 1, i32 2, i32 0, i32 3>
  %2 = shufflevector <4 x float> %1, <4 x float> undef, <4 x i32> <i32 1, i32 2, i32 0, i32 3>
  ret <4 x float> %2
}

; M0 = M1 = [0,3,1,2]  ->  M2 = [0,2,3,1]
define <4 x float> @swizzle_21(<4 x float> %v) {
; CHECK-LABEL: swizzle_21:
; CHECK:       # BB#0:
; CHECK-NEXT:    shufps {{.*#+}} xmm0 = xmm0[0,2,3,1]
; CHECK-NEXT:    retq
  %1 = shufflevector <4 x float> %v, <4 x float> undef, <4 x i32> <i32 0, i32 3, i32 1, i32 2>
  %2 = shufflevector <4 x float> %1, <4 x float> undef, <4 x i32> <i32 0, i32 3, i32 1, i32 2>
  ret <4 x float> %2
}

; M0 = M1 = [3,0,2,1]  ->  M2 = [1,3,2,0]
define <4 x float> @swizzle_22(<4 x float> %v) {
; CHECK-LABEL: swizzle_22:
; CHECK:       # BB#0:
; CHECK-NEXT:    shufps {{.*#+}} xmm0 = xmm0[1,3,2,0]
; CHECK-NEXT:    retq
  %1 = shufflevector <4 x float> %v, <4 x float> undef, <4 x i32> <i32 3, i32 0, i32 2, i32 1>
  %2 = shufflevector <4 x float> %1, <4 x float> undef, <4 x i32> <i32 3, i32 0, i32 2, i32 1>
  ret <4 x float> %2
}

; M0 = M1 = [1,2,3,0]  ->  M2 = [2,3,0,1]
; The folded mask swaps the two 64-bit halves, hence the shufpd [1,0].
define <4 x float> @swizzle_23(<4 x float> %v) {
; CHECK-LABEL: swizzle_23:
; CHECK:       # BB#0:
; CHECK-NEXT:    shufpd {{.*#+}} xmm0 = xmm0[1,0]
; CHECK-NEXT:    retq
  %1 = shufflevector <4 x float> %v, <4 x float> undef, <4 x i32> <i32 1, i32 2, i32 3, i32 0>
  %2 = shufflevector <4 x float> %1, <4 x float> undef, <4 x i32> <i32 1, i32 2, i32 3, i32 0>
  ret <4 x float> %2
}

; M0 = M1 = [2,0,1,3]  ->  M2 = [1,2,0,3]
define <4 x float> @swizzle_24(<4 x float> %v) {
; CHECK-LABEL: swizzle_24:
; CHECK:       # BB#0:
; CHECK-NEXT:    shufps {{.*#+}} xmm0 = xmm0[1,2,0,3]
; CHECK-NEXT:    retq
  %1 = shufflevector <4 x float> %v, <4 x float> undef, <4 x i32> <i32 2, i32 0, i32 1, i32 3>
  %2 = shufflevector <4 x float> %1, <4 x float> undef, <4 x i32> <i32 2, i32 0, i32 1, i32 3>
  ret <4 x float> %2
}

; M0 = M1 = [1,3,0,2]  ->  M2 = [3,2,1,0]
define <4 x float> @swizzle_25(<4 x float> %v) {
; CHECK-LABEL: swizzle_25:
; CHECK:       # BB#0:
; CHECK-NEXT:    shufps {{.*#+}} xmm0 = xmm0[3,2,1,0]
; CHECK-NEXT:    retq
  %1 = shufflevector <4 x float> %v, <4 x float> undef, <4 x i32> <i32 1, i32 3, i32 0, i32 2>
  %2 = shufflevector <4 x float> %1, <4 x float> undef, <4 x i32> <i32 1, i32 3, i32 0, i32 2>
  ret <4 x float> %2
}

; M0 = M1 = [0,2,3,1]  ->  M2 = [0,3,1,2]
define <4 x float> @swizzle_26(<4 x float> %v) {
; CHECK-LABEL: swizzle_26:
; CHECK:       # BB#0:
; CHECK-NEXT:    shufps {{.*#+}} xmm0 = xmm0[0,3,1,2]
; CHECK-NEXT:    retq
  %1 = shufflevector <4 x float> %v, <4 x float> undef, <4 x i32> <i32 0, i32 2, i32 3, i32 1>
  %2 = shufflevector <4 x float> %1, <4 x float> undef, <4 x i32> <i32 0, i32 2, i32 3, i32 1>
  ret <4 x float> %2
}

; M0 = M1 = [2,0,3,1]  ->  M2 = [3,2,1,0]
define <4 x float> @swizzle_27(<4 x float> %v) {
; CHECK-LABEL: swizzle_27:
; CHECK:       # BB#0:
; CHECK-NEXT:    shufps {{.*#+}} xmm0 = xmm0[3,2,1,0]
; CHECK-NEXT:    retq
  %1 = shufflevector <4 x float> %v, <4 x float> undef, <4 x i32> <i32 2, i32 0, i32 3, i32 1>
  %2 = shufflevector <4 x float> %1, <4 x float> undef, <4 x i32> <i32 2, i32 0, i32 3, i32 1>
  ret <4 x float> %2
}

; M0 = M1 = [1,3,2,0]  ->  M2 = [3,0,2,1]
define <4 x float> @swizzle_28(<4 x float> %v) {
; CHECK-LABEL: swizzle_28:
; CHECK:       # BB#0:
; CHECK-NEXT:    shufps {{.*#+}} xmm0 = xmm0[3,0,2,1]
; CHECK-NEXT:    retq
  %1 = shufflevector <4 x float> %v, <4 x float> undef, <4 x i32> <i32 1, i32 3, i32 2, i32 0>
  %2 = shufflevector <4 x float> %1, <4 x float> undef, <4 x i32> <i32 1, i32 3, i32 2, i32 0>
  ret <4 x float> %2
}

; M0 = [3,1,2,0], M1 = [1,0,2,3]  ->  M2 = [1,3,2,0]
define <4 x float> @swizzle_29(<4 x float> %v) {
; CHECK-LABEL: swizzle_29:
; CHECK:       # BB#0:
; CHECK-NEXT:    shufps {{.*#+}} xmm0 = xmm0[1,3,2,0]
; CHECK-NEXT:    retq
  %1 = shufflevector <4 x float> %v, <4 x float> undef, <4 x i32> <i32 3, i32 1, i32 2, i32 0>
  %2 = shufflevector <4 x float> %1, <4 x float> undef, <4 x i32> <i32 1, i32 0, i32 2, i32 3>
  ret <4 x float> %2
}

; Make sure that we combine the shuffles from each function below into a single
; legal shuffle (either pshuflw or pshufb depending on the masks).
; NOTE(review): the constant shuffle masks in swizzle_30..swizzle_42 were
; missing from this copy of the file and have been reconstructed so that the
; composition M2[i] = M0[M1[i]] equals the word permutation described by the
; pshuflw / pshufhw / pshufd assertions -- confirm against the upstream test.

; M0 = [3,1,2,0,7,5,6,4], M1 = [1,0,2,3,7,5,6,4]  ->  M2 = [1,3,2,0,4,5,6,7]
define <8 x i16> @swizzle_30(<8 x i16> %v) {
; CHECK-LABEL: swizzle_30:
; CHECK:       # BB#0:
; CHECK-NEXT:    pshuflw {{.*#+}} xmm0 = xmm0[1,3,2,0,4,5,6,7]
; CHECK-NEXT:    retq
  %1 = shufflevector <8 x i16> %v, <8 x i16> undef, <8 x i32> <i32 3, i32 1, i32 2, i32 0, i32 7, i32 5, i32 6, i32 4>
  %2 = shufflevector <8 x i16> %1, <8 x i16> undef, <8 x i32> <i32 1, i32 0, i32 2, i32 3, i32 7, i32 5, i32 6, i32 4>
  ret <8 x i16> %2
}

; M0 = M1 = [3,0,2,1,7,5,6,4]  ->  M2 = [1,3,2,0,4,5,6,7]
define <8 x i16> @swizzle_31(<8 x i16> %v) {
; CHECK-LABEL: swizzle_31:
; CHECK:       # BB#0:
; CHECK-NEXT:    pshuflw {{.*#+}} xmm0 = xmm0[1,3,2,0,4,5,6,7]
; CHECK-NEXT:    retq
  %1 = shufflevector <8 x i16> %v, <8 x i16> undef, <8 x i32> <i32 3, i32 0, i32 2, i32 1, i32 7, i32 5, i32 6, i32 4>
  %2 = shufflevector <8 x i16> %1, <8 x i16> undef, <8 x i32> <i32 3, i32 0, i32 2, i32 1, i32 7, i32 5, i32 6, i32 4>
  ret <8 x i16> %2
}

; M0 = M1 = [1,2,3,0,7,5,6,4]  ->  M2 = [2,3,0,1,4,5,6,7]
; The folded mask swaps the two low 32-bit lanes, hence pshufd [1,0,2,3].
define <8 x i16> @swizzle_32(<8 x i16> %v) {
; CHECK-LABEL: swizzle_32:
; CHECK:       # BB#0:
; CHECK-NEXT:    pshufd {{.*#+}} xmm0 = xmm0[1,0,2,3]
; CHECK-NEXT:    retq
  %1 = shufflevector <8 x i16> %v, <8 x i16> undef, <8 x i32> <i32 1, i32 2, i32 3, i32 0, i32 7, i32 5, i32 6, i32 4>
  %2 = shufflevector <8 x i16> %1, <8 x i16> undef, <8 x i32> <i32 1, i32 2, i32 3, i32 0, i32 7, i32 5, i32 6, i32 4>
  ret <8 x i16> %2
}

; M0 = M1 = [4,6,5,7,2,3,1,0]  ->  M2 = [2,1,3,0,5,7,6,4]
define <8 x i16> @swizzle_33(<8 x i16> %v) {
; CHECK-LABEL: swizzle_33:
; CHECK:       # BB#0:
; CHECK-NEXT:    pshuflw {{.*#+}} xmm0 = xmm0[2,1,3,0,4,5,6,7]
; CHECK-NEXT:    pshufhw {{.*#+}} xmm0 = xmm0[0,1,2,3,5,7,6,4]
; CHECK-NEXT:    retq
  %1 = shufflevector <8 x i16> %v, <8 x i16> undef, <8 x i32> <i32 4, i32 6, i32 5, i32 7, i32 2, i32 3, i32 1, i32 0>
  %2 = shufflevector <8 x i16> %1, <8 x i16> undef, <8 x i32> <i32 4, i32 6, i32 5, i32 7, i32 2, i32 3, i32 1, i32 0>
  ret <8 x i16> %2
}

; M0 = M1 = [4,7,6,5,1,2,0,3]  ->  M2 = [1,3,0,2,7,6,4,5]
define <8 x i16> @swizzle_34(<8 x i16> %v) {
; CHECK-LABEL: swizzle_34:
; CHECK:       # BB#0:
; CHECK-NEXT:    pshuflw {{.*#+}} xmm0 = xmm0[1,3,0,2,4,5,6,7]
; CHECK-NEXT:    pshufhw {{.*#+}} xmm0 = xmm0[0,1,2,3,7,6,4,5]
; CHECK-NEXT:    retq
  %1 = shufflevector <8 x i16> %v, <8 x i16> undef, <8 x i32> <i32 4, i32 7, i32 6, i32 5, i32 1, i32 2, i32 0, i32 3>
  %2 = shufflevector <8 x i16> %1, <8 x i16> undef, <8 x i32> <i32 4, i32 7, i32 6, i32 5, i32 1, i32 2, i32 0, i32 3>
  ret <8 x i16> %2
}

; M0 = M1 = [7,4,6,5,1,3,0,2]  ->  M2 = [2,1,0,3,4,5,7,6]
define <8 x i16> @swizzle_35(<8 x i16> %v) {
; CHECK-LABEL: swizzle_35:
; CHECK:       # BB#0:
; CHECK-NEXT:    pshuflw {{.*#+}} xmm0 = xmm0[2,1,0,3,4,5,6,7]
; CHECK-NEXT:    pshufhw {{.*#+}} xmm0 = xmm0[0,1,2,3,4,5,7,6]
; CHECK-NEXT:    retq
  %1 = shufflevector <8 x i16> %v, <8 x i16> undef, <8 x i32> <i32 7, i32 4, i32 6, i32 5, i32 1, i32 3, i32 0, i32 2>
  %2 = shufflevector <8 x i16> %1, <8 x i16> undef, <8 x i32> <i32 7, i32 4, i32 6, i32 5, i32 1, i32 3, i32 0, i32 2>
  ret <8 x i16> %2
}

; M0 = M1 = [4,6,7,5,0,1,3,2]  ->  M2 = [0,3,2,1,4,6,5,7]
define <8 x i16> @swizzle_36(<8 x i16> %v) {
; CHECK-LABEL: swizzle_36:
; CHECK:       # BB#0:
; CHECK-NEXT:    pshuflw {{.*#+}} xmm0 = xmm0[0,3,2,1,4,5,6,7]
; CHECK-NEXT:    pshufhw {{.*#+}} xmm0 = xmm0[0,1,2,3,4,6,5,7]
; CHECK-NEXT:    retq
  %1 = shufflevector <8 x i16> %v, <8 x i16> undef, <8 x i32> <i32 4, i32 6, i32 7, i32 5, i32 0, i32 1, i32 3, i32 2>
  %2 = shufflevector <8 x i16> %1, <8 x i16> undef, <8 x i32> <i32 4, i32 6, i32 7, i32 5, i32 0, i32 1, i32 3, i32 2>
  ret <8 x i16> %2
}

; M0 = [0,1,2,3,4,6,5,7], M1 = [0,1,2,3,4,7,5,6]  ->  M2 = [0,1,2,3,4,7,6,5]
; The folded mask is a single transposition, so the two masks must differ.
define <8 x i16> @swizzle_37(<8 x i16> %v) {
; CHECK-LABEL: swizzle_37:
; CHECK:       # BB#0:
; CHECK-NEXT:    pshufhw {{.*#+}} xmm0 = xmm0[0,1,2,3,4,7,6,5]
; CHECK-NEXT:    retq
  %1 = shufflevector <8 x i16> %v, <8 x i16> undef, <8 x i32> <i32 0, i32 1, i32 2, i32 3, i32 4, i32 6, i32 5, i32 7>
  %2 = shufflevector <8 x i16> %1, <8 x i16> undef, <8 x i32> <i32 0, i32 1, i32 2, i32 3, i32 4, i32 7, i32 5, i32 6>
  ret <8 x i16> %2
}

; M0 = M1 = [5,6,4,7,0,2,1,3]  ->  M2 = [2,1,0,3,5,4,6,7]
define <8 x i16> @swizzle_38(<8 x i16> %v) {
; CHECK-LABEL: swizzle_38:
; CHECK:       # BB#0:
; CHECK-NEXT:    pshuflw {{.*#+}} xmm0 = xmm0[2,1,0,3,4,5,6,7]
; CHECK-NEXT:    pshufhw {{.*#+}} xmm0 = xmm0[0,1,2,3,5,4,6,7]
; CHECK-NEXT:    retq
  %1 = shufflevector <8 x i16> %v, <8 x i16> undef, <8 x i32> <i32 5, i32 6, i32 4, i32 7, i32 0, i32 2, i32 1, i32 3>
  %2 = shufflevector <8 x i16> %1, <8 x i16> undef, <8 x i32> <i32 5, i32 6, i32 4, i32 7, i32 0, i32 2, i32 1, i32 3>
  ret <8 x i16> %2
}

; M0 = M1 = [4,5,7,6,2,3,0,1]  ->  M2 = [2,3,1,0,7,6,4,5]
define <8 x i16> @swizzle_39(<8 x i16> %v) {
; CHECK-LABEL: swizzle_39:
; CHECK:       # BB#0:
; CHECK-NEXT:    pshuflw {{.*#+}} xmm0 = xmm0[2,3,1,0,4,5,6,7]
; CHECK-NEXT:    pshufhw {{.*#+}} xmm0 = xmm0[0,1,2,3,7,6,4,5]
; CHECK-NEXT:    retq
  %1 = shufflevector <8 x i16> %v, <8 x i16> undef, <8 x i32> <i32 4, i32 5, i32 7, i32 6, i32 2, i32 3, i32 0, i32 1>
  %2 = shufflevector <8 x i16> %1, <8 x i16> undef, <8 x i32> <i32 4, i32 5, i32 7, i32 6, i32 2, i32 3, i32 0, i32 1>
  ret <8 x i16> %2
}

; M0 = M1 = [5,4,7,6,1,3,0,2]  ->  M2 = [3,1,2,0,4,6,5,7]
define <8 x i16> @swizzle_40(<8 x i16> %v) {
; CHECK-LABEL: swizzle_40:
; CHECK:       # BB#0:
; CHECK-NEXT:    pshuflw {{.*#+}} xmm0 = xmm0[3,1,2,0,4,5,6,7]
; CHECK-NEXT:    pshufhw {{.*#+}} xmm0 = xmm0[0,1,2,3,4,6,5,7]
; CHECK-NEXT:    retq
  %1 = shufflevector <8 x i16> %v, <8 x i16> undef, <8 x i32> <i32 5, i32 4, i32 7, i32 6, i32 1, i32 3, i32 0, i32 2>
  %2 = shufflevector <8 x i16> %1, <8 x i16> undef, <8 x i32> <i32 5, i32 4, i32 7, i32 6, i32 1, i32 3, i32 0, i32 2>
  ret <8 x i16> %2
}

; M0 = M1 = [4,5,7,6,3,2,0,1]  ->  M2 = [3,2,1,0,6,7,4,5]
; The high half of the folded mask swaps two whole 32-bit lanes, which the
; assertions expect as pshufd [0,1,3,2] after the pshuflw.
define <8 x i16> @swizzle_41(<8 x i16> %v) {
; CHECK-LABEL: swizzle_41:
; CHECK:       # BB#0:
; CHECK-NEXT:    pshuflw {{.*#+}} xmm0 = xmm0[3,2,1,0,4,5,6,7]
; CHECK-NEXT:    pshufd {{.*#+}} xmm0 = xmm0[0,1,3,2]
; CHECK-NEXT:    retq
  %1 = shufflevector <8 x i16> %v, <8 x i16> undef, <8 x i32> <i32 4, i32 5, i32 7, i32 6, i32 3, i32 2, i32 0, i32 1>
  %2 = shufflevector <8 x i16> %1, <8 x i16> undef, <8 x i32> <i32 4, i32 5, i32 7, i32 6, i32 3, i32 2, i32 0, i32 1>
  ret <8 x i16> %2
}

; M0 = M1 = [0,1,2,3,6,7,5,4]  ->  M2 = [0,1,2,3,5,4,7,6]
define <8 x i16> @swizzle_42(<8 x i16> %v) {
; CHECK-LABEL: swizzle_42:
; CHECK:       # BB#0:
; CHECK-NEXT:    pshufhw {{.*#+}} xmm0 = xmm0[0,1,2,3,5,4,7,6]
; CHECK-NEXT:    retq
  %1 = shufflevector <8 x i16> %v, <8 x i16> undef, <8 x i32> <i32 0, i32 1, i32 2, i32 3, i32 6, i32 7, i32 5, i32 4>
  %2 = shufflevector <8 x i16> %1, <8 x i16> undef, <8 x i32> <i32 0, i32 1, i32 2, i32 3, i32 6, i32 7, i32 5, i32 4>
  ret <8 x i16> %2
}