; RUN: llc < %s -march=x86 -mattr=+sse2 -mcpu=penryn | FileCheck %s ; RUN: llc < %s -march=x86 -mattr=+sse2 -mcpu=penryn -x86-experimental-vector-shuffle-lowering | FileCheck %s --check-prefix=CHECK-EXP define <4 x float> @test(float %a) { ; CHECK-LABEL: test: ; CHECK: movss {{.*}}, %xmm0 ; CHECK-NEXT: pshufd {{.*#+}} xmm0 = xmm0[1,0,1,1] ; CHECK-NEXT: retl ; ; CHECK-EXP-LABEL: test: ; CHECK-EXP: insertps $285, {{.*}}, %xmm0 ; CHECK-EXP-NEXT: retl entry: %tmp = insertelement <4 x float> zeroinitializer, float %a, i32 1 %tmp5 = insertelement <4 x float> %tmp, float 0.000000e+00, i32 2 %tmp6 = insertelement <4 x float> %tmp5, float 0.000000e+00, i32 3 ret <4 x float> %tmp6 } define <2 x i64> @test2(i32 %a) { ; CHECK-LABEL: test2: ; CHECK: movd {{.*}}, %xmm0 ; CHECK-NEXT: pshufd {{.*#+}} xmm0 = xmm0[1,1,0,1] ; CHECK-NEXT: retl ; ; CHECK-EXP-LABEL: test2: ; CHECK-EXP: movd {{.*}}, %xmm0 ; CHECK-EXP-NEXT: pshufd {{.*#+}} xmm0 = xmm0[1,1,0,1] ; CHECK-EXP-NEXT: retl entry: %tmp7 = insertelement <4 x i32> zeroinitializer, i32 %a, i32 2 %tmp9 = insertelement <4 x i32> %tmp7, i32 0, i32 3 %tmp10 = bitcast <4 x i32> %tmp9 to <2 x i64> ret <2 x i64> %tmp10 } define <4 x float> @test3(<4 x float> %A) { ; CHECK-LABEL: test3: ; CHECK: xorps %[[X1:xmm[0-9]+]], %[[X1]] ; CHECK-NEXT: movss %xmm0, %[[X1]] ; CHECK-NEXT: pshufd {{.*#+}} xmm0 = [[X1]][1,0,1,1] ; CHECK-NEXT: retl ; ; CHECK-EXP-LABEL: test3: ; CHECK-EXP: insertps {{.*#+}} xmm0 = zero,xmm0[0],zero,zero ; CHECK-EXP-NEXT: retl %tmp0 = extractelement <4 x float> %A, i32 0 %tmp1 = insertelement <4 x float> , float %tmp0, i32 1 %tmp2 = insertelement <4 x float> %tmp1, float 0.000000e+00, i32 2 ret <4 x float> %tmp2 }