X-Git-Url: http://plrg.eecs.uci.edu/git/?a=blobdiff_plain;f=test%2FCodeGen%2FX86%2Fvec_set-3.ll;h=a13c813ea7b0f48a833bee5e1c8893473f365e58;hb=828f5b807cc2cec7dc3e25730e3c6bac965d17e2;hp=ff108970ac6b5cbbd6157766a253646e7d687f82;hpb=28beeeac4db2d582d4947db96d62e423e4b68d88;p=oota-llvm.git

NOTE(review): this patch was reconstructed from a whitespace-collapsed export.
  * Line breaks were re-derived from the hunk header (-1,17 +1,37); the
    indentation inside the IR bodies is a best guess -- confirm against upstream.
  * The vector constant operand of %tmp1 in @test3 was missing from the export
    (the angle-bracketed span appears to have been stripped). It is restored
    below as <float 0.000000e+00, float undef, float undef, float undef>, which
    is consistent with the CHECK pattern "zero,xmm0[0],zero,zero" -- TODO confirm
    against the upstream commit.

diff --git a/test/CodeGen/X86/vec_set-3.ll b/test/CodeGen/X86/vec_set-3.ll
index ff108970ac6..a13c813ea7b 100644
--- a/test/CodeGen/X86/vec_set-3.ll
+++ b/test/CodeGen/X86/vec_set-3.ll
@@ -1,17 +1,37 @@
-; RUN: llvm-upgrade < %s | llvm-as | llc -march=x86 -mattr=+sse2 -o %t -f
-; RUN: grep shufps %t | count 1
-; RUN: grep pshufd %t | count 1
+; RUN: llc < %s -march=x86 -mattr=+sse2 -mcpu=penryn | FileCheck %s
 
-<4 x float> %test(float %a) {
-  %tmp = insertelement <4 x float> zeroinitializer, float %a, uint 1
-  %tmp5 = insertelement <4 x float> %tmp, float 0.000000e+00, uint 2
-  %tmp6 = insertelement <4 x float> %tmp5, float 0.000000e+00, uint 3
-  ret <4 x float> %tmp6
+define <4 x float> @test(float %a) {
+; CHECK-LABEL: test:
+; CHECK: insertps $29, {{.*}}, %xmm0
+; CHECK-NEXT: retl
+
+entry:
+  %tmp = insertelement <4 x float> zeroinitializer, float %a, i32 1
+  %tmp5 = insertelement <4 x float> %tmp, float 0.000000e+00, i32 2
+  %tmp6 = insertelement <4 x float> %tmp5, float 0.000000e+00, i32 3
+  ret <4 x float> %tmp6
 }
 
-<2 x long> %test2(int %a) {
-  %tmp7 = insertelement <4 x int> zeroinitializer, int %a, uint 2
-  %tmp9 = insertelement <4 x int> %tmp7, int 0, uint 3
-  %tmp10 = cast <4 x int> %tmp9 to <2 x long>
-  ret <2 x long> %tmp10
+define <2 x i64> @test2(i32 %a) {
+; CHECK-LABEL: test2:
+; CHECK: movd {{.*}}, %xmm0
+; CHECK-NEXT: pshufd {{.*#+}} xmm0 = xmm0[1,1,0,1]
+; CHECK-NEXT: retl
+
+entry:
+  %tmp7 = insertelement <4 x i32> zeroinitializer, i32 %a, i32 2
+  %tmp9 = insertelement <4 x i32> %tmp7, i32 0, i32 3
+  %tmp10 = bitcast <4 x i32> %tmp9 to <2 x i64>
+  ret <2 x i64> %tmp10
+}
+
+define <4 x float> @test3(<4 x float> %A) {
+; CHECK-LABEL: test3:
+; CHECK: insertps {{.*#+}} xmm0 = zero,xmm0[0],zero,zero
+; CHECK-NEXT: retl
+
+  %tmp0 = extractelement <4 x float> %A, i32 0
+  %tmp1 = insertelement <4 x float> <float 0.000000e+00, float undef, float undef, float undef>, float %tmp0, i32 1
+  %tmp2 = insertelement <4 x float> %tmp1, float 0.000000e+00, i32 2
+  ret <4 x float> %tmp2
 }