projects
/
oota-llvm.git
/ blobdiff
commit
grep
author
committer
pickaxe
?
search:
re
summary
|
shortlog
|
log
|
commit
|
commitdiff
|
tree
raw
|
inline
| side by side
[x86] Implement a faster vector population count based on the PSHUFB
[oota-llvm.git]
/
test
/
CodeGen
/
X86
/
vec_set-3.ll
diff --git
a/test/CodeGen/X86/vec_set-3.ll
b/test/CodeGen/X86/vec_set-3.ll
index 9823963d61b7ed675b90a86410910b0346cf3801..a13c813ea7b0f48a833bee5e1c8893473f365e58 100644
(file)
--- a/
test/CodeGen/X86/vec_set-3.ll
+++ b/
test/CodeGen/X86/vec_set-3.ll
@@
-1,15
+1,9
@@
; RUN: llc < %s -march=x86 -mattr=+sse2 -mcpu=penryn | FileCheck %s
; RUN: llc < %s -march=x86 -mattr=+sse2 -mcpu=penryn | FileCheck %s
-; RUN: llc < %s -march=x86 -mattr=+sse2 -mcpu=penryn -x86-experimental-vector-shuffle-lowering | FileCheck %s --check-prefix=CHECK-EXP
define <4 x float> @test(float %a) {
; CHECK-LABEL: test:
define <4 x float> @test(float %a) {
; CHECK-LABEL: test:
-; CHECK: movss {{.*}}, %xmm0
-; CHECK-NEXT: pshufd {{.*#+}} xmm0 = xmm0[1,0,1,1]
+; CHECK: insertps $29, {{.*}}, %xmm0
; CHECK-NEXT: retl
; CHECK-NEXT: retl
-;
-; CHECK-EXP-LABEL: test:
-; CHECK-EXP: insertps $285, {{.*}}, %xmm0
-; CHECK-EXP-NEXT: retl
entry:
%tmp = insertelement <4 x float> zeroinitializer, float %a, i32 1
entry:
%tmp = insertelement <4 x float> zeroinitializer, float %a, i32 1
@@
-23,11
+17,6
@@
define <2 x i64> @test2(i32 %a) {
; CHECK: movd {{.*}}, %xmm0
; CHECK-NEXT: pshufd {{.*#+}} xmm0 = xmm0[1,1,0,1]
; CHECK-NEXT: retl
; CHECK: movd {{.*}}, %xmm0
; CHECK-NEXT: pshufd {{.*#+}} xmm0 = xmm0[1,1,0,1]
; CHECK-NEXT: retl
-;
-; CHECK-EXP-LABEL: test2:
-; CHECK-EXP: movd {{.*}}, %xmm0
-; CHECK-EXP-NEXT: pshufd {{.*#+}} xmm0 = xmm0[1,1,0,1]
-; CHECK-EXP-NEXT: retl
entry:
%tmp7 = insertelement <4 x i32> zeroinitializer, i32 %a, i32 2
entry:
%tmp7 = insertelement <4 x i32> zeroinitializer, i32 %a, i32 2
@@
-38,14
+27,8
@@
entry:
define <4 x float> @test3(<4 x float> %A) {
; CHECK-LABEL: test3:
define <4 x float> @test3(<4 x float> %A) {
; CHECK-LABEL: test3:
-; CHECK: xorps %[[X1:xmm[0-9]+]], %[[X1]]
-; CHECK-NEXT: movss %xmm0, %[[X1]]
-; CHECK-NEXT: pshufd {{.*#+}} xmm0 = [[X1]][1,0,1,1]
+; CHECK: insertps {{.*#+}} xmm0 = zero,xmm0[0],zero,zero
; CHECK-NEXT: retl
; CHECK-NEXT: retl
-;
-; CHECK-EXP-LABEL: test3:
-; CHECK-EXP: insertps {{.*#+}} xmm0 = zero,xmm0[0],zero,zero
-; CHECK-EXP-NEXT: retl
%tmp0 = extractelement <4 x float> %A, i32 0
%tmp1 = insertelement <4 x float> <float 0.000000e+00, float undef, float undef, float undef >, float %tmp0, i32 1
%tmp0 = extractelement <4 x float> %A, i32 0
%tmp1 = insertelement <4 x float> <float 0.000000e+00, float undef, float undef, float undef >, float %tmp0, i32 1