fix the buildvector->insertp[sd] logic to not always create a redundant
authorChris Lattner <sabre@nondot.org>
Sat, 28 Aug 2010 17:59:08 +0000 (17:59 +0000)
committerChris Lattner <sabre@nondot.org>
Sat, 28 Aug 2010 17:59:08 +0000 (17:59 +0000)
commit24faf611a33900b225c636f908eb30234215af21
treefb412877725cb1019812ce5b68beab763bc9347b
parent3ddcc430401f0d16bee17b2afb52dcaa2f480f8b
fix the buildvector->insertp[sd] logic to not always create a redundant
insertp[sd] $0, which is a noop.  Before:

_f32:                                   ## @f32
pshufd $1, %xmm1, %xmm2
pshufd $1, %xmm0, %xmm3
addss %xmm2, %xmm3
addss %xmm1, %xmm0
                                        ## kill: XMM0<def> XMM0<kill> XMM0<def>
insertps $0, %xmm0, %xmm0
insertps $16, %xmm3, %xmm0
ret

after:

_f32:                                   ## @f32
movdqa %xmm0, %xmm2
addss %xmm1, %xmm2
pshufd $1, %xmm1, %xmm1
pshufd $1, %xmm0, %xmm3
addss %xmm1, %xmm3
movdqa %xmm2, %xmm0
insertps $16, %xmm3, %xmm0
ret

The extra movs are due to a random (poor) scheduling decision.

git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@112379 91177308-0d34-0410-b5e6-96231b3b80d8
lib/Target/X86/X86ISelLowering.cpp
test/CodeGen/X86/2009-02-26-MachineLICMBug.ll
test/CodeGen/X86/sse41.ll
test/CodeGen/X86/vec_insert-9.ll