diff options
| author | Chris Lattner <sabre@nondot.org> | 2010-08-28 17:59:08 +0000 |
|---|---|---|
| committer | Chris Lattner <sabre@nondot.org> | 2010-08-28 17:59:08 +0000 |
| commit | 94656b1c8c60994a8bcc6c9b03981a78f0bba3a7 (patch) | |
| tree | e3bc5c3c8b9500f9af2d1cc290a4cc10d59e2003 /llvm/test/CodeGen/X86/vec_insert-9.ll | |
| parent | bcb6090ad0660f018a8365248d5467047f423e39 (diff) | |
| download | bcm5719-llvm-94656b1c8c60994a8bcc6c9b03981a78f0bba3a7.tar.gz bcm5719-llvm-94656b1c8c60994a8bcc6c9b03981a78f0bba3a7.zip | |
Fix the buildvector->insertp[sd] logic so that it no longer always creates a redundant
insertp[sd] $0, which is a no-op. Before:
_f32: ## @f32
pshufd $1, %xmm1, %xmm2
pshufd $1, %xmm0, %xmm3
addss %xmm2, %xmm3
addss %xmm1, %xmm0
## kill: XMM0<def> XMM0<kill> XMM0<def>
insertps $0, %xmm0, %xmm0
insertps $16, %xmm3, %xmm0
ret
after:
_f32: ## @f32
movdqa %xmm0, %xmm2
addss %xmm1, %xmm2
pshufd $1, %xmm1, %xmm1
pshufd $1, %xmm0, %xmm3
addss %xmm1, %xmm3
movdqa %xmm2, %xmm0
insertps $16, %xmm3, %xmm0
ret
The extra movs are due to a random (poor) scheduling decision.
llvm-svn: 112379
Diffstat (limited to 'llvm/test/CodeGen/X86/vec_insert-9.ll')
| -rw-r--r-- | llvm/test/CodeGen/X86/vec_insert-9.ll | 2 |
1 file changed, 1 insertion, 1 deletion
diff --git a/llvm/test/CodeGen/X86/vec_insert-9.ll b/llvm/test/CodeGen/X86/vec_insert-9.ll
index 2e829df1f8d..e5a7ccc5ef9 100644
--- a/llvm/test/CodeGen/X86/vec_insert-9.ll
+++ b/llvm/test/CodeGen/X86/vec_insert-9.ll
@@ -1,5 +1,5 @@
 ; RUN: llc < %s -march=x86 -mattr=+sse41 > %t
-; RUN: grep pinsrd %t | count 2
+; RUN: grep pinsrd %t | count 1
 
 define <4 x i32> @var_insert2(<4 x i32> %x, i32 %val, i32 %idx) nounwind {
 entry:

