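4% faster on Sandy Bridge: the unaligned movupd load in the autocorrelation
loop is rebuilt from an aligned movapd load plus movsd/movlhps.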
---
 libavcodec/x86/lpc.c | 10 ++++++----
 1 file changed, 6 insertions(+), 4 deletions(-)

diff --git a/libavcodec/x86/lpc.c b/libavcodec/x86/lpc.c
index 7a37b88..902d364 100644
--- a/libavcodec/x86/lpc.c
+++ b/libavcodec/x86/lpc.c
@@ -124,11 +124,13 @@ static void lpc_compute_autocorr_sse2(const double *data, int len, int lag,
                 "movsd    "MANGLE(pd_1)", %%xmm1    \n\t"
                 "1:                                 \n\t"
                 "movapd   (%3,%0), %%xmm3           \n\t"
-                "movupd -8(%4,%0), %%xmm4           \n\t"
+                "movapd   (%4,%0), %%xmm4           \n\t"
+                "movsd  -8(%4,%0), %%xmm5           \n\t"
+                "movlhps   %%xmm4, %%xmm5           \n\t"
                 "mulpd     %%xmm3, %%xmm4           \n\t"
-                "mulpd    (%4,%0), %%xmm3           \n\t"
-                "addpd     %%xmm4, %%xmm1           \n\t"
-                "addpd     %%xmm3, %%xmm0           \n\t"
+                "mulpd     %%xmm3, %%xmm5           \n\t"
+                "addpd     %%xmm4, %%xmm0           \n\t"
+                "addpd     %%xmm5, %%xmm1           \n\t"
                 "add       $16,    %0               \n\t"
                 "jl 1b                              \n\t"
                 "movhlps   %%xmm0, %%xmm3           \n\t"
-- 
1.8.1.5

_______________________________________________
libav-devel mailing list
libav-devel@libav.org
https://lists.libav.org/mailman/listinfo/libav-devel

Reply via email to