4% faster on Sandy Bridge: the unaligned movupd load is replaced by an aligned movapd plus a movsd/movlhps pair.
---
libavcodec/x86/lpc.c | 10 ++++++----
1 file changed, 6 insertions(+), 4 deletions(-)
diff --git a/libavcodec/x86/lpc.c b/libavcodec/x86/lpc.c
index 7a37b88..902d364 100644
--- a/libavcodec/x86/lpc.c
+++ b/libavcodec/x86/lpc.c
@@ -124,11 +124,13 @@ static void lpc_compute_autocorr_sse2(const double *data, int len, int lag,
"movsd "MANGLE(pd_1)", %%xmm1 \n\t"
"1: \n\t"
"movapd (%3,%0), %%xmm3 \n\t"
- "movupd -8(%4,%0), %%xmm4 \n\t"
+ "movapd (%4,%0), %%xmm4 \n\t"
+ "movsd -8(%4,%0), %%xmm5 \n\t"
+ "movlhps %%xmm4, %%xmm5 \n\t"
"mulpd %%xmm3, %%xmm4 \n\t"
- "mulpd (%4,%0), %%xmm3 \n\t"
- "addpd %%xmm4, %%xmm1 \n\t"
- "addpd %%xmm3, %%xmm0 \n\t"
+ "mulpd %%xmm3, %%xmm5 \n\t"
+ "addpd %%xmm4, %%xmm0 \n\t"
+ "addpd %%xmm5, %%xmm1 \n\t"
"add $16, %0 \n\t"
"jl 1b \n\t"
"movhlps %%xmm0, %%xmm3 \n\t"
--
1.8.1.5
_______________________________________________
libav-devel mailing list
[email protected]
https://lists.libav.org/mailman/listinfo/libav-devel