On Fri, 10 Feb 2017, Janne Grunau wrote:
On 2017-01-15 22:55:51 +0200, Martin Storsjö wrote:
---
libavcodec/aarch64/vp9lpf_neon.S | 16 +++++++++++++---
1 file changed, 13 insertions(+), 3 deletions(-)
diff --git a/libavcodec/aarch64/vp9lpf_neon.S b/libavcodec/aarch64/vp9lpf_neon.S
index 4553173..3894307 100644
--- a/libavcodec/aarch64/vp9lpf_neon.S
+++ b/libavcodec/aarch64/vp9lpf_neon.S
@@ -316,20 +316,30 @@
uxtl_sz v0.8h, v1.8h, v22, \sz // p1
uxtl_sz v2.8h, v3.8h, v25, \sz // q1
+.if \wd >= 8
+ mov x5, v6.d[0]
+.endif
saddw_sz v0.8h, v1.8h, v0.8h, v1.8h, \tmp3, \sz // p1 + f
ssubw_sz v2.8h, v3.8h, v2.8h, v3.8h, \tmp3, \sz // q1 - f
+.if \wd >= 8
+.ifc \sz, .16b
+ mov x6, v6.d[1]
+.endif
+.endif
Is it helpful to have this mov here? It would look a little less ugly if
you merged this .if with the one above.
It doesn't seem to slow things down to move them next to each other, so I
will push it in that form.
// Martin
_______________________________________________
libav-devel mailing list
libav-devel@libav.org
https://lists.libav.org/mailman/listinfo/libav-devel