This is an automated email from the git hooks/post-receive script. Git pushed a commit to branch master in repository ffmpeg.
commit c898ddb8fede853027a7c9458d928900d5db6e38 Author: Andreas Rheinhardt <[email protected]> AuthorDate: Mon Jan 26 03:21:48 2026 +0100 Commit: Andreas Rheinhardt <[email protected]> CommitDate: Thu Jan 29 01:33:40 2026 +0100 avcodec/x86/cfhddsp: Reduce number of xmm registers used Reviewed-by: James Almer <[email protected]> Signed-off-by: Andreas Rheinhardt <[email protected]> --- libavcodec/x86/cfhddsp.asm | 68 +++++++++++++++++++++++----------------------- 1 file changed, 34 insertions(+), 34 deletions(-) diff --git a/libavcodec/x86/cfhddsp.asm b/libavcodec/x86/cfhddsp.asm index 821d511ba2..01ba00f8a6 100644 --- a/libavcodec/x86/cfhddsp.asm +++ b/libavcodec/x86/cfhddsp.asm @@ -36,20 +36,20 @@ SECTION .text %macro CFHD_HORIZ_FILTER 1 %if %1 == 1023 -cglobal cfhd_horiz_filter_clip10, 5, 6, 8 + 4 * ARCH_X86_64, output, low, high, width, x, temp +cglobal cfhd_horiz_filter_clip10, 5, 6, 8 + 3 * ARCH_X86_64, output, low, high, width, x, temp shl widthd, 1 %define ostrideq widthq %define lwidthq widthq %define hwidthq widthq %elif %1 == 4095 -cglobal cfhd_horiz_filter_clip12, 5, 6, 8 + 4 * ARCH_X86_64, output, low, high, width, x, temp +cglobal cfhd_horiz_filter_clip12, 5, 6, 8 + 3 * ARCH_X86_64, output, low, high, width, x, temp shl widthd, 1 %define ostrideq widthq %define lwidthq widthq %define hwidthq widthq %else %if ARCH_X86_64 -cglobal cfhd_horiz_filter, 8, 11, 12, output, ostride, low, lwidth, high, hwidth, width, height, x, y, temp +cglobal cfhd_horiz_filter, 8, 11, 11, output, ostride, low, lwidth, high, hwidth, width, height, x, y, temp shl ostrided, 1 shl lwidthd, 1 shl hwidthd, 1 @@ -79,8 +79,8 @@ cglobal cfhd_horiz_filter, 7, 7, 8, output, x, low, y, high, temp, width, height %if ARCH_X86_64 mova m8, [factor_p1_n1] - mova m10, [pw_1] - mova m11, [pd_4] + mova m9, [pw_1] + mova m10, [pd_4] %endif %if %1 == 0 @@ -146,10 +146,10 @@ cglobal cfhd_horiz_filter, 7, 7, 8, output, x, low, y, high, temp, width, height pmaddwd m4, m8 pmaddwd m5, m8 - psubd m6, m11, m4 - psubd m7, m11, m5 - paddd m4, m11 - paddd m5, m11 + psubd m6, m10, m4 + psubd m7, m10, m5 + paddd m4, m10 + paddd m5, m10 %else mova m2, [pd_4] pmaddwd m4, [factor_p1_n1] @@ -177,8 +177,8 @@ cglobal cfhd_horiz_filter, 7, 7, 8, output, x, low, y, high, temp, width, height mova m3, m0 %if ARCH_X86_64 - pmaddwd m2, m10 - pmaddwd m0, m10 + pmaddwd m2, m9 + pmaddwd m0, m9 pmaddwd m1, m8 pmaddwd m3, m8 %else @@ -296,7 +296,7 @@ CFHD_HORIZ_FILTER 4095 INIT_XMM sse2 %if ARCH_X86_64 -cglobal cfhd_vert_filter, 8, 11, 14, output, ostride, low, lwidth, high, hwidth, width, height, x, y, pos +cglobal cfhd_vert_filter, 8, 11, 13, output, ostride, low, lwidth, high, hwidth, width, height, x, y, pos shl ostrided, 1 shl lwidthd, 1 shl hwidthd, 1 @@ -305,10 +305,10 @@ cglobal cfhd_vert_filter, 8, 11, 14, output, ostride, low, lwidth, high, hwidth, dec heightd mova m8, [factor_p1_n1] - mova m10, [pw_1] - mova m11, [pd_4] - mova m12, [factor_p11_n4] - mova m13, [factor_p5_p4] + mova m9, [pw_1] + mova m10, [pd_4] + mova m11, [factor_p11_n4] + mova m12, [factor_p5_p4] %else cglobal cfhd_vert_filter, 7, 7, 8, output, x, low, y, high, pos, width, height shl xd, 1 @@ -344,8 +344,8 @@ cglobal cfhd_vert_filter, 7, 7, 8, output, x, low, y, high, pos, width, height punpckhwd m2, m1 %if ARCH_X86_64 - pmaddwd m0, m12 - pmaddwd m2, m12 + pmaddwd m0, m11 + pmaddwd m2, m11 %else pmaddwd m0, [factor_p11_n4] pmaddwd m2, [factor_p11_n4] @@ -398,8 +398,8 @@ cglobal cfhd_vert_filter, 7, 7, 8, output, x, low, y, high, pos, width, height punpckhwd m2, m1 %if ARCH_X86_64 - pmaddwd m0, m13 - pmaddwd m2, m13 + pmaddwd m0, m12 + pmaddwd m2, m12 %else pmaddwd m0, [factor_p5_p4] pmaddwd m2, [factor_p5_p4] @@ -466,10 +466,10 @@ cglobal cfhd_vert_filter, 7, 7, 8, output, x, low, y, high, pos, width, height pmaddwd m4, m8 pmaddwd m5, m8 - psubd m6, m11, m4 - psubd m7, m11, m5 - paddd m4, m11 - paddd m5, m11 + psubd m6, m10, m4 + psubd m7, m10, m5 + paddd m4, m10 + paddd m5, m10 %else mova m2, [pd_4] pmaddwd m4, [factor_p1_n1] @@ -502,8 +502,8 @@ cglobal cfhd_vert_filter, 7, 7, 8, output, x, low, y, high, pos, width, height mova m3, m2 %if ARCH_X86_64 - pmaddwd m0, m10 - pmaddwd m2, m10 + pmaddwd m0, m9 + pmaddwd m2, m9 pmaddwd m1, m8 pmaddwd m3, m8 %else @@ -550,8 +550,8 @@ cglobal cfhd_vert_filter, 7, 7, 8, output, x, low, y, high, pos, width, height punpckhwd m2, m1 %if ARCH_X86_64 - pmaddwd m0, m13 - pmaddwd m2, m13 + pmaddwd m0, m12 + pmaddwd m2, m12 %else pmaddwd m0, [factor_p5_p4] pmaddwd m2, [factor_p5_p4] @@ -571,8 +571,8 @@ cglobal cfhd_vert_filter, 7, 7, 8, output, x, low, y, high, pos, width, height psubd m2, m3 %if ARCH_X86_64 - paddd m0, m11 - paddd m2, m11 + paddd m0, m10 + paddd m2, m10 %else paddd m0, [pd_4] paddd m2, [pd_4] @@ -618,8 +618,8 @@ cglobal cfhd_vert_filter, 7, 7, 8, output, x, low, y, high, pos, width, height punpckhwd m2, m1 %if ARCH_X86_64 - pmaddwd m0, m12 - pmaddwd m2, m12 + pmaddwd m0, m11 + pmaddwd m2, m11 %else pmaddwd m0, [factor_p11_n4] pmaddwd m2, [factor_p11_n4] @@ -639,8 +639,8 @@ cglobal cfhd_vert_filter, 7, 7, 8, output, x, low, y, high, pos, width, height paddd m2, m3 %if ARCH_X86_64 - paddd m0, m11 - paddd m2, m11 + paddd m0, m10 + paddd m2, m10 %else paddd m0, [pd_4] paddd m2, [pd_4] _______________________________________________ ffmpeg-cvslog mailing list -- [email protected] To unsubscribe send an email to [email protected]
