right
At 2014-01-29 21:16:56, [email protected] wrote:
># HG changeset patch
># User Yuvaraj Venkatesh <[email protected]>
># Date 1391001289 -19800
># Wed Jan 29 18:44:49 2014 +0530
># Branch stable
># Node ID 86743912a5b0459645e5aeccd1c35313e3f0af58
># Parent d6091cb46ae1afeeec40d247d5d5247f26e3372c
>asm: fix for 32-bit build satd overflow issue.
>
>diff -r d6091cb46ae1 -r 86743912a5b0 source/common/x86/pixel-a.asm
>--- a/source/common/x86/pixel-a.asm Wed Jan 29 12:05:06 2014 +0530
>+++ b/source/common/x86/pixel-a.asm Wed Jan 29 18:44:49 2014 +0530
>@@ -626,23 +626,17 @@
> movd eax, m7
> RET
>
>-cglobal pixel_satd_8x8_internal
>- LOAD_SUMSUB_8x4P 0, 1, 2, 3, 4, 5, 7, r0, r2, 1, 0
>- SATD_8x4_SSE vertical, 0, 1, 2, 3, 4, 5, 6
>-%%pixel_satd_8x4_internal:
>- LOAD_SUMSUB_8x4P 0, 1, 2, 3, 4, 5, 7, r0, r2, 1, 0
>- SATD_8x4_SSE vertical, 0, 1, 2, 3, 4, 5, 6
>- ret
>-
> cglobal pixel_satd_8x8_internal2
> %if WIN64
> LOAD_SUMSUB_8x4P 0, 1, 2, 3, 4, 5, 7, r0, r2, 1, 0
> SATD_8x4_1_SSE vertical, 0, 1, 2, 3, 4, 5, 6, 12, 13
>+%%pixel_satd_8x4_internal2:
> LOAD_SUMSUB_8x4P 0, 1, 2, 3, 4, 5, 7, r0, r2, 1, 0
> SATD_8x4_1_SSE vertical, 0, 1, 2, 3, 4, 5, 6, 12, 13
> %else
> LOAD_SUMSUB_8x4P 0, 1, 2, 3, 4, 5, 7, r0, r2, 1, 0
> SATD_8x4_1_SSE vertical, 0, 1, 2, 3, 4, 5, 6, 4, 5
>+%%pixel_satd_8x4_internal2:
> LOAD_SUMSUB_8x4P 0, 1, 2, 3, 4, 5, 7, r0, r2, 1, 0
> SATD_8x4_1_SSE vertical, 0, 1, 2, 3, 4, 5, 6, 4, 5
> %endif
>@@ -652,15 +646,6 @@
> ; These aren't any faster on AVX systems with fast movddup (Bulldozer, Sandy Bridge)
> %if HIGH_BIT_DEPTH == 0 && (WIN64 || UNIX64) && notcpuflag(avx)
>
>-cglobal pixel_satd_16x4_internal
>- LOAD_SUMSUB_16x4P 0, 1, 2, 3, 4, 8, 5, 9, 6, 7, r0, r2, 11
>- lea r2, [r2+4*r3]
>- lea r0, [r0+4*r1]
>- ; always use horizontal mode here
>- SATD_8x4_SSE 0, 0, 1, 2, 3, 6, 11, 10
>- SATD_8x4_SSE 0, 4, 8, 5, 9, 6, 3, 10
>- ret
>-
_______________________________________________ x265-devel mailing list [email protected] https://mailman.videolan.org/listinfo/x265-devel
