# HG changeset patch
# User Praveen Tiwari
# Date 1383908145 -19800
# Node ID ca406614f803412b3a8bd6e2eac1774e6d9615fc
# Parent eee937070b03167e1f2055620b641957c47a0a5c
blockcopy_sp_8x2, optimized asm code
diff -r eee937070b03 -r ca406614f803 source/common/x86/blockcopy8.asm
--- a/source/common/x86/blockcopy8.asm Fri Nov 08 15:34:19 2013 +0530
+++ b/source/common/x86/blockcopy8.asm Fri Nov 08 16:25:45 2013 +0530
@@ -1100,20 +1100,17 @@
 ; void blockcopy_sp_8x2(pixel *dest, intptr_t destStride, int16_t *src, intptr_t srcStride)
 ;-----------------------------------------------------------------------------
 INIT_XMM sse2
-cglobal blockcopy_sp_8x2, 4, 4, 3, dest, destStride, src, srcStride
+cglobal blockcopy_sp_8x2, 4, 4, 2, dest, destStride, src, srcStride
 
-add r3, r3
+add r3, r3
 
-mova m0, [tab_Vm]
+movu m0, [r2]
+movu m1, [r2 + r3]
 
-movu m1, [r2]
-movu m2, [r2 + r3]
+packuswb m0, m1
 
-pshufb m1, m0
-pshufb m2, m0
-
-movh [r0], m1
-movh [r0 + r1], m2
+movh [r0], m0
+movhps [r0 + r1], m0
 
 RET
 
_______________________________________________
x265-devel mailing list
[email protected]
https://mailman.videolan.org/listinfo/x265-devel
