>+;----------------------------------------------------------------------------- >+; void blockcopy_ps_%1x%2(int16_t *dest, intptr_t destStride, pixel *src, >intptr_t srcStride); >+;----------------------------------------------------------------------------- >+%macro BLOCKCOPY_PS_W24_H2 2 >+INIT_XMM sse4 >+cglobal blockcopy_ps_%1x%2, 4, 5, 3, dest, destStride, src, srcStride >+ >+add r1, r1 >+mov r4d, %2/2 >+pxor m0, m0 >+ >+.loop >+ movu m1, [r2] >+ pmovzxbw m2, m1 >+ movu [r0], m2 >+ punpckhbw m1, m0 >+ movu [r0 + 16], m1 >+ >+ movu m1, [r2 + 16] movh >+ pmovzxbw m1, m1 >+ movu [r0 + 32], m1
_______________________________________________ x265-devel mailing list [email protected] https://mailman.videolan.org/listinfo/x265-devel
