[x265] [PATCH] asm code for blockcopy_ps_24x32
chen
chenm003 at 163.com
Mon Nov 11 14:24:13 CET 2013
>+;-----------------------------------------------------------------------------
>+; void blockcopy_ps_%1x%2(int16_t *dest, intptr_t destStride, pixel *src, intptr_t srcStride);
>+;-----------------------------------------------------------------------------
>+%macro BLOCKCOPY_PS_W24_H2 2
>+INIT_XMM sse4
>+cglobal blockcopy_ps_%1x%2, 4, 5, 3, dest, destStride, src, srcStride
>+
>+add r1, r1
>+mov r4d, %2/2
>+pxor m0, m0
>+
>+.loop
>+ movu m1, [r2]
>+ pmovzxbw m2, m1
>+ movu [r0], m2
>+ punpckhbw m1, m0
>+ movu [r0 + 16], m1
>+
>+ movu m1, [r2 + 16]
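Use movh here instead of movu: only the low 8 bytes (pixels 16-23 of the 24-wide row) are consumed by the following pmovzxbw, so a 16-byte load reads 8 bytes more than needed.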
>+ pmovzxbw m1, m1
>+ movu [r0 + 32], m1
-------------- next part --------------
An HTML attachment was scrubbed...
URL: <http://mailman.videolan.org/pipermail/x265-devel/attachments/20131111/aac3a3da/attachment.html>
More information about the x265-devel mailing list