[x265] [PATCH Review only] asm: pixelsub_ps routine for 12x16 blocks
chen
chenm003 at 163.com
Fri Nov 8 12:37:45 CET 2013
>+;-----------------------------------------------------------------------------
>+; void pixel_sub_ps_c_%1x%2(pixel *dest, intptr_t deststride, pixel *src0, pixel *src1, intptr_t srcstride0, intptr_t srcstride1);
>+;-----------------------------------------------------------------------------
>+%macro PIXELSUB_PS_W12_H4 2
>+INIT_XMM sse4
>+cglobal pixel_sub_ps_%1x%2, 6, 7, 8, dest, deststride, src0, src1, srcstride0, srcstride1
>+
>+add r1, r1
>+mov r6d, %2/4
>+
>+.loop
>+
>+ movh m0, [r2]
>+ movd m1, [r2 + 8]
>+ movh m2, [r3]
>+ movd m3, [r3 + 8]
>+
>+ movh m4, [r2 + r4]
>+ movd m5, [r2 + r4 + 8]
>+ movh m6, [r3 + r5]
>+ movd m7, [r3 + r5 + 8]
>+
>+ punpckldq m1, m5
>+ punpckldq m3, m7
>+ pmovzxbw m0, m0
>+ pmovzxbw m1, m1
>+ pmovzxbw m2, m2
>+ pmovzxbw m3, m3
>+ pmovzxbw m4, m4
>+ pmovzxbw m6, m6
movu m0, [r2]
movu m1, [r3]
movu m2, [r2 + r4]
movu m3, [r3 + r5]
mova m4, m0
mova m5, m1
punpckhdq m4, m2
punpckhdq m5, m3
pmovzxbw m0, m0
pmovzxbw m1, m1
pmovzxbw m2, m2
pmovzxbw m3, m3
-------------- next part --------------
An HTML attachment was scrubbed...
URL: <http://mailman.videolan.org/pipermail/x265-devel/attachments/20131108/9e829f97/attachment-0001.html>
More information about the x265-devel mailing list