[x265] [PATCH Review only] asm: pixel_sub_ps routine for 4x2 block size
chen
chenm003 at 163.com
Thu Nov 7 17:02:47 CET 2013
>+;-----------------------------------------------------------------------------
>+; void pixel_sub_ps_c_4x2(int16_t *dest, intptr_t destride, pixel *src0, pixel *src1, intptr_t srcstride0, intptr_t srcstride1);
>+;-----------------------------------------------------------------------------
This function can be defined in pixel-a.asm.
>+INIT_XMM sse2
pmovzxbw is an SSE4.1 instruction, so it cannot be used in a function declared with INIT_XMM sse2.
>+cglobal pixel_sub_ps_4x2, 4, 6, 6, dest, deststride, src0, src1
>+
>+add r1, r1
>+mov r4d, r4m
>+mov r5d, r5m
r4 and r5 are defined as intptr_t, so they do not need to be converted to dword.
>+movd m0, [r2]
>+movd m1, [r3]
>+pmovzxbw m2, m0
>+pmovzxbw m3, m1
Suggestion: zero-extend in place instead of using extra registers, e.g. pmovzxbw m0, m0
>+movd m0, [r2 + r4]
>+movd m1, [r3 + r5]
>+pmovzxbw m4, m0
>+pmovzxbw m5, m1
>+
>+psubw m4, m5
>+psubw m2, m3
>+
>+movh [r0], m2
>+movh [r0 + r1], m4
>+
>+RET
-------------- next part --------------
An HTML attachment was scrubbed...
URL: <http://mailman.videolan.org/pipermail/x265-devel/attachments/20131108/6f5ced3c/attachment.html>
More information about the x265-devel
mailing list