[x265] [PATCH Review only] asm: pixel_sub_ps routine for 4x4 block size
chen
chenm003 at 163.com
Thu Nov 7 17:19:25 CET 2013
>+movd m0, [r2]
>+movd m1, [r3]
>+pmovzxbw m2, m0
>+pmovzxbw m3, m1
>+
>+movd m0, [r2 + r4]
>+movd m1, [r3 + r5]
>+pmovzxbw m4, m0
>+pmovzxbw m5, m1
>+
>+movd m0, [r2 + 2 * r4]
>+movd m1, [r3 + 2 * r5]
>+pmovzxbw m6, m0
>+pmovzxbw m7, m1
>+
>+psubw m2, m3
>+psubw m4, m5
>+psubw m6, m7
>+
>+lea r2, [r2 + 2 * r4]
>+lea r3, [r3 + 2 * r5]
>+
>+movd m0, [r2 + r4]
>+movd m1, [r3 + r5]
>+pmovzxbw m3, m0
>+pmovzxbw m5, m1
>+
>+psubw m3, m5
>+
>+movh [r0], m2
>+movh [r0 + r1], m4
>+movh [r0 + 2 * r1], m6
>+
>+lea r0, [r0 + 2 * r1]
>+
>+movh [r0 + r1], m3
>+
>+RET
An un-debugged example that packs two rows into one register before widening and subtracting:
; Sketch: compute two rows of (src0 - src1) with one widen and one subtract
; by packing both rows into a single register first.
; NOTE(review): assumes x86inc-style names where m0..m3 are XMM registers,
; r2/r3 are the two source pointers, r4/r5 their strides, r0 the destination
; and r1 the destination stride in bytes -- confirm against the function
; prologue, which is not part of this snippet.
; NOTE(review): only two rows are produced here; a 4x4 block would presumably
; need the sequence repeated for the remaining two rows.
movd m0, [r2]                   ; 4 bytes from [r2]
movd m1, [r3]                   ; 4 bytes from [r3]
movd m2, [r2 + r4]              ; 4 bytes from the next row of the first source
movd m3, [r3 + r5]              ; 4 bytes from the next row of the second source
punpckldq m0, m2                ; low 8 bytes of m0 = first row | second row
punpckldq m1, m3                ; same packing for the second source
pmovzxbw m0, m0                 ; zero-extend the 8 packed bytes to 8 words
pmovzxbw m1, m1
psubw m0, m1                    ; word-wise difference for both rows at once
movlps [r0], m0                 ; low 64 bits = 4 words of the first row
movhps [r0 + r1], m0            ; high 64 bits = 4 words of the second row
-------------- next part --------------
An HTML attachment was scrubbed...
URL: <http://mailman.videolan.org/pipermail/x265-devel/attachments/20131108/8b815bcf/attachment-0001.html>
More information about the x265-devel
mailing list