[x265] [PATCH] blockcopy_pp_8x6: optimize register uses
chen
chenm003 at 163.com
Tue Feb 3 12:51:50 CET 2015
Right.
At 2015-02-03 19:45:04,praveen at multicorewareinc.com wrote:
># HG changeset patch
># User Praveen Tiwari
># Date 1422963895 -19800
># Node ID bfc9a2d99e20568cb43d9fba0133735009793b00
># Parent d212ce9fa3705b9e7d4d23f14412bd28fe3bbfde
>blockcopy_pp_8x6: optimize register uses
>
>diff -r d212ce9fa370 -r bfc9a2d99e20 source/common/x86/blockcopy8.asm
>--- a/source/common/x86/blockcopy8.asm Tue Feb 03 14:30:42 2015 +0530
>+++ b/source/common/x86/blockcopy8.asm Tue Feb 03 17:14:55 2015 +0530
>@@ -327,24 +327,24 @@
> ; void blockcopy_pp_8x6(pixel* dst, intptr_t dstStride, const pixel* src, intptr_t srcStride)
> ;-----------------------------------------------------------------------------
> INIT_XMM sse2
>-cglobal blockcopy_pp_8x6, 4, 7, 6
>+cglobal blockcopy_pp_8x6, 4, 4, 6
> movh m0, [r2]
> movh m1, [r2 + r3]
>- movh m2, [r2 + 2 * r3]
>- lea r5, [r2 + 2 * r3]
>- movh m3, [r5 + r3]
>- movh m4, [r5 + 2 * r3]
>- lea r5, [r5 + 2 * r3]
>- movh m5, [r5 + r3]
>-
>- movh [r0], m0
>- movh [r0 + r1], m1
>- movh [r0 + 2 * r1], m2
>- lea r6, [r0 + 2 * r1]
>- movh [r6 + r1], m3
>- movh [r6 + 2 * r1], m4
>- lea r6, [r6 + 2 * r1]
>- movh [r6 + r1], m5
>+ lea r2, [r2 + 2 * r3]
>+ movh m2, [r2]
>+ movh m3, [r2 + r3]
>+ lea r2, [r2 + 2 * r3]
>+ movh m4, [r2]
>+ movh m5, [r2 + r3]
>+
>+ movh [r0], m0
>+ movh [r0 + r1], m1
>+ lea r0, [r0 + 2 * r1]
>+ movh [r0], m2
>+ movh [r0 + r1], m3
>+ lea r0, [r0 + 2 * r1]
>+ movh [r0], m4
>+ movh [r0 + r1], m5
> RET
>
> ;-----------------------------------------------------------------------------
>_______________________________________________
>x265-devel mailing list
>x265-devel at videolan.org
>https://mailman.videolan.org/listinfo/x265-devel
-------------- next part --------------
An HTML attachment was scrubbed...
URL: <http://mailman.videolan.org/pipermail/x265-devel/attachments/20150203/a08aec38/attachment.html>
More information about the x265-devel mailing list