[x265] [PATCH 1 of 3] asm: routines for chroma vsp filter functions for all block sizes

chen chenm003 at 163.com
Tue Nov 12 12:35:05 CET 2013


>+;-------------------------------------------------------------------------------------------------------------------
>+; void interp_4tap_vertical_sp_%1x%2(int16_t *src, intptr_t srcStride, pixel *dst, intptr_t dstStride, int coeffIdx)
>+;-------------------------------------------------------------------------------------------------------------------
>+%macro FILTER_VER_CHROMA_SP_W2_4R 2
>+INIT_XMM ssse3
>+cglobal interp_4tap_vert_sp_%1x%2, 5, 7, 6
>+
>+    add       r1d, r1d
>+    sub       r0, r1
>+    shl       r4d, 5
>+
>+%ifdef PIC
>+    lea       r5, [tab_ChromaCoeffV]
>+    lea       r6, [r5 + r4]
>+%else
>+    lea       r6, [tab_ChromaCoeffV + r4]
>+%endif
>+
>+    mova      m5, [tab_c_526336]
>+
>+    mov       r4d, (%2/4)
>+
>+.loopH
>+    PROCESS_CHROMA_SP_W2_4R
>+
>+    paddd     m0, m5
>+    paddd     m2, m5
>+
>+    psrad     m0, 12
>+    psrad     m2, 12
>+
>+    packssdw  m0, m2
>+    packuswb  m0, m0
>+
>+    pextrw    [r2], m0, 0
SSE4.1 instruction
 
>+    pextrw    [r2 + r3], m0, 1
>+    pextrw    [r2 + 2 * r3], m0, 2
>+    lea       r2, [r2 + 2 * r3]
>+    pextrw    [r2 + r3], m0, 3
-------------- next part --------------
An HTML attachment was scrubbed...
URL: <http://mailman.videolan.org/pipermail/x265-devel/attachments/20131112/662105b0/attachment.html>


More information about the x265-devel mailing list