[x265] [PATCH] luma_hpp[4x4]: AVX2 asm code bug fix

Praveen Tiwari praveen at multicorewareinc.com
Thu Nov 20 07:23:25 CET 2014


# HG changeset patch
# User Praveen Tiwari
# Date 1416464378 -19800
# Node ID 3d1a17009bbe7ef3b4dae505fbfb3891e1019a66
# Parent  28a074cb1e02ca28697157f401a0cf8206043fe8
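luma_hpp[4x4]: AVX2 asm code bug fix

Define a local interp4_shuf shuffle table in ipfilter8.asm and use it for the
final row-ordering pshufb, replacing the external (cextern) idct4_shuf1 table.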

diff -r 28a074cb1e02 -r 3d1a17009bbe source/common/x86/ipfilter8.asm
--- a/source/common/x86/ipfilter8.asm	Thu Nov 20 11:29:29 2014 +0530
+++ b/source/common/x86/ipfilter8.asm	Thu Nov 20 11:49:38 2014 +0530
@@ -124,10 +124,10 @@
 
 tab_c_64_n64:   times 8 db 64, -64
 
+const interp4_shuf, times 2 db 0, 1, 8, 9, 4, 5, 12, 13, 2, 3, 10, 11, 6, 7, 14, 15
 
 SECTION .text
 
-cextern idct4_shuf1
 cextern pb_128
 cextern pw_1
 cextern pw_512
@@ -844,7 +844,7 @@
     pmulhrsw        m3, [pw_512]
     vextracti128    xm4, m3, 1
     packuswb        xm3, xm4                        ; BYTE [R3D R3C R2D R2C R1D R1C R0D R0C R3B R3A R2B R2A R1B R1A R0B R0A]
-    pshufb          xm3, [idct4_shuf1]              ; [row3 row1 row2 row0]
+    pshufb          xm3, [interp4_shuf]             ; [row3 row1 row2 row0]
 
     lea             r0, [r3 * 3]
     movd            [r2], xm3


More information about the x265-devel mailing list