[x265] [PATCH] luma_hpp[4x4]: AVX2 asm code bug fix
praveen at multicorewareinc.com
praveen at multicorewareinc.com
Thu Nov 20 07:23:25 CET 2014
# HG changeset patch
# User Praveen Tiwari
# Date 1416464378 -19800
# Node ID 3d1a17009bbe7ef3b4dae505fbfb3891e1019a66
# Parent 28a074cb1e02ca28697157f401a0cf8206043fe8
luma_hpp[4x4]: AVX2 asm code bug fix (use a locally defined interp4_shuf shuffle table instead of the external idct4_shuf1)
diff -r 28a074cb1e02 -r 3d1a17009bbe source/common/x86/ipfilter8.asm
--- a/source/common/x86/ipfilter8.asm Thu Nov 20 11:29:29 2014 +0530
+++ b/source/common/x86/ipfilter8.asm Thu Nov 20 11:49:38 2014 +0530
@@ -124,10 +124,10 @@
tab_c_64_n64: times 8 db 64, -64
+const interp4_shuf, times 2 db 0, 1, 8, 9, 4, 5, 12, 13, 2, 3, 10, 11, 6, 7, 14, 15
SECTION .text
-cextern idct4_shuf1
cextern pb_128
cextern pw_1
cextern pw_512
@@ -844,7 +844,7 @@
pmulhrsw m3, [pw_512]
vextracti128 xm4, m3, 1
packuswb xm3, xm4 ; BYTE [R3D R3C R2D R2C R1D R1C R0D R0C R3B R3A R2B R2A R1B R1A R0B R0A]
- pshufb xm3, [idct4_shuf1] ; [row3 row1 row2 row0]
+ pshufb xm3, [interp4_shuf] ; [row3 row1 row2 row0]
lea r0, [r3 * 3]
movd [r2], xm3
More information about the x265-devel mailing list