[x265] [PATCH] asm: avx2 code for dst4x4 and idst4x4 for 10 bpp

sumalatha at multicorewareinc.com sumalatha at multicorewareinc.com
Tue Jun 2 09:06:00 CEST 2015


# HG changeset patch
# User Sumalatha Polureddy
# Date 1433228753 -19800
#      Tue Jun 02 12:35:53 2015 +0530
# Node ID 32a4d9008ddd1d7bdf1f5067d431800c7a0a94fb
# Parent  6a748b3eebd0aee64f821e9daff10b5ecc8a71f4
asm: avx2 code for dst4x4 and idst4x4 for 10 bpp

Testbench results (columns: primitive, speedup = C / asm, asm, C reference):

sse2
dst4x4          2.92x    455.01          1327.19
idst4x4         4.35x    533.15          2319.60

avx2
dst4x4          4.96x    275.16          1365.90
idst4x4         6.23x    349.51          2176.14

diff -r 6a748b3eebd0 -r 32a4d9008ddd source/common/x86/asm-primitives.cpp
--- a/source/common/x86/asm-primitives.cpp	Mon Jun 01 15:32:36 2015 +0530
+++ b/source/common/x86/asm-primitives.cpp	Tue Jun 02 12:35:53 2015 +0530
@@ -1360,6 +1360,8 @@
         p.quant = x265_quant_avx2;
         p.nquant = x265_nquant_avx2;
         p.dequant_normal  = x265_dequant_normal_avx2;
+        p.dst4x4 = x265_dst4_avx2;
+        p.idst4x4 = x265_idst4_avx2;
 
         p.scale1D_128to64 = x265_scale1D_128to64_avx2;
         p.scale2D_64to32 = x265_scale2D_64to32_avx2;


More information about the x265-devel mailing list