[x265] [PATCH] asm: avx2 code for sse_ss[64x64] for 10 bpp (7039 -> 4051)

Sumalatha Polureddy sumalatha at multicorewareinc.com
Thu May 21 08:35:05 CEST 2015


# HG changeset patch
# User Sumalatha Polureddy
# Date 1432190086 -19800
#      Thu May 21 12:04:46 2015 +0530
# Node ID 71c725248f29738c332973bde23ecb9cd1aaa805
# Parent  184d645ee5f097dfb94d139cd23c3f1e3feddec1
asm: avx2 code for sse_ss[64x64] for 10 bpp (7039 -> 4051)

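Benchmark results (columns: speedup = baseline / optimized, optimized
primitive cost, baseline cost):

sse2:
sse_ss[64x64]  4.63x    7039.23         32592.51

avx2:
sse_ss[64x64]  8.58x    4051.57         34751.46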

diff -r 184d645ee5f0 -r 71c725248f29 source/common/x86/asm-primitives.cpp
--- a/source/common/x86/asm-primitives.cpp	Thu May 21 11:58:50 2015 +0530
+++ b/source/common/x86/asm-primitives.cpp	Thu May 21 12:04:46 2015 +0530
@@ -1260,6 +1260,7 @@
         p.cu[BLOCK_32x32].ssd_s = x265_pixel_ssd_s_32_avx2;
         p.cu[BLOCK_16x16].sse_ss = x265_pixel_ssd_ss_16x16_avx2;
         p.cu[BLOCK_32x32].sse_ss = x265_pixel_ssd_ss_32x32_avx2;
+        p.cu[BLOCK_64x64].sse_ss = x265_pixel_ssd_ss_64x64_avx2;
 
         p.quant = x265_quant_avx2;
         p.nquant = x265_nquant_avx2;
diff -r 184d645ee5f0 -r 71c725248f29 source/common/x86/ssd-a.asm
--- a/source/common/x86/ssd-a.asm	Thu May 21 11:58:50 2015 +0530
+++ b/source/common/x86/ssd-a.asm	Thu May 21 12:04:46 2015 +0530
@@ -348,6 +348,7 @@
 SSD_ONE    16,  8
 SSD_ONE    16, 16
 SSD_ONE    32, 32
+SSD_ONE    64, 64
 %endif ; HIGH_BIT_DEPTH
 
 ;-----------------------------------------------------------------------------


More information about the x265-devel mailing list