[x265] [PATCH] asm: avx2 code for addavg[32x16][32x48] for 10 bpp

sumalatha at multicorewareinc.com sumalatha at multicorewareinc.com
Tue May 26 10:16:45 CEST 2015


# HG changeset patch
# User Sumalatha Polureddy
# Date 1432628199 -19800
#      Tue May 26 13:46:39 2015 +0530
# Node ID d38860fea2c8625c8e4faf4dff4812b5672642ff
# Parent  4af40cfbfc2af9ce02d78e18df356a288bc3102d
asm: avx2 code for addavg[32x16][32x48] for 10 bpp

sse4:
[i422]  addAvg[32x16]  9.44x    2016.35         19044.10
[i422]  addAvg[32x48]  9.13x    5912.24         54003.47

avx2:
[i422]  addAvg[32x16]  18.13x   1060.93         19239.48
[i422]  addAvg[32x48]  18.32x   3028.78         55485.82

diff -r 4af40cfbfc2a -r d38860fea2c8 source/common/x86/asm-primitives.cpp
--- a/source/common/x86/asm-primitives.cpp	Tue May 26 10:33:56 2015 +0530
+++ b/source/common/x86/asm-primitives.cpp	Tue May 26 13:46:39 2015 +0530
@@ -1251,6 +1251,8 @@
         p.chroma[X265_CSP_I422].pu[CHROMA_422_8x64].addAvg = x265_addAvg_8x64_avx2;
         p.chroma[X265_CSP_I422].pu[CHROMA_422_24x64].addAvg = x265_addAvg_24x64_avx2;
         p.chroma[X265_CSP_I422].pu[CHROMA_422_12x32].addAvg = x265_addAvg_12x32_avx2;
+        p.chroma[X265_CSP_I422].pu[CHROMA_422_32x16].addAvg = x265_addAvg_32x16_avx2;
+        p.chroma[X265_CSP_I422].pu[CHROMA_422_32x48].addAvg = x265_addAvg_32x48_avx2;
 
         p.cu[BLOCK_4x4].psy_cost_ss = x265_psyCost_ss_4x4_avx2;
         p.cu[BLOCK_8x8].psy_cost_ss = x265_psyCost_ss_8x8_avx2;


More information about the x265-devel mailing list