[x265] [PATCH] asm: avx2 code for chroma sse_pp[16x32, 32x64] for i422

Sumalatha Polureddy <sumalatha at multicorewareinc.com>
Fri Jun 5 07:33:16 CEST 2015


# HG changeset patch
# User Sumalatha Polureddy
# Date 1433482390 -19800
#      Fri Jun 05 11:03:10 2015 +0530
# Node ID bf9ddfe13ca034c59e20989765af647bf2f304d7
# Parent  62adf0ef875f9c310250bada6f9a699c9f8ff758
asm: avx2 code for chroma sse_pp[16x32, 32x64] for i422

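Performance (columns: primitive, speedup over C, optimized time, C reference
time; speedup = C time / optimized time; times presumably in cycles):

sse2
[i422] sse_pp[16x32]  5.29x    1030.36         5446.27
[i422] sse_pp[32x64]  4.40x    4091.52         17994.55
avx2
[i422] sse_pp[16x32]  9.07x    599.30          5436.95
[i422] sse_pp[32x64]  9.07x    2009.39         18226.27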

diff -r 62adf0ef875f -r bf9ddfe13ca0 source/common/x86/asm-primitives.cpp
--- a/source/common/x86/asm-primitives.cpp	Thu Jun 04 15:25:47 2015 +0530
+++ b/source/common/x86/asm-primitives.cpp	Fri Jun 05 11:03:10 2015 +0530
@@ -1364,6 +1364,8 @@
         p.cu[BLOCK_64x64].sse_pp = x265_pixel_ssd_64x64_avx2;
         p.chroma[X265_CSP_I420].cu[BLOCK_420_16x16].sse_pp = x265_pixel_ssd_16x16_avx2;
         p.chroma[X265_CSP_I420].cu[BLOCK_420_32x32].sse_pp = x265_pixel_ssd_32x32_avx2;
+        p.chroma[X265_CSP_I422].cu[BLOCK_422_16x32].sse_pp = (pixelcmp_t)x265_pixel_ssd_ss_16x32_avx2;
+        p.chroma[X265_CSP_I422].cu[BLOCK_422_32x64].sse_pp = (pixelcmp_t)x265_pixel_ssd_ss_32x64_avx2;
 
         p.quant = x265_quant_avx2;
         p.nquant = x265_nquant_avx2;
diff -r 62adf0ef875f -r bf9ddfe13ca0 source/common/x86/ssd-a.asm
--- a/source/common/x86/ssd-a.asm	Thu Jun 04 15:25:47 2015 +0530
+++ b/source/common/x86/ssd-a.asm	Fri Jun 05 11:03:10 2015 +0530
@@ -467,6 +467,8 @@
 SSD_ONE    16, 16
 SSD_ONE    32, 32
 SSD_ONE    64, 64
+SSD_ONE    16, 32
+SSD_ONE    32, 64
 %endif ; HIGH_BIT_DEPTH
 
 ;-----------------------------------------------------------------------------


More information about the x265-devel mailing list