[x265] [PATCH 1 of 5] asm: avx2 code for sse_pp[32x32] and sse_pp[64x64] for 8 bpp

sumalatha at multicorewareinc.com sumalatha at multicorewareinc.com
Wed Mar 25 06:35:45 CET 2015


# HG changeset patch
# User Sumalatha Polureddy
# Date 1427260761 -19800
#      Wed Mar 25 10:49:21 2015 +0530
# Node ID 49d9c978601618ab2588b2a6f11eeeb59fb57450
# Parent  e637273e2ae6391d43a037d9a4298a8be8e178ad
asm: avx2 code for sse_pp[32x32] and sse_pp[64x64] for 8 bpp

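Benchmark results (columns: primitive, speedup over C, optimized time, C reference time;
speedup = C reference time / optimized time, timings in the test bench's own units)

sse3
sse_pp[32x32]  6.39x    2497.86         15957.98
sse_pp[64x64]  5.01x    12520.95        62749.02

avx2
sse_pp[32x32]  13.02x   1246.36         16225.92
sse_pp[64x64]  11.79x   5189.50         61170.29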

diff -r e637273e2ae6 -r 49d9c9786016 source/common/x86/asm-primitives.cpp
--- a/source/common/x86/asm-primitives.cpp	Tue Mar 24 15:31:05 2015 -0500
+++ b/source/common/x86/asm-primitives.cpp	Wed Mar 25 10:49:21 2015 +0530
@@ -1534,6 +1534,8 @@
         p.pu[LUMA_16x32].sad_x4 = x265_pixel_sad_x4_16x32_avx2;
 
         p.cu[BLOCK_16x16].sse_pp = x265_pixel_ssd_16x16_avx2;
+        p.cu[BLOCK_32x32].sse_pp = x265_pixel_ssd_32x32_avx2;
+        p.cu[BLOCK_64x64].sse_pp = x265_pixel_ssd_64x64_avx2;
 
         p.cu[BLOCK_16x16].ssd_s = x265_pixel_ssd_s_16_avx2;
         p.cu[BLOCK_32x32].ssd_s = x265_pixel_ssd_s_32_avx2;
diff -r e637273e2ae6 -r 49d9c9786016 source/common/x86/ssd-a.asm
--- a/source/common/x86/ssd-a.asm	Tue Mar 24 15:31:05 2015 -0500
+++ b/source/common/x86/ssd-a.asm	Wed Mar 25 10:49:21 2015 +0530
@@ -1094,6 +1094,8 @@
 INIT_YMM avx2
 SSD 16, 16
 SSD 16,  8
+SSD 32, 32
+SSD 64, 64
 %assign function_align 16
 %endif ; !HIGH_BIT_DEPTH
 


More information about the x265-devel mailing list