[x265] [PATCH] asm: avx2 code for ssd_s[16x16] for 10 bpp (336 -> 221)
sumalatha at multicorewareinc.com
sumalatha at multicorewareinc.com
Fri May 22 07:09:35 CEST 2015
# HG changeset patch
# User Sumalatha Polureddy
# Date 1432271370 -19800
# Fri May 22 10:39:30 2015 +0530
# Node ID 2d8f8053ef1fd1daf5c175143d373c5ded6f17da
# Parent 234bc93bd51698801fad77cc861177ed019f5113
asm: avx2 code for ssd_s[16x16] for 10 bpp (336 -> 221)
Testbench results (columns: speedup over C, asm timing, C timing):
sse2:
ssd_s[16x16] 6.47x 336.95 2179.88
avx2:
ssd_s[16x16] 9.85x 221.43 2181.85
diff -r 234bc93bd516 -r 2d8f8053ef1f source/common/x86/asm-primitives.cpp
--- a/source/common/x86/asm-primitives.cpp Thu May 21 16:34:48 2015 +0530
+++ b/source/common/x86/asm-primitives.cpp Fri May 22 10:39:30 2015 +0530
@@ -1257,7 +1257,9 @@
p.pu[LUMA_16x32].satd = x265_pixel_satd_16x32_avx2;
p.pu[LUMA_16x64].satd = x265_pixel_satd_16x64_avx2;
+ p.cu[BLOCK_16x16].ssd_s = x265_pixel_ssd_s_16_avx2;
p.cu[BLOCK_32x32].ssd_s = x265_pixel_ssd_s_32_avx2;
+
p.cu[BLOCK_16x16].sse_ss = x265_pixel_ssd_ss_16x16_avx2;
p.cu[BLOCK_32x32].sse_ss = x265_pixel_ssd_ss_32x32_avx2;
p.cu[BLOCK_64x64].sse_ss = x265_pixel_ssd_ss_64x64_avx2;
More information about the x265-devel mailing list