[x265] [PATCH] asm: avx code for chroma i420 sa8d modules for 10 bpp

sumalatha at multicorewareinc.com sumalatha at multicorewareinc.com
Thu May 28 10:41:50 CEST 2015


# HG changeset patch
# User Sumalatha Polureddy
# Date 1432802505 -19800
#      Thu May 28 14:11:45 2015 +0530
# Node ID 4eead96be39e69b57f76796d76e77c6e937562e1
# Parent  9de31f8c784bdc871334f55d75f3ab73a034cc4d
asm: avx code for chroma i420 sa8d modules for 10 bpp

avx (columns: speedup over baseline, avx timing, C reference timing):
[i420] sa8d[  8x8]  5.19x    546.76          2838.15
[i420] sa8d[16x16]  5.38x    2094.43         11273.74
[i420] sa8d[32x32]  5.47x    8107.91         44385.75

diff -r 9de31f8c784b -r 4eead96be39e source/common/x86/asm-primitives.cpp
--- a/source/common/x86/asm-primitives.cpp	Thu May 28 12:23:30 2015 +0530
+++ b/source/common/x86/asm-primitives.cpp	Thu May 28 14:11:45 2015 +0530
@@ -1088,6 +1088,9 @@
         p.chroma[X265_CSP_I420].pu[CHROMA_420_4x16].satd = x265_pixel_satd_4x16_avx;
         p.chroma[X265_CSP_I420].pu[CHROMA_420_4x8].satd = x265_pixel_satd_4x8_avx;
         ASSIGN_SA8D(avx);
+        p.chroma[X265_CSP_I420].cu[BLOCK_420_8x8].sa8d = x265_pixel_sa8d_8x8_avx;
+        p.chroma[X265_CSP_I420].cu[BLOCK_420_16x16].sa8d = x265_pixel_sa8d_16x16_avx;
+        p.chroma[X265_CSP_I420].cu[BLOCK_420_32x32].sa8d = x265_pixel_sa8d_32x32_avx;
         LUMA_VAR(avx);
         p.ssim_4x4x2_core = x265_pixel_ssim_4x4x2_core_avx;
         p.ssim_end_4 = x265_pixel_ssim_end4_avx;


More information about the x265-devel mailing list