[x265] [PATCH] asm: avx2 code for satd for all chroma i422 for 10 bpp

sumalatha at multicorewareinc.com sumalatha at multicorewareinc.com
Mon May 25 08:17:49 CEST 2015


# HG changeset patch
# User Sumalatha Polureddy
# Date 1432534660 -19800
#      Mon May 25 11:47:40 2015 +0530
# Node ID 9934ac4ab4572583b1c47ea3e07f3e0968c4a903
# Parent  a7bf7a150a705489cb63d0454c59ec599bad8c93
asm: avx2 code for satd for all chroma i422 for 10 bpp

avx2 (columns: speedup, optimized cost, reference cost; speedup = reference / optimized):
[i422] satd[  4x8]  5.32x    290.14          1542.77
[i422] satd[  4x4]  4.32x    179.90          777.19
[i422] satd[ 8x16]  4.44x    990.86          4402.91
[i422] satd[  8x8]  5.03x    480.01          2415.82
[i422] satd[ 4x16]  5.20x    547.30          2845.97
[i422] satd[  8x4]  4.00x    310.37          1240.04
[i422] satd[ 8x12]  5.16x    820.36          4229.93
[i422] satd[16x32]  9.39x    1994.98         18729.04
[i422] satd[16x16]  9.16x    1021.66         9358.59
[i422] satd[ 8x32]  4.53x    2024.80         9175.30
[i422] satd[ 16x8]  8.93x    530.12          4735.74
[i422] satd[16x24]  4.89x    2921.85         14279.47
[i422] satd[ 4x32]  4.67x    1213.40         5662.05
[i422] satd[12x32]  4.82x    3632.33         17507.59
[i422] satd[32x64]  9.62x    7672.94         73822.49
[i422] satd[32x32]  10.75x   3891.23         41826.38
[i422] satd[16x64]  9.66x    3821.15         36931.40
[i422] satd[32x16]  8.97x    1932.95         17338.38
[i422] satd[32x48]  4.72x    11329.97        53510.81
[i422] satd[ 8x64]  4.45x    3972.60         17696.34
[i422] satd[24x64]  5.06x    11323.39        57300.73

diff -r a7bf7a150a70 -r 9934ac4ab457 source/common/x86/asm-primitives.cpp
--- a/source/common/x86/asm-primitives.cpp	Fri May 22 14:29:35 2015 +0530
+++ b/source/common/x86/asm-primitives.cpp	Mon May 25 11:47:40 2015 +0530
@@ -1070,6 +1070,13 @@
         p.chroma[X265_CSP_I422].pu[CHROMA_422_8x12].satd = x265_pixel_satd_8x12_avx;
         p.chroma[X265_CSP_I422].pu[CHROMA_422_12x32].satd = x265_pixel_satd_12x32_avx;
         p.chroma[X265_CSP_I422].pu[CHROMA_422_4x32].satd = x265_pixel_satd_4x32_avx;
+        p.chroma[X265_CSP_I422].pu[CHROMA_422_4x8].satd = x265_pixel_satd_4x8_avx;
+        p.chroma[X265_CSP_I422].pu[CHROMA_422_8x16].satd = x265_pixel_satd_8x16_avx;
+        p.chroma[X265_CSP_I422].pu[CHROMA_422_4x4].satd = x265_pixel_satd_4x4_avx;
+        p.chroma[X265_CSP_I422].pu[CHROMA_422_8x8].satd = x265_pixel_satd_8x8_avx;
+        p.chroma[X265_CSP_I422].pu[CHROMA_422_4x16].satd = x265_pixel_satd_4x16_avx;
+        p.chroma[X265_CSP_I422].pu[CHROMA_422_8x32].satd = x265_pixel_satd_8x32_avx;
+        p.chroma[X265_CSP_I422].pu[CHROMA_422_8x4].satd = x265_pixel_satd_8x4_avx;
 
         ALL_LUMA_PU(satd, pixel_satd, avx);
         p.chroma[X265_CSP_I420].pu[CHROMA_420_8x8].satd = x265_pixel_satd_8x8_avx;
@@ -1273,6 +1280,13 @@
         p.chroma[X265_CSP_I420].pu[CHROMA_420_32x16].satd = x265_pixel_satd_32x16_avx2;
         p.chroma[X265_CSP_I420].pu[CHROMA_420_32x24].satd = x265_pixel_satd_32x24_avx2;
         p.chroma[X265_CSP_I420].pu[CHROMA_420_32x8].satd = x265_pixel_satd_32x8_avx2;
+        p.chroma[X265_CSP_I422].pu[CHROMA_422_16x32].satd = x265_pixel_satd_16x32_avx2;
+        p.chroma[X265_CSP_I422].pu[CHROMA_422_32x64].satd = x265_pixel_satd_32x64_avx2;
+        p.chroma[X265_CSP_I422].pu[CHROMA_422_16x16].satd = x265_pixel_satd_16x16_avx2;
+        p.chroma[X265_CSP_I422].pu[CHROMA_422_32x32].satd = x265_pixel_satd_32x32_avx2;
+        p.chroma[X265_CSP_I422].pu[CHROMA_422_16x64].satd = x265_pixel_satd_16x64_avx2;
+        p.chroma[X265_CSP_I422].pu[CHROMA_422_16x8].satd = x265_pixel_satd_16x8_avx2;
+        p.chroma[X265_CSP_I422].pu[CHROMA_422_32x16].satd = x265_pixel_satd_32x16_avx2;
 
         p.cu[BLOCK_16x16].ssd_s = x265_pixel_ssd_s_16_avx2;
         p.cu[BLOCK_32x32].ssd_s = x265_pixel_ssd_s_32_avx2;


More information about the x265-devel mailing list