[x265] [PATCH 009 of 307] x86: AVX512 pixel_avg_weight 8x32, 16x4, 16x12, 16x32, 16x64

mythreyi at multicorewareinc.com mythreyi at multicorewareinc.com
Sat Apr 7 04:30:07 CEST 2018


# HG changeset patch
# User Vignesh Vijayakumar
# Date 1499231221 -19800
#      Wed Jul 05 10:37:01 2017 +0530
# Node ID 84757e275a5427f0875fc4fd651bd1c48d534e8f
# Parent  69b61721fa2ffdf1a0f6609a299c4e0104b48628
x86: AVX512 pixel_avg_weight 8x32, 16x4, 16x12, 16x32, 16x64

diff -r 69b61721fa2f -r 84757e275a54 source/common/x86/asm-primitives.cpp
--- a/source/common/x86/asm-primitives.cpp	Mon Jun 26 16:31:52 2017 +0530
+++ b/source/common/x86/asm-primitives.cpp	Wed Jul 05 10:37:01 2017 +0530
@@ -3757,8 +3757,13 @@
 
         p.cu[BLOCK_8x8].var = PFX(pixel_var_8x8_avx512);
         p.cu[BLOCK_16x16].var = PFX(pixel_var_16x16_avx512);
+        p.pu[LUMA_16x64].pixelavg_pp = PFX(pixel_avg_16x64_avx512);
+        p.pu[LUMA_16x32].pixelavg_pp = PFX(pixel_avg_16x32_avx512);
         p.pu[LUMA_16x16].pixelavg_pp = PFX(pixel_avg_16x16_avx512);
+        p.pu[LUMA_16x12].pixelavg_pp = PFX(pixel_avg_16x12_avx512);
         p.pu[LUMA_16x8].pixelavg_pp = PFX(pixel_avg_16x8_avx512);
+        p.pu[LUMA_16x4].pixelavg_pp = PFX(pixel_avg_16x4_avx512);
+        p.pu[LUMA_8x32].pixelavg_pp = PFX(pixel_avg_8x32_avx512);
         p.pu[LUMA_8x16].pixelavg_pp = PFX(pixel_avg_8x16_avx512);
         p.pu[LUMA_8x8].pixelavg_pp = PFX(pixel_avg_8x8_avx512);
         p.pu[LUMA_8x4].pixelavg_pp = PFX(pixel_avg_8x4_avx512);
diff -r 69b61721fa2f -r 84757e275a54 source/common/x86/mc-a.asm
--- a/source/common/x86/mc-a.asm	Mon Jun 26 16:31:52 2017 +0530
+++ b/source/common/x86/mc-a.asm	Wed Jul 05 10:37:01 2017 +0530
@@ -4413,8 +4413,13 @@
 AVGH 16, 4
 
 INIT_XMM avx512
+AVGH 16, 64
+AVGH 16, 32
 AVGH 16, 16
+AVGH 16, 12
 AVGH 16,  8
+AVGH 16,  4
+AVGH  8, 32
 AVGH  8, 16
 AVGH  8,  8
 AVGH  8,  4


More information about the x265-devel mailing list