[x265] [PATCH 164 of 307] Disable all avx512 Kernels with negative IPC gains over avx2 Kernels

mythreyi at multicorewareinc.com mythreyi at multicorewareinc.com
Sat Apr 7 04:32:42 CEST 2018


# HG changeset patch
# User Jayashree
# Date 1510736734 -19800
#      Wed Nov 15 14:35:34 2017 +0530
# Node ID 7d41838f5d06ad4fbdabd08af99d724fcd599193
# Parent  e1dedfae074d765c26efca976538cd06e1ef7cab
Disable all avx512 Kernels with negative IPC gains over avx2 Kernels.

diff -r e1dedfae074d -r 7d41838f5d06 source/common/x86/asm-primitives.cpp
--- a/source/common/x86/asm-primitives.cpp	Tue Nov 14 02:11:35 2017 -0800
+++ b/source/common/x86/asm-primitives.cpp	Wed Nov 15 14:35:34 2017 +0530
@@ -4328,10 +4328,10 @@
     if (cpuMask & X265_CPU_AVX512)
     {
         p.pu[LUMA_32x8].sad = PFX(pixel_sad_32x8_avx512);
-        p.pu[LUMA_32x16].sad = PFX(pixel_sad_32x16_avx512);
+      //  p.pu[LUMA_32x16].sad = PFX(pixel_sad_32x16_avx512);
         p.pu[LUMA_32x24].sad = PFX(pixel_sad_32x24_avx512);
         p.pu[LUMA_32x32].sad = PFX(pixel_sad_32x32_avx512);
-        p.pu[LUMA_32x64].sad = PFX(pixel_sad_32x64_avx512);
+        //p.pu[LUMA_32x64].sad = PFX(pixel_sad_32x64_avx512);
         p.pu[LUMA_64x16].sad = PFX(pixel_sad_64x16_avx512);
         p.pu[LUMA_64x32].sad = PFX(pixel_sad_64x32_avx512);
         p.pu[LUMA_64x48].sad = PFX(pixel_sad_64x48_avx512);
@@ -4400,14 +4400,14 @@
         p.pu[LUMA_8x32].pixelavg_pp = PFX(pixel_avg_8x32_avx512);
         p.pu[LUMA_8x16].pixelavg_pp = PFX(pixel_avg_8x16_avx512);
         p.pu[LUMA_8x8].pixelavg_pp = PFX(pixel_avg_8x8_avx512);
-        p.pu[LUMA_8x4].pixelavg_pp = PFX(pixel_avg_8x4_avx512);
+        //p.pu[LUMA_8x4].pixelavg_pp = PFX(pixel_avg_8x4_avx512);
 
         p.pu[LUMA_4x4].sad = PFX(pixel_sad_4x4_avx512);
         p.pu[LUMA_4x8].sad = PFX(pixel_sad_4x8_avx512);
         p.pu[LUMA_4x16].sad = PFX(pixel_sad_4x16_avx512);
         p.pu[LUMA_8x4].sad = PFX(pixel_sad_8x4_avx512);
         p.pu[LUMA_8x8].sad = PFX(pixel_sad_8x8_avx512);
-        p.pu[LUMA_8x16].sad = PFX(pixel_sad_8x16_avx512);
+       // p.pu[LUMA_8x16].sad = PFX(pixel_sad_8x16_avx512);
         p.pu[LUMA_16x8].sad = PFX(pixel_sad_16x8_avx512);
         p.pu[LUMA_16x16].sad = PFX(pixel_sad_16x16_avx512);
 


More information about the x265-devel mailing list