[x265] [PATCH 6 of 6] SEA motion search: Enable asm primitives for integralv functions

vignesh at multicorewareinc.com vignesh at multicorewareinc.com
Tue May 9 06:46:23 CEST 2017


# HG changeset patch
# User Vignesh Vijayakumar
# Date 1494225575 -19800
#      Mon May 08 12:09:35 2017 +0530
# Node ID 30fe0887253840f4baf5b6f6027aa4f1fdb62917
# Parent  093a7d74fe35ffe5ab4c335efcc690a8e2ed31f2
SEA motion search:Enable asm primitives for integralv functions

diff -r 093a7d74fe35 -r 30fe08872538 source/encoder/framefilter.cpp
--- a/source/encoder/framefilter.cpp	Mon May 08 11:31:24 2017 +0530
+++ b/source/encoder/framefilter.cpp	Mon May 08 12:09:35 2017 +0530
@@ -854,45 +854,45 @@
             /*For width = 32 */
             integral_init32h_c(sum32x32, pix, stride);
             if (y >= 32 - padY)
-                integral_init32v_c(sum32x32 - 32 * stride, stride);
+                primitives.integral_initv[5](sum32x32 - 32 * stride, stride);
             integral_init32h_c(sum32x24, pix, stride);
             if (y >= 24 - padY)
-                integral_init24v_c(sum32x24 - 24 * stride, stride);
+                primitives.integral_initv[4](sum32x24 - 24 * stride, stride);
             integral_init32h_c(sum32x8, pix, stride);
             if (y >= 8 - padY)
-                integral_init8v_c(sum32x8 - 8 * stride, stride);
+                primitives.integral_initv[1](sum32x8 - 8 * stride, stride);
             /*For width = 24 */
             integral_init24h_c(sum24x32, pix, stride);
             if (y >= 32 - padY)
-                integral_init32v_c(sum24x32 - 32 * stride, stride);
+                primitives.integral_initv[5](sum24x32 - 32 * stride, stride);
             /*For width = 16 */
             integral_init16h_c(sum16x16, pix, stride);
             if (y >= 16 - padY)
-                integral_init16v_c(sum16x16 - 16 * stride, stride);
+                primitives.integral_initv[3](sum16x16 - 16 * stride, stride);
             integral_init16h_c(sum16x12, pix, stride);
             if (y >= 12 - padY)
-                integral_init12v_c(sum16x12 - 12 * stride, stride);
+                primitives.integral_initv[2](sum16x12 - 12 * stride, stride);
             integral_init16h_c(sum16x4, pix, stride);
             if (y >= 4 - padY)
-                integral_init4v_c(sum16x4 - 4 * stride, stride);
+                primitives.integral_initv[0](sum16x4 - 4 * stride, stride);
             /*For width = 12 */
             integral_init12h_c(sum12x16, pix, stride);
             if (y >= 16 - padY)
-                integral_init16v_c(sum12x16 - 16 * stride, stride);
+                primitives.integral_initv[3](sum12x16 - 16 * stride, stride);
             /*For width = 8 */
             integral_init8h_c(sum8x32, pix, stride);
             if (y >= 32 - padY)
-                integral_init32v_c(sum8x32 - 32 * stride, stride);
+                primitives.integral_initv[5](sum8x32 - 32 * stride, stride);
             integral_init8h_c(sum8x8, pix, stride);
             if (y >= 8 - padY)
-                integral_init8v_c(sum8x8 - 8 * stride, stride);
+                primitives.integral_initv[1](sum8x8 - 8 * stride, stride);
             /*For width = 4 */
             integral_init4h_c(sum4x16, pix, stride);
             if (y >= 16 - padY)
-                integral_init16v_c(sum4x16 - 16 * stride, stride);
+                primitives.integral_initv[3](sum4x16 - 16 * stride, stride);
             integral_init4h_c(sum4x4, pix, stride);
             if (y >= 4 - padY)
-                integral_init4v_c(sum4x4 - 4 * stride, stride);
+                primitives.integral_initv[0](sum4x4 - 4 * stride, stride);
         }
         m_parallelFilter[row].m_frameFilter->integralCompleted.set(1);
     }


More information about the x265-devel mailing list