[x265] [PATCH] asm: pixel_avg_48x64, pixel_avg_8x32

Dnyaneshwar Gorade dnyaneshwar at multicorewareinc.com
Tue Nov 12 07:27:05 CET 2013


# HG changeset patch
# User Dnyaneshwar Gorade <dnyaneshwar at multicorewareinc.com>
# Date 1384237578 -19800
#      Tue Nov 12 11:56:18 2013 +0530
# Node ID 60303b478851805812f70b06a39c52836c2dffa8
# Parent  1130599ba7772f83bdfdbfafb896110544a0e594
asm: add pixel_avg_48x64 and pixel_avg_8x32 primitives

diff -r 1130599ba777 -r 60303b478851 source/common/x86/asm-primitives.cpp
--- a/source/common/x86/asm-primitives.cpp	Tue Nov 12 11:44:58 2013 +0530
+++ b/source/common/x86/asm-primitives.cpp	Tue Nov 12 11:56:18 2013 +0530
@@ -121,6 +121,7 @@
     p.pixelavg_pp[LUMA_64x64] = x265_pixel_avg_64x64_ ## cpu; \
     p.pixelavg_pp[LUMA_64x48] = x265_pixel_avg_64x48_ ## cpu; \
     p.pixelavg_pp[LUMA_64x16] = x265_pixel_avg_64x16_ ## cpu; \
+    p.pixelavg_pp[LUMA_48x64] = x265_pixel_avg_48x64_ ## cpu; \
     p.pixelavg_pp[LUMA_32x64] = x265_pixel_avg_32x64_ ## cpu; \
     p.pixelavg_pp[LUMA_32x32] = x265_pixel_avg_32x32_ ## cpu; \
     p.pixelavg_pp[LUMA_32x24] = x265_pixel_avg_32x24_ ## cpu; \
@@ -133,6 +134,7 @@
     p.pixelavg_pp[LUMA_16x12]  = x265_pixel_avg_16x12_ ## cpu; \
     p.pixelavg_pp[LUMA_16x8]  = x265_pixel_avg_16x8_ ## cpu; \
     p.pixelavg_pp[LUMA_16x4]  = x265_pixel_avg_16x4_ ## cpu; \
+    p.pixelavg_pp[LUMA_8x32]  = x265_pixel_avg_8x32_ ## cpu; \
     p.pixelavg_pp[LUMA_8x16]  = x265_pixel_avg_8x16_ ## cpu; \
     p.pixelavg_pp[LUMA_8x8]   = x265_pixel_avg_8x8_ ## cpu; \
     p.pixelavg_pp[LUMA_8x4]   = x265_pixel_avg_8x4_ ## cpu;
diff -r 1130599ba777 -r 60303b478851 source/common/x86/mc-a.asm
--- a/source/common/x86/mc-a.asm	Tue Nov 12 11:44:58 2013 +0530
+++ b/source/common/x86/mc-a.asm	Tue Nov 12 11:56:18 2013 +0530
@@ -239,6 +239,7 @@
 AVG_WEIGHT 32
 AVG_WEIGHT 64
 AVG_WEIGHT 24
+AVG_WEIGHT 48
 %if HIGH_BIT_DEPTH
 INIT_XMM sse2
 AVG_WEIGHT 4,  8
@@ -251,6 +252,7 @@
 AVG_WEIGHT 32, 7
 AVG_WEIGHT 64, 7
 AVG_WEIGHT 24, 7
+AVG_WEIGHT 48, 7
 %define BIWEIGHT BIWEIGHT_SSSE3
 %define BIWEIGHT_START BIWEIGHT_START_SSSE3
 INIT_MMX ssse3
@@ -261,6 +263,7 @@
 AVG_WEIGHT 32, 7
 AVG_WEIGHT 64, 7
 AVG_WEIGHT 24, 7
+AVG_WEIGHT 48, 7
 
 INIT_YMM avx2
 cglobal pixel_avg_weight_w16
@@ -720,6 +723,7 @@
 AVGH 4, 2
 
 AVG_FUNC 8, movq, movq
+AVGH 8, 32
 AVGH 8, 16
 AVGH 8,  8
 AVGH 8,  4
@@ -746,6 +750,9 @@
 AVG_FUNC 24, movq, movq
 AVGH 24, 32
 
+AVG_FUNC 48, movq, movq
+AVGH 48, 64
+
 INIT_XMM sse2
 AVG_FUNC 64, movdqu, movdqa
 AVGH 64, 64
@@ -769,6 +776,11 @@
 AVGH 16, 12
 AVGH 16, 8
 AVGH 16, 4
+
+AVG_FUNC 48, movdqu, movdqa
+AVGH 48, 64
+
+AVGH  8, 32
 AVGH  8, 16
 AVGH  8,  8
 AVGH  8,  4
@@ -791,6 +803,10 @@
 AVGH 16, 12
 AVGH 16, 8
 AVGH 16, 4
+
+AVGH 48, 64
+
+AVGH  8, 32
 AVGH  8, 16
 AVGH  8,  8
 AVGH  8,  4
diff -r 1130599ba777 -r 60303b478851 source/common/x86/pixel.h
--- a/source/common/x86/pixel.h	Tue Nov 12 11:44:58 2013 +0530
+++ b/source/common/x86/pixel.h	Tue Nov 12 11:56:18 2013 +0530
@@ -241,6 +241,7 @@
 DECL_SUF(x265_pixel_avg_64x64, (pixel *, intptr_t, pixel *, intptr_t, pixel *, intptr_t, int))
 DECL_SUF(x265_pixel_avg_64x48, (pixel *, intptr_t, pixel *, intptr_t, pixel *, intptr_t, int))
 DECL_SUF(x265_pixel_avg_64x16, (pixel *, intptr_t, pixel *, intptr_t, pixel *, intptr_t, int))
+DECL_SUF(x265_pixel_avg_48x64, (pixel *, intptr_t, pixel *, intptr_t, pixel *, intptr_t, int))
 DECL_SUF(x265_pixel_avg_32x64, (pixel *, intptr_t, pixel *, intptr_t, pixel *, intptr_t, int))
 DECL_SUF(x265_pixel_avg_32x32, (pixel *, intptr_t, pixel *, intptr_t, pixel *, intptr_t, int))
 DECL_SUF(x265_pixel_avg_32x24, (pixel *, intptr_t, pixel *, intptr_t, pixel *, intptr_t, int))
@@ -253,6 +254,7 @@
 DECL_SUF(x265_pixel_avg_16x12, (pixel *, intptr_t, pixel *, intptr_t, pixel *, intptr_t, int))
 DECL_SUF(x265_pixel_avg_16x8,  (pixel *, intptr_t, pixel *, intptr_t, pixel *, intptr_t, int))
 DECL_SUF(x265_pixel_avg_16x4,  (pixel *, intptr_t, pixel *, intptr_t, pixel *, intptr_t, int))
+DECL_SUF(x265_pixel_avg_8x32,  (pixel *, intptr_t, pixel *, intptr_t, pixel *, intptr_t, int))
 DECL_SUF(x265_pixel_avg_8x16,  (pixel *, intptr_t, pixel *, intptr_t, pixel *, intptr_t, int))
 DECL_SUF(x265_pixel_avg_8x8,   (pixel *, intptr_t, pixel *, intptr_t, pixel *, intptr_t, int))
 DECL_SUF(x265_pixel_avg_8x4,   (pixel *, intptr_t, pixel *, intptr_t, pixel *, intptr_t, int))


More information about the x265-devel mailing list