[x264-devel] commit: SSSE3 high bit depth sad_aligned functions (Jason Garrett-Glaser)
git at videolan.org
git at videolan.org
Mon Jan 10 22:00:59 CET 2011
x264 | branch: master | Jason Garrett-Glaser <darkshikari at gmail.com> | Sat Dec 18 05:40:49 2010 -0800| [e570fc2e6305cc5b5dd0422c9bdd1babe37f3d1b] | committer: Jason Garrett-Glaser
SSSE3 high bit depth sad_aligned functions
> http://git.videolan.org/gitweb.cgi/x264.git/?a=commit;h=e570fc2e6305cc5b5dd0422c9bdd1babe37f3d1b
---
common/pixel.c | 1 +
common/x86/pixel.h | 1 +
common/x86/sad16-a.asm | 6 ++++++
3 files changed, 8 insertions(+), 0 deletions(-)
diff --git a/common/pixel.c b/common/pixel.c
index 4abd6fa..ee05eab 100644
--- a/common/pixel.c
+++ b/common/pixel.c
@@ -825,6 +825,7 @@ void x264_pixel_init( int cpu, x264_pixel_function_t *pixf )
}
if( cpu&X264_CPU_SSSE3 )
{
+ INIT4_NAME( sad_aligned, sad, _ssse3_aligned );
INIT7( sad, _ssse3 );
INIT7( sad_x3, _ssse3 );
INIT7( sad_x4, _ssse3 );
diff --git a/common/x86/pixel.h b/common/x86/pixel.h
index bff7efb..2893244 100644
--- a/common/x86/pixel.h
+++ b/common/x86/pixel.h
@@ -50,6 +50,7 @@ DECL_X4( sad, sse2_misalign )
DECL_X1( sad, sse3 )
DECL_X1( sad, sse2_aligned )
DECL_X1( sad, ssse3 )
+DECL_X1( sad, ssse3_aligned )
DECL_X4( sad, mmxext )
DECL_X4( sad, sse2 )
DECL_X4( sad, sse3 )
diff --git a/common/x86/sad16-a.asm b/common/x86/sad16-a.asm
index d19d05b..bb480ce 100644
--- a/common/x86/sad16-a.asm
+++ b/common/x86/sad16-a.asm
@@ -189,6 +189,12 @@ SAD_XMM 16, 8, ssse3
SAD_XMM 8, 16, ssse3
SAD_XMM 8, 8, ssse3
SAD_XMM 8, 4, ssse3
+%define movdqu movdqa
+SAD_XMM 16, 16, ssse3_aligned
+SAD_XMM 16, 8, ssse3_aligned
+SAD_XMM 8, 16, ssse3_aligned
+SAD_XMM 8, 8, ssse3_aligned
+%undef movdqu
%undef ABS1
%undef ABS2
More information about the x264-devel mailing list