[x265] [PATCH] asm: replace ssse3 instruction in pixel_ssd_ss_*_sse2

Min Chen chenm003 at 163.com
Fri Sep 5 01:42:31 CEST 2014


# HG changeset patch
# User Min Chen <chenm003 at 163.com>
# Date 1409874144 25200
# Node ID fb7b890c5265d17033828718c294f1843d7da6a6
# Parent  0e0d0309e61679cbf221d0c82c27f5703767f935
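asm: replace ssse3 instruction in pixel_ssd_ss_*_sse2

phaddd is an SSSE3 instruction, so it must not be used in functions that
are built for SSE2. Replace each phaddd-based final reduction (including
the width-4 special case) with the HADDD macro, passing m1 as its second
operand.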

diff -r 0e0d0309e616 -r fb7b890c5265 source/common/x86/ssd-a.asm
--- a/source/common/x86/ssd-a.asm	Thu Sep 04 18:17:44 2014 +0200
+++ b/source/common/x86/ssd-a.asm	Thu Sep 04 16:42:24 2014 -0700
@@ -434,12 +434,7 @@
     dec    r4d
     jg .loop
 %endif
-%if %1 == 4
-    phaddd    m0, m0
-%else
-    phaddd    m0, m0
-    phaddd    m0, m0
-%endif
+    HADDD     m0, m1
     movd     eax, m0
     RET
 %endmacro
@@ -495,8 +490,7 @@
     lea       r2, [r2 + 2*r3]
     dec      r4d
     jnz .loop
-    phaddd    m0, m0
-    phaddd    m0, m0
+    HADDD     m0, m1
     movd     eax, m0
     RET
 %endmacro
@@ -553,8 +547,7 @@
     lea       r2, [r2 + 2*r3]
     dec      r4d
     jnz .loop
-    phaddd    m0, m0
-    phaddd    m0, m0
+    HADDD     m0, m1
     movd     eax, m0
     RET
 %endmacro
@@ -609,8 +602,7 @@
     lea       r2, [r2 + 2*r3]
     dec      r4d
     jnz .loop
-    phaddd    m0, m0
-    phaddd    m0, m0
+    HADDD     m0, m1
     movd     eax, m0
     RET
 %endmacro
@@ -687,8 +679,7 @@
     lea       r2, [r2 + 2*r3]
     dec      r4d
     jnz .loop
-    phaddd    m0, m0
-    phaddd    m0, m0
+    HADDD     m0, m1
     movd     eax, m0
     RET
 %endmacro
@@ -785,8 +776,7 @@
     lea     r2, [r2 + 2*r3]
     dec     r4d
     jnz .loop
-    phaddd    m0, m0
-    phaddd    m0, m0
+    HADDD     m0, m1
     movd     eax, m0
     RET
 %endmacro



More information about the x265-devel mailing list