[x264-devel] Fix 10L in r1912

Jason Garrett-Glaser git at videolan.org
Sat Feb 19 02:51:39 CET 2011


x264 | branch: master | Jason Garrett-Glaser <jason at x264.com> | Fri Feb 18 17:50:42 2011 -0800| [f9255738e3ac37430715201430f577edf1a44b57] | committer: Jason Garrett-Glaser

Fix 10L in r1912
The SSSE3 code path was being used for the MMX/SSE2 versions and vice versa (in the hpel filter); the two branches of the conditional are now swapped back.

> http://git.videolan.org/gitweb.cgi/x264.git/?a=commit;h=f9255738e3ac37430715201430f577edf1a44b57
---

 common/x86/mc-a2.asm |   12 ++++++------
 1 files changed, 6 insertions(+), 6 deletions(-)

diff --git a/common/x86/mc-a2.asm b/common/x86/mc-a2.asm
index 6fdde60..bee1436 100644
--- a/common/x86/mc-a2.asm
+++ b/common/x86/mc-a2.asm
@@ -329,6 +329,12 @@ cglobal hpel_filter_v_%1, 5,6,%2
 %endif
 .loop:
 %if %3
+    LOAD_ADD_2 m1, m4, [r1     ], [r5+r3*2], m6, m7            ; a0 / a1
+    LOAD_ADD_2 m2, m5, [r1+r3  ], [r5+r3  ], m6, m7            ; b0 / b1
+    LOAD_ADD   m3,     [r1+r3*2], [r5     ], m7                ; c0
+    LOAD_ADD   m6,     [r1+r3*2+mmsize/2], [r5+mmsize/2], m7   ; c1
+    FILT_V2 m1, m2, m3, m4, m5, m6
+%else
     mova m1, [r1]
     mova m4, [r1+r3]
     mova m2, [r5+r3*2]
@@ -348,12 +354,6 @@ cglobal hpel_filter_v_%1, 5,6,%2
     paddw  m4, m5
     paddw  m1, m3
     paddw  m4, m6
-%else
-    LOAD_ADD_2 m1, m4, [r1     ], [r5+r3*2], m6, m7            ; a0 / a1
-    LOAD_ADD_2 m2, m5, [r1+r3  ], [r5+r3  ], m6, m7            ; b0 / b1
-    LOAD_ADD   m3,     [r1+r3*2], [r5     ], m7                ; c0
-    LOAD_ADD   m6,     [r1+r3*2+mmsize/2], [r5+mmsize/2], m7   ; c1
-    FILT_V2 m1, m2, m3, m4, m5, m6
 %endif
     mova      m7, [pw_16]
     mova      [r2+r4*2], m1



More information about the x264-devel mailing list