[x264-devel] Fix 10L in r1912
Jason Garrett-Glaser
git at videolan.org
Sat Feb 19 02:51:39 CET 2011
x264 | branch: master | Jason Garrett-Glaser <jason at x264.com> | Fri Feb 18 17:50:42 2011 -0800| [f9255738e3ac37430715201430f577edf1a44b57] | committer: Jason Garrett-Glaser
Fix 10L in r1912
SSSE3 code got used in MMX/SSE2 and vice versa (in hpel).
> http://git.videolan.org/gitweb.cgi/x264.git/?a=commit;h=f9255738e3ac37430715201430f577edf1a44b57
---
common/x86/mc-a2.asm | 12 ++++++------
1 files changed, 6 insertions(+), 6 deletions(-)
diff --git a/common/x86/mc-a2.asm b/common/x86/mc-a2.asm
index 6fdde60..bee1436 100644
--- a/common/x86/mc-a2.asm
+++ b/common/x86/mc-a2.asm
@@ -329,6 +329,12 @@ cglobal hpel_filter_v_%1, 5,6,%2
%endif
.loop:
%if %3
+ LOAD_ADD_2 m1, m4, [r1 ], [r5+r3*2], m6, m7 ; a0 / a1
+ LOAD_ADD_2 m2, m5, [r1+r3 ], [r5+r3 ], m6, m7 ; b0 / b1
+ LOAD_ADD m3, [r1+r3*2], [r5 ], m7 ; c0
+ LOAD_ADD m6, [r1+r3*2+mmsize/2], [r5+mmsize/2], m7 ; c1
+ FILT_V2 m1, m2, m3, m4, m5, m6
+%else
mova m1, [r1]
mova m4, [r1+r3]
mova m2, [r5+r3*2]
@@ -348,12 +354,6 @@ cglobal hpel_filter_v_%1, 5,6,%2
paddw m4, m5
paddw m1, m3
paddw m4, m6
-%else
- LOAD_ADD_2 m1, m4, [r1 ], [r5+r3*2], m6, m7 ; a0 / a1
- LOAD_ADD_2 m2, m5, [r1+r3 ], [r5+r3 ], m6, m7 ; b0 / b1
- LOAD_ADD m3, [r1+r3*2], [r5 ], m7 ; c0
- LOAD_ADD m6, [r1+r3*2+mmsize/2], [r5+mmsize/2], m7 ; c1
- FILT_V2 m1, m2, m3, m4, m5, m6
%endif
mova m7, [pw_16]
mova [r2+r4*2], m1
More information about the x264-devel
mailing list