[x265] [PATCH] remove redundant register copy in FILTER_H4_w2_2 and FILTER_H4_w4_2
Min Chen
chenm003 at 163.com
Sat Oct 19 12:09:11 CEST 2013
# HG changeset patch
# User Min Chen <chenm003 at 163.com>
# Date 1382177287 -28800
# Node ID 2424b68ff8ad01be0a134578cf4e16cd21174788
# Parent 4066e6e725ee5c3ec393ceabaf52f7e00c689bdb
remove redundant register copy in FILTER_H4_w2_2 and FILTER_H4_w4_2
diff -r 4066e6e725ee -r 2424b68ff8ad source/common/x86/ipfilter8.asm
--- a/source/common/x86/ipfilter8.asm Fri Oct 18 15:00:40 2013 -0500
+++ b/source/common/x86/ipfilter8.asm Sat Oct 19 18:08:07 2013 +0800
@@ -55,11 +55,11 @@
SECTION .text
%macro FILTER_H4_w2_2 3
- movu %1, [srcq - 1]
- pshufb %2, %1, Tm0
+ movu %2, [srcq - 1]
+ pshufb %2, Tm0
pmaddubsw %2, coef2
movu %1, [srcq + srcstrideq - 1]
- pshufb %1, %1, Tm0
+ pshufb %1, Tm0
pmaddubsw %1, coef2
phaddw %2, %1
pmulhrsw %2, %3
@@ -137,11 +137,11 @@
RET
%macro FILTER_H4_w4_2 3
- movu %1, [srcq - 1]
- pshufb %2, %1, Tm0
+ movu %2, [srcq - 1]
+ pshufb %2, Tm0
pmaddubsw %2, coef2
movu %1, [srcq + srcstrideq - 1]
- pshufb %1, %1, Tm0
+ pshufb %1, Tm0
pmaddubsw %1, coef2
phaddw %2, %1
pmulhrsw %2, %3
More information about the x265-devel mailing list