[x265] [PATCH] remove redundant register copy in FILTER_H4_w2_2 and FILTER_H4_w4_2

Min Chen chenm003 at 163.com
Sat Oct 19 12:09:11 CEST 2013


# HG changeset patch
# User Min Chen <chenm003 at 163.com>
# Date 1382177287 -28800
# Node ID 2424b68ff8ad01be0a134578cf4e16cd21174788
# Parent  4066e6e725ee5c3ec393ceabaf52f7e00c689bdb
remove redundant register copy in FILTER_H4_w2_2 and FILTER_H4_w4_2

diff -r 4066e6e725ee -r 2424b68ff8ad source/common/x86/ipfilter8.asm
--- a/source/common/x86/ipfilter8.asm	Fri Oct 18 15:00:40 2013 -0500
+++ b/source/common/x86/ipfilter8.asm	Sat Oct 19 18:08:07 2013 +0800
@@ -55,11 +55,11 @@
 SECTION .text
 
 %macro FILTER_H4_w2_2 3
-    movu        %1, [srcq - 1]
-    pshufb      %2, %1, Tm0
+    movu        %2, [srcq - 1]
+    pshufb      %2, Tm0
     pmaddubsw   %2, coef2
     movu        %1, [srcq + srcstrideq - 1]
-    pshufb      %1, %1, Tm0
+    pshufb      %1, Tm0
     pmaddubsw   %1, coef2
     phaddw      %2, %1
     pmulhrsw    %2, %3
@@ -137,11 +137,11 @@
 RET
 
 %macro FILTER_H4_w4_2 3
-    movu        %1, [srcq - 1]
-    pshufb      %2, %1, Tm0
+    movu        %2, [srcq - 1]
+    pshufb      %2, Tm0
     pmaddubsw   %2, coef2
     movu        %1, [srcq + srcstrideq - 1]
-    pshufb      %1, %1, Tm0
+    pshufb      %1, Tm0
     pmaddubsw   %1, coef2
     phaddw      %2, %1
     pmulhrsw    %2, %3



More information about the x265-devel mailing list