[x265] [PATCH] all_angs_pred_4x4, reduced mov instruction

praveen at multicorewareinc.com praveen at multicorewareinc.com
Wed Dec 4 15:36:08 CET 2013


# HG changeset patch
# User Praveen Tiwari
# Date 1386167757 -19800
# Node ID c31e28cd26aa8a3f07ba0023a5923931cc687a2d
# Parent  1e130f825cbbfa805602d4eb381b38e62ff82458
all_angs_pred_4x4: load [r5 + 20 * 16] into m7 once and reuse it, replacing repeated memory operands

diff -r 1e130f825cbb -r c31e28cd26aa source/common/x86/intrapred8.asm
--- a/source/common/x86/intrapred8.asm	Wed Dec 04 19:26:58 2013 +0530
+++ b/source/common/x86/intrapred8.asm	Wed Dec 04 20:05:57 2013 +0530
@@ -791,7 +791,9 @@
 
 palignr       m2,        m1,        2
 
-pmaddubsw     m6,        m2,        [r5 + 20 * 16]
+mova          m7,        [r5 + 20 * 16]
+
+pmaddubsw     m6,        m2,        m7
 pmulhrsw      m6,        m0
 packuswb      m6,        m6
 movd          [r0 + 20], m6
@@ -827,7 +829,7 @@
 packuswb      m4,        m4
 movd          [r0 + 40], m4
 
-pmaddubsw     m4,        m3,        [r5 + 20 * 16]
+pmaddubsw     m4,        m3,        m7
 pmulhrsw      m4,        m0
 packuswb      m4,        m4
 movd          [r0 + 44], m4
@@ -909,7 +911,7 @@
 packuswb      m2,         m2
 movd          [r0 + 104], m2
 
-pmaddubsw     m2,         m1,       [r5 + 20 * 16]
+pmaddubsw     m2,         m1,       m7
 pmulhrsw      m2,         m0
 packuswb      m2,         m2
 movd          [r0 + 108], m2
@@ -1412,7 +1414,7 @@
 packuswb      m2,         m2
 movd          [r0 + 424], m2
 
-pmaddubsw     m2,         m1,     [r5 + 20 * 16]
+pmaddubsw     m2,         m1,     m7
 pmulhrsw      m2,         m0
 packuswb      m2,         m2
 movd          [r0 + 428], m2
@@ -1458,7 +1460,7 @@
 packuswb      m3,         m3
 movd          [r0 + 456], m3
 
-pmaddubsw     m5,         m2,     [r5 + 20 * 16]
+pmaddubsw     m5,         m2,     m7
 pmulhrsw      m5,         m0
 packuswb      m5,         m5
 movd          [r0 + 460], m5
@@ -1504,7 +1506,7 @@
 packuswb      m4,         m4
 movd          [r0 + 488], m4
 
-pmaddubsw     m4,         m3,     [r5 + 20 * 16]
+pmaddubsw     m4,         m3,     m7
 pmulhrsw      m4,         m0
 packuswb      m4,         m4
 movd          [r0 + 492], m4


More information about the x265-devel mailing list