[x265] [PATCH] asm code blockcopy_ps_16x4, eliminate hidden register copy

praveen at multicorewareinc.com praveen at multicorewareinc.com
Mon Nov 11 12:08:02 CET 2013


# HG changeset patch
# User Praveen Tiwari
# Date 1384168071 -19800
# Node ID a4198e18262ff5ce0655fa322e1ccdb69a44f933
# Parent  859aa956515ccc0b1717edaed67c7e8f59f915fc
asm code blockcopy_ps_16x4, eliminate hidden register copy

diff -r 859aa956515c -r a4198e18262f source/common/x86/blockcopy8.asm
--- a/source/common/x86/blockcopy8.asm	Mon Nov 11 16:29:44 2013 +0530
+++ b/source/common/x86/blockcopy8.asm	Mon Nov 11 16:37:51 2013 +0530
@@ -1797,19 +1797,19 @@
 pxor       m0,      m0
 
 movu       m1,                 [r2]
-punpcklbw  m2,                 m1,            m0
+pmovzxbw   m2,                 m1
 movu       [r0],               m2
 punpckhbw  m1,                 m0
 movu       [r0 + 16],          m1
 
 movu       m1,                 [r2 + r3]
-punpcklbw  m2,                 m1,            m0
+pmovzxbw   m2,                 m1
 movu       [r0 + r1],          m2
 punpckhbw  m1,                 m0
 movu       [r0 + r1 + 16],     m1
 
 movu       m1,                 [r2 + 2 * r3]
-punpcklbw  m2,                 m1,            m0
+pmovzxbw   m2,                 m1
 movu       [r0 + 2 * r1],      m2
 punpckhbw  m1,                 m0
 movu       [r0 + 2 * r1 + 16], m1
@@ -1818,7 +1818,7 @@
 lea        r2,                 [r2 + 2 * r3]
 
 movu       m1,                 [r2 + r3]
-punpcklbw  m2,                 m1,            m0
+pmovzxbw   m2,                 m1
 movu       [r0 + r1],          m2
 punpckhbw  m1,                 m0
 movu       [r0 + r1 + 16],     m1


More information about the x265-devel mailing list