[x265] [PATCH] pixel_add_pp: 4x8, 4x16, merged movd and pmovzxbw instructions

Praveen Tiwari praveen at multicorewareinc.com
Wed Nov 20 14:15:40 CET 2013


# HG changeset patch
# User Praveen Tiwari
# Date 1384953332 -19800
# Node ID ce1c38cd5e4373a6fe2d8df5bacd97536c7574c5
# Parent  1044e71e42ad08d9961e3c3106609eda58f099f4
pixel_add_pp: 4x8, 4x16: merged each movd + pmovzxbw pair into a single pmovzxbw with a memory operand

diff -r 1044e71e42ad -r ce1c38cd5e43 source/common/x86/pixeladd8.asm
--- a/source/common/x86/pixeladd8.asm	Wed Nov 20 18:40:59 2013 +0530
+++ b/source/common/x86/pixeladd8.asm	Wed Nov 20 18:45:32 2013 +0530
@@ -113,8 +113,7 @@
 mov         r6d,           %2/4
 
 .loop
-      movd        m0,            [r2]
-      pmovzxbw    m0,            m0
+      pmovzxbw    m0,            [r2]
       movh        m1,            [r3]
 
       paddw       m0,            m1
@@ -122,8 +121,7 @@
 
       movd        [r0],          m0
 
-      movd        m0,            [r2 + r4]
-      pmovzxbw    m0,            m0
+      pmovzxbw    m0,            [r2 + r4]
       movh        m1,            [r3 + r5]
 
       paddw       m0,            m1
@@ -131,8 +129,7 @@
 
       movd        [r0 + r1],     m0
 
-      movd        m0,            [r2 + 2 * r4]
-      pmovzxbw    m0,            m0
+      pmovzxbw    m0,            [r2 + 2 * r4]
       movh        m1,            [r3 + 2 * r5]
 
       paddw       m0,            m1
@@ -144,8 +141,7 @@
       lea         r2,            [r2 + 2 * r4]
       lea         r3,            [r3 + 2 * r5]
 
-      movd        m0,            [r2 + r4]
-      pmovzxbw    m0,            m0
+      pmovzxbw    m0,            [r2 + r4]
       movh        m1,            [r3 + r5]
 
       paddw       m0,            m1


More information about the x265-devel mailing list