[x265] [PATCH] copy_cnt_4 asm code, corrected register usage

Praveen Tiwari praveen at multicorewareinc.com
Fri Sep 5 12:05:56 CEST 2014


# HG changeset patch
# User Praveen Tiwari
# Date 1409911542 -19800
# Node ID 59fb3aae2bd7067268ceffd1fb2a9c4aec393f5c
# Parent  1a5956edc730c3f45982e94ecb6694bb613f63f8
copy_cnt_4 asm code, corrected register uses

diff -r 1a5956edc730 -r 59fb3aae2bd7 source/common/x86/blockcopy8.asm
--- a/source/common/x86/blockcopy8.asm	Fri Sep 05 15:14:35 2014 +0530
+++ b/source/common/x86/blockcopy8.asm	Fri Sep 05 15:35:42 2014 +0530
@@ -3989,9 +3989,9 @@
 
 
 INIT_YMM avx2
-cglobal copy_cnt_4, 3,3,5
+cglobal copy_cnt_4, 3,3,3
     add         r2d, r2d
-    xorpd       xm3, xm3
+    xorpd       xm2, xm2
 
     ; row 0 & 1
     movq        xm0, [r1]
@@ -4007,7 +4007,7 @@
 
     vextractf128 xm1, m0, 1
     packsswb     xm0, xm1
-    pcmpeqb      xm0, xm3
+    pcmpeqb      xm0, xm2
 
     ; get count
     pmovmskb    eax, xm0


More information about the x265-devel mailing list