[x265] [PATCH] copy_cnt_4 asm code, corrected register uses
praveen at multicorewareinc.com
praveen at multicorewareinc.com
Fri Sep 5 12:05:56 CEST 2014
# HG changeset patch
# User Praveen Tiwari
# Date 1409911542 -19800
# Node ID 59fb3aae2bd7067268ceffd1fb2a9c4aec393f5c
# Parent 1a5956edc730c3f45982e94ecb6694bb613f63f8
copy_cnt_4 asm code: corrected register usage (declare 3 XMM registers instead of 5; zero register is now xm2 instead of xm3)
diff -r 1a5956edc730 -r 59fb3aae2bd7 source/common/x86/blockcopy8.asm
--- a/source/common/x86/blockcopy8.asm Fri Sep 05 15:14:35 2014 +0530
+++ b/source/common/x86/blockcopy8.asm Fri Sep 05 15:35:42 2014 +0530
@@ -3989,9 +3989,9 @@
INIT_YMM avx2
-cglobal copy_cnt_4, 3,3,5
+cglobal copy_cnt_4, 3,3,3
add r2d, r2d
- xorpd xm3, xm3
+ xorpd xm2, xm2
; row 0 & 1
movq xm0, [r1]
@@ -4007,7 +4007,7 @@
vextractf128 xm1, m0, 1
packsswb xm0, xm1
- pcmpeqb xm0, xm3
+ pcmpeqb xm0, xm2
; get count
pmovmskb eax, xm0
More information about the x265-devel mailing list