[x265] [PATCH] copy_cnt_4: enable fast non-zero coefficient count path

praveen at multicorewareinc.com praveen at multicorewareinc.com
Tue Sep 9 07:38:17 CEST 2014


# HG changeset patch
# User Praveen Tiwari
# Date 1410241079 -19800
# Node ID 7510b362ca969d850d33b10acb37f3e5a6d6b7dc
# Parent  91e5893dc024ccfcdec04cef5e8832c80632ee0a
copy_cnt_4: enable fast non zero coefficient count path

diff -r 91e5893dc024 -r 7510b362ca96 source/common/x86/blockcopy8.asm
--- a/source/common/x86/blockcopy8.asm	Tue Sep 09 10:46:25 2014 +0530
+++ b/source/common/x86/blockcopy8.asm	Tue Sep 09 11:07:59 2014 +0530
@@ -3973,7 +3973,7 @@
 
     ; get count
     ; CHECK_ME: Intel documents said POPCNT is SSE4.2 instruction, but just implement after Nehalem
-%if 0
+%if 1
     pmovmskb    eax, m0
     not         ax
     popcnt      ax, ax


More information about the x265-devel mailing list