[x265] [PATCH 157 of 307] dct8: cleanup redundant data movement
mythreyi at multicorewareinc.com
mythreyi at multicorewareinc.com
Sat Apr 7 04:32:35 CEST 2018
# HG changeset patch
# User Praveen Tiwari <praveen at multicorewareinc.com>
# Date 1510557478 28800
# Sun Nov 12 23:17:58 2017 -0800
# Node ID 4b01781203a4e7a08cee94346f52a24ac78a3478
# Parent 94523acd49e4b021384036a43a308cbc30cb4766
dct8: cleanup redundant data movement
diff -r 94523acd49e4 -r 4b01781203a4 source/common/x86/dct8.asm
--- a/source/common/x86/dct8.asm Mon Oct 30 15:54:11 2017 +0530
+++ b/source/common/x86/dct8.asm Sun Nov 12 23:17:58 2017 -0800
@@ -2319,7 +2319,7 @@
vpaddd m%2, m5
vpsrad m%2, DCT8_SHIFT1
vpackssdw m%2, m%2
- vpermq m%2, m1, m%2
+ vpermq m%2, m19, m%2
%endmacro
%macro DCT8_AVX512_PASS_2 4
@@ -2422,7 +2422,6 @@
vpshufb m0, m4
vpaddw m3, m2, m0
vpsubw m2, m0
- mova m1, [dct8_shuf6_AVX512]
; Load all the coefficients together for better caching
vpbroadcastq m20, [r6 + 0 * 8]
More information about the x265-devel
mailing list