[x265] [PATCH] idct4_c: optimization

praveen at multicorewareinc.com praveen at multicorewareinc.com
Fri Nov 21 07:34:10 CET 2014


# HG changeset patch
# User Praveen Tiwari
# Date 1416549139 -19800
# Node ID 2209019a1065b53984b5c0646771f7f48f2368e5
# Parent  d00c6fb1f8c70a5c94808198f4c4e0e317f88351
idct4_c: optimization, pass src directly to partialButterflyInverse4 instead of first copying it into block

diff -r d00c6fb1f8c7 -r 2209019a1065 source/common/dct.cpp
--- a/source/common/dct.cpp	Fri Nov 21 11:06:20 2014 +0530
+++ b/source/common/dct.cpp	Fri Nov 21 11:22:19 2014 +0530
@@ -550,18 +550,7 @@
     ALIGN_VAR_32(int16_t, coef[4 * 4]);
     ALIGN_VAR_32(int16_t, block[4 * 4]);
 
-#define N (4)
-    for (int i = 0; i < N; i++)
-    {
-        for (int j = 0; j < N; j++)
-        {
-            block[i * N + j] = (int16_t)src[i * N + j];
-        }
-    }
-
-#undef N
-
-    partialButterflyInverse4(block, coef, shift_1st, 4); // Forward DST BY FAST ALGORITHM, block input, coef output
+    partialButterflyInverse4(src, coef, shift_1st, 4); // Forward DST BY FAST ALGORITHM, block input, coef output
     partialButterflyInverse4(coef, block, shift_2nd, 4); // Forward DST BY FAST ALGORITHM, coef input, coeff output
 
     for (int i = 0; i < 4; i++)


More information about the x265-devel mailing list