[x265] [PATCH] Enable the idct4 asm routine

nabajit at multicorewareinc.com nabajit at multicorewareinc.com
Wed Nov 27 14:14:34 CET 2013


# HG changeset patch
# User Nabajit Deka
# Date 1385558054 -19800
#      Wed Nov 27 18:44:14 2013 +0530
# Branch stable
# Node ID e0400709b4b18ea159179882b9578adbd415fb6c
# Parent  e4206a37c20f531312013d2a5879f6dbb58c05c5
Enable the idct4 asm routine.

diff -r e4206a37c20f -r e0400709b4b1 source/common/vec/dct-sse3.cpp
--- a/source/common/vec/dct-sse3.cpp	Wed Nov 27 18:38:12 2013 +0530
+++ b/source/common/vec/dct-sse3.cpp	Wed Nov 27 18:44:14 2013 +0530
@@ -1656,7 +1656,6 @@
 void Setup_Vec_DCTPrimitives_sse3(EncoderPrimitives &p)
 {
 #if !HIGH_BIT_DEPTH
-    p.idct[IDCT_4x4] = idct4;
     p.idct[IDCT_8x8] = idct8;
     p.idct[IDCT_16x16] = idct16;
     p.idct[IDCT_32x32] = idct32;
diff -r e4206a37c20f -r e0400709b4b1 source/common/x86/asm-primitives.cpp
--- a/source/common/x86/asm-primitives.cpp	Wed Nov 27 18:38:12 2013 +0530
+++ b/source/common/x86/asm-primitives.cpp	Wed Nov 27 18:44:14 2013 +0530
@@ -564,6 +564,7 @@
         p.ssim_4x4x2_core = x265_pixel_ssim_4x4x2_core_sse2;
         p.ssim_end_4 = x265_pixel_ssim_end4_sse2;
         p.dct[DCT_4x4] = x265_dct4_sse2;
+        p.idct[IDCT_4x4] = x265_idct4_sse2;
     }
     if (cpuMask & X265_CPU_SSSE3)
     {
diff -r e4206a37c20f -r e0400709b4b1 source/common/x86/dct8.h
--- a/source/common/x86/dct8.h	Wed Nov 27 18:38:12 2013 +0530
+++ b/source/common/x86/dct8.h	Wed Nov 27 18:44:14 2013 +0530
@@ -25,5 +25,6 @@
 #define X265_DCT8_H
 
 void x265_dct4_sse2(int16_t *src, int32_t *dst, intptr_t stride);
+void x265_idct4_sse2(int32_t *src, int16_t *dst, intptr_t stride);
 
 #endif // ifndef X265_DCT8_H


More information about the x265-devel mailing list