[x265] [PATCH 9 of 9] asm-intra_pred_ang16_28: use macro 'INTRA_PRED_ANG16_MC2' to reduce code size

Praveen Tiwari <praveen at multicorewareinc.com>
Tue Mar 17 06:11:10 CET 2015


# HG changeset patch
# User Praveen Tiwari <praveen at multicorewareinc.com>
# Date 1426517062 -19800
# Node ID 2fa6b021a4ae109acd0e7fb24c945767ffaef265
# Parent  78cbbd3e24b223836d5c185b11ca952bb678ebd1
asm-intra_pred_ang16_28: use macro 'INTRA_PRED_ANG16_MC2' to reduce code size

diff -r 78cbbd3e24b2 -r 2fa6b021a4ae source/common/x86/intrapred8.asm
--- a/source/common/x86/intrapred8.asm	Mon Mar 16 20:11:40 2015 +0530
+++ b/source/common/x86/intrapred8.asm	Mon Mar 16 20:14:22 2015 +0530
@@ -10856,36 +10856,23 @@
     lea               r3, [3 * r1]
     lea               r4, [c_ang16_mode_28]
 
-    vbroadcasti128    m1, [r2 + 1]
-    pshufb            m1, m5
-    vbroadcasti128    m2, [r2 + 9]
-    pshufb            m2, m5
-
+    INTRA_PRED_ANG16_MC2 1
     INTRA_PRED_ANG16_MC1 0
 
     lea               r0, [r0 + 4 * r1]
 
     INTRA_PRED_ANG16_MC0 r0, r0 + r1, 2
 
-    vbroadcasti128    m1, [r2 + 2]
-    pshufb            m1, m5
-    vbroadcasti128    m2, [r2 + 10]
-    pshufb            m2, m5
-
+    INTRA_PRED_ANG16_MC2 2
     INTRA_PRED_ANG16_MC0 r0 + 2 * r1, r0 + r3, 3
 
     lea               r0, [r0 + 4 * r1]
     add               r4, 4 * mmsize
 
     INTRA_PRED_ANG16_MC1 0
-
-    vbroadcasti128    m1, [r2 + 3]
-    pshufb            m1, m5
-    vbroadcasti128    m2, [r2 + 11]
-    pshufb            m2, m5
+    INTRA_PRED_ANG16_MC2 3
 
     lea               r0, [r0 + 4 * r1]
-
     INTRA_PRED_ANG16_MC1 2
     RET
 


More information about the x265-devel mailing list