[x265] [PATCH 304 of 307] Fix SIMD register count for intra_pred_ang modes

mythreyi at multicorewareinc.com mythreyi at multicorewareinc.com
Sat Apr 7 04:35:02 CEST 2018


# HG changeset patch
# User Jayashree
# Date 1516361209 -19800
#      Fri Jan 19 16:56:49 2018 +0530
# Node ID e82bfd58acb99cd4c2e4767b1afdd3750881a68e
# Parent  f56354b2b542aaafa389a226f0fb3b41e4d33803
Fix SIMD register count for intra_pred_ang modes

diff -r f56354b2b542 -r e82bfd58acb9 source/common/x86/intrapred16.asm
--- a/source/common/x86/intrapred16.asm	Wed Jan 17 10:11:09 2018 -0800
+++ b/source/common/x86/intrapred16.asm	Fri Jan 19 16:56:49 2018 +0530
@@ -19236,8 +19236,7 @@
     packusdw        m2, m1
     TRANSPOSE_STORE_AVX2 4, 5, 6, 7, 8, 9, 10, 2, 0, 1, 16
     ret
-
-cglobal intra_pred_ang32_5, 3,8,13
+cglobal intra_pred_ang32_5, 3,8,17
     add         r2,        128
     xor         r6d,       r6d
     lea         r3,        [ang_table_avx2 + 16 * 32]
@@ -19259,11 +19258,9 @@
     vbroadcasti32x8  m15,  [pd_16]
     add         r2,        18
     lea         r0,        [r0 + 32]
-
     call        ang32_mode_5_31
     RET
-
-cglobal intra_pred_ang32_31, 3,7,13
+cglobal intra_pred_ang32_31, 3,7,17
     xor         r6d,       r6d
     inc         r6d
     lea         r3,        [ang_table_avx2 + 16 * 32]
@@ -19285,18 +19282,16 @@
     add         r2,        18
     call        ang32_mode_5_31
     RET
-cglobal intra_pred_ang16_5, 3,7,13
+cglobal intra_pred_ang16_5, 3,7,17
     add         r2,        64
     xor         r6d,       r6d
     vbroadcasti32x8  m15,  [pd_16]
     lea         r3,        [ang_table_avx2 + 16 * 32]
     add         r1d,       r1d
     lea         r4,        [r1 * 3]
-
     call        ang16_mode_5_31
     RET
-
-cglobal intra_pred_ang16_31, 3,7,13
+cglobal intra_pred_ang16_31, 3,7,17
     xor         r6d,       r6d
     inc         r6d
     vbroadcasti32x8  m15,  [pd_16]
@@ -19609,8 +19604,7 @@
     packusdw        m3, m0
     TRANSPOSE_STORE_AVX2 4, 5, 6, 7, 8, 9, 10, 3, 0, 1, 16
     ret
-
-cglobal intra_pred_ang32_4, 3,8,13
+cglobal intra_pred_ang32_4, 3,8,17
     add         r2,        128
     xor         r6d,       r6d
     lea         r3,        [ang_table_avx2 + 18 * 32]
@@ -19632,11 +19626,9 @@
 
     add         r2,        22
     lea         r0,        [r0 + 32]
-
     call        ang32_mode_4_32
     RET
-
-cglobal intra_pred_ang32_32, 3,7,13
+cglobal intra_pred_ang32_32, 3,7,17
     xor         r6d,       r6d
     inc         r6d
     lea         r3,        [ang_table_avx2 + 18 * 32]
@@ -19654,23 +19646,19 @@
     mov         r0,        r5
 
     call        ang16_mode_4_32
-
     add         r2,        22
-
     call        ang32_mode_4_32
     RET
-cglobal intra_pred_ang16_4, 3,7,13
+cglobal intra_pred_ang16_4, 3,7,17
     add         r2,        64
     xor         r6d,       r6d
     vbroadcasti32x8  m15,  [pd_16]
     lea         r3,        [ang_table_avx2 + 18 * 32]
     add         r1d,       r1d
     lea         r4,        [r1 * 3]
-
     call        ang16_mode_4_32
     RET
-
-cglobal intra_pred_ang16_32, 3,7,13
+cglobal intra_pred_ang16_32, 3,7,17
     xor         r6d,       r6d
     inc         r6d
     vbroadcasti32x8  m15,  [pd_16]
@@ -19949,8 +19937,7 @@
     packusdw        m11, m3
     TRANSPOSE_STORE_AVX2 4, 5, 6, 7, 8, 9, 10, 11, 0, 1, 16
     ret
-
-cglobal intra_pred_ang32_6, 3,8,14
+cglobal intra_pred_ang32_6, 3,8,17
     add         r2,        128
     xor         r6d,       r6d
     lea         r3,        [ang_table_avx2 + 15 * 32]
@@ -19972,11 +19959,9 @@
 
     add         r2,        12
     lea         r0,        [r0 + 32]
-
     call        ang32_mode_6_30
     RET
-
-cglobal intra_pred_ang32_30, 3,7,14
+cglobal intra_pred_ang32_30, 3,7,17
     xor         r6d,       r6d
     inc         r6d
     lea         r3,        [ang_table_avx2 + 15 * 32]
@@ -19998,18 +19983,16 @@
     add         r2,        12
     call        ang32_mode_6_30
     RET
-cglobal intra_pred_ang16_6, 3,7,14
+cglobal intra_pred_ang16_6, 3,7,17
     add         r2,        64
     xor         r6d,       r6d
     vbroadcasti32x8  m15,  [pd_16]
     lea         r3,        [ang_table_avx2 + 15 * 32]
     shl         r1d,       1
     lea         r4,        [r1 * 3]
-
     call        ang16_mode_6_30
     RET
-
-cglobal intra_pred_ang16_30, 3,7,14
+cglobal intra_pred_ang16_30, 3,7,17
     xor         r6d,       r6d
     inc         r6d
     vbroadcasti32x8  m15,  [pd_16]


More information about the x265-devel mailing list