[x265] [PATCH 075 of 307] x86: revoke some changes in ipfilter8
mythreyi at multicorewareinc.com
mythreyi at multicorewareinc.com
Sat Apr 7 04:31:13 CEST 2018
# HG changeset patch
# User Mythreyi P <mythreyi at multicorewareinc.com>
# Date 1522885678 25200
# Wed Apr 04 16:47:58 2018 -0700
# Node ID 7bdf20f62d02f5714c1332695ffa8c7c6a9d8a5a
# Parent 563b3c4f91eb20374311ed18fb18ad12aeebaf26
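x86: revoke some changes in ipfilter8

Add the tab_ChromaCoeff table to ipfilter8.asm, and rename the table of the
same name in v4-ipfilter8.asm to v4_tab_ChromaCoeff, updating the references
to it in that file.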
diff -r 563b3c4f91eb -r 7bdf20f62d02 source/common/x86/ipfilter8.asm
--- a/source/common/x86/ipfilter8.asm Fri Jul 28 11:43:23 2017 +0530
+++ b/source/common/x86/ipfilter8.asm Wed Apr 04 16:47:58 2018 -0700
@@ -43,6 +43,15 @@
const pd_526336, times 8 dd 8192*64+2048
+const tab_ChromaCoeff, db 0, 64, 0, 0
+ db -2, 58, 10, -2
+ db -4, 54, 16, -2
+ db -6, 46, 28, -4
+ db -4, 36, 36, -4
+ db -4, 28, 46, -6
+ db -2, 16, 54, -4
+ db -2, 10, 58, -2
+
const tab_LumaCoeff, db 0, 0, 0, 64, 0, 0, 0, 0
db -1, 4, -10, 58, 17, -5, 1, 0
db -1, 4, -11, 40, 40, -11, 4, -1
diff -r 563b3c4f91eb -r 7bdf20f62d02 source/common/x86/v4-ipfilter8.asm
--- a/source/common/x86/v4-ipfilter8.asm Fri Jul 28 11:43:23 2017 +0530
+++ b/source/common/x86/v4-ipfilter8.asm Wed Apr 04 16:47:58 2018 -0700
@@ -43,7 +43,7 @@
const v4_interp4_vpp_shuf1, dd 0, 1, 1, 2, 2, 3, 3, 4
dd 2, 3, 3, 4, 4, 5, 5, 6
-const tab_ChromaCoeff, db 0, 64, 0, 0
+const v4_tab_ChromaCoeff, db 0, 64, 0, 0
db -2, 58, 10, -2
db -4, 54, 16, -2
db -6, 46, 28, -4
@@ -1031,8 +1031,8 @@
mova m6, [r5 + r4]
mova m5, [r5 + r4 + 16]
%else
- mova m6, [tab_ChromaCoeff + r4]
- mova m5, [tab_ChromaCoeff + r4 + 16]
+ mova m6, [v4_tab_ChromaCoeff + r4]
+ mova m5, [v4_tab_ChromaCoeff + r4 + 16]
%endif
%ifidn %1,pp
@@ -2114,10 +2114,10 @@
sub r0, r1
%ifdef PIC
- lea r5, [tab_ChromaCoeff]
+ lea r5, [v4_tab_ChromaCoeff]
movd m0, [r5 + r4 * 4]
%else
- movd m0, [tab_ChromaCoeff + r4 * 4]
+ movd m0, [v4_tab_ChromaCoeff + r4 * 4]
%endif
lea r4, [r1 * 3]
lea r5, [r0 + 4 * r1]
@@ -2430,10 +2430,10 @@
sub r0, r1
%ifdef PIC
- lea r5, [tab_ChromaCoeff]
+ lea r5, [v4_tab_ChromaCoeff]
movd m0, [r5 + r4 * 4]
%else
- movd m0, [tab_ChromaCoeff + r4 * 4]
+ movd m0, [v4_tab_ChromaCoeff + r4 * 4]
%endif
pshufb m0, [tab_Cm]
@@ -2515,10 +2515,10 @@
sub r0, r1
%ifdef PIC
- lea r5, [tab_ChromaCoeff]
+ lea r5, [v4_tab_ChromaCoeff]
movd m0, [r5 + r4 * 4]
%else
- movd m0, [tab_ChromaCoeff + r4 * 4]
+ movd m0, [v4_tab_ChromaCoeff + r4 * 4]
%endif
pshufb m0, [tab_Cm]
@@ -2611,10 +2611,10 @@
sub r0, r1
%ifdef PIC
- lea r5, [tab_ChromaCoeff]
+ lea r5, [v4_tab_ChromaCoeff]
movd m0, [r5 + r4 * 4]
%else
- movd m0, [tab_ChromaCoeff + r4 * 4]
+ movd m0, [v4_tab_ChromaCoeff + r4 * 4]
%endif
pshufb m0, [tab_Cm]
@@ -2984,10 +2984,10 @@
sub r0, r1
%ifdef PIC
- lea r5, [tab_ChromaCoeff]
+ lea r5, [v4_tab_ChromaCoeff]
movd m0, [r5 + r4 * 4]
%else
- movd m0, [tab_ChromaCoeff + r4 * 4]
+ movd m0, [v4_tab_ChromaCoeff + r4 * 4]
%endif
pshufb m0, [tab_Cm]
@@ -3180,10 +3180,10 @@
punpcklbw m4, m2, m3
%ifdef PIC
- lea r6, [tab_ChromaCoeff]
+ lea r6, [v4_tab_ChromaCoeff]
movd m5, [r6 + r4 * 4]
%else
- movd m5, [tab_ChromaCoeff + r4 * 4]
+ movd m5, [v4_tab_ChromaCoeff + r4 * 4]
%endif
pshufb m6, m5, [tab_Vm]
@@ -3233,10 +3233,10 @@
add r3d, r3d
%ifdef PIC
- lea r5, [tab_ChromaCoeff]
+ lea r5, [v4_tab_ChromaCoeff]
movd m0, [r5 + r4 * 4]
%else
- movd m0, [tab_ChromaCoeff + r4 * 4]
+ movd m0, [v4_tab_ChromaCoeff + r4 * 4]
%endif
pshufb m0, [tab_Cm]
@@ -3280,10 +3280,10 @@
add r3d, r3d
%ifdef PIC
- lea r5, [tab_ChromaCoeff]
+ lea r5, [v4_tab_ChromaCoeff]
movd m0, [r5 + r4 * 4]
%else
- movd m0, [tab_ChromaCoeff + r4 * 4]
+ movd m0, [v4_tab_ChromaCoeff + r4 * 4]
%endif
pshufb m0, [tab_Cm]
@@ -3355,10 +3355,10 @@
add r3d, r3d
%ifdef PIC
- lea r5, [tab_ChromaCoeff]
+ lea r5, [v4_tab_ChromaCoeff]
movd m0, [r5 + r4 * 4]
%else
- movd m0, [tab_ChromaCoeff + r4 * 4]
+ movd m0, [v4_tab_ChromaCoeff + r4 * 4]
%endif
pshufb m0, [tab_Cm]
@@ -3442,10 +3442,10 @@
add r3d, r3d
%ifdef PIC
- lea r5, [tab_ChromaCoeff]
+ lea r5, [v4_tab_ChromaCoeff]
movd m5, [r5 + r4 * 4]
%else
- movd m5, [tab_ChromaCoeff + r4 * 4]
+ movd m5, [v4_tab_ChromaCoeff + r4 * 4]
%endif
pshufb m6, m5, [tab_Vm]
@@ -3513,10 +3513,10 @@
add r3d, r3d
%ifdef PIC
- lea r5, [tab_ChromaCoeff]
+ lea r5, [v4_tab_ChromaCoeff]
movd m5, [r5 + r4 * 4]
%else
- movd m5, [tab_ChromaCoeff + r4 * 4]
+ movd m5, [v4_tab_ChromaCoeff + r4 * 4]
%endif
pshufb m6, m5, [tab_Vm]
@@ -3605,10 +3605,10 @@
add r3d, r3d
%ifdef PIC
- lea r5, [tab_ChromaCoeff]
+ lea r5, [v4_tab_ChromaCoeff]
movd m5, [r5 + r4 * 4]
%else
- movd m5, [tab_ChromaCoeff + r4 * 4]
+ movd m5, [v4_tab_ChromaCoeff + r4 * 4]
%endif
pshufb m6, m5, [tab_Vm]
@@ -3700,10 +3700,10 @@
add r3d, r3d
%ifdef PIC
- lea r5, [tab_ChromaCoeff]
+ lea r5, [v4_tab_ChromaCoeff]
movd m0, [r5 + r4 * 4]
%else
- movd m0, [tab_ChromaCoeff + r4 * 4]
+ movd m0, [v4_tab_ChromaCoeff + r4 * 4]
%endif
pshufb m1, m0, [tab_Vm]
@@ -3786,10 +3786,10 @@
add r3d, r3d
%ifdef PIC
- lea r5, [tab_ChromaCoeff]
+ lea r5, [v4_tab_ChromaCoeff]
movd m0, [r5 + r4 * 4]
%else
- movd m0, [tab_ChromaCoeff + r4 * 4]
+ movd m0, [v4_tab_ChromaCoeff + r4 * 4]
%endif
pshufb m1, m0, [tab_Vm]
@@ -3877,10 +3877,10 @@
add r3d, r3d
%ifdef PIC
- lea r5, [tab_ChromaCoeff]
+ lea r5, [v4_tab_ChromaCoeff]
movd m0, [r5 + r4 * 4]
%else
- movd m0, [tab_ChromaCoeff + r4 * 4]
+ movd m0, [v4_tab_ChromaCoeff + r4 * 4]
%endif
pshufb m1, m0, [tab_Vm]
@@ -3995,10 +3995,10 @@
add r3d, r3d
%ifdef PIC
- lea r5, [tab_ChromaCoeff]
+ lea r5, [v4_tab_ChromaCoeff]
movd m0, [r5 + r4 * 4]
%else
- movd m0, [tab_ChromaCoeff + r4 * 4]
+ movd m0, [v4_tab_ChromaCoeff + r4 * 4]
%endif
pshufb m1, m0, [tab_Vm]
@@ -4091,10 +4091,10 @@
sub r0, r1
%ifdef PIC
- lea r5, [tab_ChromaCoeff]
+ lea r5, [v4_tab_ChromaCoeff]
movd m5, [r5 + r4 * 4]
%else
- movd m5, [tab_ChromaCoeff + r4 * 4]
+ movd m5, [v4_tab_ChromaCoeff + r4 * 4]
%endif
pshufb m6, m5, [tab_Vm]
@@ -4942,10 +4942,10 @@
sub r0, r1
%ifdef PIC
- lea r5, [tab_ChromaCoeff]
+ lea r5, [v4_tab_ChromaCoeff]
movd m5, [r5 + r4 * 4]
%else
- movd m5, [tab_ChromaCoeff + r4 * 4]
+ movd m5, [v4_tab_ChromaCoeff + r4 * 4]
%endif
pshufb m6, m5, [tab_Vm]
@@ -5040,10 +5040,10 @@
sub r0, r1
%ifdef PIC
- lea r5, [tab_ChromaCoeff]
+ lea r5, [v4_tab_ChromaCoeff]
movd m0, [r5 + r4 * 4]
%else
- movd m0, [tab_ChromaCoeff + r4 * 4]
+ movd m0, [v4_tab_ChromaCoeff + r4 * 4]
%endif
pshufb m1, m0, [tab_Vm]
@@ -5130,10 +5130,10 @@
sub r0, r1
%ifdef PIC
- lea r5, [tab_ChromaCoeff]
+ lea r5, [v4_tab_ChromaCoeff]
movd m0, [r5 + r4 * 4]
%else
- movd m0, [tab_ChromaCoeff + r4 * 4]
+ movd m0, [v4_tab_ChromaCoeff + r4 * 4]
%endif
pshufb m1, m0, [tab_Vm]
@@ -7543,10 +7543,10 @@
sub r0, r1
%ifdef PIC
- lea r5, [tab_ChromaCoeff]
+ lea r5, [v4_tab_ChromaCoeff]
movd m0, [r5 + r4 * 4]
%else
- movd m0, [tab_ChromaCoeff + r4 * 4]
+ movd m0, [v4_tab_ChromaCoeff + r4 * 4]
%endif
pshufb m1, m0, [tab_Vm]
@@ -7666,10 +7666,10 @@
sub r0, r1
%ifdef PIC
- lea r5, [tab_ChromaCoeff]
+ lea r5, [v4_tab_ChromaCoeff]
movd m0, [r5 + r4 * 4]
%else
- movd m0, [tab_ChromaCoeff + r4 * 4]
+ movd m0, [v4_tab_ChromaCoeff + r4 * 4]
%endif
pshufb m1, m0, [tab_Vm]
@@ -8267,10 +8267,10 @@
sub r0, r1
%ifdef PIC
- lea r5, [tab_ChromaCoeff]
+ lea r5, [v4_tab_ChromaCoeff]
movd m0, [r5 + r4 * 4]
%else
- movd m0, [tab_ChromaCoeff + r4 * 4]
+ movd m0, [v4_tab_ChromaCoeff + r4 * 4]
%endif
pshufb m1, m0, [tab_Vm]
@@ -8808,10 +8808,10 @@
add r3d, r3d
%ifdef PIC
- lea r5, [tab_ChromaCoeff]
+ lea r5, [v4_tab_ChromaCoeff]
movd m0, [r5 + r4 * 4]
%else
- movd m0, [tab_ChromaCoeff + r4 * 4]
+ movd m0, [v4_tab_ChromaCoeff + r4 * 4]
%endif
pshufb m1, m0, [tab_Vm]
@@ -8907,10 +8907,10 @@
add r3d, r3d
%ifdef PIC
- lea r5, [tab_ChromaCoeff]
+ lea r5, [v4_tab_ChromaCoeff]
movd m0, [r5 + r4 * 4]
%else
- movd m0, [tab_ChromaCoeff + r4 * 4]
+ movd m0, [v4_tab_ChromaCoeff + r4 * 4]
%endif
pshufb m0, [tab_Cm]
@@ -8981,10 +8981,10 @@
add r3d, r3d
%ifdef PIC
- lea r5, [tab_ChromaCoeff]
+ lea r5, [v4_tab_ChromaCoeff]
movd m0, [r5 + r4 * 4]
%else
- movd m0, [tab_ChromaCoeff + r4 * 4]
+ movd m0, [v4_tab_ChromaCoeff + r4 * 4]
%endif
pshufb m0, [tab_Cm]
More information about the x265-devel mailing list