[x264-devel] Fix overflow in ARM NEON i16x16 planar pred
Mans Rullgard
git at videolan.org
Mon Feb 7 06:31:29 CET 2011
x264 | branch: master | Mans Rullgard <mans at mansr.com> | Thu Feb 3 13:32:06 2011 -0800| [aaa7525cc47aa58ae8f03097f2dbbbebaf326f45] | committer: Jason Garrett-Glaser
Fix overflow in ARM NEON i16x16 planar pred
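The old code performed the shift-left-by-2 in 16-bit lanes (vshl.i16) before the widening add, so the intermediate value could overflow 16 bits. The fix widens to 32 bits during the shift (vshll.s16) and then accumulates the original value with a wide add (vaddw.s16).
Patch backported from FFmpeg.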
> http://git.videolan.org/gitweb.cgi/x264.git/?a=commit;h=aaa7525cc47aa58ae8f03097f2dbbbebaf326f45
---
common/arm/predict-a.S | 4 ++--
1 files changed, 2 insertions(+), 2 deletions(-)
diff --git a/common/arm/predict-a.S b/common/arm/predict-a.S
index fbcb8da..574653e 100644
--- a/common/arm/predict-a.S
+++ b/common/arm/predict-a.S
@@ -444,8 +444,8 @@ function x264_predict_16x16_p_neon
vadd.i16 d5, d6, d7
vpadd.i16 d4, d4, d5
vpadd.i16 d4, d4, d4
- vshl.i16 d5, d4, #2
- vaddl.s16 q2, d4, d5
+ vshll.s16 q3, d4, #2
+ vaddw.s16 q2, q3, d4
vrshrn.s32 d4, q2, #6
mov r3, #0
vtrn.16 d4, d5
More information about the x264-devel mailing list