[FFmpeg-cvslog] x86/vf_w3fdif: use aligned loads in w3fdif_complex_high

James Almer git at videolan.org
Tue Oct 27 05:50:48 CET 2015


ffmpeg | branch: master | James Almer <jamrial at gmail.com> | Tue Oct 27 01:49:22 2015 -0300| [d897d4c12de83e6be9e5d081a024ad5f5c548b34] | committer: James Almer

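x86/vf_w3fdif: use aligned loads in w3fdif_complex_high

The work_line buffer is already written with mova at these same addresses,
so the separate unaligned movu loads are unnecessary; fold them into the
memory operands of paddd instead.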

Found-by: Ronald S. Bultje <rsbultje at gmail.com>
Signed-off-by: James Almer <jamrial at gmail.com>

> http://git.videolan.org/gitweb.cgi/ffmpeg.git/?a=commit;h=d897d4c12de83e6be9e5d081a024ad5f5c548b34
---

 libavfilter/x86/vf_w3fdif.asm |    6 ++----
 1 file changed, 2 insertions(+), 4 deletions(-)

diff --git a/libavfilter/x86/vf_w3fdif.asm b/libavfilter/x86/vf_w3fdif.asm
index fb33f41..c3c73ea 100644
--- a/libavfilter/x86/vf_w3fdif.asm
+++ b/libavfilter/x86/vf_w3fdif.asm
@@ -216,10 +216,8 @@ cglobal w3fdif_complex_high, 5, 13, 10, 0, work_line, in_lines_cur0, in_lines_ad
     pmaddwd                                m9, m4
     paddd                                  m5, m8
     paddd                                  m6, m9
-    movu                                   m8, [work_lineq+offsetq*4]
-    movu                                   m9, [work_lineq+offsetq*4+mmsize]
-    paddd                                  m5, m8
-    paddd                                  m6, m9
+    paddd                                  m5, [work_lineq+offsetq*4]
+    paddd                                  m6, [work_lineq+offsetq*4+mmsize]
     mova               [work_lineq+offsetq*4], m5
     mova        [work_lineq+offsetq*4+mmsize], m6
     add                               offsetq, mmsize/2



More information about the ffmpeg-cvslog mailing list