[FFmpeg-cvslog] dirac: dirac_hpel_filter_v does currently not receive aligned data, thus use unaligned accesses.

Michael Niedermayer git at videolan.org
Sun Oct 30 23:57:39 CET 2011


ffmpeg | branch: master | Michael Niedermayer <michaelni at gmx.at> | Sun Oct 30 23:24:19 2011 +0100| [f0d616e76ff6ebfafe8e3708dabe5dd6b0b71038] | committer: Michael Niedermayer

dirac: dirac_hpel_filter_v does currently not receive aligned data, thus use unaligned accesses.

Signed-off-by: Michael Niedermayer <michaelni at gmx.at>

> http://git.videolan.org/gitweb.cgi/ffmpeg.git/?a=commit;h=f0d616e76ff6ebfafe8e3708dabe5dd6b0b71038
---

 libavcodec/x86/diracdsp_yasm.asm |   10 +++++-----
 1 files changed, 5 insertions(+), 5 deletions(-)

diff --git a/libavcodec/x86/diracdsp_yasm.asm b/libavcodec/x86/diracdsp_yasm.asm
index 666e657..e71da80 100644
--- a/libavcodec/x86/diracdsp_yasm.asm
+++ b/libavcodec/x86/diracdsp_yasm.asm
@@ -51,26 +51,26 @@ cglobal dirac_hpel_filter_v_%1, 4,6,8, dst, src, stride, width, src0, stridex3
     pxor    m7, m7
 .loop:
     ; 7*(src[0] + src[1])
-    UNPACK_ADD m0, m1, [srcq], [srcq + strideq], a,a
+    UNPACK_ADD m0, m1, [srcq], [srcq + strideq], u,u
     pmullw  m0, [pw_7]
     pmullw  m1, [pw_7]
 
     ; 3*( ... + src[-2] + src[3])
-    UNPACK_ADD m2, m3, [src0q + strideq], [srcq + stridex3q], a,a
+    UNPACK_ADD m2, m3, [src0q + strideq], [srcq + stridex3q], u,u
     paddw   m0, m2
     paddw   m1, m3
     pmullw  m0, [pw_3]
     pmullw  m1, [pw_3]
 
     ; ... - 7*(src[-1] + src[2])
-    UNPACK_ADD m2, m3, [src0q + strideq*2], [srcq + strideq*2], a,a
+    UNPACK_ADD m2, m3, [src0q + strideq*2], [srcq + strideq*2], u,u
     pmullw  m2, [pw_7]
     pmullw  m3, [pw_7]
     psubw   m0, m2
     psubw   m1, m3
 
     ; ... - (src[-3] + src[4])
-    UNPACK_ADD m2, m3, [src0q], [srcq + strideq*4], a,a
+    UNPACK_ADD m2, m3, [src0q], [srcq + strideq*4], u,u
     psubw   m0, m2
     psubw   m1, m3
 
@@ -79,7 +79,7 @@ cglobal dirac_hpel_filter_v_%1, 4,6,8, dst, src, stride, width, src0, stridex3
     psraw   m0, 5
     psraw   m1, 5
     packuswb m0, m1
-    mova    [dstq], m0
+    movu    [dstq], m0
     add     dstq, mmsize
     add     srcq, mmsize
     add     src0q, mmsize



More information about the ffmpeg-cvslog mailing list