[FFmpeg-devel] [PATCH 4/4] x86/hevc_deblock: use movhps instead of shuffling values

James Almer jamrial at gmail.com
Sat May 17 02:59:06 CEST 2014


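movhps stores the upper 64 bits of an xmm register directly to memory, so
the punpckhqdq/pshufd that moved the high half into the low half before
each movq store is no longer needed.

Signed-off-by: James Almer <jamrial at gmail.com>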
---
 libavcodec/x86/hevc_deblock.asm | 24 ++++++++----------------
 1 file changed, 8 insertions(+), 16 deletions(-)

diff --git a/libavcodec/x86/hevc_deblock.asm b/libavcodec/x86/hevc_deblock.asm
index 72f78ac..1522d5e 100644
--- a/libavcodec/x86/hevc_deblock.asm
+++ b/libavcodec/x86/hevc_deblock.asm
@@ -145,21 +145,17 @@ INIT_XMM sse2
     punpckldq        m0, m2
 
     movq             %1, m0
-    punpckhqdq       m0, m0
-    movq             %2, m0
+    movhps           %2, m0
     movq             %3, m6
-    punpckhqdq       m6, m6
-    movq             %4, m6
+    movhps           %4, m6
 
     punpckhdq        m6, m4, m5
     punpckldq        m4, m5
 
     movq             %5, m4
-    punpckhqdq       m4, m4
-    movq             %6, m4
+    movhps           %6, m4
     movq             %7, m6
-    punpckhqdq       m6, m6
-    movq             %8, m6
+    movhps           %8, m6
 %endmacro
 
 ; in: 8 rows of 8 bytes in %1..%8
@@ -237,17 +233,13 @@ INIT_XMM sse2
     punpckldq       m11, m8, m9;  4, 5
     punpckhdq        m8, m9;   6, 7
     movq             %1, m0
-    pshufd           m0, m0, 0x4E
-    movq             %2, m0
+    movhps           %2, m0
     movq             %3, m10
-    pshufd           m10, m10, 0x4E
-    movq             %4, m10
+    movhps           %4, m10
     movq             %5, m11
-    pshufd          m11, m11, 0x4E
-    movq             %6, m11
+    movhps           %6, m11
     movq             %7, m8
-    pshufd           m8, m8, 0x4E
-    movq             %8, m8
+    movhps           %8, m8
 %endmacro
 
 ; in: 8 rows of 8 words in %1..%8
-- 
1.8.5.5



More information about the ffmpeg-devel mailing list