[FFmpeg-cvslog] dca: ARMv6 optimised decode_blockcode()

Mans Rullgard git at videolan.org
Sat Oct 22 20:47:46 CEST 2011


ffmpeg | branch: master | Mans Rullgard <mans at mansr.com> | Thu Sep 29 22:03:40 2011 +0100| [d4999e0a798cc82db212be67d9edb22f0a7e5847] | committer: Michael Niedermayer

dca: ARMv6 optimised decode_blockcode()

Signed-off-by: Mans Rullgard <mans at mansr.com>
(cherry picked from commit 08e3dea3f7f69309574dafc0af6671615e909720)

Signed-off-by: Michael Niedermayer <michaelni at gmx.at>

> http://git.videolan.org/gitweb.cgi/ffmpeg.git/?a=commit;h=d4999e0a798cc82db212be67d9edb22f0a7e5847
---

 libavcodec/arm/dca.h |   39 +++++++++++++++++++++++++++++++++++++++
 libavcodec/dca.c     |    2 ++
 2 files changed, 41 insertions(+), 0 deletions(-)

diff --git a/libavcodec/arm/dca.h b/libavcodec/arm/dca.h
index 38c8d1f..e85b82c 100644
--- a/libavcodec/arm/dca.h
+++ b/libavcodec/arm/dca.h
@@ -23,6 +23,45 @@
 
 #include <stdint.h>
 #include "config.h"
+#include "libavutil/intmath.h"
+
+#if HAVE_ARMV6 && HAVE_INLINE_ASM
+
+#define decode_blockcode decode_blockcode
+static inline int decode_blockcode(int code, int levels, int *values)
+{
+    int v0, v1, v2, v3;
+
+    __asm__ ("smmul   %4, %8, %11           \n"
+             "smlabb  %8, %4, %10, %8       \n"
+             "smmul   %5, %4, %11           \n"
+             "sub     %8, %8, %9, lsr #1    \n"
+             "smlabb  %4, %5, %10, %4       \n"
+             "smmul   %6, %5, %11           \n"
+             "str     %8, %0                \n"
+             "sub     %4, %4, %9, lsr #1    \n"
+             "smlabb  %5, %6, %10, %5       \n"
+             "smmul   %7, %6, %11           \n"
+             "str     %4, %1                \n"
+             "sub     %5, %5, %9, lsr #1    \n"
+             "smlabb  %6, %7, %10, %6       \n"
+             "cmp     %7, #0                \n"
+             "str     %5, %2                \n"
+             "sub     %6, %6, %9, lsr #1    \n"
+             "it      eq                    \n"
+             "mvneq   %7, #0                \n"
+             "str     %6, %3                \n"
+             : "=m"(values[0]), "=m"(values[1]),
+               "=m"(values[2]), "=m"(values[3]),
+               "=&r"(v0), "=&r"(v1), "=&r"(v2), "=&r"(v3),
+               "+&r"(code)
+             : "r"(levels - 1), "r"(-levels), "r"(ff_inverse[levels])
+             : "cc");
+
+    return v3;
+}
+
+#endif
 
 #if HAVE_NEON && HAVE_INLINE_ASM && HAVE_ASM_MOD_Y
 
diff --git a/libavcodec/dca.c b/libavcodec/dca.c
index d900d88..cdd9161 100644
--- a/libavcodec/dca.c
+++ b/libavcodec/dca.c
@@ -1038,6 +1038,7 @@ static void dca_downmix(float *samples, int srcfmt,
 }
 
 
+#ifndef decode_blockcode
 /* Very compact version of the block code decoder that does not use table
  * look-up but is slightly slower */
 static int decode_blockcode(int code, int levels, int *values)
@@ -1058,6 +1059,7 @@ static int decode_blockcode(int code, int levels, int *values)
         return -1;
     }
 }
+#endif
 
 static const uint8_t abits_sizes[7] = { 7, 10, 12, 13, 15, 17, 19 };
 static const uint8_t abits_levels[7] = { 3, 5, 7, 9, 13, 17, 25 };



More information about the ffmpeg-cvslog mailing list