[FFmpeg-devel] [PATCH 2/2] pixblockdsp: Use memcpy for get_pixels_16_c
Timothy Gu
timothygu99 at gmail.com
Sun Oct 18 03:05:46 CEST 2015
Before:
15543 decicycles in get_pixels, 4193214 runs, 1090 skips
After:
5713 decicycles in get_pixels, 8387564 runs, 1044 skips
---
libavcodec/pixblockdsp.c | 38 ++++++++++++++++++++++++++++++++-----
libavcodec/pixblockdsp_template.c | 40 ---------------------------------------
2 files changed, 33 insertions(+), 45 deletions(-)
delete mode 100644 libavcodec/pixblockdsp_template.c
diff --git a/libavcodec/pixblockdsp.c b/libavcodec/pixblockdsp.c
index 322e1dd..fc21ea4 100644
--- a/libavcodec/pixblockdsp.c
+++ b/libavcodec/pixblockdsp.c
@@ -23,12 +23,40 @@
#include "avcodec.h"
#include "pixblockdsp.h"
-#define BIT_DEPTH 16
-#include "pixblockdsp_template.c"
-#undef BIT_DEPTH
+static void get_pixels_16_c(int16_t *av_restrict block, const uint8_t *pixels,
+ ptrdiff_t line_size)
+{
+ line_size /= 2;
+
+ memcpy(block , pixels , 2 * 8);
+ memcpy(block + 1 * 8, pixels + 1 * line_size, 2 * 8);
+ memcpy(block + 2 * 8, pixels + 2 * line_size, 2 * 8);
+ memcpy(block + 3 * 8, pixels + 3 * line_size, 2 * 8);
+ memcpy(block + 4 * 8, pixels + 4 * line_size, 2 * 8);
+ memcpy(block + 5 * 8, pixels + 5 * line_size, 2 * 8);
+ memcpy(block + 6 * 8, pixels + 6 * line_size, 2 * 8);
+ memcpy(block + 7 * 8, pixels + 7 * line_size, 2 * 8);
+}
+
+static void get_pixels_8_c(int16_t *av_restrict block, const uint8_t *pixels,
+ ptrdiff_t line_size)
+{
+ int i;
-#define BIT_DEPTH 8
-#include "pixblockdsp_template.c"
+ /* read the pixels */
+ for (i = 0; i < 8; i++) {
+ block[0] = pixels[0];
+ block[1] = pixels[1];
+ block[2] = pixels[2];
+ block[3] = pixels[3];
+ block[4] = pixels[4];
+ block[5] = pixels[5];
+ block[6] = pixels[6];
+ block[7] = pixels[7];
+ pixels += line_size;
+ block += 8;
+ }
+}
static void diff_pixels_c(int16_t *av_restrict block, const uint8_t *s1,
const uint8_t *s2, int stride)
diff --git a/libavcodec/pixblockdsp_template.c b/libavcodec/pixblockdsp_template.c
deleted file mode 100644
index d1e9102..0000000
--- a/libavcodec/pixblockdsp_template.c
+++ /dev/null
@@ -1,40 +0,0 @@
-/*
- * This file is part of FFmpeg.
- *
- * FFmpeg is free software; you can redistribute it and/or
- * modify it under the terms of the GNU Lesser General Public
- * License as published by the Free Software Foundation; either
- * version 2.1 of the License, or (at your option) any later version.
- *
- * FFmpeg is distributed in the hope that it will be useful,
- * but WITHOUT ANY WARRANTY; without even the implied warranty of
- * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
- * Lesser General Public License for more details.
- *
- * You should have received a copy of the GNU Lesser General Public
- * License along with FFmpeg; if not, write to the Free Software
- * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
- */
-
-#include "bit_depth_template.c"
-
-static void FUNCC(get_pixels)(int16_t *av_restrict block, const uint8_t *_pixels,
- ptrdiff_t line_size)
-{
- const pixel *pixels = (const pixel *) _pixels;
- int i;
-
- /* read the pixels */
- for (i = 0; i < 8; i++) {
- block[0] = pixels[0];
- block[1] = pixels[1];
- block[2] = pixels[2];
- block[3] = pixels[3];
- block[4] = pixels[4];
- block[5] = pixels[5];
- block[6] = pixels[6];
- block[7] = pixels[7];
- pixels += line_size / sizeof(pixel);
- block += 8;
- }
-}
--
1.9.1
More information about the ffmpeg-devel
mailing list