[FFmpeg-devel] [PATCH] pixblockdsp: Use memcpy for get_pixels_16_c

Ganesh Ajjanagadde gajjanag at mit.edu
Tue Oct 20 22:41:24 CEST 2015


On Tue, Oct 20, 2015 at 4:20 PM, Timothy Gu <timothygu99 at gmail.com> wrote:
> Before:
>   15543 decicycles in get_pixels, 4193214 runs,   1090 skips
> After:
>    5713 decicycles in get_pixels, 8387564 runs,   1044 skips
> ---
>  libavcodec/pixblockdsp.c          | 36 ++++++++++++++++++++++++++++++-----
>  libavcodec/pixblockdsp_template.c | 40 ---------------------------------------
>  2 files changed, 31 insertions(+), 45 deletions(-)
>  delete mode 100644 libavcodec/pixblockdsp_template.c
>
> diff --git a/libavcodec/pixblockdsp.c b/libavcodec/pixblockdsp.c
> index 322e1dd..0f23d8a 100644
> --- a/libavcodec/pixblockdsp.c
> +++ b/libavcodec/pixblockdsp.c
> @@ -23,12 +23,38 @@
>  #include "avcodec.h"
>  #include "pixblockdsp.h"
>
> -#define BIT_DEPTH 16
> -#include "pixblockdsp_template.c"
> -#undef BIT_DEPTH
> +static void get_pixels_16_c(int16_t *av_restrict block, const uint8_t *pixels,
> +                            ptrdiff_t line_size)
> +{
> +    memcpy(block + 0 * 8, pixels + 0 * line_size, sizeof(int16_t) * 8);
> +    memcpy(block + 1 * 8, pixels + 1 * line_size, sizeof(int16_t) * 8);
> +    memcpy(block + 2 * 8, pixels + 2 * line_size, sizeof(int16_t) * 8);
> +    memcpy(block + 3 * 8, pixels + 3 * line_size, sizeof(int16_t) * 8);
> +    memcpy(block + 4 * 8, pixels + 4 * line_size, sizeof(int16_t) * 8);
> +    memcpy(block + 5 * 8, pixels + 5 * line_size, sizeof(int16_t) * 8);
> +    memcpy(block + 6 * 8, pixels + 6 * line_size, sizeof(int16_t) * 8);
> +    memcpy(block + 7 * 8, pixels + 7 * line_size, sizeof(int16_t) * 8);
> +}
> +
> +static void get_pixels_8_c(int16_t *av_restrict block, const uint8_t *pixels,
> +                           ptrdiff_t line_size)
> +{
> +    int i;
>
> -#define BIT_DEPTH 8
> -#include "pixblockdsp_template.c"
> +    /* read the pixels */
> +    for (i = 0; i < 8; i++) {
> +        block[0] = pixels[0];
> +        block[1] = pixels[1];
> +        block[2] = pixels[2];
> +        block[3] = pixels[3];
> +        block[4] = pixels[4];
> +        block[5] = pixels[5];
> +        block[6] = pixels[6];
> +        block[7] = pixels[7];
> +        pixels  += line_size;
> +        block   += 8;
> +    }
> +}

Out of curiosity: do you get gains for get_pixels_8_c as well? I am
surprised to see that, even with the restrict keyword, the compiler
does not optimize the assignments within the loop into some sort of
block assignment (which I assume is what memcpy is doing).

>
>  static void diff_pixels_c(int16_t *av_restrict block, const uint8_t *s1,
>                            const uint8_t *s2, int stride)
> diff --git a/libavcodec/pixblockdsp_template.c b/libavcodec/pixblockdsp_template.c
> deleted file mode 100644
> index d1e9102..0000000
> --- a/libavcodec/pixblockdsp_template.c
> +++ /dev/null
> @@ -1,40 +0,0 @@
> -/*
> - * This file is part of FFmpeg.
> - *
> - * FFmpeg is free software; you can redistribute it and/or
> - * modify it under the terms of the GNU Lesser General Public
> - * License as published by the Free Software Foundation; either
> - * version 2.1 of the License, or (at your option) any later version.
> - *
> - * FFmpeg is distributed in the hope that it will be useful,
> - * but WITHOUT ANY WARRANTY; without even the implied warranty of
> - * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
> - * Lesser General Public License for more details.
> - *
> - * You should have received a copy of the GNU Lesser General Public
> - * License along with FFmpeg; if not, write to the Free Software
> - * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
> - */
> -
> -#include "bit_depth_template.c"
> -
> -static void FUNCC(get_pixels)(int16_t *av_restrict block, const uint8_t *_pixels,
> -                              ptrdiff_t line_size)
> -{
> -    const pixel *pixels = (const pixel *) _pixels;
> -    int i;
> -
> -    /* read the pixels */
> -    for (i = 0; i < 8; i++) {
> -        block[0] = pixels[0];
> -        block[1] = pixels[1];
> -        block[2] = pixels[2];
> -        block[3] = pixels[3];
> -        block[4] = pixels[4];
> -        block[5] = pixels[5];
> -        block[6] = pixels[6];
> -        block[7] = pixels[7];
> -        pixels  += line_size / sizeof(pixel);
> -        block   += 8;
> -    }
> -}
> --
> 1.9.1
>
> _______________________________________________
> ffmpeg-devel mailing list
> ffmpeg-devel at ffmpeg.org
> http://ffmpeg.org/mailman/listinfo/ffmpeg-devel


More information about the ffmpeg-devel mailing list