[FFmpeg-devel] [PATCH V1] lavfi/superfastblur: add superfastblur filter

Tue Nov 12 11:08:04 EET 2019

> 在 2019年11月12日，15:51，Jun Zhao <mypopydev at gmail.com> 写道：
> 
> From: Jun Zhao <barryjzhao at tencent.com>
> 
> add superfastblur filter
> 
> Signed-off-by: Jun Zhao <barryjzhao at tencent.com>
> ---
> doc/filters.texi               |   15 ++
> libavfilter/Makefile           |    1 +
> libavfilter/allfilters.c       |    1 +
> libavfilter/vf_superfastblur.c |  275 ++++++++++++++++++++++++++++++++++++++++
> 4 files changed, 292 insertions(+), 0 deletions(-)
> create mode 100644 libavfilter/vf_superfastblur.c
> 
> diff --git a/doc/filters.texi b/doc/filters.texi
> index 6800124..c7d1893 100644
> --- a/doc/filters.texi
> +++ b/doc/filters.texi
> @@ -17453,6 +17453,21 @@ Interpolate) pixel art scaling algorithm.
> 
> Useful for enlarging pixel art images without reducing sharpness.
> 
> +@section superfastblur
> +
> +Blur the input image with the super fast blur algorithm. Multiple invocations of
> +this filter with a small radius approximate a Gaussian blur quite well.
> +
> +This filter accepts the following options:
> +
> +@table @option
> +@item radius
> +@item r
> +Set the blurring box radius. The option value must be an integer in
> +the range [1, 10] that specifies the blur box size of the superfast blur filter
> +used to blur the image. Default value is @code{2}.
> +@end table
> +
> @section swaprect
> 
> Swap two rectangular objects in video.
> diff --git a/libavfilter/Makefile b/libavfilter/Makefile
> index fce9303..db4d5e6 100644
> --- a/libavfilter/Makefile
> +++ b/libavfilter/Makefile
> @@ -396,6 +396,7 @@ OBJS-$(CONFIG_STEREO3D_FILTER)               += vf_stereo3d.o
> OBJS-$(CONFIG_STREAMSELECT_FILTER)           += f_streamselect.o framesync.o
> OBJS-$(CONFIG_SUBTITLES_FILTER)              += vf_subtitles.o
> OBJS-$(CONFIG_SUPER2XSAI_FILTER)             += vf_super2xsai.o
> +OBJS-$(CONFIG_SUPEREQUALIZER_FILTER)         += vf_superfastblur.o
> OBJS-$(CONFIG_SWAPRECT_FILTER)               += vf_swaprect.o
> OBJS-$(CONFIG_SWAPUV_FILTER)                 += vf_swapuv.o
> OBJS-$(CONFIG_TBLEND_FILTER)                 += vf_blend.o framesync.o
> diff --git a/libavfilter/allfilters.c b/libavfilter/allfilters.c
> index 7c1e19e..d507bc5 100644
> --- a/libavfilter/allfilters.c
> +++ b/libavfilter/allfilters.c
> @@ -377,6 +377,7 @@ extern AVFilter ff_vf_stereo3d;
> extern AVFilter ff_vf_streamselect;
> extern AVFilter ff_vf_subtitles;
> extern AVFilter ff_vf_super2xsai;
> +extern AVFilter ff_vf_superfastblur;
> extern AVFilter ff_vf_swaprect;
> extern AVFilter ff_vf_swapuv;
> extern AVFilter ff_vf_tblend;
> diff --git a/libavfilter/vf_superfastblur.c b/libavfilter/vf_superfastblur.c
> new file mode 100644
> index 0000000..a6428cf
> --- /dev/null
> +++ b/libavfilter/vf_superfastblur.c
> @@ -0,0 +1,275 @@
> +/*
> + * Copyright (c) 2019 Jun Zhao
> + *
> + * This file is part of FFmpeg.
> + *
> + * FFmpeg is free software; you can redistribute it and/or
> + * modify it under the terms of the GNU Lesser General Public
> + * License as published by the Free Software Foundation; either
> + * version 2.1 of the License, or (at your option) any later version.
> + *
> + * FFmpeg is distributed in the hope that it will be useful,
> + * but WITHOUT ANY WARRANTY; without even the implied warranty of
> + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
> + * Lesser General Public License for more details.
> + *
> + * You should have received a copy of the GNU Lesser General Public
> + * License along with FFmpeg; if not, write to the Free Software
> + * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
> + */
> +
> +/**
> + * @file
> + * Super fast blur filter
> + *
> + * @see http://incubator.quasimondo.com/processing/superfast_blur.php
> + */
> +
> +#include "libavutil/avassert.h"
> +#include "libavutil/imgutils.h"
> +#include "libavutil/opt.h"
> +#include "avfilter.h"
> +#include "formats.h"
> +#include "internal.h"
> +#include "video.h"
> +
> +typedef struct SuperFastBlurContext {
> +    const AVClass *class;
> +
> +    int radius;
> +
> +    uint32_t *vMIN;
> +    uint32_t *vMAX;
> +
> +    uint8_t *r;
> +    uint8_t *g;
> +    uint8_t *b;
> +
> +    uint8_t *dv;
> +} SuperFastBlurContext;
> +
> +#define OFFSET(x) offsetof(SuperFastBlurContext, x)
> +#define FLAGS AV_OPT_FLAG_FILTERING_PARAM|AV_OPT_FLAG_VIDEO_PARAM
> +static const AVOption superfastblur_options[] = {
> +    { "radius", "Radius of the super fast blurring box", OFFSET(radius),  AV_OPT_TYPE_INT, {.i64 = 2}, 1, 10, FLAGS },
> +    { "r",      "Radius of the super fast blurring box", OFFSET(radius),  AV_OPT_TYPE_INT, {.i64 = 2}, 1, 10, FLAGS },
> +    { NULL }
> +};
> +
> +AVFILTER_DEFINE_CLASS(superfastblur);
> +
> +static av_cold int init(AVFilterContext *ctx)
> +{
> +    SuperFastBlurContext *s = ctx->priv;
> +
> +    // The code below precalculates a lookup table for all the possible
> +    // mean values that can occur. This is to avoid costly division
> +    // in the inner loop. On some systems doing the division directly
> +    // instead of doing an array lookup might actually be faster
> +    // nowadays.
> +    uint32_t div = 2 * s->radius + 1;
> +    s->dv = av_malloc(sizeof(*s->dv) * 256 * div);
> +    if (!s->dv)
> +        return AVERROR(ENOMEM);
> +    for (int i = 0; i < 256 * div; i++)
> +        s->dv[i] = (i / div);
> +
> +    return 0;
> +}
> +
> +static int query_formats(AVFilterContext *ctx)
> +{
> +    static const enum AVPixelFormat pix_fmts[] = {
> +        AV_PIX_FMT_RGB24, AV_PIX_FMT_BGR24,
> +
> +        AV_PIX_FMT_NONE
Is the empty line above AV_PIX_FMT_NONE needed?
> +    };
> +
> +    AVFilterFormats *fmts_list = ff_make_format_list(pix_fmts);
> +    if (!fmts_list)
> +        return AVERROR(ENOMEM);
> +    return ff_set_common_formats(ctx, fmts_list);
> +}
> +
> +static int config_props(AVFilterLink *inlink)
> +{
> +    AVFilterContext *ctx = inlink->dst;
> +    SuperFastBlurContext *s = ctx->priv;
> +
> +    uint32_t wm = inlink->w - 1;
> +    uint32_t wh = inlink->w * inlink->h;
> +
> +    s->vMIN = av_malloc(sizeof(wm) * FFMAX(inlink->w, inlink->h));
> +    s->vMAX = av_malloc(sizeof(wm) * FFMAX(inlink->w, inlink->h));
> +    s->r = av_malloc(sizeof(*s->r) * wh);
> +    s->g = av_malloc(sizeof(*s->g) * wh);
> +    s->b = av_malloc(sizeof(*s->b) * wh);
> +
> +    if (!s->vMIN || !s->vMAX || !s->r || !s->g || !s->b)
> +        return AVERROR(ENOMEM);
> +
> +    return 0;
> +}
> +
> +/*
> + * Super Fast Blur v1.1+
> + * by Mario Klingemann <http://incubator.quasimondo.com>
> + * Original address: http://incubator.quasimondo.com/processing/superfastblur.pde
> + *
> + * Tip: Multiple invocations of this filter with a small
> + * radius will approximate a gaussian blur quite well.
> + */
> +static void superfast_blur(SuperFastBlurContext *s, uint8_t *pix, int w, int h, int nb_comps)
> +{
> +    uint32_t wm, hm;
> +    uint32_t *vMIN, *vMAX;
> +    uint8_t *r, *g, *b, *dv;
> +    uint32_t rsum, gsum, bsum;
> +    uint32_t p, p1, p2, yi, yw;
> +
> +    int radius;
> +
> +    int x, y, i, yp;
> +
> +    wm = w - 1;
> +    hm = h - 1;
> +
> +    vMIN = s->vMIN;
> +    vMAX = s->vMAX;
> +    r = s->r;
> +    g = s->g;
> +    b = s->b;
> +
> +    dv = s->dv;
> +
> +    radius = s->radius;
> +
> +    yw = yi = 0;
> +    for (y = 0; y < h; y++) {
> +        rsum = gsum = bsum = 0;
> +        // The reason why this algorithm is fast is that it uses a sliding
> +        // window and thus reduces the number of required pixel lookups.
> +        // The window slides from the left edge to the right (and in the
> +        // second pass from top to bottom) and only adds one pixel at the
> +        // right and removes one from the left. The loop below initializes
> +        // the window by prefilling the window with the leftmost edge pixel
> +        // depending on the kernel size.
> +        for (i = -radius; i <= radius; i++) {
> +            p = (yi + FFMIN(wm, FFMAX(i, 0))) * nb_comps;
> +            rsum += pix[p];
> +            gsum += pix[p + 1];
> +            bsum += pix[p + 2];
> +        }
> +
> +        for (x = 0; x < w; x++) {
> +            r[yi] = dv[rsum];
> +            g[yi] = dv[gsum];
> +            b[yi] = dv[bsum];
> +
> +            // adds a new pixel but at the same time handles the border
> +            // conditions (when the window tries to read or remove pixels
> +            // outside the bitmap).
> +            if (y == 0) {
> +                vMIN[x] = FFMIN(x + radius + 1, wm);
> +                vMAX[x] = FFMAX(x - radius, 0);
> +            }
> +            p1 = (yw + vMIN[x]) * nb_comps;
> +            p2 = (yw + vMAX[x]) * nb_comps;
> +            rsum += pix[p1]     - pix[p2];
> +            gsum += pix[p1 + 1] - pix[p2 + 1];
> +            bsum += pix[p1 + 2] - pix[p2 + 2];
> +            yi++;
> +        }
> +        yw += w;
> +    }
> +
> +    for (x = 0; x < w; x++) {
> +        rsum = gsum = bsum = 0;
> +        yp = -radius * w;
> +        for (i = -radius; i <= radius; i++) {
> +            yi = FFMAX(0, yp) + x;
> +            rsum += r[yi];
> +            gsum += g[yi];
> +            bsum += b[yi];
> +            yp += w;
> +        }
> +
> +        yi = x;
> +        for (y = 0; y < h; y++) {
> +            pix[yi * nb_comps]     = dv[bsum];
> +            pix[yi * nb_comps + 1] = dv[gsum];
> +            pix[yi * nb_comps + 2] = dv[rsum];
> +
> +            if (x == 0) {
> +                vMIN[y] = FFMIN(y + radius + 1, hm) * w;
> +                vMAX[y] = FFMAX(y - radius, 0) * w;
> +            }
> +            p1 = x + vMIN[y];
> +            p2 = x + vMAX[y];
> +
> +            // rsum, gsum and bsum are the accumulated sums of pixels inside
> +            // the sliding window. What you see is the new pixel on the
> +            // right side being added to the sum and the leftmost pixel
> +            // in the window being removed from the sum.
> +            rsum += r[p1] - r[p2];
> +            gsum += g[p1] - g[p2];
> +            bsum += b[p1] - b[p2];
> +            yi += w;
> +        }
> +    }
> +}
> +
> +static int filter_frame(AVFilterLink *inlink, AVFrame *in)
> +{
> +    AVFilterContext *ctx = inlink->dst;
> +    SuperFastBlurContext *s = ctx->priv;
> +    AVFilterLink *outlink = ctx->outputs[0];
> +    const AVPixFmtDescriptor *desc = av_pix_fmt_desc_get(inlink->format);
> +
> +    superfast_blur(s, in->data[0], inlink->w, inlink->h, desc->nb_components);
> +
> +    return ff_filter_frame(outlink, in);
> +}
> +
> +static av_cold void uninit(AVFilterContext *ctx)
> +{
> +    SuperFastBlurContext *s = ctx->priv;
> +
> +    av_freep(&s->r);
> +    av_freep(&s->g);
> +    av_freep(&s->b);
> +    av_freep(&s->vMIN);
> +    av_freep(&s->vMAX);
> +    av_freep(&s->dv);
> +}
> +
> +static const AVFilterPad superfastblur_inputs[] = {
> +    {
> +        .name         = "default",
> +        .type         = AVMEDIA_TYPE_VIDEO,
> +        .config_props = config_props,
> +        .filter_frame = filter_frame,
> +    },
> +    { NULL }
> +};
> +
> +static const AVFilterPad superfastblur_outputs[] = {
> +    {
> +        .name = "default",
> +        .type = AVMEDIA_TYPE_VIDEO,
> +    },
> +    { NULL }
> +};
> +
> +AVFilter ff_vf_superfastblur = {
> +    .name          = "superfastblur",
> +    .description   = NULL_IF_CONFIG_SMALL("Blur the input with super fast blur algorithm."),
> +    .priv_size     = sizeof(SuperFastBlurContext),
> +    .init          = init,
> +    .uninit        = uninit,
> +    .query_formats = query_formats,
> +    .inputs        = superfastblur_inputs,
> +    .outputs       = superfastblur_outputs,
> +    .priv_class    = &superfastblur_class,
> +    .flags         = AVFILTER_FLAG_SUPPORT_TIMELINE_GENERIC,
> +};
> -- 
> 1.7.1
> 
> _______________________________________________
> ffmpeg-devel mailing list
> ffmpeg-devel at ffmpeg.org
> https://ffmpeg.org/mailman/listinfo/ffmpeg-devel
> 
> To unsubscribe, visit link above, or email
> ffmpeg-devel-request at ffmpeg.org with subject "unsubscribe".

LGTM
BTW, I saw that you usually submit multi-threading performance optimizations for other filters.
Why don't you do that for this filter at the same time?
I think it may be better to have a single patch that completes the whole operation.

Thanks
Steven