[FFmpeg-devel] [PATCH] avfilter/vf_yaepblur: add yaepblur filter

Tao Zhang nowerzt at gmail.com
Tue Dec 3 11:26:26 EET 2019


ping:)

leozhang <leozhang at qiyi.com> 于2019年11月25日周一 下午5:53写道:
>
> Signed-off-by: leozhang <leozhang at qiyi.com>
> ---
> This filter blurs the input while preserving edges, and uses slice threading for speed.
> My test speed is about 100fps on 1080p video with 16 threads, on my test machine whose CPU is an E5-2660 v4 2.0GHz.
> I guess that an i7-9700K 3.6GHz would run even faster.
> The test command is
> ffmpeg -s 1920x1080 -r 30 -i your_test_file.yuv -filter_threads 16 -vf yaepblur -f null -
>
>  doc/filters.texi          |  22 +++
>  libavfilter/Makefile      |   1 +
>  libavfilter/allfilters.c  |   1 +
>  libavfilter/vf_yaepblur.c | 349 ++++++++++++++++++++++++++++++++++++++++++++++
>  4 files changed, 373 insertions(+)
>  create mode 100644 libavfilter/vf_yaepblur.c
>
> diff --git a/doc/filters.texi b/doc/filters.texi
> index c04421b..61e93d5 100644
> --- a/doc/filters.texi
> +++ b/doc/filters.texi
> @@ -19775,6 +19775,28 @@ Only deinterlace frames marked as interlaced.
>  The default value is @code{all}.
>  @end table
>
> +@section yaepblur
> +
> +Apply blur filter while preserving edges ("yaepblur" means "yet another edge preserving blur filter").
> +The algorithm is described in
> +"J. S. Lee, Digital image enhancement and noise filtering by use of local statistics, IEEE Trans. Pattern Anal. Mach. Intell. PAMI-2, 1980."
> +
> +It accepts the following parameters:
> +
> +@table @option
> +@item radius, r
> +Set the window radius. Default value is 3.
> +
> +@item planes, p
> +Set which planes to filter. Default is only the first plane.
> +
> +@item sigma, s
> +Set blur strength. Default value is 128.
> +@end table
> +
> +@subsection Commands
> +This filter supports the same @ref{commands} as options.
> +
>  @section zoompan
>
>  Apply Zoom & Pan effect.
> diff --git a/libavfilter/Makefile b/libavfilter/Makefile
> index 6838d5c..b490a44 100644
> --- a/libavfilter/Makefile
> +++ b/libavfilter/Makefile
> @@ -442,6 +442,7 @@ OBJS-$(CONFIG_XSTACK_FILTER)                 += vf_stack.o framesync.o
>  OBJS-$(CONFIG_YADIF_FILTER)                  += vf_yadif.o yadif_common.o
>  OBJS-$(CONFIG_YADIF_CUDA_FILTER)             += vf_yadif_cuda.o vf_yadif_cuda.ptx.o \
>                                                  yadif_common.o
> +OBJS-$(CONFIG_YAEPBLUR_FILTER)               += vf_yaepblur.o
>  OBJS-$(CONFIG_ZMQ_FILTER)                    += f_zmq.o
>  OBJS-$(CONFIG_ZOOMPAN_FILTER)                += vf_zoompan.o
>  OBJS-$(CONFIG_ZSCALE_FILTER)                 += vf_zscale.o
> diff --git a/libavfilter/allfilters.c b/libavfilter/allfilters.c
> index 7c1e19e..8f41186 100644
> --- a/libavfilter/allfilters.c
> +++ b/libavfilter/allfilters.c
> @@ -420,6 +420,7 @@ extern AVFilter ff_vf_xmedian;
>  extern AVFilter ff_vf_xstack;
>  extern AVFilter ff_vf_yadif;
>  extern AVFilter ff_vf_yadif_cuda;
> +extern AVFilter ff_vf_yaepblur;
>  extern AVFilter ff_vf_zmq;
>  extern AVFilter ff_vf_zoompan;
>  extern AVFilter ff_vf_zscale;
> diff --git a/libavfilter/vf_yaepblur.c b/libavfilter/vf_yaepblur.c
> new file mode 100644
> index 0000000..ef6fbc9
> --- /dev/null
> +++ b/libavfilter/vf_yaepblur.c
> @@ -0,0 +1,349 @@
> +/*
> + * Copyright (C) 2019 Leo Zhang <leozhang at qiyi.com>
> +
> + * This file is part of FFmpeg.
> + *
> + * FFmpeg is free software; you can redistribute it and/or
> + * modify it under the terms of the GNU Lesser General Public
> + * License as published by the Free Software Foundation; either
> + * version 2.1 of the License, or (at your option) any later version.
> + *
> + * FFmpeg is distributed in the hope that it will be useful,
> + * but WITHOUT ANY WARRANTY; without even the implied warranty of
> + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
> + * Lesser General Public License for more details.
> + *
> + * You should have received a copy of the GNU Lesser General Public
> + * License along with FFmpeg; if not, write to the Free Software
> + * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
> + */
> +
> +/**
> + * @file
> + * yaep(yet another edge preserving) blur filter
> + *
> + * This implementation is based on an algorithm described in
> + * "J. S. Lee, Digital image enhancement and noise filtering by use of local statistics, IEEE Trans. Pattern
> + * Anal. Mach. Intell. PAMI-2, 1980."
> + */
> +
> +#include "libavutil/opt.h"
> +#include "libavutil/imgutils.h"
> +#include "avfilter.h"
> +#include "internal.h"
> +
> +typedef struct YAEPContext { /* private context of the yaepblur filter */
> +    const AVClass *class; ///< class of this context; the filter sets priv_class to yaep_class
> +
> +    int planes;           ///< "planes" option: bit N set means plane N is filtered
> +    int radius;           ///< "radius" option: window radius, limited in config_input()
> +    int sigma;            ///< "sigma" option: blur strength
> +
> +    int nb_planes;        ///< number of planes of the input pixel format
> +    int planewidth[4];    ///< width of each plane, in samples
> +    int planeheight[4];   ///< height of each plane, in rows
> +    int depth;            ///< bit depth of the first component
> +
> +    uint64_t *sat;        ///< summed area table
> +    uint64_t *square_sat; ///< square summed area table
> +    int sat_linesize;     ///< elements per table row: input width + 1
> +
> +    int (*pre_calculate_row)(AVFilterContext *ctx, void *arg, int jobnr, int nb_jobs); ///< row prefix-sum job for the sample size
> +    int (*filter_slice     )(AVFilterContext *ctx, void *arg, int jobnr, int nb_jobs); ///< filtering job for the sample size
> +} YAEPContext;
> +
> +static av_cold void uninit(AVFilterContext *ctx)
> +{   /* Release both summed area tables held by the private context. */
> +    YAEPContext *s = ctx->priv;
> +    av_freep(&s->sat);
> +    av_freep(&s->square_sat);
> +}
> +
> +static int query_formats(AVFilterContext *ctx)
> +{   /* Declare the planar YUV(A), GBR(A) and gray formats, 8 to 16 bits deep, that are accepted. */
> +    static const enum AVPixelFormat pix_fmts[] = {
> +        AV_PIX_FMT_YUVA444P, AV_PIX_FMT_YUV444P, AV_PIX_FMT_YUV440P,
> +        AV_PIX_FMT_YUVJ444P, AV_PIX_FMT_YUVJ440P,
> +        AV_PIX_FMT_YUVA422P, AV_PIX_FMT_YUV422P, AV_PIX_FMT_YUVA420P, AV_PIX_FMT_YUV420P,
> +        AV_PIX_FMT_YUVJ422P, AV_PIX_FMT_YUVJ420P,
> +        AV_PIX_FMT_YUVJ411P, AV_PIX_FMT_YUV411P, AV_PIX_FMT_YUV410P,
> +        AV_PIX_FMT_YUV420P9, AV_PIX_FMT_YUV422P9, AV_PIX_FMT_YUV444P9,
> +        AV_PIX_FMT_YUV420P10, AV_PIX_FMT_YUV422P10, AV_PIX_FMT_YUV444P10,
> +        AV_PIX_FMT_YUV420P12, AV_PIX_FMT_YUV422P12, AV_PIX_FMT_YUV444P12, AV_PIX_FMT_YUV440P12,
> +        AV_PIX_FMT_YUV420P14, AV_PIX_FMT_YUV422P14, AV_PIX_FMT_YUV444P14,
> +        AV_PIX_FMT_YUV420P16, AV_PIX_FMT_YUV422P16, AV_PIX_FMT_YUV444P16,
> +        AV_PIX_FMT_YUVA420P9, AV_PIX_FMT_YUVA422P9, AV_PIX_FMT_YUVA444P9,
> +        AV_PIX_FMT_YUVA420P10, AV_PIX_FMT_YUVA422P10, AV_PIX_FMT_YUVA444P10,
> +        AV_PIX_FMT_YUVA422P12, AV_PIX_FMT_YUVA444P12,
> +        AV_PIX_FMT_YUVA420P16, AV_PIX_FMT_YUVA422P16, AV_PIX_FMT_YUVA444P16,
> +        AV_PIX_FMT_GBRP, AV_PIX_FMT_GBRP9, AV_PIX_FMT_GBRP10,
> +        AV_PIX_FMT_GBRP12, AV_PIX_FMT_GBRP14, AV_PIX_FMT_GBRP16,
> +        AV_PIX_FMT_GBRAP, AV_PIX_FMT_GBRAP10, AV_PIX_FMT_GBRAP12, AV_PIX_FMT_GBRAP16,
> +        AV_PIX_FMT_GRAY8, AV_PIX_FMT_GRAY9, AV_PIX_FMT_GRAY10, AV_PIX_FMT_GRAY12, AV_PIX_FMT_GRAY14, AV_PIX_FMT_GRAY16,
> +        AV_PIX_FMT_NONE /* terminates the list */
> +    };
> +    /* Wrap the array in a format list and hand it to ff_set_common_formats(), returning its result. */
> +    return ff_set_common_formats(ctx, ff_make_format_list(pix_fmts));
> +}
> +
> +typedef struct ThreadData { /* per-plane arguments passed to the threaded jobs */
> +    int width;        /* plane width, in samples */
> +    int height;       /* plane height, in rows */
> +    int src_linesize; /* input stride; the jobs divide it by the sample size */
> +    int dst_linesize; /* output stride; the jobs divide it by the sample size */
> +    uint8_t *src;     /* input plane data */
> +    uint8_t *dst;     /* output plane data; may be the same buffer as src */
> +} ThreadData;
> +
> +#define PRE_CALCULATE_ROW(type, name)                                    \
> +static int pre_calculate_row_##name(AVFilterContext *ctx, void *arg,     \
> +                                   int jobnr, int nb_jobs)               \
> +{   /* Per-row prefix sums of samples and of squared samples. */         \
> +    ThreadData *td = arg;                                                \
> +    YAEPContext *s = ctx->priv;                                          \
> +    /* src_linesize is divided by the sample size to step in samples. */ \
> +    const int width        = td->width;                                  \
> +    const int height       = td->height;                                 \
> +    const int linesize     = td->src_linesize / sizeof(type);            \
> +    const int sat_linesize = s->sat_linesize;                            \
> +    /* Rows [starty, endy) are the share of this job. */                 \
> +    const int starty = height * jobnr     / nb_jobs;                     \
> +    const int endy   = height * (jobnr+1) / nb_jobs;                     \
> +    /* The "+ 1" skips the zero padding row at the top of the tables. */ \
> +    uint64_t *sat        = s->sat + (starty + 1) * sat_linesize;         \
> +    uint64_t *square_sat = s->square_sat + (starty + 1) * sat_linesize;  \
> +    const type *src      = (const type *)td->src + starty * linesize;    \
> +                                                                         \
> +    int x, y;                                                            \
> +    /* sat[x+1] = sum of src[0..x]; sat[0] is the left padding. */       \
> +    for (y = starty; y < endy; y++) {                                    \
> +        for (x = 0; x < width; x++) {                                    \
> +            sat[x+1]        = sat[x] + src[x];                           \
> +            square_sat[x+1] = square_sat[x] + (uint64_t)src[x] * src[x]; \
> +        }                                                                \
> +        sat               += sat_linesize;                               \
> +        square_sat        += sat_linesize;                               \
> +        src               += linesize;                                   \
> +    }                                                                    \
> +                                                                         \
> +    return 0;                                                            \
> +}
> +
> +PRE_CALCULATE_ROW(uint8_t,  byte) /* pre_calculate_row_byte: selected for depth <= 8 */
> +PRE_CALCULATE_ROW(uint16_t, word) /* pre_calculate_row_word: selected for depth > 8 */
> +
> +static int pre_calculate_col(AVFilterContext *ctx, void *arg,
> +                             int jobnr, int nb_jobs)
> +{   /* Accumulate the row prefix sums down each column, completing both summed area tables. */
> +    ThreadData *td = arg;
> +    YAEPContext *s = ctx->priv;
> +
> +    const int width        = td->width;
> +    const int height       = td->height;
> +    const int sat_linesize = s->sat_linesize;
> +    /* Columns [startx, endx) are the share of this job. */
> +    const int startx = width * jobnr       / nb_jobs;
> +    const int endx   = width * (jobnr + 1) / nb_jobs;
> +
> +    uint64_t *sat, *square_sat;
> +    int x, y;
> +    /* Start in padding row 0 at table column x + 1, then add every row into the row below it. */
> +    for (x = startx; x < endx; x++) {
> +        sat = s->sat + x + 1;
> +        square_sat = s->square_sat + x + 1;
> +        for (y = 0; y < height; y++) {
> +            *(sat+sat_linesize)        += *sat;
> +            *(square_sat+sat_linesize) += *square_sat;
> +            sat         += sat_linesize;
> +            square_sat  += sat_linesize;
> +        }
> +    }
> +
> +    return 0;
> +}
> +
> +#define FILTER_SLICE(type, name)                                                                          \
> +static int filter_slice_##name(AVFilterContext *ctx, void *arg, int jobnr, int nb_jobs)                   \
> +{   /* Lee filter: dst = (sigma * mean + var * src) / (sigma + var) over a clipped square window. */      \
> +    ThreadData *td = arg;                                                                                 \
> +    YAEPContext *s = ctx->priv;                                                                           \
> +    /* NOTE(review): sum * sum below can exceed 64 bits for 16-bit input once radius > 127 - confirm. */  \
> +    const int width = td->width;                                                                          \
> +    const int height = td->height;                                                                        \
> +    const int src_linesize = td->src_linesize / sizeof(type);                                             \
> +    const int dst_linesize = td->dst_linesize / sizeof(type);                                             \
> +    const int sat_linesize = s->sat_linesize;                                                             \
> +    const int sigma = s->sigma;                                                                           \
> +    const int radius = FFMIN(s->radius, FFMAX(width, height)); /* avoid int overflow in x + radius + 1 */ \
> +    /* A radius beyond the plane size selects the whole plane anyway, so the clamp keeps results. */      \
> +    uint64_t *sat = s->sat;                                                                               \
> +    uint64_t *square_sat = s->square_sat;                                                                 \
> +    const type *src = (const type *)td->src;                                                              \
> +    type *dst = (type *)td->dst;                                                                          \
> +    /* Rows [starty, endy) are the share of this job. */                                                  \
> +    const int starty = height * jobnr       / nb_jobs;                                                    \
> +    const int endy   = height * (jobnr + 1) / nb_jobs;                                                    \
> +                                                                                                          \
> +    int x, y;                                                                                             \
> +    int lower_x, higher_x;                                                                                \
> +    int lower_y, higher_y;                                                                                \
> +    int dist_y, count;                                                                                    \
> +    uint64_t sum, square_sum, mean, var;                                                                  \
> +    /* The window is [lower, higher) on each axis, clipped to the plane; count is its area. */            \
> +    for (y = starty; y < endy; y++) {                                                                     \
> +        lower_y  = y - radius     < 0      ? 0      : y - radius;                                         \
> +        higher_y = y + radius + 1 > height ? height : y + radius + 1;                                     \
> +        dist_y = higher_y - lower_y;                                                                      \
> +        for (x = 0; x < width; x++) {                                                                     \
> +            lower_x  = x - radius     < 0     ? 0     : x - radius;                                       \
> +            higher_x = x + radius + 1 > width ? width : x + radius + 1;                                   \
> +            count = dist_y * (higher_x - lower_x);                                                        \
> +            sum = sat[higher_y * sat_linesize + higher_x]                                                 \
> +                - sat[higher_y * sat_linesize + lower_x]                                                  \
> +                - sat[lower_y  * sat_linesize + higher_x]                                                 \
> +                + sat[lower_y  * sat_linesize + lower_x];                                                 \
> +            square_sum = square_sat[higher_y * sat_linesize + higher_x]                                   \
> +                       - square_sat[higher_y * sat_linesize + lower_x]                                    \
> +                       - square_sat[lower_y  * sat_linesize + higher_x]                                   \
> +                       + square_sat[lower_y  * sat_linesize + lower_x];                                   \
> +            mean = sum / count;                             /* integer window mean */                     \
> +            var = (square_sum - sum * sum / count) / count; /* integer window variance */                 \
> +            dst[y * dst_linesize + x] = (sigma * mean + var * src[y * src_linesize + x]) / (sigma + var); \
> +        }                                                                                                 \
> +    }                                                                                                     \
> +    return 0;                                                                                             \
> +}
> +
> +FILTER_SLICE(uint8_t,  byte) /* filter_slice_byte: selected for depth <= 8 */
> +FILTER_SLICE(uint16_t, word) /* filter_slice_word: selected for depth > 8 */
> +
> +static int filter_frame(AVFilterLink *inlink, AVFrame *in)
> +{   /* Filter one frame plane by plane and pass the result to the output link. */
> +    AVFilterContext *ctx = inlink->dst;
> +    YAEPContext *s = ctx->priv;
> +    AVFilterLink *outlink = ctx->outputs[0];
> +    AVFrame *out;
> +    int plane;
> +    const int nb_threads = ff_filter_get_nb_threads(ctx);
> +    ThreadData td;
> +    /* Work in place when the input frame is writable, otherwise allocate an output frame. */
> +    if (av_frame_is_writable(in)) {
> +        out = in;
> +    } else {
> +        out = ff_get_video_buffer(outlink, outlink->w, outlink->h);
> +        if (!out) {
> +            av_frame_free(&in);
> +            return AVERROR(ENOMEM);
> +        }
> +        av_frame_copy_props(out, in); /* return value is not checked */
> +    }
> +    /* Planes that are not selected, or all planes when radius is 0, keep the input samples. */
> +    for (plane = 0; plane < s->nb_planes; plane++) {
> +        if (!s->radius || !(s->planes & (1<<plane))) {
> +            if (out != in) {
> +                av_image_copy_plane(out->data[plane], out->linesize[plane],
> +                                    in->data[plane], in->linesize[plane],
> +                                    s->planewidth[plane] * ((s->depth + 7) / 8),
> +                                    s->planeheight[plane]);
> +            }
> +            continue;
> +        }
> +        /* Build both tables for this plane: row prefix sums first, then column accumulation. */
> +        td.width        = s->planewidth[plane];
> +        td.height       = s->planeheight[plane];
> +        td.src          = in->data[plane];
> +        td.src_linesize = in->linesize[plane];
> +        ctx->internal->execute(ctx, s->pre_calculate_row, &td, NULL, FFMIN(td.height, nb_threads));
> +        ctx->internal->execute(ctx, pre_calculate_col, &td, NULL, FFMIN(td.width,  nb_threads));
> +        /* Filter the plane from the finished tables; src and dst are the same buffer when out == in. */
> +        td.dst          = out->data[plane];
> +        td.dst_linesize = out->linesize[plane];
> +        ctx->internal->execute(ctx, s->filter_slice, &td, NULL, FFMIN(td.height, nb_threads));
> +    }
> +    /* The input is freed only when a separate output frame was allocated. */
> +    if (out != in)
> +        av_frame_free(&in);
> +
> +    return ff_filter_frame(outlink, out);
> +}
> +
> +static int config_input(AVFilterLink *inlink)
> +{   /* Cache plane geometry, select the byte or word workers and allocate both tables. */
> +    YAEPContext *s = inlink->dst->priv;
> +    const AVPixFmtDescriptor *desc = av_pix_fmt_desc_get(inlink->format);
> +    /* Planes 1 and 2 use the chroma-shifted size (rounded up); planes 0 and 3 use the full size. */
> +    s->depth = desc->comp[0].depth;
> +    s->planewidth[1] = s->planewidth[2] = AV_CEIL_RSHIFT(inlink->w, desc->log2_chroma_w);
> +    s->planewidth[0] = s->planewidth[3] = inlink->w;
> +    s->planeheight[1] = s->planeheight[2] = AV_CEIL_RSHIFT(inlink->h, desc->log2_chroma_h);
> +    s->planeheight[0] = s->planeheight[3] = inlink->h;
> +    s->nb_planes = av_pix_fmt_count_planes(inlink->format);
> +    /* Limit the radius to half of the smaller frame dimension, rounded up. */
> +    s->radius = FFMIN(s->radius, AV_CEIL_RSHIFT(FFMIN(inlink->w, inlink->h), 1));
> +    /* Depths of up to 8 bits use the uint8_t workers, deeper formats the uint16_t workers. */
> +    if (s->depth <= 8) {
> +        s->pre_calculate_row = pre_calculate_row_byte;
> +        s->filter_slice      = filter_slice_byte;
> +    } else {
> +        s->pre_calculate_row = pre_calculate_row_word;
> +        s->filter_slice      = filter_slice_word;
> +    }
> +    /* NOTE(review): earlier tables are not freed here; confirm this runs once per filter instance. */
> +    // padding one row on the top, and padding one col on the left, that is why + 1 below
> +    s->sat_linesize = inlink->w + 1;
> +    s->sat = av_mallocz_array(inlink->h + 1, s->sat_linesize*sizeof(*s->sat));
> +    if (!s->sat)
> +        return AVERROR(ENOMEM);
> +    /* The table of squares has the same layout; both are sized for the full frame and zero-filled. */
> +    s->square_sat = av_mallocz_array(inlink->h + 1, s->sat_linesize*sizeof(*s->square_sat));
> +    if (!s->square_sat)
> +        return AVERROR(ENOMEM);
> +
> +    return 0;
> +}
> +
> +static const AVFilterPad yaep_inputs[] = { /* the single video input pad */
> +    {
> +        .name = "default",
> +        .type = AVMEDIA_TYPE_VIDEO,
> +        .config_props = config_input, /* caches plane geometry and allocates the tables */
> +        .filter_frame = filter_frame, /* per-frame processing entry point */
> +    },
> +    { NULL } /* list terminator */
> +};
> +
> +static const AVFilterPad yaep_outputs[] = { /* the single video output pad, no callbacks set */
> +    {
> +        .name = "default",
> +        .type = AVMEDIA_TYPE_VIDEO,
> +    },
> +    { NULL } /* list terminator */
> +};
> +
> +#define OFFSET(x) offsetof(YAEPContext, x) /* byte offset of an option field inside the context */
> +#define FLAGS AV_OPT_FLAG_FILTERING_PARAM|AV_OPT_FLAG_VIDEO_PARAM|AV_OPT_FLAG_RUNTIME_PARAM
> +/* Each option appears twice, under its long and its short name, with identical type, default and range. */
> +static const AVOption yaep_options[] = {
> +    { "radius", "set window radius",    OFFSET(radius), AV_OPT_TYPE_INT, {.i64=3},   0, INT_MAX, .flags=FLAGS },
> +    { "r"     , "set window radius",    OFFSET(radius), AV_OPT_TYPE_INT, {.i64=3},   0, INT_MAX, .flags=FLAGS },
> +    { "planes", "set planes to filter", OFFSET(planes), AV_OPT_TYPE_INT, {.i64=1},   0,     0xF, .flags=FLAGS },
> +    { "p",      "set planes to filter", OFFSET(planes), AV_OPT_TYPE_INT, {.i64=1},   0,     0xF, .flags=FLAGS },
> +    { "sigma",  "set blur strength",    OFFSET(sigma),  AV_OPT_TYPE_INT, {.i64=128}, 1, INT_MAX, .flags=FLAGS },
> +    { "s",      "set blur strength",    OFFSET(sigma),  AV_OPT_TYPE_INT, {.i64=128}, 1, INT_MAX, .flags=FLAGS },
> +    { NULL } /* list terminator */
> +};
> +
> +AVFILTER_DEFINE_CLASS(yaep); /* NOTE(review): presumably defines yaep_class from yaep_options - confirm */
> +
> +AVFilter ff_vf_yaepblur = { /* filter definition declared extern in allfilters.c */
> +    .name            = "yaepblur",
> +    .description     = NULL_IF_CONFIG_SMALL("Yet another edge preserving blur filter."),
> +    .priv_size       = sizeof(YAEPContext),
> +    .priv_class      = &yaep_class,
> +    .uninit          = uninit, /* frees the summed area tables */
> +    .query_formats   = query_formats,
> +    .inputs          = yaep_inputs,
> +    .outputs         = yaep_outputs,
> +    .flags           = AVFILTER_FLAG_SUPPORT_TIMELINE_GENERIC | AVFILTER_FLAG_SLICE_THREADS,
> +    .process_command = ff_filter_process_command, /* options carry AV_OPT_FLAG_RUNTIME_PARAM */
> +};
> --
> 1.8.3.1
>
> _______________________________________________
> ffmpeg-devel mailing list
> ffmpeg-devel at ffmpeg.org
> https://ffmpeg.org/mailman/listinfo/ffmpeg-devel
>
> To unsubscribe, visit link above, or email
> ffmpeg-devel-request at ffmpeg.org with subject "unsubscribe".


More information about the ffmpeg-devel mailing list