[FFmpeg-cvslog] avfilter: Add colorconstancy filter

Mina git at videolan.org
Mon Jul 23 23:35:08 EEST 2018


ffmpeg | branch: master | Mina <minasamy_ at hotmail.com> | Mon Jul 16 10:20:02 2018 +0200| [0bb5cd8c4d566d38d6f056fb13eba3a0a5c4d211] | committer: Thilo Borgmann

avfilter: Add colorconstancy filter

Signed-off-by: Mina <minasamy_ at hotmail.com>

> http://git.videolan.org/gitweb.cgi/ffmpeg.git/?a=commit;h=0bb5cd8c4d566d38d6f056fb13eba3a0a5c4d211
---

 Changelog                       |   1 +
 MAINTAINERS                     |   1 +
 doc/filters.texi                |  41 +++
 libavfilter/Makefile            |   1 +
 libavfilter/allfilters.c        |   1 +
 libavfilter/vf_colorconstancy.c | 758 ++++++++++++++++++++++++++++++++++++++++
 6 files changed, 803 insertions(+)

diff --git a/Changelog b/Changelog
index 72da5bf519..807a05dec9 100644
--- a/Changelog
+++ b/Changelog
@@ -15,6 +15,7 @@ version <next>:
 - vc1 decoder is now bit-exact
 - ATRAC9 decoder
 - lensfun wrapper filter
+- colorconstancy filter
 
 
 version 4.0:
diff --git a/MAINTAINERS b/MAINTAINERS
index 78f450dda6..234b655cef 100644
--- a/MAINTAINERS
+++ b/MAINTAINERS
@@ -332,6 +332,7 @@ Filters:
   vf_bwdif                              Thomas Mundt (CC <thomas.mundt at hr.de>)
   vf_chromakey.c                        Timo Rothenpieler
   vf_colorchannelmixer.c                Paul B Mahol
+  vf_colorconstancy.c                   Mina Sami    (CC <minas.gorgy at gmail.com>)
   vf_colorbalance.c                     Paul B Mahol
   vf_colorkey.c                         Timo Rothenpieler
   vf_colorlevels.c                      Paul B Mahol
diff --git a/doc/filters.texi b/doc/filters.texi
index e3005c3278..0b0903e5a7 100644
--- a/doc/filters.texi
+++ b/doc/filters.texi
@@ -9940,6 +9940,47 @@ gradfun=radius=8
 
 @end itemize
 
+ at section greyedge
+A color constancy variation filter which estimates scene illumination via grey edge algorithm
+and corrects the scene colors accordingly.
+
+See: @url{https://staff.science.uva.nl/th.gevers/pub/GeversTIP07.pdf}
+
+The filter accepts the following options:
+
+ at table @option
+ at item difford
+The order of differentiation to be applied on the scene. Must be chosen in the range
+[0,2] and default value is 1.
+
+ at item minknorm
+The Minkowski parameter to be used for calculating the Minkowski distance. Must
+be chosen in the range [0,65535] and default value is 1. Set to 0 for getting
+max value instead of calculating Minkowski distance.
+
+ at item sigma
+The standard deviation of Gaussian blur to be applied on the scene. Must be
+chosen in the range [0,1024.0] and default value = 1. Sigma can't be set to 0
+if @var{difford} is greater than 0.
+ at end table
+
+ at subsection Examples
+ at itemize
+
+ at item
+Grey Edge:
+ at example
+greyedge=difford=1:minknorm=5:sigma=2
+ at end example
+
+ at item
+Max Edge:
+ at example
+greyedge=difford=1:minknorm=0:sigma=2
+ at end example
+
+ at end itemize
+
 @anchor{haldclut}
 @section haldclut
 
diff --git a/libavfilter/Makefile b/libavfilter/Makefile
index 5d4549e24c..86b04e3efb 100644
--- a/libavfilter/Makefile
+++ b/libavfilter/Makefile
@@ -228,6 +228,7 @@ OBJS-$(CONFIG_FSPP_FILTER)                   += vf_fspp.o
 OBJS-$(CONFIG_GBLUR_FILTER)                  += vf_gblur.o
 OBJS-$(CONFIG_GEQ_FILTER)                    += vf_geq.o
 OBJS-$(CONFIG_GRADFUN_FILTER)                += vf_gradfun.o
+OBJS-$(CONFIG_GREYEDGE_FILTER)               += vf_colorconstancy.o
 OBJS-$(CONFIG_HALDCLUT_FILTER)               += vf_lut3d.o framesync.o
 OBJS-$(CONFIG_HFLIP_FILTER)                  += vf_hflip.o
 OBJS-$(CONFIG_HISTEQ_FILTER)                 += vf_histeq.o
diff --git a/libavfilter/allfilters.c b/libavfilter/allfilters.c
index 521bc53164..2d19929bdc 100644
--- a/libavfilter/allfilters.c
+++ b/libavfilter/allfilters.c
@@ -217,6 +217,7 @@ extern AVFilter ff_vf_fspp;
 extern AVFilter ff_vf_gblur;
 extern AVFilter ff_vf_geq;
 extern AVFilter ff_vf_gradfun;
+extern AVFilter ff_vf_greyedge;
 extern AVFilter ff_vf_haldclut;
 extern AVFilter ff_vf_hflip;
 extern AVFilter ff_vf_histeq;
diff --git a/libavfilter/vf_colorconstancy.c b/libavfilter/vf_colorconstancy.c
new file mode 100644
index 0000000000..7194688dfa
--- /dev/null
+++ b/libavfilter/vf_colorconstancy.c
@@ -0,0 +1,758 @@
+/*
+ * Copyright (c) 2018 Mina Sami
+ *
+ * This file is part of FFmpeg.
+ *
+ * FFmpeg is free software; you can redistribute it and/or
+ * modify it under the terms of the GNU Lesser General Public
+ * License as published by the Free Software Foundation; either
+ * version 2.1 of the License, or (at your option) any later version.
+ *
+ * FFmpeg is distributed in the hope that it will be useful,
+ * but WITHOUT ANY WARRANTY; without even the implied warranty of
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
+ * Lesser General Public License for more details.
+ *
+ * You should have received a copy of the GNU Lesser General Public
+ * License along with FFmpeg; if not, write to the Free Software
+ * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
+ */
+
+/**
+ * @file
+ * Color Constancy filter
+ *
+ * @see http://colorconstancy.com/
+ *
+ * @cite
+ * J. van de Weijer, Th. Gevers, A. Gijsenij "Edge-Based Color Constancy".
+ */
+
+#include "libavutil/bprint.h"
+#include "libavutil/imgutils.h"
+#include "libavutil/opt.h"
+#include "libavutil/pixdesc.h"
+
+#include "avfilter.h"
+#include "formats.h"
+#include "internal.h"
+#include "video.h"
+
+#include <math.h>
+
+#define GREY_EDGE "greyedge"
+
+#define NUM_PLANES    3
+#define MAX_DIFF_ORD  2
+#define MAX_META_DATA 4
+#define MAX_DATA      4
+
+#define INDEX_TEMP 0
+#define INDEX_DX   1
+#define INDEX_DY   2
+#define INDEX_DXY  3
+#define INDEX_NORM INDEX_DX
+#define INDEX_SRC  0
+#define INDEX_DST  1
+#define INDEX_ORD  2
+#define INDEX_DIR  3
+#define DIR_X 0
+#define DIR_Y 1
+
+/**
+ * Used for passing data between threads.
+ */
+typedef struct ThreadData {
+    AVFrame *in, *out;
+    int meta_data[MAX_META_DATA];
+    double  *data[MAX_DATA][NUM_PLANES];
+} ThreadData;
+
+/**
+ * Common struct for all algorithms contexts.
+ */
+typedef struct ColorConstancyContext {
+    const AVClass *class;
+
+    int difford;
+    int minknorm; /**< @minknorm = 0 : getMax instead */
+    double sigma;
+
+    int nb_threads;
+    int planeheight[4];
+    int planewidth[4];
+
+    int filtersize;
+    double *gauss[MAX_DIFF_ORD+1];
+
+    double white[NUM_PLANES];
+} ColorConstancyContext;
+
+#define OFFSET(x) offsetof(ColorConstancyContext, x)
+#define FLAGS AV_OPT_FLAG_FILTERING_PARAM|AV_OPT_FLAG_VIDEO_PARAM
+
+#define GINDX(s, i) ( (i) - ((s) >> 2) )
+
+/**
+ * Sets gauss filters used for calculating gauss derivatives. Filter size
+ * depends on sigma which is a user option hence we calculate these
+ * filters each time. Also each higher order depends on lower ones. Sigma
+ * can be zero only at difford = 0, then we only convert data to double
+ * instead.
+ *
+ * @param ctx the filter context.
+ *
+ * @return 0 in case of success, a negative value corresponding to an
+ * AVERROR code in case of failure.
+ */
+static int set_gauss(AVFilterContext *ctx)
+{
+    ColorConstancyContext *s = ctx->priv;
+    int filtersize = s->filtersize;
+    int difford    = s->difford;
+    double sigma   = s->sigma;
+    double sum1, sum2;
+    int i;
+
+    for (i = 0; i <= difford; ++i) {
+        s->gauss[i] = av_mallocz_array(filtersize, sizeof(*s->gauss[i]));
+        if (!s->gauss[i]) {
+            for (; i >= 0; --i) {
+                av_freep(&s->gauss[i]);
+            }
+            av_log(ctx, AV_LOG_ERROR, "Out of memory while allocating gauss buffers.\n");
+            return AVERROR(ENOMEM);
+        }
+    }
+
+    // Order 0
+    av_log(ctx, AV_LOG_TRACE, "Setting 0-d gauss with filtersize = %d.\n", filtersize);
+    sum1 = 0.0;
+    if (!sigma) {
+        s->gauss[0][0] = 1; // Copying data to double instead of convolution
+    } else {
+        for (i = 0; i < filtersize; ++i) {
+            s->gauss[0][i] = exp(- pow(GINDX(filtersize, i), 2.) / (2 * sigma * sigma)) / ( sqrt(2 * M_PI) * sigma );
+            sum1 += s->gauss[0][i];
+        }
+        for (i = 0; i < filtersize; ++i) {
+            s->gauss[0][i] /= sum1;
+        }
+    }
+    // Order 1
+    if (difford > 0) {
+        av_log(ctx, AV_LOG_TRACE, "Setting 1-d gauss with filtersize = %d.\n", filtersize);
+        sum1 = 0.0;
+        for (i = 0; i < filtersize; ++i) {
+            s->gauss[1][i] = - (GINDX(filtersize, i) / pow(sigma, 2)) * s->gauss[0][i];
+            sum1 += s->gauss[1][i] *GINDX(filtersize, i);
+        }
+
+        for (i = 0; i < filtersize; ++i) {
+            s->gauss[1][i] /= sum1;
+        }
+
+        // Order 2
+        if (difford > 1) {
+            av_log(ctx, AV_LOG_TRACE, "Setting 2-d gauss with filtersize = %d.\n", filtersize);
+            sum1 = 0.0;
+            for (i = 0; i < filtersize; ++i) {
+                s->gauss[2][i] = ( pow(GINDX(filtersize, i), 2) / pow(sigma, 4) - 1/pow(sigma, 2) )
+                                 * s->gauss[0][i];
+                sum1 += s->gauss[2][i];
+            }
+
+            sum2 = 0.0;
+            for (i = 0; i < filtersize; ++i) {
+                s->gauss[2][i] -= sum1 / (filtersize);
+                sum2 += (0.5 * GINDX(filtersize, i) * GINDX(filtersize, i) * s->gauss[2][i]);
+            }
+            for (i = 0; i < filtersize ; ++i) {
+                s->gauss[2][i] /= sum2;
+            }
+        }
+    }
+    return 0;
+}
+
+/**
+ * Frees up buffers used by grey edge for storing derivatives final
+ * and intermidiate results. Number of buffers and number of planes
+ * for last buffer are given so it can be safely called at allocation
+ * failure instances.
+ *
+ * @param td holds the buffers.
+ * @param nb_buff number of buffers to be freed.
+ * @param nb_planes number of planes for last buffer to be freed.
+ */
+static void cleanup_derivative_buffers(ThreadData *td, int nb_buff, int nb_planes)
+{
+    int b, p;
+
+    for (b = 0; b < nb_buff; ++b) {
+        for (p = 0; p < NUM_PLANES; ++p) {
+            av_freep(&td->data[b][p]);
+        }
+    }
+    // Final buffer may not be fully allocated at fail cases
+    for (p = 0; p < nb_planes; ++p) {
+        av_freep(&td->data[b][p]);
+    }
+}
+
+/**
+ * Allocates buffers used by grey edge for storing derivatives final
+ * and intermidiate results.
+ *
+ * @param ctx the filter context.
+ * @param td holds the buffers.
+ *
+ * @return 0 in case of success, a negative value corresponding to an
+ * AVERROR code in case of failure.
+ */
+static int setup_derivative_buffers(AVFilterContext* ctx, ThreadData *td)
+{
+    ColorConstancyContext *s = ctx->priv;
+    int nb_buff = s->difford + 1;
+    int b, p;
+
+    av_log(ctx, AV_LOG_TRACE, "Allocating %d buffer(s) for grey edge.\n", nb_buff);
+    for (b = 0; b <= nb_buff; ++b) { // We need difford + 1 buffers
+        for (p = 0; p < NUM_PLANES; ++p) {
+            td->data[b][p] = av_mallocz_array(s->planeheight[p] * s->planewidth[p], sizeof(*td->data[b][p]));
+            if (!td->data[b][p]) {
+                cleanup_derivative_buffers(td, b + 1, p);
+                av_log(ctx, AV_LOG_ERROR, "Out of memory while allocating derivatives buffers.\n");
+                return AVERROR(ENOMEM);
+            }
+        }
+    }
+    return 0;
+}
+
+#define CLAMP(x, mx) av_clip((x), 0, (mx-1))
+#define INDX2D(r, c, w) ( (r) * (w) + (c) )
+#define GAUSS(s, sr, sc, sls, sh, sw, g) ( (s)[ INDX2D(CLAMP((sr), (sh)), CLAMP((sc), (sw)), (sls)) ] * (g) )
+
+/**
+ * Slice calculation of gaussian derivatives. Applies 1-D gaussian derivative filter
+ * either horizontally or vertically according to meta data given in thread data.
+ * When convoluting horizontally source is always the in frame withing thread data
+ * while when convoluting vertically source is a buffer.
+ *
+ * @param ctx the filter context.
+ * @param arg data to be passed between threads.
+ * @param jobnr current job nubmer.
+ * @param nb_jobs total number of jobs.
+ *
+ * @return 0.
+ */
+static int slice_get_derivative(AVFilterContext* ctx, void* arg, int jobnr, int nb_jobs)
+{
+    ColorConstancyContext *s = ctx->priv;
+    ThreadData *td = arg;
+    AVFrame *in = td->in;
+    const int ord = td->meta_data[INDEX_ORD];
+    const int dir = td->meta_data[INDEX_DIR];
+    const int src_index  = td->meta_data[INDEX_SRC];
+    const int dst_index  = td->meta_data[INDEX_DST];
+    const int filtersize = s->filtersize;
+    const double *gauss  = s->gauss[ord];
+    int plane;
+
+    for (plane = 0; plane < NUM_PLANES; ++plane) {
+        const int height      = s->planeheight[plane];
+        const int width       = s->planewidth[plane];
+        const int in_linesize = in->linesize[plane];
+        double *dst = td->data[dst_index][plane];
+        int slice_start, slice_end;
+        int r, c, g;
+
+        if (dir == DIR_X) {
+            /** Applying gauss horizontally along each row */
+            const uint8_t *src = in->data[plane];
+            slice_start = (height * jobnr      ) / nb_jobs;
+            slice_end   = (height * (jobnr + 1)) / nb_jobs;
+
+            for (r = slice_start; r < slice_end; ++r) {
+                for (c = 0; c < width; ++c) {
+                    dst[INDX2D(r, c, width)] = 0;
+                    for (g = 0; g < filtersize; ++g) {
+                        dst[INDX2D(r, c, width)] += GAUSS(src, r,                        c + GINDX(filtersize, g),
+                                                          in_linesize, height, width, gauss[GINDX(filtersize, g)]);
+                    }
+                }
+            }
+        } else {
+            /** Applying gauss vertically along each column */
+            const double *src = td->data[src_index][plane];
+            slice_start = (width * jobnr      ) / nb_jobs;
+            slice_end   = (width * (jobnr + 1)) / nb_jobs;
+
+            for (c = slice_start; c < slice_end; ++c) {
+                for (r = 0; r < height; ++r) {
+                    dst[INDX2D(r, c, width)] = 0;
+                    for (g = 0; g < filtersize; ++g) {
+                        dst[INDX2D(r, c, width)] += GAUSS(src, r + GINDX(filtersize, g), c,
+                                                          width, height, width, gauss[GINDX(filtersize, g)]);
+                    }
+                }
+            }
+        }
+
+    }
+    return 0;
+}
+
+/**
+ * Slice Frobius normalization of gaussian derivatives. Only called for difford values of
+ * 1 or 2.
+ *
+ * @param ctx the filter context.
+ * @param arg data to be passed between threads.
+ * @param jobnr current job nubmer.
+ * @param nb_jobs total number of jobs.
+ *
+ * @return 0.
+ */
+static int slice_normalize(AVFilterContext* ctx, void* arg, int jobnr, int nb_jobs)
+{
+    ColorConstancyContext *s = ctx->priv;
+    ThreadData *td = arg;
+    const int difford = s->difford;
+    int plane;
+
+    for (plane = 0; plane < NUM_PLANES; ++plane) {
+        const int height = s->planeheight[plane];
+        const int width  = s->planewidth[plane];
+        const int64_t numpixels = width * (int64_t)height;
+        const int slice_start   = (numpixels * jobnr    ) / nb_jobs;
+        const int slice_end     = (numpixels * (jobnr+1)) / nb_jobs;
+        const double *dx = td->data[INDEX_DX][plane];
+        const double *dy = td->data[INDEX_DY][plane];
+        double *norm = td->data[INDEX_NORM][plane];
+        int i;
+
+        if (difford == 1) {
+            for (i = slice_start; i < slice_end; ++i) {
+                norm[i] = sqrt( pow(dx[i], 2) + pow(dy[i], 2));
+            }
+        } else {
+            const double *dxy = td->data[INDEX_DXY][plane];
+            for (i = slice_start; i < slice_end; ++i) {
+                norm[i] = sqrt( pow(dx[i], 2) + 4 * pow(dxy[i], 2) + pow(dy[i], 2) );
+            }
+        }
+    }
+
+    return 0;
+}
+
+/**
+ * Utility function for setting up differentiation data/metadata.
+ *
+ * @param ctx the filter context.
+ * @param td to be used for passing data between threads.
+ * @param ord ord of differentiation.
+ * @param dir direction of differentiation.
+ * @param src index of source used for differentiation.
+ * @param dst index destination used for saving differentiation result.
+ * @param dim maximum dimension in current direction.
+ * @param nb_threads number of threads to use.
+ */
+static void av_always_inline
+get_deriv(AVFilterContext *ctx, ThreadData *td, int ord, int dir,
+          int src, int dst, int dim, int nb_threads) {
+    td->meta_data[INDEX_ORD] = ord;
+    td->meta_data[INDEX_DIR] = dir;
+    td->meta_data[INDEX_SRC] = src;
+    td->meta_data[INDEX_DST] = dst;
+    ctx->internal->execute(ctx, slice_get_derivative, td, NULL, FFMIN(dim, nb_threads));
+}
+
+/**
+ * Main control function for calculating gaussian derivatives.
+ *
+ * @param ctx the filter context.
+ * @param td holds the buffers used for storing results.
+ *
+ * @return 0 in case of success, a negative value corresponding to an
+ * AVERROR code in case of failure.
+ */
+static int get_derivative(AVFilterContext *ctx, ThreadData *td)
+{
+    ColorConstancyContext *s = ctx->priv;
+    int nb_threads = s->nb_threads;
+    int height = s->planeheight[1];
+    int width  = s->planewidth[1];
+
+    switch(s->difford) {
+    case 0:
+        if (!s->sigma) { // Only copy once
+            get_deriv(ctx, td, 0, DIR_X, 0         , INDEX_NORM, height, nb_threads);
+        } else {
+            get_deriv(ctx, td, 0, DIR_X, 0,          INDEX_TEMP, height, nb_threads);
+            get_deriv(ctx, td, 0, DIR_Y, INDEX_TEMP, INDEX_NORM, width , nb_threads);
+            // save to INDEX_NORM because this will not be normalied and
+            // end gry edge filter expects result to be found in INDEX_NORM
+        }
+        return 0;
+
+    case 1:
+        get_deriv(ctx, td, 1, DIR_X, 0,          INDEX_TEMP, height, nb_threads);
+        get_deriv(ctx, td, 0, DIR_Y, INDEX_TEMP, INDEX_DX,   width , nb_threads);
+
+        get_deriv(ctx, td, 0, DIR_X, 0,          INDEX_TEMP, height, nb_threads);
+        get_deriv(ctx, td, 1, DIR_Y, INDEX_TEMP, INDEX_DY,   width , nb_threads);
+        return 0;
+
+    case 2:
+        get_deriv(ctx, td, 2, DIR_X, 0,          INDEX_TEMP, height, nb_threads);
+        get_deriv(ctx, td, 0, DIR_Y, INDEX_TEMP, INDEX_DX,   width , nb_threads);
+
+        get_deriv(ctx, td, 0, DIR_X, 0,          INDEX_TEMP, height, nb_threads);
+        get_deriv(ctx, td, 2, DIR_Y, INDEX_TEMP, INDEX_DY,   width , nb_threads);
+
+        get_deriv(ctx, td, 1, DIR_X, 0,          INDEX_TEMP, height, nb_threads);
+        get_deriv(ctx, td, 1, DIR_Y, INDEX_TEMP, INDEX_DXY,  width , nb_threads);
+        return 0;
+
+    default:
+        av_log(ctx, AV_LOG_ERROR, "Unsupported difford value: %d.\n", s->difford);
+        return AVERROR(EINVAL);
+    }
+
+}
+
+/**
+ * Slice function for grey edge algorithm that does partial summing/maximizing
+ * of gaussian derivatives.
+ *
+ * @param ctx the filter context.
+ * @param arg data to be passed between threads.
+ * @param jobnr current job nubmer.
+ * @param nb_jobs total number of jobs.
+ *
+ * @return 0.
+ */
+static int filter_slice_grey_edge(AVFilterContext* ctx, void* arg, int jobnr, int nb_jobs)
+{
+    ColorConstancyContext *s = ctx->priv;
+    ThreadData *td = arg;
+    AVFrame *in    = td->in;
+    int minknorm   = s->minknorm;
+    const uint8_t thresh = 255;
+    int plane;
+
+    for (plane = 0; plane < NUM_PLANES; ++plane) {
+        const int height        = s->planeheight[plane];
+        const int width         = s->planewidth[plane];
+        const int in_linesize   = in->linesize[plane];
+        const int slice_start   = (height * jobnr) / nb_jobs;
+        const int slice_end     = (height * (jobnr+1)) / nb_jobs;
+        const uint8_t *img_data = in->data[plane];
+        const double *src       = td->data[INDEX_NORM][plane];
+        double *dst             = td->data[INDEX_DST][plane];
+        int r, c;
+
+        dst[jobnr] = 0;
+        if (!minknorm) {
+            for (r = slice_start; r < slice_end; ++r) {
+                for (c = 0; c < width; ++c) {
+                    dst[jobnr] = FFMAX( dst[jobnr], fabs(src[INDX2D(r, c, width)])
+                                        * (img_data[INDX2D(r, c, in_linesize)] < thresh) );
+                }
+            }
+        } else {
+            for (r = slice_start; r < slice_end; ++r) {
+                for (c = 0; c < width; ++c) {
+                    dst[jobnr] += ( pow( fabs(src[INDX2D(r, c, width)] / 255.), minknorm)
+                                    * (img_data[INDX2D(r, c, in_linesize)] < thresh) );
+                }
+            }
+        }
+    }
+    return 0;
+}
+
+/**
+ * Main control function for grey edge algorithm.
+ *
+ * @param ctx the filter context.
+ * @param in frame to perfrom grey edge on.
+ *
+ * @return 0 in case of success, a negative value corresponding to an
+ * AVERROR code in case of failure.
+ */
+static int filter_grey_edge(AVFilterContext *ctx, AVFrame *in)
+{
+    ColorConstancyContext *s = ctx->priv;
+    ThreadData td;
+    int minknorm  = s->minknorm;
+    int difford   = s->difford;
+    double *white = s->white;
+    int nb_jobs   = FFMIN3(s->planeheight[1], s->planewidth[1], s->nb_threads);
+    int plane, job, ret;
+
+    td.in = in;
+    ret = setup_derivative_buffers(ctx, &td);
+    if (ret) {
+        return ret;
+    }
+    get_derivative(ctx, &td);
+    if (difford > 0) {
+        ctx->internal->execute(ctx, slice_normalize, &td, NULL, nb_jobs);
+    }
+
+    ctx->internal->execute(ctx, filter_slice_grey_edge, &td, NULL, nb_jobs);
+    if (!minknorm) {
+        for (plane = 0; plane < NUM_PLANES; ++plane) {
+            white[plane] = 0; // All values are absolute
+            for (job = 0; job < nb_jobs; ++job) {
+                white[plane] = FFMAX(white[plane] , td.data[INDEX_DST][plane][job]);
+            }
+        }
+    } else {
+        for (plane = 0; plane < NUM_PLANES; ++plane) {
+            white[plane] = 0;
+            for (job = 0; job < nb_jobs; ++job) {
+                white[plane] += td.data[INDEX_DST][plane][job];
+            }
+            white[plane] = pow(white[plane], 1./minknorm);
+        }
+    }
+
+    cleanup_derivative_buffers(&td, difford + 1, NUM_PLANES);
+    return 0;
+}
+
+/**
+ * Normalizes estimated illumination since only illumination vector
+ * direction is required for color constancy.
+ *
+ * @param light the estimated illumination to be normalized in place
+ */
+static void normalize_light(double *light)
+{
+    double abs_val = pow( pow(light[0], 2.0) + pow(light[1], 2.0) + pow(light[2], 2.0), 0.5);
+    int plane;
+
+    // TODO: check if setting to 1.0 when estimated = 0.0 is the best thing to do
+
+    if (!abs_val) {
+        for (plane = 0; plane < NUM_PLANES; ++plane) {
+            light[plane] = 1.0;
+        }
+    } else {
+        for (plane = 0; plane < NUM_PLANES; ++plane) {
+            light[plane] = (light[plane] / abs_val);
+            if (!light[plane]) { // to avoid division by zero when correcting
+                light[plane] = 1.0;
+            }
+        }
+    }
+}
+
+/**
+ * Redirects to corresponding algorithm estimation function and performs normalization
+ * after estimation.
+ *
+ * @param ctx the filter context.
+ * @param in frame to perfrom estimation on.
+ *
+ * @return 0 in case of success, a negative value corresponding to an
+ * AVERROR code in case of failure.
+ */
+static int illumination_estimation(AVFilterContext *ctx, AVFrame *in)
+{
+    ColorConstancyContext *s = ctx->priv;
+    int ret;
+
+    ret = filter_grey_edge(ctx, in);
+
+    av_log(ctx, AV_LOG_DEBUG, "Estimated illumination= %f %f %f\n",
+           s->white[0], s->white[1], s->white[2]);
+    normalize_light(s->white);
+    av_log(ctx, AV_LOG_DEBUG, "Estimated illumination after normalization= %f %f %f\n",
+           s->white[0], s->white[1], s->white[2]);
+
+    return ret;
+}
+
+/**
+ * Performs simple correction via diagonal transformation model.
+ *
+ * @param ctx the filter context.
+ * @param arg data to be passed between threads.
+ * @param jobnr current job nubmer.
+ * @param nb_jobs total number of jobs.
+ *
+ * @return 0.
+ */
+static int diagonal_transformation(AVFilterContext *ctx, void *arg, int jobnr, int nb_jobs)
+{
+    ColorConstancyContext *s = ctx->priv;
+    ThreadData *td = arg;
+    AVFrame *in = td->in;
+    AVFrame *out = td->out;
+    double sqrt3 = pow(3.0, 0.5);
+    int plane;
+
+    for (plane = 0; plane < NUM_PLANES; ++plane) {
+        const int height = s->planeheight[plane];
+        const int width  = s->planewidth[plane];
+        const int64_t numpixels = width * (int64_t)height;
+        const int slice_start   = (numpixels * jobnr) / nb_jobs;
+        const int slice_end     = (numpixels * (jobnr+1)) / nb_jobs;
+        const uint8_t *src = in->data[plane];
+        uint8_t *dst       = out->data[plane];
+        double temp;
+        unsigned i;
+
+        for (i = slice_start; i < slice_end; ++i) {
+            temp = src[i] / (s->white[plane] * sqrt3);
+            dst[i] = av_clip_uint8((int)(temp + 0.5));
+        }
+    }
+    return 0;
+}
+
+/**
+ * Main control function for correcting scene illumination based on
+ * estimated illumination.
+ *
+ * @param ctx the filter context.
+ * @param in holds frame to correct
+ * @param out holds corrected frame
+ */
+static void chromatic_adaptation(AVFilterContext *ctx, AVFrame *in, AVFrame *out)
+{
+    ColorConstancyContext *s = ctx->priv;
+    ThreadData td;
+    int nb_jobs = FFMIN3(s->planeheight[1], s->planewidth[1], s->nb_threads);
+
+    td.in  = in;
+    td.out = out;
+    ctx->internal->execute(ctx, diagonal_transformation, &td, NULL, nb_jobs);
+}
+
+static int query_formats(AVFilterContext *ctx)
+{
+    static const enum AVPixelFormat pix_fmts[] = {
+        // TODO: support more formats
+        // FIXME: error when saving to .jpg
+        AV_PIX_FMT_GBRP,
+        AV_PIX_FMT_NONE
+    };
+
+    return ff_set_common_formats(ctx, ff_make_format_list(pix_fmts));
+}
+
+static int config_props(AVFilterLink *inlink)
+{
+    AVFilterContext *ctx = inlink->dst;
+    ColorConstancyContext *s = ctx->priv;
+    const AVPixFmtDescriptor *desc = av_pix_fmt_desc_get(inlink->format);
+    const double break_off_sigma = 3.0;
+    double sigma = s->sigma;
+    int ret;
+
+    if (!sigma && s->difford) {
+        av_log(ctx, AV_LOG_ERROR, "Sigma can't be set to 0 when difford > 0.\n");
+        return AVERROR(EINVAL);
+    }
+
+    s->filtersize = 2 * floor(break_off_sigma * s->sigma + 0.5) + 1;
+    if (ret=set_gauss(ctx)) {
+        return ret;
+    }
+
+    s->nb_threads = ff_filter_get_nb_threads(ctx);
+    s->planewidth[1]  = s->planewidth[2]  = AV_CEIL_RSHIFT(inlink->w, desc->log2_chroma_w);
+    s->planewidth[0]  = s->planewidth[3]  = inlink->w;
+    s->planeheight[1] = s->planeheight[2] = AV_CEIL_RSHIFT(inlink->h, desc->log2_chroma_h);
+    s->planeheight[0] = s->planeheight[3] = inlink->h;
+
+    return 0;
+}
+
+static int filter_frame(AVFilterLink *inlink, AVFrame *in)
+{
+    AVFilterContext *ctx = inlink->dst;
+    AVFilterLink *outlink = ctx->outputs[0];
+    AVFrame *out;
+    int ret;
+
+    ret = illumination_estimation(ctx, in);
+    if (ret) {
+        return ret;
+    }
+
+    if (av_frame_is_writable(in)) {
+        out = in;
+    } else {
+        out = ff_get_video_buffer(outlink, outlink->w, outlink->h);
+        if (!out) {
+            av_log(ctx, AV_LOG_ERROR, "Out of memory while allocating output video buffer.\n");
+            return AVERROR(ENOMEM);
+        }
+        av_frame_copy_props(out, in);
+    }
+    chromatic_adaptation(ctx, in, out);
+
+    return ff_filter_frame(outlink, out);
+}
+
+static av_cold void uninit(AVFilterContext *ctx)
+{
+    ColorConstancyContext *s = ctx->priv;
+    int difford = s->difford;
+    int i;
+
+    for (i = 0; i <= difford; ++i) {
+        av_freep(&s->gauss[i]);
+    }
+}
+
+static const AVFilterPad colorconstancy_inputs[] = {
+    {
+        .name         = "default",
+        .type         = AVMEDIA_TYPE_VIDEO,
+        .config_props = config_props,
+        .filter_frame = filter_frame,
+    },
+    { NULL }
+};
+
+static const AVFilterPad colorconstancy_outputs[] = {
+    {
+        .name = "default",
+        .type = AVMEDIA_TYPE_VIDEO,
+    },
+    { NULL }
+};
+
+#if CONFIG_GREYEDGE_FILTER
+
+static const AVOption greyedge_options[] = {
+    { "difford",  "set differentiation order", OFFSET(difford),  AV_OPT_TYPE_INT,    {.i64=1},   0,   2,      FLAGS },
+    { "minknorm", "set Minkowski norm",        OFFSET(minknorm), AV_OPT_TYPE_INT,    {.i64=1},   0,   65535,  FLAGS },
+    { "sigma",    "set sigma",                 OFFSET(sigma),    AV_OPT_TYPE_DOUBLE, {.dbl=1},   0.0, 1024.0, FLAGS },
+    { NULL }
+};
+
+AVFILTER_DEFINE_CLASS(greyedge);
+
+AVFilter ff_vf_greyedge = {
+    .name          = GREY_EDGE,
+    .description   = NULL_IF_CONFIG_SMALL("Estimates scene illumination by grey edge assumption."),
+    .priv_size     = sizeof(ColorConstancyContext),
+    .priv_class    = &greyedge_class,
+    .query_formats = query_formats,
+    .uninit        = uninit,
+    .inputs        = colorconstancy_inputs,
+    .outputs       = colorconstancy_outputs,
+    .flags         = AVFILTER_FLAG_SUPPORT_TIMELINE_GENERIC | AVFILTER_FLAG_SLICE_THREADS,
+};
+
+#endif /* CONFIG_GREY_EDGE_FILTER */



More information about the ffmpeg-cvslog mailing list