[FFmpeg-cvslog] avfilter/af_afftdn: use better approach for gain smoothing

Sun Apr 24 00:03:37 EEST 2022

ffmpeg | branch: master | Paul B Mahol <onemda at gmail.com> | Sat Apr 23 22:18:26 2022 +0200| [fe85afbf8cb2b9cf8cb28cb13bff654949b43823] | committer: Paul B Mahol

avfilter/af_afftdn: use better approach for gain smoothing

> http://git.videolan.org/gitweb.cgi/ffmpeg.git/?a=commit;h=fe85afbf8cb2b9cf8cb28cb13bff654949b43823
---

 doc/filters.texi        |  7 ++++---
 libavfilter/af_afftdn.c | 35 ++++++++++++++++++++++++++---------
 2 files changed, 30 insertions(+), 12 deletions(-)

diff --git a/doc/filters.texi b/doc/filters.texi
index 495d59c924..c8699b9099 100644
--- a/doc/filters.texi
+++ b/doc/filters.texi
@@ -1392,10 +1392,11 @@ Default value is @code{none}.
 @end table
 
 @item gain_smooth, gs
-Set gain smooth factor, used to lowpass gains applied to each frequency bin.
+Set gain smooth spatial radius, used to smooth gains applied to each frequency bin.
 Useful to reduce random music noise artefacts.
-Higher values reduce smoothing of gains.
-Default value is @code{1.0}.
+Higher values increases smoothing of gains.
+Allowed range is from @code{0} to @code{50}.
+Default value is @code{0}.
 @end table
 
 @subsection Commands
diff --git a/libavfilter/af_afftdn.c b/libavfilter/af_afftdn.c
index 2fb3cb19ac..1b6487a102 100644
--- a/libavfilter/af_afftdn.c
+++ b/libavfilter/af_afftdn.c
@@ -71,6 +71,7 @@ typedef struct DeNoiseChannel {
     double     *band_amt;
     double     *band_excit;
     double     *gain;
+    double     *smoothed_gain;
     double     *prior;
     double     *prior_band_excit;
     double     *clean_data;
@@ -114,7 +115,7 @@ typedef struct AudioFFTDeNoiseContext {
     int     output_mode;
     int     noise_floor_link;
     float   ratio;
-    float   gain_smooth;
+    int     gain_smooth;
     float   band_multiplier;
     float   floor_offset;
 
@@ -208,8 +209,8 @@ static const AVOption afftdn_options[] = {
     {  "begin",   "start",                0,                       AV_OPT_TYPE_CONST,  {.i64 = SAMPLE_START},  0,  0, AFR, "sample" },
     {  "stop",    "stop",                 0,                       AV_OPT_TYPE_CONST,  {.i64 = SAMPLE_STOP},   0,  0, AFR, "sample" },
     {  "end",     "stop",                 0,                       AV_OPT_TYPE_CONST,  {.i64 = SAMPLE_STOP},   0,  0, AFR, "sample" },
-    { "gain_smooth", "set gain smooth factor",OFFSET(gain_smooth), AV_OPT_TYPE_FLOAT,  {.dbl = 1.00},     0.0001,  1, AFR },
-    { "gs",          "set gain smooth factor",OFFSET(gain_smooth), AV_OPT_TYPE_FLOAT,  {.dbl = 1.00},     0.0001,  1, AFR },
+    { "gain_smooth", "set gain smooth radius",OFFSET(gain_smooth), AV_OPT_TYPE_INT,    {.i64 = 0},             0, 50, AFR },
+    { "gs",          "set gain smooth radius",OFFSET(gain_smooth), AV_OPT_TYPE_INT,    {.i64 = 0},             0, 50, AFR },
     { NULL }
 };
 
@@ -357,6 +358,7 @@ static void process_frame(AVFilterContext *ctx,
     double *noisy_data = dnch->noisy_data;
     double *band_excit = dnch->band_excit;
     double *band_amt = dnch->band_amt;
+    double *smoothed_gain = dnch->smoothed_gain;
     double *gain = dnch->gain;
 
     for (int i = 0; i < s->bin_count; i++) {
@@ -424,16 +426,28 @@ static void process_frame(AVFilterContext *ctx,
         }
     }
 
-    {
-        const double f = s->gain_smooth;
-        const double F = 1. - f;
+    memcpy(smoothed_gain, gain, s->bin_count * sizeof(*smoothed_gain));
+    if (s->gain_smooth > 0) {
+        const int r = s->gain_smooth;
+
+        for (int i = r; i < s->bin_count - r; i++) {
+            const double gc = gain[i];
+            double num = 0., den = 0.;
+
+            for (int j = -r; j <= r; j++) {
+                const double g = gain[i + j];
+                const double d = 1. - fabs(g - gc);
 
-        for (int i = 1; i < s->bin_count; i++)
-            gain[i] = gain[i-1] * F + f * gain[i];
+                num += g * d;
+                den += d;
+            }
+
+            smoothed_gain[i] = num / den;
+        }
     }
 
     for (int i = 0; i < s->bin_count; i++) {
-        const double new_gain = gain[i];
+        const double new_gain = smoothed_gain[i];
 
         fft_data[i].re *= new_gain;
         fft_data[i].im *= new_gain;
@@ -685,6 +699,7 @@ static int config_input(AVFilterLink *inlink)
         dnch->band_amt = av_calloc(s->number_of_bands, sizeof(*dnch->band_amt));
         dnch->band_excit = av_calloc(s->number_of_bands, sizeof(*dnch->band_excit));
         dnch->gain = av_calloc(s->bin_count, sizeof(*dnch->gain));
+        dnch->smoothed_gain = av_calloc(s->bin_count, sizeof(*dnch->smoothed_gain));
         dnch->prior = av_calloc(s->bin_count, sizeof(*dnch->prior));
         dnch->prior_band_excit = av_calloc(s->number_of_bands, sizeof(*dnch->prior_band_excit));
         dnch->clean_data = av_calloc(s->bin_count, sizeof(*dnch->clean_data));
@@ -708,6 +723,7 @@ static int config_input(AVFilterLink *inlink)
             !dnch->band_amt ||
             !dnch->band_excit ||
             !dnch->gain ||
+            !dnch->smoothed_gain ||
             !dnch->prior ||
             !dnch->prior_band_excit ||
             !dnch->clean_data ||
@@ -1161,6 +1177,7 @@ static av_cold void uninit(AVFilterContext *ctx)
             av_freep(&dnch->band_amt);
             av_freep(&dnch->band_excit);
             av_freep(&dnch->gain);
+            av_freep(&dnch->smoothed_gain);
             av_freep(&dnch->prior);
             av_freep(&dnch->prior_band_excit);
             av_freep(&dnch->clean_data);