doxygen/trunk/af__deesser_8c_source.html

/*

 * Copyright (c) 2018 Chris Johnson

 *

 * Permission is hereby granted, free of charge, to any person obtaining a copy

 * of this software and associated documentation files (the "Software"), to deal

 * in the Software without restriction, including without limitation the rights

 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell

 * copies of the Software, and to permit persons to whom the Software is

 * furnished to do so, subject to the following conditions:

 *

 * The above copyright notice and this permission notice shall be included in all

 * copies or substantial portions of the Software.

 *

 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR

 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,

 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE

 * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER

 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,

 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE

 * SOFTWARE.

 */


#include "libavutil/channel_layout.h"

#include "libavutil/mem.h"

#include "libavutil/opt.h"

#include "avfilter.h"

#include "audio.h"

#include "filters.h"


typedef struct DeesserChannel {

    double s1, s2, s3;

    double m1, m2;

    double ratioA, ratioB;

    double iirSampleA, iirSampleB;

    int flip;

} DeesserChannel;


typedef struct DeesserContext {

    const AVClass *class;


    double intensity;

    double max;

    double frequency;

    int    mode;


    DeesserChannel *chan;

} DeesserContext;


enum OutModes {

    IN_MODE,

    OUT_MODE,

    ESS_MODE,

    NB_MODES

};


#define OFFSET(x) offsetof(DeesserContext, x)

#define A AV_OPT_FLAG_AUDIO_PARAM|AV_OPT_FLAG_FILTERING_PARAM


static const AVOption deesser_options[] = {

    { "i", "set intensity",    OFFSET(intensity), AV_OPT_TYPE_DOUBLE, {.dbl=0.0}, 0.0, 1.0, A },

    { "m", "set max deessing", OFFSET(max),       AV_OPT_TYPE_DOUBLE, {.dbl=0.5}, 0.0, 1.0, A },

    { "f", "set frequency",    OFFSET(frequency), AV_OPT_TYPE_DOUBLE, {.dbl=0.5}, 0.0, 1.0, A },

    { "s", "set output mode",  OFFSET(mode),      AV_OPT_TYPE_INT,    {.i64=OUT_MODE}, 0, NB_MODES-1, A, .unit = "mode" },

    {  "i", "input",           0,                 AV_OPT_TYPE_CONST,  {.i64=IN_MODE},  0, 0, A, .unit = "mode" },

    {  "o", "output",          0,                 AV_OPT_TYPE_CONST,  {.i64=OUT_MODE}, 0, 0, A, .unit = "mode" },

    {  "e", "ess",             0,                 AV_OPT_TYPE_CONST,  {.i64=ESS_MODE}, 0, 0, A, .unit = "mode" },

    { NULL }

};


AVFILTER_DEFINE_CLASS(deesser);


static int config_input(AVFilterLink *inlink)

{

    AVFilterContext *ctx = inlink->dst;

    DeesserContext *s = ctx->priv;


    s->chan = av_calloc(inlink->ch_layout.nb_channels, sizeof(*s->chan));

    if (!s->chan)

        return AVERROR(ENOMEM);


    for (int i = 0; i < inlink->ch_layout.nb_channels; i++) {

        DeesserChannel *chan = &s->chan[i];


        chan->ratioA = chan->ratioB = 1.0;

    }


    return 0;

}


static int filter_frame(AVFilterLink *inlink, AVFrame *in)

{

    AVFilterContext *ctx = inlink->dst;

    AVFilterLink *outlink = ctx->outputs[0];

    DeesserContext *s = ctx->priv;

    AVFrame *out;


    if (av_frame_is_writable(in)) {

        out = in;

    } else {

        out = ff_get_audio_buffer(outlink, in->nb_samples);

        if (!out) {

            av_frame_free(&in);

            return AVERROR(ENOMEM);

        }

        av_frame_copy_props(out, in);

    }


    for (int ch = 0; ch < inlink->ch_layout.nb_channels; ch++) {

        DeesserChannel *dec = &s->chan[ch];

        double *src = (double *)in->extended_data[ch];

        double *dst = (double *)out->extended_data[ch];

        double overallscale = inlink->sample_rate < 44100 ? 44100.0 / inlink->sample_rate : inlink->sample_rate / 44100.0;

        double intensity = pow(s->intensity, 5) * (8192 / overallscale);

        double maxdess = 1.0 / pow(10.0, ((s->max - 1.0) * 48.0) / 20);

        double iirAmount = pow(s->frequency, 2) / overallscale;

        double offset;

        double sense;

        double recovery;

        double attackspeed;


        for (int i = 0; i < in->nb_samples; i++) {

            double sample = src[i];


            dec->s3 = dec->s2;

            dec->s2 = dec->s1;

            dec->s1 = sample;

            dec->m1 = (dec->s1 - dec->s2) * ((dec->s1 - dec->s2) / 1.3);

            dec->m2 = (dec->s2 - dec->s3) * ((dec->s1 - dec->s2) / 1.3);

            sense = (dec->m1 - dec->m2) * ((dec->m1 - dec->m2) / 1.3);

            attackspeed = 7.0 + sense * 1024;


            sense = 1.0 + intensity * intensity * sense;

            sense = FFMIN(sense, intensity);

            recovery = 1.0 + (0.01 / sense);


            offset = 1.0 - fabs(sample);


            if (dec->flip) {

                dec->iirSampleA = (dec->iirSampleA * (1.0 - (offset * iirAmount))) +

                                  (sample * (offset * iirAmount));

                if (dec->ratioA < sense) {

                    dec->ratioA = ((dec->ratioA * attackspeed) + sense) / (attackspeed + 1.0);

                } else {

                    dec->ratioA = 1.0 + ((dec->ratioA - 1.0) / recovery);

                }


                dec->ratioA = FFMIN(dec->ratioA, maxdess);

                sample = dec->iirSampleA + ((sample - dec->iirSampleA) / dec->ratioA);

            } else {

                dec->iirSampleB = (dec->iirSampleB * (1.0 - (offset * iirAmount))) +

                                  (sample * (offset * iirAmount));

                if (dec->ratioB < sense) {

                    dec->ratioB = ((dec->ratioB * attackspeed) + sense) / (attackspeed + 1.0);

                } else {

                    dec->ratioB = 1.0 + ((dec->ratioB - 1.0) / recovery);

                }


                dec->ratioB = FFMIN(dec->ratioB, maxdess);

                sample = dec->iirSampleB + ((sample - dec->iirSampleB) / dec->ratioB);

            }


            dec->flip = !dec->flip;


            if (ctx->is_disabled)

                sample = src[i];


            switch (s->mode) {

            case IN_MODE:  dst[i] = src[i]; break;

            case OUT_MODE: dst[i] = sample; break;

            case ESS_MODE: dst[i] = src[i] - sample; break;

            }

        }

    }


    if (out != in)

        av_frame_free(&in);


    return ff_filter_frame(outlink, out);

}


static av_cold void uninit(AVFilterContext *ctx)

{

    DeesserContext *s = ctx->priv;


    av_freep(&s->chan);

}


static const AVFilterPad inputs[] = {

    {

        .name         = "default",

        .type         = AVMEDIA_TYPE_AUDIO,

        .filter_frame = filter_frame,

        .config_props = config_input,

    },

};


const FFFilter ff_af_deesser = {

    .p.name        = "deesser",

    .p.description = NULL_IF_CONFIG_SMALL("Apply de-essing to the audio."),

    .p.priv_class  = &deesser_class,

    .p.flags       = AVFILTER_FLAG_SUPPORT_TIMELINE_INTERNAL,

    .priv_size     = sizeof(DeesserContext),

    .uninit        = uninit,

    FILTER_INPUTS(inputs),

    FILTER_OUTPUTS(ff_audio_default_filterpad),

    FILTER_SINGLE_SAMPLEFMT(AV_SAMPLE_FMT_DBLP),

};