|
- /*
- * Copyright (c) 2018 Chris Johnson
- *
- * Permission is hereby granted, free of charge, to any person obtaining a copy
- * of this software and associated documentation files (the "Software"), to deal
- * in the Software without restriction, including without limitation the rights
- * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
- * copies of the Software, and to permit persons to whom the Software is
- * furnished to do so, subject to the following conditions:
- *
- * The above copyright notice and this permission notice shall be included in all
- * copies or substantial portions of the Software.
- *
- * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
- * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
- * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
- * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
- * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
- * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
- * SOFTWARE.
- */
-
- #include "libavutil/channel_layout.h"
- #include "libavutil/opt.h"
- #include "avfilter.h"
- #include "audio.h"
- #include "formats.h"
-
- typedef struct DeesserChannel {
- double s1, s2, s3;
- double m1, m2;
- double ratioA, ratioB;
- double iirSampleA, iirSampleB;
- int flip;
- } DeesserChannel;
-
- typedef struct DeesserContext {
- const AVClass *class;
-
- double intensity;
- double max;
- double frequency;
- int mode;
-
- DeesserChannel *chan;
- } DeesserContext;
-
- enum OutModes {
- IN_MODE,
- OUT_MODE,
- ESS_MODE,
- NB_MODES
- };
-
- #define OFFSET(x) offsetof(DeesserContext, x)
- #define A AV_OPT_FLAG_AUDIO_PARAM|AV_OPT_FLAG_FILTERING_PARAM
-
- static const AVOption deesser_options[] = {
- { "i", "set intensity", OFFSET(intensity), AV_OPT_TYPE_DOUBLE, {.dbl=0.0}, 0.0, 1.0, A },
- { "m", "set max deessing", OFFSET(max), AV_OPT_TYPE_DOUBLE, {.dbl=0.5}, 0.0, 1.0, A },
- { "f", "set frequency", OFFSET(frequency), AV_OPT_TYPE_DOUBLE, {.dbl=0.5}, 0.0, 1.0, A },
- { "s", "set output mode", OFFSET(mode), AV_OPT_TYPE_INT, {.i64=OUT_MODE}, 0, NB_MODES-1, A, "mode" },
- { "i", "input", 0, AV_OPT_TYPE_CONST, {.i64=IN_MODE}, 0, 0, A, "mode" },
- { "o", "output", 0, AV_OPT_TYPE_CONST, {.i64=OUT_MODE}, 0, 0, A, "mode" },
- { "e", "ess", 0, AV_OPT_TYPE_CONST, {.i64=ESS_MODE}, 0, 0, A, "mode" },
- { NULL }
- };
-
- AVFILTER_DEFINE_CLASS(deesser);
-
- static int query_formats(AVFilterContext *ctx)
- {
- AVFilterFormats *formats = NULL;
- AVFilterChannelLayouts *layouts = NULL;
- static const enum AVSampleFormat sample_fmts[] = {
- AV_SAMPLE_FMT_DBLP,
- AV_SAMPLE_FMT_NONE
- };
- int ret;
-
- formats = ff_make_format_list(sample_fmts);
- if (!formats)
- return AVERROR(ENOMEM);
- ret = ff_set_common_formats(ctx, formats);
- if (ret < 0)
- return ret;
-
- layouts = ff_all_channel_counts();
- if (!layouts)
- return AVERROR(ENOMEM);
-
- ret = ff_set_common_channel_layouts(ctx, layouts);
- if (ret < 0)
- return ret;
-
- formats = ff_all_samplerates();
- return ff_set_common_samplerates(ctx, formats);
- }
-
- static int config_input(AVFilterLink *inlink)
- {
- AVFilterContext *ctx = inlink->dst;
- DeesserContext *s = ctx->priv;
-
- s->chan = av_calloc(inlink->channels, sizeof(*s->chan));
- if (!s->chan)
- return AVERROR(ENOMEM);
-
- for (int i = 0; i < inlink->channels; i++) {
- DeesserChannel *chan = &s->chan[i];
-
- chan->ratioA = chan->ratioB = 1.0;
- }
-
- return 0;
- }
-
- static int filter_frame(AVFilterLink *inlink, AVFrame *in)
- {
- AVFilterContext *ctx = inlink->dst;
- AVFilterLink *outlink = ctx->outputs[0];
- DeesserContext *s = ctx->priv;
- AVFrame *out;
-
- if (av_frame_is_writable(in)) {
- out = in;
- } else {
- out = ff_get_audio_buffer(outlink, in->nb_samples);
- if (!out) {
- av_frame_free(&in);
- return AVERROR(ENOMEM);
- }
- av_frame_copy_props(out, in);
- }
-
- for (int ch = 0; ch < inlink->channels; ch++) {
- DeesserChannel *dec = &s->chan[ch];
- double *src = (double *)in->extended_data[ch];
- double *dst = (double *)out->extended_data[ch];
- double overallscale = inlink->sample_rate < 44100 ? 44100.0 / inlink->sample_rate : inlink->sample_rate / 44100.0;
- double intensity = pow(s->intensity, 5) * (8192 / overallscale);
- double maxdess = 1.0 / pow(10.0, ((s->max - 1.0) * 48.0) / 20);
- double iirAmount = pow(s->frequency, 2) / overallscale;
- double offset;
- double sense;
- double recovery;
- double attackspeed;
-
- for (int i = 0; i < in->nb_samples; i++) {
- double sample = src[i];
-
- dec->s3 = dec->s2;
- dec->s2 = dec->s1;
- dec->s1 = sample;
- dec->m1 = (dec->s1 - dec->s2) * ((dec->s1 - dec->s2) / 1.3);
- dec->m2 = (dec->s2 - dec->s3) * ((dec->s1 - dec->s2) / 1.3);
- sense = (dec->m1 - dec->m2) * ((dec->m1 - dec->m2) / 1.3);
- attackspeed = 7.0 + sense * 1024;
-
- sense = 1.0 + intensity * intensity * sense;
- sense = FFMIN(sense, intensity);
- recovery = 1.0 + (0.01 / sense);
-
- offset = 1.0 - fabs(sample);
-
- if (dec->flip) {
- dec->iirSampleA = (dec->iirSampleA * (1.0 - (offset * iirAmount))) +
- (sample * (offset * iirAmount));
- if (dec->ratioA < sense) {
- dec->ratioA = ((dec->ratioA * attackspeed) + sense) / (attackspeed + 1.0);
- } else {
- dec->ratioA = 1.0 + ((dec->ratioA - 1.0) / recovery);
- }
-
- dec->ratioA = FFMIN(dec->ratioA, maxdess);
- sample = dec->iirSampleA + ((sample - dec->iirSampleA) / dec->ratioA);
- } else {
- dec->iirSampleB = (dec->iirSampleB * (1.0 - (offset * iirAmount))) +
- (sample * (offset * iirAmount));
- if (dec->ratioB < sense) {
- dec->ratioB = ((dec->ratioB * attackspeed) + sense) / (attackspeed + 1.0);
- } else {
- dec->ratioB = 1.0 + ((dec->ratioB - 1.0) / recovery);
- }
-
- dec->ratioB = FFMIN(dec->ratioB, maxdess);
- sample = dec->iirSampleB + ((sample - dec->iirSampleB) / dec->ratioB);
- }
-
- dec->flip = !dec->flip;
-
- if (ctx->is_disabled)
- sample = src[i];
-
- switch (s->mode) {
- case IN_MODE: dst[i] = src[i]; break;
- case OUT_MODE: dst[i] = sample; break;
- case ESS_MODE: dst[i] = src[i] - sample; break;
- }
- }
- }
-
- if (out != in)
- av_frame_free(&in);
-
- return ff_filter_frame(outlink, out);
- }
-
- static av_cold void uninit(AVFilterContext *ctx)
- {
- DeesserContext *s = ctx->priv;
-
- av_freep(&s->chan);
- }
-
- static const AVFilterPad inputs[] = {
- {
- .name = "default",
- .type = AVMEDIA_TYPE_AUDIO,
- .filter_frame = filter_frame,
- .config_props = config_input,
- },
- { NULL }
- };
-
- static const AVFilterPad outputs[] = {
- {
- .name = "default",
- .type = AVMEDIA_TYPE_AUDIO,
- },
- { NULL }
- };
-
- AVFilter ff_af_deesser = {
- .name = "deesser",
- .description = NULL_IF_CONFIG_SMALL("Apply de-essing to the audio."),
- .query_formats = query_formats,
- .priv_size = sizeof(DeesserContext),
- .priv_class = &deesser_class,
- .uninit = uninit,
- .inputs = inputs,
- .outputs = outputs,
- .flags = AVFILTER_FLAG_SUPPORT_TIMELINE_INTERNAL,
- };
|