git.sesse.net Git - ffmpeg/blob - libavfilter/af_afir.c

   1 /*
   2  * Copyright (c) 2017 Paul B Mahol
   3  *
   4  * This file is part of FFmpeg.
   5  *
   6  * FFmpeg is free software; you can redistribute it and/or
   7  * modify it under the terms of the GNU Lesser General Public
   8  * License as published by the Free Software Foundation; either
   9  * version 2.1 of the License, or (at your option) any later version.
  10  *
  11  * FFmpeg is distributed in the hope that it will be useful,
  12  * but WITHOUT ANY WARRANTY; without even the implied warranty of
  13  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
  14  * Lesser General Public License for more details.
  15  *
  16  * You should have received a copy of the GNU Lesser General Public
  17  * License along with FFmpeg; if not, write to the Free Software
  18  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  19  */
  20
  21 /**
  22  * @file
  23  * An arbitrary audio FIR filter
  24  */
  25
  26 #include <float.h>
  27
  28 #include "libavutil/common.h"
  29 #include "libavutil/float_dsp.h"
  30 #include "libavutil/intreadwrite.h"
  31 #include "libavutil/opt.h"
  32 #include "libavutil/xga_font_data.h"
  33 #include "libavcodec/avfft.h"
  34
  35 #include "audio.h"
  36 #include "avfilter.h"
  37 #include "filters.h"
  38 #include "formats.h"
  39 #include "internal.h"
  40 #include "af_afir.h"
  41
  42 static void fcmul_add_c(float *sum, const float *t, const float *c, ptrdiff_t len)
  43 {
  44     int n;
  45
  46     for (n = 0; n < len; n++) {
  47         const float cre = c[2 * n    ];
  48         const float cim = c[2 * n + 1];
  49         const float tre = t[2 * n    ];
  50         const float tim = t[2 * n + 1];
  51
  52         sum[2 * n    ] += tre * cre - tim * cim;
  53         sum[2 * n + 1] += tre * cim + tim * cre;
  54     }
  55
  56     sum[2 * n] += t[2 * n] * c[2 * n];
  57 }
  58
  59 static int fir_channel(AVFilterContext *ctx, void *arg, int ch, int nb_jobs)
  60 {
  61     AudioFIRContext *s = ctx->priv;
  62     const float *src = (const float *)s->in[0]->extended_data[ch];
  63     int index1 = (s->index + 1) % 3;
  64     int index2 = (s->index + 2) % 3;
  65     float *sum = s->sum[ch];
  66     AVFrame *out = arg;
  67     float *block;
  68     float *dst;
  69     int n, i, j;
  70
  71     memset(sum, 0, sizeof(*sum) * s->fft_length);
  72     block = s->block[ch] + s->part_index * s->block_size;
  73     memset(block, 0, sizeof(*block) * s->fft_length);
  74
  75     s->fdsp->vector_fmul_scalar(block + s->part_size, src, s->dry_gain, FFALIGN(s->nb_samples, 4));
  76     emms_c();
  77
  78     av_rdft_calc(s->rdft[ch], block);
  79     block[2 * s->part_size] = block[1];
  80     block[1] = 0;
  81
  82     j = s->part_index;
  83
  84     for (i = 0; i < s->nb_partitions; i++) {
  85         const int coffset = i * s->coeff_size;
  86         const FFTComplex *coeff = s->coeff[ch * !s->one2many] + coffset;
  87
  88         block = s->block[ch] + j * s->block_size;
  89         s->fcmul_add(sum, block, (const float *)coeff, s->part_size);
  90
  91         if (j == 0)
  92             j = s->nb_partitions;
  93         j--;
  94     }
  95
  96     sum[1] = sum[2 * s->part_size];
  97     av_rdft_calc(s->irdft[ch], sum);
  98
  99     dst = (float *)s->buffer->extended_data[ch] + index1 * s->part_size;
 100     for (n = 0; n < s->part_size; n++) {
 101         dst[n] += sum[n];
 102     }
 103
 104     dst = (float *)s->buffer->extended_data[ch] + index2 * s->part_size;
 105
 106     memcpy(dst, sum + s->part_size, s->part_size * sizeof(*dst));
 107
 108     dst = (float *)s->buffer->extended_data[ch] + s->index * s->part_size;
 109
 110     if (out) {
 111         float *ptr = (float *)out->extended_data[ch];
 112         s->fdsp->vector_fmul_scalar(ptr, dst, s->wet_gain, FFALIGN(out->nb_samples, 4));
 113         emms_c();
 114     }
 115
 116     return 0;
 117 }
 118
 119 static int fir_frame(AudioFIRContext *s, AVFrame *in, AVFilterLink *outlink)
 120 {
 121     AVFilterContext *ctx = outlink->src;
 122     AVFrame *out = NULL;
 123     int ret;
 124
 125     s->nb_samples = in->nb_samples;
 126
 127     if (!s->want_skip) {
 128         out = ff_get_audio_buffer(outlink, s->nb_samples);
 129         if (!out)
 130             return AVERROR(ENOMEM);
 131     }
 132
 133     if (s->pts == AV_NOPTS_VALUE)
 134         s->pts = in->pts;
 135     s->in[0] = in;
 136     ctx->internal->execute(ctx, fir_channel, out, NULL, outlink->channels);
 137
 138     s->part_index = (s->part_index + 1) % s->nb_partitions;
 139
 140     if (!s->want_skip) {
 141         out->pts = s->pts;
 142         if (s->pts != AV_NOPTS_VALUE)
 143             s->pts += av_rescale_q(out->nb_samples, (AVRational){1, outlink->sample_rate}, outlink->time_base);
 144     }
 145
 146     s->index++;
 147     if (s->index == 3)
 148         s->index = 0;
 149
 150     av_frame_free(&in);
 151
 152     if (s->want_skip == 1) {
 153         s->want_skip = 0;
 154         ret = 0;
 155     } else {
 156         ret = ff_filter_frame(outlink, out);
 157     }
 158
 159     return ret;
 160 }
 161
 162 static void drawtext(AVFrame *pic, int x, int y, const char *txt, uint32_t color)
 163 {
 164     const uint8_t *font;
 165     int font_height;
 166     int i;
 167
 168     font = avpriv_cga_font, font_height = 8;
 169
 170     for (i = 0; txt[i]; i++) {
 171         int char_y, mask;
 172
 173         uint8_t *p = pic->data[0] + y * pic->linesize[0] + (x + i * 8) * 4;
 174         for (char_y = 0; char_y < font_height; char_y++) {
 175             for (mask = 0x80; mask; mask >>= 1) {
 176                 if (font[txt[i] * font_height + char_y] & mask)
 177                     AV_WL32(p, color);
 178                 p += 4;
 179             }
 180             p += pic->linesize[0] - 8 * 4;
 181         }
 182     }
 183 }
 184
 185 static void draw_line(AVFrame *out, int x0, int y0, int x1, int y1, uint32_t color)
 186 {
 187     int dx = FFABS(x1-x0);
 188     int dy = FFABS(y1-y0), sy = y0 < y1 ? 1 : -1;
 189     int err = (dx>dy ? dx : -dy) / 2, e2;
 190
 191     for (;;) {
 192         AV_WL32(out->data[0] + y0 * out->linesize[0] + x0 * 4, color);
 193
 194         if (x0 == x1 && y0 == y1)
 195             break;
 196
 197         e2 = err;
 198
 199         if (e2 >-dx) {
 200             err -= dy;
 201             x0--;
 202         }
 203
 204         if (e2 < dy) {
 205             err += dx;
 206             y0 += sy;
 207         }
 208     }
 209 }
 210
/**
 * Render the frequency response of one impulse-response channel into a
 * video frame.
 *
 * For each of the s->w pixel columns the IR taps held in s->in[1] are
 * evaluated at an angular frequency between 0 and pi, giving magnitude,
 * phase and delay values. The three curves are then drawn as connected line
 * segments and, for frames larger than 400x100, annotated with min/max
 * labels.
 *
 * If any of the scratch arrays cannot be allocated the frame is left
 * cleared and the function returns without reporting an error.
 *
 * @param ctx filter context; s->in[1] must hold the IR frame
 * @param out frame to draw into (plane 0, 4 bytes per pixel)
 */
static void draw_response(AVFilterContext *ctx, AVFrame *out)
{
    AudioFIRContext *s = ctx->priv;
    /* NOTE(review): FLT_MIN is the smallest positive normalized float, not
     * the most negative one. As a starting value for a running maximum it
     * acts as a tiny positive floor; max_delay can therefore never end up
     * below it even if every delay value is negative. */
    float *mag, *phase, *delay, min = FLT_MAX, max = FLT_MIN;
    float min_delay = FLT_MAX, max_delay = FLT_MIN;
    int prev_ymag = -1, prev_yphase = -1, prev_ydelay = -1;
    char text[32];
    int channel, i, x;

    /* Start from an all-zero picture. */
    memset(out->data[0], 0, s->h * out->linesize[0]);

    phase = av_malloc_array(s->w, sizeof(*phase));
    mag = av_malloc_array(s->w, sizeof(*mag));
    delay = av_malloc_array(s->w, sizeof(*delay));
    if (!mag || !phase || !delay)
        goto end;

    /* Clamp the requested channel to what the IR frame actually has. */
    channel = av_clip(s->ir_channel, 0, s->in[1]->channels - 1);
    for (i = 0; i < s->w; i++) {
        const float *src = (const float *)s->in[1]->extended_data[channel];
        /* Column i maps linearly onto [0, pi].
         * NOTE(review): divides by zero when s->w == 1. */
        double w = i * M_PI / (s->w - 1);
        double div, real_num = 0., imag_num = 0., real = 0., imag = 0.;

        /* Direct evaluation of the transform (and of its tap-index-weighted
         * counterpart used for the delay) at frequency w. */
        for (x = 0; x < s->nb_taps; x++) {
            real += cos(-x * w) * src[x];
            imag += sin(-x * w) * src[x];
            real_num += cos(-x * w) * src[x] * x;
            imag_num += sin(-x * w) * src[x] * x;
        }

        mag[i] = hypot(real, imag);
        phase[i] = atan2(imag, real);
        div = real * real + imag * imag;
        /* NOTE(review): div is zero wherever the response is exactly zero. */
        delay[i] = (real_num * real + imag_num * imag) / div;
        min = fminf(min, mag[i]);
        max = fmaxf(max, mag[i]);
        min_delay = fminf(min_delay, delay[i]);
        max_delay = fmaxf(max_delay, delay[i]);
    }

    for (i = 0; i < s->w; i++) {
        /* Scale each quantity to a row in [0, h - 1]: magnitude relative to
         * its maximum, delay relative to its observed range, phase from
         * [-pi, pi]. */
        int ymag = mag[i] / max * (s->h - 1);
        int ydelay = (delay[i] - min_delay) / (max_delay - min_delay) * (s->h - 1);
        int yphase = (0.5 * (1. + phase[i] / M_PI)) * (s->h - 1);

        /* Flip vertically so that larger values are drawn higher up. */
        ymag = s->h - 1 - av_clip(ymag, 0, s->h - 1);
        yphase = s->h - 1 - av_clip(yphase, 0, s->h - 1);
        ydelay = s->h - 1 - av_clip(ydelay, 0, s->h - 1);

        /* First column: no previous point yet, so draw a single pixel. */
        if (prev_ymag < 0)
            prev_ymag = ymag;
        if (prev_yphase < 0)
            prev_yphase = yphase;
        if (prev_ydelay < 0)
            prev_ydelay = ydelay;

        /* Connect this column to the previous one, one colour per curve. */
        draw_line(out, i,   ymag, FFMAX(i - 1, 0),   prev_ymag, 0xFFFF00FF);
        draw_line(out, i, yphase, FFMAX(i - 1, 0), prev_yphase, 0xFF00FF00);
        draw_line(out, i, ydelay, FFMAX(i - 1, 0), prev_ydelay, 0xFF00FFFF);

        prev_ymag   = ymag;
        prev_yphase = yphase;
        prev_ydelay = ydelay;
    }

    /* Only annotate when the picture is large enough for the labels. */
    if (s->w > 400 && s->h > 100) {
        drawtext(out, 2, 2, "Max Magnitude:", 0xDDDDDDDD);
        snprintf(text, sizeof(text), "%.2f", max);
        drawtext(out, 15 * 8 + 2, 2, text, 0xDDDDDDDD);

        drawtext(out, 2, 12, "Min Magnitude:", 0xDDDDDDDD);
        snprintf(text, sizeof(text), "%.2f", min);
        drawtext(out, 15 * 8 + 2, 12, text, 0xDDDDDDDD);

        drawtext(out, 2, 22, "Max Delay:", 0xDDDDDDDD);
        snprintf(text, sizeof(text), "%.2f", max_delay);
        drawtext(out, 11 * 8 + 2, 22, text, 0xDDDDDDDD);

        drawtext(out, 2, 32, "Min Delay:", 0xDDDDDDDD);
        snprintf(text, sizeof(text), "%.2f", min_delay);
        drawtext(out, 11 * 8 + 2, 32, text, 0xDDDDDDDD);
    }

end:
    av_free(delay);
    av_free(phase);
    av_free(mag);
}
 299
/**
 * Turn the fully received impulse response into per-partition frequency
 * domain coefficients and allocate all processing buffers.
 *
 * Steps, in order: derive transform/partition sizes from the number of
 * queued IR samples, allocate the per-channel work buffers and transform
 * contexts, pull the IR samples into s->in[1], optionally draw the response
 * picture, apply the selected gain normalization, then transform every
 * partition of every IR channel into s->coeff. On success s->have_coeffs is
 * set and the IR frame is released.
 *
 * Buffers allocated before an error return are not released here; uninit()
 * frees them.
 *
 * @param ctx filter context
 * @return 0 on success, a negative AVERROR code on failure
 */
static int convert_coeffs(AVFilterContext *ctx)
{
    AudioFIRContext *s = ctx->priv;
    int ret, i, ch, n, N;
    float power = 0;

    s->nb_taps = ff_inlink_queued_samples(ctx->inputs[1]);
    if (s->nb_taps <= 0)
        return AVERROR(EINVAL);

    /* n: smallest exponent >= 4 with 2^n >= nb_taps; N caps it at 16 so that
     * longer responses are split into several partitions. */
    for (n = 4; (1 << n) < s->nb_taps; n++);
    N = FFMIN(n, 16);
    s->ir_length = 1 << n;
    s->fft_length = (1 << (N + 1)) + 1;
    s->part_size = 1 << (N - 1);
    s->block_size = FFALIGN(s->fft_length, 32);
    s->coeff_size = FFALIGN(s->part_size + 1, 32);
    /* Number of part_size chunks needed to cover all taps (rounded up). */
    s->nb_partitions = (s->nb_taps + s->part_size - 1) / s->part_size;
    s->nb_coeffs = s->ir_length + s->nb_partitions;

    /* Accumulator used by fir_channel(), one per main-input channel. */
    for (ch = 0; ch < ctx->inputs[0]->channels; ch++) {
        s->sum[ch] = av_calloc(s->fft_length, sizeof(**s->sum));
        if (!s->sum[ch])
            return AVERROR(ENOMEM);
    }

    /* Coefficient storage, one per IR channel, nb_partitions slices each. */
    for (ch = 0; ch < ctx->inputs[1]->channels; ch++) {
        s->coeff[ch] = av_calloc(s->nb_partitions * s->coeff_size, sizeof(**s->coeff));
        if (!s->coeff[ch])
            return AVERROR(ENOMEM);
    }

    /* Input spectra history, one per main-input channel. */
    for (ch = 0; ch < ctx->inputs[0]->channels; ch++) {
        s->block[ch] = av_calloc(s->nb_partitions * s->block_size, sizeof(**s->block));
        if (!s->block[ch])
            return AVERROR(ENOMEM);
    }

    /* Forward and inverse transform contexts, one pair per channel. */
    for (ch = 0; ch < ctx->inputs[0]->channels; ch++) {
        s->rdft[ch]  = av_rdft_init(N, DFT_R2C);
        s->irdft[ch] = av_rdft_init(N, IDFT_C2R);
        if (!s->rdft[ch] || !s->irdft[ch])
            return AVERROR(ENOMEM);
    }

    /* Three part_size slots per channel, rotated by fir_frame(). */
    s->buffer = ff_get_audio_buffer(ctx->inputs[0], s->part_size * 3);
    if (!s->buffer)
        return AVERROR(ENOMEM);

    /* Fetch exactly the nb_taps samples counted above as one frame. */
    ret = ff_inlink_consume_samples(ctx->inputs[1], s->nb_taps, s->nb_taps, &s->in[1]);
    if (ret < 0)
        return ret;
    if (ret == 0)
        return AVERROR_BUG;

    /* The picture is drawn from the raw taps, before any gain is applied. */
    if (s->response)
        draw_response(ctx, s->video);

    s->gain = 1;

    /* Gain normalization; the cases correspond to the "gtype" option
     * constants none (-1), peak (0), dc (1) and gn (2). */
    switch (s->gtype) {
    case -1:
        /* nothing to do */
        break;
    case 0:
        /* Sum of absolute tap values over all IR channels. */
        for (ch = 0; ch < ctx->inputs[1]->channels; ch++) {
            float *time = (float *)s->in[1]->extended_data[!s->one2many * ch];

            for (i = 0; i < s->nb_taps; i++)
                power += FFABS(time[i]);
        }
        s->gain = ctx->inputs[1]->channels / power;
        break;
    case 1:
        /* Plain sum of tap values over all IR channels. */
        for (ch = 0; ch < ctx->inputs[1]->channels; ch++) {
            float *time = (float *)s->in[1]->extended_data[!s->one2many * ch];

            for (i = 0; i < s->nb_taps; i++)
                power += time[i];
        }
        s->gain = ctx->inputs[1]->channels / power;
        break;
    case 2:
        /* Sum of squared tap values over all IR channels. */
        for (ch = 0; ch < ctx->inputs[1]->channels; ch++) {
            float *time = (float *)s->in[1]->extended_data[!s->one2many * ch];

            for (i = 0; i < s->nb_taps; i++)
                power += time[i] * time[i];
        }
        /* ch equals the IR channel count once the loop above has finished. */
        s->gain = sqrtf(ch / power);
        break;
    default:
        return AVERROR_BUG;
    }

    /* Combine with the user IR gain; the result is never allowed above 1. */
    s->gain = FFMIN(s->gain * s->ir_gain, 1.f);
    av_log(ctx, AV_LOG_DEBUG, "power %f, gain %f\n", power, s->gain);
    for (ch = 0; ch < ctx->inputs[1]->channels; ch++) {
        float *time = (float *)s->in[1]->extended_data[!s->one2many * ch];

        /* Scales in place; the count is rounded up to a multiple of 4,
         * presumably relying on frame buffer padding - TODO confirm. */
        s->fdsp->vector_fmul_scalar(time, time, s->gain, FFALIGN(s->nb_taps, 4));
    }

    for (ch = 0; ch < ctx->inputs[1]->channels; ch++) {
        float *time = (float *)s->in[1]->extended_data[!s->one2many * ch];
        /* s->block[ch] is borrowed as scratch space for the transform. */
        float *block = s->block[ch];
        FFTComplex *coeff = s->coeff[ch];

        /* Zero the taps beyond the requested fraction of the IR; the first
         * tap is always kept. */
        for (i = FFMAX(1, s->length * s->nb_taps); i < s->nb_taps; i++)
            time[i] = 0;

        for (i = 0; i < s->nb_partitions; i++) {
            const float scale = 1.f / s->part_size;
            const int toffset = i * s->part_size;
            const int coffset = i * s->coeff_size;
            const int boffset = s->part_size;
            const int remaining = s->nb_taps - (i * s->part_size);
            /* The last partition may be shorter than part_size. */
            const int size = remaining >= s->part_size ? s->part_size : remaining;

            /* Taps go into the upper half of a zeroed block. */
            memset(block, 0, sizeof(*block) * s->fft_length);
            memcpy(block + boffset, time + toffset, size * sizeof(*block));

            /* The channel 0 context is used for every IR channel here. */
            av_rdft_calc(s->rdft[0], block);

            /* Unpack into part_size + 1 complex values: block[0] becomes the
             * first (purely real) entry and block[1] the last one. */
            coeff[coffset].re = block[0] * scale;
            coeff[coffset].im = 0;
            for (n = 1; n < s->part_size; n++) {
                coeff[coffset + n].re = block[2 * n] * scale;
                coeff[coffset + n].im = block[2 * n + 1] * scale;
            }
            coeff[coffset + s->part_size].re = block[1] * scale;
            coeff[coffset + s->part_size].im = 0;
        }
    }

    av_frame_free(&s->in[1]);
    av_log(ctx, AV_LOG_DEBUG, "nb_taps: %d\n", s->nb_taps);
    av_log(ctx, AV_LOG_DEBUG, "nb_partitions: %d\n", s->nb_partitions);
    av_log(ctx, AV_LOG_DEBUG, "partition size: %d\n", s->part_size);
    av_log(ctx, AV_LOG_DEBUG, "ir_length: %d\n", s->ir_length);

    s->have_coeffs = 1;

    return 0;
}
 445
 446 static int check_ir(AVFilterLink *link, AVFrame *frame)
 447 {
 448     AVFilterContext *ctx = link->dst;
 449     AudioFIRContext *s = ctx->priv;
 450     int nb_taps, max_nb_taps;
 451
 452     nb_taps = ff_inlink_queued_samples(link);
 453     max_nb_taps = s->max_ir_len * ctx->outputs[0]->sample_rate;
 454     if (nb_taps > max_nb_taps) {
 455         av_log(ctx, AV_LOG_ERROR, "Too big number of coefficients: %d > %d.\n", nb_taps, max_nb_taps);
 456         return AVERROR(EINVAL);
 457     }
 458
 459     return 0;
 460 }
 461
 462 static int activate(AVFilterContext *ctx)
 463 {
 464     AudioFIRContext *s = ctx->priv;
 465     AVFilterLink *outlink = ctx->outputs[0];
 466     AVFrame *in = NULL;
 467     int ret, status;
 468     int64_t pts;
 469
 470     FF_FILTER_FORWARD_STATUS_BACK_ALL(ctx->outputs[0], ctx);
 471     if (s->response)
 472         FF_FILTER_FORWARD_STATUS_BACK_ALL(ctx->outputs[1], ctx);
 473     if (!s->eof_coeffs) {
 474         AVFrame *ir = NULL;
 475
 476         ret = check_ir(ctx->inputs[1], ir);
 477         if (ret < 0)
 478             return ret;
 479
 480         if (ff_outlink_get_status(ctx->inputs[1]) == AVERROR_EOF)
 481             s->eof_coeffs = 1;
 482
 483         if (!s->eof_coeffs) {
 484             if (ff_outlink_frame_wanted(ctx->outputs[0]))
 485                 ff_inlink_request_frame(ctx->inputs[1]);
 486             return 0;
 487         }
 488     }
 489
 490     if (!s->have_coeffs && s->eof_coeffs) {
 491         ret = convert_coeffs(ctx);
 492         if (ret < 0)
 493             return ret;
 494     }
 495
 496     if (s->need_padding) {
 497         in = ff_get_audio_buffer(outlink, s->part_size);
 498         if (!in)
 499             return AVERROR(ENOMEM);
 500         s->need_padding = 0;
 501         ret = 1;
 502     } else {
 503         ret = ff_inlink_consume_samples(ctx->inputs[0], s->part_size, s->part_size, &in);
 504     }
 505
 506     if (ret > 0)
 507         ret = fir_frame(s, in, outlink);
 508
 509     if (ret < 0)
 510         return ret;
 511
 512     if (s->response && s->have_coeffs) {
 513         if (ff_outlink_frame_wanted(ctx->outputs[1])) {
 514             s->video->pts = s->pts;
 515             return ff_filter_frame(ctx->outputs[1], av_frame_clone(s->video));
 516         }
 517     }
 518
 519     if (ff_inlink_acknowledge_status(ctx->inputs[0], &status, &pts)) {
 520         if (status == AVERROR_EOF) {
 521             ff_outlink_set_status(ctx->outputs[0], status, pts);
 522             if (s->response)
 523                 ff_outlink_set_status(ctx->outputs[1], status, pts);
 524             return 0;
 525         }
 526     }
 527
 528     if (ff_outlink_frame_wanted(ctx->outputs[0])) {
 529         ff_inlink_request_frame(ctx->inputs[0]);
 530         return 0;
 531     }
 532
 533     if (s->response && ff_outlink_frame_wanted(ctx->outputs[1])) {
 534         ff_inlink_request_frame(ctx->inputs[0]);
 535         return 0;
 536     }
 537
 538     return 0;
 539 }
 540
 541 static int query_formats(AVFilterContext *ctx)
 542 {
 543     AudioFIRContext *s = ctx->priv;
 544     AVFilterFormats *formats;
 545     AVFilterChannelLayouts *layouts;
 546     static const enum AVSampleFormat sample_fmts[] = {
 547         AV_SAMPLE_FMT_FLTP,
 548         AV_SAMPLE_FMT_NONE
 549     };
 550     static const enum AVPixelFormat pix_fmts[] = {
 551         AV_PIX_FMT_RGB0,
 552         AV_PIX_FMT_NONE
 553     };
 554     int ret;
 555
 556     if (s->response) {
 557         AVFilterLink *videolink = ctx->outputs[1];
 558         formats = ff_make_format_list(pix_fmts);
 559         if ((ret = ff_formats_ref(formats, &videolink->in_formats)) < 0)
 560             return ret;
 561     }
 562
 563     layouts = ff_all_channel_counts();
 564     if (!layouts)
 565         return AVERROR(ENOMEM);
 566
 567     if (s->ir_format) {
 568         ret = ff_set_common_channel_layouts(ctx, layouts);
 569         if (ret < 0)
 570             return ret;
 571     } else {
 572         AVFilterChannelLayouts *mono = NULL;
 573
 574         ret = ff_add_channel_layout(&mono, AV_CH_LAYOUT_MONO);
 575         if (ret)
 576             return ret;
 577
 578         if ((ret = ff_channel_layouts_ref(layouts, &ctx->inputs[0]->out_channel_layouts)) < 0)
 579             return ret;
 580         if ((ret = ff_channel_layouts_ref(layouts, &ctx->outputs[0]->in_channel_layouts)) < 0)
 581             return ret;
 582         if ((ret = ff_channel_layouts_ref(mono, &ctx->inputs[1]->out_channel_layouts)) < 0)
 583             return ret;
 584     }
 585
 586     formats = ff_make_format_list(sample_fmts);
 587     if ((ret = ff_set_common_formats(ctx, formats)) < 0)
 588         return ret;
 589
 590     formats = ff_all_samplerates();
 591     return ff_set_common_samplerates(ctx, formats);
 592 }
 593
 594 static int config_output(AVFilterLink *outlink)
 595 {
 596     AVFilterContext *ctx = outlink->src;
 597     AudioFIRContext *s = ctx->priv;
 598
 599     s->one2many = ctx->inputs[1]->channels == 1;
 600     outlink->sample_rate = ctx->inputs[0]->sample_rate;
 601     outlink->time_base   = ctx->inputs[0]->time_base;
 602     outlink->channel_layout = ctx->inputs[0]->channel_layout;
 603     outlink->channels = ctx->inputs[0]->channels;
 604
 605     s->sum = av_calloc(outlink->channels, sizeof(*s->sum));
 606     s->coeff = av_calloc(ctx->inputs[1]->channels, sizeof(*s->coeff));
 607     s->block = av_calloc(ctx->inputs[0]->channels, sizeof(*s->block));
 608     s->rdft = av_calloc(outlink->channels, sizeof(*s->rdft));
 609     s->irdft = av_calloc(outlink->channels, sizeof(*s->irdft));
 610     if (!s->sum || !s->coeff || !s->block || !s->rdft || !s->irdft)
 611         return AVERROR(ENOMEM);
 612
 613     s->nb_channels = outlink->channels;
 614     s->nb_coef_channels = ctx->inputs[1]->channels;
 615     s->want_skip = 1;
 616     s->need_padding = 1;
 617     s->pts = AV_NOPTS_VALUE;
 618
 619     return 0;
 620 }
 621
 622 static av_cold void uninit(AVFilterContext *ctx)
 623 {
 624     AudioFIRContext *s = ctx->priv;
 625     int ch;
 626
 627     if (s->sum) {
 628         for (ch = 0; ch < s->nb_channels; ch++) {
 629             av_freep(&s->sum[ch]);
 630         }
 631     }
 632     av_freep(&s->sum);
 633
 634     if (s->coeff) {
 635         for (ch = 0; ch < s->nb_coef_channels; ch++) {
 636             av_freep(&s->coeff[ch]);
 637         }
 638     }
 639     av_freep(&s->coeff);
 640
 641     if (s->block) {
 642         for (ch = 0; ch < s->nb_channels; ch++) {
 643             av_freep(&s->block[ch]);
 644         }
 645     }
 646     av_freep(&s->block);
 647
 648     if (s->rdft) {
 649         for (ch = 0; ch < s->nb_channels; ch++) {
 650             av_rdft_end(s->rdft[ch]);
 651         }
 652     }
 653     av_freep(&s->rdft);
 654
 655     if (s->irdft) {
 656         for (ch = 0; ch < s->nb_channels; ch++) {
 657             av_rdft_end(s->irdft[ch]);
 658         }
 659     }
 660     av_freep(&s->irdft);
 661
 662     av_frame_free(&s->in[1]);
 663     av_frame_free(&s->buffer);
 664
 665     av_freep(&s->fdsp);
 666
 667     for (int i = 0; i < ctx->nb_outputs; i++)
 668         av_freep(&ctx->output_pads[i].name);
 669     av_frame_free(&s->video);
 670 }
 671
 672 static int config_video(AVFilterLink *outlink)
 673 {
 674     AVFilterContext *ctx = outlink->src;
 675     AudioFIRContext *s = ctx->priv;
 676
 677     outlink->sample_aspect_ratio = (AVRational){1,1};
 678     outlink->w = s->w;
 679     outlink->h = s->h;
 680
 681     av_frame_free(&s->video);
 682     s->video = ff_get_video_buffer(outlink, outlink->w, outlink->h);
 683     if (!s->video)
 684         return AVERROR(ENOMEM);
 685
 686     return 0;
 687 }
 688
 689 static av_cold int init(AVFilterContext *ctx)
 690 {
 691     AudioFIRContext *s = ctx->priv;
 692     AVFilterPad pad, vpad;
 693     int ret;
 694
 695     pad = (AVFilterPad){
 696         .name          = av_strdup("default"),
 697         .type          = AVMEDIA_TYPE_AUDIO,
 698         .config_props  = config_output,
 699     };
 700
 701     if (!pad.name)
 702         return AVERROR(ENOMEM);
 703
 704     if (s->response) {
 705         vpad = (AVFilterPad){
 706             .name         = av_strdup("filter_response"),
 707             .type         = AVMEDIA_TYPE_VIDEO,
 708             .config_props = config_video,
 709         };
 710         if (!vpad.name)
 711             return AVERROR(ENOMEM);
 712     }
 713
 714     ret = ff_insert_outpad(ctx, 0, &pad);
 715     if (ret < 0) {
 716         av_freep(&pad.name);
 717         return ret;
 718     }
 719
 720     if (s->response) {
 721         ret = ff_insert_outpad(ctx, 1, &vpad);
 722         if (ret < 0) {
 723             av_freep(&vpad.name);
 724             return ret;
 725         }
 726     }
 727
 728     s->fcmul_add = fcmul_add_c;
 729
 730     s->fdsp = avpriv_float_dsp_alloc(0);
 731     if (!s->fdsp)
 732         return AVERROR(ENOMEM);
 733
 734     if (ARCH_X86)
 735         ff_afir_init_x86(s);
 736
 737     return 0;
 738 }
 739
/*
 * Static input pads. Index 0 ("main") carries the audio to be filtered,
 * index 1 ("ir") carries the impulse response whose samples become the
 * filter taps. The code refers to them as ctx->inputs[0] and ctx->inputs[1].
 */
static const AVFilterPad afir_inputs[] = {
    {
        .name           = "main",
        .type           = AVMEDIA_TYPE_AUDIO,
    },{
        .name           = "ir",
        .type           = AVMEDIA_TYPE_AUDIO,
    },
    { NULL }
};
 750
/* Option flag shorthands: AF for audio-related, VF for video-related options. */
#define AF AV_OPT_FLAG_AUDIO_PARAM|AV_OPT_FLAG_FILTERING_PARAM
#define VF AV_OPT_FLAG_VIDEO_PARAM|AV_OPT_FLAG_FILTERING_PARAM
/* Byte offset of a field inside the private context. */
#define OFFSET(x) offsetof(AudioFIRContext, x)

/*
 * User options.
 *  - dry / wet: gains applied to the input before transforming and to the
 *    output after filtering, respectively.
 *  - length:    fraction of the impulse response that is kept; taps beyond
 *    it are zeroed.
 *  - gtype:     gain normalization mode (none, peak, dc, gn).
 *  - irgain:    extra gain multiplied into the normalization gain.
 *  - irfmt:     mono forces a single-channel IR, input shares the channel
 *    layout of the main input.
 *  - maxir:     upper bound on the IR length; it is multiplied by the sample
 *    rate before being compared with the sample count, i.e. it is in seconds.
 *  - response / channel / size: enable the response video output, pick the
 *    IR channel it shows and set its dimensions. "size" is stored at w and
 *    presumably also fills the adjacent h field - TODO confirm against the
 *    context layout in af_afir.h.
 */
static const AVOption afir_options[] = {
    { "dry",    "set dry gain",      OFFSET(dry_gain),   AV_OPT_TYPE_FLOAT, {.dbl=1},    0, 10, AF },
    { "wet",    "set wet gain",      OFFSET(wet_gain),   AV_OPT_TYPE_FLOAT, {.dbl=1},    0, 10, AF },
    { "length", "set IR length",     OFFSET(length),     AV_OPT_TYPE_FLOAT, {.dbl=1},    0,  1, AF },
    { "gtype",  "set IR auto gain type",OFFSET(gtype),   AV_OPT_TYPE_INT,   {.i64=0},   -1,  2, AF, "gtype" },
    {  "none",  "without auto gain", 0,                  AV_OPT_TYPE_CONST, {.i64=-1},   0,  0, AF, "gtype" },
    {  "peak",  "peak gain",         0,                  AV_OPT_TYPE_CONST, {.i64=0},    0,  0, AF, "gtype" },
    {  "dc",    "DC gain",           0,                  AV_OPT_TYPE_CONST, {.i64=1},    0,  0, AF, "gtype" },
    {  "gn",    "gain to noise",     0,                  AV_OPT_TYPE_CONST, {.i64=2},    0,  0, AF, "gtype" },
    { "irgain", "set IR gain",       OFFSET(ir_gain),    AV_OPT_TYPE_FLOAT, {.dbl=1},    0,  1, AF },
    { "irfmt",  "set IR format",     OFFSET(ir_format),  AV_OPT_TYPE_INT,   {.i64=1},    0,  1, AF, "irfmt" },
    {  "mono",  "single channel",    0,                  AV_OPT_TYPE_CONST, {.i64=0},    0,  0, AF, "irfmt" },
    {  "input", "same as input",     0,                  AV_OPT_TYPE_CONST, {.i64=1},    0,  0, AF, "irfmt" },
    { "maxir",  "set max IR length", OFFSET(max_ir_len), AV_OPT_TYPE_FLOAT, {.dbl=30}, 0.1, 60, AF },
    { "response", "show IR frequency response", OFFSET(response), AV_OPT_TYPE_BOOL, {.i64=0}, 0, 1, VF },
    { "channel", "set IR channel to display frequency response", OFFSET(ir_channel), AV_OPT_TYPE_INT, {.i64=0}, 0, 1024, VF },
    { "size",   "set video size",    OFFSET(w),          AV_OPT_TYPE_IMAGE_SIZE, {.str = "hd720"}, 0, 0, VF },
    { NULL }
};

/* Defines afir_class, which ff_af_afir references as its priv_class. */
AVFILTER_DEFINE_CLASS(afir);
 776
/*
 * Filter definition. There is no static .outputs table: the output pads are
 * created in init() (hence AVFILTER_FLAG_DYNAMIC_OUTPUTS). Scheduling goes
 * through the activate callback, and per-channel work is dispatched through
 * ctx->internal->execute() (AVFILTER_FLAG_SLICE_THREADS).
 */
AVFilter ff_af_afir = {
    .name          = "afir",
    .description   = NULL_IF_CONFIG_SMALL("Apply Finite Impulse Response filter with supplied coefficients in 2nd stream."),
    .priv_size     = sizeof(AudioFIRContext),
    .priv_class    = &afir_class,
    .query_formats = query_formats,
    .init          = init,
    .activate      = activate,
    .uninit        = uninit,
    .inputs        = afir_inputs,
    .flags         = AVFILTER_FLAG_DYNAMIC_OUTPUTS |
                     AVFILTER_FLAG_SLICE_THREADS,
};