FATE: add a test for the overlay filter

[ffmpeg] / libavfilter / avfiltergraph.c
diff --git a/libavfilter/avfiltergraph.c b/libavfilter/avfiltergraph.c

index 4521f790f7920f54f426796ea88c982b8cf9df27..516617e62bd9e336d4d1fe3517087a69eaa3430a 100644 (file)
--- a/libavfilter/avfiltergraph.c
+++ b/libavfilter/avfiltergraph.c
@@ -20,17 +20,17 @@
   * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
   */
  
-#include <ctype.h>
  #include <string.h>
  
+#include "libavutil/avassert.h"
+#include "libavutil/channel_layout.h"
+#include "libavutil/common.h"
+#include "libavutil/log.h"
  #include "avfilter.h"
  #include "avfiltergraph.h"
  #include "formats.h"
  #include "internal.h"
  
-#include "libavutil/audioconvert.h"
-#include "libavutil/log.h"
-
  static const AVClass filtergraph_class = {
      .class_name = "AVFilterGraph",
      .item_name  = av_default_item_name,
@@ -39,12 +39,10 @@ static const AVClass filtergraph_class = {
  
  AVFilterGraph *avfilter_graph_alloc(void)
  {
-    AVFilterGraph *ret = av_mallocz(sizeof(AVFilterGraph));
+    AVFilterGraph *ret = av_mallocz(sizeof(*ret));
      if (!ret)
          return NULL;
-#if FF_API_GRAPH_AVCLASS
      ret->av_class = &filtergraph_class;
-#endif
      return ret;
  }
  
@@ -52,9 +50,10 @@ void avfilter_graph_free(AVFilterGraph **graph)
  {
      if (!*graph)
          return;
-    for (; (*graph)->filter_count > 0; (*graph)->filter_count--)
-        avfilter_free((*graph)->filters[(*graph)->filter_count - 1]);
+    for (; (*graph)->nb_filters > 0; (*graph)->nb_filters--)
+        avfilter_free((*graph)->filters[(*graph)->nb_filters - 1]);
      av_freep(&(*graph)->scale_sws_opts);
+    av_freep(&(*graph)->resample_lavr_opts);
      av_freep(&(*graph)->filters);
      av_freep(graph);
  }
@@ -62,12 +61,12 @@ void avfilter_graph_free(AVFilterGraph **graph)
  int avfilter_graph_add_filter(AVFilterGraph *graph, AVFilterContext *filter)
  {
      AVFilterContext **filters = av_realloc(graph->filters,
-                                           sizeof(AVFilterContext*) * (graph->filter_count+1));
+                                           sizeof(*filters) * (graph->nb_filters + 1));
      if (!filters)
          return AVERROR(ENOMEM);
  
      graph->filters = filters;
-    graph->filters[graph->filter_count++] = filter;
+    graph->filters[graph->nb_filters++] = filter;
  
      return 0;
  }
@@ -106,7 +105,7 @@ static int graph_check_validity(AVFilterGraph *graph, AVClass *log_ctx)
      AVFilterContext *filt;
      int i, j;
  
-    for (i = 0; i < graph->filter_count; i++) {
+    for (i = 0; i < graph->nb_filters; i++) {
          filt = graph->filters[i];
  
          for (j = 0; j < filt->nb_inputs; j++) {
@@ -141,7 +140,7 @@ static int graph_config_links(AVFilterGraph *graph, AVClass *log_ctx)
      AVFilterContext *filt;
      int i, ret;
  
-    for (i=0; i < graph->filter_count; i++) {
+    for (i = 0; i < graph->nb_filters; i++) {
          filt = graph->filters[i];
  
          if (!filt->nb_outputs) {
@@ -157,7 +156,7 @@ AVFilterContext *avfilter_graph_get_filter(AVFilterGraph *graph, char *name)
  {
      int i;
  
-    for (i = 0; i < graph->filter_count; i++)
+    for (i = 0; i < graph->nb_filters; i++)
          if (graph->filters[i]->name && !strcmp(name, graph->filters[i]->name))
              return graph->filters[i];
  
@@ -170,7 +169,7 @@ static int query_formats(AVFilterGraph *graph, AVClass *log_ctx)
      int scaler_count = 0, resampler_count = 0;
  
      /* ask all the sub-filters for their supported media formats */
-    for (i = 0; i < graph->filter_count; i++) {
+    for (i = 0; i < graph->nb_filters; i++) {
          if (graph->filters[i]->filter->query_formats)
              graph->filters[i]->filter->query_formats(graph->filters[i]);
          else
@@ -178,7 +177,7 @@ static int query_formats(AVFilterGraph *graph, AVClass *log_ctx)
      }
  
      /* go through and merge as many format lists as possible */
-    for (i = 0; i < graph->filter_count; i++) {
+    for (i = 0; i < graph->nb_filters; i++) {
          AVFilterContext *filter = graph->filters[i];
  
          for (j = 0; j < filter->nb_inputs; j++) {
@@ -213,11 +212,16 @@ static int query_formats(AVFilterGraph *graph, AVClass *log_ctx)
                  /* couldn't merge format lists. auto-insert conversion filter */
                  switch (link->type) {
                  case AVMEDIA_TYPE_VIDEO:
+                    if (!(filter = avfilter_get_by_name("scale"))) {
+                        av_log(log_ctx, AV_LOG_ERROR, "'scale' filter "
+                               "not present, cannot convert pixel formats.\n");
+                        return AVERROR(EINVAL);
+                    }
+
                      snprintf(inst_name, sizeof(inst_name), "auto-inserted scaler %d",
                               scaler_count++);
                      snprintf(scale_args, sizeof(scale_args), "0:0:%s", graph->scale_sws_opts);
-                    if ((ret = avfilter_graph_create_filter(&convert,
-                                                            avfilter_get_by_name("scale"),
+                    if ((ret = avfilter_graph_create_filter(&convert, filter,
                                                              inst_name, scale_args, NULL,
                                                              graph)) < 0)
                          return ret;
@@ -231,9 +235,13 @@ static int query_formats(AVFilterGraph *graph, AVClass *log_ctx)
  
                      snprintf(inst_name, sizeof(inst_name), "auto-inserted resampler %d",
                               resampler_count++);
-                    if ((ret = avfilter_graph_create_filter(&convert,
-                                                            avfilter_get_by_name("resample"),
-                                                            inst_name, NULL, NULL, graph)) < 0)
+                    scale_args[0] = '\0';
+                    if (graph->resample_lavr_opts)
+                        snprintf(scale_args, sizeof(scale_args), "%s",
+                                 graph->resample_lavr_opts);
+                    if ((ret = avfilter_graph_create_filter(&convert, filter,
+                                                            inst_name, scale_args,
+                                                            NULL, graph)) < 0)
                          return ret;
                      break;
                  default:
@@ -369,7 +377,7 @@ static void reduce_formats(AVFilterGraph *graph)
      do {
          reduced = 0;
  
-        for (i = 0; i < graph->filter_count; i++)
+        for (i = 0; i < graph->nb_filters; i++)
              reduced |= reduce_formats_on_filter(graph->filters[i]);
      } while (reduced);
  }
@@ -417,15 +425,48 @@ static void swap_samplerates(AVFilterGraph *graph)
  {
      int i;
  
-    for (i = 0; i < graph->filter_count; i++)
+    for (i = 0; i < graph->nb_filters; i++)
          swap_samplerates_on_filter(graph->filters[i]);
  }
  
+#define CH_CENTER_PAIR (AV_CH_FRONT_LEFT_OF_CENTER | AV_CH_FRONT_RIGHT_OF_CENTER)
+#define CH_FRONT_PAIR  (AV_CH_FRONT_LEFT           | AV_CH_FRONT_RIGHT)
+#define CH_STEREO_PAIR (AV_CH_STEREO_LEFT          | AV_CH_STEREO_RIGHT)
+#define CH_WIDE_PAIR   (AV_CH_WIDE_LEFT            | AV_CH_WIDE_RIGHT)
+#define CH_SIDE_PAIR   (AV_CH_SIDE_LEFT            | AV_CH_SIDE_RIGHT)
+#define CH_DIRECT_PAIR (AV_CH_SURROUND_DIRECT_LEFT | AV_CH_SURROUND_DIRECT_RIGHT)
+#define CH_BACK_PAIR   (AV_CH_BACK_LEFT            | AV_CH_BACK_RIGHT)
+
+/* allowable substitutions for channel pairs when comparing layouts,
+ * ordered by priority for both values */
+static const uint64_t ch_subst[][2] = {
+    { CH_FRONT_PAIR,      CH_CENTER_PAIR     },
+    { CH_FRONT_PAIR,      CH_WIDE_PAIR       },
+    { CH_FRONT_PAIR,      AV_CH_FRONT_CENTER },
+    { CH_CENTER_PAIR,     CH_FRONT_PAIR      },
+    { CH_CENTER_PAIR,     CH_WIDE_PAIR       },
+    { CH_CENTER_PAIR,     AV_CH_FRONT_CENTER },
+    { CH_WIDE_PAIR,       CH_FRONT_PAIR      },
+    { CH_WIDE_PAIR,       CH_CENTER_PAIR     },
+    { CH_WIDE_PAIR,       AV_CH_FRONT_CENTER },
+    { AV_CH_FRONT_CENTER, CH_FRONT_PAIR      },
+    { AV_CH_FRONT_CENTER, CH_CENTER_PAIR     },
+    { AV_CH_FRONT_CENTER, CH_WIDE_PAIR       },
+    { CH_SIDE_PAIR,       CH_DIRECT_PAIR     },
+    { CH_SIDE_PAIR,       CH_BACK_PAIR       },
+    { CH_SIDE_PAIR,       AV_CH_BACK_CENTER  },
+    { CH_BACK_PAIR,       CH_DIRECT_PAIR     },
+    { CH_BACK_PAIR,       CH_SIDE_PAIR       },
+    { CH_BACK_PAIR,       AV_CH_BACK_CENTER  },
+    { AV_CH_BACK_CENTER,  CH_BACK_PAIR       },
+    { AV_CH_BACK_CENTER,  CH_DIRECT_PAIR     },
+    { AV_CH_BACK_CENTER,  CH_SIDE_PAIR       },
+};
+
  static void swap_channel_layouts_on_filter(AVFilterContext *filter)
  {
      AVFilterLink *link = NULL;
-    uint64_t chlayout;
-    int i, j;
+    int i, j, k;
  
      for (i = 0; i < filter->nb_inputs; i++) {
          link = filter->inputs[i];
@@ -437,29 +478,58 @@ static void swap_channel_layouts_on_filter(AVFilterContext *filter)
      if (i == filter->nb_inputs)
          return;
  
-    chlayout = link->out_channel_layouts->channel_layouts[0];
-
      for (i = 0; i < filter->nb_outputs; i++) {
          AVFilterLink *outlink = filter->outputs[i];
-        int best_idx, best_score = INT_MIN;
+        int best_idx = -1, best_score = INT_MIN, best_count_diff = INT_MAX;
  
          if (outlink->type != AVMEDIA_TYPE_AUDIO ||
              outlink->in_channel_layouts->nb_channel_layouts < 2)
              continue;
  
          for (j = 0; j < outlink->in_channel_layouts->nb_channel_layouts; j++) {
+            uint64_t  in_chlayout = link->out_channel_layouts->channel_layouts[0];
              uint64_t out_chlayout = outlink->in_channel_layouts->channel_layouts[j];
-            int matched_channels  = av_get_channel_layout_nb_channels(chlayout &
-                                                                      out_chlayout);
-            int extra_channels     = av_get_channel_layout_nb_channels(out_chlayout &
-                                                                       (~chlayout));
-            int score = matched_channels - extra_channels;
+            int  in_channels      = av_get_channel_layout_nb_channels(in_chlayout);
+            int out_channels      = av_get_channel_layout_nb_channels(out_chlayout);
+            int count_diff        = out_channels - in_channels;
+            int matched_channels, extra_channels;
+            int score = 0;
+
+            /* channel substitution */
+            for (k = 0; k < FF_ARRAY_ELEMS(ch_subst); k++) {
+                uint64_t cmp0 = ch_subst[k][0];
+                uint64_t cmp1 = ch_subst[k][1];
+                if (( in_chlayout & cmp0) && (!(out_chlayout & cmp0)) &&
+                    (out_chlayout & cmp1) && (!( in_chlayout & cmp1))) {
+                    in_chlayout  &= ~cmp0;
+                    out_chlayout &= ~cmp1;
+                    /* add score for channel match, minus a deduction for
+                       having to do the substitution */
+                    score += 10 * av_get_channel_layout_nb_channels(cmp1) - 2;
+                }
+            }
  
-            if (score > best_score) {
+            /* no penalty for LFE channel mismatch */
+            if ( (in_chlayout & AV_CH_LOW_FREQUENCY) &&
+                (out_chlayout & AV_CH_LOW_FREQUENCY))
+                score += 10;
+            in_chlayout  &= ~AV_CH_LOW_FREQUENCY;
+            out_chlayout &= ~AV_CH_LOW_FREQUENCY;
+
+            matched_channels = av_get_channel_layout_nb_channels(in_chlayout &
+                                                                 out_chlayout);
+            extra_channels   = av_get_channel_layout_nb_channels(out_chlayout &
+                                                                 (~in_chlayout));
+            score += 10 * matched_channels - 5 * extra_channels;
+
+            if (score > best_score ||
+                (count_diff < best_count_diff && score == best_score)) {
                  best_score = score;
                  best_idx   = j;
+                best_count_diff = count_diff;
              }
          }
+        av_assert0(best_idx >= 0);
          FFSWAP(uint64_t, outlink->in_channel_layouts->channel_layouts[0],
                 outlink->in_channel_layouts->channel_layouts[best_idx]);
      }
@@ -470,7 +540,7 @@ static void swap_channel_layouts(AVFilterGraph *graph)
  {
      int i;
  
-    for (i = 0; i < graph->filter_count; i++)
+    for (i = 0; i < graph->nb_filters; i++)
          swap_channel_layouts_on_filter(graph->filters[i]);
  }
  
@@ -495,7 +565,7 @@ static void swap_sample_fmts_on_filter(AVFilterContext *filter)
  
      for (i = 0; i < filter->nb_outputs; i++) {
          AVFilterLink *outlink = filter->outputs[i];
-        int best_idx, best_score = INT_MIN;
+        int best_idx = -1, best_score = INT_MIN;
  
          if (outlink->type != AVMEDIA_TYPE_AUDIO ||
              outlink->in_formats->format_count < 2)
@@ -528,6 +598,7 @@ static void swap_sample_fmts_on_filter(AVFilterContext *filter)
                  best_idx   = j;
              }
          }
+        av_assert0(best_idx >= 0);
          FFSWAP(int, outlink->in_formats->formats[0],
                 outlink->in_formats->formats[best_idx]);
      }
@@ -537,7 +608,7 @@ static void swap_sample_fmts(AVFilterGraph *graph)
  {
      int i;
  
-    for (i = 0; i < graph->filter_count; i++)
+    for (i = 0; i < graph->nb_filters; i++)
          swap_sample_fmts_on_filter(graph->filters[i]);
  
  }
@@ -546,7 +617,7 @@ static int pick_formats(AVFilterGraph *graph)
  {
      int i, j, ret;
  
-    for (i = 0; i < graph->filter_count; i++) {
+    for (i = 0; i < graph->nb_filters; i++) {
          AVFilterContext *filter = graph->filters[i];
  
          for (j = 0; j < filter->nb_inputs; j++)
@@ -587,12 +658,52 @@ static int graph_config_formats(AVFilterGraph *graph, AVClass *log_ctx)
      return 0;
  }
  
+static int graph_insert_fifos(AVFilterGraph *graph, AVClass *log_ctx)
+{
+    AVFilterContext *f;
+    int i, j, ret;
+    int fifo_count = 0;
+
+    for (i = 0; i < graph->nb_filters; i++) {
+        f = graph->filters[i];
+
+        for (j = 0; j < f->nb_inputs; j++) {
+            AVFilterLink *link = f->inputs[j];
+            AVFilterContext *fifo_ctx;
+            AVFilter *fifo;
+            char name[32];
+
+            if (!link->dstpad->needs_fifo)
+                continue;
+
+            fifo = f->inputs[j]->type == AVMEDIA_TYPE_VIDEO ?
+                   avfilter_get_by_name("fifo") :
+                   avfilter_get_by_name("afifo");
+
+            snprintf(name, sizeof(name), "auto-inserted fifo %d", fifo_count++);
+
+            ret = avfilter_graph_create_filter(&fifo_ctx, fifo, name, NULL,
+                                               NULL, graph);
+            if (ret < 0)
+                return ret;
+
+            ret = avfilter_insert_filter(link, fifo_ctx, 0, 0);
+            if (ret < 0)
+                return ret;
+        }
+    }
+
+    return 0;
+}
+
  int avfilter_graph_config(AVFilterGraph *graphctx, void *log_ctx)
  {
      int ret;
  
      if ((ret = graph_check_validity(graphctx, log_ctx)))
          return ret;
+    if ((ret = graph_insert_fifos(graphctx, log_ctx)) < 0)
+        return ret;
      if ((ret = graph_config_formats(graphctx, log_ctx)))
          return ret;
      if ((ret = graph_config_links(graphctx, log_ctx)))