Merge commit '124e26971e69bb25f38c6c7cb3fa20c77cf10966'

[ffmpeg] / ffmpeg.c
diff --git a/ffmpeg.c b/ffmpeg.c

index 532db80e0b1e70093bdc788a44125d672efc688e..1a0e909fb0037da7815361938a7bdeb0afe3970d 100644 (file)
--- a/ffmpeg.c
+++ b/ffmpeg.c
@@ -47,9 +47,11 @@
  #include "libavutil/parseutils.h"
  #include "libavutil/samplefmt.h"
  #include "libavutil/fifo.h"
+#include "libavutil/hwcontext.h"
  #include "libavutil/internal.h"
  #include "libavutil/intreadwrite.h"
  #include "libavutil/dict.h"
+#include "libavutil/display.h"
  #include "libavutil/mathematics.h"
  #include "libavutil/pixdesc.h"
  #include "libavutil/avstring.h"
@@ -1541,7 +1543,7 @@ static void print_final_stats(int64_t total_size)
          }
          extra_size += ost->enc_ctx->extradata_size;
          data_size  += ost->data_size;
-        if (   (ost->enc_ctx->flags & (AV_CODEC_FLAG_PASS1 | CODEC_FLAG_PASS2))
+        if (   (ost->enc_ctx->flags & (AV_CODEC_FLAG_PASS1 | AV_CODEC_FLAG_PASS2))
              != AV_CODEC_FLAG_PASS1)
              pass1_used = 0;
      }
@@ -2508,7 +2510,7 @@ static int transcode_subtitles(InputStream *ist, AVPacket *pkt, int *got_output,
                               1000, AV_TIME_BASE);
              if (end < ist->prev_sub.subtitle.end_display_time) {
                  av_log(ist->dec_ctx, AV_LOG_DEBUG,
-                       "Subtitle duration reduced from %d to %d%s\n",
+                       "Subtitle duration reduced from %"PRId32" to %d%s\n",
                         ist->prev_sub.subtitle.end_display_time, end,
                         end <= 0 ? ", dropping it" : "");
                  ist->prev_sub.subtitle.end_display_time = end;
@@ -3067,9 +3069,6 @@ static int init_output_stream_streamcopy(OutputStream *ost)
              const AVPacketSideData *sd_src = &ist->st->side_data[i];
              AVPacketSideData *sd_dst = &ost->st->side_data[ost->st->nb_side_data];
  
-            if (ost->rotate_overridden && sd_src->type == AV_PKT_DATA_DISPLAYMATRIX)
-                continue;
-
              sd_dst->data = av_malloc(sd_src->size);
              if (!sd_dst->data)
                  return AVERROR(ENOMEM);
@@ -3080,6 +3079,13 @@ static int init_output_stream_streamcopy(OutputStream *ost)
          }
      }
  
+    if (ost->rotate_overridden) {
+        uint8_t *sd = av_stream_new_side_data(ost->st, AV_PKT_DATA_DISPLAYMATRIX,
+                                              sizeof(int32_t) * 9);
+        if (sd)
+            av_display_rotation_set((int32_t *)sd, -ost->rotate_override_value);
+    }
+
      ost->parser = av_parser_init(par_dst->codec_id);
      ost->parser_avctx = avcodec_alloc_context3(NULL);
      if (!ost->parser_avctx)
@@ -3233,6 +3239,11 @@ static int init_output_stream_encode(OutputStream *ost)
  
      set_encoder_id(output_files[ost->file_index], ost);
  
+    // Muxers use AV_PKT_DATA_DISPLAYMATRIX to signal rotation. On the other
+    // hand, the legacy API makes demuxers set "rotate" metadata entries,
+    // which have to be filtered out to prevent leaking them to output files.
+    av_dict_set(&ost->st->metadata, "rotate", NULL, 0);
+
      if (ist) {
          ost->st->disposition          = ist->st->disposition;
  
@@ -3411,7 +3422,9 @@ static int init_output_stream(OutputStream *ost, char *error, int error_len)
              !av_dict_get(ost->encoder_opts, "ab", NULL, 0))
              av_dict_set(&ost->encoder_opts, "b", "128000", 0);
  
-        if (ost->filter && av_buffersink_get_hw_frames_ctx(ost->filter->filter)) {
+        if (ost->filter && av_buffersink_get_hw_frames_ctx(ost->filter->filter) &&
+            ((AVHWFramesContext*)av_buffersink_get_hw_frames_ctx(ost->filter->filter)->data)->format ==
+            av_buffersink_get_format(ost->filter->filter)) {
              ost->enc_ctx->hw_frames_ctx = av_buffer_ref(av_buffersink_get_hw_frames_ctx(ost->filter->filter));
              if (!ost->enc_ctx->hw_frames_ctx)
                  return AVERROR(ENOMEM);
@@ -3470,6 +3483,26 @@ static int init_output_stream(OutputStream *ost, char *error, int error_len)
              }
          }
  
+        /*
+         * Add global input side data. For now this is naive, and copies it
+         * from the input stream's global side data. All side data should
+         * really be funneled over AVFrame and libavfilter, then added back to
+         * packet side data, and then potentially using the first packet for
+         * global side data.
+         */
+        if (ist) {
+            int i;
+            for (i = 0; i < ist->st->nb_side_data; i++) {
+                AVPacketSideData *sd = &ist->st->side_data[i];
+                uint8_t *dst = av_stream_new_side_data(ost->st, sd->type, sd->size);
+                if (!dst)
+                    return AVERROR(ENOMEM);
+                memcpy(dst, sd->data, sd->size);
+                if (ist->autorotate && sd->type == AV_PKT_DATA_DISPLAYMATRIX)
+                    av_display_rotation_set((int32_t *)dst, 0); /* matrix is int32_t[9]; reset copied rotation to 0 */
+            }
+        }
+
          // copy timebase while removing common factors
          if (ost->st->time_base.num <= 0 || ost->st->time_base.den <= 0)
              ost->st->time_base = av_add_q(ost->enc_ctx->time_base, (AVRational){0, 1});
@@ -4266,9 +4299,10 @@ static int process_input(int file_index)
              AVPacketSideData *src_sd = &ist->st->side_data[i];
              uint8_t *dst_data;
  
-            if (av_packet_get_side_data(&pkt, src_sd->type, NULL))
+            if (src_sd->type == AV_PKT_DATA_DISPLAYMATRIX)
                  continue;
-            if (ist->autorotate && src_sd->type == AV_PKT_DATA_DISPLAYMATRIX)
+
+            if (av_packet_get_side_data(&pkt, src_sd->type, NULL))
                  continue;
  
              dst_data = av_packet_new_side_data(&pkt, src_sd->type, src_sd->size);