avdevice/decklink_dec: capture timecode to metadata when requested

[ffmpeg] / libavformat / movenc.c
diff --git a/libavformat/movenc.c b/libavformat/movenc.c

index a597b0853d86ce496d3eb7dfa2e47b461af777c6..7e616e866fb9dcb59a2440323fc6cf53e8724b45 100644 (file)
--- a/libavformat/movenc.c
+++ b/libavformat/movenc.c
@@ -62,6 +62,7 @@ static const AVOption options[] = {
      { "moov_size", "maximum moov size so it can be placed at the begin", offsetof(MOVMuxContext, reserved_moov_size), AV_OPT_TYPE_INT, {.i64 = 0}, 0, INT_MAX, AV_OPT_FLAG_ENCODING_PARAM, 0 },
      { "empty_moov", "Make the initial moov atom empty", 0, AV_OPT_TYPE_CONST, {.i64 = FF_MOV_FLAG_EMPTY_MOOV}, INT_MIN, INT_MAX, AV_OPT_FLAG_ENCODING_PARAM, "movflags" },
      { "frag_keyframe", "Fragment at video keyframes", 0, AV_OPT_TYPE_CONST, {.i64 = FF_MOV_FLAG_FRAG_KEYFRAME}, INT_MIN, INT_MAX, AV_OPT_FLAG_ENCODING_PARAM, "movflags" },
+    { "frag_every_frame", "Fragment at every frame", 0, AV_OPT_TYPE_CONST, {.i64 = FF_MOV_FLAG_FRAG_EVERY_FRAME}, INT_MIN, INT_MAX, AV_OPT_FLAG_ENCODING_PARAM, "movflags" },
      { "separate_moof", "Write separate moof/mdat atoms for each track", 0, AV_OPT_TYPE_CONST, {.i64 = FF_MOV_FLAG_SEPARATE_MOOF}, INT_MIN, INT_MAX, AV_OPT_FLAG_ENCODING_PARAM, "movflags" },
      { "frag_custom", "Flush fragments on caller requests", 0, AV_OPT_TYPE_CONST, {.i64 = FF_MOV_FLAG_FRAG_CUSTOM}, INT_MIN, INT_MAX, AV_OPT_FLAG_ENCODING_PARAM, "movflags" },
      { "isml", "Create a live smooth streaming feed (for pushing to a publishing point)", 0, AV_OPT_TYPE_CONST, {.i64 = FF_MOV_FLAG_ISML}, INT_MIN, INT_MAX, AV_OPT_FLAG_ENCODING_PARAM, "movflags" },
@@ -97,6 +98,9 @@ static const AVOption options[] = {
      { "encryption_kid", "The media encryption key identifier (hex)", offsetof(MOVMuxContext, encryption_kid), AV_OPT_TYPE_BINARY, .flags = AV_OPT_FLAG_ENCODING_PARAM },
      { "use_stream_ids_as_track_ids", "use stream ids as track ids", offsetof(MOVMuxContext, use_stream_ids_as_track_ids), AV_OPT_TYPE_BOOL, {.i64 = 0}, 0, 1, AV_OPT_FLAG_ENCODING_PARAM},
      { "write_tmcd", "force or disable writing tmcd", offsetof(MOVMuxContext, write_tmcd), AV_OPT_TYPE_BOOL, {.i64 = -1}, -1, 1, AV_OPT_FLAG_ENCODING_PARAM},
+    { "write_prft", "Write producer reference time box with specified time source", offsetof(MOVMuxContext, write_prft), AV_OPT_TYPE_INT, {.i64 = MOV_PRFT_NONE}, 0, MOV_PRFT_NB-1, AV_OPT_FLAG_ENCODING_PARAM, "prft"},
+    { "wallclock", NULL, 0, AV_OPT_TYPE_CONST, {.i64 = MOV_PRFT_SRC_WALLCLOCK}, 0, 0, AV_OPT_FLAG_ENCODING_PARAM, "prft"},
+    { "pts", NULL, 0, AV_OPT_TYPE_CONST, {.i64 = MOV_PRFT_SRC_PTS}, 0, 0, AV_OPT_FLAG_ENCODING_PARAM, "prft"},
      { NULL },
  };
  
@@ -139,6 +143,15 @@ static int co64_required(const MOVTrack *track)
      return 0;
  }
  
+static int rtp_hinting_needed(const AVStream *st)
+{
+    /* Add hint tracks for each real audio and video stream */
+    if (st->disposition & AV_DISPOSITION_ATTACHED_PIC)
+        return 0;
+    return st->codecpar->codec_type == AVMEDIA_TYPE_VIDEO ||
+           st->codecpar->codec_type == AVMEDIA_TYPE_AUDIO;
+}
+
  /* Chunk offset atom */
  static int mov_write_stco_tag(AVIOContext *pb, MOVTrack *track)
  {
@@ -490,10 +503,7 @@ concatenate:
          if (info->num_blocks != 6)
              goto end;
          av_packet_unref(pkt);
-        ret = av_packet_ref(pkt, &info->pkt);
-        if (ret < 0)
-            goto end;
-        av_packet_unref(&info->pkt);
+        av_packet_move_ref(pkt, &info->pkt);
          info->num_blocks = 0;
      }
      ret = pkt->size;
@@ -1556,9 +1566,9 @@ static int mov_find_codec_tag(AVFormatContext *s, MOVTrack *track)
      else if (track->mode == MODE_ISM)
          tag = track->par->codec_tag;
      else if (track->mode == MODE_IPOD) {
-        if (!av_match_ext(s->filename, "m4a") &&
-            !av_match_ext(s->filename, "m4v") &&
-            !av_match_ext(s->filename, "m4b"))
+        if (!av_match_ext(s->url, "m4a") &&
+            !av_match_ext(s->url, "m4v") &&
+            !av_match_ext(s->url, "m4b"))
              av_log(s, AV_LOG_WARNING, "Warning, extension is not .m4a nor .m4v "
                     "Quicktime/Ipod might not play the file\n");
          tag = track->par->codec_tag;
@@ -3026,7 +3036,7 @@ static int mov_write_track_udta_tag(AVIOContext *pb, MOVMuxContext *mov,
      if (ret < 0)
          return ret;
  
-    if (mov->mode & MODE_MP4)
+    if (mov->mode & (MODE_MP4|MODE_MOV))
          mov_write_track_metadata(pb_buf, st, "name", "title");
  
      if ((size = avio_close_dyn_buf(pb_buf, &buf)) > 0) {
@@ -3415,6 +3425,51 @@ static int mov_write_int8_metadata(AVFormatContext *s, AVIOContext *pb,
      return size;
  }
  
+static int mov_write_covr(AVIOContext *pb, AVFormatContext *s)
+{
+    MOVMuxContext *mov = s->priv_data;
+    int64_t pos = 0;
+    int i, type;
+
+    for (i = 0; i < s->nb_streams; i++) {
+        MOVTrack *trk = &mov->tracks[i];
+        AVStream *st = s->streams[i];
+
+        if (!(st->disposition & AV_DISPOSITION_ATTACHED_PIC) ||
+            trk->cover_image.size <= 0)
+            continue;
+
+        switch (st->codecpar->codec_id) {
+        case AV_CODEC_ID_MJPEG:
+            type = 0xD;
+            break;
+        case AV_CODEC_ID_PNG:
+            type = 0xE;
+            break;
+        case AV_CODEC_ID_BMP:
+            type = 0x1B;
+            break;
+        default:
+            av_log(s, AV_LOG_ERROR, "unsupported codec_id (0x%x) for cover",
+                   st->codecpar->codec_id);
+            continue;
+        }
+
+        if (!pos) {
+            pos = avio_tell(pb);
+            avio_wb32(pb, 0);
+            ffio_wfourcc(pb, "covr");
+        }
+        avio_wb32(pb, 16 + trk->cover_image.size);
+        ffio_wfourcc(pb, "data");
+        avio_wb32(pb, type);
+        avio_wb32(pb , 0);
+        avio_write(pb, trk->cover_image.data, trk->cover_image.size);
+    }
+
+    return pos ? update_size(pb, pos) : 0;
+}
+
  /* iTunes meta data list */
  static int mov_write_ilst_tag(AVIOContext *pb, MOVMuxContext *mov,
                                AVFormatContext *s)
@@ -3434,7 +3489,7 @@ static int mov_write_ilst_tag(AVIOContext *pb, MOVMuxContext *mov,
      }
      mov_write_string_metadata(s, pb, "\251cmt", "comment"  , 1);
      mov_write_string_metadata(s, pb, "\251gen", "genre"    , 1);
-    mov_write_string_metadata(s, pb, "\251cpy", "copyright", 1);
+    mov_write_string_metadata(s, pb, "cprt",    "copyright", 1);
      mov_write_string_metadata(s, pb, "\251grp", "grouping" , 1);
      mov_write_string_metadata(s, pb, "\251lyr", "lyrics"   , 1);
      mov_write_string_metadata(s, pb, "desc",    "description",1);
@@ -3449,6 +3504,7 @@ static int mov_write_ilst_tag(AVIOContext *pb, MOVMuxContext *mov,
      mov_write_int8_metadata  (s, pb, "hdvd",    "hd_video",  1);
      mov_write_int8_metadata  (s, pb, "pgap",    "gapless_playback",1);
      mov_write_int8_metadata  (s, pb, "cpil",    "compilation", 1);
+    mov_write_covr(pb, s);
      mov_write_trkn_tag(pb, mov, s, 0); // track number
      mov_write_trkn_tag(pb, mov, s, 1); // disc number
      mov_write_tmpo_tag(pb, s);
@@ -3946,6 +4002,8 @@ static int mov_write_isml_manifest(AVIOContext *pb, MOVMuxContext *mov, AVFormat
          } else {
              continue;
          }
+        if (st->disposition & AV_DISPOSITION_ATTACHED_PIC)
+            continue;
  
          props = (AVCPBProperties*)av_stream_get_side_data(track->st, AV_PKT_DATA_CPB_PROPERTIES, NULL);
  
@@ -4459,6 +4517,49 @@ static int mov_write_sidx_tags(AVIOContext *pb, MOVMuxContext *mov,
      return 0;
  }
  
+static int mov_write_prft_tag(AVIOContext *pb, MOVMuxContext *mov, int tracks)
+{
+    int64_t pos = avio_tell(pb), pts_us, ntp_ts;
+    MOVTrack *first_track;
+
+    /* PRFT should be associated with at most one track. So, choosing only the
+     * first track. */
+    if (tracks > 0)
+        return 0;
+    first_track = &(mov->tracks[0]);
+
+    if (!first_track->entry) {
+        av_log(mov->fc, AV_LOG_WARNING, "Unable to write PRFT, no entries in the track\n");
+        return 0;
+    }
+
+    if (first_track->cluster[0].pts == AV_NOPTS_VALUE) {
+        av_log(mov->fc, AV_LOG_WARNING, "Unable to write PRFT, first PTS is invalid\n");
+        return 0;
+    }
+
+    if (mov->write_prft == MOV_PRFT_SRC_WALLCLOCK) {
+        ntp_ts = ff_get_formatted_ntp_time(ff_ntp_time());
+    } else if (mov->write_prft == MOV_PRFT_SRC_PTS) {
+        pts_us = av_rescale_q(first_track->cluster[0].pts,
+                              first_track->st->time_base, AV_TIME_BASE_Q);
+        ntp_ts = ff_get_formatted_ntp_time(pts_us + NTP_OFFSET_US);
+    } else {
+        av_log(mov->fc, AV_LOG_WARNING, "Unsupported PRFT box configuration: %d\n",
+               mov->write_prft);
+        return 0;
+    }
+
+    avio_wb32(pb, 0);                           // Size place holder
+    ffio_wfourcc(pb, "prft");                   // Type
+    avio_w8(pb, 1);                             // Version
+    avio_wb24(pb, 0);                           // Flags
+    avio_wb32(pb, first_track->track_id);       // reference track ID
+    avio_wb64(pb, ntp_ts);                      // NTP time stamp
+    avio_wb64(pb, first_track->cluster[0].pts); //media time
+    return update_size(pb, pos);
+}
+
  static int mov_write_moof_tag(AVIOContext *pb, MOVMuxContext *mov, int tracks,
                                int64_t mdat_size)
  {
@@ -4473,6 +4574,9 @@ static int mov_write_moof_tag(AVIOContext *pb, MOVMuxContext *mov, int tracks,
      if (mov->flags & FF_MOV_FLAG_DASH && !(mov->flags & FF_MOV_FLAG_GLOBAL_SIDX))
          mov_write_sidx_tags(pb, mov, tracks, moof_size + 8 + mdat_size);
  
+    if (mov->write_prft > MOV_PRFT_NONE && mov->write_prft < MOV_PRFT_NB)
+        mov_write_prft_tag(pb, mov, tracks);
+
      if (mov->flags & FF_MOV_FLAG_GLOBAL_SIDX ||
          !(mov->flags & FF_MOV_FLAG_SKIP_TRAILER) ||
          mov->ism_lookahead) {
@@ -4559,6 +4663,8 @@ static int mov_write_ftyp_tag(AVIOContext *pb, AVFormatContext *s)
  
      for (i = 0; i < s->nb_streams; i++) {
          AVStream *st = s->streams[i];
+        if (st->disposition & AV_DISPOSITION_ATTACHED_PIC)
+            continue;
          if (st->codecpar->codec_type == AVMEDIA_TYPE_VIDEO)
              has_video = 1;
          if (st->codecpar->codec_id == AV_CODEC_ID_H264)
@@ -4707,6 +4813,8 @@ static int mov_write_identification(AVIOContext *pb, AVFormatContext *s)
          int video_streams_nb = 0, audio_streams_nb = 0, other_streams_nb = 0;
          for (i = 0; i < s->nb_streams; i++) {
              AVStream *st = s->streams[i];
+            if (st->disposition & AV_DISPOSITION_ATTACHED_PIC)
+                continue;
              if (st->codecpar->codec_type == AVMEDIA_TYPE_VIDEO)
                  video_streams_nb++;
              else if (st->codecpar->codec_type == AVMEDIA_TYPE_AUDIO)
@@ -4896,7 +5004,8 @@ static int mov_flush_fragment(AVFormatContext *s, int force)
          int buf_size, moov_size;
  
          for (i = 0; i < mov->nb_streams; i++)
-            if (!mov->tracks[i].entry)
+            if (!mov->tracks[i].entry &&
+                (i >= s->nb_streams || !(s->streams[i]->disposition & AV_DISPOSITION_ATTACHED_PIC)))
                  break;
          /* Don't write the initial moov unless all tracks have data */
          if (i < mov->nb_streams && !force)
@@ -5257,6 +5366,7 @@ int ff_mov_write_packet(AVFormatContext *s, AVPacket *pkt)
      trk->cluster[trk->entry].size             = size;
      trk->cluster[trk->entry].entries          = samples_in_chunk;
      trk->cluster[trk->entry].dts              = pkt->dts;
+    trk->cluster[trk->entry].pts              = pkt->pts;
      if (!trk->entry && trk->start_dts != AV_NOPTS_VALUE) {
          if (!trk->frag_discont) {
              /* First packet of a new fragment. We already wrote the duration
@@ -5432,7 +5542,8 @@ static int mov_write_single_packet(AVFormatContext *s, AVPacket *pkt)
               (mov->max_fragment_size && mov->mdat_size + size >= mov->max_fragment_size) ||
               (mov->flags & FF_MOV_FLAG_FRAG_KEYFRAME &&
                par->codec_type == AVMEDIA_TYPE_VIDEO &&
-              trk->entry && pkt->flags & AV_PKT_FLAG_KEY)) {
+              trk->entry && pkt->flags & AV_PKT_FLAG_KEY) ||
+              (mov->flags & FF_MOV_FLAG_FRAG_EVERY_FRAME)) {
              if (frag_duration >= mov->min_fragment_duration) {
                  // Set the duration of this track to line up with the next
                  // sample in this track. This avoids relying on AVPacket
@@ -5474,13 +5585,34 @@ static int mov_write_subtitle_end_packet(AVFormatContext *s,
  
  static int mov_write_packet(AVFormatContext *s, AVPacket *pkt)
  {
+    MOVMuxContext *mov = s->priv_data;
+    MOVTrack *trk;
+    AVStream *st;
+
      if (!pkt) {
          mov_flush_fragment(s, 1);
          return 1;
+    }
+
+    st = s->streams[pkt->stream_index];
+    trk = &mov->tracks[pkt->stream_index];
+
+    if (st->disposition & AV_DISPOSITION_ATTACHED_PIC) {
+        int ret;
+
+        if (st->nb_frames >= 1) {
+            if (st->nb_frames == 1)
+                av_log(s, AV_LOG_WARNING, "Got more than one picture in stream %d,"
+                       " ignoring.\n", pkt->stream_index);
+            return 0;
+        }
+
+        if ((ret = av_packet_ref(&trk->cover_image, pkt)) < 0)
+            return ret;
+
+        return 0;
      } else {
          int i;
-        MOVMuxContext *mov = s->priv_data;
-        MOVTrack *trk = &mov->tracks[pkt->stream_index];
  
          if (!pkt->size)
              return mov_write_single_packet(s, pkt); /* Passthrough. */
@@ -5727,7 +5859,8 @@ static void enable_tracks(AVFormatContext *s)
          AVStream *st = s->streams[i];
  
          if (st->codecpar->codec_type <= AVMEDIA_TYPE_UNKNOWN ||
-            st->codecpar->codec_type >= AVMEDIA_TYPE_NB)
+            st->codecpar->codec_type >= AVMEDIA_TYPE_NB ||
+            st->disposition & AV_DISPOSITION_ATTACHED_PIC)
              continue;
  
          if (first[st->codecpar->codec_type] < 0)
@@ -5770,6 +5903,7 @@ static void mov_free(AVFormatContext *s)
              av_freep(&mov->tracks[i].par);
          av_freep(&mov->tracks[i].cluster);
          av_freep(&mov->tracks[i].frag_info);
+        av_packet_unref(&mov->tracks[i].cover_image);
  
          if (mov->tracks[i].vos_len)
              av_freep(&mov->tracks[i].vos_data);
@@ -5874,7 +6008,8 @@ static int mov_init(AVFormatContext *s)
      if (mov->max_fragment_duration || mov->max_fragment_size ||
          mov->flags & (FF_MOV_FLAG_EMPTY_MOOV |
                        FF_MOV_FLAG_FRAG_KEYFRAME |
-                      FF_MOV_FLAG_FRAG_CUSTOM))
+                      FF_MOV_FLAG_FRAG_CUSTOM |
+                      FF_MOV_FLAG_FRAG_EVERY_FRAME))
          mov->flags |= FF_MOV_FLAG_FRAGMENT;
  
      /* Set other implicit flags immediately */
@@ -5941,14 +6076,9 @@ static int mov_init(AVFormatContext *s)
          mov->chapter_track = mov->nb_streams++;
  
      if (mov->flags & FF_MOV_FLAG_RTP_HINT) {
-        /* Add hint tracks for each audio and video stream */
-        for (i = 0; i < s->nb_streams; i++) {
-            AVStream *st = s->streams[i];
-            if (st->codecpar->codec_type == AVMEDIA_TYPE_VIDEO ||
-                st->codecpar->codec_type == AVMEDIA_TYPE_AUDIO) {
+        for (i = 0; i < s->nb_streams; i++)
+            if (rtp_hinting_needed(s->streams[i]))
                  mov->nb_streams++;
-            }
-        }
      }
  
      if (   mov->write_tmcd == -1 && (mov->mode == MODE_MOV || mov->mode == MODE_MP4)
@@ -6079,6 +6209,15 @@ static int mov_init(AVFormatContext *s)
                      av_log(s, AV_LOG_ERROR, "VP9 only supported in MP4.\n");
                      return AVERROR(EINVAL);
                  }
+            } else if (track->par->codec_id == AV_CODEC_ID_AV1) {
+                /* spec is not finished, so forbid for now */
+                av_log(s, AV_LOG_ERROR, "AV1 muxing is currently not supported.\n");
+                return AVERROR_PATCHWELCOME;
+            } else if (track->par->codec_id == AV_CODEC_ID_VP8) {
+                /* altref frames handling is not defined in the spec as of version v1.0,
+                 * so just forbid muxing VP8 streams altogether until a new version does */
+                av_log(s, AV_LOG_ERROR, "VP8 muxing is currently not supported.\n");
+                return AVERROR_PATCHWELCOME;
              }
          } else if (st->codecpar->codec_type == AVMEDIA_TYPE_AUDIO) {
              track->timescale = st->codecpar->sample_rate;
@@ -6166,15 +6305,10 @@ static int mov_write_header(AVFormatContext *s)
          nb_tracks++;
  
      if (mov->flags & FF_MOV_FLAG_RTP_HINT) {
-        /* Add hint tracks for each audio and video stream */
          hint_track = nb_tracks;
-        for (i = 0; i < s->nb_streams; i++) {
-            AVStream *st = s->streams[i];
-            if (st->codecpar->codec_type == AVMEDIA_TYPE_VIDEO ||
-                st->codecpar->codec_type == AVMEDIA_TYPE_AUDIO) {
+        for (i = 0; i < s->nb_streams; i++)
+            if (rtp_hinting_needed(s->streams[i]))
                  nb_tracks++;
-            }
-        }
      }
  
      if (mov->mode == MODE_MOV || mov->mode == MODE_MP4)
@@ -6233,7 +6367,8 @@ static int mov_write_header(AVFormatContext *s)
      if (mov->flags & FF_MOV_FLAG_FRAGMENT) {
          /* If no fragmentation options have been set, set a default. */
          if (!(mov->flags & (FF_MOV_FLAG_FRAG_KEYFRAME |
-                            FF_MOV_FLAG_FRAG_CUSTOM)) &&
+                            FF_MOV_FLAG_FRAG_CUSTOM |
+                            FF_MOV_FLAG_FRAG_EVERY_FRAME)) &&
              !mov->max_fragment_duration && !mov->max_fragment_size)
              mov->flags |= FF_MOV_FLAG_FRAG_KEYFRAME;
      } else {
@@ -6251,11 +6386,8 @@ static int mov_write_header(AVFormatContext *s)
              return ret;
  
      if (mov->flags & FF_MOV_FLAG_RTP_HINT) {
-        /* Initialize the hint tracks for each audio and video stream */
          for (i = 0; i < s->nb_streams; i++) {
-            AVStream *st = s->streams[i];
-            if (st->codecpar->codec_type == AVMEDIA_TYPE_VIDEO ||
-                st->codecpar->codec_type == AVMEDIA_TYPE_AUDIO) {
+            if (rtp_hinting_needed(s->streams[i])) {
                  if ((ret = ff_mov_init_hinting(s, hint_track, i)) < 0)
                      return ret;
                  hint_track++;
@@ -6400,10 +6532,10 @@ static int shift_data(AVFormatContext *s)
       * writing, so we re-open the same output, but for reading. It also avoids
       * a read/seek/write/seek back and forth. */
      avio_flush(s->pb);
-    ret = s->io_open(s, &read_pb, s->filename, AVIO_FLAG_READ, NULL);
+    ret = s->io_open(s, &read_pb, s->url, AVIO_FLAG_READ, NULL);
      if (ret < 0) {
          av_log(s, AV_LOG_ERROR, "Unable to re-open %s output file for "
-               "the second pass (faststart)\n", s->filename);
+               "the second pass (faststart)\n", s->url);
          goto end;
      }