2 * Copyright (c) 2015 Martin Storsjo
4 * This file is part of FFmpeg.
6 * FFmpeg is free software; you can redistribute it and/or
7 * modify it under the terms of the GNU Lesser General Public
8 * License as published by the Free Software Foundation; either
9 * version 2.1 of the License, or (at your option) any later version.
11 * FFmpeg is distributed in the hope that it will be useful,
12 * but WITHOUT ANY WARRANTY; without even the implied warranty of
13 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
14 * Lesser General Public License for more details.
16 * You should have received a copy of the GNU Lesser General Public
17 * License along with FFmpeg; if not, write to the Free Software
18 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
23 #include "libavutil/intreadwrite.h"
24 #include "libavutil/mathematics.h"
25 #include "libavutil/md5.h"
27 #include "libavformat/avformat.h"
34 #include "compat/getopt.c"
/* Codec extradata blobs; init_fps() copies them into the codecpar of the
 * H.264 video stream and the AAC audio stream respectively. */
39 static const uint8_t h264_extradata[] = {
40 0x01, 0x4d, 0x40, 0x1e, 0xff, 0xe1, 0x00, 0x02, 0x67, 0x4d, 0x01, 0x00, 0x02, 0x68, 0xef
42 static const uint8_t aac_extradata[] = {
/* Muxer short name: handed to av_guess_format() in init_fps() and used as
 * the file extension in init_out(). */
47 static const char *format = "mp4";
/* Digest of the most recently closed output; filled by av_md5_final() in
 * close_out() and compared/copied by main(). */
57 uint8_t hash[HASH_SIZE];
/* Stream handles whose time bases are read by init_fps() and mux_frames(). */
59 AVStream *video_st, *audio_st;
/* Next dts to emit per stream; seeded at the end of init_fps() and advanced
 * by mux_frames(). */
60 int64_t audio_dts, video_dts;
/* Duration of one audio packet (1024 samples rescaled to the audio time
 * base, see init_fps()). */
64 int64_t audio_duration;
/* Picture type of the last video packet produced by mux_frames(). */
68 enum AVPictureType last_picture;
/* When nonzero, mux_frames() overrides pkt.duration with this value. */
74 int fake_pkt_duration;
/*
 * av_log callback (installed by init_count_warnings()) that singles out
 * messages logged at AV_LOG_WARNING level.
 * NOTE(review): the statement guarded by the level check is not visible in
 * this excerpt; presumably it increments num_warnings, which main() tests.
 */
81 static void count_warnings(void *avcl, int level, const char *fmt, va_list vl)
83 if (level == AV_LOG_WARNING)
/* Route library logging through count_warnings() so that warnings emitted
 * during a test scenario can be detected. */
87 static void init_count_warnings(void)
89 av_log_set_callback(count_warnings);
/* Undo init_count_warnings(): reinstall the default av_log callback. */
93 static void reset_count_warnings(void)
95 av_log_set_callback(av_log_default_callback);
/*
 * AVIOContext write callback: feeds the `size` bytes at `buf` into the
 * running MD5 context (md5) and writes them to the output file `out`.
 * `opaque` is not used by the visible statements.
 * NOTE(review): the fwrite() result is not checked, so short writes to the
 * optional output file go unnoticed. Any guard around the fwrite() and the
 * return statement are not visible in this excerpt.
 */
98 static int io_write(void *opaque, uint8_t *buf, int size)
101 av_md5_update(md5, buf, size);
103 fwrite(buf, 1, size, out);
/*
 * write_data_type callback: logs one line per call describing the chunk
 * (length, timestamp, marker type and, where applicable, the four-character
 * atom name) and then forwards the data to io_write().
 *
 * buf/size - data being written
 * type     - marker type reported by the muxer; mapped to a short string
 * time     - timestamp associated with the chunk; printed as "nopts" when
 *            it equals AV_NOPTS_VALUE
 * Returns whatever io_write() returns.
 */
107 static int io_write_data_type(void *opaque, uint8_t *buf, int size,
108 enum AVIODataMarkerType type, int64_t time)
// content is zero-initialized, so the 4 copied bytes stay NUL-terminated.
110 char timebuf[30], content[5] = { 0 };
113 case AVIO_DATA_MARKER_HEADER: str = "header"; break;
114 case AVIO_DATA_MARKER_SYNC_POINT: str = "sync"; break;
115 case AVIO_DATA_MARKER_BOUNDARY_POINT: str = "boundary"; break;
116 case AVIO_DATA_MARKER_UNKNOWN: str = "unknown"; break;
117 case AVIO_DATA_MARKER_TRAILER: str = "trailer"; break;
118 default: str = "unknown"; break;
120 if (time == AV_NOPTS_VALUE)
121 snprintf(timebuf, sizeof(timebuf), "nopts");
123 snprintf(timebuf, sizeof(timebuf), "%"PRId64, time);
124 // There can be multiple header/trailer callbacks, only log the box type
125 // for header at out_size == 0
126 if (type != AVIO_DATA_MARKER_UNKNOWN &&
127 type != AVIO_DATA_MARKER_TRAILER &&
128 (type != AVIO_DATA_MARKER_HEADER || out_size == 0) &&
// Bytes 4..7 of the chunk are taken as the atom name.
// NOTE(review): the final operand of the condition above is not visible
// here; presumably it checks that size is large enough for this read.
130 memcpy(content, &buf[4], 4);
132 snprintf(content, sizeof(content), "-");
133 printf("write_data len %d, time %s, type %s atom %s\n", size, timebuf, str, content);
134 return io_write(opaque, buf, size);
/*
 * Begin a new named output: builds the file name "<cur_name>.<format>" and
 * opens it for binary writing into `out`.
 * NOTE(review): the lines that set cur_name from `name`, reset the hash and
 * size state, and decide whether a file is opened at all are not visible in
 * this excerpt.
 */
137 static void init_out(const char *name)
141 snprintf(buf, sizeof(buf), "%s.%s", cur_name, format);
145 out = fopen(buf, "wb");
/*
 * Finish the current output: finalizes the MD5 into `hash` and prints one
 * result line of the form "<hex digest> <out_size> <cur_name>".
 */
152 static void close_out(void)
155 av_md5_final(md5, hash);
156 for (i = 0; i < HASH_SIZE; i++)
157 printf("%02x", hash[i]);
158 printf(" %d %s\n", out_size, cur_name);
/*
 * Assertion helper behind the check() macro. Prints the source line number
 * as a "<line>: " prefix followed by a printf-style message built from
 * `msg` and the variadic arguments.
 * NOTE(review): the test on `value` is not visible in this excerpt;
 * presumably output happens only when value is zero and the failure is
 * counted in check_faults, which main() uses for its exit status.
 */
164 static void check_func(int value, int line, const char *msg, ...)
169 printf("%d: ", line);
// check(cond, fmt, ...) records the call site's line number automatically.
176 #define check(value, ...) check_func(value, __LINE__, __VA_ARGS__)
/*
 * Set up the muxer for one test scenario:
 *  - allocates ctx and selects the output format named by `format`;
 *  - attaches a write-only AVIOContext over iobuf (using force_iobuf_size
 *    bytes when that override is nonzero, otherwise sizeof(iobuf)) with
 *    io_write / io_write_data_type as callbacks;
 *  - enables bitexact output;
 *  - creates a 640x480 H.264 video stream (time base 1/30) and a
 *    2-channel 44100 Hz AAC audio stream (time base 1/44100), each with a
 *    padded copy of its extradata;
 *  - writes the header using the global `opts` dictionary;
 *  - seeds duration, audio_duration, video_dts and audio_dts.
 *
 * bf            - NOTE(review): presumably stored into the global `bframes`
 *                 flag; the assignment is not visible in this excerpt.
 * audio_preroll - NOTE(review): presumably a flag; the visible code replaces
 *                 it with 2048 samples rescaled to the audio time base (the
 *                 guarding condition is not visible) and starts audio_dts at
 *                 its negation.
 * fps           - video frame rate; the per-frame duration becomes
 *                 video time_base.den / fps.
 */
178 static void init_fps(int bf, int audio_preroll, int fps)
181 int iobuf_size = force_iobuf_size ? force_iobuf_size : sizeof(iobuf);
182 ctx = avformat_alloc_context();
185 ctx->oformat = av_guess_format(format, NULL, NULL);
188 ctx->pb = avio_alloc_context(iobuf, iobuf_size, AVIO_FLAG_WRITE, NULL, NULL, io_write, NULL);
191 ctx->pb->write_data_type = io_write_data_type;
192 ctx->flags |= AVFMT_FLAG_BITEXACT;
// Video stream.
194 st = avformat_new_stream(ctx, NULL);
197 st->codecpar->codec_type = AVMEDIA_TYPE_VIDEO;
198 st->codecpar->codec_id = AV_CODEC_ID_H264;
199 st->codecpar->width = 640;
200 st->codecpar->height = 480;
201 st->time_base.num = 1;
202 st->time_base.den = 30;
203 st->codecpar->extradata_size = sizeof(h264_extradata);
204 st->codecpar->extradata = av_mallocz(st->codecpar->extradata_size + AV_INPUT_BUFFER_PADDING_SIZE);
205 if (!st->codecpar->extradata)
207 memcpy(st->codecpar->extradata, h264_extradata, sizeof(h264_extradata));
// Audio stream.
210 st = avformat_new_stream(ctx, NULL);
213 st->codecpar->codec_type = AVMEDIA_TYPE_AUDIO;
214 st->codecpar->codec_id = AV_CODEC_ID_AAC;
215 st->codecpar->sample_rate = 44100;
216 st->codecpar->channels = 2;
217 st->time_base.num = 1;
218 st->time_base.den = 44100;
219 st->codecpar->extradata_size = sizeof(aac_extradata);
220 st->codecpar->extradata = av_mallocz(st->codecpar->extradata_size + AV_INPUT_BUFFER_PADDING_SIZE);
221 if (!st->codecpar->extradata)
223 memcpy(st->codecpar->extradata, aac_extradata, sizeof(aac_extradata));
226 if (avformat_write_header(ctx, &opts) < 0)
// Durations are computed from the stream time bases as they stand after
// avformat_write_header().
232 duration = video_st->time_base.den / fps;
233 audio_duration = 1024LL * audio_st->time_base.den / audio_st->codecpar->sample_rate;
235 audio_preroll = 2048LL * audio_st->time_base.den / audio_st->codecpar->sample_rate;
// With B-frames the first video dts is one frame duration before zero.
238 video_dts = bframes ? -duration : 0;
239 audio_dts = -audio_preroll;
/* Convenience wrapper: init_fps() with a fixed frame rate of 30. */
242 static void init(int bf, int audio_preroll)
244 init_fps(bf, audio_preroll, 30);
/*
 * Generate synthetic audio/video packets and hand them to the muxer until
 * the video frame counter reaches frames + n.
 *
 * Each iteration picks the stream whose next dts is earlier
 * (av_compare_ts on audio_dts vs. video_dts). Audio packets carry
 * dts == pts and advance by audio_duration. Video packets are marked as
 * keyframes whenever frames is a multiple of gop_size; between keyframes
 * last_picture alternates between P and B, with pts assigned accordingly.
 * The packet pts is stored big-endian into bytes 4..7 of the 8-byte
 * payload.
 *
 * n - number of video frames to produce
 * c - NOTE(review): presumably enables the +2^32 offset applied to pts/dts
 *     below; the guarding condition is not visible in this excerpt, but the
 *     only caller passing 1 is the large-timestamp scenario in main().
 *
 * NOTE(review): the loop header, several else/brace lines and the
 * conditions selecting between av_interleaved_write_frame() and
 * av_write_frame() are not visible in this excerpt. The return values of
 * both write calls are ignored.
 */
247 static void mux_frames(int n, int c)
249 int end_frames = frames + n;
252 uint8_t pktdata[8] = { 0 };
253 av_init_packet(&pkt);
// Audio goes first only when its next dts is strictly earlier than video's.
255 if (av_compare_ts(audio_dts, audio_st->time_base, video_dts, video_st->time_base) < 0) {
256 pkt.dts = pkt.pts = audio_dts;
257 pkt.stream_index = 1;
258 pkt.duration = audio_duration;
259 audio_dts += audio_duration;
261 if (frames == end_frames)
264 pkt.stream_index = 0;
265 pkt.duration = duration;
266 if ((frames % gop_size) == 0) {
267 pkt.flags |= AV_PKT_FLAG_KEY;
268 last_picture = AV_PICTURE_TYPE_I;
269 pkt.pts = pkt.dts + duration;
272 if (last_picture == AV_PICTURE_TYPE_P) {
273 last_picture = AV_PICTURE_TYPE_B;
275 video_dts = next_p_pts;
277 last_picture = AV_PICTURE_TYPE_P;
// Last frame of the GOP.
278 if (((frames + 1) % gop_size) == 0) {
279 pkt.pts = pkt.dts + duration;
282 next_p_pts = pkt.pts = pkt.dts + 2 * duration;
283 video_dts += duration;
// A nonzero fake_pkt_duration replaces the duration set above.
289 if (fake_pkt_duration)
290 pkt.duration = fake_pkt_duration;
296 AV_WB32(pktdata + 4, pkt.pts);
301 if (skip_write_audio && pkt.stream_index == 1)
305 pkt.pts += (1LL<<32);
306 pkt.dts += (1LL<<32);
310 av_interleaved_write_frame(ctx, &pkt);
312 av_write_frame(ctx, &pkt);
/* Mux n whole GOPs, i.e. gop_size * n video frames, via mux_frames() with
 * its second argument set to 0. */
316 static void mux_gops(int n)
318 mux_frames(gop_size * n, 0);
/*
 * NOTE(review): the body is not visible in this excerpt. Judging by the
 * name and by mux_gops(), this presumably advances the generator's state
 * by n GOPs without writing the packets - confirm against the full file.
 */
321 static void skip_gops(int n)
/*
 * Send one packet per stream to the muxer with av_write_frame(): first on
 * stream 0 (video), then on stream 1 (audio) with dts == pts == audio_dts.
 * NOTE(review): the remaining packet fields (size, and the video
 * timestamps) are set on lines not visible here; presumably these are
 * empty packets whose only purpose is to announce the initial timestamps
 * of each stream to the muxer.
 */
328 static void signal_init_ts(void)
331 av_init_packet(&pkt);
335 pkt.stream_index = 0;
338 av_write_frame(ctx, &pkt);
340 pkt.stream_index = 1;
341 pkt.dts = pkt.pts = audio_dts;
342 av_write_frame(ctx, &pkt);
/*
 * Tear down the muxer created by init_fps(): writes the trailer, then
 * frees the AVIOContext and the format context. The AVIOContext is freed
 * first because avformat_free_context() is given ctx afterwards.
 */
345 static void finish(void)
347 av_write_trailer(ctx);
348 avio_context_free(&ctx->pb);
349 avformat_free_context(ctx);
/* Print the command-line usage text to stdout. */
353 static void help(void)
355 printf("movenc-test [-w]\n"
356 "-w write output into files\n");
/*
 * Test driver. Parses the "w" and "h" options with getopt(), allocates the
 * MD5 context, then runs a fixed sequence of named muxing scenarios. Each
 * scenario names its output with init_out(), configures the muxer through
 * the `opts` dictionary, and verifies expectations with check() - often by
 * saving a digest into `header` or `content` and comparing a later output
 * against it with memcmp().
 *
 * Returns 1 if any check failed (check_faults > 0), 0 otherwise.
 *
 * NOTE(review): the init()/mux/finish()/close_out() calls between the
 * visible lines of each scenario are not part of this excerpt.
 */
359 int main(int argc, char **argv)
362 uint8_t header[HASH_SIZE];
363 uint8_t content[HASH_SIZE];
368 c = getopt(argc, argv, "wh");
384 md5 = av_md5_alloc();
388 // Write a fragmented file with an initial moov that actually contains some
389 // samples. One moov+mdat with 1 second of data and one moof+mdat with 1
391 init_out("non-empty-moov");
392 av_dict_set(&opts, "movflags", "frag_keyframe", 0);
398 // Write a similar file, but with B-frames and audio preroll, handled
400 init_out("non-empty-moov-elst");
401 av_dict_set(&opts, "movflags", "frag_keyframe", 0);
402 av_dict_set(&opts, "use_editlist", "1", 0);
408 // Use B-frames but no audio-preroll, but without an edit list.
409 // Due to avoid_negative_ts == AVFMT_AVOID_NEG_TS_MAKE_ZERO, the dts
410 // of the first audio packet is > 0, but it is set to zero since edit
411 // lists aren't used, increasing the duration of the first packet instead.
412 init_out("non-empty-moov-no-elst");
413 av_dict_set(&opts, "movflags", "frag_keyframe", 0);
414 av_dict_set(&opts, "use_editlist", "0", 0);
421 // Write an ISMV, with B-frames and audio preroll.
423 av_dict_set(&opts, "movflags", "frag_keyframe", 0);
430 // An initial moov that doesn't contain any samples, followed by two
432 init_out("empty-moov");
433 av_dict_set(&opts, "movflags", "frag_keyframe+empty_moov", 0);
434 av_dict_set(&opts, "use_editlist", "0", 0);
439 memcpy(content, hash, HASH_SIZE);
441 // Similar to the previous one, but with input that doesn't start at
442 // pts/dts 0. avoid_negative_ts behaves in the same way as
443 // in non-empty-moov-no-elst above.
444 init_out("empty-moov-no-elst");
445 av_dict_set(&opts, "movflags", "frag_keyframe+empty_moov", 0);
451 // Same as the previous one, but disable avoid_negative_ts (which
452 // would require using an edit list, but with empty_moov, one can't
453 // write a sensible edit list, when the start timestamps aren't known).
454 // This should trigger a warning - we check that the warning is produced.
455 init_count_warnings();
456 init_out("empty-moov-no-elst-no-adjust");
457 av_dict_set(&opts, "movflags", "frag_keyframe+empty_moov", 0);
458 av_dict_set(&opts, "avoid_negative_ts", "0", 0);
464 reset_count_warnings();
465 check(num_warnings > 0, "No warnings printed for unhandled start offset");
467 // Verify that delay_moov produces the same as empty_moov for
469 init_out("delay-moov");
470 av_dict_set(&opts, "movflags", "frag_keyframe+delay_moov", 0);
471 av_dict_set(&opts, "use_editlist", "0", 0);
476 check(!memcmp(hash, content, HASH_SIZE), "delay_moov differs from empty_moov");
478 // Test writing content that requires an edit list using delay_moov
479 init_out("delay-moov-elst");
480 av_dict_set(&opts, "movflags", "frag_keyframe+delay_moov", 0);
486 // Test writing a file with one track lacking packets, with delay_moov.
487 skip_write_audio = 1;
488 init_out("delay-moov-empty-track");
489 av_dict_set(&opts, "movflags", "frag_keyframe+delay_moov", 0);
492 // The automatic flushing shouldn't output anything, since we're still
493 // waiting for data for some tracks
494 check(out_size == 0, "delay_moov flushed prematurely");
495 // When closed (or manually flushed), all the written data should still
499 check(out_size > 0, "delay_moov didn't output anything");
501 // Check that manually flushing still outputs things as expected. This
502 // produces two fragments, while the one above produces only one.
503 init_out("delay-moov-empty-track-flush");
504 av_dict_set(&opts, "movflags", "frag_custom+delay_moov", 0);
507 av_write_frame(ctx, NULL); // Force writing the moov
508 check(out_size > 0, "No moov written");
509 av_write_frame(ctx, NULL);
511 av_write_frame(ctx, NULL);
515 skip_write_audio = 0;
519 // Verify that the header written by delay_moov when manually flushed
520 // is identical to the one by empty_moov.
521 init_out("empty-moov-header");
522 av_dict_set(&opts, "movflags", "frag_keyframe+empty_moov", 0);
523 av_dict_set(&opts, "use_editlist", "0", 0);
526 memcpy(header, hash, HASH_SIZE);
527 init_out("empty-moov-content");
529 // Written 2 seconds of content, with an automatic flush after 1 second.
530 check(out_size > 0, "No automatic flush?");
531 empty_moov_pos = prev_pos = out_size;
532 // Manually flush the second fragment
533 av_write_frame(ctx, NULL);
534 check(out_size > prev_pos, "No second fragment flushed?");
536 // Check that an extra flush doesn't output any more data
537 av_write_frame(ctx, NULL);
538 check(out_size == prev_pos, "More data written?");
540 memcpy(content, hash, HASH_SIZE);
541 // Ignore the trailer written here
544 init_out("delay-moov-header");
545 av_dict_set(&opts, "movflags", "frag_custom+delay_moov", 0);
546 av_dict_set(&opts, "use_editlist", "0", 0);
548 check(out_size == 0, "Output written during init with delay_moov");
549 mux_gops(1); // Write 1 second of content
550 av_write_frame(ctx, NULL); // Force writing the moov
552 check(!memcmp(hash, header, HASH_SIZE), "delay_moov header differs from empty_moov");
553 init_out("delay-moov-content");
554 av_write_frame(ctx, NULL); // Flush the first fragment
555 check(out_size == empty_moov_pos, "Manually flushed content differs from automatically flushed, %d vs %d", out_size, empty_moov_pos);
556 mux_gops(1); // Write the rest of the content
557 av_write_frame(ctx, NULL); // Flush the second fragment
559 check(!memcmp(hash, content, HASH_SIZE), "delay_moov content differs from empty_moov");
563 // Verify that we can produce an identical second fragment without
564 // writing the first one. First write the reference fragments that
565 // we want to reproduce.
566 av_dict_set(&opts, "movflags", "frag_custom+empty_moov+dash", 0);
569 av_write_frame(ctx, NULL); // Output the first fragment
570 init_out("empty-moov-second-frag");
572 av_write_frame(ctx, NULL); // Output the second fragment
574 memcpy(content, hash, HASH_SIZE);
577 // Produce the same second fragment without actually writing the first
579 av_dict_set(&opts, "movflags", "frag_custom+empty_moov+dash+frag_discont", 0);
580 av_dict_set(&opts, "fragment_index", "2", 0);
581 av_dict_set(&opts, "avoid_negative_ts", "0", 0);
582 av_dict_set(&opts, "use_editlist", "0", 0);
585 init_out("empty-moov-second-frag-discont");
587 av_write_frame(ctx, NULL); // Output the second fragment
589 check(!memcmp(hash, content, HASH_SIZE), "discontinuously written fragment differs");
592 // Produce the same thing by using delay_moov, which requires a slightly
593 // different call sequence.
594 av_dict_set(&opts, "movflags", "frag_custom+delay_moov+dash+frag_discont", 0);
595 av_dict_set(&opts, "fragment_index", "2", 0);
599 av_write_frame(ctx, NULL); // Output the moov
600 init_out("delay-moov-second-frag-discont");
601 av_write_frame(ctx, NULL); // Output the second fragment
603 check(!memcmp(hash, content, HASH_SIZE), "discontinuously written fragment differs");
607 // Test discontinuously written fragments with B-frames (where the
608 // assumption of starting at pts=0 works) but not with audio preroll
609 // (which can't be guessed).
610 av_dict_set(&opts, "movflags", "frag_custom+delay_moov+dash", 0);
613 init_out("delay-moov-elst-init");
614 av_write_frame(ctx, NULL); // Output the moov
616 memcpy(header, hash, HASH_SIZE);
617 av_write_frame(ctx, NULL); // Output the first fragment
618 init_out("delay-moov-elst-second-frag");
620 av_write_frame(ctx, NULL); // Output the second fragment
622 memcpy(content, hash, HASH_SIZE);
625 av_dict_set(&opts, "movflags", "frag_custom+delay_moov+dash+frag_discont", 0);
626 av_dict_set(&opts, "fragment_index", "2", 0);
629 mux_gops(1); // Write the second fragment
630 init_out("delay-moov-elst-init-discont");
631 av_write_frame(ctx, NULL); // Output the moov
633 check(!memcmp(hash, header, HASH_SIZE), "discontinuously written header differs");
634 init_out("delay-moov-elst-second-frag-discont");
635 av_write_frame(ctx, NULL); // Output the second fragment
637 check(!memcmp(hash, content, HASH_SIZE), "discontinuously written fragment differs");
641 // Test discontinuously written fragments with B-frames and audio preroll,
642 // properly signaled.
643 av_dict_set(&opts, "movflags", "frag_custom+delay_moov+dash", 0);
646 init_out("delay-moov-elst-signal-init");
647 av_write_frame(ctx, NULL); // Output the moov
649 memcpy(header, hash, HASH_SIZE);
650 av_write_frame(ctx, NULL); // Output the first fragment
651 init_out("delay-moov-elst-signal-second-frag");
653 av_write_frame(ctx, NULL); // Output the second fragment
655 memcpy(content, hash, HASH_SIZE);
658 av_dict_set(&opts, "movflags", "frag_custom+delay_moov+dash+frag_discont", 0);
659 av_dict_set(&opts, "fragment_index", "2", 0);
663 mux_gops(1); // Write the second fragment
664 init_out("delay-moov-elst-signal-init-discont");
665 av_write_frame(ctx, NULL); // Output the moov
667 check(!memcmp(hash, header, HASH_SIZE), "discontinuously written header differs");
668 init_out("delay-moov-elst-signal-second-frag-discont");
669 av_write_frame(ctx, NULL); // Output the second fragment
671 check(!memcmp(hash, content, HASH_SIZE), "discontinuously written fragment differs");
675 // Test muxing discontinuous fragments with very large (> (1<<31)) timestamps.
676 av_dict_set(&opts, "movflags", "frag_custom+delay_moov+dash+frag_discont", 0);
677 av_dict_set(&opts, "fragment_index", "2", 0);
681 mux_frames(gop_size, 1); // Write the second fragment
682 init_out("delay-moov-elst-signal-init-discont-largets");
683 av_write_frame(ctx, NULL); // Output the moov
685 init_out("delay-moov-elst-signal-second-frag-discont-largets");
686 av_write_frame(ctx, NULL); // Output the second fragment
690 // Test VFR content, with sidx atoms (which declare the pts duration
691 // of a fragment, forcing overriding the start pts of the next one).
692 // Here, the fragment duration in pts is significantly different from
693 // the duration in dts. The video stream starts at dts=-10,pts=0, and
694 // the second fragment starts at dts=155,pts=156. The trun duration sum
695 // of the first fragment is 165, which also is written as
696 // baseMediaDecodeTime in the tfdt in the second fragment. The sidx for
697 // the first fragment says earliest_presentation_time = 0 and
698 // subsegment_duration = 156, which also matches the sidx in the second
699 // fragment. For the audio stream, the pts and dts durations also don't
700 // match - the input stream starts at pts=-2048, but that part is excluded
703 av_dict_set(&opts, "movflags", "frag_keyframe+delay_moov+dash", 0);
705 mux_frames(gop_size/2, 0);
707 mux_frames(gop_size/2, 0);
712 // Test VFR content, with cleared duration fields. In these cases,
713 // the muxer must guess the duration of the last packet of each
714 // fragment. As long as the framerate doesn't vary (too much) at the
715 // fragment edge, it works just fine. Additionally, when automatically
716 // cutting fragments, the muxer already knows the timestamps of the next
717 // packet for one stream (in most cases the video stream), avoiding
718 // having to use guesses for that one.
719 init_count_warnings();
721 init_out("vfr-noduration");
722 av_dict_set(&opts, "movflags", "frag_keyframe+delay_moov+dash", 0);
724 mux_frames(gop_size/2, 0);
726 mux_frames(gop_size/2, 0);
731 reset_count_warnings();
732 check(num_warnings > 0, "No warnings printed for filled in durations");
734 // Test with an IO buffer size that is too small to hold a full fragment;
735 // this will cause write_data_type to be called with the type unknown.
736 force_iobuf_size = 1500;
737 init_out("large_frag");
738 av_dict_set(&opts, "movflags", "frag_keyframe+delay_moov", 0);
743 force_iobuf_size = 0;
745 // Test VFR content with bframes with interleaving.
746 // Here, using av_interleaved_write_frame allows the muxer to get the
747 // fragment end durations right. We always set the packet duration to
748 // the expected, but we simulate dropped frames at one point.
750 init_out("vfr-noduration-interleave");
751 av_dict_set(&opts, "movflags", "frag_keyframe+delay_moov", 0);
752 av_dict_set(&opts, "frag_duration", "650000", 0);
754 mux_frames(gop_size/2, 0);
755 // Pretend that the packet duration is the normal, even if
756 // we actually skip a bunch of frames. (I.e., simulate that
757 // we don't know of the framedrop in advance.)
758 fake_pkt_duration = duration;
761 fake_pkt_duration = 0;
763 mux_frames(gop_size/2 - 1, 0);
770 // Write a fragmented file with b-frames and audio preroll,
771 // with negative cts values, removing the edit list for the
773 init_out("delay-moov-elst-neg-cts");
774 av_dict_set(&opts, "movflags", "frag_keyframe+delay_moov+negative_cts_offsets", 0);
780 // Write a fragmented file with b-frames without audio preroll,
781 // with negative cts values, avoiding any edit lists, allowing
782 // to use empty_moov instead of delay_moov.
783 init_out("empty-moov-neg-cts");
784 av_dict_set(&opts, "movflags", "frag_keyframe+empty_moov+negative_cts_offsets", 0);
792 return check_faults > 0 ? 1 : 0;