2 * Copyright (c) 2012 Nicolas George
4 * This file is part of FFmpeg.
6 * FFmpeg is free software; you can redistribute it and/or
7 * modify it under the terms of the GNU Lesser General Public License
8 * as published by the Free Software Foundation; either
9 * version 2.1 of the License, or (at your option) any later version.
11 * FFmpeg is distributed in the hope that it will be useful,
12 * but WITHOUT ANY WARRANTY; without even the implied warranty of
13 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14 * GNU Lesser General Public License for more details.
16 * You should have received a copy of the GNU Lesser General Public License
17 * along with FFmpeg; if not, write to the Free Software Foundation, Inc.,
18 * 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
21 #include "libavutil/avassert.h"
22 #include "libavutil/avstring.h"
23 #include "libavutil/intreadwrite.h"
24 #include "libavutil/opt.h"
25 #include "libavutil/parseutils.h"
26 #include "libavutil/timestamp.h"
/*
 * Type declarations of the concat demuxer. Only some lines of these
 * declarations are visible here: the enumerators, several struct members and
 * the closing lines of each declaration are outside this view.
 */
31 typedef enum ConcatMatchMode {
/* Per-input-stream state, reached in this file through
 * cat->cur_file->streams[i]. */
36 typedef struct ConcatStream {
37 AVBitStreamFilterContext *bsf;
38 AVCodecContext *avctx;
/* Used as file->file_start_time in open_file(). */
45 int64_t file_start_time;
/* Used as cat->cur_file->streams; grown by match_streams(). */
48 ConcatStream *streams;
/* Used as file->metadata; packed into packet side data by
 * concat_read_packet(). */
51 AVDictionary *metadata;
/* Used as fields of the demuxer private context (cat->...); auto_convert and
 * segment_time_metadata are also exposed through the options table. */
64 ConcatMatchMode stream_match_mode;
65 unsigned auto_convert;
66 int segment_time_metadata;
/*
 * Probe callback: yields AVPROBE_SCORE_MAX when the first 20 bytes of the
 * probe buffer equal "ffconcat version 1.0", and 0 otherwise.
 * NOTE(review): 20 bytes are compared with no size check visible here;
 * presumably the probe buffer is guaranteed to be long enough -- confirm.
 */
69 static int concat_probe(AVProbeData *probe)
71 return memcmp(probe->buf, "ffconcat version 1.0", 20) ?
72 0 : AVPROBE_SCORE_MAX;
/*
 * Extracts the next whitespace-delimited word from the text at *cursor.
 * The start of the word (after skipping leading SPACE_CHARS) is kept in ret,
 * and *cursor is advanced past the word and past the whitespace after it.
 * The statements between these steps and the return are not visible here;
 * presumably the word is NUL-terminated in place and ret is returned --
 * confirm against the full file.
 */
75 static char *get_keyword(uint8_t **cursor)
/* Skip leading whitespace and remember where the word begins. */
77 char *ret = *cursor += strspn(*cursor, SPACE_CHARS);
/* Move to the first whitespace character after the word. */
78 *cursor += strcspn(*cursor, SPACE_CHARS);
/* Skip the whitespace that separates the word from what follows. */
81 *cursor += strspn(*cursor, SPACE_CHARS);
/*
 * Filename check used by add_file() when cat->safe > 0.
 * Only the character-class test is visible here: a character is accepted
 * when it is an ASCII letter, an ASCII digit, '_' or '-'. How other
 * characters and the overall result are handled is outside this view.
 */
86 static int safe_filename(const char *f)
88 const char *start = f;
/* (*f | 32) folds ASCII upper case onto lower case, so one unsigned range
 * test covers both 'a'..'z' and 'A'..'Z'. */
92 if (!((unsigned)((*f | 32) - 'a') < 26 ||
93 (unsigned)(*f - '0') < 10 || *f == '_' || *f == '-')) {
/* Stores retcode in the local variable `ret` and jumps to the local label
 * `fail`; the enclosing function must provide both. */
105 #define FAIL(retcode) do { ret = (retcode); goto fail; } while(0)
/*
 * Appends one entry for `filename` to cat->files.
 *
 * - When cat->safe > 0, a name rejected by safe_filename() fails with
 *   AVERROR(EPERM).
 * - A name that starts with its protocol name followed by ':' or ',' takes a
 *   branch whose body is not visible here; otherwise a URL buffer is
 *   allocated and filled by ff_make_absolute_url() relative to avf->filename.
 * - cat->files is grown by doubling (minimum 16 entries) with overflow checks
 *   on the element count and the byte size.
 * - The new entry is zeroed and its start_time, duration, inpoint and
 *   outpoint are set to AV_NOPTS_VALUE.
 *
 * Errors go through FAIL(); the cleanup at the `fail` label, the use of
 * `rfile` and the update of *nb_files_alloc are outside this view.
 */
107 static int add_file(AVFormatContext *avf, char *filename, ConcatFile **rfile,
108 unsigned *nb_files_alloc)
110 ConcatContext *cat = avf->priv_data;
114 size_t url_len, proto_len;
117 if (cat->safe > 0 && !safe_filename(filename)) {
118 av_log(avf, AV_LOG_ERROR, "Unsafe file name '%s'\n", filename);
119 FAIL(AVERROR(EPERM));
122 proto = avio_find_protocol_name(filename);
123 proto_len = proto ? strlen(proto) : 0;
/* NOTE(review): when proto is NULL, proto_len is 0 and memcmp() is called
 * with a NULL pointer. The comparison then yields 0, so the test reduces to
 * "filename[0] is ':' or ','". Passing NULL to memcmp() is undefined
 * behaviour in ISO C even for a zero length -- consider testing proto
 * first. */
124 if (!memcmp(filename, proto, proto_len) &&
125 (filename[proto_len] == ':' || filename[proto_len] == ',')) {
/* Extra bytes of slack on top of the two string lengths for the combined
 * URL. */
129 url_len = strlen(avf->filename) + strlen(filename) + 16;
130 if (!(url = av_malloc(url_len)))
131 FAIL(AVERROR(ENOMEM));
132 ff_make_absolute_url(url, url_len, avf->filename, filename);
/* Grow the file table when it is full. */
136 if (cat->nb_files >= *nb_files_alloc) {
137 size_t n = FFMAX(*nb_files_alloc * 2, 16);
138 ConcatFile *new_files;
/* n <= nb_files catches wrap-around of the doubling; the SIZE_MAX test
 * catches overflow of the byte count passed to av_realloc(). */
139 if (n <= cat->nb_files || n > SIZE_MAX / sizeof(*cat->files) ||
140 !(new_files = av_realloc(cat->files, n * sizeof(*cat->files))))
141 FAIL(AVERROR(ENOMEM));
142 cat->files = new_files;
146 file = &cat->files[cat->nb_files++];
147 memset(file, 0, sizeof(*file));
/* All timing fields start out as "unknown". */
151 file->start_time = AV_NOPTS_VALUE;
152 file->duration = AV_NOPTS_VALUE;
153 file->inpoint = AV_NOPTS_VALUE;
154 file->outpoint = AV_NOPTS_VALUE;
/*
 * Copies properties of source_st (a stream of the currently opened file) to
 * st (a stream of the concat demuxer).
 *
 * When st already has a codec id, or the source has none, only extradata is
 * handled: st's extradata buffer is reallocated if it is smaller than the
 * source's, and the source extradata bytes are copied into it. Otherwise the
 * full codec parameters are copied with avcodec_parameters_copy(), followed
 * by frame rates, time base, sample aspect ratio and metadata.
 *
 * The error checks and return statements between these steps are not visible
 * in this view.
 */
164 static int copy_stream_props(AVStream *st, AVStream *source_st)
168 if (st->codecpar->codec_id || !source_st->codecpar->codec_id) {
169 if (st->codecpar->extradata_size < source_st->codecpar->extradata_size) {
170 if (st->codecpar->extradata) {
171 av_freep(&st->codecpar->extradata);
172 st->codecpar->extradata_size = 0;
174 ret = ff_alloc_extradata(st->codecpar,
175 source_st->codecpar->extradata_size);
179 memcpy(st->codecpar->extradata, source_st->codecpar->extradata,
180 source_st->codecpar->extradata_size);
183 if ((ret = avcodec_parameters_copy(st->codecpar, source_st->codecpar)) < 0)
185 /* We don't want to carry around MP4-style extradata, since we are using a bsf anyway. */
186 if (st->codecpar->codec_id == AV_CODEC_ID_H264) {
187 av_freep(&st->codecpar->extradata);
188 st->codecpar->extradata_size = 0;
190 st->r_frame_rate = source_st->r_frame_rate;
191 st->avg_frame_rate = source_st->avg_frame_rate;
192 st->time_base = source_st->time_base;
193 st->sample_aspect_ratio = source_st->sample_aspect_ratio;
195 av_dict_copy(&st->metadata, source_st->metadata, 0);
/*
 * Per-stream setup for stream `idx` of the currently opened file.
 *
 * When cat->auto_convert is set and the stream is H.264 whose extradata is
 * shorter than 4 bytes or whose first 32-bit value read with AV_RB32() is
 * not 1, the "h264_mp4toannexb" bitstream filter is initialised; if it is
 * unavailable the function returns AVERROR_BSF_NOT_FOUND. A codec context is
 * then allocated in cs->avctx and filled from the stream's codec parameters.
 *
 * The statements that attach bsf to cs, the conditions guarding the ENOMEM
 * return and the avcodec_free_context() call, and the final return are not
 * visible here.
 */
199 static int detect_stream_specific(AVFormatContext *avf, int idx)
201 ConcatContext *cat = avf->priv_data;
202 AVStream *st = cat->avf->streams[idx];
203 ConcatStream *cs = &cat->cur_file->streams[idx];
204 AVBitStreamFilterContext *bsf;
/* presumably a leading 00 00 00 01 marks Annex B extradata that needs no
 * conversion -- confirm. */
207 if (cat->auto_convert && st->codecpar->codec_id == AV_CODEC_ID_H264 &&
208 (st->codecpar->extradata_size < 4 || AV_RB32(st->codecpar->extradata) != 1)) {
209 av_log(cat->avf, AV_LOG_INFO,
210 "Auto-inserting h264_mp4toannexb bitstream filter\n");
211 if (!(bsf = av_bitstream_filter_init("h264_mp4toannexb"))) {
212 av_log(avf, AV_LOG_ERROR, "h264_mp4toannexb bitstream filter "
213 "required for H.264 streams\n");
214 return AVERROR_BSF_NOT_FOUND;
218 cs->avctx = avcodec_alloc_context3(NULL);
220 return AVERROR(ENOMEM);
222 ret = avcodec_parameters_to_context(cs->avctx, st->codecpar);
224 avcodec_free_context(&cs->avctx);
/*
 * Maps each not-yet-mapped stream i of the current file to output stream i.
 * An existing output stream with that index is reused; otherwise a new one
 * is created (AVERROR(ENOMEM) on failure). Stream properties are copied with
 * copy_stream_props() and the mapping is stored in out_stream_index.
 * The error return after copy_stream_props() and the final return are not
 * visible here.
 */
232 static int match_streams_one_to_one(AVFormatContext *avf)
234 ConcatContext *cat = avf->priv_data;
/* Start at cur_file->nb_streams: lower indices were handled earlier. */
238 for (i = cat->cur_file->nb_streams; i < cat->avf->nb_streams; i++) {
239 if (i < avf->nb_streams) {
240 st = avf->streams[i];
242 if (!(st = avformat_new_stream(avf, NULL)))
243 return AVERROR(ENOMEM);
245 if ((ret = copy_stream_props(st, cat->avf->streams[i])) < 0)
247 cat->cur_file->streams[i].out_stream_index = i;
/*
 * Maps each not-yet-mapped stream of the current file to the output stream
 * that has the same `id`. For every match the pairing is logged at verbose
 * level, stream properties are copied with copy_stream_props() and the
 * output index j is stored in out_stream_index.
 * The remaining av_log() arguments, the error return and whatever follows a
 * match inside the inner loop are not visible here.
 */
252 static int match_streams_exact_id(AVFormatContext *avf)
254 ConcatContext *cat = avf->priv_data;
258 for (i = cat->cur_file->nb_streams; i < cat->avf->nb_streams; i++) {
259 st = cat->avf->streams[i];
260 for (j = 0; j < avf->nb_streams; j++) {
261 if (avf->streams[j]->id == st->id) {
262 av_log(avf, AV_LOG_VERBOSE,
263 "Match slave stream #%d with stream #%d id 0x%x\n",
265 if ((ret = copy_stream_props(avf->streams[j], st)) < 0)
267 cat->cur_file->streams[i].out_stream_index = j;
/*
 * Brings the current file's stream map up to date with the streams that the
 * opened file currently exposes.
 *
 * Steps visible here: test whether the file has more streams than the map
 * covers; grow the map with av_realloc() (AVERROR(ENOMEM) on failure); zero
 * the new entries and mark them unmapped (out_stream_index = -1); run the
 * matcher selected by cat->stream_match_mode; call detect_stream_specific()
 * on each new stream; finally record the new stream count.
 *
 * The action taken when nothing is new, the remaining switch cases and the
 * error returns are not visible in this view.
 */
274 static int match_streams(AVFormatContext *avf)
276 ConcatContext *cat = avf->priv_data;
280 if (cat->cur_file->nb_streams >= cat->avf->nb_streams)
/* The result is stored in a temporary first, so the old array is not
 * overwritten by a failed reallocation. */
282 map = av_realloc(cat->cur_file->streams,
283 cat->avf->nb_streams * sizeof(*map));
285 return AVERROR(ENOMEM);
286 cat->cur_file->streams = map;
287 memset(map + cat->cur_file->nb_streams, 0,
288 (cat->avf->nb_streams - cat->cur_file->nb_streams) * sizeof(*map));
/* -1 means "no output stream"; concat_read_packet() tests for < 0. */
290 for (i = cat->cur_file->nb_streams; i < cat->avf->nb_streams; i++)
291 map[i].out_stream_index = -1;
292 switch (cat->stream_match_mode) {
293 case MATCH_ONE_TO_ONE:
294 ret = match_streams_one_to_one(avf);
297 ret = match_streams_exact_id(avf);
304 for (i = cat->cur_file->nb_streams; i < cat->avf->nb_streams; i++)
305 if ((ret = detect_stream_specific(avf, i)) < 0)
307 cat->cur_file->nb_streams = cat->avf->nb_streams;
/*
 * Opens entry `fileno` of cat->files as the current input.
 *
 * Visible steps:
 *  - close cat->avf and allocate a fresh context (AVERROR(ENOMEM) on
 *    failure), inheriting the interrupt callback and the white/blacklists
 *    of avf;
 *  - open file->url and probe its streams; on failure log and close;
 *  - derive timing: an unknown start_time becomes 0 for the first file or
 *    the previous file's start_time + duration; file_start_time is the
 *    opened file's start_time (0 if unknown); file_inpoint is the configured
 *    inpoint or, if none, file_start_time; an unknown duration is derived
 *    from outpoint - file_inpoint when an outpoint is set;
 *  - when cat->segment_time_metadata is set, store start time (and duration
 *    if known) in file->metadata;
 *  - match streams, then seek to the inpoint if one is configured.
 *
 * Guards and error returns between these steps are not visible here.
 */
311 static int open_file(AVFormatContext *avf, unsigned fileno)
313 ConcatContext *cat = avf->priv_data;
314 ConcatFile *file = &cat->files[fileno];
318 avformat_close_input(&cat->avf);
320 cat->avf = avformat_alloc_context();
322 return AVERROR(ENOMEM);
324 cat->avf->interrupt_callback = avf->interrupt_callback;
326 if ((ret = ff_copy_whiteblacklists(cat->avf, avf)) < 0)
329 if ((ret = avformat_open_input(&cat->avf, file->url, NULL, NULL)) < 0 ||
330 (ret = avformat_find_stream_info(cat->avf, NULL)) < 0) {
331 av_log(avf, AV_LOG_ERROR, "Impossible to open '%s'\n", file->url);
332 avformat_close_input(&cat->avf);
335 cat->cur_file = file;
/* NOTE(review): this sum relies on the previous file's duration being known
 * at this point; open_next_file() fills it in before calling here -- confirm
 * for the seek path. */
336 if (file->start_time == AV_NOPTS_VALUE)
337 file->start_time = !fileno ? 0 :
338 cat->files[fileno - 1].start_time +
339 cat->files[fileno - 1].duration;
340 file->file_start_time = (cat->avf->start_time == AV_NOPTS_VALUE) ? 0 : cat->avf->start_time;
341 file->file_inpoint = (file->inpoint == AV_NOPTS_VALUE) ? file->file_start_time : file->inpoint;
342 if (file->duration == AV_NOPTS_VALUE && file->outpoint != AV_NOPTS_VALUE)
343 file->duration = file->outpoint - file->file_inpoint;
345 if (cat->segment_time_metadata) {
346 av_dict_set_int(&file->metadata, "lavf.concatdec.start_time", file->start_time, 0);
347 if (file->duration != AV_NOPTS_VALUE)
348 av_dict_set_int(&file->metadata, "lavf.concatdec.duration", file->duration, 0);
351 if ((ret = match_streams(avf)) < 0)
353 if (file->inpoint != AV_NOPTS_VALUE) {
354 if ((ret = avformat_seek_file(cat->avf, -1, INT64_MIN, file->inpoint, file->inpoint, 0)) < 0)
/*
 * Close callback: releases everything owned by the demuxer context.
 * For each file entry it frees the URL, each stream's codec context and
 * bitstream filter, the stream map and the metadata dictionary; it then
 * closes the currently opened input and frees the file table.
 * The return statement is not visible here.
 */
360 static int concat_read_close(AVFormatContext *avf)
362 ConcatContext *cat = avf->priv_data;
365 for (i = 0; i < cat->nb_files; i++) {
366 av_freep(&cat->files[i].url);
367 for (j = 0; j < cat->files[i].nb_streams; j++) {
368 if (cat->files[i].streams[j].avctx)
369 avcodec_free_context(&cat->files[i].streams[j].avctx);
370 if (cat->files[i].streams[j].bsf)
371 av_bitstream_filter_close(cat->files[i].streams[j].bsf);
373 av_freep(&cat->files[i].streams);
374 av_dict_free(&cat->files[i].metadata);
377 avformat_close_input(&cat->avf);
378 av_freep(&cat->files);
/*
 * Header callback: parses the concat script read from avf->pb and opens the
 * first listed file.
 *
 * Lines are read with ff_get_line(); the first word of each line is taken
 * with get_keyword(). Empty lines and lines whose first word starts with '#'
 * are recognised separately. Directives handled in the visible code:
 *   file <name>                      - add an entry through add_file()
 *   duration|inpoint|outpoint <time> - parsed with av_parse_time(); applies
 *                                      to the most recent file
 *   file_packet_metadata <k=v>       - parsed into the most recent file's
 *                                      metadata dictionary
 *   stream                           - create an output stream
 *   exact_stream_id <id>             - set the id of the newest stream
 *   ffconcat version 1.0             - version check
 * Anything else is reported as an unknown keyword (AVERROR_INVALIDDATA).
 *
 * After parsing, start times are accumulated over the files and, when the
 * loop reaches the end of the list, avf->duration is set to the total. The
 * match mode is MATCH_EXACT_ID when at least one stream was declared; the
 * alternative value is not visible here. On failure concat_read_close() is
 * called. Several conditions, frees and returns are outside this view.
 */
382 static int concat_read_header(AVFormatContext *avf)
384 ConcatContext *cat = avf->priv_data;
386 uint8_t *cursor, *keyword;
387 int ret, line = 0, i;
388 unsigned nb_files_alloc = 0;
389 ConcatFile *file = NULL;
393 if ((ret = ff_get_line(avf->pb, buf, sizeof(buf))) <= 0)
397 keyword = get_keyword(&cursor);
398 if (!*keyword || *keyword == '#')
401 if (!strcmp(keyword, "file")) {
402 char *filename = av_get_token((const char **)&cursor, SPACE_CHARS);
404 av_log(avf, AV_LOG_ERROR, "Line %d: filename required\n", line);
405 FAIL(AVERROR_INVALIDDATA);
407 if ((ret = add_file(avf, filename, &file, &nb_files_alloc)) < 0)
409 } else if (!strcmp(keyword, "duration") || !strcmp(keyword, "inpoint") || !strcmp(keyword, "outpoint")) {
410 char *dur_str = get_keyword(&cursor);
413 av_log(avf, AV_LOG_ERROR, "Line %d: %s without file\n",
415 FAIL(AVERROR_INVALIDDATA);
417 if ((ret = av_parse_time(&dur, dur_str, 1)) < 0) {
418 av_log(avf, AV_LOG_ERROR, "Line %d: invalid %s '%s'\n",
419 line, keyword, dur_str);
422 if (!strcmp(keyword, "duration"))
423 file->duration = dur;
424 else if (!strcmp(keyword, "inpoint"))
426 else if (!strcmp(keyword, "outpoint"))
427 file->outpoint = dur;
428 } else if (!strcmp(keyword, "file_packet_metadata")) {
431 av_log(avf, AV_LOG_ERROR, "Line %d: %s without file\n",
433 FAIL(AVERROR_INVALIDDATA);
435 metadata = av_get_token((const char **)&cursor, SPACE_CHARS);
437 av_log(avf, AV_LOG_ERROR, "Line %d: packet metadata required\n", line);
438 FAIL(AVERROR_INVALIDDATA);
440 if ((ret = av_dict_parse_string(&file->metadata, metadata, "=", "", 0)) < 0) {
441 av_log(avf, AV_LOG_ERROR, "Line %d: failed to parse metadata string\n", line);
443 FAIL(AVERROR_INVALIDDATA);
446 } else if (!strcmp(keyword, "stream")) {
447 if (!avformat_new_stream(avf, NULL))
448 FAIL(AVERROR(ENOMEM));
449 } else if (!strcmp(keyword, "exact_stream_id")) {
450 if (!avf->nb_streams) {
451 av_log(avf, AV_LOG_ERROR, "Line %d: exact_stream_id without stream\n",
453 FAIL(AVERROR_INVALIDDATA);
/* NOTE(review): the strtol() result is stored without an end-pointer or
 * range check, so a missing or malformed id silently becomes 0 or a
 * truncated value. */
455 avf->streams[avf->nb_streams - 1]->id =
456 strtol(get_keyword(&cursor), NULL, 0);
457 } else if (!strcmp(keyword, "ffconcat")) {
458 char *ver_kw = get_keyword(&cursor);
459 char *ver_val = get_keyword(&cursor);
460 if (strcmp(ver_kw, "version") || strcmp(ver_val, "1.0")) {
461 av_log(avf, AV_LOG_ERROR, "Line %d: invalid version\n", line);
462 FAIL(AVERROR_INVALIDDATA);
467 av_log(avf, AV_LOG_ERROR, "Line %d: unknown keyword '%s'\n",
469 FAIL(AVERROR_INVALIDDATA);
475 FAIL(AVERROR_INVALIDDATA);
/* Lay the files out on a common timeline: a file without an explicit start
 * time begins where the running total `time` currently stands. */
477 for (i = 0; i < cat->nb_files; i++) {
478 if (cat->files[i].start_time == AV_NOPTS_VALUE)
479 cat->files[i].start_time = time;
481 time = cat->files[i].start_time;
482 if (cat->files[i].duration == AV_NOPTS_VALUE) {
/* Without an explicit duration, one can only be derived when both inpoint
 * and outpoint are given. The statement executed otherwise is not visible;
 * presumably it leaves the loop early -- confirm. */
483 if (cat->files[i].inpoint == AV_NOPTS_VALUE || cat->files[i].outpoint == AV_NOPTS_VALUE)
485 cat->files[i].duration = cat->files[i].outpoint - cat->files[i].inpoint;
487 time += cat->files[i].duration;
/* i == nb_files means the loop above ran over every file. */
489 if (i == cat->nb_files) {
490 avf->duration = time;
494 cat->stream_match_mode = avf->nb_streams ? MATCH_EXACT_ID :
496 if ((ret = open_file(avf, 0)) < 0)
501 concat_read_close(avf);
/*
 * Switches to the file that follows the current one in cat->files.
 * If the current file's duration is still unknown it is first derived from
 * the opened file's duration minus the part skipped before the inpoint
 * (file_inpoint - file_start_time). The action taken when the current file
 * was the last one is not visible here; otherwise the result of open_file()
 * is returned.
 */
505 static int open_next_file(AVFormatContext *avf)
507 ConcatContext *cat = avf->priv_data;
/* Index of the current file, recovered by pointer difference. */
508 unsigned fileno = cat->cur_file - cat->files;
510 if (cat->cur_file->duration == AV_NOPTS_VALUE)
511 cat->cur_file->duration = cat->avf->duration - (cat->cur_file->file_inpoint - cat->cur_file->file_start_time);
513 if (++fileno >= cat->nb_files) {
517 return open_file(avf, fileno);
/*
 * Runs pkt through the chain of bitstream filters attached to cs.
 *
 * For each filter in the cs->bsf list, av_bitstream_filter_filter() is
 * called with cs->avctx and the packet payload; the output goes to a second
 * packet (pkt2). If the filter context ends up with more extradata than the
 * output stream has, the output stream's extradata is reallocated and
 * refreshed from cs->avctx. The later part deals with ownership of the
 * filtered data (av_copy_packet() / av_buffer_create()); its exact
 * conditions, the error paths and the final return are not fully visible
 * here.
 */
520 static int filter_packet(AVFormatContext *avf, ConcatStream *cs, AVPacket *pkt)
/* NOTE(review): avf->streams[] is indexed with cs->out_stream_index here,
 * before the av_assert0() below verifies that the index is non-negative. */
522 AVStream *st = avf->streams[cs->out_stream_index];
523 AVBitStreamFilterContext *bsf;
527 av_assert0(cs->out_stream_index >= 0);
528 for (bsf = cs->bsf; bsf; bsf = bsf->next) {
531 ret = av_bitstream_filter_filter(bsf, cs->avctx, NULL,
532 &pkt2.data, &pkt2.size,
533 pkt->data, pkt->size,
534 !!(pkt->flags & AV_PKT_FLAG_KEY));
536 av_packet_unref(pkt);
/* Propagate extradata produced by the filter to the output stream. */
540 if (cs->avctx->extradata_size > st->codecpar->extradata_size) {
542 if (st->codecpar->extradata)
543 av_freep(&st->codecpar->extradata);
545 eret = ff_alloc_extradata(st->codecpar, cs->avctx->extradata_size);
547 av_packet_unref(pkt);
548 return AVERROR(ENOMEM);
550 st->codecpar->extradata_size = cs->avctx->extradata_size;
551 memcpy(st->codecpar->extradata, cs->avctx->extradata, cs->avctx->extradata_size);
554 av_assert0(pkt2.buf);
555 if (ret == 0 && pkt2.data != pkt->data) {
556 if ((ret = av_copy_packet(&pkt2, pkt)) < 0) {
563 av_packet_unref(pkt);
/* Wrap the filter output in a reference-counted buffer that is released
 * with av_buffer_default_free. */
564 pkt2.buf = av_buffer_create(pkt2.data, pkt2.size,
565 av_buffer_default_free, NULL, 0);
568 return AVERROR(ENOMEM);
/* The comparison is only made when both the current file's outpoint and the
 * packet dts are set; dts is taken in the time base of the packet's stream
 * in the opened file, the outpoint in AV_TIME_BASE_Q. The value returned
 * when either is unset is not visible here. */
576 /* Returns true if the packet dts is greater or equal to the specified outpoint. */
577 static int packet_after_outpoint(ConcatContext *cat, AVPacket *pkt)
579 if (cat->cur_file->outpoint != AV_NOPTS_VALUE && pkt->dts != AV_NOPTS_VALUE) {
580 return av_compare_ts(pkt->dts, cat->avf->streams[pkt->stream_index]->time_base,
581 cat->cur_file->outpoint, AV_TIME_BASE_Q) >= 0;
/*
 * Packet callback: returns the next packet of the concatenated stream.
 *
 * Visible steps:
 *  - read a packet from the current file; on AVERROR_EOF move on with
 *    open_next_file();
 *  - refresh the stream map with match_streams();
 *  - when the packet lies at or after the file's outpoint, drop it and move
 *    to the next file;
 *  - drop packets of streams that have no output mapping
 *    (out_stream_index < 0);
 *  - renumber the packet to its output stream and run filter_packet();
 *  - compute `delta` = (start_time - file_inpoint) rescaled to the stream
 *    time base, logging timestamps before and after; the statements that
 *    apply delta to pts/dts are not visible here;
 *  - when the file carries metadata, pack it and attach it as
 *    AV_PKT_DATA_STRINGS_METADATA side data.
 *
 * The loop structure, error returns and the final return are outside this
 * view.
 */
586 static int concat_read_packet(AVFormatContext *avf, AVPacket *pkt)
588 ConcatContext *cat = avf->priv_data;
601 ret = av_read_frame(cat->avf, pkt);
602 if (ret == AVERROR_EOF) {
603 if ((ret = open_next_file(avf)) < 0)
609 if ((ret = match_streams(avf)) < 0) {
610 av_packet_unref(pkt);
613 if (packet_after_outpoint(cat, pkt)) {
614 av_packet_unref(pkt);
615 if ((ret = open_next_file(avf)) < 0)
619 cs = &cat->cur_file->streams[pkt->stream_index];
620 if (cs->out_stream_index < 0) {
621 av_packet_unref(pkt);
624 pkt->stream_index = cs->out_stream_index;
627 if ((ret = filter_packet(avf, cs, pkt)))
/* NOTE(review): pkt->stream_index was rewritten to the OUTPUT stream index
 * above, yet here and in the av_rescale_q() call below it indexes
 * cat->avf->streams, the streams of the opened file. With exact-id matching
 * the two indices can differ -- confirm which stream's time base is
 * intended. */
630 st = cat->avf->streams[pkt->stream_index];
631 av_log(avf, AV_LOG_DEBUG, "file:%d stream:%d pts:%s pts_time:%s dts:%s dts_time:%s",
632 (unsigned)(cat->cur_file - cat->files), pkt->stream_index,
633 av_ts2str(pkt->pts), av_ts2timestr(pkt->pts, &st->time_base),
634 av_ts2str(pkt->dts), av_ts2timestr(pkt->dts, &st->time_base));
636 delta = av_rescale_q(cat->cur_file->start_time - cat->cur_file->file_inpoint,
638 cat->avf->streams[pkt->stream_index]->time_base);
639 if (pkt->pts != AV_NOPTS_VALUE)
641 if (pkt->dts != AV_NOPTS_VALUE)
643 av_log(avf, AV_LOG_DEBUG, " -> pts:%s pts_time:%s dts:%s dts_time:%s\n",
644 av_ts2str(pkt->pts), av_ts2timestr(pkt->pts, &st->time_base),
645 av_ts2str(pkt->dts), av_ts2timestr(pkt->dts, &st->time_base));
646 if (cat->cur_file->metadata) {
/* The packed copy is temporary: its bytes are copied into the packet's side
 * data and the copy is freed on both the success and the failure path. */
649 char* packed_metadata = av_packet_pack_dictionary(cat->cur_file->metadata, &metadata_len);
650 if (!packed_metadata)
651 return AVERROR(ENOMEM);
652 if (!(metadata = av_packet_new_side_data(pkt, AV_PKT_DATA_STRINGS_METADATA, metadata_len))) {
653 av_freep(&packed_metadata);
654 return AVERROR(ENOMEM);
656 memcpy(metadata, packed_metadata, metadata_len);
657 av_freep(&packed_metadata);
/*
 * Converts a seek interval [*min_ts, *max_ts] and its target *ts from time
 * base tb_in to tb_out, in place. The lower bound is rounded up and the
 * upper bound rounded down; both use AV_ROUND_PASS_MINMAX (presumably so
 * that INT64_MIN / INT64_MAX sentinels survive the conversion -- confirm
 * against the libavutil documentation).
 */
662 static void rescale_interval(AVRational tb_in, AVRational tb_out,
663 int64_t *min_ts, int64_t *ts, int64_t *max_ts)
665 *ts = av_rescale_q (* ts, tb_in, tb_out);
666 *min_ts = av_rescale_q_rnd(*min_ts, tb_in, tb_out,
667 AV_ROUND_UP | AV_ROUND_PASS_MINMAX);
668 *max_ts = av_rescale_q_rnd(*max_ts, tb_in, tb_out,
669 AV_ROUND_DOWN | AV_ROUND_PASS_MINMAX);
/*
 * Seeks inside the currently opened file.
 * The bounds are shifted by t0 = start_time - file_inpoint of the current
 * file, leaving the INT64_MIN / INT64_MAX sentinels untouched; they are then
 * rescaled from AV_TIME_BASE_Q to the time base of the selected stream of
 * the opened file and passed to avformat_seek_file().
 * The adjustment of `ts`, the handling of a stream index beyond the opened
 * file's streams, and any guard around the rescaling are not visible here.
 */
672 static int try_seek(AVFormatContext *avf, int stream,
673 int64_t min_ts, int64_t ts, int64_t max_ts, int flags)
675 ConcatContext *cat = avf->priv_data;
676 int64_t t0 = cat->cur_file->start_time - cat->cur_file->file_inpoint;
679 min_ts = min_ts == INT64_MIN ? INT64_MIN : min_ts - t0;
680 max_ts = max_ts == INT64_MAX ? INT64_MAX : max_ts - t0;
682 if (stream >= cat->avf->nb_streams)
684 rescale_interval(AV_TIME_BASE_Q, cat->avf->streams[stream]->time_base,
685 &min_ts, &ts, &max_ts);
687 return avformat_seek_file(cat->avf, stream, min_ts, ts, max_ts, flags);
/*
 * Locates the file that should contain `ts` and seeks inside it.
 * The request is first rescaled from the output stream's time base to
 * AV_TIME_BASE_Q (an out-of-range stream index gives AVERROR(EINVAL)). A
 * bisection over cat->files compares ts with each file's start_time; the
 * file at index `left` is opened and try_seek() is called. Under a condition
 * that is only partly visible, and when a following file exists whose
 * start_time is below max_ts, that next file is opened and the seek is
 * retried there.
 * The bisection updates, the initial value of `left` and the returns are not
 * visible in this view.
 */
690 static int real_seek(AVFormatContext *avf, int stream,
691 int64_t min_ts, int64_t ts, int64_t max_ts, int flags)
693 ConcatContext *cat = avf->priv_data;
694 int ret, left, right;
697 if (stream >= avf->nb_streams)
698 return AVERROR(EINVAL);
699 rescale_interval(avf->streams[stream]->time_base, AV_TIME_BASE_Q,
700 &min_ts, &ts, &max_ts);
704 right = cat->nb_files;
705 while (right - left > 1) {
706 int mid = (left + right) / 2;
707 if (ts < cat->files[mid].start_time)
713 if ((ret = open_file(avf, left)) < 0)
716 ret = try_seek(avf, stream, min_ts, ts, max_ts, flags);
718 left < cat->nb_files - 1 &&
719 cat->files[left + 1].start_time < max_ts) {
720 if ((ret = open_file(avf, left + 1)) < 0)
722 ret = try_seek(avf, stream, min_ts, ts, max_ts, flags);
/*
 * Seek callback (installed as read_seek2).
 * The current file and opened context are saved before real_seek() is
 * attempted. If real_seek() fails, the context it left behind is closed and
 * the saved state is restored; the other visible branch closes the saved
 * context instead. Byte- and frame-based seeking is refused with
 * AVERROR(ENOSYS). The condition for the AVERROR(ESPIPE) return, the
 * statements surrounding the real_seek() call and the final return are not
 * visible here.
 */
727 static int concat_seek(AVFormatContext *avf, int stream,
728 int64_t min_ts, int64_t ts, int64_t max_ts, int flags)
730 ConcatContext *cat = avf->priv_data;
731 ConcatFile *cur_file_saved = cat->cur_file;
732 AVFormatContext *cur_avf_saved = cat->avf;
736 return AVERROR(ESPIPE); /* XXX: can we use it? */
737 if (flags & (AVSEEK_FLAG_BYTE | AVSEEK_FLAG_FRAME))
738 return AVERROR(ENOSYS);
740 if ((ret = real_seek(avf, stream, min_ts, ts, max_ts, flags)) < 0) {
742 avformat_close_input(&cat->avf);
743 cat->avf = cur_avf_saved;
744 cat->cur_file = cur_file_saved;
746 avformat_close_input(&cur_avf_saved);
/* OFFSET() gives the byte offset of a ConcatContext field for the option
 * table; DEC is shorthand for the decoding-parameter flag. */
752 #define OFFSET(x) offsetof(ConcatContext, x)
753 #define DEC AV_OPT_FLAG_DECODING_PARAM
/*
 * Options of the demuxer:
 *   safe                  - default 1, accepted range -1..1
 *   auto_convert          - default 1, range 0..1
 *   segment_time_metadata - default 0, range 0..1
 * The table terminator is not visible in this view.
 */
755 static const AVOption options[] = {
756 { "safe", "enable safe mode",
757 OFFSET(safe), AV_OPT_TYPE_BOOL, {.i64 = 1}, -1, 1, DEC },
758 { "auto_convert", "automatically convert bitstream format",
759 OFFSET(auto_convert), AV_OPT_TYPE_BOOL, {.i64 = 1}, 0, 1, DEC },
760 { "segment_time_metadata", "output file segment start time and duration as packet metadata",
761 OFFSET(segment_time_metadata), AV_OPT_TYPE_BOOL, {.i64 = 0}, 0, 1, DEC },
/* AVClass of the demuxer's private context; referenced by
 * ff_concat_demuxer.priv_class. One initializer line is not visible in this
 * view. */
765 static const AVClass concat_class = {
766 .class_name = "concat demuxer",
767 .item_name = av_default_item_name,
769 .version = LIBAVUTIL_VERSION_INT,
/* Demuxer registration: wires the probe, header, packet, close and seek
 * callbacks defined in this file to the AVInputFormat entry. The .name
 * initializer and the closing line are not visible in this view. */
773 AVInputFormat ff_concat_demuxer = {
775 .long_name = NULL_IF_CONFIG_SMALL("Virtual concatenation script"),
776 .priv_data_size = sizeof(ConcatContext),
777 .read_probe = concat_probe,
778 .read_header = concat_read_header,
779 .read_packet = concat_read_packet,
780 .read_close = concat_read_close,
781 .read_seek2 = concat_seek,
782 .priv_class = &concat_class,