2 * muxing functions for use within Libav
3 * Copyright (c) 2000, 2001, 2002 Fabrice Bellard
5 * This file is part of Libav.
7 * Libav is free software; you can redistribute it and/or
8 * modify it under the terms of the GNU Lesser General Public
9 * License as published by the Free Software Foundation; either
10 * version 2.1 of the License, or (at your option) any later version.
12 * Libav is distributed in the hope that it will be useful,
13 * but WITHOUT ANY WARRANTY; without even the implied warranty of
14 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
15 * Lesser General Public License for more details.
17 * You should have received a copy of the GNU Lesser General Public
18 * License along with Libav; if not, write to the Free Software
19 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
23 #include "avio_internal.h"
25 #include "libavcodec/internal.h"
26 #include "libavcodec/bytestream.h"
27 #include "libavutil/opt.h"
28 #include "libavutil/dict.h"
29 #include "libavutil/pixdesc.h"
32 #include "libavutil/avassert.h"
33 #include "libavutil/avstring.h"
34 #include "libavutil/mathematics.h"
35 #include "libavutil/parseutils.h"
36 #include "libavutil/time.h"
38 #include "audiointerleave.h"
50 * muxing functions for use within Libav
53 /* fraction handling */
56 * f = val + (num / den) + 0.5.
58 * 'num' is normalized so that 0 <= num < den.
60 * @param f fractional number
61 * @param val integer value
62 * @param num must be >= 0
63 * @param den must be >= 1
/* Initialize the fraction f from an integer part (val) and a fractional
 * part expressed as num/den. */
65 static void frac_init(AVFrac *f, int64_t val, int64_t num, int64_t den)
78 * Fractional addition to f: f = f + (incr / f->den).
80 * @param f fractional number
81 * @param incr increment, can be positive or negative
/* Add incr, expressed in units of 1/f->den, to the fraction f. */
83 static void frac_add(AVFrac *f, int64_t incr)
/* Branch taken when the numerator has reached or exceeded the denominator. */
96 } else if (num >= den) {
/* Check the codec tag of stream st against the codec tag tables of the
 * output format of s. Callers in this file treat a zero result as
 * "tag incompatible with the codec id". */
103 static int validate_codec_tag(AVFormatContext *s, AVStream *st)
105 const AVCodecTag *avctag;
107 enum AVCodecID id = AV_CODEC_ID_NONE;
108 unsigned int tag = 0;
111 * Check that tag + id is in the table
112 * If neither is in the table -> OK
113 * If tag is in the table with another id -> FAIL
114 * If id is in the table with another tag -> FAIL unless strict < normal
/* Walk every tag table of the output format; the table list ends with a
 * NULL entry and each table ends with an AV_CODEC_ID_NONE entry. */
116 for (n = 0; s->oformat->codec_tag[n]; n++) {
117 avctag = s->oformat->codec_tag[n];
118 while (avctag->id != AV_CODEC_ID_NONE) {
/* Both tags go through avpriv_toupper4() before being compared
 * (presumably making the comparison case-insensitive -- confirm). */
119 if (avpriv_toupper4(avctag->tag) == avpriv_toupper4(st->codec->codec_tag)) {
121 if (id == st->codec->codec_id)
124 if (avctag->id == st->codec->codec_id)
/* After the scan: an id was recorded for the stream's tag. */
129 if (id != AV_CODEC_ID_NONE)
/* A tag was recorded for the stream's codec id; only acted upon at normal or
 * stricter standards compliance. */
131 if (tag && (st->codec->strict_std_compliance >= FF_COMPLIANCE_NORMAL))
/* Prepare the muxing context s before the header is written.
 *
 * Visible steps: copy the caller's options into a temporary dictionary and
 * apply them to s; sanity-check every stream (audio sample rate, video time
 * base, dimensions, aspect ratio); validate or assign the codec tag; warn
 * when the container wants global headers but the codec does not provide
 * them; allocate the muxer private data and apply the remaining options to
 * it; set the "encoder" metadata entry unless the first stream requests
 * bit-exact output; finally free the caller's options dictionary.
 *
 * On the visible failure paths ret is set to a negative AVERROR code. */
137 static int init_muxer(AVFormatContext *s, AVDictionary **options)
141 AVDictionary *tmp = NULL;
142 AVCodecContext *codec = NULL;
143 AVOutputFormat *of = s->oformat;
146 av_dict_copy(&tmp, *options, 0);
148 if ((ret = av_opt_set_dict(s, &tmp)) < 0)
151 // some sanity checks
152 if (s->nb_streams == 0 && !(of->flags & AVFMT_NOSTREAMS)) {
153 av_log(s, AV_LOG_ERROR, "no streams\n");
154 ret = AVERROR(EINVAL);
158 for (i = 0; i < s->nb_streams; i++) {
162 switch (codec->codec_type) {
163 case AVMEDIA_TYPE_AUDIO:
164 if (codec->sample_rate <= 0) {
165 av_log(s, AV_LOG_ERROR, "sample rate not set\n");
166 ret = AVERROR(EINVAL);
/* Derive a default block_align from channel count and bits per sample
 * (the product is converted from bits to bytes by the >> 3). */
169 if (!codec->block_align)
170 codec->block_align = codec->channels *
171 av_get_bits_per_sample(codec->codec_id) >> 3;
173 case AVMEDIA_TYPE_VIDEO:
174 if (codec->time_base.num <= 0 ||
175 codec->time_base.den <= 0) { //FIXME audio too?
176 av_log(s, AV_LOG_ERROR, "time base not set\n");
177 ret = AVERROR(EINVAL);
181 if ((codec->width <= 0 || codec->height <= 0) &&
182 !(of->flags & AVFMT_NODIMENSIONS)) {
183 av_log(s, AV_LOG_ERROR, "dimensions not set\n");
184 ret = AVERROR(EINVAL);
/* Only report an aspect ratio mismatch when BOTH ratios are actually set,
 * i.e. all four terms are non-zero. The codec numerator is tested here; the
 * denominator used to be tested twice, which rejected streams whose codec
 * ratio was simply left unset (0/den). */
188 if (av_cmp_q(st->sample_aspect_ratio,
189 codec->sample_aspect_ratio)) {
190 if (st->sample_aspect_ratio.num != 0 &&
191 st->sample_aspect_ratio.den != 0 &&
192 codec->sample_aspect_ratio.num != 0 &&
193 codec->sample_aspect_ratio.den != 0) {
194 av_log(s, AV_LOG_ERROR, "Aspect ratio mismatch between muxer "
195 "(%d/%d) and encoder layer (%d/%d)\n",
196 st->sample_aspect_ratio.num, st->sample_aspect_ratio.den,
197 codec->sample_aspect_ratio.num,
198 codec->sample_aspect_ratio.den);
199 ret = AVERROR(EINVAL);
/* Codec tag handling only applies to formats that provide tag tables
 * (NOTE(review): the enclosing condition is not visible here). */
207 if (codec->codec_tag &&
208 codec->codec_id == AV_CODEC_ID_RAWVIDEO &&
209 !av_codec_get_tag(of->codec_tag, codec->codec_id) &&
210 !validate_codec_tag(s, st)) {
211 // the current rawvideo encoding system ends up setting
212 // the wrong codec_tag for avi, we override it here
213 codec->codec_tag = 0;
/* A tag supplied by the caller must validate against the format's tables;
 * when no tag is set, one is looked up from the codec id. */
215 if (codec->codec_tag) {
216 if (!validate_codec_tag(s, st)) {
218 av_get_codec_tag_string(tagbuf, sizeof(tagbuf), codec->codec_tag);
219 av_log(s, AV_LOG_ERROR,
220 "Tag %s/0x%08x incompatible with output codec id '%d'\n",
221 tagbuf, codec->codec_tag, codec->codec_id);
222 ret = AVERROR_INVALIDDATA;
226 codec->codec_tag = av_codec_get_tag(of->codec_tag, codec->codec_id);
/* Warning only: the missing global header is not treated as an error here. */
229 if (of->flags & AVFMT_GLOBALHEADER &&
230 !(codec->flags & CODEC_FLAG_GLOBAL_HEADER))
231 av_log(s, AV_LOG_WARNING,
232 "Codec for stream %d does not use global headers "
233 "but container format requires global headers\n", i);
/* Allocate zeroed muxer private data if the caller has not provided any. */
236 if (!s->priv_data && of->priv_data_size > 0) {
237 s->priv_data = av_mallocz(of->priv_data_size);
239 ret = AVERROR(ENOMEM);
/* The private data starts with an AVClass pointer so that the option API
 * can be used on it; defaults are set first, then the leftover options. */
242 if (of->priv_class) {
243 *(const AVClass **)s->priv_data = of->priv_class;
244 av_opt_set_defaults(s->priv_data);
245 if ((ret = av_opt_set_dict(s->priv_data, &tmp)) < 0)
250 /* set muxer identification string */
251 if (s->nb_streams && !(s->streams[0]->codec->flags & CODEC_FLAG_BITEXACT)) {
252 av_dict_set(&s->metadata, "encoder", LIBAVFORMAT_IDENT, 0);
256 av_dict_free(options);
/* Initialize the per-stream pts fraction (st->pts) used for timestamp
 * generation. Returns AVERROR_INVALIDDATA on the visible failure path. */
267 static int init_pts(AVFormatContext *s)
272 /* init PTS generation */
273 for (i = 0; i < s->nb_streams; i++) {
/* AV_NOPTS_VALUE marks "no denominator chosen" for other stream types. */
274 int64_t den = AV_NOPTS_VALUE;
277 switch (st->codec->codec_type) {
278 case AVMEDIA_TYPE_AUDIO:
/* Audio: denominator is time_base.num times the sample rate. */
279 den = (int64_t)st->time_base.num * st->codec->sample_rate;
281 case AVMEDIA_TYPE_VIDEO:
/* Video: denominator is time_base.num times the codec time base denominator. */
282 den = (int64_t)st->time_base.num * st->codec->time_base.den;
287 if (den != AV_NOPTS_VALUE) {
289 return AVERROR_INVALIDDATA;
/* Start the fraction at value 0 with a zero numerator. */
291 frac_init(&st->pts, 0, 0, den);
/* Initialize the muxer with the given options, call the output format's
 * write_header callback if it has one, then initialize pts generation. */
298 int avformat_write_header(AVFormatContext *s, AVDictionary **options)
/* Explicit comparison instead of a bare assignment used as a condition;
 * any non-zero result from init_muxer() is still treated as failure. */
302 if ((ret = init_muxer(s, options)) != 0)
305 if (s->oformat->write_header) {
306 ret = s->oformat->write_header(s);
311 if ((ret = init_pts(s)) < 0)
317 //FIXME merge with compute_pkt_fields
/* Fill in or validate the timing fields (duration, pts, dts) of pkt for
 * stream st before it is written, and advance the stream's running
 * timestamp state (st->cur_dts, st->pts).
 * Returns AVERROR(EINVAL) when dts is not increasing as required or when
 * pts < dts. */
318 static int compute_pkt_fields2(AVFormatContext *s, AVStream *st, AVPacket *pkt)
/* Reordering delay: has_b_frames, or at least 1 when max_b_frames is set. */
320 int delay = FFMAX(st->codec->has_b_frames, !!st->codec->max_b_frames);
321 int num, den, frame_size, i;
323 av_dlog(s, "compute_pkt_fields2: pts:%" PRId64 " dts:%" PRId64 " cur_dts:%" PRId64 " b:%d size:%d st:%d\n",
324 pkt->pts, pkt->dts, st->cur_dts, delay, pkt->size, pkt->stream_index);
326 /* if(pkt->pts == AV_NOPTS_VALUE && pkt->dts == AV_NOPTS_VALUE)
327 * return AVERROR(EINVAL);*/
/* A zero duration is computed from the frame duration reported by
 * ff_compute_frame_duration(), rescaled with the stream time base and the
 * codec's ticks_per_frame. */
330 if (pkt->duration == 0) {
331 ff_compute_frame_duration(&num, &den, st, NULL, pkt);
333 pkt->duration = av_rescale(1, num * (int64_t)st->time_base.den * st->codec->ticks_per_frame, den * (int64_t)st->time_base.num);
/* Case: pts missing, dts present, no reordering delay. */
337 if (pkt->pts == AV_NOPTS_VALUE && pkt->dts != AV_NOPTS_VALUE && delay == 0)
340 //XXX/FIXME this is a temporary hack until all encoders output pts
341 if ((pkt->pts == 0 || pkt->pts == AV_NOPTS_VALUE) && pkt->dts == AV_NOPTS_VALUE && !delay) {
343 // pkt->pts= st->cur_dts;
344 pkt->pts = st->pts.val;
347 //calculate dts from pts
/* The new pts goes into slot 0 of pts_buffer, unset slots are seeded with
 * values extrapolated backwards by whole durations, and the new value is
 * moved up past smaller neighbours so that slot 0 ends up holding the
 * smallest pending pts, which becomes the dts. */
348 if (pkt->pts != AV_NOPTS_VALUE && pkt->dts == AV_NOPTS_VALUE && delay <= MAX_REORDER_DELAY) {
349 st->pts_buffer[0] = pkt->pts;
350 for (i = 1; i < delay + 1 && st->pts_buffer[i] == AV_NOPTS_VALUE; i++)
351 st->pts_buffer[i] = pkt->pts + (i - delay - 1) * pkt->duration;
352 for (i = 0; i<delay && st->pts_buffer[i] > st->pts_buffer[i + 1]; i++)
353 FFSWAP(int64_t, st->pts_buffer[i], st->pts_buffer[i + 1]);
355 pkt->dts = st->pts_buffer[0];
/* dts must be strictly increasing, or merely non-decreasing when the format
 * sets AVFMT_TS_NONSTRICT. The check is skipped while cur_dts is 0 or unset. */
358 if (st->cur_dts && st->cur_dts != AV_NOPTS_VALUE &&
359 ((!(s->oformat->flags & AVFMT_TS_NONSTRICT) &&
360 st->cur_dts >= pkt->dts) || st->cur_dts > pkt->dts)) {
361 av_log(s, AV_LOG_ERROR,
362 "Application provided invalid, non monotonically increasing dts to muxer in stream %d: %" PRId64 " >= %" PRId64 "\n",
363 st->index, st->cur_dts, pkt->dts);
364 return AVERROR(EINVAL);
366 if (pkt->dts != AV_NOPTS_VALUE && pkt->pts != AV_NOPTS_VALUE && pkt->pts < pkt->dts) {
367 av_log(s, AV_LOG_ERROR, "pts < dts in stream %d\n", st->index);
368 return AVERROR(EINVAL);
371 av_dlog(s, "av_write_frame: pts2:%"PRId64" dts2:%"PRId64"\n",
/* Remember the dts of this packet as the stream's current position. */
373 st->cur_dts = pkt->dts;
374 st->pts.val = pkt->dts;
/* Advance the running pts fraction by the length of this packet. */
377 switch (st->codec->codec_type) {
378 case AVMEDIA_TYPE_AUDIO:
379 frame_size = ff_get_audio_frame_size(st->codec, pkt->size, 1);
381 /* HACK/FIXME, we skip the initial 0 size packets as they are most
382 * likely equal to the encoder delay, but it would be better if we
383 * had the real timestamps from the encoder */
384 if (frame_size >= 0 && (pkt->size || st->pts.num != st->pts.den >> 1 || st->pts.val)) {
385 frac_add(&st->pts, (int64_t)st->time_base.den * frame_size);
388 case AVMEDIA_TYPE_VIDEO:
389 frac_add(&st->pts, (int64_t)st->time_base.den * st->codec->time_base.num);
398 * FIXME: this function should NEVER receive undefined pts/dts except when
399 * AVFMT_NOTIMESTAMPS is set.
400 * These additional safety checks should be dropped once the correct checks
401 * are in place in the callers.
/* Hand pkt to the output format's write_packet callback, after the
 * timestamp offset handling below for formats that neither accept negative
 * timestamps nor ignore timestamps altogether.
 * Returns the callback's result. */
404 static int write_packet(AVFormatContext *s, AVPacket *pkt)
406 if (!(s->oformat->flags & (AVFMT_TS_NEGATIVE | AVFMT_NOTIMESTAMPS))) {
407 AVRational time_base = s->streams[pkt->stream_index]->time_base;
/* The first negative dts seen (while s->offset is still 0) defines the
 * offset, which is stored together with the time base it is expressed in. */
410 if (!s->offset && pkt->dts != AV_NOPTS_VALUE && pkt->dts < 0) {
411 s->offset = -pkt->dts;
412 s->offset_timebase = time_base;
/* Convert the stored offset into the time base of this packet's stream. */
415 offset = av_rescale_q(s->offset, s->offset_timebase, time_base);
/* Only timestamps that are actually set are adjusted. */
417 if (pkt->dts != AV_NOPTS_VALUE)
419 if (pkt->pts != AV_NOPTS_VALUE)
422 return s->oformat->write_packet(s, pkt);
/* Write one packet to the output without interleaving: compute its timing
 * fields, pass it to write_packet() and count the frame on its stream. */
425 int av_write_frame(AVFormatContext *s, AVPacket *pkt)
/* Formats flagged AVFMT_ALLOW_FLUSH get pkt passed straight to their
 * write_packet callback (NOTE(review): the enclosing condition is not
 * visible here -- presumably the pkt == NULL flush request). */
430 if (s->oformat->flags & AVFMT_ALLOW_FLUSH)
431 return s->oformat->write_packet(s, pkt);
435 ret = compute_pkt_fields2(s, s->streams[pkt->stream_index], pkt);
/* Timing errors are ignored for formats that do not use timestamps. */
437 if (ret < 0 && !(s->oformat->flags & AVFMT_NOTIMESTAMPS))
440 ret = write_packet(s, pkt);
443 s->streams[pkt->stream_index]->nb_frames++;
447 void ff_interleave_add_packet(AVFormatContext *s, AVPacket *pkt,
448 int (*compare)(AVFormatContext *, AVPacket *, AVPacket *))
450 AVPacketList **next_point, *this_pktl;
452 this_pktl = av_mallocz(sizeof(AVPacketList));
453 this_pktl->pkt = *pkt;
454 #if FF_API_DESTRUCT_PACKET
455 pkt->destruct = NULL; // do not free original but only the copy
458 av_dup_packet(&this_pktl->pkt); // duplicate the packet if it uses non-alloced memory
460 if (s->streams[pkt->stream_index]->last_in_packet_buffer) {
461 next_point = &(s->streams[pkt->stream_index]->last_in_packet_buffer->next);
463 next_point = &s->packet_buffer;
466 if (compare(s, &s->packet_buffer_end->pkt, pkt)) {
467 while (!compare(s, &(*next_point)->pkt, pkt))
468 next_point = &(*next_point)->next;
471 next_point = &(s->packet_buffer_end->next);
474 assert(!*next_point);
476 s->packet_buffer_end = this_pktl;
479 this_pktl->next = *next_point;
481 s->streams[pkt->stream_index]->last_in_packet_buffer =
482 *next_point = this_pktl;
/* Ordering callback for the interleaving queue: compares the dts of two
 * packets, each in the time base of its own stream. */
485 static int interleave_compare_dts(AVFormatContext *s, AVPacket *next,
488 AVStream *st = s->streams[pkt->stream_index];
489 AVStream *st2 = s->streams[next->stream_index];
490 int comp = av_compare_ts(next->dts, st2->time_base, pkt->dts,
/* This return orders the packets by stream index (NOTE(review): presumably
 * the tie-break for equal timestamps; the guarding condition is not visible). */
494 return pkt->stream_index < next->stream_index;
/* Default interleaver: queue pkt ordered by dts and pop the head of the
 * queue into out once every stream has a packet queued, or when flush is
 * set and at least one stream has a packet queued. */
498 int ff_interleave_packet_per_dts(AVFormatContext *s, AVPacket *out,
499 AVPacket *pkt, int flush)
502 int stream_count = 0;
506 ff_interleave_add_packet(s, pkt, interleave_compare_dts);
/* Count the streams that currently have a packet in the queue. */
509 for (i = 0; i < s->nb_streams; i++)
510 stream_count += !!s->streams[i]->last_in_packet_buffer;
512 if (stream_count && (s->nb_streams == stream_count || flush)) {
513 pktl = s->packet_buffer;
/* Unlink the head entry; clear the tail pointer when the queue is empty. */
516 s->packet_buffer = pktl->next;
517 if (!s->packet_buffer)
518 s->packet_buffer_end = NULL;
/* If the removed entry was the last one queued for its stream, that stream
 * no longer has anything in the queue. */
520 if (s->streams[out->stream_index]->last_in_packet_buffer == pktl)
521 s->streams[out->stream_index]->last_in_packet_buffer = NULL;
531 * Interleave an AVPacket correctly so it can be muxed.
532 * @param out the interleaved packet will be output here
533 * @param in the input packet
534 * @param flush 1 if no further packets are available as input and all
535 * remaining packets should be output
536 * @return 1 if a packet was output, 0 if no packet could be output,
537 * < 0 if an error occurred
/* Dispatch to the output format's own interleave_packet callback when it
 * has one, otherwise use the default dts-based interleaver. */
539 static int interleave_packet(AVFormatContext *s, AVPacket *out, AVPacket *in, int flush)
541 if (s->oformat->interleave_packet) {
542 int ret = s->oformat->interleave_packet(s, out, in, flush);
547 return ff_interleave_packet_per_dts(s, out, in, flush);
/* Write a packet through the interleaver: compute its timing fields, feed
 * it to interleave_packet() and write out every packet the interleaver
 * releases. Returns AVERROR(EINVAL) when the packet still has no dts and
 * the format uses timestamps. */
550 int av_interleaved_write_frame(AVFormatContext *s, AVPacket *pkt)
555 AVStream *st = s->streams[pkt->stream_index];
557 //FIXME/XXX/HACK drop zero sized packets
558 if (st->codec->codec_type == AVMEDIA_TYPE_AUDIO && pkt->size == 0)
561 av_dlog(s, "av_interleaved_write_frame size:%d dts:%" PRId64 " pts:%" PRId64 "\n",
562 pkt->size, pkt->dts, pkt->pts);
/* Timing errors are ignored for formats that do not use timestamps. */
563 if ((ret = compute_pkt_fields2(s, st, pkt)) < 0 && !(s->oformat->flags & AVFMT_NOTIMESTAMPS))
566 if (pkt->dts == AV_NOPTS_VALUE && !(s->oformat->flags & AVFMT_NOTIMESTAMPS))
567 return AVERROR(EINVAL);
569 av_dlog(s, "av_interleaved_write_frame FLUSH\n");
/* A result <= 0 from the interleaver means no packet was released (or an
 * error occurred); a released packet is written, counted and freed. */
575 int ret = interleave_packet(s, &opkt, pkt, flush);
576 if (ret <= 0) //FIXME cleanup needed for ret<0 ?
579 ret = write_packet(s, &opkt);
581 s->streams[opkt.stream_index]->nb_frames++;
583 av_free_packet(&opkt);
/* Finish muxing: flush the packets still held by the interleaver, call the
 * output format's write_trailer callback if present, and free per-stream and
 * muxer private data. */
591 int av_write_trailer(AVFormatContext *s)
/* Flush mode (flush = 1, no input packet): drain the interleaving queue. */
597 ret = interleave_packet(s, &pkt, NULL, 1);
598 if (ret < 0) //FIXME cleanup needed for ret<0 ?
603 ret = write_packet(s, &pkt);
605 s->streams[pkt.stream_index]->nb_frames++;
607 av_free_packet(&pkt);
613 if (s->oformat->write_trailer)
614 ret = s->oformat->write_trailer(s);
616 if (!(s->oformat->flags & AVFMT_NOFILE))
/* Release per-stream private data and index entries. */
620 for (i = 0; i < s->nb_streams; i++) {
621 av_freep(&s->streams[i]->priv_data);
622 av_freep(&s->streams[i]->index_entries);
/* Free option values stored in the private data before freeing it. */
624 if (s->oformat->priv_class)
625 av_opt_free(s->priv_data);
626 av_freep(&s->priv_data);
/* Write pkt, which belongs to a stream of src, to stream dst_stream of dst.
 * The stream index is replaced and set pts/dts values are rescaled from the
 * source stream's time base to the destination stream's time base.
 * Returns the result of av_write_frame(). */
630 int ff_write_chained(AVFormatContext *dst, int dst_stream, AVPacket *pkt,
631 AVFormatContext *src)
/* NOTE(review): local_pkt is presumably initialized as a copy of *pkt on a
 * line not visible here -- confirm. */
636 local_pkt.stream_index = dst_stream;
637 if (pkt->pts != AV_NOPTS_VALUE)
638 local_pkt.pts = av_rescale_q(pkt->pts,
639 src->streams[pkt->stream_index]->time_base,
640 dst->streams[dst_stream]->time_base);
641 if (pkt->dts != AV_NOPTS_VALUE)
642 local_pkt.dts = av_rescale_q(pkt->dts,
643 src->streams[pkt->stream_index]->time_base,
644 dst->streams[dst_stream]->time_base);
645 return av_write_frame(dst, &local_pkt);