3 * Copyright (c) 2003 The FFmpeg Project
5 * This demuxer will generate a 1 byte extradata for VP6F content.
7 * - upper 4bits: difference between encoded width and visible width
8 * - lower 4bits: difference between encoded height and visible height
10 * This file is part of FFmpeg.
12 * FFmpeg is free software; you can redistribute it and/or
13 * modify it under the terms of the GNU Lesser General Public
14 * License as published by the Free Software Foundation; either
15 * version 2.1 of the License, or (at your option) any later version.
17 * FFmpeg is distributed in the hope that it will be useful,
18 * but WITHOUT ANY WARRANTY; without even the implied warranty of
19 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
20 * Lesser General Public License for more details.
22 * You should have received a copy of the GNU Lesser General Public
23 * License along with FFmpeg; if not, write to the Free Software
24 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
27 #include "libavutil/avstring.h"
28 #include "libavutil/channel_layout.h"
29 #include "libavutil/dict.h"
30 #include "libavutil/opt.h"
31 #include "libavutil/intfloat.h"
32 #include "libavutil/mathematics.h"
33 #include "libavcodec/bytestream.h"
34 #include "libavcodec/mpeg4audio.h"
37 #include "avio_internal.h"
/* Largest absolute difference tolerated between the dts read from a tag and
 * the dts stored for the same file position in the keyframe index; beyond
 * this the index is cleared (see the validation step in flv_read_packet()).
 * NOTE(review): presumably in milliseconds, matching the 1/1000 stream time
 * base set in create_stream() -- confirm. */
40 #define VALIDATE_INDEX_TS_THRESH 2500
/* Private demuxer state (both demuxers below use sizeof(FLVContext) as their
 * priv_data_size). Only the first fields are visible in this excerpt. */
42 typedef struct FLVContext {
43 const AVClass *class; ///< Class for private options.
44 int trust_metadata; ///< configure streams according to onMetaData
45 int wrong_dts; ///< wrong dts due to negative cts
/* Extradata queued per stream type by flv_queue_extradata() until
 * flv_read_packet() attaches it to a packet as side data. */
46 uint8_t *new_extradata[FLV_STREAM_TYPE_NB];
47 int new_extradata_size[FLV_STREAM_TYPE_NB];
/*
 * Probe helper; only part of its body is visible in this excerpt.
 *
 * p    - probe data; p->buf is inspected directly.
 * live - NOTE(review): presumably selects which demuxer variant is being
 *        probed; its use is not visible here -- confirm.
 *
 * Returns AVPROBE_SCORE_MAX on the visible success path.
 */
59 static int probe(AVProbeData *p, int live)
61 const uint8_t *d = p->buf;
/* 32-bit big-endian value starting at byte 5 of the probe buffer. */
62 unsigned offset = AV_RB32(d + 5);
/* Byte 3 must be below 5 and byte 5 must be zero. */
67 d[3] < 5 && d[5] == 0 &&
/* Keeps the bytes compared below (offset + 40 .. offset + 49) inside the buffer. */
68 offset + 100 < p->buf_size &&
/* Non-zero when the 10 bytes at offset + 40 equal "NGINX RTMP". */
70 int is_live = !memcmp(d + offset + 40, "NGINX RTMP", 10);
73 return AVPROBE_SCORE_MAX;
/* Probe callback installed as .read_probe of ff_flv_demuxer.
 * The body is not visible in this excerpt. */
78 static int flv_probe(AVProbeData *p)
/* Probe callback installed as .read_probe of ff_live_flv_demuxer.
 * The body is not visible in this excerpt. */
83 static int live_flv_probe(AVProbeData *p)
/*
 * Add a new stream of the given media type to the format context.
 *
 * s          - format context receiving the stream.
 * codec_type - media type stored in the new stream's codec context.
 *
 * Callers in this file treat a NULL result as an allocation failure.
 */
88 static AVStream *create_stream(AVFormatContext *s, int codec_type)
90 AVStream *st = avformat_new_stream(s, NULL);
93 st->codec->codec_type = codec_type;
/* AVFMTCTX_NOHEADER is cleared once three streams exist, or once two
 * streams exist and neither of the first two is a subtitle stream. */
94 if (s->nb_streams>=3 ||( s->nb_streams==2
95 && s->streams[0]->codec->codec_type != AVMEDIA_TYPE_SUBTITLE
96 && s->streams[1]->codec->codec_type != AVMEDIA_TYPE_SUBTITLE))
97 s->ctx_flags &= ~AVFMTCTX_NOHEADER;
99 avpriv_set_pts_info(st, 32, 1, 1000); /* 32 bit pts in ms */
/*
 * Check whether the audio flags byte of a tag is compatible with the codec
 * parameters already stored in a stream's codec context.
 *
 * acodec - codec context of the candidate audio stream.
 * flags  - audio flags byte read from the tag.
 *
 * The visible return statements yield non-zero on a match and zero otherwise.
 */
103 static int flv_same_audio_codec(AVCodecContext *acodec, int flags)
/* Sample size and codec id are decoded from the flags byte. */
105 int bits_per_coded_sample = (flags & FLV_AUDIO_SAMPLESIZE_MASK) ? 16 : 8;
106 int flv_codecid = flags & FLV_AUDIO_CODECID_MASK;
/* Codec context with neither codec_id nor codec_tag set; the statement
 * guarded by this test is not visible in this excerpt. */
109 if (!acodec->codec_id && !acodec->codec_tag)
/* Sample size mismatch; the guarded statement is not visible in this excerpt. */
112 if (acodec->bits_per_coded_sample != bits_per_coded_sample)
115 switch (flv_codecid) {
116 // no distinction between S16 and S8 PCM codec flags
117 case FLV_CODECID_PCM:
118 codec_id = bits_per_coded_sample == 8
/* NOTE(review): the two 16-bit alternatives below are presumably selected by
 * a preprocessor endianness check that is not visible here -- confirm. */
121 : AV_CODEC_ID_PCM_S16BE;
123 : AV_CODEC_ID_PCM_S16LE;
125 return codec_id == acodec->codec_id;
126 case FLV_CODECID_PCM_LE:
127 codec_id = bits_per_coded_sample == 8
129 : AV_CODEC_ID_PCM_S16LE;
130 return codec_id == acodec->codec_id;
131 case FLV_CODECID_AAC:
132 return acodec->codec_id == AV_CODEC_ID_AAC;
133 case FLV_CODECID_ADPCM:
134 return acodec->codec_id == AV_CODEC_ID_ADPCM_SWF;
135 case FLV_CODECID_SPEEX:
136 return acodec->codec_id == AV_CODEC_ID_SPEEX;
137 case FLV_CODECID_MP3:
138 return acodec->codec_id == AV_CODEC_ID_MP3;
/* All three Nellymoser variants map to the same codec id. */
139 case FLV_CODECID_NELLYMOSER_8KHZ_MONO:
140 case FLV_CODECID_NELLYMOSER_16KHZ_MONO:
141 case FLV_CODECID_NELLYMOSER:
142 return acodec->codec_id == AV_CODEC_ID_NELLYMOSER;
/* mu-law and A-law only match when the stream's sample rate is 8000. */
143 case FLV_CODECID_PCM_MULAW:
144 return acodec->sample_rate == 8000 &&
145 acodec->codec_id == AV_CODEC_ID_PCM_MULAW;
146 case FLV_CODECID_PCM_ALAW:
147 return acodec->sample_rate == 8000 &&
148 acodec->codec_id == AV_CODEC_ID_PCM_ALAW;
/* Remaining ids (presumably the default label, not visible here) are compared
 * against codec_tag, which flv_set_audio_codec() fills with the shifted id. */
150 return acodec->codec_tag == (flv_codecid >> FLV_AUDIO_CODECID_OFFSET);
/*
 * Fill in an audio codec context from an FLV audio codec id.
 *
 * s           - format context, used for the unsupported-codec sample request.
 * astream     - stream owning the codec; only its need_parsing field is
 *               written here (MP3 case).
 * acodec      - codec context to update; bits_per_coded_sample is read to
 *               choose between the PCM variants.
 * flv_codecid - codec id still in its masked, unshifted position (it is
 *               shifted by FLV_AUDIO_CODECID_OFFSET before being stored as tag).
 */
154 static void flv_set_audio_codec(AVFormatContext *s, AVStream *astream,
155 AVCodecContext *acodec, int flv_codecid)
157 switch (flv_codecid) {
158 // no distinction between S16 and S8 PCM codec flags
159 case FLV_CODECID_PCM:
160 acodec->codec_id = acodec->bits_per_coded_sample == 8
/* NOTE(review): the two 16-bit alternatives below are presumably selected by
 * a preprocessor endianness check that is not visible here -- confirm. */
163 : AV_CODEC_ID_PCM_S16BE;
165 : AV_CODEC_ID_PCM_S16LE;
168 case FLV_CODECID_PCM_LE:
169 acodec->codec_id = acodec->bits_per_coded_sample == 8
171 : AV_CODEC_ID_PCM_S16LE;
173 case FLV_CODECID_AAC:
174 acodec->codec_id = AV_CODEC_ID_AAC;
176 case FLV_CODECID_ADPCM:
177 acodec->codec_id = AV_CODEC_ID_ADPCM_SWF;
/* Speex overrides the sample rate with a fixed 16000. */
179 case FLV_CODECID_SPEEX:
180 acodec->codec_id = AV_CODEC_ID_SPEEX;
181 acodec->sample_rate = 16000;
/* MP3 additionally requests full parsing on the stream. */
183 case FLV_CODECID_MP3:
184 acodec->codec_id = AV_CODEC_ID_MP3;
185 astream->need_parsing = AVSTREAM_PARSE_FULL;
187 case FLV_CODECID_NELLYMOSER_8KHZ_MONO:
188 // in case metadata does not otherwise declare samplerate
189 acodec->sample_rate = 8000;
190 acodec->codec_id = AV_CODEC_ID_NELLYMOSER;
192 case FLV_CODECID_NELLYMOSER_16KHZ_MONO:
193 acodec->sample_rate = 16000;
194 acodec->codec_id = AV_CODEC_ID_NELLYMOSER;
196 case FLV_CODECID_NELLYMOSER:
197 acodec->codec_id = AV_CODEC_ID_NELLYMOSER;
/* mu-law and A-law force the sample rate to 8000. */
199 case FLV_CODECID_PCM_MULAW:
200 acodec->sample_rate = 8000;
201 acodec->codec_id = AV_CODEC_ID_PCM_MULAW;
203 case FLV_CODECID_PCM_ALAW:
204 acodec->sample_rate = 8000;
205 acodec->codec_id = AV_CODEC_ID_PCM_ALAW;
/* Remaining ids (presumably the default label, not visible here): request a
 * sample and remember the shifted id in codec_tag. */
208 avpriv_request_sample(s, "Audio codec (%x)",
209 flv_codecid >> FLV_AUDIO_CODECID_OFFSET);
210 acodec->codec_tag = flv_codecid >> FLV_AUDIO_CODECID_OFFSET;
/*
 * Check whether the video flags byte of a tag is compatible with the codec
 * already stored in a stream's codec context.
 *
 * vcodec - codec context of the candidate video stream.
 * flags  - video flags byte read from the tag.
 *
 * The visible return statements yield non-zero on a match and zero otherwise.
 */
214 static int flv_same_video_codec(AVCodecContext *vcodec, int flags)
216 int flv_codecid = flags & FLV_VIDEO_CODECID_MASK;
/* Codec context with neither codec_id nor codec_tag set; the statement
 * guarded by this test is not visible in this excerpt. */
218 if (!vcodec->codec_id && !vcodec->codec_tag)
221 switch (flv_codecid) {
222 case FLV_CODECID_H263:
223 return vcodec->codec_id == AV_CODEC_ID_FLV1;
224 case FLV_CODECID_SCREEN:
225 return vcodec->codec_id == AV_CODEC_ID_FLASHSV;
226 case FLV_CODECID_SCREEN2:
227 return vcodec->codec_id == AV_CODEC_ID_FLASHSV2;
228 case FLV_CODECID_VP6:
229 return vcodec->codec_id == AV_CODEC_ID_VP6F;
230 case FLV_CODECID_VP6A:
231 return vcodec->codec_id == AV_CODEC_ID_VP6A;
232 case FLV_CODECID_H264:
233 return vcodec->codec_id == AV_CODEC_ID_H264;
/* Remaining ids (presumably the default label, not visible here) are compared
 * against codec_tag, which flv_set_video_codec() fills with the raw id. */
235 return vcodec->codec_tag == flv_codecid;
/*
 * Fill in a video stream's codec context from an FLV video codec id.
 *
 * s           - format context; s->pb is read for the VP6 extradata byte.
 * vstream     - stream to update.
 * flv_codecid - FLV video codec id.
 * read        - NOTE(review): its use is not visible in this excerpt;
 *               presumably tells whether the body byte may be consumed from
 *               s->pb -- confirm.
 *
 * The visible return statements give the number of body bytes the caller
 * must subtract from the packet size: 1 for VP6/VP6A, 3 for H.264.
 */
239 static int flv_set_video_codec(AVFormatContext *s, AVStream *vstream,
240 int flv_codecid, int read)
242 AVCodecContext *vcodec = vstream->codec;
243 switch (flv_codecid) {
244 case FLV_CODECID_H263:
245 vcodec->codec_id = AV_CODEC_ID_FLV1;
247 case FLV_CODECID_REALH263:
248 vcodec->codec_id = AV_CODEC_ID_H263;
249 break; // Really mean it this time
250 case FLV_CODECID_SCREEN:
251 vcodec->codec_id = AV_CODEC_ID_FLASHSV;
253 case FLV_CODECID_SCREEN2:
254 vcodec->codec_id = AV_CODEC_ID_FLASHSV2;
/* VP6 falls through into the VP6A case so both share the extradata
 * handling; the id is only overwritten when the tag really is VP6A. */
256 case FLV_CODECID_VP6:
257 vcodec->codec_id = AV_CODEC_ID_VP6F;
258 case FLV_CODECID_VP6A:
259 if (flv_codecid == FLV_CODECID_VP6A)
260 vcodec->codec_id = AV_CODEC_ID_VP6A;
/* Ensure a 1-byte extradata buffer exists, then store one byte read from the
 * stream in it (the size-adjustment byte described in the file header). */
262 if (vcodec->extradata_size != 1) {
263 ff_alloc_extradata(vcodec, 1);
265 if (vcodec->extradata)
266 vcodec->extradata[0] = avio_r8(s->pb);
270 return 1; // 1 byte body size adjustment for flv_read_packet()
271 case FLV_CODECID_H264:
272 vcodec->codec_id = AV_CODEC_ID_H264;
273 vstream->need_parsing = AVSTREAM_PARSE_HEADERS;
274 return 3; // not 4, reading packet type will consume one byte
275 case FLV_CODECID_MPEG4:
276 vcodec->codec_id = AV_CODEC_ID_MPEG4;
/* Remaining ids (presumably the default label, not visible here): request a
 * sample and remember the raw id in codec_tag. */
279 avpriv_request_sample(s, "Video codec (%x)", flv_codecid);
280 vcodec->codec_tag = flv_codecid;
/*
 * Read a string with a 16-bit big-endian length prefix into a caller buffer.
 *
 * ioc      - I/O context positioned at the length prefix.
 * buffer   - destination; NUL-terminated after the read.
 * buffsize - capacity of buffer in bytes.
 *
 * A string that would not fit together with its terminator is skipped
 * instead of being read. Callers in this file treat a negative result as
 * failure and a positive one as a usable string; the return statements
 * themselves are not visible in this excerpt.
 */
286 static int amf_get_string(AVIOContext *ioc, char *buffer, int buffsize)
288 int length = avio_rb16(ioc);
289 if (length >= buffsize) {
290 avio_skip(ioc, length);
/* NOTE(review): the result of avio_read() is not checked here, so a short
 * read is not detected by the visible code. */
294 avio_read(ioc, buffer, length);
296 buffer[length] = '\0';
/*
 * Parse the "keyframes" metadata object into index entries for a stream.
 *
 * s       - format context; its private FLVContext receives validation data.
 * ioc     - I/O context positioned inside the keyframes object.
 * vstream - stream that receives the index entries.
 * max_pos - byte position bounding all reads; also compared against the
 *           first file position before the index is accepted.
 *
 * The read position is restored to where it was on entry before returning.
 * ret starts as AVERROR(ENOSYS) and becomes AVERROR(ENOMEM) on allocation
 * failure; the final return statement is not visible in this excerpt.
 */
301 static int parse_keyframes_index(AVFormatContext *s, AVIOContext *ioc,
302 AVStream *vstream, int64_t max_pos)
304 FLVContext *flv = s->priv_data;
305 unsigned int timeslen = 0, fileposlen = 0, i;
307 int64_t *times = NULL;
308 int64_t *filepositions = NULL;
309 int ret = AVERROR(ENOSYS);
310 int64_t initial_pos = avio_tell(ioc);
/* An index that already has entries is not parsed a second time. */
312 if (vstream->nb_index_entries>0) {
313 av_log(s, AV_LOG_WARNING, "Skipping duplicate index\n");
/* Honour the user's request to ignore indexes. */
317 if (s->flags & AVFMT_FLAG_IGNIDX)
/* Each iteration reads one named array of the keyframes object. */
320 while (avio_tell(ioc) < max_pos - 2 &&
321 amf_get_string(ioc, str_val, sizeof(str_val)) > 0) {
322 int64_t **current_array;
323 unsigned int arraylen;
325 // Expect array object in context
326 if (avio_r8(ioc) != AMF_DATA_TYPE_ARRAY)
329 arraylen = avio_rb32(ioc);
333 if (!strcmp(KEYFRAMES_TIMESTAMP_TAG , str_val) && !times) {
/* NOTE(review): the right-hand side below looks like a text-encoding
 * casualty of "&times" (address of the times array) -- confirm against the
 * pristine source. */
334 current_array = ×
336 } else if (!strcmp(KEYFRAMES_BYTEOFFSET_TAG, str_val) &&
338 current_array = &filepositions;
339 fileposlen = arraylen;
341 // unexpected metatag inside keyframes, will not use such
342 // metadata for indexing
345 if (!(*current_array = av_mallocz(sizeof(**current_array) * arraylen))) {
346 ret = AVERROR(ENOMEM);
/* Every element must be an AMF number; its 64-bit payload is converted to a
 * double and stored into the int64_t array. */
350 for (i = 0; i < arraylen && avio_tell(ioc) < max_pos - 1; i++) {
351 if (avio_r8(ioc) != AMF_DATA_TYPE_NUMBER)
353 current_array[0][i] = av_int2double(avio_rb64(ioc));
355 if (times && filepositions) {
356 // All done, exiting at a position allowing amf_parse_object
357 // to finish parsing the object
/* The index is accepted only when both arrays have the same length, hold
 * more than one entry, and the first position is not before max_pos. */
363 if (timeslen == fileposlen && fileposlen>1 && max_pos <= filepositions[0]) {
364 for (i = 0; i < fileposlen; i++) {
/* Times are multiplied by 1000 before being stored as timestamps. */
365 av_add_index_entry(vstream, filepositions[i], times[i] * 1000,
366 0, 0, AVINDEX_KEYFRAME);
/* Entries are also copied into flv->validate_index so flv_read_packet() can
 * cross-check them; the guard on these statements is not visible here. */
368 flv->validate_index[i].pos = filepositions[i];
369 flv->validate_index[i].dts = times[i] * 1000;
370 flv->validate_count = i + 1;
375 av_log(s, AV_LOG_WARNING, "Invalid keyframes object, skipping.\n");
380 av_freep(&filepositions);
/* Rewind so the caller can continue parsing the object generically. */
381 avio_seek(ioc, initial_pos, SEEK_SET);
/*
 * Parse one AMF value, recursing into objects and arrays, and apply
 * recognised metadata keys to the streams and the format context.
 *
 * s       - format context; duration, metadata and flags are updated.
 * astream - audio stream to configure, or NULL.
 * vstream - video stream to configure, or NULL.
 * key     - name of the property this value belongs to, or NULL.
 * max_pos - byte position bounding nested reads.
 * depth   - nesting depth; the keyframes index is only parsed at depth 1.
 *
 * Visible failure returns: -1 when a nested value cannot be parsed, and
 * AVERROR(ENOMEM) when the "datastream" subtitle stream cannot be created.
 */
385 static int amf_parse_object(AVFormatContext *s, AVStream *astream,
386 AVStream *vstream, const char *key,
387 int64_t max_pos, int depth)
389 AVCodecContext *acodec, *vcodec;
390 FLVContext *flv = s->priv_data;
392 AMFDataType amf_type;
/* The first byte of every AMF value is its type marker. */
398 amf_type = avio_r8(ioc);
401 case AMF_DATA_TYPE_NUMBER:
402 num_val = av_int2double(avio_rb64(ioc));
404 case AMF_DATA_TYPE_BOOL:
405 num_val = avio_r8(ioc);
407 case AMF_DATA_TYPE_STRING:
408 if (amf_get_string(ioc, str_val, sizeof(str_val)) < 0) {
409 av_log(s, AV_LOG_ERROR, "AMF_DATA_TYPE_STRING parsing failed\n");
413 case AMF_DATA_TYPE_OBJECT:
/* An object named KEYFRAMES_TAG at depth 1 is first offered to the index
 * parser (part of this condition is not visible in this excerpt). */
414 if ((vstream || astream) && key &&
416 !strcmp(KEYFRAMES_TAG, key) && depth == 1)
417 if (parse_keyframes_index(s, ioc, vstream ? vstream : astream,
419 av_log(s, AV_LOG_ERROR, "Keyframe index parsing failed\n");
/* Generic walk over the object's name/value pairs. */
421 while (avio_tell(ioc) < max_pos - 2 &&
422 amf_get_string(ioc, str_val, sizeof(str_val)) > 0)
423 if (amf_parse_object(s, astream, vstream, str_val, max_pos,
425 return -1; // if we couldn't skip, bomb out.
426 if (avio_r8(ioc) != AMF_END_OF_OBJECT) {
427 av_log(s, AV_LOG_ERROR, "Missing AMF_END_OF_OBJECT in AMF_DATA_TYPE_OBJECT\n");
431 case AMF_DATA_TYPE_NULL:
432 case AMF_DATA_TYPE_UNDEFINED:
433 case AMF_DATA_TYPE_UNSUPPORTED:
434 break; // these take up no additional space
435 case AMF_DATA_TYPE_MIXEDARRAY:
436 avio_skip(ioc, 4); // skip 32-bit max array index
437 while (avio_tell(ioc) < max_pos - 2 &&
438 amf_get_string(ioc, str_val, sizeof(str_val)) > 0)
439 // this is the only case in which we would want a nested
440 // parse to not skip over the object
441 if (amf_parse_object(s, astream, vstream, str_val, max_pos,
444 if (avio_r8(ioc) != AMF_END_OF_OBJECT) {
445 av_log(s, AV_LOG_ERROR, "Missing AMF_END_OF_OBJECT in AMF_DATA_TYPE_MIXEDARRAY\n");
449 case AMF_DATA_TYPE_ARRAY:
451 unsigned int arraylen, i;
/* Strict-array elements are parsed without streams or a key, so they are
 * consumed but never applied as metadata. */
453 arraylen = avio_rb32(ioc);
454 for (i = 0; i < arraylen && avio_tell(ioc) < max_pos - 1; i++)
455 if (amf_parse_object(s, NULL, NULL, NULL, max_pos,
457 return -1; // if we couldn't skip, bomb out.
460 case AMF_DATA_TYPE_DATE:
461 avio_skip(ioc, 8 + 2); // timestamp (double) and UTC offset (int16)
463 default: // unsupported type, we couldn't skip
464 av_log(s, AV_LOG_ERROR, "unsupported amf type %d\n", amf_type);
469 acodec = astream ? astream->codec : NULL;
470 vcodec = vstream ? vstream->codec : NULL;
472 // stream info doesn't live any deeper than the first object
474 if (amf_type == AMF_DATA_TYPE_NUMBER ||
475 amf_type == AMF_DATA_TYPE_BOOL) {
/* Duration is scaled by AV_TIME_BASE; the data rates are scaled by 1024 and
 * only applied when the scaled value is non-negative as an int. */
476 if (!strcmp(key, "duration"))
477 s->duration = num_val * AV_TIME_BASE;
478 else if (!strcmp(key, "videodatarate") && vcodec &&
479 0 <= (int)(num_val * 1024.0))
480 vcodec->bit_rate = num_val * 1024.0;
481 else if (!strcmp(key, "audiodatarate") && acodec &&
482 0 <= (int)(num_val * 1024.0))
483 acodec->bit_rate = num_val * 1024.0;
/* A "datastream" key creates a text subtitle stream. */
484 else if (!strcmp(key, "datastream")) {
485 AVStream *st = create_stream(s, AVMEDIA_TYPE_SUBTITLE);
487 return AVERROR(ENOMEM);
488 st->codec->codec_id = AV_CODEC_ID_TEXT;
/* Codec parameters from metadata are applied only when the trust_metadata
 * option is set. */
489 } else if (flv->trust_metadata) {
490 if (!strcmp(key, "videocodecid") && vcodec) {
491 flv_set_video_codec(s, vstream, num_val, 0);
492 } else if (!strcmp(key, "audiocodecid") && acodec) {
/* Shift the id into the position flv_set_audio_codec() expects. */
493 int id = ((int)num_val) << FLV_AUDIO_CODECID_OFFSET;
494 flv_set_audio_codec(s, astream, acodec, id);
495 } else if (!strcmp(key, "audiosamplerate") && acodec) {
496 acodec->sample_rate = num_val;
497 } else if (!strcmp(key, "audiosamplesize") && acodec) {
498 acodec->bits_per_coded_sample = num_val;
499 } else if (!strcmp(key, "stereo") && acodec) {
/* The channel count is the stereo value plus one. */
500 acodec->channels = num_val + 1;
501 acodec->channel_layout = acodec->channels == 2 ?
502 AV_CH_LAYOUT_STEREO :
504 } else if (!strcmp(key, "width") && vcodec) {
505 vcodec->width = num_val;
506 } else if (!strcmp(key, "height") && vcodec) {
507 vcodec->height = num_val;
513 if (amf_type == AMF_DATA_TYPE_OBJECT && s->nb_streams == 1 &&
514 ((!acodec && !strcmp(key, "audiocodecid")) ||
515 (!vcodec && !strcmp(key, "videocodecid"))))
516 s->ctx_flags &= ~AVFMTCTX_NOHEADER; //If there is either audio/video missing, codecid will be an empty object
/* Keys already consumed above. NOTE(review): the statement guarded by this
 * condition is not visible; presumably these keys are kept out of the
 * metadata dictionary -- confirm. */
518 if (!strcmp(key, "duration") ||
519 !strcmp(key, "filesize") ||
520 !strcmp(key, "width") ||
521 !strcmp(key, "height") ||
522 !strcmp(key, "videodatarate") ||
523 !strcmp(key, "framerate") ||
524 !strcmp(key, "videocodecid") ||
525 !strcmp(key, "audiodatarate") ||
526 !strcmp(key, "audiosamplerate") ||
527 !strcmp(key, "audiosamplesize") ||
528 !strcmp(key, "stereo") ||
529 !strcmp(key, "audiocodecid") ||
530 !strcmp(key, "datastream"))
/* Remaining values are exported to s->metadata: booleans as "true"/"false",
 * numbers formatted without fractional digits, strings as read. */
533 s->event_flags |= AVFMT_EVENT_FLAG_METADATA_UPDATED;
534 if (amf_type == AMF_DATA_TYPE_BOOL) {
535 av_strlcpy(str_val, num_val > 0 ? "true" : "false",
537 av_dict_set(&s->metadata, key, str_val, 0);
538 } else if (amf_type == AMF_DATA_TYPE_NUMBER) {
539 snprintf(str_val, sizeof(str_val), "%.f", num_val);
540 av_dict_set(&s->metadata, key, str_val, 0);
541 } else if (amf_type == AMF_DATA_TYPE_STRING)
542 av_dict_set(&s->metadata, key, str_val, 0);
/* Result codes of flv_read_metabody(), identifying the script-data handler
 * name found at the start of a meta tag. flv_read_packet() treats
 * TYPE_UNKNOWN like a parse failure. */
548 #define TYPE_ONTEXTDATA 1
549 #define TYPE_ONCAPTION 2
550 #define TYPE_ONCAPTIONINFO 3
551 #define TYPE_UNKNOWN 9
/*
 * Read the body of a script-data (meta) tag.
 *
 * s        - format context.
 * next_pos - byte position passed to amf_parse_object() as its read bound.
 *
 * Returns TYPE_ONTEXTDATA, TYPE_ONCAPTION or TYPE_ONCAPTIONINFO when the
 * leading string names one of those handlers. For "onMetaData" and
 * "onCuePoint" the following value is parsed with amf_parse_object(). The
 * remaining return statements are not visible in this excerpt.
 */
553 static int flv_read_metabody(AVFormatContext *s, int64_t next_pos)
556 AVStream *stream, *astream, *vstream;
557 AVStream av_unused *dstream;
560 // only needs to hold the string "onMetaData".
561 // Anything longer is something we don't want.
569 // first object needs to be "onMetaData" string
571 if (type != AMF_DATA_TYPE_STRING ||
572 amf_get_string(ioc, buffer, sizeof(buffer)) < 0)
575 if (!strcmp(buffer, "onTextData"))
576 return TYPE_ONTEXTDATA;
578 if (!strcmp(buffer, "onCaption"))
579 return TYPE_ONCAPTION;
581 if (!strcmp(buffer, "onCaptionInfo"))
582 return TYPE_ONCAPTIONINFO;
/* Any name other than "onMetaData" or "onCuePoint" is logged as unknown. */
584 if (strcmp(buffer, "onMetaData") && strcmp(buffer, "onCuePoint")) {
585 av_log(s, AV_LOG_DEBUG, "Unknown type %s\n", buffer);
589 // find the streams now so that amf_parse_object doesn't need to do
590 // the lookup every time it is called.
591 for (i = 0; i < s->nb_streams; i++) {
592 stream = s->streams[i];
593 if (stream->codec->codec_type == AVMEDIA_TYPE_VIDEO)
595 else if (stream->codec->codec_type == AVMEDIA_TYPE_AUDIO)
597 else if (stream->codec->codec_type == AVMEDIA_TYPE_SUBTITLE)
601 // parse the second object (we want a mixed array)
602 if (amf_parse_object(s, astream, vstream, buffer, next_pos, 0) < 0)
/*
 * read_header callback: read the FLV file header and create the streams it
 * announces.
 *
 * Returns AVERROR(ENOMEM) if a stream cannot be created; the success return
 * is not visible in this excerpt.
 */
608 static int flv_read_header(AVFormatContext *s)
/* Flags byte announcing which of audio and video are present. */
613 flags = avio_r8(s->pb);
/* Streams may still appear later while reading packets. */
615 s->ctx_flags |= AVFMTCTX_NOHEADER;
617 if (flags & FLV_HEADER_FLAG_HASVIDEO)
618 if (!create_stream(s, AVMEDIA_TYPE_VIDEO))
619 return AVERROR(ENOMEM);
620 if (flags & FLV_HEADER_FLAG_HASAUDIO)
621 if (!create_stream(s, AVMEDIA_TYPE_AUDIO))
622 return AVERROR(ENOMEM);
623 // Flag doesn't indicate whether or not there is script-data present. Must
624 // create that stream if it's encountered.
/* The header stores an absolute 32-bit offset; seek there to continue. */
626 offset = avio_rb32(s->pb);
627 avio_seek(s->pb, offset, SEEK_SET);
/* read_close callback: release any extradata still queued in the private
 * context for each stream type. */
635 static int flv_read_close(AVFormatContext *s)
638 FLVContext *flv = s->priv_data;
639 for (i=0; i<FLV_STREAM_TYPE_NB; i++)
640 av_freep(&flv->new_extradata[i]);
/*
 * Replace a stream's extradata with `size` bytes read from s->pb.
 *
 * Any existing extradata is freed first. Every failure of ff_get_extradata()
 * is reported as AVERROR(ENOMEM); the success return is not visible in this
 * excerpt.
 */
644 static int flv_get_extradata(AVFormatContext *s, AVStream *st, int size)
646 av_freep(&st->codec->extradata);
647 if (ff_get_extradata(st->codec, s->pb, size) < 0)
648 return AVERROR(ENOMEM);
/*
 * Read `size` bytes from pb and queue them as pending extradata for the
 * given stream type, replacing anything queued before.
 *
 * flv    - private context holding the queue.
 * pb     - I/O context to read from.
 * stream - index into new_extradata[] / new_extradata_size[].
 *
 * Returns AVERROR(ENOMEM) if the buffer cannot be allocated; the success
 * return is not visible in this excerpt.
 */
652 static int flv_queue_extradata(FLVContext *flv, AVIOContext *pb, int stream,
655 av_free(flv->new_extradata[stream]);
/* Zeroed allocation with FF_INPUT_BUFFER_PADDING_SIZE extra bytes. */
656 flv->new_extradata[stream] = av_mallocz(size +
657 FF_INPUT_BUFFER_PADDING_SIZE);
658 if (!flv->new_extradata[stream])
659 return AVERROR(ENOMEM);
660 flv->new_extradata_size[stream] = size;
/* NOTE(review): the result of avio_read() is not checked here. */
661 avio_read(pb, flv->new_extradata[stream], size);
/*
 * Drop index entries that point at or beyond `pos` from every stream,
 * keeping earlier entries in their original order.
 *
 * s   - format context whose streams are filtered.
 * pos - first file position considered invalid.
 */
665 static void clear_index_entries(AVFormatContext *s, int64_t pos)
668 av_log(s, AV_LOG_WARNING,
669 "Found invalid index entries, clearing the index.\n");
670 for (i = 0; i < s->nb_streams; i++) {
671 AVStream *st = s->streams[i];
672 /* Remove all index entries that point to >= pos */
/* In-place compaction: `out` is the write cursor (its declaration is not
 * visible in this excerpt). */
674 for (j = 0; j < st->nb_index_entries; j++)
675 if (st->index_entries[j].pos < pos)
676 st->index_entries[out++] = st->index_entries[j];
677 st->nb_index_entries = out;
/*
 * Skip over one AMF value of the given type, recursing into containers.
 *
 * pb   - I/O context positioned just after the value's type byte.
 * type - AMF type of the value to skip.
 *
 * A negative result from a nested call is detected by the visible code, and
 * AVERROR_INVALIDDATA is returned on one path (presumably for unhandled
 * types; the label is not visible). Other return statements are not visible
 * in this excerpt.
 */
681 static int amf_skip_tag(AVIOContext *pb, AMFDataType type)
683 int nb = -1, ret, parse_name = 1;
686 case AMF_DATA_TYPE_NUMBER:
689 case AMF_DATA_TYPE_BOOL:
/* Strings carry a 16-bit length prefix followed by that many bytes. */
692 case AMF_DATA_TYPE_STRING:
693 avio_skip(pb, avio_rb16(pb));
695 case AMF_DATA_TYPE_ARRAY:
697 case AMF_DATA_TYPE_MIXEDARRAY:
699 case AMF_DATA_TYPE_OBJECT:
/* Strict arrays iterate while the `nb` countdown is positive; the other
 * container types keep looping until the loop is left from inside or the
 * input ends. */
700 while(!pb->eof_reached && (nb-- > 0 || type != AMF_DATA_TYPE_ARRAY)) {
702 int size = avio_rb16(pb);
/* Recurse on the member's value; its type byte is read here. */
709 if ((ret = amf_skip_tag(pb, avio_r8(pb))) < 0)
713 case AMF_DATA_TYPE_NULL:
714 case AMF_DATA_TYPE_OBJECT_END:
717 return AVERROR_INVALIDDATA;
/*
 * Turn a text-carrying script-data tag into a subtitle packet.
 *
 * s    - format context; a text subtitle stream is created if none exists.
 * pkt  - packet to fill.
 * dts  - timestamp of the tag (its use is not visible in this excerpt).
 * next - file position of the end of the tag body; the function finally
 *        seeks to next + 4.
 *
 * ret starts as AVERROR_INVALIDDATA; AVERROR(ENOMEM) is returned if the
 * subtitle stream cannot be created.
 */
722 static int flv_data_packet(AVFormatContext *s, AVPacket *pkt,
723 int64_t dts, int64_t next)
725 AVIOContext *pb = s->pb;
728 int ret = AVERROR_INVALIDDATA;
/* The container type decides how the members are walked. */
732 switch (avio_r8(pb)) {
733 case AMF_DATA_TYPE_ARRAY:
735 case AMF_DATA_TYPE_MIXEDARRAY:
/* Skip 4 bytes relative to the current position. */
736 avio_seek(pb, 4, SEEK_CUR);
737 case AMF_DATA_TYPE_OBJECT:
/* In array mode members have no names; otherwise a name is read first. */
743 while (array || (ret = amf_get_string(pb, buf, sizeof(buf))) > 0) {
744 AMFDataType type = avio_r8(pb);
/* A string value (named "text" unless in array mode) becomes the payload:
 * its 16-bit length is read and that many bytes form the packet. */
745 if (type == AMF_DATA_TYPE_STRING && (array || !strcmp(buf, "text"))) {
746 length = avio_rb16(pb);
747 ret = av_get_packet(pb, pkt, length);
/* Every other member is skipped. */
753 if ((ret = amf_skip_tag(pb, type)) < 0)
759 ret = AVERROR_INVALIDDATA;
/* Look for an existing subtitle stream. */
763 for (i = 0; i < s->nb_streams; i++) {
765 if (st->codec->codec_type == AVMEDIA_TYPE_SUBTITLE)
/* None found: create a text subtitle stream. */
769 if (i == s->nb_streams) {
770 st = create_stream(s, AVMEDIA_TYPE_SUBTITLE);
772 return AVERROR(ENOMEM);
773 st->codec->codec_id = AV_CODEC_ID_TEXT;
780 pkt->stream_index = st->index;
781 pkt->flags |= AV_PKT_FLAG_KEY;
/* Move past the tag body and the 4 bytes that follow it. */
784 avio_seek(s->pb, next + 4, SEEK_SET);
/*
 * read_packet callback: read FLV tags until one yields a packet.
 *
 * For each tag this reads the tag header, validates the keyframe index taken
 * from metadata, dispatches on the tag type (audio, video, meta), finds or
 * creates the matching stream, applies codec parameters and extradata, and
 * finally reads the payload into pkt.
 *
 * Visible error results include AVERROR(ENOMEM) when a stream cannot be
 * created and AVERROR(EAGAIN) for tags that produce no packet (queued
 * extradata, empty payloads).
 */
789 static int flv_read_packet(AVFormatContext *s, AVPacket *pkt)
791 FLVContext *flv = s->priv_data;
792 int ret, i, type, size, flags;
794 int64_t next, pos, meta_pos;
795 int64_t dts, pts = AV_NOPTS_VALUE;
796 int av_uninit(channels);
797 int av_uninit(sample_rate);
800 /* pkt size is repeated at end. skip it */
801 for (;; avio_skip(s->pb, 4)) {
/* Tag header: type in the low 5 bits, 24-bit body size, 24-bit timestamp
 * followed by one byte that supplies timestamp bits 24..31. */
802 pos = avio_tell(s->pb);
803 type = (avio_r8(s->pb) & 0x1F);
804 size = avio_rb24(s->pb);
805 dts = avio_rb24(s->pb);
806 dts |= avio_r8(s->pb) << 24;
807 av_log(s, AV_LOG_TRACE, "type:%d, size:%d, dts:%"PRId64" pos:%"PRId64"\n", type, size, dts, avio_tell(s->pb));
808 if (avio_feof(s->pb))
810 avio_skip(s->pb, 3); /* stream id, always 0 */
/* Cross-check the metadata keyframe index: a tag found exactly at the next
 * indexed position must have a dts within VALIDATE_INDEX_TS_THRESH of the
 * indexed one. On mismatch, or when the indexed position has been passed
 * without a tag starting there, the index is cleared and validation stops. */
813 if (flv->validate_next < flv->validate_count) {
814 int64_t validate_pos = flv->validate_index[flv->validate_next].pos;
815 if (pos == validate_pos) {
816 if (FFABS(dts - flv->validate_index[flv->validate_next].dts) <=
817 VALIDATE_INDEX_TS_THRESH) {
818 flv->validate_next++;
820 clear_index_entries(s, validate_pos);
821 flv->validate_count = 0;
823 } else if (pos > validate_pos) {
824 clear_index_entries(s, validate_pos);
825 flv->validate_count = 0;
/* File position just past this tag's body. */
832 next = size + avio_tell(s->pb);
834 if (type == FLV_TAG_TYPE_AUDIO) {
835 stream_type = FLV_STREAM_TYPE_AUDIO;
836 flags = avio_r8(s->pb);
838 } else if (type == FLV_TAG_TYPE_VIDEO) {
839 stream_type = FLV_STREAM_TYPE_VIDEO;
840 flags = avio_r8(s->pb);
/* Video info/command frames are special-cased; the guarded statement is not
 * visible in this excerpt. */
842 if ((flags & FLV_VIDEO_FRAMETYPE_MASK) == FLV_FRAME_VIDEO_INFO_CMD)
844 } else if (type == FLV_TAG_TYPE_META) {
845 stream_type=FLV_STREAM_TYPE_DATA;
846 if (size > 13 + 1 + 4) { // Header-type metadata stuff
/* Remember where the body starts so it can be re-read as a data packet. */
848 meta_pos = avio_tell(s->pb);
849 type = flv_read_metabody(s, next);
850 if (type == 0 && dts == 0 || type < 0 || type == TYPE_UNKNOWN) {
852 } else if (type == TYPE_ONTEXTDATA) {
853 avpriv_request_sample(s, "OnTextData packet");
854 return flv_data_packet(s, pkt, dts, next);
855 } else if (type == TYPE_ONCAPTION) {
856 return flv_data_packet(s, pkt, dts, next);
858 avio_seek(s->pb, meta_pos, SEEK_SET);
861 av_log(s, AV_LOG_DEBUG,
862 "Skipping flv packet: type %d, size %d, flags %d.\n",
865 avio_seek(s->pb, next, SEEK_SET);
869 /* skip empty data packets */
873 /* now find stream */
/* A stream matches when its media type fits and, for audio and video,
 * either the user forced a codec id or the tag's codec agrees with the
 * stream's. */
874 for (i = 0; i < s->nb_streams; i++) {
876 if (stream_type == FLV_STREAM_TYPE_AUDIO) {
877 if (st->codec->codec_type == AVMEDIA_TYPE_AUDIO &&
878 (s->audio_codec_id || flv_same_audio_codec(st->codec, flags)))
880 } else if (stream_type == FLV_STREAM_TYPE_VIDEO) {
881 if (st->codec->codec_type == AVMEDIA_TYPE_VIDEO &&
882 (s->video_codec_id || flv_same_video_codec(st->codec, flags)))
884 } else if (stream_type == FLV_STREAM_TYPE_DATA) {
885 if (st->codec->codec_type == AVMEDIA_TYPE_SUBTITLE)
/* No match: create a stream on the fly; stream_type indexes the table. */
889 if (i == s->nb_streams) {
890 static const enum AVMediaType stream_types[] = {AVMEDIA_TYPE_VIDEO, AVMEDIA_TYPE_AUDIO, AVMEDIA_TYPE_SUBTITLE};
891 av_log(s, AV_LOG_WARNING, "Stream discovered after head already parsed\n");
892 st = create_stream(s, stream_types[stream_type]);
894 return AVERROR(ENOMEM);
897 av_log(s, AV_LOG_TRACE, "%d %X %d \n", stream_type, flags, st->discard);
/* On seekable input, video key frames and all audio tags are added to the
 * seek index. */
899 if (s->pb->seekable &&
900 ((flags & FLV_VIDEO_FRAMETYPE_MASK) == FLV_FRAME_KEY ||
901 stream_type == FLV_STREAM_TYPE_AUDIO))
902 av_add_index_entry(st, pos, dts, size, 0, AVINDEX_KEYFRAME);
/* Apply the stream's discard setting by seeking past the tag body. */
904 if ( (st->discard >= AVDISCARD_NONKEY && !((flags & FLV_VIDEO_FRAMETYPE_MASK) == FLV_FRAME_KEY || (stream_type == FLV_STREAM_TYPE_AUDIO)))
905 ||(st->discard >= AVDISCARD_BIDIR && ((flags & FLV_VIDEO_FRAMETYPE_MASK) == FLV_FRAME_DISP_INTER && (stream_type == FLV_STREAM_TYPE_VIDEO)))
906 || st->discard >= AVDISCARD_ALL
908 avio_seek(s->pb, next, SEEK_SET);
914 // if not streamed and no duration from metadata then seek to end to find
915 // the duration from the timestamps
916 if (s->pb->seekable && (!s->duration || s->duration == AV_NOPTS_VALUE) && !flv->searched_for_end) {
918 const int64_t pos = avio_tell(s->pb);
919 // Read the last 4 bytes of the file, this should be the size of the
920 // previous FLV tag. Use the timestamp of its payload as duration.
921 int64_t fsize = avio_size(s->pb);
923 avio_seek(s->pb, fsize - 4, SEEK_SET);
924 size = avio_rb32(s->pb);
925 // Seek to the start of the last FLV tag at position (fsize - 4 - size)
926 // but skip the byte indicating the type.
927 avio_seek(s->pb, fsize - 3 - size, SEEK_SET);
/* Plausibility check: the trailing size must equal that tag's body size
 * plus 11. */
928 if (size == avio_rb24(s->pb) + 11) {
929 uint32_t ts = avio_rb24(s->pb);
930 ts |= avio_r8(s->pb) << 24;
/* The timestamp is divided by 1000 and scaled to AV_TIME_BASE units. */
932 s->duration = ts * (int64_t)AV_TIME_BASE / 1000;
933 else if (fsize >= 8 && fsize - 8 >= size) {
/* Restore the read position; the search is attempted only once. */
939 avio_seek(s->pb, pos, SEEK_SET);
940 flv->searched_for_end = 1;
943 if (stream_type == FLV_STREAM_TYPE_AUDIO) {
944 int bits_per_coded_sample;
/* Decode channel count, sample rate and sample size from the flags byte;
 * the rate is 44100 shifted left by the rate index, then right by 3. */
945 channels = (flags & FLV_AUDIO_CHANNEL_MASK) == FLV_STEREO ? 2 : 1;
946 sample_rate = 44100 << ((flags & FLV_AUDIO_SAMPLERATE_MASK) >>
947 FLV_AUDIO_SAMPLERATE_OFFSET) >> 3;
948 bits_per_coded_sample = (flags & FLV_AUDIO_SAMPLESIZE_MASK) ? 16 : 8;
/* Fill in stream parameters only if any of them is still unset. */
949 if (!st->codec->channels || !st->codec->sample_rate ||
950 !st->codec->bits_per_coded_sample) {
951 st->codec->channels = channels;
952 st->codec->channel_layout = channels == 1
954 : AV_CH_LAYOUT_STEREO;
955 st->codec->sample_rate = sample_rate;
956 st->codec->bits_per_coded_sample = bits_per_coded_sample;
958 if (!st->codec->codec_id) {
959 flv_set_audio_codec(s, st, st->codec,
960 flags & FLV_AUDIO_CODECID_MASK);
961 flv->last_sample_rate =
962 sample_rate = st->codec->sample_rate;
964 channels = st->codec->channels;
/* Codec already known: run the codec setup on a scratch context to learn the
 * sample rate this tag implies without touching the stream. */
966 AVCodecContext ctx = {0};
967 ctx.sample_rate = sample_rate;
968 ctx.bits_per_coded_sample = bits_per_coded_sample;
969 flv_set_audio_codec(s, st, &ctx, flags & FLV_AUDIO_CODECID_MASK);
970 sample_rate = ctx.sample_rate;
972 } else if (stream_type == FLV_STREAM_TYPE_VIDEO) {
/* The codec setup reports how many body bytes do not belong to the payload. */
973 size -= flv_set_video_codec(s, st, flags & FLV_VIDEO_CODECID_MASK, 1);
974 } else if (stream_type == FLV_STREAM_TYPE_DATA) {
975 st->codec->codec_id = AV_CODEC_ID_TEXT;
/* AAC, H.264 and MPEG-4 bodies start with a packet-type byte. */
978 if (st->codec->codec_id == AV_CODEC_ID_AAC ||
979 st->codec->codec_id == AV_CODEC_ID_H264 ||
980 st->codec->codec_id == AV_CODEC_ID_MPEG4) {
981 int type = avio_r8(s->pb);
983 if (st->codec->codec_id == AV_CODEC_ID_H264 || st->codec->codec_id == AV_CODEC_ID_MPEG4) {
/* 24-bit composition time offset, sign-extended to 32 bits by the add/xor
 * pair. */
985 int32_t cts = (avio_rb24(s->pb) + 0xff800000) ^ 0xff800000;
987 if (cts < 0) { // dts might be wrong
989 av_log(s, AV_LOG_WARNING,
990 "Negative cts, previous timestamps might be wrong.\n");
/* A dts/pts gap above 1000*60*15 is treated as invalid. */
992 } else if (FFABS(dts - pts) > 1000*60*15) {
993 av_log(s, AV_LOG_WARNING,
994 "invalid timestamps %"PRId64" %"PRId64"\n", dts, pts);
995 dts = pts = AV_NOPTS_VALUE;
/* Packet type 0 carries codec configuration (extradata). */
998 if (type == 0 && (!st->codec->extradata || st->codec->codec_id == AV_CODEC_ID_AAC ||
999 st->codec->codec_id == AV_CODEC_ID_H264)) {
1000 AVDictionaryEntry *t;
/* If extradata already exists the new blob is queued, to be attached to a
 * later packet as side data; otherwise it becomes the stream's extradata. */
1002 if (st->codec->extradata) {
1003 if ((ret = flv_queue_extradata(flv, s->pb, stream_type, size)) < 0)
1005 ret = AVERROR(EAGAIN);
1008 if ((ret = flv_get_extradata(s, st, size)) < 0)
1011 /* Workaround for buggy Omnia A/XE encoder */
1012 t = av_dict_get(s->metadata, "Encoder", NULL, 0);
1013 if (st->codec->codec_id == AV_CODEC_ID_AAC && t && !strcmp(t->value, "Omnia A/XE"))
1014 st->codec->extradata_size = 2;
/* The "&& 0" keeps this AAC config parsing permanently disabled. */
1016 if (st->codec->codec_id == AV_CODEC_ID_AAC && 0) {
1017 MPEG4AudioConfig cfg;
1019 if (avpriv_mpeg4audio_get_config(&cfg, st->codec->extradata,
1020 st->codec->extradata_size * 8, 1) >= 0) {
1021 st->codec->channels = cfg.channels;
1022 st->codec->channel_layout = 0;
1023 if (cfg.ext_sample_rate)
1024 st->codec->sample_rate = cfg.ext_sample_rate;
1026 st->codec->sample_rate = cfg.sample_rate;
1027 av_log(s, AV_LOG_TRACE, "mp4a config channels %d sample rate %d\n",
1028 st->codec->channels, st->codec->sample_rate);
1032 ret = AVERROR(EAGAIN);
1037 /* skip empty data packets */
1039 ret = AVERROR(EAGAIN);
/* Read the payload itself. */
1043 ret = av_get_packet(s->pb, pkt, size);
/* pts falls back to dts when no composition offset was applied. */
1047 pkt->pts = pts == AV_NOPTS_VALUE ? dts : pts;
1048 pkt->stream_index = st->index;
/* Attach queued extradata as side data, then release the queue slot. */
1049 if (flv->new_extradata[stream_type]) {
1050 uint8_t *side = av_packet_new_side_data(pkt, AV_PKT_DATA_NEW_EXTRADATA,
1051 flv->new_extradata_size[stream_type]);
1053 memcpy(side, flv->new_extradata[stream_type],
1054 flv->new_extradata_size[stream_type]);
1055 av_freep(&flv->new_extradata[stream_type]);
1056 flv->new_extradata_size[stream_type] = 0;
/* Signal a mid-stream change of audio sample rate or channel count. */
1059 if (stream_type == FLV_STREAM_TYPE_AUDIO &&
1060 (sample_rate != flv->last_sample_rate ||
1061 channels != flv->last_channels)) {
1062 flv->last_sample_rate = sample_rate;
1063 flv->last_channels = channels;
1064 ff_add_param_change(pkt, channels, 0, sample_rate, 0, 0);
/* Audio, data and video key frames are flagged as key packets. */
1067 if ( stream_type == FLV_STREAM_TYPE_AUDIO ||
1068 ((flags & FLV_VIDEO_FRAMETYPE_MASK) == FLV_FRAME_KEY) ||
1069 stream_type == FLV_STREAM_TYPE_DATA)
1070 pkt->flags |= AV_PKT_FLAG_KEY;
/* Skip 4 bytes (the repeated size noted at the top of the loop). */
1073 avio_skip(s->pb, 4);
/*
 * read_seek callback: delegate the seek to avio_seek_time() on the
 * underlying I/O context and return its result.
 *
 * Index validation is switched off first by zeroing validate_count.
 */
1077 static int flv_read_seek(AVFormatContext *s, int stream_index,
1078 int64_t ts, int flags)
1080 FLVContext *flv = s->priv_data;
1081 flv->validate_count = 0;
1082 return avio_seek_time(s->pb, stream_index, ts, flags);
/* Byte offset of a field inside FLVContext, for the option table. */
1085 #define OFFSET(x) offsetof(FLVContext, x)
/* Option flags used by the entry below: video + decoding parameter. */
1086 #define VD AV_OPT_FLAG_VIDEO_PARAM | AV_OPT_FLAG_DECODING_PARAM
/* Private options. "flv_metadata" is an integer stored in
 * FLVContext.trust_metadata, default 0, allowed range 0..1. */
1087 static const AVOption options[] = {
1088 { "flv_metadata", "Allocate streams according to the onMetaData array", OFFSET(trust_metadata), AV_OPT_TYPE_INT, { .i64 = 0 }, 0, 1, VD },
/* AVClass for the "flv" demuxer; referenced as .priv_class of
 * ff_flv_demuxer. One initializer line is not visible in this excerpt. */
1092 static const AVClass flv_class = {
1093 .class_name = "flvdec",
1094 .item_name = av_default_item_name,
1096 .version = LIBAVUTIL_VERSION_INT,
/* Demuxer definition for FLV files: wires the callbacks defined in this
 * file to the demuxer interface. The .name line is not visible in this
 * excerpt. */
1099 AVInputFormat ff_flv_demuxer = {
1101 .long_name = NULL_IF_CONFIG_SMALL("FLV (Flash Video)"),
1102 .priv_data_size = sizeof(FLVContext),
1103 .read_probe = flv_probe,
1104 .read_header = flv_read_header,
1105 .read_packet = flv_read_packet,
1106 .read_seek = flv_read_seek,
1107 .read_close = flv_read_close,
1108 .extensions = "flv",
1109 .priv_class = &flv_class,
/* AVClass for the live variant; referenced as .priv_class of
 * ff_live_flv_demuxer. One initializer line is not visible in this
 * excerpt. */
1112 static const AVClass live_flv_class = {
1113 .class_name = "live_flvdec",
1114 .item_name = av_default_item_name,
1116 .version = LIBAVUTIL_VERSION_INT,
/* Demuxer definition for live RTMP FLV streams. It shares every callback
 * with ff_flv_demuxer except the probe, and additionally sets
 * AVFMT_TS_DISCONT. The .name line is not visible in this excerpt. */
1119 AVInputFormat ff_live_flv_demuxer = {
1121 .long_name = NULL_IF_CONFIG_SMALL("live RTMP FLV (Flash Video)"),
1122 .priv_data_size = sizeof(FLVContext),
1123 .read_probe = live_flv_probe,
1124 .read_header = flv_read_header,
1125 .read_packet = flv_read_packet,
1126 .read_seek = flv_read_seek,
1127 .read_close = flv_read_close,
1128 .extensions = "flv",
1129 .priv_class = &live_flv_class,
1130 .flags = AVFMT_TS_DISCONT