3 * Copyright (c) 2001 Fabrice Bellard.
5 * This library is free software; you can redistribute it and/or
6 * modify it under the terms of the GNU Lesser General Public
7 * License as published by the Free Software Foundation; either
8 * version 2 of the License, or (at your option) any later version.
10 * This library is distributed in the hope that it will be useful,
11 * but WITHOUT ANY WARRANTY; without even the implied warranty of
12 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
13 * Lesser General Public License for more details.
15 * You should have received a copy of the GNU Lesser General Public
16 * License along with this library; if not, write to the Free Software
17 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
/**
 * Per-stream demuxer state. The functions below reach it through the
 * priv_data pointer of each AVStream. Only some members are visible in
 * this excerpt.
 */
29 typedef struct AVIStream {
30 int64_t frame_offset; /* current frame (video) or byte (audio) counter
31 (used to compute the pts) */
37 int sample_size; /* audio only data */
/* cum_len is the running timestamp handed to av_add_index_entry() while
 * avi_read_idx1() walks the index records. */
40 int cum_len; /* temporary storage (used during seek) */
42 int prefix; ///< normally 'd'<<8 + 'c' or 'w'<<8 + 'b'
/* NOTE(review): dv_demux is accessed as avi->dv_demux with avi being an
 * AVIContext pointer, so this member presumably belongs to the AVIContext
 * struct whose declaration is not visible here -- confirm. */
54 DVDemuxContext* dv_demux;
/* Forward declaration; the definition follows guess_ni_flag() further down. */
57 static int avi_load_index(AVFormatContext *s);
/* Prints a label, the four characters of a chunk tag and the chunk size
 * (in hex) to stdout. The printf arguments are not visible in this excerpt. */
60 static void print_tag(const char *str, unsigned int tag, int size)
62 printf("%s: tag=%c%c%c%c size=0x%x\n",
/**
 * Checks the RIFF container header.
 *
 * Verifies the RIFF tag, stores the absolute end offset of the RIFF chunk
 * in avi->riff_end (the chunk size plus the file position right after the
 * size field), then requires the following tag to be AVI (with a trailing
 * space) or AVIX. The caller in avi_read_header() treats a negative return
 * value as failure; the return statements are not visible in this excerpt.
 */
71 static int get_riff(AVIContext *avi, ByteIOContext *pb)
74 /* check RIFF header */
77 if (tag != MKTAG('R', 'I', 'F', 'F'))
79 avi->riff_end = get_le32(pb); /* RIFF chunk size */
80 avi->riff_end += url_ftell(pb); /* RIFF chunk end */
82 if (tag != MKTAG('A', 'V', 'I', ' ') && tag != MKTAG('A', 'V', 'I', 'X'))
/**
 * Parses the AVI header chunks and sets up the streams.
 *
 * After get_riff() succeeds, the visible chunk switch handles:
 *  - LIST: ignored except for the movi list, whose position and end are
 *    stored in avi->movi_list and avi->movi_end;
 *  - dmlh: payload skipped;
 *  - avih: reads the frame period and the bit rate, then creates streams
 *    with av_new_stream(), each getting a zero-initialised AVIStream;
 *  - strh: per-stream header (handler tag, scale and rate used for the time
 *    base, start, frame count, sample size, stream type), with a separate
 *    path for type-1 DV files (iavs / ivas) that hands the single stream
 *    over to the DV demuxer;
 *  - strf: stream format. For video the bitmap header fields, optional
 *    extradata and, for depths of 8 bits or less, a palette copied from the
 *    extradata; for audio the wav header via get_wav_header(); other stream
 *    types are marked as data with no codec id.
 *
 * At the end the stream number is checked; on mismatch the extradata and the
 * streams are freed. The index is asserted to be not yet loaded and is then
 * flagged as loaded.
 *
 * NOTE(review): many lines of this function (loop, returns, several
 * conditions) are missing from this excerpt; the description covers only
 * what is visible.
 */
88 static int avi_read_header(AVFormatContext *s, AVFormatParameters *ap)
90 AVIContext *avi = s->priv_data;
91 ByteIOContext *pb = &s->pb;
92 uint32_t tag, tag1, handler;
93 int codec_type, stream_index, frame_period, bit_rate;
94 unsigned int size, nb_frames;
98 int xan_video = 0; /* hack to support Xan A/V */
100 avi->stream_index= -1;
102 if (get_riff(avi, pb) < 0)
115 print_tag("tag", tag, size);
119 case MKTAG('L', 'I', 'S', 'T'):
120 /* ignored, except when start of video packets */
123 print_tag("list", tag1, 0);
125 if (tag1 == MKTAG('m', 'o', 'v', 'i')) {
126 avi->movi_list = url_ftell(pb) - 4;
/* a list size of 0 means the movi data is taken to run to the end of the file */
127 if(size) avi->movi_end = avi->movi_list + size;
128 else avi->movi_end = url_fsize(pb);
130 printf("movi end=%Lx\n", avi->movi_end);
135 case MKTAG('d', 'm', 'l', 'h'):
/* odd chunk sizes are rounded up to the next even byte count when skipping */
137 url_fskip(pb, size + (size & 1));
139 case MKTAG('a', 'v', 'i', 'h'):
141 /* using frame_period is bad idea */
142 frame_period = get_le32(pb);
143 bit_rate = get_le32(pb) * 8;
144 url_fskip(pb, 4 * 4);
148 st = av_new_stream(s, i);
152 ast = av_mallocz(sizeof(AVIStream));
157 url_fskip(pb, size - 7 * 4);
159 case MKTAG('s', 't', 'r', 'h'):
163 handler = get_le32(pb); /* codec tag */
165 print_tag("strh", tag1, -1);
167 if(tag1 == MKTAG('i', 'a', 'v', 's') || tag1 == MKTAG('i', 'v', 'a', 's')){
169 * After some consideration -- I don't think we
170 * have to support anything but DV in a type1 AVIs.
172 if (s->nb_streams != 1)
175 if (handler != MKTAG('d', 'v', 's', 'd') &&
176 handler != MKTAG('d', 'v', 'h', 'd') &&
177 handler != MKTAG('d', 'v', 's', 'l'))
180 ast = s->streams[0]->priv_data;
181 av_freep(&s->streams[0]->codec->extradata);
182 av_freep(&s->streams[0]);
184 avi->dv_demux = dv_init_demux(s);
187 s->streams[0]->priv_data = ast;
188 url_fskip(pb, 3 * 4);
189 ast->scale = get_le32(pb);
190 ast->rate = get_le32(pb);
191 stream_index = s->nb_streams - 1;
192 url_fskip(pb, size - 7*4);
196 if (stream_index >= s->nb_streams) {
197 url_fskip(pb, size - 8);
200 st = s->streams[stream_index];
202 st->codec->stream_codec_tag= handler;
204 get_le32(pb); /* flags */
205 get_le16(pb); /* priority */
206 get_le16(pb); /* language */
207 get_le32(pb); /* initial frame */
208 ast->scale = get_le32(pb);
209 ast->rate = get_le32(pb);
210 if(ast->scale && ast->rate){
211 }else if(frame_period){
213 ast->scale = frame_period;
218 av_set_pts_info(st, 64, ast->scale, ast->rate);
220 ast->start= get_le32(pb); /* start */
221 nb_frames = get_le32(pb);
224 st->duration = nb_frames;
225 get_le32(pb); /* buffer size */
226 get_le32(pb); /* quality */
227 ast->sample_size = get_le32(pb); /* sample ssize */
228 // av_log(NULL, AV_LOG_DEBUG, "%d %d %d %d\n", ast->rate, ast->scale, ast->start, ast->sample_size);
231 case MKTAG('v', 'i', 'd', 's'):
232 codec_type = CODEC_TYPE_VIDEO;
234 ast->sample_size = 0;
236 case MKTAG('a', 'u', 'd', 's'):
237 codec_type = CODEC_TYPE_AUDIO;
239 case MKTAG('t', 'x', 't', 's'):
241 codec_type = CODEC_TYPE_DATA; //CODEC_TYPE_SUB ? FIXME
243 case MKTAG('p', 'a', 'd', 's'):
244 codec_type = CODEC_TYPE_UNKNOWN;
248 av_log(s, AV_LOG_ERROR, "unknown stream type %X\n", tag1);
251 url_fskip(pb, size - 12 * 4);
253 case MKTAG('s', 't', 'r', 'f'):
255 if (stream_index >= s->nb_streams || avi->dv_demux) {
258 st = s->streams[stream_index];
260 case CODEC_TYPE_VIDEO:
261 get_le32(pb); /* size */
262 st->codec->width = get_le32(pb);
263 st->codec->height = get_le32(pb);
264 get_le16(pb); /* panes */
265 st->codec->bits_per_sample= get_le16(pb); /* depth */
267 get_le32(pb); /* ImageSize */
268 get_le32(pb); /* XPelsPerMeter */
269 get_le32(pb); /* YPelsPerMeter */
270 get_le32(pb); /* ClrUsed */
271 get_le32(pb); /* ClrImportant */
273 if(size > 10*4 && size<(1<<30)){
274 st->codec->extradata_size= size - 10*4;
275 st->codec->extradata= av_malloc(st->codec->extradata_size + FF_INPUT_BUFFER_PADDING_SIZE);
276 get_buffer(pb, st->codec->extradata, st->codec->extradata_size);
279 if(st->codec->extradata_size & 1) //FIXME check if the encoder really did this correctly
282 /* Extract palette from extradata if bpp <= 8 */
283 /* This code assumes that extradata contains only palette */
284 /* This is true for all paletted codecs implemented in ffmpeg */
285 if (st->codec->extradata_size && (st->codec->bits_per_sample <= 8)) {
286 st->codec->palctrl = av_mallocz(sizeof(AVPaletteControl));
287 #ifdef WORDS_BIGENDIAN
288 for (i = 0; i < FFMIN(st->codec->extradata_size, AVPALETTE_SIZE)/4; i++)
289 st->codec->palctrl->palette[i] = bswap_32(((uint32_t*)st->codec->extradata)[i]);
291 memcpy(st->codec->palctrl->palette, st->codec->extradata,
292 FFMIN(st->codec->extradata_size, AVPALETTE_SIZE));
294 st->codec->palctrl->palette_changed = 1;
298 print_tag("video", tag1, 0);
300 st->codec->codec_type = CODEC_TYPE_VIDEO;
301 st->codec->codec_tag = tag1;
302 st->codec->codec_id = codec_get_id(codec_bmp_tags, tag1);
303 if (st->codec->codec_id == CODEC_ID_XAN_WC4)
305 st->need_parsing = 2; //only parse headers dont do slower repacketization, this is needed to get the pict type which is needed for generating correct pts
306 // url_fskip(pb, size - 5 * 4);
308 case CODEC_TYPE_AUDIO:
309 get_wav_header(pb, st->codec, size);
310 if (size%2) /* 2-aligned (fix for Stargate SG-1 - 3x18 - Shades of Grey.avi) */
312 /* special case time: To support Xan DPCM, hardcode
313 * the format if Xxan is the video codec */
314 st->need_parsing = 1;
315 /* force parsing as several audio frames can be in
318 st->codec->codec_id = CODEC_ID_XAN_DPCM;
321 st->codec->codec_type = CODEC_TYPE_DATA;
322 st->codec->codec_id= CODEC_ID_NONE;
323 st->codec->codec_tag= 0;
337 /* check stream number */
338 if (stream_index != s->nb_streams - 1) {
340 for(i=0;i<s->nb_streams;i++) {
341 av_freep(&s->streams[i]->codec->extradata);
342 av_freep(&s->streams[i]);
347 assert(!avi->index_loaded);
349 avi->index_loaded = 1;
/**
 * Reads the next packet from the file.
 *
 * Visible flow:
 *  - with a DV demuxer attached, dv_get_packet() is asked for a packet;
 *  - for non-interleaved files each stream gets a candidate timestamp
 *    (frame_offset, divided by sample_size where applicable, rescaled to
 *    AV_TIME_BASE units); the chosen stream is looked up in its index and
 *    the file is positioned inside the matching chunk, taking into account
 *    how much of that chunk has already been consumed. The comparison that
 *    picks the best stream is not visible here, presumably the smallest
 *    timestamp wins -- confirm;
 *  - when a chunk is open (avi->stream_index >= 0) up to ast->remaining
 *    bytes are read into the packet, dts and the key flag are set and the
 *    frame_offset / remaining counters are updated;
 *  - otherwise the stream is scanned for the next chunk header using the
 *    d[] array (reset to -1 before the scan). Index (ix), JUNK and
 *    discarded chunks are skipped, an accepted data chunk sets
 *    avi->stream_index, packet_size and remaining, and a palette change
 *    chunk (pc) updates the palette of the stream.
 *
 * NOTE(review): many lines (returns, loop bodies, conditions) are missing
 * from this excerpt.
 */
354 static int avi_read_packet(AVFormatContext *s, AVPacket *pkt)
356 AVIContext *avi = s->priv_data;
357 ByteIOContext *pb = &s->pb;
363 size = dv_get_packet(avi->dv_demux, pkt);
368 if(avi->non_interleaved){
369 int best_stream_index = 0;
370 AVStream *best_st= NULL;
372 int64_t best_ts= INT64_MAX;
375 for(i=0; i<s->nb_streams; i++){
376 AVStream *st = s->streams[i];
377 AVIStream *ast = st->priv_data;
378 int64_t ts= ast->frame_offset;
381 ts /= ast->sample_size;
382 ts= av_rescale(ts, AV_TIME_BASE * (int64_t)st->time_base.num, st->time_base.den);
384 // av_log(NULL, AV_LOG_DEBUG, "%Ld %d/%d %Ld\n", ts, st->time_base.num, st->time_base.den, ast->frame_offset);
388 best_stream_index= i;
391 best_ast = best_st->priv_data;
392 best_ts= av_rescale(best_ts, best_st->time_base.den, AV_TIME_BASE * (int64_t)best_st->time_base.num); //FIXME a little ugly
393 if(best_ast->remaining)
394 i= av_index_search_timestamp(best_st, best_ts, AVSEEK_FLAG_ANY | AVSEEK_FLAG_BACKWARD);
396 i= av_index_search_timestamp(best_st, best_ts, AVSEEK_FLAG_ANY);
398 // av_log(NULL, AV_LOG_DEBUG, "%d\n", i);
400 int64_t pos= best_st->index_entries[i].pos;
/* packet_size - remaining is the number of bytes of this chunk already passed */
401 pos += avi->movi_list + best_ast->packet_size - best_ast->remaining;
402 url_fseek(&s->pb, pos, SEEK_SET);
403 // av_log(NULL, AV_LOG_DEBUG, "pos=%Ld\n", pos);
405 if(best_ast->remaining)
406 avi->stream_index= best_stream_index;
408 avi->stream_index= -1;
413 if(avi->stream_index >= 0){
414 AVStream *st= s->streams[ avi->stream_index ];
415 AVIStream *ast= st->priv_data;
/* Choose the read size: sample sizes below 32 are read 64 samples at a
 * time, larger ones one sample at a time, and never more than what is left
 * of the chunk. The assignment for sample_size == 0 is not visible here. */
418 if(ast->sample_size == 0)
420 else if(ast->sample_size < 32)
421 size= 64*ast->sample_size;
423 size= ast->sample_size;
425 if(size > ast->remaining)
426 size= ast->remaining;
427 av_get_packet(pb, pkt, size);
/* the packet destructor is saved and restored around dv_produce_packet() */
430 dstr = pkt->destruct;
431 size = dv_produce_packet(avi->dv_demux, pkt,
432 pkt->data, pkt->size);
433 pkt->destruct = dstr;
434 pkt->flags |= PKT_FLAG_KEY;
436 /* XXX: how to handle B frames in avi ? */
437 pkt->dts = ast->frame_offset;
438 // pkt->dts += ast->start;
440 pkt->dts /= ast->sample_size;
441 //av_log(NULL, AV_LOG_DEBUG, "dts:%Ld offset:%d %d/%d smpl_siz:%d base:%d st:%d size:%d\n", pkt->dts, ast->frame_offset, ast->scale, ast->rate, ast->sample_size, AV_TIME_BASE, n, size);
442 pkt->stream_index = avi->stream_index;
444 if (st->codec->codec_type == CODEC_TYPE_VIDEO) {
445 if(st->index_entries){
449 index= av_index_search_timestamp(st, pkt->dts, 0);
450 e= &st->index_entries[index];
452 if(index >= 0 && e->timestamp == ast->frame_offset){
453 if (e->flags & AVINDEX_KEYFRAME)
454 pkt->flags |= PKT_FLAG_KEY;
457 /* if no index, better to say that all frames
459 pkt->flags |= PKT_FLAG_KEY;
462 pkt->flags |= PKT_FLAG_KEY;
465 ast->frame_offset += pkt->size;
469 ast->remaining -= size;
471 avi->stream_index= -1;
482 memset(d, -1, sizeof(int)*8);
483 for(i=sync=url_ftell(pb); !url_feof(pb); i++) {
486 if (i >= avi->movi_end) {
488 url_fskip(pb, avi->riff_end - i);
489 avi->riff_end = avi->movi_end = url_fsize(pb);
498 size= d[4] + (d[5]<<8) + (d[6]<<16) + (d[7]<<24);
500 if( d[2] >= '0' && d[2] <= '9'
501 && d[3] >= '0' && d[3] <= '9'){
502 n= (d[2] - '0') * 10 + (d[3] - '0');
504 n= 100; //invalid stream id
506 //av_log(NULL, AV_LOG_DEBUG, "%X %X %X %X %X %X %X %X %lld %d %d\n", d[0], d[1], d[2], d[3], d[4], d[5], d[6], d[7], i, size, n);
507 if(i + size > avi->movi_end || d[0]<0)
511 if( (d[0] == 'i' && d[1] == 'x' && n < s->nb_streams)
513 ||(d[0] == 'J' && d[1] == 'U' && d[2] == 'N' && d[3] == 'K')){
515 //av_log(NULL, AV_LOG_DEBUG, "SKIP\n");
519 if( d[0] >= '0' && d[0] <= '9'
520 && d[1] >= '0' && d[1] <= '9'){
521 n= (d[0] - '0') * 10 + (d[1] - '0');
523 n= 100; //invalid stream id
527 if(n < s->nb_streams){
533 if( (st->discard >= AVDISCARD_DEFAULT && size==0)
534 /*|| (st->discard >= AVDISCARD_NONKEY && !(pkt->flags & PKT_FLAG_KEY))*/ //FIXME needs a little reordering
535 || st->discard >= AVDISCARD_ALL){
536 if(ast->sample_size) ast->frame_offset += pkt->size;
537 else ast->frame_offset++;
542 if( ((ast->prefix_count<5 || sync+9 > i) && d[2]<128 && d[3]<128) ||
543 d[2]*256+d[3] == ast->prefix /*||
544 (d[2] == 'd' && d[3] == 'c') ||
545 (d[2] == 'w' && d[3] == 'b')*/) {
547 //av_log(NULL, AV_LOG_DEBUG, "OK\n");
548 if(d[2]*256+d[3] == ast->prefix)
551 ast->prefix= d[2]*256+d[3];
552 ast->prefix_count= 0;
555 avi->stream_index= n;
/* packet_size also counts the 8 header bytes held in d[0..7] */
556 ast->packet_size= size + 8;
557 ast->remaining= size;
561 /* palette changed chunk */
562 if ( d[0] >= '0' && d[0] <= '9'
563 && d[1] >= '0' && d[1] <= '9'
564 && ((d[2] == 'p' && d[3] == 'c'))
565 && n < s->nb_streams && i + size <= avi->movi_end) {
568 int first, clr, flags, k, p;
572 first = get_byte(pb);
574 if(!clr) /* all 256 colors used */
576 flags = get_le16(pb);
578 for (k = first; k < clr + first; k++) {
/* entries are packed with blue in the low byte, then green, then red */
584 st->codec->palctrl->palette[k] = b + (g << 8) + (r << 16);
586 st->codec->palctrl->palette_changed = 1;
/**
 * Reads an idx1 index chunk of the given byte size, treating it as 16-byte
 * records, and adds one index entry per record to the stream named by the
 * record tag. avi_load_index() treats a negative return value as failure;
 * the return statements are not visible in this excerpt.
 */
595 /* XXX: we make the implicit supposition that the position are sorted
597 static int avi_read_idx1(AVFormatContext *s, int size)
599 AVIContext *avi = s->priv_data;
600 ByteIOContext *pb = &s->pb;
601 int nb_index_entries, i;
604 unsigned int index, tag, flags, pos, len;
605 unsigned last_pos= -1;
607 nb_index_entries = size / 16;
608 if (nb_index_entries <= 0)
611 /* read the entries and sort them in each stream component */
612 for(i = 0; i < nb_index_entries; i++) {
614 flags = get_le32(pb);
617 #if defined(DEBUG_SEEK)
618 av_log(NULL, AV_LOG_DEBUG, "%d: tag=0x%x flags=0x%x pos=0x%x len=%d/",
619 i, tag, flags, pos, len);
/* If the first position already lies beyond the movi list start, movi_list
 * is zeroed; since positions are later offset by movi_list, they are then
 * used as they appear in the index. */
621 if(i==0 && pos > avi->movi_list)
622 avi->movi_list= 0; //FIXME better check
/* stream number: two ASCII decimal digits in the two low bytes of the tag */
624 index = ((tag & 0xff) - '0') * 10;
625 index += ((tag >> 8) & 0xff) - '0';
626 if (index >= s->nb_streams)
628 st = s->streams[index];
631 #if defined(DEBUG_SEEK)
632 av_log(NULL, AV_LOG_DEBUG, "%d cum_len=%d\n", len, ast->cum_len);
635 avi->non_interleaved= 1;
/* cum_len serves as the timestamp of the entry; AVIIF_INDEX in the record
 * flags marks the entry as a keyframe */
637 av_add_index_entry(st, pos, ast->cum_len, 0, (flags&AVIIF_INDEX) ? AVINDEX_KEYFRAME : 0);
639 ast->cum_len += len / ast->sample_size;
/**
 * Heuristic for detecting a non-interleaved file from the loaded index.
 *
 * Tracks the largest first-entry position and the smallest last-entry
 * position over the streams and returns nonzero when the former exceeds the
 * latter, i.e. when some stream begins after another one has already ended.
 * NOTE(review): the handling of streams without index entries is not
 * visible in this excerpt.
 */
647 static int guess_ni_flag(AVFormatContext *s){
649 int64_t last_start=0;
650 int64_t first_end= INT64_MAX;
652 for(i=0; i<s->nb_streams; i++){
653 AVStream *st = s->streams[i];
654 int n= st->nb_index_entries;
659 if(st->index_entries[0].pos > last_start)
660 last_start= st->index_entries[0].pos;
661 if(st->index_entries[n-1].pos < first_end)
662 first_end= st->index_entries[n-1].pos;
664 return last_start > first_end;
/**
 * Loads the index stored after the movi data.
 *
 * Remembers the current file position, seeks to avi->movi_end, parses an
 * idx1 chunk with avi_read_idx1() when one is found, ORs the result of
 * guess_ni_flag() into avi->non_interleaved and finally seeks back to the
 * remembered position. The chunk loop and the return value are not visible
 * in this excerpt.
 */
667 static int avi_load_index(AVFormatContext *s)
669 AVIContext *avi = s->priv_data;
670 ByteIOContext *pb = &s->pb;
672 offset_t pos= url_ftell(pb);
674 url_fseek(pb, avi->movi_end, SEEK_SET);
676 printf("movi_end=0x%llx\n", avi->movi_end);
684 printf("tag=%c%c%c%c size=0x%x\n",
692 case MKTAG('i', 'd', 'x', '1'):
693 if (avi_read_idx1(s, size) < 0)
/* the heuristic can only set the flag, never clear it */
706 avi->non_interleaved |= guess_ni_flag(s);
707 url_fseek(pb, pos, SEEK_SET);
/**
 * Seeks to the index entry of stream_index that matches timestamp.
 *
 * Marks the index as loaded if it was not (the load call itself is not
 * visible here), looks up the target entry in the requested stream and then
 * resynchronises every stream: the target timestamp is rescaled into the
 * time base of each stream, the matching index entry is searched (backward),
 * and the frame_offset of that stream is set from the entry. For interleaved
 * files the chosen entry is additionally moved relative to the target file
 * position. Pending DV audio packets are flushed, the file is positioned at
 * the target entry and avi->stream_index is reset so that the next read
 * starts with a fresh chunk search.
 *
 * NOTE(review): returns, error checks and the bodies of the two while loops
 * are missing from this excerpt.
 */
711 static int avi_read_seek(AVFormatContext *s, int stream_index, int64_t timestamp, int flags)
713 AVIContext *avi = s->priv_data;
718 if (!avi->index_loaded) {
719 /* we only load the index on demand */
721 avi->index_loaded = 1;
723 assert(stream_index>= 0);
725 st = s->streams[stream_index];
726 index= av_index_search_timestamp(st, timestamp, flags);
730 /* find the position */
731 pos = st->index_entries[index].pos;
732 timestamp = st->index_entries[index].timestamp;
734 // av_log(NULL, AV_LOG_DEBUG, "XX %Ld %d %Ld\n", timestamp, index, st->index_entries[index].timestamp);
736 for(i = 0; i < s->nb_streams; i++) {
737 AVStream *st2 = s->streams[i];
738 AVIStream *ast2 = st2->priv_data;
743 if (st2->nb_index_entries <= 0)
746 // assert(st2->codec.block_align);
747 assert(st2->time_base.den == ast2->rate);
748 assert(st2->time_base.num == ast2->scale);
749 index = av_index_search_timestamp(
751 av_rescale(timestamp, st2->time_base.den*(int64_t)st->time_base.num, st->time_base.den * (int64_t)st2->time_base.num),
752 flags | AVSEEK_FLAG_BACKWARD);
756 if(!avi->non_interleaved){
757 while(index>0 && st2->index_entries[index].pos > pos)
759 while(index+1 < st2->nb_index_entries && st2->index_entries[index].pos < pos)
763 // av_log(NULL, AV_LOG_DEBUG, "%Ld %d %Ld\n", timestamp, index, st2->index_entries[index].timestamp);
764 /* extract the current frame number */
765 ast2->frame_offset = st2->index_entries[index].timestamp;
/* streams with a sample size keep frame_offset in bytes, so scale it back up */
766 if(ast2->sample_size)
767 ast2->frame_offset *=ast2->sample_size;
771 dv_flush_audio_packets(avi->dv_demux);
/* index positions are stored relative to avi->movi_list */
773 pos += avi->movi_list;
774 url_fseek(&s->pb, pos, SEEK_SET);
775 avi->stream_index= -1;
/**
 * Releases demuxer resources: for every stream the codec extradata and the
 * palette control block are freed, then the DV demuxer context.
 * NOTE(review): ast is fetched for each stream but its release is not
 * visible in this excerpt.
 */
779 static int avi_read_close(AVFormatContext *s)
782 AVIContext *avi = s->priv_data;
784 for(i=0;i<s->nb_streams;i++) {
785 AVStream *st = s->streams[i];
786 AVIStream *ast = st->priv_data;
788 av_free(st->codec->extradata);
789 av_free(st->codec->palctrl);
793 av_free(avi->dv_demux);
/**
 * Probe callback: returns AVPROBE_SCORE_MAX when the probe buffer holds more
 * than 32 bytes, starts with RIFF and carries AVI followed by a space at
 * byte offset 8. Unlike get_riff(), the AVIX tag is not matched here. The
 * return values of the other paths are not visible in this excerpt.
 */
798 static int avi_probe(AVProbeData *p)
800 /* check file header */
801 if (p->buf_size <= 32)
803 if (p->buf[0] == 'R' && p->buf[1] == 'I' &&
804 p->buf[2] == 'F' && p->buf[3] == 'F' &&
805 p->buf[8] == 'A' && p->buf[9] == 'V' &&
806 p->buf[10] == 'I' && p->buf[11] == ' ')
807 return AVPROBE_SCORE_MAX;
/* Input format descriptor registered by avidec_init(); its initializer
 * fields are not visible in this excerpt. */
812 static AVInputFormat avi_iformat = {
/* Registers the AVI input format (avi_iformat) with libavformat. The return
 * statement is not visible in this excerpt. */
823 int avidec_init(void)
825 av_register_input_format(&avi_iformat);