2 * "Real" compatible mux and demux.
3 * Copyright (c) 2000, 2001 Fabrice Bellard.
5 * This library is free software; you can redistribute it and/or
6 * modify it under the terms of the GNU Lesser General Public
7 * License as published by the Free Software Foundation; either
8 * version 2 of the License, or (at your option) any later version.
10 * This library is distributed in the hope that it will be useful,
11 * but WITHOUT ANY WARRANTY; without even the implied warranty of
12 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
13 * Lesser General Public License for more details.
15 * You should have received a copy of the GNU Lesser General Public
16 * License along with this library; if not, write to the Free Software
17 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
/* Value written into the "preroll" field of the file header and of each
   stream header below. */
22 #define BUFFER_DURATION 0
/* NOTE(review): the enclosing declaration is not visible in this excerpt.
   These look like StreamInfo members, since the code below accesses them
   as stream->packet_total_size, stream->nb_frames and
   stream->total_frames -- confirm against the full file. */
/* running sum of the packet lengths passed to write_packet_header() */
26 int packet_total_size;
28 /* codec related output */
31 int nb_frames; /* current frame number */
32 int total_frames; /* total number of frames */
/* NOTE(review): the enclosing declaration is not visible in this excerpt.
   These are accessed through RMContext pointers below (rm->streams,
   rm->audio_stream, rm->video_stream, rm->data_pos). */
/* per-stream state, indexed by stream number.
   NOTE(review): fixed at two entries, while the loops below index it up
   to nb_streams -- confirm callers never register more than two streams. */
38 StreamInfo streams[2];
/* set by rm_write_header() to the streams[] entry of the audio stream and
   of the video stream respectively */
39 StreamInfo *audio_stream, *video_stream;
40 int data_pos; /* position of the data after the header */
/* Writes a string to s, starting with strlen(tag) emitted through
   put_be16(). NOTE(review): the rest of the body is not visible in this
   excerpt. */
44 static void put_str(ByteIOContext *s, const char *tag)
46 put_be16(s,strlen(tag));
/* Same as put_str(), but the length prefix is a single byte written with
   put_byte(). NOTE(review): the rest of the body is not visible in this
   excerpt; presumably tag must be shorter than 256 characters -- confirm. */
52 static void put_str8(ByteIOContext *s, const char *tag)
54 put_byte(s, strlen(tag));
/*
 * Writes the file-level headers to ctx->pb:
 *   - global properties (bit rate, packet sizes, packet count, duration,
 *     preroll, index offset, data offset, stream count, flags),
 *   - the title / author / copyright / comment strings,
 *   - one header per stream, carrying either audio or video codec info,
 *   - the start of the data section.
 *
 * ctx       - muxer context; stream statistics are read from
 *             ((RMContext *)ctx->priv_data)->streams[]
 * data_size - used for the size field written near the end
 *             (data_size + 10 + 8)
 * index_pos - written as the index offset
 *
 * The data offset field is first written as 0 and patched directly in the
 * output buffer once the header length is known; the same value is stored
 * in rm->data_pos.
 */
60 static void rv10_write_header(AVFormatContext *ctx,
61 int data_size, int index_pos)
63 RMContext *rm = ctx->priv_data;
64 ByteIOContext *s = &ctx->pb;
66 unsigned char *data_offset_ptr, *start_ptr;
67 const char *desc, *mimetype;
68 int nb_packets, packet_total_size, packet_max_size, size, packet_avg_size, i;
69 int bit_rate, v, duration, flags, data_pos;
/* remember where the header begins; data_pos is measured from here */
71 start_ptr = s->buf_ptr;
74 put_be32(s,18); /* header size */
77 put_be32(s,4 + ctx->nb_streams); /* num headers */
83 packet_total_size = 0;
/* aggregate the per-stream statistics into file-wide totals */
87 for(i=0;i<ctx->nb_streams;i++) {
88 StreamInfo *stream = &rm->streams[i];
89 bit_rate += stream->bit_rate;
90 if (stream->packet_max_size > packet_max_size)
91 packet_max_size = stream->packet_max_size;
92 nb_packets += stream->nb_packets;
93 packet_total_size += stream->packet_total_size;
94 /* select maximum duration */
/* 1000 * frames / frame_rate: presumably milliseconds, assuming frame_rate
   is in frames per second -- confirm */
95 v = (int) (1000.0 * (float)stream->total_frames / stream->frame_rate);
99 put_be32(s, bit_rate); /* max bit rate */
100 put_be32(s, bit_rate); /* avg bit rate */
101 put_be32(s, packet_max_size); /* max packet size */
/* NOTE(review): divides by nb_packets; rm_write_header() calls this
   function before any packet has been written. A guard against zero is
   not visible in this excerpt -- confirm one exists. */
103 packet_avg_size = packet_total_size / nb_packets;
106 put_be32(s, packet_avg_size); /* avg packet size */
107 put_be32(s, nb_packets); /* num packets */
108 put_be32(s, duration); /* duration */
109 put_be32(s, BUFFER_DURATION); /* preroll */
110 put_be32(s, index_pos); /* index offset */
111 /* computation of the data offset */
112 data_offset_ptr = s->buf_ptr;
113 put_be32(s, 0); /* data offset : will be patched after */
114 put_be16(s, ctx->nb_streams); /* num streams */
115 flags = 1 | 2; /* save allowed & perfect play */
116 if (url_is_streamed(s))
117 flags |= 4; /* live broadcast */
/* size of the content section: the four strings, their four 2-byte
   length prefixes (see put_str) and 10 further bytes */
123 size = strlen(ctx->title) + strlen(ctx->author) + strlen(ctx->copyright) +
124 strlen(ctx->comment) + 4 * 2 + 10;
127 put_str(s, ctx->title);
128 put_str(s, ctx->author);
129 put_str(s, ctx->copyright);
130 put_str(s, ctx->comment);
/* one header per stream */
132 for(i=0;i<ctx->nb_streams;i++) {
135 stream = &rm->streams[i];
/* description, MIME type and codec-data size depend on the stream type */
137 if (stream->enc->codec_type == CODEC_TYPE_AUDIO) {
138 desc = "The Audio Stream";
139 mimetype = "audio/x-pn-realaudio";
140 codec_data_size = 73;
142 desc = "The Video Stream";
143 mimetype = "video/x-pn-realvideo";
144 codec_data_size = 34;
148 size = 10 + 9 * 4 + strlen(desc) + strlen(mimetype) + codec_data_size;
152 put_be16(s, i); /* stream number */
153 put_be32(s, stream->bit_rate); /* max bit rate */
154 put_be32(s, stream->bit_rate); /* avg bit rate */
155 put_be32(s, stream->packet_max_size); /* max packet size */
156 if (stream->nb_packets > 0)
157 packet_avg_size = stream->packet_total_size /
161 put_be32(s, packet_avg_size); /* avg packet size */
162 put_be32(s, 0); /* start time */
163 put_be32(s, BUFFER_DURATION); /* preroll */
/* duration field: a fixed 3600 * 1000 when the output is streamed or no
   frames have been counted; the other visible write derives it from
   total_frames and frame_rate */
165 if (url_is_streamed(s) || !stream->total_frames)
166 put_be32(s, (int)(3600 * 1000));
168 put_be32(s, (int)(stream->total_frames * 1000 / stream->frame_rate));
170 put_str8(s, mimetype);
171 put_be32(s, codec_data_size);
173 if (stream->enc->codec_type == CODEC_TYPE_AUDIO) {
174 int coded_frame_size, fscode, sample_rate;
175 sample_rate = stream->enc->sample_rate;
/* bytes per coded frame: bit_rate * frame_size / (8 * sample_rate) */
176 coded_frame_size = (stream->enc->bit_rate *
177 stream->enc->frame_size) / (8 * sample_rate);
178 /* audio codec info */
181 put_be32(s, 0x00040000); /* version */
183 put_be32(s, 0x01b53530); /* stream length */
184 put_be16(s, 4); /* unknown */
185 put_be32(s, 0x39); /* header size */
/* fscode is chosen from sample_rate; the case labels are not visible in
   this excerpt */
187 switch(sample_rate) {
204 put_be16(s, fscode); /* codec additional info, for AC3, seems
205 to be a frequency code */
206 /* special hack to compensate rounding errors... */
207 if (coded_frame_size == 557)
209 put_be32(s, coded_frame_size); /* frame length */
210 put_be32(s, 0x51540); /* unknown */
211 put_be32(s, 0x249f0); /* unknown */
212 put_be32(s, 0x249f0); /* unknown */
214 /* frame length : seems to be very important */
215 put_be16(s, coded_frame_size);
216 put_be32(s, 0); /* unknown */
217 put_be16(s, stream->enc->sample_rate); /* sample rate */
218 put_be32(s, 0x10); /* unknown */
219 put_be16(s, stream->enc->channels);
220 put_str8(s, "Int0"); /* codec name */
221 put_str8(s, "dnet"); /* codec name */
222 put_be16(s, 0); /* title length */
223 put_be16(s, 0); /* author length */
224 put_be16(s, 0); /* copyright length */
225 put_byte(s, 0); /* end of header */
227 /* video codec info */
228 put_be32(s,34); /* size */
229 put_tag(s,"VIDORV10");
230 put_be16(s, stream->enc->width);
231 put_be16(s, stream->enc->height);
232 put_be16(s, (int) stream->frame_rate); /* frames per seconds ? */
233 put_be32(s,0); /* unknown meaning */
234 put_be16(s, (int) stream->frame_rate); /* unknown meaning */
235 put_be32(s,0); /* unknown meaning */
236 put_be16(s, 8); /* unknown meaning */
237 /* Seems to be the codec version: only use basic H263. The next
238 versions seem to add a differential DC coding as in
239 MPEG... nothing new under the sun */
240 put_be32(s,0x10000000);
241 //put_be32(s,0x10003000);
245 /* patch data offset field */
246 data_pos = s->buf_ptr - start_ptr;
247 rm->data_pos = data_pos;
/* store data_pos most-significant byte first, directly into the buffer
   at the placeholder written earlier */
248 data_offset_ptr[0] = data_pos >> 24;
249 data_offset_ptr[1] = data_pos >> 16;
250 data_offset_ptr[2] = data_pos >> 8;
251 data_offset_ptr[3] = data_pos;
/* start of the data section: size, packet count, next-header link */
255 put_be32(s,data_size + 10 + 8);
258 put_be32(s, nb_packets); /* number of packets */
259 put_be32(s,0); /* next data header */
/*
 * Updates the statistics of `stream` (packet count, total size, maximum
 * packet size) and writes a packet header to ctx->pb: version, length + 12,
 * stream number, timestamp, a reserved byte and a flags byte.
 *
 * length    - payload length counted in the statistics; the header stores
 *             length + 12
 * key_frame - non-zero writes 2 in the flags byte, zero writes 0
 */
262 static void write_packet_header(AVFormatContext *ctx, StreamInfo *stream,
263 int length, int key_frame)
266 ByteIOContext *s = &ctx->pb;
268 stream->nb_packets++;
269 stream->packet_total_size += length;
270 if (length > stream->packet_max_size)
271 stream->packet_max_size = length;
273 put_be16(s,0); /* version */
274 put_be16(s,length + 12);
275 put_be16(s, stream->num); /* stream number */
/* timestamp derived from the frames written so far: 1000 * nb_frames /
   frame_rate */
276 timestamp = (1000 * (float)stream->nb_frames) / stream->frame_rate;
277 put_be32(s, timestamp); /* timestamp */
278 put_byte(s, 0); /* reserved */
279 put_byte(s, key_frame ? 2 : 0); /* flags */
/*
 * Muxer header step: initializes one StreamInfo per stream from its codec
 * context, then writes a preliminary file header with
 * rv10_write_header(s, 0, 0) and flushes it. rm_write_trailer() rewrites
 * the header with final values when the output is not streamed.
 */
282 static int rm_write_header(AVFormatContext *s)
284 RMContext *rm = s->priv_data;
287 AVCodecContext *codec;
289 for(n=0;n<s->nb_streams;n++) {
/* stream ids are simply the stream indices */
290 s->streams[n]->id = n;
291 codec = &s->streams[n]->codec;
292 stream = &rm->streams[n];
/* start from a zeroed StreamInfo, then fill in what is known up front */
293 memset(stream, 0, sizeof(StreamInfo));
295 stream->bit_rate = codec->bit_rate;
298 switch(codec->codec_type) {
299 case CODEC_TYPE_AUDIO:
300 rm->audio_stream = stream;
/* audio frame rate = sample_rate / frame_size */
301 stream->frame_rate = (float)codec->sample_rate / (float)codec->frame_size;
302 /* XXX: dummy values */
303 stream->packet_max_size = 1024;
304 stream->nb_packets = 0;
305 stream->total_frames = stream->nb_packets;
307 case CODEC_TYPE_VIDEO:
308 rm->video_stream = stream;
/* codec->frame_rate is scaled by FRAME_RATE_BASE */
309 stream->frame_rate = (float)codec->frame_rate / (float)FRAME_RATE_BASE;
310 /* XXX: dummy values */
311 stream->packet_max_size = 4096;
312 stream->nb_packets = 0;
313 stream->total_frames = stream->nb_packets;
/* preliminary header: data size and index position are not known yet */
320 rv10_write_header(s, 0, 0);
321 put_flush_packet(&s->pb);
/*
 * Writes one audio packet for rm->audio_stream: a packet header, then
 * `size` bytes taken from a temporary buffer buf1, then a flush.
 * The loop that fills buf1 from buf is only partly visible in this
 * excerpt; per the existing comment it reorders the data for AC3.
 */
325 static int rm_write_audio(AVFormatContext *s, uint8_t *buf, int size)
328 RMContext *rm = s->priv_data;
329 ByteIOContext *pb = &s->pb;
330 StreamInfo *stream = rm->audio_stream;
333 /* XXX: suppress this malloc */
/* NOTE(review): no check of the av_malloc() result is visible in this
   excerpt before buf1 is used -- confirm. */
334 buf1= (uint8_t*) av_malloc( size * sizeof(uint8_t) );
336 write_packet_header(s, stream, size, stream->enc->coded_frame->key_frame);
338 /* for AC3, the words seem to be reversed */
/* steps two bytes at a time; NOTE(review): the loop body is not visible
   here -- check how an odd `size` is handled. */
339 for(i=0;i<size;i+=2) {
343 put_buffer(pb, buf1, size);
344 put_flush_packet(pb);
/*
 * Writes one video packet for rm->video_stream: a packet header, a few
 * extra bytes describing the frame (sizes/offsets tagged with 0x4000 and
 * the low 8 bits of the frame counter), the payload, then a flush.
 * NOTE(review): this excerpt appears to show two alternative code paths
 * (likely selected by preprocessor conditionals that are not visible).
 */
350 static int rm_write_video(AVFormatContext *s, uint8_t *buf, int size)
352 RMContext *rm = s->priv_data;
353 ByteIOContext *pb = &s->pb;
354 StreamInfo *stream = rm->video_stream;
355 int key_frame = stream->enc->coded_frame->key_frame;
357 /* XXX: this is incorrect: should be a parameter */
359 /* Well, I spent some time finding the meaning of these bits. I am
360 not sure I understood everything, but it works !! */
/* packet length covers the payload plus 7 extra bytes */
362 write_packet_header(s, stream, size + 7, key_frame);
363 /* bit 7: '1' if final packet of a frame converted in several packets */
365 /* bit 7: '1' if I frame. bits 6..0 : sequence number in current
366 frame starting from 1 */
372 put_be16(pb, 0x4000 | (size)); /* total frame size */
373 put_be16(pb, 0x4000 | (size)); /* offset from the start or the end */
/* NOTE(review): this call passes two arguments while
   write_packet_header() takes four; presumably it sits in a disabled
   preprocessor branch not visible here -- confirm. */
376 write_packet_header(s, size + 6);
378 put_be16(pb, 0x4000 | size); /* total frame size */
379 put_be16(pb, 0x4000 + packet_number * 126); /* position in stream */
/* low 8 bits of the frame counter */
381 put_byte(pb, stream->nb_frames & 0xff);
383 put_buffer(pb, buf, size);
384 put_flush_packet(pb);
/*
 * Muxer packet entry point: looks at the codec type of stream
 * `stream_index` and forwards buf/size to rm_write_audio() or
 * rm_write_video(), returning that function's result.
 * The right-hand side of the comparison is not visible in this excerpt.
 * force_pts is not used by any visible line.
 */
390 static int rm_write_packet(AVFormatContext *s, int stream_index,
391 uint8_t *buf, int size, int force_pts)
393 if (s->streams[stream_index]->codec.codec_type ==
395 return rm_write_audio(s, buf, size);
397 return rm_write_video(s, buf, size);
/*
 * Muxer trailer step. When the output is not streamed, it records the
 * current position as the index position, writes an index section with
 * zero entries per stream, seeks back to the start and rewrites the file
 * header with the final frame counts, data size and index position.
 * The output is flushed at the end.
 */
400 static int rm_write_trailer(AVFormatContext *s)
402 RMContext *rm = s->priv_data;
403 int data_size, index_pos, i;
404 ByteIOContext *pb = &s->pb;
406 if (!url_is_streamed(&s->pb)) {
407 /* end of file: finish to write header */
/* a zero-offset seek relative to the current position is used to obtain
   the current position */
408 index_pos = url_fseek(pb, 0, SEEK_CUR);
/* data size = everything written after the header */
409 data_size = index_pos - rm->data_pos;
413 put_be32(pb, 10 + 10 * s->nb_streams);
416 for(i=0;i<s->nb_streams;i++) {
417 put_be32(pb, 0); /* zero indices */
418 put_be16(pb, i); /* stream number */
419 put_be32(pb, 0); /* next index */
421 /* undocumented end header */
/* go back to the start and rewrite the header with the final values */
425 url_fseek(pb, 0, SEEK_SET);
426 for(i=0;i<s->nb_streams;i++)
427 rm->streams[i].total_frames = rm->streams[i].nb_frames;
428 rv10_write_header(s, data_size, index_pos);
430 /* undocumented end header */
434 put_flush_packet(pb);
438 /***************************************************/
/* Reads a string from pb into buf (capacity buf_size). Most of the body
   is not visible in this excerpt; the visible bound check suggests at most
   buf_size - 1 characters are stored, presumably leaving room for a
   terminator -- confirm. Counterpart of put_str() on the writing side. */
440 static void get_str(ByteIOContext *pb, char *buf, int buf_size)
448 if (i < buf_size - 1)
/* Reads a string from pb into buf (capacity buf_size). Most of the body
   is not visible in this excerpt; the visible bound check suggests at most
   buf_size - 1 characters are stored -- confirm. Presumably the
   counterpart of put_str8() (one-byte length prefix). */
454 static void get_str8(ByteIOContext *pb, char *buf, int buf_size)
462 if (i < buf_size - 1)
/*
 * Demuxer header step. Checks the '.RMF' signature, then walks the tagged
 * header sections:
 *   PROP - global properties; only the flags value is kept
 *   CONT - title, author, copyright and comment strings, stored in s
 *   MDPR - one per stream: allocates an AVStream and fills its codec
 *          parameters from the audio or video codec info
 *   DATA - start of the packet data
 * Other tags are skipped. Afterwards the packet count is read into
 * rm->nb_packets.
 * `ap` is not used by any visible line.
 */
468 static int rm_read_header(AVFormatContext *s, AVFormatParameters *ap)
470 RMContext *rm = s->priv_data;
472 ByteIOContext *pb = &s->pb;
474 int tag_size, size, codec_data_size, i;
476 unsigned int h263_hack_version;
/* file signature check */
480 if (get_le32(pb) != MKTAG('.', 'R', 'M', 'F'))
483 get_be32(pb); /* header size */
486 get_be32(pb); /* number of headers */
492 tag_size = get_be32(pb);
495 printf("tag=%c%c%c%c (%08x) size=%d\n",
506 case MKTAG('P', 'R', 'O', 'P'):
/* every field except flags is read and discarded */
508 get_be32(pb); /* max bit rate */
509 get_be32(pb); /* avg bit rate */
510 get_be32(pb); /* max packet size */
511 get_be32(pb); /* avg packet size */
512 get_be32(pb); /* nb packets */
513 get_be32(pb); /* duration */
514 get_be32(pb); /* preroll */
515 get_be32(pb); /* index offset */
516 get_be32(pb); /* data offset */
517 get_be16(pb); /* nb streams */
518 flags = get_be16(pb); /* flags */
520 case MKTAG('C', 'O', 'N', 'T'):
521 get_str(pb, s->title, sizeof(s->title));
522 get_str(pb, s->author, sizeof(s->author));
523 get_str(pb, s->copyright, sizeof(s->copyright));
524 get_str(pb, s->comment, sizeof(s->comment));
526 case MKTAG('M', 'D', 'P', 'R'):
/* new stream described by this section */
527 st = av_mallocz(sizeof(AVStream));
530 avcodec_get_context_defaults(&st->codec);
/* NOTE(review): no bound check on nb_streams is visible in this excerpt
   before the store -- confirm. */
531 s->streams[s->nb_streams++] = st;
532 st->id = get_be16(pb);
533 get_be32(pb); /* max bit rate */
534 st->codec.bit_rate = get_be32(pb); /* bit rate */
535 get_be32(pb); /* max packet size */
536 get_be32(pb); /* avg packet size */
537 get_be32(pb); /* start time */
538 get_be32(pb); /* preroll */
539 get_be32(pb); /* duration */
540 get_str8(pb, buf, sizeof(buf)); /* desc */
541 get_str8(pb, buf, sizeof(buf)); /* mimetype */
542 codec_data_size = get_be32(pb);
/* remember where the codec data starts so the unread remainder can be
   skipped afterwards */
543 codec_pos = url_ftell(pb);
/* this tag value selects the audio codec info layout */
546 if (v == MKTAG(0xfd, 'a', 'r', '.')) {
548 get_be32(pb); /* version */
549 get_be32(pb); /* .ra4 */
552 get_be32(pb); /* header size */
553 get_be16(pb); /* add codec info */
554 get_be32(pb); /* coded frame size */
555 get_be32(pb); /* ??? */
556 get_be32(pb); /* ??? */
557 get_be32(pb); /* ??? */
558 get_be16(pb); /* 1 */
559 get_be16(pb); /* coded frame size */
561 st->codec.sample_rate = get_be16(pb);
563 st->codec.channels = get_be16(pb);
/* buf is overwritten by the second read, so the comparison below sees
   only the second string */
564 get_str8(pb, buf, sizeof(buf)); /* desc */
565 get_str8(pb, buf, sizeof(buf)); /* desc */
566 st->codec.codec_type = CODEC_TYPE_AUDIO;
/* "dnet" is the codec name the muxer above writes for its audio stream */
567 if (!strcmp(buf, "dnet")) {
568 st->codec.codec_id = CODEC_ID_AC3;
570 st->codec.codec_id = CODEC_ID_NONE;
571 pstrcpy(st->codec.codec_name, sizeof(st->codec.codec_name),
/* video codec info must start with 'VIDO' */
575 if (get_le32(pb) != MKTAG('V', 'I', 'D', 'O')) {
577 fprintf(stderr, "Unsupported video codec\n");
580 st->codec.codec_tag = get_le32(pb);
581 if (st->codec.codec_tag != MKTAG('R', 'V', '1', '0'))
583 st->codec.width = get_be16(pb);
584 st->codec.height = get_be16(pb);
/* the stored rate is scaled by FRAME_RATE_BASE for the codec context */
585 st->codec.frame_rate = get_be16(pb) * FRAME_RATE_BASE;
586 st->codec.codec_type = CODEC_TYPE_VIDEO;
591 /* modification of h263 codec version (!) */
592 h263_hack_version = get_be32(pb);
/* the case labels are not visible in this excerpt; one path accepts the
   version as RV10, another marks the codec as unknown */
593 switch(h263_hack_version) {
597 st->codec.sub_id = h263_hack_version;
598 st->codec.codec_id = CODEC_ID_RV10;
602 st->codec.codec_id = CODEC_ID_NONE;
606 /* skip codec info */
607 size = url_ftell(pb) - codec_pos;
608 url_fskip(pb, codec_data_size - size);
610 case MKTAG('D', 'A', 'T', 'A'):
613 /* unknown tag: skip it */
614 url_fskip(pb, tag_size - 10);
619 rm->nb_packets = get_be32(pb); /* number of packets */
/* a zero packet count with flag bit 4 set (written as "live broadcast"
   by the muxer above) is replaced by 3600 * 25 */
620 if (!rm->nb_packets && (flags & 4))
621 rm->nb_packets = 3600 * 25;
622 get_be32(pb); /* next data header */
/* frees every stream allocated so far; presumably the failure path (its
   label is not visible in this excerpt) */
626 for(i=0;i<s->nb_streams;i++) {
627 av_free(s->streams[i]);
/* Reads a number from pb and returns it assembled from two parts as
   (n << 16) | n1. How n and n1 are read, and how *len is updated, is not
   visible in this excerpt. */
632 static int get_num(ByteIOContext *pb, int *len)
643 return (n << 16) | n1;
/*
 * Demuxer packet step: reads one packet header (timestamp, reserved byte,
 * flags), looks up the matching stream among s->streams, parses the extra
 * video framing bytes when the stream is video, then allocates pkt and
 * reads `len` bytes of payload into it. AC3 payloads get an additional
 * two-bytes-at-a-time pass (body not visible in this excerpt).
 */
647 static int rm_read_packet(AVFormatContext *s, AVPacket *pkt)
649 RMContext *rm = s->priv_data;
650 ByteIOContext *pb = &s->pb;
652 int len, num, timestamp, i, tmp, j;
/* packet counter at zero; the action taken is not visible here */
657 if (rm->nb_packets == 0)
664 timestamp = get_be32(pb);
665 get_byte(pb); /* reserved */
666 flags = get_byte(pb); /* flags */
/* search for the stream this packet belongs to */
671 for(i=0;i<s->nb_streams;i++) {
676 if (i == s->nb_streams) {
677 /* skip packet if unknown number */
682 if (st->codec.codec_type == CODEC_TYPE_VIDEO) {
683 int full_frame, h, pic_num;
/* top two bits of h both set selects the first layout below */
686 if ((h & 0xc0) == 0xc0) {
689 len2= get_num(pb, &len);
690 pos = get_num(pb, &len);
691 //printf("pos:%d\n",len);
694 int seq, frame_size, pos;
697 frame_size = get_num(pb, &len);
698 pos = get_num(pb, &len);
699 //printf("seq:%d, size:%d, pos:%d\n",seq,frame_size,pos);
703 pic_num= get_byte(pb);
705 //XXX/FIXME/HACK, demuxer should be fixed to send complete frames ...
/* a one-entry slice_offset table is allocated on first use.
   NOTE(review): the av_malloc() result is dereferenced two lines below
   without a NULL check. */
706 if(st->codec.slice_offset==NULL)
707 st->codec.slice_offset= (int*)av_malloc(sizeof(int));
708 st->codec.slice_count= full_frame;
709 st->codec.slice_offset[0]= 0;
/* NOTE(review): the return value of av_new_packet() is ignored before
   pkt->data is written to. */
712 av_new_packet(pkt, len);
713 pkt->stream_index = i;
714 get_buffer(pb, pkt->data, len);
716 /* for AC3, needs to swap bytes */
717 if (st->codec.codec_id == CODEC_ID_AC3) {
719 for(j=0;j<len;j+=2) {
/* Presumably the demuxer's close hook -- confirm against rm_iformat.
   The body is not visible in this excerpt. */
729 static int rm_read_close(AVFormatContext *s)
/*
 * Format probe: returns AVPROBE_SCORE_MAX when the probe buffer starts
 * with the bytes '.', 'R', 'M', 'F' followed by two zero bytes.
 * Buffers of 32 bytes or fewer take a separate path whose result is not
 * visible in this excerpt; neither is the result for a non-match.
 */
734 static int rm_probe(AVProbeData *p)
736 /* check file header */
737 if (p->buf_size <= 32)
739 if (p->buf[0] == '.' && p->buf[1] == 'R' &&
740 p->buf[2] == 'M' && p->buf[3] == 'F' &&
741 p->buf[4] == 0 && p->buf[5] == 0)
742 return AVPROBE_SCORE_MAX;
/* Input (demuxer) format descriptor, registered below with
   av_register_input_format(). Its initializer is not visible in this
   excerpt. */
747 static AVInputFormat rm_iformat = {
/* Output (muxer) format descriptor, registered below with
   av_register_output_format(). Only one initializer entry is visible in
   this excerpt. */
757 static AVOutputFormat rm_oformat = {
/* presumably the MIME type entry -- confirm field order */
760 "application/vnd.rn-realmedia",
/* Registers the demuxer and muxer descriptors defined above. The
   enclosing function header is not visible in this excerpt. */
772 av_register_input_format(&rm_iformat);
773 av_register_output_format(&rm_oformat);