2 * MOV, 3GP, MP4 encoder.
3 * Copyright (c) 2003 Thomas Raivio.
4 * Copyright (c) 2004 Gildas Bazin <gbazin at videolan dot org>.
6 * This library is free software; you can redistribute it and/or
7 * modify it under the terms of the GNU Lesser General Public
8 * License as published by the Free Software Foundation; either
9 * version 2 of the License, or (at your option) any later version.
11 * This library is distributed in the hope that it will be useful,
12 * but WITHOUT ANY WARRANTY; without even the implied warranty of
13 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
14 * Lesser General Public License for more details.
16 * You should have received a copy of the GNU Lesser General Public
17 * License along with this library; if not, write to the Free Software
18 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
27 #define MOV_INDEX_CLUSTER_SIZE 16384
28 #define globalTimescale 1000
33 #define MODE_PSP 3 // example working PSP command line:
34 // ffmpeg -i testinput.avi -f psp -r 14.985 -s 320x240 -b 768 -ar 24000 -ab 32 M4V00001.MP4
/*
 * One index entry of a track. Only these members are visible here.
 * NOTE(review): later code reads .entries and .key_frame from cluster
 * elements; presumably they are declared in the part of this struct
 * that is not shown -- confirm.
 */
37 typedef struct MOVIentry {
38 unsigned int flags, pos, size;
39 unsigned int samplesInChunk;
44 typedef struct MOVIndex {
/* Muxer-wide state; holds one MOVTrack slot for each of MAX_STREAMS streams. */
63 typedef struct MOVContext {
70 MOVTrack tracks[MAX_STREAMS];
73 static int mov_write_esds_tag(ByteIOContext *pb, MOVTrack* track);
75 //FIXME support 64bit variant with wide placeholders
/*
 * Patch a 32-bit size field located at offset pos: remember the current
 * write position, seek back to pos, store (current position - pos) as a
 * big-endian 32-bit value, then seek forward again so that writing can
 * continue where it left off. Callers reserve the field beforehand with
 * put_be32(pb, 0).
 */
76 static int updateSize (ByteIOContext *pb, int pos)
78 long curpos = url_ftell(pb);
79 url_fseek(pb, pos, SEEK_SET);
80 put_be32(pb, curpos - pos); /* rewrite size */
81 url_fseek(pb, curpos, SEEK_SET);
86 /* Chunk offset atom */
/*
 * Writes a size placeholder, version/flags, the entry count and then the
 * 32-bit position of every index entry of the track. The size placeholder
 * is filled in by updateSize() and its result is returned.
 */
87 static int mov_write_stco_tag(ByteIOContext *pb, MOVTrack* track)
90 int pos = url_ftell(pb);
91 put_be32(pb, 0); /* size */
93 put_be32(pb, 0); /* version & flags */
94 put_be32(pb, track->entry); /* entry count */
95 for (i=0; i<track->entry; i++) {
/* the index is stored in clusters of MOV_INDEX_CLUSTER_SIZE entries:
 * cl selects the cluster, id the slot inside it */
96 int cl = i / MOV_INDEX_CLUSTER_SIZE;
97 int id = i % MOV_INDEX_CLUSTER_SIZE;
98 put_be32(pb, track->cluster[cl][id].pos);
100 return updateSize (pb, pos);
103 /* Sample size atom */
/*
 * A first pass over the index computes the per-sample size of every entry
 * (entry size divided by its sample count) and sums the sample counts.
 * Two output layouts are visible below: a compact one (one common sample
 * size followed by the sample count) and a table (sample size 0, the
 * sample count, then one size per sample).
 * NOTE(review): the condition selecting between the two layouts is on
 * lines not shown here; presumably the compact form is used when every
 * entry has the same per-sample size -- confirm.
 * NOTE(review): the divisions by .entries have no visible zero guard.
 */
104 static int mov_write_stsz_tag(ByteIOContext *pb, MOVTrack* track)
107 int i, j, entries = 0, tst = -1, oldtst = -1;
109 int pos = url_ftell(pb);
110 put_be32(pb, 0); /* size */
112 put_be32(pb, 0); /* version & flags */
114 for (i=0; i<track->entry; i++) {
115 int cl = i / MOV_INDEX_CLUSTER_SIZE;
116 int id = i % MOV_INDEX_CLUSTER_SIZE;
/* per-sample size of this entry */
117 tst = track->cluster[cl][id].size/track->cluster[cl][id].entries;
/* detects a per-sample size that differs from the previously seen one */
118 if(oldtst != -1 && tst != oldtst) {
122 entries += track->cluster[cl][id].entries;
/* compact layout: the size is taken from the very first index entry */
125 int sSize = track->cluster[0][0].size/track->cluster[0][0].entries;
126 put_be32(pb, sSize); // sample size
127 put_be32(pb, entries); // sample count
/* table layout: sample size 0, then an explicit size for every sample */
130 put_be32(pb, 0); // sample size
131 put_be32(pb, entries); // sample count
132 for (i=0; i<track->entry; i++) {
133 int cl = i / MOV_INDEX_CLUSTER_SIZE;
134 int id = i % MOV_INDEX_CLUSTER_SIZE;
/* every sample of an entry is written with the same averaged size */
135 for ( j=0; j<track->cluster[cl][id].entries; j++) {
136 put_be32(pb, track->cluster[cl][id].size /
137 track->cluster[cl][id].entries);
141 return updateSize (pb, pos);
144 /* Sample to chunk atom */
/*
 * Writes one (first chunk, samples per chunk, sample description index)
 * record each time samplesInChunk differs from the previously written
 * value. The entry count is first written as track->entry and later
 * overwritten with index.
 * NOTE(review): the statement that advances index is not visible here;
 * presumably it counts the records actually written -- confirm.
 */
145 static int mov_write_stsc_tag(ByteIOContext *pb, MOVTrack* track)
147 int index = 0, oldval = -1, i, entryPos, curpos;
149 int pos = url_ftell(pb);
150 put_be32(pb, 0); /* size */
152 put_be32(pb, 0); // version & flags
/* remember where the entry count lives so it can be patched afterwards */
153 entryPos = url_ftell(pb);
154 put_be32(pb, track->entry); // entry count
155 for (i=0; i<track->entry; i++) {
156 int cl = i / MOV_INDEX_CLUSTER_SIZE;
157 int id = i % MOV_INDEX_CLUSTER_SIZE;
158 if(oldval != track->cluster[cl][id].samplesInChunk)
160 put_be32(pb, i+1); // first chunk
161 put_be32(pb, track->cluster[cl][id].samplesInChunk); // samples per chunk
162 put_be32(pb, 0x1); // sample description index
163 oldval = track->cluster[cl][id].samplesInChunk;
/* go back and replace the provisional entry count with index */
167 curpos = url_ftell(pb);
168 url_fseek(pb, entryPos, SEEK_SET);
169 put_be32(pb, index); // rewrite entry count
170 url_fseek(pb, curpos, SEEK_SET);
172 return updateSize (pb, pos);
175 /* Sync sample atom */
/*
 * Walks the index looking for entries whose key_frame member equals 1.
 * The entry count is first written as track->entry and later overwritten
 * with index.
 * NOTE(review): the body of the key_frame branch is not visible here;
 * presumably it writes the sample number and increments index -- confirm.
 */
176 static int mov_write_stss_tag(ByteIOContext *pb, MOVTrack* track)
179 int i, index = 0, entryPos;
180 int pos = url_ftell(pb);
181 put_be32(pb, 0); // size
183 put_be32(pb, 0); // version & flags
/* remember where the entry count lives so it can be patched afterwards */
184 entryPos = url_ftell(pb);
185 put_be32(pb, track->entry); // entry count
186 for (i=0; i<track->entry; i++) {
187 int cl = i / MOV_INDEX_CLUSTER_SIZE;
188 int id = i % MOV_INDEX_CLUSTER_SIZE;
189 if(track->cluster[cl][id].key_frame == 1) {
/* go back and replace the provisional entry count with index */
194 curpos = url_ftell(pb);
195 url_fseek(pb, entryPos, SEEK_SET);
196 put_be32(pb, index); // rewrite entry count
197 url_fseek(pb, curpos, SEEK_SET);
198 return updateSize (pb, pos);
/*
 * Fixed-content box written by mov_write_audio_tag() for CODEC_ID_AMR_NB
 * tracks. The size field is the constant 0x11 and the mode set / mode
 * change period are constants too; an alternative pair of values is kept
 * below as disabled code.
 */
201 static int mov_write_damr_tag(ByteIOContext *pb)
203 put_be32(pb, 0x11); /* size */
208 put_be16(pb, 0x80); /* Mode set (all modes for AMR_NB) */
209 put_be16(pb, 0xa); /* Mode change period (no restriction) */
210 //put_be16(pb, 0x81ff); /* Mode set (all modes for AMR_NB) */
211 //put_be16(pb, 1); /* Mode change period (no restriction) */
/*
 * Container used by mov_write_audio_tag() for AAC tracks in MODE_MOV.
 * It holds several fixed-size children (size fields 12, 12, then the
 * esds box, then 12) and is closed by an 8-byte null tag. The outer size
 * is patched by updateSize().
 * NOTE(review): the tags and payloads of the 12-byte children are on
 * lines not shown here.
 */
215 static int mov_write_wave_tag(ByteIOContext *pb, MOVTrack* track)
217 int pos = url_ftell(pb);
219 put_be32(pb, 0); /* size */
222 put_be32(pb, 12); /* size */
226 put_be32(pb, 12); /* size */
230 mov_write_esds_tag(pb, track);
232 put_be32(pb, 12); /* size */
236 put_be32(pb, 8); /* size */
237 put_be32(pb, 0); /* null tag */
239 return updateSize (pb, pos);
/*
 * Audio codec id to four-character-code table. It is looked up with
 * codec_get_tag() in mov_write_audio_tag() and mov_write_header(); when no
 * entry matches, those callers fall back to codec_wav_tags.
 */
242 const CodecTag codec_movaudio_tags[] = {
243 { CODEC_ID_PCM_MULAW, MKTAG('u', 'l', 'a', 'w') },
244 { CODEC_ID_PCM_ALAW, MKTAG('a', 'l', 'a', 'w') },
245 { CODEC_ID_ADPCM_IMA_QT, MKTAG('i', 'm', 'a', '4') },
246 { CODEC_ID_MACE3, MKTAG('M', 'A', 'C', '3') },
247 { CODEC_ID_MACE6, MKTAG('M', 'A', 'C', '6') },
248 { CODEC_ID_AAC, MKTAG('m', 'p', '4', 'a') },
249 { CODEC_ID_AMR_NB, MKTAG('s', 'a', 'm', 'r') },
250 { CODEC_ID_PCM_S16BE, MKTAG('t', 'w', 'o', 's') },
251 { CODEC_ID_PCM_S16LE, MKTAG('s', 'o', 'w', 't') },
252 { CODEC_ID_MP3, MKTAG('.', 'm', 'p', '3') },
/*
 * Writes the audio sample description entry of a track: the codec tag,
 * the sound description header (version 1 for AAC in MODE_MOV, version 0
 * otherwise) and, depending on the codec, a wave/esds box (AAC) or a damr
 * box (AMR_NB). The size placeholder is patched by updateSize().
 * NOTE(review): the conditions guarding the three tag assignments are on
 * lines not shown; the visible order is codec_tag, then
 * codec_movaudio_tags, then a tag built from codec_wav_tags.
 */
256 static int mov_write_audio_tag(ByteIOContext *pb, MOVTrack* track)
258 int pos = url_ftell(pb);
261 put_be32(pb, 0); /* size */
263 tag = track->enc->codec_tag;
265 tag = codec_get_tag(codec_movaudio_tags, track->enc->codec_id);
266 // if no mac fcc found, try with Microsoft tags
269 int tmp = codec_get_tag(codec_wav_tags, track->enc->codec_id);
/* build an ms-prefixed fourcc from the low 16 bits of the wav tag */
270 tag = MKTAG('m', 's', ((tmp >> 8) & 0xff), (tmp & 0xff));
272 put_le32(pb, tag); // store it byteswapped
274 put_be32(pb, 0); /* Reserved */
275 put_be16(pb, 0); /* Reserved */
276 put_be16(pb, 1); /* Data-reference index, XXX == 1 */
278 /* SoundDescription */
279 if(track->mode == MODE_MOV && track->enc->codec_id == CODEC_ID_AAC)
280 put_be16(pb, 1); /* Version 1 */
282 put_be16(pb, 0); /* Version 0 */
283 put_be16(pb, 0); /* Revision level */
284 put_be32(pb, 0); /* Reserved */
286 put_be16(pb, track->enc->channels); /* Number of channels */
287 /* TODO: Currently hard-coded to 16-bit, there doesn't seem
288 to be a good way to get number of bits of audio */
289 put_be16(pb, 0x10); /* Sample size in bits, fixed at 16 (see TODO above) */
291 if(track->enc->codec_id == CODEC_ID_AAC ||
292 track->enc->codec_id == CODEC_ID_MP3)
294 put_be16(pb, 0xfffe); /* compression ID (vbr)*/
298 put_be16(pb, 0); /* compression ID (= 0) */
300 put_be16(pb, 0); /* packet size (= 0) */
/* NOTE(review): 16-bit field, so a timescale above 65535 is truncated */
301 put_be16(pb, track->timescale); /* Time scale */
302 put_be16(pb, 0); /* Reserved */
304 if(track->mode == MODE_MOV && track->enc->codec_id == CODEC_ID_AAC)
306 /* SoundDescription V1 extended info */
307 put_be32(pb, track->enc->frame_size); /* Samples per packet */
308 put_be32(pb, 1536); /* Bytes per packet */
309 put_be32(pb, 2); /* Bytes per frame */
310 put_be32(pb, 2); /* Bytes per sample */
/* codec specific child boxes */
313 if(track->enc->codec_id == CODEC_ID_AAC) {
314 if( track->mode == MODE_MOV ) mov_write_wave_tag(pb, track);
315 else mov_write_esds_tag(pb, track);
317 if(track->enc->codec_id == CODEC_ID_AMR_NB)
318 mov_write_damr_tag(pb);
319 return updateSize (pb, pos);
/*
 * Fixed-size (0xf) box written by mov_write_video_tag() for CODEC_ID_H263
 * tracks. The payload is on lines not shown here.
 */
322 static int mov_write_d263_tag(ByteIOContext *pb)
324 put_be32(pb, 0xf); /* size */
332 /* TODO: No idea about these values */
/*
 * Box of constants written by mov_write_video_tag() for CODEC_ID_SVQ3
 * tracks. Only two of its 32-bit constants are visible here.
 */
333 static int mov_write_svq3_tag(ByteIOContext *pb)
339 put_be32(pb, 0xe2c0211d);
340 put_be32(pb, 0xc0000000);
/*
 * Selects a result by the magnitude of len, using thresholds 0x80, 0x4000
 * and 0x200000 (7, 14 and 21 bits); these match the length-field widths
 * used by putDescr().
 * NOTE(review): the return statements are on lines not shown; presumably
 * the result is len plus the descriptor header size -- confirm.
 */
345 static unsigned int descrLength(unsigned int len)
347 if (len < 0x00000080)
349 else if (len < 0x00004000)
351 else if(len < 0x00200000)
/*
 * Writes a descriptor header: the tag byte followed by the size encoded
 * in 1 to 4 bytes of 7 bits each. vals[3] carries the lowest 7 bits with
 * the top bit clear (last byte); vals[2], vals[1] and vals[0] carry the
 * higher groups with the top bit set (continuation).
 * NOTE(review): the assignment of len and the shifts between the vals[]
 * stores are on lines not shown.
 * NOTE(review): no branch is visible for size >= 0x10000000, so in that
 * case apparently only the tag byte is written.
 */
357 static void putDescr(ByteIOContext *pb, int tag, int size)
363 vals[3] = (uint8_t)(len & 0x7f);
365 vals[2] = (uint8_t)((len & 0x7f) | 0x80);
367 vals[1] = (uint8_t)((len & 0x7f) | 0x80);
369 vals[0] = (uint8_t)((len & 0x7f) | 0x80);
371 put_byte(pb, tag); // DescriptorTag
/* emit only as many length bytes as the size needs, most significant first */
373 if (size < 0x00000080)
375 put_byte(pb, vals[3]);
377 else if (size < 0x00004000)
379 put_byte(pb, vals[2]);
380 put_byte(pb, vals[3]);
382 else if (size < 0x00200000)
384 put_byte(pb, vals[1]);
385 put_byte(pb, vals[2]);
386 put_byte(pb, vals[3]);
388 else if (size < 0x10000000)
390 put_byte(pb, vals[0]);
391 put_byte(pb, vals[1]);
392 put_byte(pb, vals[2]);
393 put_byte(pb, vals[3]);
/*
 * Writes the esds box: an 0x03 descriptor wrapping a DecoderConfig (0x04)
 * descriptor, an optional DecoderSpecific info (0x05) descriptor holding
 * track->vosData, and a final 0x06 descriptor.
 * In MODE_PSP the vosData pointer of the track is temporarily replaced by
 * one of two built-in byte strings (AAC or MPEG4); the original pointer
 * and length are restored before returning.
 * NOTE(review): the matching vosLen assignments for PSP mode are on lines
 * not shown.
 */
397 static int mov_write_esds_tag(ByteIOContext *pb, MOVTrack* track) // Basic
399 int decoderSpecificInfoLen;
400 int pos = url_ftell(pb);
/* saved so that the PSP override below can be undone */
401 void *vosDataBackup=track->vosData;
402 int vosLenBackup=track->vosLen;
404 // we should be able to have these passed in, via vosData, then we wouldn't need to attack this routine at all
405 static const char PSPAACData[]={0x13,0x10};
406 static const char PSPMP4Data[]={0x00,0x00,0x01,0xB0,0x03,0x00,0x00,0x01,0xB5,0x09,0x00,0x00,0x01,0x00,0x00,0x00,0x01,0x20,0x00,0x84,0x5D,0x4C,0x28,0x50,0x20,0xF0,0xA3,0x1F };
409 if (track->mode == MODE_PSP) // fails on psp if this is not here
411 if (track->enc->codec_id == CODEC_ID_AAC)
414 track->vosData = PSPAACData;
417 if (track->enc->codec_id == CODEC_ID_MPEG4)
420 track->vosData = PSPMP4Data;
/* 0 when there is no decoder specific data to embed */
424 decoderSpecificInfoLen = track->vosLen ? descrLength(track->vosLen):0;
426 put_be32(pb, 0); // size
428 put_be32(pb, 0); // Version
431 putDescr(pb, 0x03, 3 + descrLength(13 + decoderSpecificInfoLen) +
433 put_be16(pb, 0x0001); // ID (= 1)
434 put_byte(pb, 0x00); // flags (= no flags)
436 // DecoderConfig descriptor
437 putDescr(pb, 0x04, 13 + decoderSpecificInfoLen);
439 if(track->enc->codec_id == CODEC_ID_AAC)
440 put_byte(pb, 0x40); // Object type indication
441 else if(track->enc->codec_id == CODEC_ID_MPEG4)
442 put_byte(pb, 0x20); // Object type indication (Visual 14496-2)
444 if(track->enc->codec_type == CODEC_TYPE_AUDIO)
445 put_byte(pb, 0x15); // flags (= Audiostream)
447 put_byte(pb, 0x11); // flags (= Visualstream)
/* 24-bit buffer size written as one byte plus one 16-bit value */
449 put_byte(pb, 0x0); // Buffersize DB (24 bits)
450 put_be16(pb, 0x0dd2); // Buffersize DB
452 // TODO: find real values for these
453 put_be32(pb, track->enc->bit_rate); // maxbitrate
454 put_be32(pb, track->enc->bit_rate); // avg bitrate
458 // DecoderSpecific info descriptor
459 putDescr(pb, 0x05, track->vosLen);
460 put_buffer(pb, track->vosData, track->vosLen);
/* undo the PSP override */
463 track->vosData = vosDataBackup;
464 track->vosLen = vosLenBackup;
467 putDescr(pb, 0x06, 1);
469 return updateSize (pb, pos);
/*
 * Video codec id to four-character-code table. It is looked up with
 * codec_get_tag() in mov_write_video_tag() and mov_write_header(); when no
 * entry matches, those callers fall back to codec_bmp_tags.
 */
472 const CodecTag codec_movvideo_tags[] = {
473 { CODEC_ID_SVQ1, MKTAG('S', 'V', 'Q', '1') },
474 { CODEC_ID_SVQ3, MKTAG('S', 'V', 'Q', '3') },
475 { CODEC_ID_MPEG4, MKTAG('m', 'p', '4', 'v') },
476 { CODEC_ID_H263, MKTAG('s', '2', '6', '3') },
477 { CODEC_ID_DVVIDEO, MKTAG('d', 'v', 'c', ' ') },
/*
 * Writes the video sample description entry of a track: codec tag, vendor,
 * quality hints, dimensions, resolution, a length-prefixed compressor name
 * and a codec specific child box (esds, d263 or svq3). The size
 * placeholder is patched by updateSize().
 * NOTE(review): the conditions guarding the three tag assignments are on
 * lines not shown; the visible order is codec_tag, then
 * codec_movvideo_tags, then codec_bmp_tags.
 */
481 static int mov_write_video_tag(ByteIOContext *pb, MOVTrack* track)
483 int pos = url_ftell(pb);
484 char compressor_name[32];
487 put_be32(pb, 0); /* size */
489 tag = track->enc->codec_tag;
491 tag = codec_get_tag(codec_movvideo_tags, track->enc->codec_id);
492 // if no mac fcc found, try with Microsoft tags
494 tag = codec_get_tag(codec_bmp_tags, track->enc->codec_id);
495 put_le32(pb, tag); // store it byteswapped
497 put_be32(pb, 0); /* Reserved */
498 put_be16(pb, 0); /* Reserved */
499 put_be16(pb, 1); /* Data-reference index */
501 put_be16(pb, 0); /* Codec stream version */
502 put_be16(pb, 0); /* Codec stream revision (=0) */
503 put_tag(pb, "FFMP"); /* Vendor */
504 if(track->enc->codec_id == CODEC_ID_RAWVIDEO) {
505 put_be32(pb, 0); /* Temporal Quality */
506 put_be32(pb, 0x400); /* Spatial Quality = lossless*/
508 put_be32(pb, 0x200); /* Temporal Quality = normal */
509 put_be32(pb, 0x200); /* Spatial Quality = normal */
/* 16-bit fields: only the low 16 bits of width and height are stored */
511 put_be16(pb, track->enc->width); /* Video width */
512 put_be16(pb, track->enc->height); /* Video height */
513 put_be32(pb, 0x00480000); /* Horizontal resolution 72dpi */
514 put_be32(pb, 0x00480000); /* Vertical resolution 72dpi */
515 put_be32(pb, 0); /* Data size (= 0) */
516 put_be16(pb, 1); /* Frame count (= 1) */
/* 32-byte field: one length byte followed by 31 name bytes. The buffer
 * is zeroed first and at most 31 bytes are copied, so it always stays
 * NUL terminated and zero padded. */
518 memset(compressor_name,0,32);
519 if (track->enc->codec && track->enc->codec->name)
520 strncpy(compressor_name,track->enc->codec->name,31);
521 put_byte(pb, strlen(compressor_name));
522 put_buffer(pb, compressor_name, 31);
524 put_be16(pb, 0x18); /* Reserved */
525 put_be16(pb, 0xffff); /* Reserved */
/* codec specific child box, if any */
526 if(track->enc->codec_id == CODEC_ID_MPEG4)
527 mov_write_esds_tag(pb, track);
528 else if(track->enc->codec_id == CODEC_ID_H263)
529 mov_write_d263_tag(pb);
530 else if(track->enc->codec_id == CODEC_ID_SVQ3)
531 mov_write_svq3_tag(pb);
533 return updateSize (pb, pos);
/*
 * Sample description box with exactly one entry: the video description
 * for video tracks, the audio description for audio tracks. For any other
 * codec type no entry body is written although the count is still 1.
 */
536 static int mov_write_stsd_tag(ByteIOContext *pb, MOVTrack* track)
538 int pos = url_ftell(pb);
539 put_be32(pb, 0); /* size */
541 put_be32(pb, 0); /* version & flags */
542 put_be32(pb, 1); /* entry count */
543 if (track->enc->codec_type == CODEC_TYPE_VIDEO)
544 mov_write_video_tag(pb, track);
545 else if (track->enc->codec_type == CODEC_TYPE_AUDIO)
546 mov_write_audio_tag(pb, track);
547 return updateSize(pb, pos);
551 /* Time to sample atom */
/*
 * Fixed-size (0x18) box with a single entry, i.e. every sample of the
 * track is given the same duration track->sampleDuration.
 */
552 static int mov_write_stts_tag(ByteIOContext *pb, MOVTrack* track)
554 put_be32(pb, 0x18); /* size */
556 put_be32(pb, 0); /* version & flags */
557 put_be32(pb, 1); /* entry count */
559 put_be32(pb, track->sampleCount); /* sample count */
560 put_be32(pb, track->sampleDuration); /* sample duration */
/*
 * Fixed-size (28 byte) data reference box holding one 12-byte entry whose
 * version/flags word is 1. Called from mov_write_dinf_tag().
 */
564 static int mov_write_dref_tag(ByteIOContext *pb)
566 put_be32(pb, 28); /* size */
568 put_be32(pb, 0); /* version & flags */
569 put_be32(pb, 1); /* entry count */
571 put_be32(pb, 0xc); /* size */
573 put_be32(pb, 1); /* version & flags */
/*
 * Sample table container: writes stsd, stts, optionally stss, then stsc,
 * stsz and stco in that order and patches its own size afterwards.
 * NOTE(review): stss is written for video tracks only; the second half of
 * that condition is on a line not shown here.
 */
578 static int mov_write_stbl_tag(ByteIOContext *pb, MOVTrack* track)
580 int pos = url_ftell(pb);
581 put_be32(pb, 0); /* size */
583 mov_write_stsd_tag(pb, track);
584 mov_write_stts_tag(pb, track);
585 if (track->enc->codec_type == CODEC_TYPE_VIDEO &&
587 mov_write_stss_tag(pb, track);
588 mov_write_stsc_tag(pb, track);
589 mov_write_stsz_tag(pb, track);
590 mov_write_stco_tag(pb, track);
591 return updateSize(pb, pos);
/* Container whose only visible child is the dref box; size patched at the end. */
594 static int mov_write_dinf_tag(ByteIOContext *pb)
596 int pos = url_ftell(pb);
597 put_be32(pb, 0); /* size */
599 mov_write_dref_tag(pb);
600 return updateSize(pb, pos);
/*
 * Fixed-size (16 byte) media header written by mov_write_minf_tag() for
 * tracks that are not video; all fields are zero.
 */
603 static int mov_write_smhd_tag(ByteIOContext *pb)
605 put_be32(pb, 16); /* size */
607 put_be32(pb, 0); /* version & flags */
608 put_be16(pb, 0); /* reserved (balance, normally = 0) */
609 put_be16(pb, 0); /* reserved */
/*
 * Fixed-size (0x14 byte) media header written by mov_write_minf_tag() for
 * video tracks; version/flags is 1 and the remaining 8 bytes are zero.
 */
613 static int mov_write_vmhd_tag(ByteIOContext *pb)
615 put_be32(pb, 0x14); /* size (always 0x14) */
617 put_be32(pb, 0x01); /* version & flags */
618 put_be64(pb, 0); /* reserved (graphics mode = copy) */
/*
 * Handler box. With track == NULL a data handler is described, otherwise
 * a video or sound handler depending on the codec type of the track.
 * The description string is written with a one-byte length prefix.
 * NOTE(review): the assignments of hdlr and hdlr_type for the individual
 * cases are mostly on lines not shown here.
 */
622 static int mov_write_hdlr_tag(ByteIOContext *pb, MOVTrack* track)
624 char *descr, *hdlr, *hdlr_type;
625 int pos = url_ftell(pb);
627 if (!track) { /* no media --> data handler */
630 descr = "DataHandler";
/* the four-byte handler field is all zero bytes outside MODE_MOV */
632 hdlr = (track->mode == MODE_MOV) ? "mhlr" : "\0\0\0\0";
633 if (track->enc->codec_type == CODEC_TYPE_VIDEO) {
635 descr = "VideoHandler";
638 descr = "SoundHandler";
642 put_be32(pb, 0); /* size */
644 put_be32(pb, 0); /* Version & flags */
/* put_buffer with an explicit length because hdlr may contain NUL bytes */
645 put_buffer(pb, hdlr, 4); /* handler */
646 put_tag(pb, hdlr_type); /* handler type */
647 put_be32(pb ,0); /* reserved */
648 put_be32(pb ,0); /* reserved */
649 put_be32(pb ,0); /* reserved */
650 put_byte(pb, strlen(descr)); /* string counter */
651 put_buffer(pb, descr, strlen(descr)); /* handler description */
652 return updateSize(pb, pos);
/*
 * Media information container: a video or sound media header, a data
 * handler box (MODE_MOV only), then the dinf and stbl boxes. The size is
 * patched at the end.
 */
655 static int mov_write_minf_tag(ByteIOContext *pb, MOVTrack* track)
657 int pos = url_ftell(pb);
658 put_be32(pb, 0); /* size */
660 if(track->enc->codec_type == CODEC_TYPE_VIDEO)
661 mov_write_vmhd_tag(pb);
663 mov_write_smhd_tag(pb);
664 if (track->mode == MODE_MOV) /* FIXME: Why do it for MODE_MOV only ? */
/* NULL track selects the data handler variant of the hdlr box */
665 mov_write_hdlr_tag(pb, NULL);
666 mov_write_dinf_tag(pb);
667 mov_write_stbl_tag(pb, track);
668 return updateSize(pb, pos);
/*
 * Fixed-size (32 byte) media header. Creation and modification time are
 * both track->time; timescale and duration are the per-track values, the
 * duration being expressed in track timescale units.
 */
671 static int mov_write_mdhd_tag(ByteIOContext *pb, MOVTrack* track)
673 put_be32(pb, 32); /* size */
675 put_be32(pb, 0); /* Version & flags */
676 put_be32(pb, track->time); /* creation time */
677 put_be32(pb, track->time); /* modification time */
678 put_be32(pb, track->timescale); /* time scale (sample rate for audio) */
679 put_be32(pb, track->trackDuration); /* duration */
680 put_be16(pb, 0); /* language, 0 = english */
681 put_be16(pb, 0); /* reserved (quality) */
/* Media container: writes mdhd, hdlr and minf for the track, then patches its size. */
685 static int mov_write_mdia_tag(ByteIOContext *pb, MOVTrack* track)
687 int pos = url_ftell(pb);
688 put_be32(pb, 0); /* size */
690 mov_write_mdhd_tag(pb, track);
691 mov_write_hdlr_tag(pb, track);
692 mov_write_minf_tag(pb, track);
693 return updateSize(pb, pos);
/*
 * Fixed-size (0x5c byte) track header. The duration is converted from
 * track timescale units to globalTimescale units. Volume is written for
 * audio tracks; width and height are written for video tracks as 16.16
 * fixed point, the width being scaled by the sample aspect ratio.
 * NOTE(review): the division by track->timescale has no visible zero
 * guard.
 */
696 static int mov_write_tkhd_tag(ByteIOContext *pb, MOVTrack* track)
698 int64_t maxTrackLenTemp;
699 put_be32(pb, 0x5c); /* size (always 0x5c) */
701 put_be32(pb, 0xf); /* version & flags (track enabled) */
702 put_be32(pb, track->time); /* creation time */
703 put_be32(pb, track->time); /* modification time */
704 put_be32(pb, track->trackID); /* track-id */
705 put_be32(pb, 0); /* reserved */
/* 64-bit intermediate so that the multiplication cannot overflow int */
706 maxTrackLenTemp = ((int64_t)globalTimescale*(int64_t)track->trackDuration)/(int64_t)track->timescale;
707 put_be32(pb, (long)maxTrackLenTemp); /* duration */
709 put_be32(pb, 0); /* reserved */
710 put_be32(pb, 0); /* reserved */
711 put_be32(pb, 0x0); /* reserved (Layer & Alternate group) */
712 /* Volume, only for audio */
713 if(track->enc->codec_type == CODEC_TYPE_AUDIO)
714 put_be16(pb, 0x0100);
717 put_be16(pb, 0); /* reserved */
719 /* Matrix structure */
/* the nine values below are written as constants: 0x00010000 on the first
 * two diagonal positions, 0x40000000 in the last one, zero elsewhere */
720 put_be32(pb, 0x00010000); /* reserved */
721 put_be32(pb, 0x0); /* reserved */
722 put_be32(pb, 0x0); /* reserved */
723 put_be32(pb, 0x0); /* reserved */
724 put_be32(pb, 0x00010000); /* reserved */
725 put_be32(pb, 0x0); /* reserved */
726 put_be32(pb, 0x0); /* reserved */
727 put_be32(pb, 0x0); /* reserved */
728 put_be32(pb, 0x40000000); /* reserved */
730 /* Track width and height, for visual only */
731 if(track->enc->codec_type == CODEC_TYPE_VIDEO) {
732 double sample_aspect_ratio = av_q2d(track->enc->sample_aspect_ratio);
/* an unset (zero) aspect ratio is treated as 1 */
733 if( !sample_aspect_ratio ) sample_aspect_ratio = 1;
734 put_be32(pb, sample_aspect_ratio * track->enc->width*0x10000);
735 put_be32(pb, track->enc->height*0x10000);
744 // This box seems important for the psp playback ... without it the movie seems to hang
/*
 * Fixed-size (0x24 byte) edit box containing one 0x1c byte child. The
 * duration is the track duration converted to globalTimescale units, as
 * in mov_write_tkhd_tag(). Written by mov_write_trak_tag() in MODE_PSP.
 * NOTE(review): the division by track->timescale has no visible zero
 * guard.
 */
745 static int mov_write_edts_tag(ByteIOContext *pb, MOVTrack *track)
747 int64_t maxTrackLenTemp;
748 put_be32(pb, 0x24); /* size */
750 put_be32(pb, 0x1c); /* size */
755 maxTrackLenTemp = ((int64_t)globalTimescale*(int64_t)track->trackDuration)/(int64_t)track->timescale;
756 put_be32(pb, (long)maxTrackLenTemp); /* duration ... doesn't seem to affect psp */
759 put_be32(pb, 0x00010000);
763 // goes at the end of each track! ... Critical for PSP playback ("Incompatible data" without it)
/*
 * Constant-content box of declared size 0x34 written by
 * mov_write_trak_tag() in MODE_PSP. The three 32-bit identifier words are
 * the same ones written by mov_write_uuidprof_tag(). The mov parameter is
 * not read by any visible line.
 */
764 static int mov_write_uuid_tag_psp(ByteIOContext *pb, MOVTrack *mov)
766 put_be32(pb, 0x34); /* size ... reports as 28 in mp4box! */
769 put_be32(pb, 0x21d24fce);
770 put_be32(pb, 0xbb88695c);
771 put_be32(pb, 0xfac9c740);
772 put_be32(pb, 0x1c); // another size here!
774 put_be32(pb, 0x00010012);
776 put_be32(pb, 0x55c40000);
/*
 * Track container: tkhd, then mdia. In MODE_PSP an edts box is inserted
 * before mdia and a uuid box is appended after it. The size is patched
 * at the end.
 */
782 static int mov_write_trak_tag(ByteIOContext *pb, MOVTrack* track)
784 int pos = url_ftell(pb);
785 put_be32(pb, 0); /* size */
787 mov_write_tkhd_tag(pb, track);
788 if (track->mode == MODE_PSP)
789 mov_write_edts_tag(pb, track); // PSP Movies require edts box
790 mov_write_mdia_tag(pb, track);
791 if (track->mode == MODE_PSP)
792 mov_write_uuid_tag_psp(pb,track); // PSP Movies require this uuid box
793 return updateSize(pb, pos);
796 /* TODO: Not sorted out, but not necessary either */
/*
 * Constant-content box of declared size 0x15. The only visible reference
 * to it, in mov_write_moov_tag(), is commented out. The mov parameter is
 * not read by any visible line.
 */
797 static int mov_write_iods_tag(ByteIOContext *pb, MOVContext *mov)
799 put_be32(pb, 0x15); /* size */
801 put_be32(pb, 0); /* version & flags */
802 put_be16(pb, 0x1007);
804 put_be16(pb, 0x4fff);
805 put_be16(pb, 0xfffe);
806 put_be16(pb, 0x01ff);
/*
 * Fixed-size (0x6c byte) movie header. Scans all track slots that have at
 * least one entry to find the longest track duration (converted to
 * globalTimescale units) and the highest track id; the next track id
 * field is that maximum plus one.
 * NOTE(review): maxTrackLen is an int while the converted duration is
 * 64 bit, so the assignment narrows the value.
 * NOTE(review): the division by the track timescale has no visible zero
 * guard.
 */
810 static int mov_write_mvhd_tag(ByteIOContext *pb, MOVContext *mov)
812 int maxTrackID = 1, maxTrackLen = 0, i;
813 int64_t maxTrackLenTemp;
815 put_be32(pb, 0x6c); /* size (always 0x6c) */
817 put_be32(pb, 0); /* version & flags */
818 put_be32(pb, mov->time); /* creation time */
819 put_be32(pb, mov->time); /* modification time */
820 put_be32(pb, mov->timescale); /* timescale */
821 for (i=0; i<MAX_STREAMS; i++) {
/* slots without entries are unused tracks */
822 if(mov->tracks[i].entry > 0) {
823 maxTrackLenTemp = ((int64_t)globalTimescale*(int64_t)mov->tracks[i].trackDuration)/(int64_t)mov->tracks[i].timescale;
824 if(maxTrackLen < maxTrackLenTemp)
825 maxTrackLen = maxTrackLenTemp;
826 if(maxTrackID < mov->tracks[i].trackID)
827 maxTrackID = mov->tracks[i].trackID;
830 put_be32(pb, maxTrackLen); /* duration of longest track */
832 put_be32(pb, 0x00010000); /* reserved (preferred rate) 1.0 = normal */
833 put_be16(pb, 0x0100); /* reserved (preferred volume) 1.0 = normal */
834 put_be16(pb, 0); /* reserved */
835 put_be32(pb, 0); /* reserved */
836 put_be32(pb, 0); /* reserved */
838 /* Matrix structure */
/* same nine constants as written in mov_write_tkhd_tag() */
839 put_be32(pb, 0x00010000); /* reserved */
840 put_be32(pb, 0x0); /* reserved */
841 put_be32(pb, 0x0); /* reserved */
842 put_be32(pb, 0x0); /* reserved */
843 put_be32(pb, 0x00010000); /* reserved */
844 put_be32(pb, 0x0); /* reserved */
845 put_be32(pb, 0x0); /* reserved */
846 put_be32(pb, 0x0); /* reserved */
847 put_be32(pb, 0x40000000); /* reserved */
849 put_be32(pb, 0); /* reserved (preview time) */
850 put_be32(pb, 0); /* reserved (preview duration) */
851 put_be32(pb, 0); /* reserved (poster time) */
852 put_be32(pb, 0); /* reserved (selection time) */
853 put_be32(pb, 0); /* reserved (selection duration) */
854 put_be32(pb, 0); /* reserved (current time) */
855 put_be32(pb, maxTrackID+1); /* Next track id */
/*
 * Handler box written inside the meta box by mov_write_meta_tag().
 * Only the size placeholder and the final size patch are visible here;
 * the payload is on lines not shown.
 */
859 static int mov_write_itunes_hdlr_tag(ByteIOContext *pb, MOVContext* mov,
862 int pos = url_ftell(pb);
863 put_be32(pb, 0); /* size */
872 return updateSize(pb, pos);
875 /* helper function to write a data tag with the specified string as data */
/*
 * The string is written with put_buffer() using strlen(data), i.e.
 * without a terminating NUL, so data must not be NULL. Returns the result
 * of updateSize() for this box.
 * NOTE(review): the tag and the header words written between the size
 * placeholder and the string are on lines not shown here.
 */
876 static int mov_write_string_data_tag(ByteIOContext *pb, MOVContext* mov,
877 AVFormatContext *s, const char *data)
879 int pos = url_ftell(pb);
880 put_be32(pb, 0); /* size */
884 put_buffer(pb, data, strlen(data));
885 return updateSize(pb, pos);
888 /* iTunes name of the song/movie */
/*
 * Wraps s->title in a string data tag inside a box tagged with 0xA9
 * (octal 251) followed by nam.
 * NOTE(review): the guard deciding whether the box is written at all is
 * on a line not shown here.
 */
889 static int mov_write_nam_tag(ByteIOContext *pb, MOVContext* mov,
894 int pos = url_ftell(pb);
895 put_be32(pb, 0); /* size */
896 put_tag(pb, "\251nam");
897 mov_write_string_data_tag(pb, mov, s, s->title);
898 size = updateSize(pb, pos);
903 /* iTunes name of the artist/performer */
/* Written only when s->author is a non-empty string. */
904 static int mov_write_ART_tag(ByteIOContext *pb, MOVContext* mov,
908 if ( s->author[0] ) {
909 int pos = url_ftell(pb);
910 put_be32(pb, 0); /* size */
911 put_tag(pb, "\251ART");
912 // we use the author here as this is the only thing that we have...
913 mov_write_string_data_tag(pb, mov, s, s->author);
914 size = updateSize(pb, pos);
919 /* iTunes name of the writer */
/*
 * Written only when s->author is a non-empty string; the same author
 * string is used as for the artist box.
 */
920 static int mov_write_wrt_tag(ByteIOContext *pb, MOVContext* mov,
924 if ( s->author[0] ) {
925 int pos = url_ftell(pb);
926 put_be32(pb, 0); /* size */
927 put_tag(pb, "\251wrt");
928 mov_write_string_data_tag(pb, mov, s, s->author);
929 size = updateSize(pb, pos);
934 /* iTunes name of the album */
/*
 * Wraps s->album in a string data tag.
 * NOTE(review): the guard deciding whether the box is written at all is
 * on a line not shown here.
 */
935 static int mov_write_alb_tag(ByteIOContext *pb, MOVContext* mov,
940 int pos = url_ftell(pb);
941 put_be32(pb, 0); /* size */
942 put_tag(pb, "\251alb");
943 mov_write_string_data_tag(pb, mov, s, s->album);
944 size = updateSize(pb, pos);
/*
 * Year box: s->year is formatted as a zero padded decimal number of at
 * least four digits; snprintf limits the result to four characters plus
 * the terminator, so longer values are truncated.
 * NOTE(review): the declaration of year and the guard deciding whether
 * the box is written are on lines not shown here.
 */
950 static int mov_write_day_tag(ByteIOContext *pb, MOVContext* mov,
956 int pos = url_ftell(pb);
957 put_be32(pb, 0); /* size */
958 put_tag(pb, "\251day");
959 snprintf(year, 5, "%04d", s->year);
960 mov_write_string_data_tag(pb, mov, s, year);
961 size = updateSize(pb, pos);
966 /* iTunes tool used to create the file */
/* Always written; the string is the LIBAVFORMAT_IDENT constant. */
967 static int mov_write_too_tag(ByteIOContext *pb, MOVContext* mov,
970 int pos = url_ftell(pb);
971 put_be32(pb, 0); /* size */
972 put_tag(pb, "\251too");
973 mov_write_string_data_tag(pb, mov, s, LIBAVFORMAT_IDENT);
974 return updateSize(pb, pos);
/* Comment box; written only when s->comment is a non-empty string. */
978 static int mov_write_cmt_tag(ByteIOContext *pb, MOVContext* mov,
982 if ( s->comment[0] ) {
983 int pos = url_ftell(pb);
984 put_be32(pb, 0); /* size */
985 put_tag(pb, "\251cmt");
986 mov_write_string_data_tag(pb, mov, s, s->comment);
987 size = updateSize(pb, pos);
992 /* iTunes custom genre */
/*
 * Wraps s->genre in a string data tag.
 * NOTE(review): the guard deciding whether the box is written at all is
 * on a line not shown here.
 */
993 static int mov_write_gen_tag(ByteIOContext *pb, MOVContext* mov,
998 int pos = url_ftell(pb);
999 put_be32(pb, 0); /* size */
1000 put_tag(pb, "\251gen");
1001 mov_write_string_data_tag(pb, mov, s, s->genre);
1002 size = updateSize(pb, pos);
1007 /* iTunes track number */
/*
 * Outer trkn box containing one data box. The data payload stores
 * s->track as a 16-bit value; the total track number is always written
 * as 0. Two variables named pos are declared: the second one belongs to
 * the data box and is used for the first updateSize() call.
 * NOTE(review): the braces that scope the second pos and the guard
 * deciding whether the box is written are on lines not shown here.
 */
1008 static int mov_write_trkn_tag(ByteIOContext *pb, MOVContext* mov,
1013 int pos = url_ftell(pb);
1014 put_be32(pb, 0); /* size */
1015 put_tag(pb, "trkn");
1017 int pos = url_ftell(pb);
1018 put_be32(pb, 0); /* size */
1019 put_tag(pb, "data");
1020 put_be32(pb, 0); // 8 bytes empty
1022 put_be16(pb, 0); // empty
1023 put_be16(pb, s->track); // track number
1024 put_be16(pb, 0); // total track number
1025 put_be16(pb, 0); // empty
1026 updateSize(pb, pos);
1028 size = updateSize(pb, pos);
1033 /* iTunes meta data list */
/*
 * Container that calls every individual metadata writer in a fixed order.
 * The return values of the child writers are ignored; the size of the
 * list is patched at the end.
 */
1034 static int mov_write_ilst_tag(ByteIOContext *pb, MOVContext* mov,
1037 int pos = url_ftell(pb);
1038 put_be32(pb, 0); /* size */
1039 put_tag(pb, "ilst");
1040 mov_write_nam_tag(pb, mov, s);
1041 mov_write_ART_tag(pb, mov, s);
1042 mov_write_wrt_tag(pb, mov, s);
1043 mov_write_alb_tag(pb, mov, s);
1044 mov_write_day_tag(pb, mov, s);
1045 mov_write_too_tag(pb, mov, s);
1046 mov_write_cmt_tag(pb, mov, s);
1047 mov_write_gen_tag(pb, mov, s);
1048 mov_write_trkn_tag(pb, mov, s);
1049 return updateSize(pb, pos);
1052 /* iTunes meta data tag */
/*
 * Writes the meta box (handler box plus metadata list) only when at least
 * one of title, author, album, year, comment, genre or track is set in
 * the format context.
 */
1053 static int mov_write_meta_tag(ByteIOContext *pb, MOVContext* mov,
1058 // only save meta tag if required
1059 if ( s->title[0] || s->author[0] || s->album[0] || s->year ||
1060 s->comment[0] || s->genre[0] || s->track ) {
1061 int pos = url_ftell(pb);
1062 put_be32(pb, 0); /* size */
1063 put_tag(pb, "meta");
1065 mov_write_itunes_hdlr_tag(pb, mov, s);
1066 mov_write_ilst_tag(pb, mov, s);
1067 size = updateSize(pb, pos);
/*
 * User data container. Writes the iTunes meta box, then a series of
 * classic user data items, each one being a size placeholder, a tag, a
 * 16-bit string length and the string bytes:
 *   - a requirements item when a track with entries uses AAC or MPEG4,
 *   - an encoder item unless CODEC_FLAG_BITEXACT is set on track 0,
 *   - title, author and comment items.
 * Each item declares its own pos that shadows the outer one.
 * NOTE(review): the guards around the title/author/comment items, the
 * braces scoping the inner pos variables and one statement inside each
 * item are on lines not shown here.
 * NOTE(review): the author string is written under the day tag while the
 * aut tag is commented out -- confirm that this is intended.
 */
1072 static int mov_write_udta_tag(ByteIOContext *pb, MOVContext* mov,
1075 int pos = url_ftell(pb);
1078 put_be32(pb, 0); /* size */
1079 put_tag(pb, "udta");
1081 /* iTunes meta data */
1082 mov_write_meta_tag(pb, mov, s);
1085 for (i=0; i<MAX_STREAMS; i++) {
1086 if(mov->tracks[i].entry <= 0) continue;
1087 if (mov->tracks[i].enc->codec_id == CODEC_ID_AAC ||
1088 mov->tracks[i].enc->codec_id == CODEC_ID_MPEG4) {
1089 int pos = url_ftell(pb);
1090 put_be32(pb, 0); /* size */
1091 put_tag(pb, "\251req");
/* sizeof minus one gives the literal length without the terminator */
1092 put_be16(pb, sizeof("QuickTime 6.0 or greater") - 1);
1094 put_buffer(pb, "QuickTime 6.0 or greater",
1095 sizeof("QuickTime 6.0 or greater") - 1);
1096 updateSize(pb, pos);
/* the encoder string is left out in bit-exact mode */
1102 if(mov->tracks[0].enc && !(mov->tracks[0].enc->flags & CODEC_FLAG_BITEXACT))
1104 int pos = url_ftell(pb);
1105 put_be32(pb, 0); /* size */
1106 put_tag(pb, "\251enc");
1107 put_be16(pb, sizeof(LIBAVFORMAT_IDENT) - 1); /* string length */
1109 put_buffer(pb, LIBAVFORMAT_IDENT, sizeof(LIBAVFORMAT_IDENT) - 1);
1110 updateSize(pb, pos);
1115 int pos = url_ftell(pb);
1116 put_be32(pb, 0); /* size */
1117 put_tag(pb, "\251nam");
1118 put_be16(pb, strlen(s->title)); /* string length */
1120 put_buffer(pb, s->title, strlen(s->title));
1121 updateSize(pb, pos);
1126 int pos = url_ftell(pb);
1127 put_be32(pb, 0); /* size */
1128 put_tag(pb, /*"\251aut"*/ "\251day" );
1129 put_be16(pb, strlen(s->author)); /* string length */
1131 put_buffer(pb, s->author, strlen(s->author));
1132 updateSize(pb, pos);
1137 int pos = url_ftell(pb);
1138 put_be32(pb, 0); /* size */
1139 put_tag(pb, "\251des");
1140 put_be16(pb, strlen(s->comment)); /* string length */
1142 put_buffer(pb, s->comment, strlen(s->comment));
1143 updateSize(pb, pos);
1146 return updateSize(pb, pos);
/*
 * Movie container. First derives the timing fields of every track that
 * has entries:
 *   - video: timescale = frame_rate, sample duration = frame_rate_base,
 *   - AMR_NB audio: timescale 8000, sample duration 160,
 *   - other audio: timescale = sample_rate, sample duration = frame_size,
 * then the track duration (sampleCount * sampleDuration), the creation
 * time and the track id (slot index + 1). Afterwards writes mvhd, one
 * trak per used slot and the udta box, and patches its own size.
 */
1149 static int mov_write_moov_tag(ByteIOContext *pb, MOVContext *mov,
1153 pos = url_ftell(pb);
1154 put_be32(pb, 0); /* size placeholder*/
1155 put_tag(pb, "moov");
1156 mov->timescale = globalTimescale;
1158 for (i=0; i<MAX_STREAMS; i++) {
/* slots without entries are unused tracks */
1159 if(mov->tracks[i].entry <= 0) continue;
1161 if(mov->tracks[i].enc->codec_type == CODEC_TYPE_VIDEO) {
1162 mov->tracks[i].timescale = mov->tracks[i].enc->frame_rate;
1163 mov->tracks[i].sampleDuration = mov->tracks[i].enc->frame_rate_base;
1165 else if(mov->tracks[i].enc->codec_type == CODEC_TYPE_AUDIO) {
1166 /* If AMR, track timescale = 8000, AMR_WB = 16000 */
1167 if(mov->tracks[i].enc->codec_id == CODEC_ID_AMR_NB) {
/* NOTE(review): the original remark says bytes, but the value is stored
 * as the sample duration in timescale units */
1168 mov->tracks[i].sampleDuration = 160; // Bytes per chunk
1169 mov->tracks[i].timescale = 8000;
1172 mov->tracks[i].timescale = mov->tracks[i].enc->sample_rate;
1173 mov->tracks[i].sampleDuration = mov->tracks[i].enc->frame_size;
1177 mov->tracks[i].trackDuration =
1178 mov->tracks[i].sampleCount * mov->tracks[i].sampleDuration;
1179 mov->tracks[i].time = mov->time;
1180 mov->tracks[i].trackID = i+1;
1183 mov_write_mvhd_tag(pb, mov);
1184 //mov_write_iods_tag(pb, mov);
1185 for (i=0; i<MAX_STREAMS; i++) {
1186 if(mov->tracks[i].entry > 0) {
1187 mov_write_trak_tag(pb, &(mov->tracks[i]));
1191 mov_write_udta_tag(pb, mov, s);
1193 return updateSize(pb, pos);
/*
 * Starts the mdat box: records its file offset in mov->mdat_pos and
 * writes a zero size placeholder followed by the tag. The placeholder is
 * not patched by any line visible here.
 */
1196 int mov_write_mdat_tag(ByteIOContext *pb, MOVContext* mov)
1198 mov->mdat_pos = url_ftell(pb);
1199 put_be32(pb, 0); /* size placeholder*/
1200 put_tag(pb, "mdat");
1204 /* TODO: This needs to be more general */
/*
 * Fixed-size (0x14 byte) ftyp box: a brand tag, the constant 0x200 and a
 * second brand tag. For 3GP, 3G2 and PSP mode both tags are identical;
 * in every other mode the first is isom and the second is mp41.
 */
1205 int mov_write_ftyp_tag(ByteIOContext *pb, AVFormatContext *s)
1207 MOVContext *mov = s->priv_data;
1209 put_be32(pb, 0x14 ); /* size */
1210 put_tag(pb, "ftyp");
1212 if ( mov->mode == MODE_3GP )
1213 put_tag(pb, "3gp4");
1214 else if ( mov->mode == MODE_3G2 )
1215 put_tag(pb, "3g2a");
1216 else if ( mov->mode == MODE_PSP )
1217 put_tag(pb, "MSNV");
1219 put_tag(pb, "isom");
1221 put_be32(pb, 0x200 );
1223 if ( mov->mode == MODE_3GP )
1224 put_tag(pb, "3gp4");
1225 else if ( mov->mode == MODE_3G2 )
1226 put_tag(pb, "3g2a");
1227 else if ( mov->mode == MODE_PSP )
1228 put_tag(pb, "MSNV");
1230 put_tag(pb, "mp41");
/*
 * PSP profile box (declared size 0x94) with three sections: FPRF, APRF
 * (audio) and VPRF (video). The audio sample rate is read from stream 1;
 * the frame rate (as 16.16 fixed point), width and height are read from
 * stream 0.
 * NOTE(review): the stream order is assumed, not checked; the caller only
 * verifies that there are exactly two streams.
 * NOTE(review): the frame rate computation divides by frame_rate_base
 * without a visible zero guard, and frame_rate * 0x10000 is evaluated in
 * int.
 */
1235 static void mov_write_uuidprof_tag(ByteIOContext *pb, AVFormatContext *s)
1237 int AudioRate = s->streams[1]->codec.sample_rate;
1238 int FrameRate = ((s->streams[0]->codec.frame_rate) * (0x10000))/ (s->streams[0]->codec.frame_rate_base);
1240 //printf("audiorate = %d\n",AudioRate);
1241 //printf("framerate = %d / %d = 0x%x\n",s->streams[0]->codec.frame_rate,s->streams[0]->codec.frame_rate_base,FrameRate);
1243 put_be32(pb, 0x94 ); /* size */
1244 put_tag(pb, "uuid");
1245 put_tag(pb, "PROF");
1247 put_be32(pb, 0x21d24fce ); /* 96 bit UUID */
1248 put_be32(pb, 0xbb88695c );
1249 put_be32(pb, 0xfac9c740 );
1251 put_be32(pb, 0x0 ); /* ? */
1252 put_be32(pb, 0x3 ); /* 3 sections ? */
1254 put_be32(pb, 0x14 ); /* size */
1255 put_tag(pb, "FPRF");
1256 put_be32(pb, 0x0 ); /* ? */
1257 put_be32(pb, 0x0 ); /* ? */
1258 put_be32(pb, 0x0 ); /* ? */
1260 put_be32(pb, 0x2c ); /* size */
1261 put_tag(pb, "APRF"); /* audio */
1264 put_tag(pb, "mp4a");
1265 put_be32(pb, 0x20f );
1267 put_be32(pb, 0x40 );
1268 put_be32(pb, 0x40 );
1269 put_be32(pb, AudioRate ); //24000 ... audio rate?
1272 put_be32(pb, 0x34 ); /* size */
1273 put_tag(pb, "VPRF"); /* video */
1276 put_tag(pb, "mp4v");
1277 put_be32(pb, 0x103 );
1279 put_be32(pb, 0xc0 );
1280 put_be32(pb, 0xc0 );
/* the frame rate is written twice */
1281 put_be32(pb, FrameRate); // was 0xefc29
1282 put_be32(pb, FrameRate ); // was 0xefc29
1283 put_be16(pb, s->streams[0]->codec.width);
1284 put_be16(pb, s->streams[0]->codec.height);
1285 put_be32(pb, 0x010001 );
/*
 * Muxer header callback.
 *
 * 1. Checks every video/audio stream's codec id against the MOV tag tables,
 *    falling back to the MS (BMP/WAV) tag tables and logging a warning when
 *    only the MS tag exists.
 * 2. Selects the container mode from s->oformat->name (MP4 is the default).
 * 3. Writes the "ftyp" atom for 3GP, 3G2, MP4 and PSP modes, and the PSP
 *    "PROF" uuid atom for PSP mode.
 * 4. Copies the mode into every track slot and flushes the output.
 *
 * s: muxer context; s->priv_data is the MOVContext.
 */
1288 static int mov_write_header(AVFormatContext *s)
1290 ByteIOContext *pb = &s->pb;
1291 MOVContext *mov = s->priv_data;
1294 for(i=0; i<s->nb_streams; i++){
1295 AVCodecContext *c= &s->streams[i]->codec;
/* NOTE(review): a codec found in neither the MOV nor the MS table is
 * presumably rejected with an error return -- confirm. */
1297 if (c->codec_type == CODEC_TYPE_VIDEO){
1298 if (!codec_get_tag(codec_movvideo_tags, c->codec_id)){
1299 if(!codec_get_tag(codec_bmp_tags, c->codec_id))
1302 av_log(s, AV_LOG_INFO, "Warning, using MS style video codec tag, the file may be unplayable!\n");
1304 }else if(c->codec_type == CODEC_TYPE_AUDIO){
1305 if (!codec_get_tag(codec_movaudio_tags, c->codec_id)){
1306 if(!codec_get_tag(codec_wav_tags, c->codec_id))
1309 av_log(s, AV_LOG_INFO, "Warning, using MS style audio codec tag, the file may be unplayable!\n");
1314 /* Default mode == MP4 */
1315 mov->mode = MODE_MP4;
/* The output format's short name picks the container flavour. */
1317 if (s->oformat != NULL) {
1318 if (!strcmp("3gp", s->oformat->name)) mov->mode = MODE_3GP;
1319 else if (!strcmp("3g2", s->oformat->name)) mov->mode = MODE_3G2;
1320 else if (!strcmp("mov", s->oformat->name)) mov->mode = MODE_MOV;
1321 else if (!strcmp("psp", s->oformat->name)) mov->mode = MODE_PSP;
/* Every mode except MODE_MOV gets an "ftyp" atom. */
1323 if ( mov->mode == MODE_3GP || mov->mode == MODE_3G2 ||
1324 mov->mode == MODE_MP4 || mov->mode == MODE_PSP )
1325 mov_write_ftyp_tag(pb,s);
/* NOTE(review): the "ftyp" atom has already been written when the stream
 * count check below fails. Only the number of streams is checked, while
 * mov_write_uuidprof_tag() reads streams[0] as video and streams[1] as
 * audio -- confirm whether stream order/type needs validating too. */
1326 if ( mov->mode == MODE_PSP ) {
1327 if ( s->nb_streams != 2 ) {
1328 av_log(s, AV_LOG_ERROR, "PSP mode need one video and one audio stream\n");
1331 mov_write_uuidprof_tag(pb,s);
/* Propagate the mode to all MAX_STREAMS track slots, used or not. */
1335 for (i=0; i<MAX_STREAMS; i++) {
1336 mov->tracks[i].mode = mov->mode;
1339 put_flush_packet(pb);
/*
 * Muxer packet callback: append one packet's payload to the output and
 * record an index entry (file position, size, sample count, key-frame flag)
 * for it in the packet's track.
 *
 * Returns 0 without writing anything when the output is streamed (the
 * muxer cannot handle that) or when the packet is empty.
 *
 * s:   muxer context; s->priv_data is the MOVContext.
 * pkt: packet to write; pkt->stream_index selects both the stream and the
 *      track slot.
 */
1344 static int mov_write_packet(AVFormatContext *s, AVPacket *pkt)
1346 MOVContext *mov = s->priv_data;
1347 ByteIOContext *pb = &s->pb;
1348 AVCodecContext *enc = &s->streams[pkt->stream_index]->codec;
1349 MOVTrack* trk = &mov->tracks[pkt->stream_index];
1351 unsigned int samplesInChunk = 0;
1352 int size= pkt->size;
1354 if (url_is_streamed(&s->pb)) return 0; /* Can't handle that */
1355 if (!size) return 0; /* Discard 0 sized packets */
/* Work out how many samples this packet contributes. */
1357 if (enc->codec_type == CODEC_TYPE_VIDEO ) {
1360 else if (enc->codec_type == CODEC_TYPE_AUDIO ) {
1361 if( enc->codec_id == CODEC_ID_AMR_NB) {
1362 /* We must find out how many AMR blocks there are in one packet */
/* Table indexed by the 4-bit field in bits 3..6 of a block's first byte;
 * presumably the packed block size in bytes for that frame type. */
1363 static uint16_t packed_size[16] =
1364 {13, 14, 16, 18, 20, 21, 27, 32, 6, 0, 0, 0, 0, 0, 0, 0};
/* Walk the packet block by block. Table entries of 0 do not advance len,
 * so the cap of 100 on samplesInChunk is what bounds the loop then. */
1367 while (len < size && samplesInChunk < 100) {
1368 len += packed_size[(pkt->data[len] >> 3) & 0x0F];
/* PCM: one sample per channel per 1 (A-law) or 2 (16-bit) bytes.
 * NOTE(review): both branches divide by enc->channels; a value of 0 would
 * be a division by zero -- confirm it is validated upstream. */
1372 else if(enc->codec_id == CODEC_ID_PCM_ALAW) {
1373 samplesInChunk = size/enc->channels;
1375 else if(enc->codec_id == CODEC_ID_PCM_S16BE || enc->codec_id == CODEC_ID_PCM_S16LE) {
1376 samplesInChunk = size/(2*enc->channels);
/* For MPEG-4 video and AAC, take a private copy of the codec extradata the
 * first time through (vosLen still 0).
 * NOTE(review): the av_malloc() result is not checked before memcpy(), and
 * when extradata_size is 0 vosLen stays 0, so this branch is re-entered on
 * every packet -- confirm and consider guarding both cases. */
1383 if ((enc->codec_id == CODEC_ID_MPEG4 || enc->codec_id == CODEC_ID_AAC)
1384 && trk->vosLen == 0) {
1385 // assert(enc->extradata_size);
1387 trk->vosLen = enc->extradata_size;
1388 trk->vosData = av_malloc(trk->vosLen);
1389 memcpy(trk->vosData, enc->extradata, trk->vosLen);
/* The index is stored as an array of fixed-size clusters:
 * cl is the cluster number, id the slot inside that cluster. */
1392 cl = trk->entry / MOV_INDEX_CLUSTER_SIZE;
1393 id = trk->entry % MOV_INDEX_CLUSTER_SIZE;
/* Grow the index by one cluster when all allocated entries are used.
 * NOTE(review): the av_realloc() result overwrites trk->cluster directly,
 * so on failure the previous table pointer is lost. */
1395 if (trk->ents_allocated <= trk->entry) {
1396 trk->cluster = av_realloc(trk->cluster, (cl+1)*sizeof(void*));
1399 trk->cluster[cl] = av_malloc(MOV_INDEX_CLUSTER_SIZE*sizeof(MOVIentry));
1400 if (!trk->cluster[cl])
1402 trk->ents_allocated += MOV_INDEX_CLUSTER_SIZE;
/* The mdat header is written lazily, just before the first payload. */
1404 if (mov->mdat_written == 0) {
1405 mov_write_mdat_tag(pb, mov);
1406 mov->mdat_written = 1;
1407 mov->time = s->timestamp;
/* Record where this packet lands and what it contains.
 * MOVIentry.pos is an unsigned int, so file offsets that do not fit in it
 * are truncated here. */
1410 trk->cluster[cl][id].pos = url_ftell(pb);
1411 trk->cluster[cl][id].samplesInChunk = samplesInChunk;
1412 trk->cluster[cl][id].size = size;
1413 trk->cluster[cl][id].entries = samplesInChunk;
/* Key-frame bookkeeping applies to video only. */
1414 if(enc->codec_type == CODEC_TYPE_VIDEO) {
1415 trk->cluster[cl][id].key_frame = !!(pkt->flags & PKT_FLAG_KEY);
1416 if(trk->cluster[cl][id].key_frame)
1417 trk->hasKeyframes = 1;
1421 trk->sampleCount += samplesInChunk;
1422 trk->mdat_size += size;
/* Finally emit the payload itself and flush. */
1424 put_buffer(pb, pkt->data, size);
1426 put_flush_packet(pb);
/*
 * Muxer trailer callback: finalise the file.
 *
 * Totals the payload size of all tracks, seeks back to the mdat header
 * position, returns to the end of the data, writes the moov atom, then
 * releases the per-track index clusters and codec extradata copies.
 *
 * s: muxer context; s->priv_data is the MOVContext.
 */
1430 static int mov_write_trailer(AVFormatContext *s)
1432 MOVContext *mov = s->priv_data;
1433 ByteIOContext *pb = &s->pb;
/* Current position is where the moov atom will be written. */
1437 offset_t moov_pos = url_ftell(pb);
1439 /* Write size of mdat tag */
/* Sum the payload bytes of every track that has index entries allocated. */
1440 for (i=0, j=0; i<MAX_STREAMS; i++) {
1441 if(mov->tracks[i].ents_allocated > 0) {
1442 j += mov->tracks[i].mdat_size;
/* Seek back to the mdat header, then return to the moov position. */
1445 url_fseek(pb, mov->mdat_pos, SEEK_SET);
1447 url_fseek(pb, moov_pos, SEEK_SET);
1449 mov_write_moov_tag(pb, mov, s);
/* Release per-track storage. ents_allocated grows in steps of
 * MOV_INDEX_CLUSTER_SIZE, so the quotient is the number of clusters. */
1451 for (i=0; i<MAX_STREAMS; i++) {
1452 for (j=0; j<mov->tracks[i].ents_allocated/MOV_INDEX_CLUSTER_SIZE; j++) {
1453 av_free(mov->tracks[i].cluster[j]);
1455 av_free(mov->tracks[i].cluster);
/* NOTE(review): vosData/vosLen do not appear to be reset after the free,
 * unlike cluster/ents_allocated/entry below -- confirm that is intended. */
1456 if( mov->tracks[i].vosLen ) av_free( mov->tracks[i].vosData );
1458 mov->tracks[i].cluster = NULL;
1459 mov->tracks[i].ents_allocated = mov->tracks[i].entry = 0;
1462 put_flush_packet(pb);
/* Output format descriptors for the container flavours handled by this
 * muxer (mov, 3gp, mp4, psp, 3g2). Each one is registered in movenc_init(). */
1467 static AVOutputFormat mov_oformat = {
1480 static AVOutputFormat _3gp_oformat = {
1493 static AVOutputFormat mp4_oformat = {
1506 static AVOutputFormat psp_oformat = {
1519 static AVOutputFormat _3g2_oformat = {
/*
 * Register the five output formats defined in this file (mov, 3gp, mp4,
 * psp, 3g2) via av_register_output_format().
 */
1532 int movenc_init(void)
1534 av_register_output_format(&mov_oformat);
1535 av_register_output_format(&_3gp_oformat);
1536 av_register_output_format(&mp4_oformat);
1537 av_register_output_format(&psp_oformat);
1538 av_register_output_format(&_3g2_oformat);