2 * MOV, 3GP, MP4 encoder.
3 * Copyright (c) 2003 Thomas Raivio.
4 * Copyright (c) 2004 Gildas Bazin <gbazin at videolan dot org>.
6 * This library is free software; you can redistribute it and/or
7 * modify it under the terms of the GNU Lesser General Public
8 * License as published by the Free Software Foundation; either
9 * version 2 of the License, or (at your option) any later version.
11 * This library is distributed in the hope that it will be useful,
12 * but WITHOUT ANY WARRANTY; without even the implied warranty of
13 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
14 * Lesser General Public License for more details.
16 * You should have received a copy of the GNU Lesser General Public
17 * License along with this library; if not, write to the Free Software
18 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
/* Index entries per cluster: the table writers below address entry i as
 * cluster[i / MOV_INDEX_CLUSTER_SIZE][i % MOV_INDEX_CLUSTER_SIZE]. */
27 #define MOV_INDEX_CLUSTER_SIZE 16384
/* Movie-level timescale: assigned to mov->timescale and used to convert
 * per-track durations into movie time units. */
28 #define globalTimescale 1000
/* Mode selected when the output format name is "psp". */
33 #define MODE_PSP 3 // example working PSP command line:
34 // ffmpeg -i testinput.avi -f psp -r 14.985 -s 320x240 -b 768 -ar 24000 -ab 32 M4V00001.MP4
/* One index entry -- presumably the element type of track->cluster; verify.
 * Fields with these names are consumed by the table writers: pos as a chunk
 * offset, size for the sample-size table, samplesInChunk for the
 * sample-to-chunk table. */
37 typedef struct MOVIentry {
38 unsigned int flags, pos, size;
39 unsigned int samplesInChunk;
44 typedef struct MOVIndex {
/* Muxer private state; the writers obtain it from s->priv_data. */
63 typedef struct MOVContext {
/* One slot per possible stream; slots whose entry count is <= 0 are skipped
 * when the moov atom is written. */
70 MOVTrack tracks[MAX_STREAMS];
/* Forward declaration: mov_write_wave_tag() calls this before its definition. */
73 static int mov_write_esds_tag(ByteIOContext *pb, MOVTrack* track);
75 //FIXME support 64bit variant with wide placeholders
/*
 * Back-patch the 32-bit size field of an atom.
 *
 * pb:  output context, positioned at the end of the atom being closed
 * pos: offset at which the atom's size placeholder was written
 *
 * Seeks to pos, writes (current position - pos) with put_be32(), then seeks
 * back so that writing continues where it left off.
 */
76 static int updateSize (ByteIOContext *pb, int pos)
78 long curpos = url_ftell(pb);
79 url_fseek(pb, pos, SEEK_SET);
80 put_be32(pb, curpos - pos); /* rewrite size */
81 url_fseek(pb, curpos, SEEK_SET);
86 /* Chunk offset atom */
/*
 * Writes a size placeholder, version/flags, the entry count (track->entry)
 * and one 32-bit position per index entry; the size is patched afterwards
 * through updateSize().
 */
87 static int mov_write_stco_tag(ByteIOContext *pb, MOVTrack* track)
90 int pos = url_ftell(pb);
91 put_be32(pb, 0); /* size */
93 put_be32(pb, 0); /* version & flags */
94 put_be32(pb, track->entry); /* entry count */
95 for (i=0; i<track->entry; i++) {
/* locate entry i: cluster number, then slot inside that cluster */
96 int cl = i / MOV_INDEX_CLUSTER_SIZE;
97 int id = i % MOV_INDEX_CLUSTER_SIZE;
98 put_be32(pb, track->cluster[cl][id].pos);
100 return updateSize (pb, pos);
103 /* Sample size atom */
/*
 * Writes a size placeholder and version/flags, then the sample-size table.
 * A first pass over the index derives each entry's per-sample size
 * (size / entries), compares it with the previous one (tst vs. oldtst) and
 * sums the total sample count. Two layouts follow: a single sample size taken
 * from the first entry plus the sample count, or sample size 0 plus the sample
 * count followed by one 32-bit size per sample. Presumably the first layout
 * is used only when all samples share one size -- TODO confirm.
 * The atom size is patched through updateSize().
 */
104 static int mov_write_stsz_tag(ByteIOContext *pb, MOVTrack* track)
107 int i, j, entries = 0, tst = -1, oldtst = -1;
109 int pos = url_ftell(pb);
110 put_be32(pb, 0); /* size */
112 put_be32(pb, 0); /* version & flags */
/* pass 1: per-sample size of each entry and running sample total */
114 for (i=0; i<track->entry; i++) {
115 int cl = i / MOV_INDEX_CLUSTER_SIZE;
116 int id = i % MOV_INDEX_CLUSTER_SIZE;
117 tst = track->cluster[cl][id].size/track->cluster[cl][id].entries;
118 if(oldtst != -1 && tst != oldtst) {
122 entries += track->cluster[cl][id].entries;
/* layout 1: one common sample size, taken from the very first entry */
125 int sSize = track->cluster[0][0].size/track->cluster[0][0].entries;
126 put_be32(pb, sSize); // sample size
127 put_be32(pb, entries); // sample count
/* layout 2: sample size 0, then an explicit size for every sample */
130 put_be32(pb, 0); // sample size
131 put_be32(pb, entries); // sample count
132 for (i=0; i<track->entry; i++) {
133 int cl = i / MOV_INDEX_CLUSTER_SIZE;
134 int id = i % MOV_INDEX_CLUSTER_SIZE;
135 for ( j=0; j<track->cluster[cl][id].entries; j++) {
136 put_be32(pb, track->cluster[cl][id].size /
137 track->cluster[cl][id].entries);
141 return updateSize (pb, pos);
144 /* Sample to chunk atom */
/*
 * Writes a provisional entry count (track->entry), then one record
 * (first chunk = i+1, samples per chunk, sample description index 1) for each
 * index entry whose samplesInChunk differs from the previous entry's.
 * Afterwards the provisional count at entryPos is overwritten with index and
 * the atom size is patched through updateSize().
 */
145 static int mov_write_stsc_tag(ByteIOContext *pb, MOVTrack* track)
147 int index = 0, oldval = -1, i, entryPos, curpos;
149 int pos = url_ftell(pb);
150 put_be32(pb, 0); /* size */
152 put_be32(pb, 0); // version & flags
/* remember where the entry count lives so it can be corrected later */
153 entryPos = url_ftell(pb);
154 put_be32(pb, track->entry); // entry count
155 for (i=0; i<track->entry; i++) {
156 int cl = i / MOV_INDEX_CLUSTER_SIZE;
157 int id = i % MOV_INDEX_CLUSTER_SIZE;
158 if(oldval != track->cluster[cl][id].samplesInChunk)
160 put_be32(pb, i+1); // first chunk
161 put_be32(pb, track->cluster[cl][id].samplesInChunk); // samples per chunk
162 put_be32(pb, 0x1); // sample description index
163 oldval = track->cluster[cl][id].samplesInChunk;
167 curpos = url_ftell(pb);
168 url_fseek(pb, entryPos, SEEK_SET);
169 put_be32(pb, index); // rewrite entry count
170 url_fseek(pb, curpos, SEEK_SET);
172 return updateSize (pb, pos);
175 /* Sync sample atom */
/*
 * Writes a provisional entry count (track->entry), walks the index looking
 * for entries whose key_frame field equals 1, then overwrites the provisional
 * count at entryPos with index and patches the atom size through updateSize().
 */
176 static int mov_write_stss_tag(ByteIOContext *pb, MOVTrack* track)
179 int i, index = 0, entryPos;
180 int pos = url_ftell(pb);
181 put_be32(pb, 0); // size
183 put_be32(pb, 0); // version & flags
/* remember where the entry count lives so it can be corrected later */
184 entryPos = url_ftell(pb);
185 put_be32(pb, track->entry); // entry count
186 for (i=0; i<track->entry; i++) {
187 int cl = i / MOV_INDEX_CLUSTER_SIZE;
188 int id = i % MOV_INDEX_CLUSTER_SIZE;
189 if(track->cluster[cl][id].key_frame == 1) {
194 curpos = url_ftell(pb);
195 url_fseek(pb, entryPos, SEEK_SET);
196 put_be32(pb, index); // rewrite entry count
197 url_fseek(pb, curpos, SEEK_SET);
198 return updateSize (pb, pos);
/*
 * Writes the fixed-size (0x11 bytes) AMR configuration atom; every value is a
 * constant. Called by mov_write_audio_tag() for CODEC_ID_AMR_NB.
 * NOTE(review): the active mode-set value (0x80) and the commented-out
 * alternative (0x81ff) carry the same "all modes" comment -- confirm which
 * one is intended.
 */
201 static int mov_write_damr_tag(ByteIOContext *pb)
203 put_be32(pb, 0x11); /* size */
208 put_be16(pb, 0x80); /* Mode set (all modes for AMR_NB) */
209 put_be16(pb, 0xa); /* Mode change period (no restriction) */
210 //put_be16(pb, 0x81ff); /* Mode set (all modes for AMR_NB) */
211 //put_be16(pb, 1); /* Mode change period (no restriction) */
/*
 * Writes a container atom with a patched size: several 12-byte child atoms,
 * an embedded esds atom for the track, and a closing 8-byte null atom.
 * Called by mov_write_audio_tag() for AAC in MODE_MOV.
 */
215 static int mov_write_wave_tag(ByteIOContext *pb, MOVTrack* track)
217 int pos = url_ftell(pb);
219 put_be32(pb, 0); /* size */
222 put_be32(pb, 12); /* size */
226 put_be32(pb, 12); /* size */
230 mov_write_esds_tag(pb, track);
232 put_be32(pb, 12); /* size */
/* terminator: size 8, tag 0 */
236 put_be32(pb, 8); /* size */
237 put_be32(pb, 0); /* null tag */
239 return updateSize (pb, pos);
/* Audio codec id -> fourcc table, looked up with codec_get_tag() by
 * mov_write_audio_tag() and mov_write_header(). */
242 const CodecTag codec_movaudio_tags[] = {
243 { CODEC_ID_PCM_MULAW, MKTAG('u', 'l', 'a', 'w') },
244 { CODEC_ID_PCM_ALAW, MKTAG('a', 'l', 'a', 'w') },
245 { CODEC_ID_ADPCM_IMA_QT, MKTAG('i', 'm', 'a', '4') },
246 { CODEC_ID_MACE3, MKTAG('M', 'A', 'C', '3') },
247 { CODEC_ID_MACE6, MKTAG('M', 'A', 'C', '6') },
248 { CODEC_ID_AAC, MKTAG('m', 'p', '4', 'a') },
249 { CODEC_ID_AMR_NB, MKTAG('s', 'a', 'm', 'r') },
250 { CODEC_ID_PCM_S16BE, MKTAG('t', 'w', 'o', 's') },
251 { CODEC_ID_PCM_S16LE, MKTAG('s', 'o', 'w', 't') },
252 { CODEC_ID_MP3, MKTAG('.', 'm', 'p', '3') },
/*
 * Writes the audio sample description entry for a track.
 *
 * The fourcc is taken from track->enc->codec_tag, from codec_movaudio_tags,
 * or, as a last resort, built as 'm','s',hi,lo from the low 16 bits of the
 * Microsoft (wav) tag. Version 1 of the sound description, with four extra
 * 32-bit fields, is written only for AAC in MODE_MOV. AAC additionally gets a
 * wave atom (MODE_MOV) or an esds atom (other modes); AMR_NB gets the damr
 * atom. The entry size is patched through updateSize().
 */
256 static int mov_write_audio_tag(ByteIOContext *pb, MOVTrack* track)
258 int pos = url_ftell(pb);
261 put_be32(pb, 0); /* size */
263 tag = track->enc->codec_tag;
265 tag = codec_get_tag(codec_movaudio_tags, track->enc->codec_id);
266 // if no mac fcc found, try with Microsoft tags
269 int tmp = codec_get_tag(codec_wav_tags, track->enc->codec_id);
270 tag = MKTAG('m', 's', ((tmp >> 8) & 0xff), (tmp & 0xff));
272 put_le32(pb, tag); // store it byteswapped
274 put_be32(pb, 0); /* Reserved */
275 put_be16(pb, 0); /* Reserved */
276 put_be16(pb, 1); /* Data-reference index, XXX == 1 */
278 /* SoundDescription */
279 if(track->mode == MODE_MOV && track->enc->codec_id == CODEC_ID_AAC)
280 put_be16(pb, 1); /* Version 1 */
282 put_be16(pb, 0); /* Version 0 */
283 put_be16(pb, 0); /* Revision level */
284 put_be32(pb, 0); /* Reserved */
286 put_be16(pb, track->enc->channels); /* Number of channels */
287 /* TODO: Currently hard-coded to 16-bit, there doesn't seem
288 to be a good way to get number of bits of audio */
289 put_be16(pb, 0x10); /* Sample size in bits, hard-coded to 16 (see TODO above) */
291 if(track->enc->codec_id == CODEC_ID_AAC ||
292 track->enc->codec_id == CODEC_ID_MP3)
294 put_be16(pb, 0xfffe); /* compression ID (vbr)*/
298 put_be16(pb, 0); /* compression ID (= 0) */
300 put_be16(pb, 0); /* packet size (= 0) */
/* NOTE(review): only 16 bits are written here, so a track timescale above
 * 65535 does not fit -- confirm this is acceptable. */
301 put_be16(pb, track->timescale); /* Time scale */
302 put_be16(pb, 0); /* Reserved */
304 if(track->mode == MODE_MOV && track->enc->codec_id == CODEC_ID_AAC)
306 /* SoundDescription V1 extended info */
307 put_be32(pb, track->enc->frame_size); /* Samples per packet */
308 put_be32(pb, 1536); /* Bytes per packet */
309 put_be32(pb, 2); /* Bytes per frame */
310 put_be32(pb, 2); /* Bytes per sample */
/* codec-specific child atoms */
313 if(track->enc->codec_id == CODEC_ID_AAC) {
314 if( track->mode == MODE_MOV ) mov_write_wave_tag(pb, track);
315 else mov_write_esds_tag(pb, track);
317 if(track->enc->codec_id == CODEC_ID_AMR_NB)
318 mov_write_damr_tag(pb);
319 return updateSize (pb, pos);
/* Writes the fixed-size (0xf bytes) H.263 configuration atom; called by
 * mov_write_video_tag() for CODEC_ID_H263. */
322 static int mov_write_d263_tag(ByteIOContext *pb)
324 put_be32(pb, 0xf); /* size */
332 /* TODO: No idea about these values */
/* Writes constant data for SVQ3 tracks; called by mov_write_video_tag() for
 * CODEC_ID_SVQ3. The meaning of the constants is undocumented (see TODO). */
333 static int mov_write_svq3_tag(ByteIOContext *pb)
339 put_be32(pb, 0xe2c0211d);
340 put_be32(pb, 0xc0000000);
/*
 * Length helper for descriptors: the result depends on whether len fits in
 * 7, 14 or 21 bits (thresholds 0x80, 0x4000, 0x200000) or needs more.
 * mov_write_esds_tag() uses the result as the total size of a nested
 * descriptor -- presumably payload plus tag and length bytes; TODO confirm.
 */
345 static unsigned int descrLength(unsigned int len)
347 if (len < 0x00000080)
349 else if (len < 0x00004000)
351 else if(len < 0x00200000)
/*
 * Writes a descriptor header: one tag byte followed by the size encoded in
 * 1 to 4 bytes of 7 payload bits each. vals[3] is the final byte (high bit
 * clear); vals[0..2] have the high bit (0x80) set. Only as many bytes as the
 * magnitude of size requires are written.
 * NOTE(review): no branch is visible for size >= 0x10000000; in that case
 * only the tag byte appears to be written -- confirm.
 */
357 static void putDescr(ByteIOContext *pb, int tag, int size)
363 vals[3] = (uint8_t)(len & 0x7f);
365 vals[2] = (uint8_t)((len & 0x7f) | 0x80);
367 vals[1] = (uint8_t)((len & 0x7f) | 0x80);
369 vals[0] = (uint8_t)((len & 0x7f) | 0x80);
371 put_byte(pb, tag); // DescriptorTag
/* size fits in 7 bits: one length byte */
373 if (size < 0x00000080)
375 put_byte(pb, vals[3]);
/* size fits in 14 bits: two length bytes */
377 else if (size < 0x00004000)
379 put_byte(pb, vals[2]);
380 put_byte(pb, vals[3]);
/* size fits in 21 bits: three length bytes */
382 else if (size < 0x00200000)
384 put_byte(pb, vals[1]);
385 put_byte(pb, vals[2]);
386 put_byte(pb, vals[3]);
/* size fits in 28 bits: four length bytes */
388 else if (size < 0x10000000)
390 put_byte(pb, vals[0]);
391 put_byte(pb, vals[1]);
392 put_byte(pb, vals[2]);
393 put_byte(pb, vals[3]);
/*
 * Writes the esds atom: descriptor 0x03 wrapping a DecoderConfig descriptor
 * (0x04), an optional DecoderSpecific info descriptor (0x05) carrying
 * track->vosData, and a trailing descriptor 0x06.
 *
 * In MODE_PSP the track's vosData is temporarily replaced by hard-coded
 * blobs for AAC and MPEG4; the original vosData/vosLen are saved on entry and
 * restored before returning. The atom size is patched through updateSize().
 */
397 static int mov_write_esds_tag(ByteIOContext *pb, MOVTrack* track) // Basic
399 int decoderSpecificInfoLen;
400 int pos = url_ftell(pb);
/* saved so the PSP override below can be undone */
401 void *vosDataBackup=track->vosData;
402 int vosLenBackup=track->vosLen;
404 // we should be able to have these passed in, via vosData, then we wouldn't need to attack this routine at all
405 static const char PSPAACData[]={0x13,0x10};
406 static const char PSPMP4Data[]={0x00,0x00,0x01,0xB0,0x03,0x00,0x00,0x01,0xB5,0x09,0x00,0x00,0x01,0x00,0x00,0x00,0x01,0x20,0x00,0x84,0x5D,0x4C,0x28,0x50,0x20,0xF0,0xA3,0x1F };
409 if (track->mode == MODE_PSP) // fails on psp if this is not here
411 if (track->enc->codec_id == CODEC_ID_AAC)
414 track->vosData = PSPAACData;
417 if (track->enc->codec_id == CODEC_ID_MPEG4)
420 track->vosData = PSPMP4Data;
/* 0 when there is no decoder specific data, otherwise its descriptor length */
424 decoderSpecificInfoLen = track->vosLen ? descrLength(track->vosLen):0;
426 put_be32(pb, 0); // size
428 put_be32(pb, 0); // Version
431 putDescr(pb, 0x03, 3 + descrLength(13 + decoderSpecificInfoLen) +
433 put_be16(pb, 0x0001); // ID (= 1)
434 put_byte(pb, 0x00); // flags (= no flags)
436 // DecoderConfig descriptor
437 putDescr(pb, 0x04, 13 + decoderSpecificInfoLen);
439 if(track->enc->codec_id == CODEC_ID_AAC)
440 put_byte(pb, 0x40); // Object type indication
441 else if(track->enc->codec_id == CODEC_ID_MPEG4)
442 put_byte(pb, 0x20); // Object type indication (Visual 14496-2)
444 if(track->enc->codec_type == CODEC_TYPE_AUDIO)
445 put_byte(pb, 0x15); // flags (= Audiostream)
447 put_byte(pb, 0x11); // flags (= Visualstream)
449 put_byte(pb, 0x0); // Buffersize DB (24 bits)
450 put_be16(pb, 0x0dd2); // Buffersize DB
452 // TODO: find real values for these
453 put_be32(pb, track->enc->bit_rate); // maxbitrate
454 put_be32(pb, track->enc->bit_rate); // avg bitrate
458 // DecoderSpecific info descriptor
459 putDescr(pb, 0x05, track->vosLen);
460 put_buffer(pb, track->vosData, track->vosLen);
/* undo the PSP override */
463 track->vosData = vosDataBackup;
464 track->vosLen = vosLenBackup;
467 putDescr(pb, 0x06, 1);
469 return updateSize (pb, pos);
/* Video codec id -> fourcc table, looked up with codec_get_tag() by
 * mov_write_video_tag() and mov_write_header(). */
472 const CodecTag codec_movvideo_tags[] = {
473 { CODEC_ID_SVQ1, MKTAG('S', 'V', 'Q', '1') },
474 { CODEC_ID_SVQ3, MKTAG('S', 'V', 'Q', '3') },
475 { CODEC_ID_MPEG4, MKTAG('m', 'p', '4', 'v') },
476 { CODEC_ID_H263, MKTAG('s', '2', '6', '3') },
477 { CODEC_ID_DVVIDEO, MKTAG('d', 'v', 'c', ' ') },
/*
 * Writes the video sample description entry for a track.
 *
 * The fourcc is taken from track->enc->codec_tag, from codec_movvideo_tags
 * or from the Microsoft (bmp) tag table. After the fixed fields the
 * compressor name is stored as a length byte plus 31 bytes of zero-padded
 * text. MPEG4 appends an esds atom, H263 a d263 atom, SVQ3 the svq3 data.
 * The entry size is patched through updateSize().
 */
481 static int mov_write_video_tag(ByteIOContext *pb, MOVTrack* track)
483 int pos = url_ftell(pb);
484 char compressor_name[32];
487 put_be32(pb, 0); /* size */
489 tag = track->enc->codec_tag;
491 tag = codec_get_tag(codec_movvideo_tags, track->enc->codec_id);
492 // if no mac fcc found, try with Microsoft tags
494 tag = codec_get_tag(codec_bmp_tags, track->enc->codec_id);
495 put_le32(pb, tag); // store it byteswapped
497 put_be32(pb, 0); /* Reserved */
498 put_be16(pb, 0); /* Reserved */
499 put_be16(pb, 1); /* Data-reference index */
501 put_be16(pb, 0); /* Codec stream version */
502 put_be16(pb, 0); /* Codec stream revision (=0) */
503 put_tag(pb, "FFMP"); /* Vendor */
504 if(track->enc->codec_id == CODEC_ID_RAWVIDEO) {
505 put_be32(pb, 0); /* Temporal Quality */
506 put_be32(pb, 0x400); /* Spatial Quality = lossless*/
508 put_be32(pb, 0x200); /* Temporal Quality = normal */
509 put_be32(pb, 0x200); /* Spatial Quality = normal */
511 put_be16(pb, track->enc->width); /* Video width */
512 put_be16(pb, track->enc->height); /* Video height */
513 put_be32(pb, 0x00480000); /* Horizontal resolution 72dpi */
514 put_be32(pb, 0x00480000); /* Vertical resolution 72dpi */
515 put_be32(pb, 0); /* Data size (= 0) */
516 put_be16(pb, 1); /* Frame count (= 1) */
/* the buffer is zeroed first and at most 31 characters are copied, so the
 * name is always NUL-terminated and zero-padded */
518 memset(compressor_name,0,32);
519 if (track->enc->codec && track->enc->codec->name)
520 strncpy(compressor_name,track->enc->codec->name,31);
521 put_byte(pb, strlen(compressor_name));
522 put_buffer(pb, compressor_name, 31);
524 put_be16(pb, 0x18); /* Reserved */
525 put_be16(pb, 0xffff); /* Reserved */
/* codec-specific child atoms */
526 if(track->enc->codec_id == CODEC_ID_MPEG4)
527 mov_write_esds_tag(pb, track);
528 else if(track->enc->codec_id == CODEC_ID_H263)
529 mov_write_d263_tag(pb);
530 else if(track->enc->codec_id == CODEC_ID_SVQ3)
531 mov_write_svq3_tag(pb);
533 return updateSize (pb, pos);
/*
 * Writes the sample description atom with exactly one entry: the video
 * description for video tracks, the audio description for audio tracks.
 * Other codec types get no entry body. Size is patched through updateSize().
 */
536 static int mov_write_stsd_tag(ByteIOContext *pb, MOVTrack* track)
538 int pos = url_ftell(pb);
539 put_be32(pb, 0); /* size */
541 put_be32(pb, 0); /* version & flags */
542 put_be32(pb, 1); /* entry count */
543 if (track->enc->codec_type == CODEC_TYPE_VIDEO)
544 mov_write_video_tag(pb, track);
545 else if (track->enc->codec_type == CODEC_TYPE_AUDIO)
546 mov_write_audio_tag(pb, track);
547 return updateSize(pb, pos);
551 /* Time to sample atom */
/*
 * Fixed-size (0x18 bytes) atom with a single entry, i.e. every sample of the
 * track is given the same duration: track->sampleCount samples of
 * track->sampleDuration each.
 */
552 static int mov_write_stts_tag(ByteIOContext *pb, MOVTrack* track)
554 put_be32(pb, 0x18); /* size */
556 put_be32(pb, 0); /* version & flags */
557 put_be32(pb, 1); /* entry count */
559 put_be32(pb, track->sampleCount); /* sample count */
560 put_be32(pb, track->sampleDuration); /* sample duration */
/* Writes a fixed-size (28 bytes) data reference atom holding one 12-byte
 * entry whose version/flags field is 1; all values are constants. */
564 static int mov_write_dref_tag(ByteIOContext *pb)
566 put_be32(pb, 28); /* size */
568 put_be32(pb, 0); /* version & flags */
569 put_be32(pb, 1); /* entry count */
571 put_be32(pb, 0xc); /* size */
573 put_be32(pb, 1); /* version & flags */
/*
 * Writes the sample table container: stsd, stts, stss (video tracks only,
 * subject to a further condition), stsc, stsz and stco, in that order.
 * Size is patched through updateSize().
 */
578 static int mov_write_stbl_tag(ByteIOContext *pb, MOVTrack* track)
580 int pos = url_ftell(pb);
581 put_be32(pb, 0); /* size */
583 mov_write_stsd_tag(pb, track);
584 mov_write_stts_tag(pb, track);
585 if (track->enc->codec_type == CODEC_TYPE_VIDEO &&
587 mov_write_stss_tag(pb, track);
588 mov_write_stsc_tag(pb, track);
589 mov_write_stsz_tag(pb, track);
590 mov_write_stco_tag(pb, track);
591 return updateSize(pb, pos);
/* Writes the data information container, whose only child is the dref atom;
 * size is patched through updateSize(). */
594 static int mov_write_dinf_tag(ByteIOContext *pb)
596 int pos = url_ftell(pb);
597 put_be32(pb, 0); /* size */
599 mov_write_dref_tag(pb);
600 return updateSize(pb, pos);
/* Writes the fixed-size (16 bytes) sound media header; all fields are zero.
 * Used by mov_write_minf_tag() for non-video tracks. */
603 static int mov_write_smhd_tag(ByteIOContext *pb)
605 put_be32(pb, 16); /* size */
607 put_be32(pb, 0); /* version & flags */
608 put_be16(pb, 0); /* reserved (balance, normally = 0) */
609 put_be16(pb, 0); /* reserved */
/* Writes the fixed-size (0x14 bytes) video media header with version/flags 1
 * and eight zero bytes. Used by mov_write_minf_tag() for video tracks. */
613 static int mov_write_vmhd_tag(ByteIOContext *pb)
615 put_be32(pb, 0x14); /* size (always 0x14) */
617 put_be32(pb, 0x01); /* version & flags */
618 put_be64(pb, 0); /* reserved (graphics mode = copy) */
/*
 * Writes a handler reference atom.
 *
 * track: the track to describe, or NULL to write the data handler variant
 *        ("DataHandler"). For a real track the handler field is "mhlr" in
 *        MODE_MOV and four zero bytes otherwise, and the description is
 *        "VideoHandler" or "SoundHandler" depending on the codec type.
 *
 * The description is stored as a length byte followed by the characters,
 * without a terminating NUL. Size is patched through updateSize().
 */
622 static int mov_write_hdlr_tag(ByteIOContext *pb, MOVTrack* track)
624 char *descr, *hdlr, *hdlr_type;
625 int pos = url_ftell(pb);
627 if (!track) { /* no media --> data handler */
630 descr = "DataHandler";
632 hdlr = (track->mode == MODE_MOV) ? "mhlr" : "\0\0\0\0";
633 if (track->enc->codec_type == CODEC_TYPE_VIDEO) {
635 descr = "VideoHandler";
638 descr = "SoundHandler";
642 put_be32(pb, 0); /* size */
644 put_be32(pb, 0); /* Version & flags */
/* written with an explicit length of 4 because hdlr may be all zero bytes */
645 put_buffer(pb, hdlr, 4); /* handler */
646 put_tag(pb, hdlr_type); /* handler type */
647 put_be32(pb ,0); /* reserved */
648 put_be32(pb ,0); /* reserved */
649 put_be32(pb ,0); /* reserved */
650 put_byte(pb, strlen(descr)); /* string counter */
651 put_buffer(pb, descr, strlen(descr)); /* handler description */
652 return updateSize(pb, pos);
/*
 * Writes the media information container: vmhd for video tracks or smhd
 * otherwise, a data handler hdlr (MODE_MOV only), dinf and stbl.
 * Size is patched through updateSize().
 */
655 static int mov_write_minf_tag(ByteIOContext *pb, MOVTrack* track)
657 int pos = url_ftell(pb);
658 put_be32(pb, 0); /* size */
660 if(track->enc->codec_type == CODEC_TYPE_VIDEO)
661 mov_write_vmhd_tag(pb);
663 mov_write_smhd_tag(pb);
664 if (track->mode == MODE_MOV) /* FIXME: Why do it for MODE_MOV only ? */
/* NULL track selects the data handler variant */
665 mov_write_hdlr_tag(pb, NULL);
666 mov_write_dinf_tag(pb);
667 mov_write_stbl_tag(pb, track);
668 return updateSize(pb, pos);
/*
 * Writes the fixed-size (32 bytes) media header: creation and modification
 * time (both track->time), the track's own timescale, and the track duration
 * expressed in that timescale.
 */
671 static int mov_write_mdhd_tag(ByteIOContext *pb, MOVTrack* track)
673 put_be32(pb, 32); /* size */
675 put_be32(pb, 0); /* Version & flags */
676 put_be32(pb, track->time); /* creation time */
677 put_be32(pb, track->time); /* modification time */
678 put_be32(pb, track->timescale); /* time scale (sample rate for audio) */
679 put_be32(pb, track->trackDuration); /* duration */
680 put_be16(pb, 0); /* language, 0 = english */
681 put_be16(pb, 0); /* reserved (quality) */
/* Writes the media container: mdhd, the track's hdlr and minf, in that
 * order; size is patched through updateSize(). */
685 static int mov_write_mdia_tag(ByteIOContext *pb, MOVTrack* track)
687 int pos = url_ftell(pb);
688 put_be32(pb, 0); /* size */
690 mov_write_mdhd_tag(pb, track);
691 mov_write_hdlr_tag(pb, track);
692 mov_write_minf_tag(pb, track);
693 return updateSize(pb, pos);
/*
 * Writes the fixed-size (0x5c bytes) track header.
 *
 * The duration is converted from track units to movie units:
 * globalTimescale * trackDuration / track->timescale, computed in 64 bits and
 * written as 32 bits. Audio tracks get volume 0x0100. Video tracks write
 * width (scaled by the sample aspect ratio, 1 if unset) and height, each
 * multiplied by 0x10000.
 */
696 static int mov_write_tkhd_tag(ByteIOContext *pb, MOVTrack* track)
698 int64_t maxTrackLenTemp;
699 put_be32(pb, 0x5c); /* size (always 0x5c) */
701 put_be32(pb, 0xf); /* version & flags (track enabled) */
702 put_be32(pb, track->time); /* creation time */
703 put_be32(pb, track->time); /* modification time */
704 put_be32(pb, track->trackID); /* track-id */
705 put_be32(pb, 0); /* reserved */
/* 64-bit intermediate avoids overflow of timescale * duration */
706 maxTrackLenTemp = ((int64_t)globalTimescale*(int64_t)track->trackDuration)/(int64_t)track->timescale;
707 put_be32(pb, (long)maxTrackLenTemp); /* duration */
709 put_be32(pb, 0); /* reserved */
710 put_be32(pb, 0); /* reserved */
711 put_be32(pb, 0x0); /* reserved (Layer & Alternate group) */
712 /* Volume, only for audio */
713 if(track->enc->codec_type == CODEC_TYPE_AUDIO)
714 put_be16(pb, 0x0100);
717 put_be16(pb, 0); /* reserved */
719 /* Matrix structure */
720 put_be32(pb, 0x00010000); /* reserved */
721 put_be32(pb, 0x0); /* reserved */
722 put_be32(pb, 0x0); /* reserved */
723 put_be32(pb, 0x0); /* reserved */
724 put_be32(pb, 0x00010000); /* reserved */
725 put_be32(pb, 0x0); /* reserved */
726 put_be32(pb, 0x0); /* reserved */
727 put_be32(pb, 0x0); /* reserved */
728 put_be32(pb, 0x40000000); /* reserved */
730 /* Track width and height, for visual only */
731 if(track->enc->codec_type == CODEC_TYPE_VIDEO) {
732 double sample_aspect_ratio = av_q2d(track->enc->sample_aspect_ratio);
/* an unset (zero) aspect ratio is treated as square pixels */
733 if( !sample_aspect_ratio ) sample_aspect_ratio = 1;
734 put_be32(pb, sample_aspect_ratio * track->enc->width*0x10000);
735 put_be32(pb, track->enc->height*0x10000);
744 // This box seems important for the psp playback ... without it the movie seems to hang
/* Writes a fixed-size (0x24 bytes) atom containing one 0x1c-byte child; the
 * child carries the track duration converted to movie time units. Written by
 * mov_write_trak_tag() in MODE_PSP only. */
745 static int mov_write_edts_tag(ByteIOContext *pb, MOVTrack *track)
747 int64_t maxTrackLenTemp;
748 put_be32(pb, 0x24); /* size */
750 put_be32(pb, 0x1c); /* size */
755 maxTrackLenTemp = ((int64_t)globalTimescale*(int64_t)track->trackDuration)/(int64_t)track->timescale;
756 put_be32(pb, (long)maxTrackLenTemp); /* duration ... doesn't seem to affect psp */
759 put_be32(pb, 0x00010000);
763 // goes at the end of each track! ... Critical for PSP playback ("Incompatible data" without it)
/* Writes a fixed-size (0x34 bytes) block of constants; the mov parameter is
 * not used by any visible statement. Written by mov_write_trak_tag() in
 * MODE_PSP only. */
764 static int mov_write_uuid_tag_psp(ByteIOContext *pb, MOVTrack *mov)
766 put_be32(pb, 0x34); /* size ... reports as 28 in mp4box! */
769 put_be32(pb, 0x21d24fce);
770 put_be32(pb, 0xbb88695c);
771 put_be32(pb, 0xfac9c740);
772 put_be32(pb, 0x1c); // another size here!
774 put_be32(pb, 0x00010012);
776 put_be32(pb, 0x55c40000);
/*
 * Writes one track container: tkhd, then mdia. In MODE_PSP an edts atom is
 * inserted before mdia and the PSP uuid atom is appended after it.
 * Size is patched through updateSize().
 */
782 static int mov_write_trak_tag(ByteIOContext *pb, MOVTrack* track)
784 int pos = url_ftell(pb);
785 put_be32(pb, 0); /* size */
787 mov_write_tkhd_tag(pb, track);
788 if (track->mode == MODE_PSP)
789 mov_write_edts_tag(pb, track); // PSP Movies require edts box
790 mov_write_mdia_tag(pb, track);
791 if (track->mode == MODE_PSP)
792 mov_write_uuid_tag_psp(pb,track); // PSP Movies require this uuid box
793 return updateSize(pb, pos);
797 /* TODO: Not sorted out, but not necessary either */
/* Writes a fixed-size (0x15 bytes) atom of constants. Its only call site in
 * mov_write_moov_tag() is commented out. */
798 static int mov_write_iods_tag(ByteIOContext *pb, MOVContext *mov)
800 put_be32(pb, 0x15); /* size */
802 put_be32(pb, 0); /* version & flags */
803 put_be16(pb, 0x1007);
805 put_be16(pb, 0x4fff);
806 put_be16(pb, 0xfffe);
807 put_be16(pb, 0x01ff);
/*
 * Writes the fixed-size (0x6c bytes) movie header.
 *
 * Scans all track slots with entry > 0 to find the longest duration
 * (converted to movie time units) and the highest track id; the header stores
 * that duration and maxTrackID + 1 as the next track id.
 * NOTE(review): the 64-bit converted duration is stored into the int
 * maxTrackLen, so very long durations would be truncated -- confirm.
 */
812 static int mov_write_mvhd_tag(ByteIOContext *pb, MOVContext *mov)
814 int maxTrackID = 1, maxTrackLen = 0, i;
815 int64_t maxTrackLenTemp;
817 put_be32(pb, 0x6c); /* size (always 0x6c) */
819 put_be32(pb, 0); /* version & flags */
820 put_be32(pb, mov->time); /* creation time */
821 put_be32(pb, mov->time); /* modification time */
822 put_be32(pb, mov->timescale); /* timescale */
823 for (i=0; i<MAX_STREAMS; i++) {
824 if(mov->tracks[i].entry > 0) {
/* track duration expressed in movie time units */
825 maxTrackLenTemp = ((int64_t)globalTimescale*(int64_t)mov->tracks[i].trackDuration)/(int64_t)mov->tracks[i].timescale;
826 if(maxTrackLen < maxTrackLenTemp)
827 maxTrackLen = maxTrackLenTemp;
828 if(maxTrackID < mov->tracks[i].trackID)
829 maxTrackID = mov->tracks[i].trackID;
832 put_be32(pb, maxTrackLen); /* duration of longest track */
834 put_be32(pb, 0x00010000); /* reserved (preferred rate) 1.0 = normal */
835 put_be16(pb, 0x0100); /* reserved (preferred volume) 1.0 = normal */
836 put_be16(pb, 0); /* reserved */
837 put_be32(pb, 0); /* reserved */
838 put_be32(pb, 0); /* reserved */
840 /* Matrix structure */
841 put_be32(pb, 0x00010000); /* reserved */
842 put_be32(pb, 0x0); /* reserved */
843 put_be32(pb, 0x0); /* reserved */
844 put_be32(pb, 0x0); /* reserved */
845 put_be32(pb, 0x00010000); /* reserved */
846 put_be32(pb, 0x0); /* reserved */
847 put_be32(pb, 0x0); /* reserved */
848 put_be32(pb, 0x0); /* reserved */
849 put_be32(pb, 0x40000000); /* reserved */
851 put_be32(pb, 0); /* reserved (preview time) */
852 put_be32(pb, 0); /* reserved (preview duration) */
853 put_be32(pb, 0); /* reserved (poster time) */
854 put_be32(pb, 0); /* reserved (selection time) */
855 put_be32(pb, 0); /* reserved (selection duration) */
856 put_be32(pb, 0); /* reserved (current time) */
857 put_be32(pb, maxTrackID+1); /* Next track id */
/* Writes the handler atom that precedes the iTunes metadata list inside the
 * meta atom (called by mov_write_meta_tag()); size is patched through
 * updateSize(). */
861 static int mov_write_itunes_hdlr_tag(ByteIOContext *pb, MOVContext* mov,
864 int pos = url_ftell(pb);
865 put_be32(pb, 0); /* size */
874 return updateSize(pb, pos);
877 /* helper function to write a data tag with the specified string as data */
/* data is written with put_buffer() using strlen(data), i.e. without a
 * terminating NUL; the atom size is patched through updateSize(). */
878 static int mov_write_string_data_tag(ByteIOContext *pb, MOVContext* mov,
879 AVFormatContext *s, const char *data)
881 int pos = url_ftell(pb);
882 put_be32(pb, 0); /* size */
886 put_buffer(pb, data, strlen(data));
887 return updateSize(pb, pos);
890 /* iTunes name of the song/movie */
/* Writes a "\251nam" atom wrapping a string data atom with s->title; the
 * patched atom size is kept in size. */
891 static int mov_write_nam_tag(ByteIOContext *pb, MOVContext* mov,
896 int pos = url_ftell(pb);
897 put_be32(pb, 0); /* size */
898 put_tag(pb, "\251nam");
899 mov_write_string_data_tag(pb, mov, s, s->title);
900 size = updateSize(pb, pos);
905 /* iTunes name of the artist/performer */
/* Writes a "\251ART" atom wrapping a string data atom with s->author, only
 * when s->author is non-empty; the patched atom size is kept in size. */
906 static int mov_write_ART_tag(ByteIOContext *pb, MOVContext* mov,
910 if ( s->author[0] ) {
911 int pos = url_ftell(pb);
912 put_be32(pb, 0); /* size */
913 put_tag(pb, "\251ART");
914 // we use the author here as this is the only thing that we have...
915 mov_write_string_data_tag(pb, mov, s, s->author);
916 size = updateSize(pb, pos);
921 /* iTunes name of the writer */
/* Writes a "\251wrt" atom wrapping a string data atom with s->author (the
 * same field mov_write_ART_tag() uses), only when s->author is non-empty. */
922 static int mov_write_wrt_tag(ByteIOContext *pb, MOVContext* mov,
926 if ( s->author[0] ) {
927 int pos = url_ftell(pb);
928 put_be32(pb, 0); /* size */
929 put_tag(pb, "\251wrt");
930 mov_write_string_data_tag(pb, mov, s, s->author);
931 size = updateSize(pb, pos);
936 /* iTunes name of the album */
/* Writes a "\251alb" atom wrapping a string data atom with s->album; the
 * patched atom size is kept in size. */
937 static int mov_write_alb_tag(ByteIOContext *pb, MOVContext* mov,
942 int pos = url_ftell(pb);
943 put_be32(pb, 0); /* size */
944 put_tag(pb, "\251alb");
945 mov_write_string_data_tag(pb, mov, s, s->album);
946 size = updateSize(pb, pos);
/* Writes a "\251day" atom whose string data is s->year formatted as a
 * zero-padded four-digit decimal (snprintf limits it to 4 characters plus
 * the terminating NUL). */
952 static int mov_write_day_tag(ByteIOContext *pb, MOVContext* mov,
958 int pos = url_ftell(pb);
959 put_be32(pb, 0); /* size */
960 put_tag(pb, "\251day");
961 snprintf(year, 5, "%04d", s->year);
962 mov_write_string_data_tag(pb, mov, s, year);
963 size = updateSize(pb, pos);
968 /* iTunes tool used to create the file */
/* Writes a "\251too" atom wrapping a string data atom with the
 * LIBAVFORMAT_IDENT string; size is patched through updateSize(). */
969 static int mov_write_too_tag(ByteIOContext *pb, MOVContext* mov,
972 int pos = url_ftell(pb);
973 put_be32(pb, 0); /* size */
974 put_tag(pb, "\251too");
975 mov_write_string_data_tag(pb, mov, s, LIBAVFORMAT_IDENT);
976 return updateSize(pb, pos);
/* Writes a "\251cmt" atom wrapping a string data atom with s->comment, only
 * when s->comment is non-empty; the patched atom size is kept in size. */
980 static int mov_write_cmt_tag(ByteIOContext *pb, MOVContext* mov,
984 if ( s->comment[0] ) {
985 int pos = url_ftell(pb);
986 put_be32(pb, 0); /* size */
987 put_tag(pb, "\251cmt");
988 mov_write_string_data_tag(pb, mov, s, s->comment);
989 size = updateSize(pb, pos);
994 /* iTunes custom genre */
/* Writes a "\251gen" atom wrapping a string data atom with s->genre; the
 * patched atom size is kept in size. */
995 static int mov_write_gen_tag(ByteIOContext *pb, MOVContext* mov,
1000 int pos = url_ftell(pb);
1001 put_be32(pb, 0); /* size */
1002 put_tag(pb, "\251gen");
1003 mov_write_string_data_tag(pb, mov, s, s->genre);
1004 size = updateSize(pb, pos);
1009 /* iTunes track number */
/* Writes a "trkn" atom containing a nested "data" atom; the payload stores
 * s->track as a 16-bit value and 0 as the total track count. pos is declared
 * twice: the second declaration belongs to the nested "data" atom, so each
 * updateSize() call patches its own atom. */
1010 static int mov_write_trkn_tag(ByteIOContext *pb, MOVContext* mov,
1015 int pos = url_ftell(pb);
1016 put_be32(pb, 0); /* size */
1017 put_tag(pb, "trkn");
1019 int pos = url_ftell(pb);
1020 put_be32(pb, 0); /* size */
1021 put_tag(pb, "data");
1022 put_be32(pb, 0); // 8 bytes empty
1024 put_be16(pb, 0); // empty
1025 put_be16(pb, s->track); // track number
1026 put_be16(pb, 0); // total track number
1027 put_be16(pb, 0); // empty
/* closes the nested "data" atom */
1028 updateSize(pb, pos);
/* closes the enclosing "trkn" atom */
1030 size = updateSize(pb, pos);
1035 /* iTunes meta data list */
/* Writes the "ilst" container and calls every individual metadata writer in
 * a fixed order; size is patched through updateSize(). */
1036 static int mov_write_ilst_tag(ByteIOContext *pb, MOVContext* mov,
1039 int pos = url_ftell(pb);
1040 put_be32(pb, 0); /* size */
1041 put_tag(pb, "ilst");
1042 mov_write_nam_tag(pb, mov, s);
1043 mov_write_ART_tag(pb, mov, s);
1044 mov_write_wrt_tag(pb, mov, s);
1045 mov_write_alb_tag(pb, mov, s);
1046 mov_write_day_tag(pb, mov, s);
1047 mov_write_too_tag(pb, mov, s);
1048 mov_write_cmt_tag(pb, mov, s);
1049 mov_write_gen_tag(pb, mov, s);
1050 mov_write_trkn_tag(pb, mov, s);
1051 return updateSize(pb, pos);
1054 /* iTunes meta data tag */
/* Writes a "meta" atom (iTunes handler plus "ilst" list) only when at least
 * one of title, author, album, year, comment, genre or track is set; the
 * patched atom size is kept in size. */
1055 static int mov_write_meta_tag(ByteIOContext *pb, MOVContext* mov,
1060 // only save meta tag if required
1061 if ( s->title[0] || s->author[0] || s->album[0] || s->year ||
1062 s->comment[0] || s->genre[0] || s->track ) {
1063 int pos = url_ftell(pb);
1064 put_be32(pb, 0); /* size */
1065 put_tag(pb, "meta");
1067 mov_write_itunes_hdlr_tag(pb, mov, s);
1068 mov_write_ilst_tag(pb, mov, s);
1069 size = updateSize(pb, pos);
/*
 * Writes the "udta" (user data) container: the iTunes meta atom, a
 * "\251req" requirement string for AAC or MPEG4 tracks, a "\251enc" encoder
 * string (skipped when the first track has CODEC_FLAG_BITEXACT set), and
 * "\251nam", "\251day" and "\251des" strings taken from s->title, s->author
 * and s->comment. Each string atom stores a 16-bit length followed by the
 * characters. Every nested atom declares its own pos, distinct from the pos
 * of the enclosing "udta" atom that the final updateSize() patches.
 */
1074 static int mov_write_udta_tag(ByteIOContext *pb, MOVContext* mov,
1077 int pos = url_ftell(pb);
1080 put_be32(pb, 0); /* size */
1081 put_tag(pb, "udta");
1083 /* iTunes meta data */
1084 mov_write_meta_tag(pb, mov, s);
/* requirement string for tracks that use AAC or MPEG4 */
1087 for (i=0; i<MAX_STREAMS; i++) {
1088 if(mov->tracks[i].entry <= 0) continue;
1089 if (mov->tracks[i].enc->codec_id == CODEC_ID_AAC ||
1090 mov->tracks[i].enc->codec_id == CODEC_ID_MPEG4) {
1091 int pos = url_ftell(pb);
1092 put_be32(pb, 0); /* size */
1093 put_tag(pb, "\251req");
1094 put_be16(pb, sizeof("QuickTime 6.0 or greater") - 1);
1096 put_buffer(pb, "QuickTime 6.0 or greater",
1097 sizeof("QuickTime 6.0 or greater") - 1);
1098 updateSize(pb, pos);
/* encoder identification, omitted for bit-exact output */
1104 if(mov->tracks[0].enc && !(mov->tracks[0].enc->flags & CODEC_FLAG_BITEXACT))
1106 int pos = url_ftell(pb);
1107 put_be32(pb, 0); /* size */
1108 put_tag(pb, "\251enc");
1109 put_be16(pb, sizeof(LIBAVFORMAT_IDENT) - 1); /* string length */
1111 put_buffer(pb, LIBAVFORMAT_IDENT, sizeof(LIBAVFORMAT_IDENT) - 1);
1112 updateSize(pb, pos);
/* title */
1117 int pos = url_ftell(pb);
1118 put_be32(pb, 0); /* size */
1119 put_tag(pb, "\251nam");
1120 put_be16(pb, strlen(s->title)); /* string length */
1122 put_buffer(pb, s->title, strlen(s->title));
1123 updateSize(pb, pos);
/* NOTE(review): the author string is written under the "\251day" tag while an
 * author tag is left commented out on the same line -- confirm this is
 * intentional. */
1128 int pos = url_ftell(pb);
1129 put_be32(pb, 0); /* size */
1130 put_tag(pb, /*"\251aut"*/ "\251day" );
1131 put_be16(pb, strlen(s->author)); /* string length */
1133 put_buffer(pb, s->author, strlen(s->author));
1134 updateSize(pb, pos);
/* comment / description */
1139 int pos = url_ftell(pb);
1140 put_be32(pb, 0); /* size */
1141 put_tag(pb, "\251des");
1142 put_be16(pb, strlen(s->comment)); /* string length */
1144 put_buffer(pb, s->comment, strlen(s->comment));
1145 updateSize(pb, pos);
1148 return updateSize(pb, pos);
/*
 * Writes the "moov" atom.
 *
 * First fills in the timing fields of every track with entry > 0:
 *   - video:  timescale = frame_rate, sampleDuration = frame_rate_base
 *   - AMR_NB: timescale = 8000, sampleDuration = 160
 *   - other audio: timescale = sample_rate, sampleDuration = frame_size
 * then trackDuration = sampleCount * sampleDuration, the creation time and
 * trackID = slot index + 1. Afterwards it writes mvhd, one trak per active
 * track and udta, and patches the atom size through updateSize().
 */
1151 static int mov_write_moov_tag(ByteIOContext *pb, MOVContext *mov,
1155 pos = url_ftell(pb);
1156 put_be32(pb, 0); /* size placeholder*/
1157 put_tag(pb, "moov");
1158 mov->timescale = globalTimescale;
1160 for (i=0; i<MAX_STREAMS; i++) {
1161 if(mov->tracks[i].entry <= 0) continue;
1163 if(mov->tracks[i].enc->codec_type == CODEC_TYPE_VIDEO) {
1164 mov->tracks[i].timescale = mov->tracks[i].enc->frame_rate;
1165 mov->tracks[i].sampleDuration = mov->tracks[i].enc->frame_rate_base;
1167 else if(mov->tracks[i].enc->codec_type == CODEC_TYPE_AUDIO) {
1168 /* If AMR, track timescale = 8000, AMR_WB = 16000 */
1169 if(mov->tracks[i].enc->codec_id == CODEC_ID_AMR_NB) {
1170 mov->tracks[i].sampleDuration = 160; // Bytes per chunk
1171 mov->tracks[i].timescale = 8000;
1174 mov->tracks[i].timescale = mov->tracks[i].enc->sample_rate;
1175 mov->tracks[i].sampleDuration = mov->tracks[i].enc->frame_size;
/* duration in track time units; the header writers convert it to movie units */
1179 mov->tracks[i].trackDuration =
1180 mov->tracks[i].sampleCount * mov->tracks[i].sampleDuration;
1181 mov->tracks[i].time = mov->time;
1182 mov->tracks[i].trackID = i+1;
1185 mov_write_mvhd_tag(pb, mov);
1186 //mov_write_iods_tag(pb, mov);
1187 for (i=0; i<MAX_STREAMS; i++) {
1188 if(mov->tracks[i].entry > 0) {
1189 mov_write_trak_tag(pb, &(mov->tracks[i]));
1193 mov_write_udta_tag(pb, mov, s);
1195 return updateSize(pb, pos);
/* Starts the "mdat" atom: records its file offset in mov->mdat_pos and writes
 * a zero size placeholder followed by the tag. The placeholder is not patched
 * in this function. */
1198 int mov_write_mdat_tag(ByteIOContext *pb, MOVContext* mov)
1200 mov->mdat_pos = url_ftell(pb);
1201 put_be32(pb, 0); /* size placeholder*/
1202 put_tag(pb, "mdat");
1206 /* TODO: This needs to be more general */
/*
 * Writes the fixed-size (0x14 bytes) "ftyp" atom: a brand chosen from
 * mov->mode, the constant 0x200, and one more brand. 3GP, 3G2 and PSP repeat
 * the same brand ("3gp4", "3g2a", "MSNV"); every other mode writes "isom"
 * followed by "mp41".
 */
1207 int mov_write_ftyp_tag(ByteIOContext *pb, AVFormatContext *s)
1209 MOVContext *mov = s->priv_data;
1211 put_be32(pb, 0x14 ); /* size */
1212 put_tag(pb, "ftyp");
/* first brand */
1214 if ( mov->mode == MODE_3GP )
1215 put_tag(pb, "3gp4");
1216 else if ( mov->mode == MODE_3G2 )
1217 put_tag(pb, "3g2a");
1218 else if ( mov->mode == MODE_PSP )
1219 put_tag(pb, "MSNV");
1221 put_tag(pb, "isom");
1223 put_be32(pb, 0x200 );
/* second brand */
1225 if ( mov->mode == MODE_3GP )
1226 put_tag(pb, "3gp4");
1227 else if ( mov->mode == MODE_3G2 )
1228 put_tag(pb, "3g2a");
1229 else if ( mov->mode == MODE_PSP )
1230 put_tag(pb, "MSNV");
1232 put_tag(pb, "mp41");
/*
 * Writes the fixed-size (0x94 bytes) "uuid"/"PROF" atom used in PSP mode,
 * made of three sections: FPRF, APRF (audio) and VPRF (video).
 *
 * The audio sample rate is read from stream 1 and the frame rate, width and
 * height from stream 0. The frame rate is stored as
 * frame_rate * 0x10000 / frame_rate_base.
 * NOTE(review): this relies on stream 0 being video and stream 1 being audio;
 * the caller only checks that there are exactly two streams -- confirm the
 * order is guaranteed.
 */
1237 static void mov_write_uuidprof_tag(ByteIOContext *pb, AVFormatContext *s)
1239 int AudioRate = s->streams[1]->codec.sample_rate;
1240 int FrameRate = ((s->streams[0]->codec.frame_rate) * (0x10000))/ (s->streams[0]->codec.frame_rate_base);
1242 //printf("audiorate = %d\n",AudioRate);
1243 //printf("framerate = %d / %d = 0x%x\n",s->streams[0]->codec.frame_rate,s->streams[0]->codec.frame_rate_base,FrameRate);
1245 put_be32(pb, 0x94 ); /* size */
1246 put_tag(pb, "uuid");
1247 put_tag(pb, "PROF");
1249 put_be32(pb, 0x21d24fce ); /* 96 bit UUID */
1250 put_be32(pb, 0xbb88695c );
1251 put_be32(pb, 0xfac9c740 );
1253 put_be32(pb, 0x0 ); /* ? */
1254 put_be32(pb, 0x3 ); /* 3 sections ? */
1256 put_be32(pb, 0x14 ); /* size */
1257 put_tag(pb, "FPRF");
1258 put_be32(pb, 0x0 ); /* ? */
1259 put_be32(pb, 0x0 ); /* ? */
1260 put_be32(pb, 0x0 ); /* ? */
1262 put_be32(pb, 0x2c ); /* size */
1263 put_tag(pb, "APRF"); /* audio */
1266 put_tag(pb, "mp4a");
1267 put_be32(pb, 0x20f );
1269 put_be32(pb, 0x40 );
1270 put_be32(pb, 0x40 );
1271 put_be32(pb, AudioRate ); //24000 ... audio rate?
1274 put_be32(pb, 0x34 ); /* size */
1275 put_tag(pb, "VPRF"); /* video */
1278 put_tag(pb, "mp4v");
1279 put_be32(pb, 0x103 );
1281 put_be32(pb, 0xc0 );
1282 put_be32(pb, 0xc0 );
1283 put_be32(pb, FrameRate); // was 0xefc29
1284 put_be32(pb, FrameRate ); // was 0xefc29
1285 put_be16(pb, s->streams[0]->codec.width);
1286 put_be16(pb, s->streams[0]->codec.height);
1287 put_be32(pb, 0x010001 );
/*
 * Muxer header callback: inspect the streams, select the container mode and
 * write the leading atoms.
 *
 * Steps visible below:
 *  1. For every stream, look its codec id up in the MOV tag table, then in
 *     the MS-style table (codec_bmp_tags for video, codec_wav_tags for
 *     audio), logging a warning about MS-style tags.
 *  2. Default the mode to MODE_MP4 and override it from s->oformat->name
 *     ("3gp", "3g2", "mov", "psp").
 *  3. Write 'ftyp' for every mode except MODE_MOV.
 *  4. In PSP mode, require exactly two streams and write the PROF uuid atom.
 *  5. Copy the mode into all MAX_STREAMS track slots and flush the output.
 *
 * Return statements are not visible here; confirm the error and success
 * values against the complete source.
 */
1290 static int mov_write_header(AVFormatContext *s)
1292 ByteIOContext *pb = &s->pb;
1293 MOVContext *mov = s->priv_data;
1296 for(i=0; i<s->nb_streams; i++){
1297 AVCodecContext *c= &s->streams[i]->codec;
1299 if (c->codec_type == CODEC_TYPE_VIDEO){
/* No native MOV video tag: try the MS (BMP) table next. What happens when
 * that lookup also fails is not visible here -- presumably an error return;
 * confirm. */
1300 if (!codec_get_tag(codec_movvideo_tags, c->codec_id)){
1301 if(!codec_get_tag(codec_bmp_tags, c->codec_id))
1304 av_log(s, AV_LOG_INFO, "Warning, using MS style video codec tag, the file may be unplayable!\n");
1306 }else if(c->codec_type == CODEC_TYPE_AUDIO){
/* Same two-level lookup for audio, using the WAV table as the second one. */
1307 if (!codec_get_tag(codec_movaudio_tags, c->codec_id)){
1308 if(!codec_get_tag(codec_wav_tags, c->codec_id))
1311 av_log(s, AV_LOG_INFO, "Warning, using MS style audio codec tag, the file may be unplayable!\n");
1316 /* Default mode == MP4 */
1317 mov->mode = MODE_MP4;
/* The output format's short name picks the container flavour. */
1319 if (s->oformat != NULL) {
1320 if (!strcmp("3gp", s->oformat->name)) mov->mode = MODE_3GP;
1321 else if (!strcmp("3g2", s->oformat->name)) mov->mode = MODE_3G2;
1322 else if (!strcmp("mov", s->oformat->name)) mov->mode = MODE_MOV;
1323 else if (!strcmp("psp", s->oformat->name)) mov->mode = MODE_PSP;
/* MODE_MOV is the only mode for which no 'ftyp' atom is written. */
1325 if ( mov->mode == MODE_3GP || mov->mode == MODE_3G2 ||
1326 mov->mode == MODE_MP4 || mov->mode == MODE_PSP )
1327 mov_write_ftyp_tag(pb,s);
1328 if ( mov->mode == MODE_PSP ) {
/* NOTE(review): only the stream count is checked. mov_write_uuidprof_tag()
 * reads stream 0 as video and stream 1 as audio, so the stream types and
 * order the message asks for are not verified here. Also note that 'ftyp'
 * has already been written by the time this check runs. */
1329 if ( s->nb_streams != 2 ) {
1330 av_log(s, AV_LOG_ERROR, "PSP mode need one video and one audio stream\n");
1333 mov_write_uuidprof_tag(pb,s);
/* Every track slot gets the mode, whether or not a stream uses it. */
1337 for (i=0; i<MAX_STREAMS; i++) {
1338 mov->tracks[i].mode = mov->mode;
1341 put_flush_packet(pb);
/*
 * Muxer packet callback: append one packet's payload to the output and
 * record an index entry for it in the owning track.
 *
 * s    muxer context (s->priv_data is the MOVContext)
 * pkt  packet to write; pkt->stream_index selects both the stream and the
 *      MOVTrack slot
 *
 * Returns 0 without writing anything when the output is streamed or the
 * packet is empty. Other return paths are not visible here.
 *
 * Index entries live in fixed-size clusters of MOV_INDEX_CLUSTER_SIZE
 * MOVIentry elements; trk->cluster is an array of pointers to them.
 */
1346 static int mov_write_packet(AVFormatContext *s, AVPacket *pkt)
1348 MOVContext *mov = s->priv_data;
1349 ByteIOContext *pb = &s->pb;
1350 AVCodecContext *enc = &s->streams[pkt->stream_index]->codec;
1351 MOVTrack* trk = &mov->tracks[pkt->stream_index];
1353 unsigned int samplesInChunk = 0;
1354 int size= pkt->size;
1356 if (url_is_streamed(&s->pb)) return 0; /* Can't handle that */
1357 if (!size) return 0; /* Discard 0 sized packets */
/* Work out how many samples this packet contributes. The body of the video
 * branch is not visible here. */
1359 if (enc->codec_type == CODEC_TYPE_VIDEO ) {
1362 else if (enc->codec_type == CODEC_TYPE_AUDIO ) {
1363 if( enc->codec_id == CODEC_ID_AMR_NB) {
1364 /* We must find out how many AMR blocks there are in one packet */
/* Block size in bytes, indexed by the 4-bit field in bits 3..6 of a block's
 * first byte (presumably the AMR frame type -- confirm). */
1365 static uint16_t packed_size[16] =
1366 {13, 14, 16, 18, 20, 21, 27, 32, 6, 0, 0, 0, 0, 0, 0, 0};
/* Walk the packet block by block. A table entry of 0 does not advance len,
 * so the samplesInChunk < 100 bound is what guarantees termination; the
 * statement that increments samplesInChunk is not visible here. */
1369 while (len < size && samplesInChunk < 100) {
1370 len += packed_size[(pkt->data[len] >> 3) & 0x0F];
/* PCM: derive the sample count from the byte size (1 byte per sample per
 * channel for A-law, 2 for 16-bit).
 * NOTE(review): enc->channels == 0 would divide by zero; not guarded here. */
1374 else if(enc->codec_id == CODEC_ID_PCM_ALAW) {
1375 samplesInChunk = size/enc->channels;
1377 else if(enc->codec_id == CODEC_ID_PCM_S16BE || enc->codec_id == CODEC_ID_PCM_S16LE) {
1378 samplesInChunk = size/(2*enc->channels);
/* On the first MPEG-4 / AAC packet of a track, keep a private copy of the
 * codec extradata in trk->vosData.
 * NOTE(review): the av_malloc() result is passed to memcpy() unchecked.
 * If extradata_size is 0, vosLen stays 0 and this branch runs again for
 * every later packet. */
1385 if ((enc->codec_id == CODEC_ID_MPEG4 || enc->codec_id == CODEC_ID_AAC)
1386 && trk->vosLen == 0) {
1387 // assert(enc->extradata_size);
1389 trk->vosLen = enc->extradata_size;
1390 trk->vosData = av_malloc(trk->vosLen);
1391 memcpy(trk->vosData, enc->extradata, trk->vosLen);
/* Locate the slot for entry number trk->entry: cluster index and offset. */
1394 cl = trk->entry / MOV_INDEX_CLUSTER_SIZE;
1395 id = trk->entry % MOV_INDEX_CLUSTER_SIZE;
/* All allocated slots are used: grow the pointer array by one and allocate
 * a fresh cluster.
 * NOTE(review): assigning av_realloc()'s result straight back to
 * trk->cluster loses the old array if the call fails. The handling after
 * each allocation check is not visible here. */
1397 if (trk->ents_allocated <= trk->entry) {
1398 trk->cluster = av_realloc(trk->cluster, (cl+1)*sizeof(void*));
1401 trk->cluster[cl] = av_malloc(MOV_INDEX_CLUSTER_SIZE*sizeof(MOVIentry));
1402 if (!trk->cluster[cl])
1404 trk->ents_allocated += MOV_INDEX_CLUSTER_SIZE;
/* The mdat atom header is written once, just before the first payload. */
1406 if (mov->mdat_written == 0) {
1407 mov_write_mdat_tag(pb, mov);
1408 mov->mdat_written = 1;
1409 mov->time = s->timestamp;
/* Record where this packet starts and how large it is.
 * NOTE(review): MOVIentry.pos is declared unsigned int at the top of the
 * file, so offsets that do not fit in that type are truncated here. */
1412 trk->cluster[cl][id].pos = url_ftell(pb);
1413 trk->cluster[cl][id].samplesInChunk = samplesInChunk;
1414 trk->cluster[cl][id].size = size;
1415 trk->cluster[cl][id].entries = samplesInChunk;
/* Key-frame flags are tracked for video only; !! folds the masked flag
 * into 0 or 1. */
1416 if(enc->codec_type == CODEC_TYPE_VIDEO) {
1417 trk->cluster[cl][id].key_frame = !!(pkt->flags & PKT_FLAG_KEY);
1418 if(trk->cluster[cl][id].key_frame)
1419 trk->hasKeyframes = 1;
/* Per-track running totals, then the payload itself. */
1423 trk->sampleCount += samplesInChunk;
1424 trk->mdat_size += size;
1426 put_buffer(pb, pkt->data, size);
1428 put_flush_packet(pb);
/*
 * Muxer trailer callback: finish the mdat atom, write the 'moov' atom and
 * release the per-track index memory.
 *
 * The current output position is remembered as the start of 'moov'. The
 * payload sizes of all tracks that allocated index entries are summed, the
 * stream is positioned at mov->mdat_pos and then back at the remembered
 * position, and mov_write_moov_tag() is called. Finally every track's
 * clusters, cluster pointer array and vosData are freed and its counters
 * reset.
 *
 * Local declarations and the return statement are not visible here.
 */
1432 static int mov_write_trailer(AVFormatContext *s)
1434 MOVContext *mov = s->priv_data;
1435 ByteIOContext *pb = &s->pb;
1439 offset_t moov_pos = url_ftell(pb);
1441 /* Write size of mdat tag */
/* j accumulates the total payload size across the tracks in use.
 * NOTE(review): j's declaration is not visible; if it is a plain int the
 * sum can overflow for large outputs -- confirm. */
1442 for (i=0, j=0; i<MAX_STREAMS; i++) {
1443 if(mov->tracks[i].ents_allocated > 0) {
1444 j += mov->tracks[i].mdat_size;
/* Jump back to the mdat header and return to the end of the data. The
 * write that patches the size is not visible between these two seeks --
 * confirm against the complete source. */
1447 url_fseek(pb, mov->mdat_pos, SEEK_SET);
1449 url_fseek(pb, moov_pos, SEEK_SET);
1451 mov_write_moov_tag(pb, mov, s);
/* Clusters are allocated MOV_INDEX_CLUSTER_SIZE entries at a time, so
 * ents_allocated / MOV_INDEX_CLUSTER_SIZE is the number of clusters. */
1453 for (i=0; i<MAX_STREAMS; i++) {
1454 for (j=0; j<mov->tracks[i].ents_allocated/MOV_INDEX_CLUSTER_SIZE; j++) {
1455 av_free(mov->tracks[i].cluster[j]);
1457 av_free(mov->tracks[i].cluster);
1458 if( mov->tracks[i].vosLen ) av_free( mov->tracks[i].vosData );
/* Leave the track slot in its empty state. */
1460 mov->tracks[i].cluster = NULL;
1461 mov->tracks[i].ents_allocated = mov->tracks[i].entry = 0;
1464 put_flush_packet(pb);
/*
 * Output format descriptors, one per container flavour handled by this
 * muxer. All five are registered by movenc_init(). Their initializer bodies
 * are not visible here; presumably each names itself with one of the
 * strings mov_write_header() compares against ("mov", "3gp", "psp", "3g2")
 * or with the MP4 default -- confirm against the complete source.
 */
1469 static AVOutputFormat mov_oformat = {
1482 static AVOutputFormat _3gp_oformat = {
1495 static AVOutputFormat mp4_oformat = {
1508 static AVOutputFormat psp_oformat = {
1521 static AVOutputFormat _3g2_oformat = {
/*
 * Register the five output formats defined in this file (mov, 3gp, mp4, psp
 * and 3g2 descriptors) through av_register_output_format().
 *
 * Takes no arguments. The return statement is not visible here.
 */
1534 int movenc_init(void)
1536 av_register_output_format(&mov_oformat);
1537 av_register_output_format(&_3gp_oformat);
1538 av_register_output_format(&mp4_oformat);
1539 av_register_output_format(&psp_oformat);
1540 av_register_output_format(&_3g2_oformat);