1 /*****************************************************************************
2 * mp4.c: x264 mp4 output module
3 *****************************************************************************
4 * Copyright (C) 2003-2009 x264 project
6 * Authors: Laurent Aimar <fenrir@via.ecp.fr>
7 * Loren Merritt <lorenm@u.washington.edu>
9 * This program is free software; you can redistribute it and/or modify
10 * it under the terms of the GNU General Public License as published by
11 * the Free Software Foundation; either version 2 of the License, or
12 * (at your option) any later version.
14 * This program is distributed in the hope that it will be useful,
15 * but WITHOUT ANY WARRANTY; without even the implied warranty of
16 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
17 * GNU General Public License for more details.
19 * You should have received a copy of the GNU General Public License
20 * along with this program; if not, write to the Free Software
21 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02111, USA.
22 *****************************************************************************/
25 #include <gpac/isomedia.h>
30 GF_AVCConfig *p_config;
31 GF_ISOSample *p_sample;
40 static void recompute_bitrate_mp4( GF_ISOFile *p_file, int i_track )
42 u32 i, count, di, timescale, time_wnd, rate;
47 esd = gf_isom_get_esd( p_file, i_track, 1 );
51 esd->decoderConfig->avgBitrate = 0;
52 esd->decoderConfig->maxBitrate = 0;
55 timescale = gf_isom_get_media_timescale( p_file, i_track );
56 count = gf_isom_get_sample_count( p_file, i_track );
57 for( i = 0; i < count; i++ )
59 GF_ISOSample *samp = gf_isom_get_sample_info( p_file, i_track, i+1, &di, &offset );
62 fprintf( stderr, "mp4 [error]: failure reading back frame %u\n", i );
66 if( esd->decoderConfig->bufferSizeDB < samp->dataLength )
67 esd->decoderConfig->bufferSizeDB = samp->dataLength;
69 esd->decoderConfig->avgBitrate += samp->dataLength;
70 rate += samp->dataLength;
71 if( samp->DTS > time_wnd + timescale )
73 if( rate > esd->decoderConfig->maxBitrate )
74 esd->decoderConfig->maxBitrate = rate;
79 gf_isom_sample_del( &samp );
82 br = (Double)(s64)gf_isom_get_media_duration( p_file, i_track );
84 esd->decoderConfig->avgBitrate = (u32)(esd->decoderConfig->avgBitrate / br);
86 esd->decoderConfig->avgBitrate *= 8;
87 esd->decoderConfig->maxBitrate *= 8;
89 gf_isom_change_mpeg4_description( p_file, i_track, 1, esd );
90 gf_odf_desc_del( (GF_Descriptor*)esd );
93 static int close_file( hnd_t handle, int64_t largest_pts, int64_t second_largest_pts )
95 mp4_hnd_t *p_mp4 = handle;
96 uint64_t total_duration = 0;
101 if( p_mp4->p_config )
102 gf_odf_avc_cfg_del( p_mp4->p_config );
104 if( p_mp4->p_sample )
106 if( p_mp4->p_sample->data )
107 free( p_mp4->p_sample->data );
109 gf_isom_sample_del( &p_mp4->p_sample );
114 /* The mdhd duration is defined as CTS[final] - CTS[0] + duration of last frame.
115 * The mdhd duration (in seconds) should be able to be longer than the tkhd duration since the track is managed by edts.
116 * So, if mdhd duration is equal to the last DTS or less, we give the last composition time delta to the last sample duration.
117 * And then, the mdhd duration is updated, but it time-wise doesn't give the actual duration.
118 * The tkhd duration is the actual track duration. */
119 uint64_t mdhd_duration = (2 * largest_pts - second_largest_pts - p_mp4->i_delay_time) * p_mp4->i_time_inc;
120 total_duration = gf_isom_get_media_duration( p_mp4->p_file, p_mp4->i_track );
121 if( mdhd_duration != total_duration )
123 uint64_t last_dts = gf_isom_get_sample_dts( p_mp4->p_file, p_mp4->i_track, p_mp4->i_numframe );
124 uint32_t last_duration = (uint32_t)( mdhd_duration > last_dts ? mdhd_duration - last_dts : (largest_pts - second_largest_pts) * p_mp4->i_time_inc );
125 gf_isom_set_last_sample_duration( p_mp4->p_file, p_mp4->i_track, last_duration );
126 total_duration = gf_isom_get_media_duration( p_mp4->p_file, p_mp4->i_track );
129 /* Write an Edit Box if the first CTS offset is positive.
130 * A media_time is given by not the mvhd timescale but rather the mdhd timescale.
131 * The reason is that an Edit Box maps the presentation time-line to the media time-line.
132 * Any demuxers should follow the Edit Box if it exists. */
133 GF_ISOSample *sample = gf_isom_get_sample_info( p_mp4->p_file, p_mp4->i_track, 1, NULL, NULL );
134 if( sample->CTS_Offset > 0 )
136 uint32_t mvhd_timescale = gf_isom_get_timescale( p_mp4->p_file );
137 uint64_t tkhd_duration = (uint64_t)( mdhd_duration * ( (double)mvhd_timescale / p_mp4->i_time_res ) );
138 gf_isom_append_edit_segment( p_mp4->p_file, p_mp4->i_track, tkhd_duration, sample->CTS_Offset, GF_ISOM_EDIT_NORMAL );
140 gf_isom_sample_del( &sample );
142 recompute_bitrate_mp4( p_mp4->p_file, p_mp4->i_track );
143 gf_isom_set_pl_indication( p_mp4->p_file, GF_ISOM_PL_VISUAL, 0x15 );
144 gf_isom_set_storage_mode( p_mp4->p_file, GF_ISOM_STORE_FLAT );
145 gf_isom_close( p_mp4->p_file );
153 static int open_file( char *psz_filename, hnd_t *p_handle )
158 FILE *fh = fopen( psz_filename, "w" );
161 else if( !x264_is_regular_file( fh ) )
163 fprintf( stderr, "mp4 [error]: MP4 output is incompatible with non-regular file `%s'\n", psz_filename );
168 if( !(p_mp4 = malloc( sizeof(mp4_hnd_t) )) )
171 memset( p_mp4, 0, sizeof(mp4_hnd_t) );
172 p_mp4->p_file = gf_isom_open( psz_filename, GF_ISOM_OPEN_WRITE, NULL );
174 if( !(p_mp4->p_sample = gf_isom_sample_new()) )
176 close_file( p_mp4, 0, 0 );
180 gf_isom_set_brand_info( p_mp4->p_file, GF_ISOM_BRAND_AVC1, 0 );
187 static int set_param( hnd_t handle, x264_param_t *p_param )
189 mp4_hnd_t *p_mp4 = handle;
191 p_mp4->i_time_res = p_param->i_timebase_den;
192 p_mp4->i_time_inc = p_param->i_timebase_num;
194 p_mp4->i_track = gf_isom_new_track( p_mp4->p_file, 0, GF_ISOM_MEDIA_VISUAL,
197 p_mp4->p_config = gf_odf_avc_cfg_new();
198 gf_isom_avc_config_new( p_mp4->p_file, p_mp4->i_track, p_mp4->p_config,
199 NULL, NULL, &p_mp4->i_descidx );
201 gf_isom_set_track_enabled( p_mp4->p_file, p_mp4->i_track, 1 );
203 gf_isom_set_visual_info( p_mp4->p_file, p_mp4->i_track, p_mp4->i_descidx,
204 p_param->i_width, p_param->i_height );
206 if( p_param->vui.i_sar_width && p_param->vui.i_sar_height )
208 uint64_t dw = p_param->i_width << 16;
209 uint64_t dh = p_param->i_height << 16;
210 double sar = (double)p_param->vui.i_sar_width / p_param->vui.i_sar_height;
215 gf_isom_set_track_layout_info( p_mp4->p_file, p_mp4->i_track, dw, dh, 0, 0, 0 );
218 p_mp4->p_sample->data = malloc( p_param->i_width * p_param->i_height * 3 / 2 );
219 if( !p_mp4->p_sample->data )
225 static int write_headers( hnd_t handle, x264_nal_t *p_nal )
227 mp4_hnd_t *p_mp4 = handle;
228 GF_AVCConfigSlot *p_slot;
230 int sei_size = p_nal[0].i_payload;
231 int sps_size = p_nal[1].i_payload - 4;
232 int pps_size = p_nal[2].i_payload - 4;
234 uint8_t *sei = p_nal[0].p_payload;
235 uint8_t *sps = p_nal[1].p_payload + 4;
236 uint8_t *pps = p_nal[2].p_payload + 4;
240 p_mp4->p_config->configurationVersion = 1;
241 p_mp4->p_config->AVCProfileIndication = sps[1];
242 p_mp4->p_config->profile_compatibility = sps[2];
243 p_mp4->p_config->AVCLevelIndication = sps[3];
244 p_slot = malloc( sizeof(GF_AVCConfigSlot) );
247 p_slot->size = sps_size;
248 p_slot->data = malloc( p_slot->size );
251 memcpy( p_slot->data, sps, sps_size );
252 gf_list_add( p_mp4->p_config->sequenceParameterSets, p_slot );
256 p_slot = malloc( sizeof(GF_AVCConfigSlot) );
259 p_slot->size = pps_size;
260 p_slot->data = malloc( p_slot->size );
263 memcpy( p_slot->data, pps, pps_size );
264 gf_list_add( p_mp4->p_config->pictureParameterSets, p_slot );
265 gf_isom_avc_config_update( p_mp4->p_file, p_mp4->i_track, 1, p_mp4->p_config );
269 memcpy( p_mp4->p_sample->data + p_mp4->p_sample->dataLength, sei, sei_size );
270 p_mp4->p_sample->dataLength += sei_size;
272 return sei_size + sps_size + pps_size;
274 static int write_frame( hnd_t handle, uint8_t *p_nalu, int i_size, x264_picture_t *p_picture )
276 mp4_hnd_t *p_mp4 = handle;
280 memcpy( p_mp4->p_sample->data + p_mp4->p_sample->dataLength, p_nalu, i_size );
281 p_mp4->p_sample->dataLength += i_size;
283 if( !p_mp4->i_numframe )
284 p_mp4->i_delay_time = p_picture->i_dts * -1;
286 dts = (p_picture->i_dts + p_mp4->i_delay_time) * p_mp4->i_time_inc;
287 cts = (p_picture->i_pts + p_mp4->i_delay_time) * p_mp4->i_time_inc;
289 p_mp4->p_sample->IsRAP = p_picture->b_keyframe;
290 p_mp4->p_sample->DTS = dts;
291 p_mp4->p_sample->CTS_Offset = (uint32_t)(cts - dts);
292 gf_isom_add_sample( p_mp4->p_file, p_mp4->i_track, p_mp4->i_descidx, p_mp4->p_sample );
294 p_mp4->p_sample->dataLength = 0;
300 cli_output_t mp4_output = { open_file, set_param, write_headers, write_frame, close_file };