2 * ISO Media common code
3 * copyright (c) 2001 Fabrice Bellard
4 * copyright (c) 2002 Francois Revol <revol@free.fr>
5 * copyright (c) 2006 Baptiste Coudurier <baptiste.coudurier@free.fr>
7 * This file is part of FFmpeg.
9 * FFmpeg is free software; you can redistribute it and/or
10 * modify it under the terms of the GNU Lesser General Public
11 * License as published by the Free Software Foundation; either
12 * version 2.1 of the License, or (at your option) any later version.
14 * FFmpeg is distributed in the hope that it will be useful,
15 * but WITHOUT ANY WARRANTY; without even the implied warranty of
16 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
17 * Lesser General Public License for more details.
19 * You should have received a copy of the GNU Lesser General Public
20 * License along with FFmpeg; if not, write to the Free Software
21 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
24 #ifndef AVFORMAT_ISOM_H
25 #define AVFORMAT_ISOM_H
30 #include "libavutil/encryption_info.h"
31 #include "libavutil/mastering_display_metadata.h"
32 #include "libavutil/spherical.h"
33 #include "libavutil/stereo3d.h"
/*
 * AVCodecTag tables shared through this header. They are only declared here
 * (extern, unsized arrays); the definitions live elsewhere.
 */
40 extern const AVCodecTag ff_mp4_obj_type[];
41 extern const AVCodecTag ff_codec_movvideo_tags[];
42 extern const AVCodecTag ff_codec_movaudio_tags[];
43 extern const AVCodecTag ff_codec_movsubtitle_tags[];
44 extern const AVCodecTag ff_codec_movdata_tags[];
/*
 * Language code conversion helpers (declarations only).
 * The string side of each conversion is declared as char[4]; the numeric side
 * is the int return value of the first function and the unsigned 'code'
 * argument of the second.
 * NOTE(review): judging by the names these convert between ISO 639 language
 * strings and the code stored in the container, with 'mp4' selecting the
 * variant -- confirm against the definitions, including the return values.
 */
46 int ff_mov_iso639_to_lang(const char lang[4], int mp4);
47 int ff_mov_lang_to_iso639(unsigned code, char to[4]);
51 /* the QuickTime file format is quite convoluted...
52 * it has lots of index tables, each indexing something in another one...
53 * Here we just use what is needed to read the chunks
56 typedef struct MOVStts {
61 typedef struct MOVStsc {
67 typedef struct MOVElst {
73 typedef struct MOVDref {
79 int16_t nlvl_to, nlvl_from;
82 typedef struct MOVAtom {
84 int64_t size; /* total size (excluding the size and type fields) */
/* Forward declaration only; the struct's members are not given at this point. */
87 struct MOVParseTableEntry;
89 typedef struct MOVFragment {
91 uint64_t base_data_offset;
93 uint64_t implicit_offset;
100 typedef struct MOVTrackExt {
108 typedef struct MOVSbgp {
/*
 * Encryption bookkeeping: an array of AVEncryptionInfo pointers together with
 * its element count, plus auxiliary-info size and offset arrays that each
 * carry their own count field.
 */
113 typedef struct MOVEncryptionIndex {
114 // Individual encrypted samples. If there are no elements, then the default
115 // settings will be used.
116 unsigned int nb_encrypted_samples;
117 AVEncryptionInfo **encrypted_samples;
/*
 * NOTE(review): presumably auxiliary_info_sample_count is the length of
 * auxiliary_info_sizes and auxiliary_offsets_count the length of
 * auxiliary_offsets -- confirm against the code that fills them in.
 */
119 uint8_t* auxiliary_info_sizes;
120 size_t auxiliary_info_sample_count;
121 uint8_t auxiliary_info_default_size;
122 uint64_t* auxiliary_offsets; ///< Absolute seek position
123 size_t auxiliary_offsets_count;
124 } MOVEncryptionIndex;
/*
 * Stream-level information referenced from MOVFragmentIndexItem::stream_info.
 * NOTE(review): presumably one entry per stream per fragment -- confirm
 * against the code that allocates these.
 */
126 typedef struct MOVFragmentStreamInfo {
/* NOTE(review): name suggests a pts taken from a 'tfra' entry -- confirm. */
129 int64_t first_tfra_pts;
/* Pointer to a MOVEncryptionIndex; ownership is not visible from here. */
132 MOVEncryptionIndex *encryption_index;
133 } MOVFragmentStreamInfo;
/*
 * One element of the array that MOVFragmentIndex::item points to.
 */
135 typedef struct MOVFragmentIndexItem {
/*
 * Pointer to MOVFragmentStreamInfo.
 * NOTE(review): presumably an array with one element per stream -- confirm
 * against the allocation site.
 */
140 MOVFragmentStreamInfo * stream_info;
141 } MOVFragmentIndexItem;
143 typedef struct MOVFragmentIndex {
148 MOVFragmentIndexItem * item;
151 typedef struct MOVIndexRange {
156 typedef struct MOVStreamContext {
159 int ffindex; ///< AVStream index
161 unsigned int chunk_count;
162 int64_t *chunk_offsets;
163 unsigned int stts_count;
165 unsigned int ctts_count;
166 unsigned int ctts_allocated_size;
168 unsigned int stsc_count;
170 unsigned int stsc_index;
172 unsigned int stps_count;
173 unsigned *stps_data; ///< partial sync sample for mpeg-2 open gop
175 unsigned int elst_count;
178 unsigned int sample_size; ///< may contain value calculated from stsd or value from stsz atom
179 unsigned int stsz_sample_size; ///< always contains sample size from stsz atom
180 unsigned int sample_count;
183 unsigned int keyframe_count;
186 int64_t time_offset; ///< time offset of the edit list entries
187 int64_t min_corrected_pts; ///< minimum Composition time shown by the edits excluding empty edits.
189 int64_t current_index;
190 MOVIndexRange* index_ranges;
191 MOVIndexRange* current_index_range;
192 unsigned int bytes_per_frame;
193 unsigned int samples_per_frame;
194 int dv_audio_container;
195 int pseudo_stream_id; ///< -1 means demux all ids
196 int16_t audio_cid; ///< stsd audio compression id
197 unsigned drefs_count;
201 int width; ///< tkhd width
202 int height; ///< tkhd height
203 int dts_shift; ///< dts shift when ctts is negative
204 uint32_t palette[256];
207 uint32_t tmcd_flags; ///< tmcd track flags
208 int64_t track_end; ///< used for dts generation in fragmented movie files
209 int start_pad; ///< amount of samples to skip due to enc-dec delay
210 unsigned int rap_group_count;
213 int nb_frames_for_fps;
214 int64_t duration_for_fps;
216 /** extradata array (and size) for multiple stsd */
223 int32_t *display_matrix;
224 AVStereo3D *stereo3d;
225 AVSphericalMapping *spherical;
226 size_t spherical_size;
227 AVMasteringDisplayMetadata *mastering;
228 AVContentLightMetadata *coll;
233 int has_sidx; // If there is an sidx entry for this stream.
235 struct AVAESCTR* aes_ctr;
236 unsigned int per_sample_iv_size; // Either 0, 8, or 16.
237 AVEncryptionInfo *default_encrypted_sample;
238 MOVEncryptionIndex *encryption_index;
242 typedef struct MOVContext {
243 const AVClass *class; ///< class for private options
246 int64_t duration; ///< duration of the longest track
247 int found_moov; ///< 'moov' atom has been found
248 int found_mdat; ///< 'mdat' atom has been found
249 int found_hdlr_mdta; ///< 'hdlr' atom with type 'mdta' has been found
250 int trak_index; ///< Index of the current 'trak'
252 unsigned meta_keys_count;
253 DVDemuxContext *dv_demux;
254 AVFormatContext *dv_fctx;
255 int isom; ///< 1 if file is ISO Media (mp4/3gp)
256 MOVFragment fragment; ///< current fragment in moof atom
257 MOVTrackExt *trex_data;
259 int itunes_metadata; ///< metadata are itunes style
260 int handbrake_version;
262 unsigned int nb_chapter_tracks;
263 int use_absolute_path;
265 int advanced_editlist;
267 int seek_individually;
268 int64_t next_root_atom; ///< offset of the next root atom
271 int *bitrates; ///< bitrates read before streams creation
275 int has_looked_for_mfra;
276 MOVFragmentIndex frag_index;
278 unsigned int aax_mode; ///< 'aax' file has been detected
279 uint8_t file_key[20];
281 void *activation_bytes;
282 int activation_bytes_size;
283 void *audible_fixed_key;
284 int audible_fixed_key_size;
285 struct AVAES *aes_decrypt;
286 uint8_t *decryption_key;
287 int decryption_key_len;
289 int32_t movie_display_matrix[3][3]; ///< display matrix from mvhd
/*
 * MP4 descriptor helpers (declarations only). Each one takes the AVIOContext
 * 'pb' it operates on; ff_mp4_read_descr() and ff_mp4_parse_es_descr()
 * additionally take an int pointer ('tag' / 'es_id').
 * NOTE(review): those pointers look like output arguments, and the int return
 * values like a length or an error code -- confirm against the definitions.
 */
292 int ff_mp4_read_descr_len(AVIOContext *pb);
293 int ff_mp4_read_descr(AVFormatContext *fc, AVIOContext *pb, int *tag);
294 int ff_mp4_read_dec_config_descr(AVFormatContext *fc, AVStream *st, AVIOContext *pb);
295 void ff_mp4_parse_es_descr(AVIOContext *pb, int *es_id);
/* MP4 descriptor tag constants, consecutive values 0x01 through 0x06. */
297 #define MP4ODescrTag 0x01
298 #define MP4IODescrTag 0x02
299 #define MP4ESDescrTag 0x03
300 #define MP4DecConfigDescrTag 0x04
301 #define MP4DecSpecificDescrTag 0x05
302 #define MP4SLDescrTag 0x06
/*
 * Flag bits named after the 'tfhd' atom. Every value is a distinct single
 * bit, so the flags can be combined with bitwise OR and tested with AND.
 */
304 #define MOV_TFHD_BASE_DATA_OFFSET 0x01
305 #define MOV_TFHD_STSD_ID 0x02
306 #define MOV_TFHD_DEFAULT_DURATION 0x08
307 #define MOV_TFHD_DEFAULT_SIZE 0x10
308 #define MOV_TFHD_DEFAULT_FLAGS 0x20
309 #define MOV_TFHD_DURATION_IS_EMPTY 0x010000
310 #define MOV_TFHD_DEFAULT_BASE_IS_MOOF 0x020000
/*
 * Flag bits named after the 'trun' atom. Every value is a distinct single
 * bit, so the flags can be combined with bitwise OR and tested with AND.
 */
312 #define MOV_TRUN_DATA_OFFSET 0x01
313 #define MOV_TRUN_FIRST_SAMPLE_FLAGS 0x04
314 #define MOV_TRUN_SAMPLE_DURATION 0x100
315 #define MOV_TRUN_SAMPLE_SIZE 0x200
316 #define MOV_TRUN_SAMPLE_FLAGS 0x400
317 #define MOV_TRUN_SAMPLE_CTS 0x800
/*
 * Layout of the 32-bit fragment sample flags word. The *_MASK values and
 * IS_NON_SYNC cover disjoint bit ranges (bits 0-15, 16, 17-19, 20-21, 22-23
 * and 24-25 respectively).
 */
319 #define MOV_FRAG_SAMPLE_FLAG_DEGRADATION_PRIORITY_MASK 0x0000ffff
320 #define MOV_FRAG_SAMPLE_FLAG_IS_NON_SYNC 0x00010000
321 #define MOV_FRAG_SAMPLE_FLAG_PADDING_MASK 0x000e0000
322 #define MOV_FRAG_SAMPLE_FLAG_REDUNDANCY_MASK 0x00300000
323 #define MOV_FRAG_SAMPLE_FLAG_DEPENDED_MASK 0x00c00000
324 #define MOV_FRAG_SAMPLE_FLAG_DEPENDS_MASK 0x03000000
/* Values of the two-bit field selected by MOV_FRAG_SAMPLE_FLAG_DEPENDS_MASK. */
326 #define MOV_FRAG_SAMPLE_FLAG_DEPENDS_NO 0x02000000
327 #define MOV_FRAG_SAMPLE_FLAG_DEPENDS_YES 0x01000000
/* Flag bits named after the 'tkhd' atom; the four lowest bits, one per flag. */
329 #define MOV_TKHD_FLAG_ENABLED 0x0001
330 #define MOV_TKHD_FLAG_IN_MOVIE 0x0002
331 #define MOV_TKHD_FLAG_IN_PREVIEW 0x0004
332 #define MOV_TKHD_FLAG_IN_POSTER 0x0008
/*
 * Sample dependency states as plain values 0, 1 and 2.
 * NOTE(review): YES = 1 / NO = 2 matches the ordering of the
 * MOV_FRAG_SAMPLE_FLAG_DEPENDS_* values shifted down by 24 bits; whether the
 * code relies on that relationship is not visible here.
 */
334 #define MOV_SAMPLE_DEPENDENCY_UNKNOWN 0x0
335 #define MOV_SAMPLE_DEPENDENCY_YES 0x1
336 #define MOV_SAMPLE_DEPENDENCY_NO 0x2
/*
 * Evaluates to nonzero when 'tag' equals one of the fourcc values listed
 * below (ai5p, ai5q, ai52, ai53, ai55, ai56, ai1p, ai1q, ai12, ai13, ai15,
 * ai16, aivx, AVin), and to zero otherwise.
 *
 * The argument is expanded once per comparison, so it may be evaluated up to
 * fourteen times: do not pass an expression with side effects.
 * Requires MKTAG to be in scope at the point of use.
 */
339 #define TAG_IS_AVCI(tag) \
340 ((tag) == MKTAG('a', 'i', '5', 'p') || \
341 (tag) == MKTAG('a', 'i', '5', 'q') || \
342 (tag) == MKTAG('a', 'i', '5', '2') || \
343 (tag) == MKTAG('a', 'i', '5', '3') || \
344 (tag) == MKTAG('a', 'i', '5', '5') || \
345 (tag) == MKTAG('a', 'i', '5', '6') || \
346 (tag) == MKTAG('a', 'i', '1', 'p') || \
347 (tag) == MKTAG('a', 'i', '1', 'q') || \
348 (tag) == MKTAG('a', 'i', '1', '2') || \
349 (tag) == MKTAG('a', 'i', '1', '3') || \
350 (tag) == MKTAG('a', 'i', '1', '5') || \
351 (tag) == MKTAG('a', 'i', '1', '6') || \
352 (tag) == MKTAG('a', 'i', 'v', 'x') || \
353 (tag) == MKTAG('A', 'V', 'i', 'n'))
/*
 * Further mov helpers (declarations only).
 * NOTE(review): from the names, ff_mov_read_esds() parses an 'esds' atom from
 * 'pb', ff_mov_read_stsd_entries() reads 'entries' sample descriptions, and
 * ff_mov_write_chan() writes a 'chan' atom for the given channel layout mask.
 * The int return values are presumably 0 or a negative error code. Confirm
 * all of this against the definitions.
 */
356 int ff_mov_read_esds(AVFormatContext *fc, AVIOContext *pb);
358 int ff_mov_read_stsd_entries(MOVContext *c, AVIOContext *pb, int entries);
359 void ff_mov_write_chan(AVIOContext *pb, int64_t channel_layout);
/*
 * Mode selectors with the values -1, 1 and 2 (mutually exclusive values, not
 * combinable bit flags).
 * NOTE(review): presumably these choose how 'mfra' timestamps are interpreted
 * (automatic, as DTS, as PTS) -- confirm at the point of use.
 */
361 #define FF_MOV_FLAG_MFRA_AUTO -1
362 #define FF_MOV_FLAG_MFRA_DTS 1
363 #define FF_MOV_FLAG_MFRA_PTS 2
366 * Compute codec id for 'lpcm' tag.
367 * See CoreAudioTypes and AudioStreamBasicDescription at Apple.
369 static inline enum AVCodecID ff_mov_get_lpcm_codec_id(int bps, int flags)
376 return ff_get_pcm_codec_id(bps, flags & 1, flags & 2, flags & 4 ? -1 : 0);
379 #endif /* AVFORMAT_ISOM_H */