git.sesse.net Git - ffmpeg/blob - libavformat/mov.c

   1 /*
   2  * MOV demuxer
   3  * Copyright (c) 2001 Fabrice Bellard
   4  * Copyright (c) 2009 Baptiste Coudurier <baptiste dot coudurier at gmail dot com>
   5  *
   6  * This file is part of Libav.
   7  *
   8  * Libav is free software; you can redistribute it and/or
   9  * modify it under the terms of the GNU Lesser General Public
  10  * License as published by the Free Software Foundation; either
  11  * version 2.1 of the License, or (at your option) any later version.
  12  *
  13  * Libav is distributed in the hope that it will be useful,
  14  * but WITHOUT ANY WARRANTY; without even the implied warranty of
  15  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
  16  * Lesser General Public License for more details.
  17  *
  18  * You should have received a copy of the GNU Lesser General Public
  19  * License along with Libav; if not, write to the Free Software
  20  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  21  */
  22
  23 #include <limits.h>
  24
  25 //#define DEBUG
  26 //#define MOV_EXPORT_ALL_METADATA
  27
  28 #include "libavutil/intreadwrite.h"
  29 #include "libavutil/intfloat_readwrite.h"
  30 #include "libavutil/mathematics.h"
  31 #include "libavutil/avstring.h"
  32 #include "libavutil/dict.h"
  33 #include "avformat.h"
  34 #include "avio_internal.h"
  35 #include "riff.h"
  36 #include "isom.h"
  37 #include "libavcodec/get_bits.h"
  38 #include "id3v1.h"
  39
  40 #if CONFIG_ZLIB
  41 #include <zlib.h>
  42 #endif
  43
  44 /*
  45  * First version by Francois Revol revol@free.fr
  46  * Seek function by Gael Chardon gael.dev@4now.net
  47  *
  48  * Features and limitations:
  49  * - reads most of the QT files I have (at least the structure),
  50  *   Sample QuickTime files with mp3 audio can be found at: http://www.3ivx.com/showcase.html
  51  * - the code is quite ugly... maybe I won't do it recursive next time :-)
  52  *
  53  * Funny I didn't know about http://sourceforge.net/projects/qt-ffmpeg/
  54  * when coding this :) (it's a writer anyway)
  55  *
  56  * Reference documents:
  57  * http://www.geocities.com/xhelmboyx/quicktime/formats/qtm-layout.txt
  58  * Apple:
  59  *  http://developer.apple.com/documentation/QuickTime/QTFF/
  60  *  http://developer.apple.com/documentation/QuickTime/QTFF/qtff.pdf
  61  * QuickTime is a trademark of Apple (AFAIK :))
  62  */
  63
  64 #include "qtpalette.h"
  65
  66
  67 #undef NDEBUG
  68 #include <assert.h>
  69
  70 /* XXX: it's the first time I make a recursive parser I think... sorry if it's ugly :P */
  71
  72 /* those functions parse an atom */
  73 /* return code:
  74   0: continue to parse next atom
  75  <0: error occurred, exit
  76 */
/* links atom IDs to parse functions */
typedef struct MOVParseTableEntry {
    uint32_t type; /* atom type tag this entry matches */
    int (*parse)(MOVContext *ctx, AVIOContext *pb, MOVAtom atom); /* handler called for that atom */
} MOVParseTableEntry;

/* Forward declaration of the dispatch table. mov_read_default() scans it
 * until it reaches an entry whose type is zero. */
static const MOVParseTableEntry mov_default_parse_table[];
  84
  85 static int mov_metadata_track_or_disc_number(MOVContext *c, AVIOContext *pb,
  86                                              unsigned len, const char *key)
  87 {
  88     char buf[16];
  89
  90     short current, total;
  91     avio_rb16(pb); // unknown
  92     current = avio_rb16(pb);
  93     total = avio_rb16(pb);
  94     if (!total)
  95         snprintf(buf, sizeof(buf), "%d", current);
  96     else
  97         snprintf(buf, sizeof(buf), "%d/%d", current, total);
  98     av_dict_set(&c->fc->metadata, key, buf, 0);
  99
 100     return 0;
 101 }
 102
 103 static int mov_metadata_int8_bypass_padding(MOVContext *c, AVIOContext *pb,
 104                                             unsigned len, const char *key)
 105 {
 106     char buf[16];
 107
 108     /* bypass padding bytes */
 109     avio_r8(pb);
 110     avio_r8(pb);
 111     avio_r8(pb);
 112
 113     snprintf(buf, sizeof(buf), "%hu", avio_r8(pb));
 114     av_dict_set(&c->fc->metadata, key, buf, 0);
 115
 116     return 0;
 117 }
 118
 119 static int mov_metadata_stik(MOVContext *c, AVIOContext *pb,
 120                              unsigned len, const char *key)
 121 {
 122   char buf[16];
 123
 124   snprintf(buf, sizeof(buf), "%hu", avio_r8(pb));
 125   av_dict_set(&c->fc->metadata, key, buf, 0);
 126
 127   return 0;
 128 }
 129
 130 static int mov_metadata_gnre(MOVContext *c, AVIOContext *pb,
 131                              unsigned len, const char *key)
 132 {
 133     short genre;
 134     char buf[20];
 135
 136     avio_r8(pb); // unknown
 137
 138     genre = avio_r8(pb);
 139     if (genre < 1 || genre > ID3v1_GENRE_MAX)
 140         return 0;
 141     snprintf(buf, sizeof(buf), "%s", ff_id3v1_genre_str[genre-1]);
 142     av_dict_set(&c->fc->metadata, key, buf, 0);
 143
 144     return 0;
 145 }
 146
/* Unicode code points for the byte values 0x80..0xFF of Mac-encoded strings.
 * mov_read_mac_string() indexes this table with (byte - 0x80). */
static const uint32_t mac_to_unicode[128] = {
    0x00C4,0x00C5,0x00C7,0x00C9,0x00D1,0x00D6,0x00DC,0x00E1,
    0x00E0,0x00E2,0x00E4,0x00E3,0x00E5,0x00E7,0x00E9,0x00E8,
    0x00EA,0x00EB,0x00ED,0x00EC,0x00EE,0x00EF,0x00F1,0x00F3,
    0x00F2,0x00F4,0x00F6,0x00F5,0x00FA,0x00F9,0x00FB,0x00FC,
    0x2020,0x00B0,0x00A2,0x00A3,0x00A7,0x2022,0x00B6,0x00DF,
    0x00AE,0x00A9,0x2122,0x00B4,0x00A8,0x2260,0x00C6,0x00D8,
    0x221E,0x00B1,0x2264,0x2265,0x00A5,0x00B5,0x2202,0x2211,
    0x220F,0x03C0,0x222B,0x00AA,0x00BA,0x03A9,0x00E6,0x00F8,
    0x00BF,0x00A1,0x00AC,0x221A,0x0192,0x2248,0x2206,0x00AB,
    0x00BB,0x2026,0x00A0,0x00C0,0x00C3,0x00D5,0x0152,0x0153,
    0x2013,0x2014,0x201C,0x201D,0x2018,0x2019,0x00F7,0x25CA,
    0x00FF,0x0178,0x2044,0x20AC,0x2039,0x203A,0xFB01,0xFB02,
    0x2021,0x00B7,0x201A,0x201E,0x2030,0x00C2,0x00CA,0x00C1,
    0x00CB,0x00C8,0x00CD,0x00CE,0x00CF,0x00CC,0x00D3,0x00D4,
    0xF8FF,0x00D2,0x00DA,0x00DB,0x00D9,0x0131,0x02C6,0x02DC,
    0x00AF,0x02D8,0x02D9,0x02DA,0x00B8,0x02DD,0x02DB,0x02C7,
};
 165
 166 static int mov_read_mac_string(MOVContext *c, AVIOContext *pb, int len,
 167                                char *dst, int dstlen)
 168 {
 169     char *p = dst;
 170     char *end = dst+dstlen-1;
 171     int i;
 172
 173     for (i = 0; i < len; i++) {
 174         uint8_t t, c = avio_r8(pb);
 175         if (c < 0x80 && p < end)
 176             *p++ = c;
 177         else
 178             PUT_UTF8(mac_to_unicode[c-0x80], t, if (p < end) *p++ = t;);
 179     }
 180     *p = 0;
 181     return p - dst;
 182 }
 183
 184 static int mov_read_udta_string(MOVContext *c, AVIOContext *pb, MOVAtom atom)
 185 {
 186 #ifdef MOV_EXPORT_ALL_METADATA
 187     char tmp_key[5];
 188 #endif
 189     char str[1024], key2[16], language[4] = {0};
 190     const char *key = NULL;
 191     uint16_t str_size, langcode = 0;
 192     uint32_t data_type = 0;
 193     int (*parse)(MOVContext*, AVIOContext*, unsigned, const char*) = NULL;
 194
 195     switch (atom.type) {
 196     case MKTAG(0xa9,'n','a','m'): key = "title";     break;
 197     case MKTAG(0xa9,'a','u','t'):
 198     case MKTAG(0xa9,'A','R','T'): key = "artist";    break;
 199     case MKTAG( 'a','A','R','T'): key = "album_artist";    break;
 200     case MKTAG(0xa9,'w','r','t'): key = "composer";  break;
 201     case MKTAG( 'c','p','r','t'):
 202     case MKTAG(0xa9,'c','p','y'): key = "copyright"; break;
 203     case MKTAG(0xa9,'c','m','t'):
 204     case MKTAG(0xa9,'i','n','f'): key = "comment";   break;
 205     case MKTAG(0xa9,'a','l','b'): key = "album";     break;
 206     case MKTAG(0xa9,'d','a','y'): key = "date";      break;
 207     case MKTAG(0xa9,'g','e','n'): key = "genre";     break;
 208     case MKTAG( 'g','n','r','e'): key = "genre";
 209         parse = mov_metadata_gnre; break;
 210     case MKTAG(0xa9,'t','o','o'):
 211     case MKTAG(0xa9,'s','w','r'): key = "encoder";   break;
 212     case MKTAG(0xa9,'e','n','c'): key = "encoder";   break;
 213     case MKTAG( 'd','e','s','c'): key = "description";break;
 214     case MKTAG( 'l','d','e','s'): key = "synopsis";  break;
 215     case MKTAG( 't','v','s','h'): key = "show";      break;
 216     case MKTAG( 't','v','e','n'): key = "episode_id";break;
 217     case MKTAG( 't','v','n','n'): key = "network";   break;
 218     case MKTAG( 't','r','k','n'): key = "track";
 219         parse = mov_metadata_track_or_disc_number; break;
 220     case MKTAG( 'd','i','s','k'): key = "disc";
 221         parse = mov_metadata_track_or_disc_number; break;
 222     case MKTAG( 't','v','e','s'): key = "episode_sort";
 223         parse = mov_metadata_int8_bypass_padding; break;
 224     case MKTAG( 't','v','s','n'): key = "season_number";
 225         parse = mov_metadata_int8_bypass_padding; break;
 226     case MKTAG( 's','t','i','k'): key = "media_type";
 227         parse = mov_metadata_stik; break;
 228     }
 229
 230     if (c->itunes_metadata && atom.size > 8) {
 231         int data_size = avio_rb32(pb);
 232         int tag = avio_rl32(pb);
 233         if (tag == MKTAG('d','a','t','a')) {
 234             data_type = avio_rb32(pb); // type
 235             avio_rb32(pb); // unknown
 236             str_size = data_size - 16;
 237             atom.size -= 16;
 238         } else return 0;
 239     } else if (atom.size > 4 && key && !c->itunes_metadata) {
 240         str_size = avio_rb16(pb); // string length
 241         langcode = avio_rb16(pb);
 242         ff_mov_lang_to_iso639(langcode, language);
 243         atom.size -= 4;
 244     } else
 245         str_size = atom.size;
 246
 247 #ifdef MOV_EXPORT_ALL_METADATA
 248     if (!key) {
 249         snprintf(tmp_key, 5, "%.4s", (char*)&atom.type);
 250         key = tmp_key;
 251     }
 252 #endif
 253
 254     if (!key)
 255         return 0;
 256     if (atom.size < 0)
 257         return -1;
 258
 259     str_size = FFMIN3(sizeof(str)-1, str_size, atom.size);
 260
 261     if (parse)
 262         parse(c, pb, str_size, key);
 263     else {
 264         if (data_type == 3 || (data_type == 0 && langcode < 0x800)) { // MAC Encoded
 265             mov_read_mac_string(c, pb, str_size, str, sizeof(str));
 266         } else {
 267             avio_read(pb, str, str_size);
 268             str[str_size] = 0;
 269         }
 270         av_dict_set(&c->fc->metadata, key, str, 0);
 271         if (*language && strcmp(language, "und")) {
 272             snprintf(key2, sizeof(key2), "%s-%s", key, language);
 273             av_dict_set(&c->fc->metadata, key2, str, 0);
 274         }
 275     }
 276     av_dlog(c->fc, "lang \"%3s\" ", language);
 277     av_dlog(c->fc, "tag \"%s\" value \"%s\" atom \"%.4s\" %d %"PRId64"\n",
 278             key, str, (char*)&atom.type, str_size, atom.size);
 279
 280     return 0;
 281 }
 282
 283 static int mov_read_chpl(MOVContext *c, AVIOContext *pb, MOVAtom atom)
 284 {
 285     int64_t start;
 286     int i, nb_chapters, str_len, version;
 287     char str[256+1];
 288
 289     if ((atom.size -= 5) < 0)
 290         return 0;
 291
 292     version = avio_r8(pb);
 293     avio_rb24(pb);
 294     if (version)
 295         avio_rb32(pb); // ???
 296     nb_chapters = avio_r8(pb);
 297
 298     for (i = 0; i < nb_chapters; i++) {
 299         if (atom.size < 9)
 300             return 0;
 301
 302         start = avio_rb64(pb);
 303         str_len = avio_r8(pb);
 304
 305         if ((atom.size -= 9+str_len) < 0)
 306             return 0;
 307
 308         avio_read(pb, str, str_len);
 309         str[str_len] = 0;
 310         avpriv_new_chapter(c->fc, i, (AVRational){1,10000000}, start, AV_NOPTS_VALUE, str);
 311     }
 312     return 0;
 313 }
 314
/**
 * Walk the child atoms of a container atom and dispatch each one to its
 * parse function.
 *
 * For every child the header is read, the handler is looked up in
 * mov_default_parse_table (children of 'udta' and 'ilst' without a handler
 * fall back to mov_read_udta_string), and children without any handler are
 * skipped.
 *
 * @param atom the container; a negative size is treated as INT64_MAX
 * @return 0 on success, or the negative error code returned by a handler
 */
static int mov_read_default(MOVContext *c, AVIOContext *pb, MOVAtom atom)
{
    int64_t total_size = 0; /* bytes of the container accounted for so far */
    MOVAtom a;
    int i;

    if (atom.size < 0)
        atom.size = INT64_MAX;
    /* continue while there is room for another 8-byte header */
    while (total_size + 8 < atom.size && !pb->eof_reached) {
        int (*parse)(MOVContext*, AVIOContext*, MOVAtom) = NULL;
        a.size = atom.size;
        a.type=0;
        if (atom.size >= 8) {
            /* 32-bit big-endian size followed by the type tag */
            a.size = avio_rb32(pb);
            a.type = avio_rl32(pb);
        }
        av_dlog(c->fc, "type: %08x '%.4s' parent:'%.4s' sz: %"PRId64" %"PRId64" %"PRId64"\n",
                a.type, (char*)&a.type, (char*)&atom.type, a.size, total_size, atom.size);
        total_size += 8;
        if (a.size == 1) { /* 64 bit extended size */
            a.size = avio_rb64(pb) - 8;
            total_size += 8;
        }
        if (a.size == 0) {
            /* size 0: the child takes whatever is left of the container */
            a.size = atom.size - total_size;
            if (a.size <= 8)
                break;
        }
        /* from here on a.size is the payload size, without the header */
        a.size -= 8;
        if (a.size < 0)
            break;
        /* a child may not extend beyond its container */
        a.size = FFMIN(a.size, atom.size - total_size);

        for (i = 0; mov_default_parse_table[i].type; i++)
            if (mov_default_parse_table[i].type == a.type) {
                parse = mov_default_parse_table[i].parse;
                break;
            }

        // container is user data
        if (!parse && (atom.type == MKTAG('u','d','t','a') ||
                       atom.type == MKTAG('i','l','s','t')))
            parse = mov_read_udta_string;

        if (!parse) { /* skip leaf atoms data */
            avio_skip(pb, a.size);
        } else {
            int64_t start_pos = avio_tell(pb);
            int64_t left;
            int err = parse(c, pb, a);
            if (err < 0)
                return err;
            /* stop once both moov and mdat were seen and either the input
             * is not seekable or this child ends exactly at the file end */
            if (c->found_moov && c->found_mdat &&
                (!pb->seekable || start_pos + a.size == avio_size(pb)))
                return 0;
            /* bytes of the payload the handler did not consume */
            left = a.size - avio_tell(pb) + start_pos;
            if (left > 0) /* skip garbage at atom end */
                avio_skip(pb, left);
        }

        total_size += a.size;
    }

    /* skip what remains of the container, but only for small containers */
    if (total_size < atom.size && atom.size < 0x7ffff)
        avio_skip(pb, atom.size - total_size);

    return 0;
}
 383
 384 static int mov_read_dref(MOVContext *c, AVIOContext *pb, MOVAtom atom)
 385 {
 386     AVStream *st;
 387     MOVStreamContext *sc;
 388     int entries, i, j;
 389
 390     if (c->fc->nb_streams < 1)
 391         return 0;
 392     st = c->fc->streams[c->fc->nb_streams-1];
 393     sc = st->priv_data;
 394
 395     avio_rb32(pb); // version + flags
 396     entries = avio_rb32(pb);
 397     if (entries >= UINT_MAX / sizeof(*sc->drefs))
 398         return -1;
 399     sc->drefs = av_mallocz(entries * sizeof(*sc->drefs));
 400     if (!sc->drefs)
 401         return AVERROR(ENOMEM);
 402     sc->drefs_count = entries;
 403
 404     for (i = 0; i < sc->drefs_count; i++) {
 405         MOVDref *dref = &sc->drefs[i];
 406         uint32_t size = avio_rb32(pb);
 407         int64_t next = avio_tell(pb) + size - 4;
 408
 409         if (size < 12)
 410             return -1;
 411
 412         dref->type = avio_rl32(pb);
 413         avio_rb32(pb); // version + flags
 414         av_dlog(c->fc, "type %.4s size %d\n", (char*)&dref->type, size);
 415
 416         if (dref->type == MKTAG('a','l','i','s') && size > 150) {
 417             /* macintosh alias record */
 418             uint16_t volume_len, len;
 419             int16_t type;
 420
 421             avio_skip(pb, 10);
 422
 423             volume_len = avio_r8(pb);
 424             volume_len = FFMIN(volume_len, 27);
 425             avio_read(pb, dref->volume, 27);
 426             dref->volume[volume_len] = 0;
 427             av_log(c->fc, AV_LOG_DEBUG, "volume %s, len %d\n", dref->volume, volume_len);
 428
 429             avio_skip(pb, 12);
 430
 431             len = avio_r8(pb);
 432             len = FFMIN(len, 63);
 433             avio_read(pb, dref->filename, 63);
 434             dref->filename[len] = 0;
 435             av_log(c->fc, AV_LOG_DEBUG, "filename %s, len %d\n", dref->filename, len);
 436
 437             avio_skip(pb, 16);
 438
 439             /* read next level up_from_alias/down_to_target */
 440             dref->nlvl_from = avio_rb16(pb);
 441             dref->nlvl_to   = avio_rb16(pb);
 442             av_log(c->fc, AV_LOG_DEBUG, "nlvl from %d, nlvl to %d\n",
 443                    dref->nlvl_from, dref->nlvl_to);
 444
 445             avio_skip(pb, 16);
 446
 447             for (type = 0; type != -1 && avio_tell(pb) < next; ) {
 448                 type = avio_rb16(pb);
 449                 len = avio_rb16(pb);
 450                 av_log(c->fc, AV_LOG_DEBUG, "type %d, len %d\n", type, len);
 451                 if (len&1)
 452                     len += 1;
 453                 if (type == 2) { // absolute path
 454                     av_free(dref->path);
 455                     dref->path = av_mallocz(len+1);
 456                     if (!dref->path)
 457                         return AVERROR(ENOMEM);
 458                     avio_read(pb, dref->path, len);
 459                     if (len > volume_len && !strncmp(dref->path, dref->volume, volume_len)) {
 460                         len -= volume_len;
 461                         memmove(dref->path, dref->path+volume_len, len);
 462                         dref->path[len] = 0;
 463                     }
 464                     for (j = 0; j < len; j++)
 465                         if (dref->path[j] == ':')
 466                             dref->path[j] = '/';
 467                     av_log(c->fc, AV_LOG_DEBUG, "path %s\n", dref->path);
 468                 } else if (type == 0) { // directory name
 469                     av_free(dref->dir);
 470                     dref->dir = av_malloc(len+1);
 471                     if (!dref->dir)
 472                         return AVERROR(ENOMEM);
 473                     avio_read(pb, dref->dir, len);
 474                     dref->dir[len] = 0;
 475                     for (j = 0; j < len; j++)
 476                         if (dref->dir[j] == ':')
 477                             dref->dir[j] = '/';
 478                     av_log(c->fc, AV_LOG_DEBUG, "dir %s\n", dref->dir);
 479                 } else
 480                     avio_skip(pb, len);
 481             }
 482         }
 483         avio_seek(pb, next, SEEK_SET);
 484     }
 485     return 0;
 486 }
 487
 488 static int mov_read_hdlr(MOVContext *c, AVIOContext *pb, MOVAtom atom)
 489 {
 490     AVStream *st;
 491     uint32_t type;
 492     uint32_t av_unused ctype;
 493
 494     if (c->fc->nb_streams < 1) // meta before first trak
 495         return 0;
 496
 497     st = c->fc->streams[c->fc->nb_streams-1];
 498
 499     avio_r8(pb); /* version */
 500     avio_rb24(pb); /* flags */
 501
 502     /* component type */
 503     ctype = avio_rl32(pb);
 504     type = avio_rl32(pb); /* component subtype */
 505
 506     av_dlog(c->fc, "ctype= %.4s (0x%08x)\n", (char*)&ctype, ctype);
 507     av_dlog(c->fc, "stype= %.4s\n", (char*)&type);
 508
 509     if     (type == MKTAG('v','i','d','e'))
 510         st->codec->codec_type = AVMEDIA_TYPE_VIDEO;
 511     else if (type == MKTAG('s','o','u','n'))
 512         st->codec->codec_type = AVMEDIA_TYPE_AUDIO;
 513     else if (type == MKTAG('m','1','a',' '))
 514         st->codec->codec_id = CODEC_ID_MP2;
 515     else if ((type == MKTAG('s','u','b','p')) || (type == MKTAG('c','l','c','p')))
 516         st->codec->codec_type = AVMEDIA_TYPE_SUBTITLE;
 517
 518     avio_rb32(pb); /* component  manufacture */
 519     avio_rb32(pb); /* component flags */
 520     avio_rb32(pb); /* component flags mask */
 521
 522     return 0;
 523 }
 524
 525 int ff_mov_read_esds(AVFormatContext *fc, AVIOContext *pb, MOVAtom atom)
 526 {
 527     AVStream *st;
 528     int tag;
 529
 530     if (fc->nb_streams < 1)
 531         return 0;
 532     st = fc->streams[fc->nb_streams-1];
 533
 534     avio_rb32(pb); /* version + flags */
 535     ff_mp4_read_descr(fc, pb, &tag);
 536     if (tag == MP4ESDescrTag) {
 537         ff_mp4_parse_es_descr(pb, NULL);
 538     } else
 539         avio_rb16(pb); /* ID */
 540
 541     ff_mp4_read_descr(fc, pb, &tag);
 542     if (tag == MP4DecConfigDescrTag)
 543         ff_mp4_read_dec_config_descr(fc, st, pb);
 544     return 0;
 545 }
 546
/**
 * Parse-table adapter for 'esds' atoms: forwards to ff_mov_read_esds() with
 * the format context taken from the demuxer context.
 *
 * @return the value returned by ff_mov_read_esds()
 */
static int mov_read_esds(MOVContext *c, AVIOContext *pb, MOVAtom atom)
{
    return ff_mov_read_esds(c->fc, pb, atom);
}
 551
 552 static int mov_read_dac3(MOVContext *c, AVIOContext *pb, MOVAtom atom)
 553 {
 554     AVStream *st;
 555     int ac3info, acmod, lfeon, bsmod;
 556
 557     if (c->fc->nb_streams < 1)
 558         return 0;
 559     st = c->fc->streams[c->fc->nb_streams-1];
 560
 561     ac3info = avio_rb24(pb);
 562     bsmod = (ac3info >> 14) & 0x7;
 563     acmod = (ac3info >> 11) & 0x7;
 564     lfeon = (ac3info >> 10) & 0x1;
 565     st->codec->channels = ((int[]){2,1,2,3,3,4,4,5})[acmod] + lfeon;
 566     st->codec->audio_service_type = bsmod;
 567     if (st->codec->channels > 1 && bsmod == 0x7)
 568         st->codec->audio_service_type = AV_AUDIO_SERVICE_TYPE_KARAOKE;
 569
 570     return 0;
 571 }
 572
 573 static int mov_read_wfex(MOVContext *c, AVIOContext *pb, MOVAtom atom)
 574 {
 575     AVStream *st;
 576
 577     if (c->fc->nb_streams < 1)
 578         return 0;
 579     st = c->fc->streams[c->fc->nb_streams-1];
 580
 581     ff_get_wav_header(pb, st->codec, atom.size);
 582
 583     return 0;
 584 }
 585
 586 static int mov_read_pasp(MOVContext *c, AVIOContext *pb, MOVAtom atom)
 587 {
 588     const int num = avio_rb32(pb);
 589     const int den = avio_rb32(pb);
 590     AVStream *st;
 591
 592     if (c->fc->nb_streams < 1)
 593         return 0;
 594     st = c->fc->streams[c->fc->nb_streams-1];
 595
 596     if ((st->sample_aspect_ratio.den != 1 || st->sample_aspect_ratio.num) && // default
 597         (den != st->sample_aspect_ratio.den || num != st->sample_aspect_ratio.num)) {
 598         av_log(c->fc, AV_LOG_WARNING,
 599                "sample aspect ratio already set to %d:%d, ignoring 'pasp' atom (%d:%d)\n",
 600                st->sample_aspect_ratio.num, st->sample_aspect_ratio.den,
 601                num, den);
 602     } else if (den != 0) {
 603         st->sample_aspect_ratio.num = num;
 604         st->sample_aspect_ratio.den = den;
 605     }
 606     return 0;
 607 }
 608
 609 /* this atom contains actual media data */
 610 static int mov_read_mdat(MOVContext *c, AVIOContext *pb, MOVAtom atom)
 611 {
 612     if (atom.size == 0) /* wrong one (MP4) */
 613         return 0;
 614     c->found_mdat=1;
 615     return 0; /* now go for moov */
 616 }
 617
 618 /* read major brand, minor version and compatible brands and store them as metadata */
 619 static int mov_read_ftyp(MOVContext *c, AVIOContext *pb, MOVAtom atom)
 620 {
 621     uint32_t minor_ver;
 622     int comp_brand_size;
 623     char minor_ver_str[11]; /* 32 bit integer -> 10 digits + null */
 624     char* comp_brands_str;
 625     uint8_t type[5] = {0};
 626
 627     avio_read(pb, type, 4);
 628     if (strcmp(type, "qt  "))
 629         c->isom = 1;
 630     av_log(c->fc, AV_LOG_DEBUG, "ISO: File Type Major Brand: %.4s\n",(char *)&type);
 631     av_dict_set(&c->fc->metadata, "major_brand", type, 0);
 632     minor_ver = avio_rb32(pb); /* minor version */
 633     snprintf(minor_ver_str, sizeof(minor_ver_str), "%d", minor_ver);
 634     av_dict_set(&c->fc->metadata, "minor_version", minor_ver_str, 0);
 635
 636     comp_brand_size = atom.size - 8;
 637     if (comp_brand_size < 0)
 638         return -1;
 639     comp_brands_str = av_malloc(comp_brand_size + 1); /* Add null terminator */
 640     if (!comp_brands_str)
 641         return AVERROR(ENOMEM);
 642     avio_read(pb, comp_brands_str, comp_brand_size);
 643     comp_brands_str[comp_brand_size] = 0;
 644     av_dict_set(&c->fc->metadata, "compatible_brands", comp_brands_str, 0);
 645     av_freep(&comp_brands_str);
 646
 647     return 0;
 648 }
 649
 650 /* this atom should contain all header atoms */
 651 static int mov_read_moov(MOVContext *c, AVIOContext *pb, MOVAtom atom)
 652 {
 653     if (mov_read_default(c, pb, atom) < 0)
 654         return -1;
 655     /* we parsed the 'moov' atom, we can terminate the parsing as soon as we find the 'mdat' */
 656     /* so we don't parse the whole file if over a network */
 657     c->found_moov=1;
 658     return 0; /* now go for mdat */
 659 }
 660
 661 static int mov_read_moof(MOVContext *c, AVIOContext *pb, MOVAtom atom)
 662 {
 663     c->fragment.moof_offset = avio_tell(pb) - 8;
 664     av_dlog(c->fc, "moof offset %"PRIx64"\n", c->fragment.moof_offset);
 665     return mov_read_default(c, pb, atom);
 666 }
 667
 668 static void mov_metadata_creation_time(AVDictionary **metadata, time_t time)
 669 {
 670     char buffer[32];
 671     if (time) {
 672         struct tm *ptm;
 673         time -= 2082844800;  /* seconds between 1904-01-01 and Epoch */
 674         ptm = gmtime(&time);
 675         if (!ptm) return;
 676         strftime(buffer, sizeof(buffer), "%Y-%m-%d %H:%M:%S", ptm);
 677         av_dict_set(metadata, "creation_time", buffer, 0);
 678     }
 679 }
 680
 681 static int mov_read_mdhd(MOVContext *c, AVIOContext *pb, MOVAtom atom)
 682 {
 683     AVStream *st;
 684     MOVStreamContext *sc;
 685     int version;
 686     char language[4] = {0};
 687     unsigned lang;
 688     time_t creation_time;
 689
 690     if (c->fc->nb_streams < 1)
 691         return 0;
 692     st = c->fc->streams[c->fc->nb_streams-1];
 693     sc = st->priv_data;
 694
 695     version = avio_r8(pb);
 696     if (version > 1)
 697         return -1; /* unsupported */
 698
 699     avio_rb24(pb); /* flags */
 700     if (version == 1) {
 701         creation_time = avio_rb64(pb);
 702         avio_rb64(pb);
 703     } else {
 704         creation_time = avio_rb32(pb);
 705         avio_rb32(pb); /* modification time */
 706     }
 707     mov_metadata_creation_time(&st->metadata, creation_time);
 708
 709     sc->time_scale = avio_rb32(pb);
 710     st->duration = (version == 1) ? avio_rb64(pb) : avio_rb32(pb); /* duration */
 711
 712     lang = avio_rb16(pb); /* language */
 713     if (ff_mov_lang_to_iso639(lang, language))
 714         av_dict_set(&st->metadata, "language", language, 0);
 715     avio_rb16(pb); /* quality */
 716
 717     return 0;
 718 }
 719
 720 static int mov_read_mvhd(MOVContext *c, AVIOContext *pb, MOVAtom atom)
 721 {
 722     time_t creation_time;
 723     int version = avio_r8(pb); /* version */
 724     avio_rb24(pb); /* flags */
 725
 726     if (version == 1) {
 727         creation_time = avio_rb64(pb);
 728         avio_rb64(pb);
 729     } else {
 730         creation_time = avio_rb32(pb);
 731         avio_rb32(pb); /* modification time */
 732     }
 733     mov_metadata_creation_time(&c->fc->metadata, creation_time);
 734     c->time_scale = avio_rb32(pb); /* time scale */
 735
 736     av_dlog(c->fc, "time scale = %i\n", c->time_scale);
 737
 738     c->duration = (version == 1) ? avio_rb64(pb) : avio_rb32(pb); /* duration */
 739     avio_rb32(pb); /* preferred scale */
 740
 741     avio_rb16(pb); /* preferred volume */
 742
 743     avio_skip(pb, 10); /* reserved */
 744
 745     avio_skip(pb, 36); /* display matrix */
 746
 747     avio_rb32(pb); /* preview time */
 748     avio_rb32(pb); /* preview duration */
 749     avio_rb32(pb); /* poster time */
 750     avio_rb32(pb); /* selection time */
 751     avio_rb32(pb); /* selection duration */
 752     avio_rb32(pb); /* current time */
 753     avio_rb32(pb); /* next track ID */
 754
 755     return 0;
 756 }
 757
 758 static int mov_read_smi(MOVContext *c, AVIOContext *pb, MOVAtom atom)
 759 {
 760     AVStream *st;
 761
 762     if (c->fc->nb_streams < 1)
 763         return 0;
 764     st = c->fc->streams[c->fc->nb_streams-1];
 765
 766     if ((uint64_t)atom.size > (1<<30))
 767         return -1;
 768
 769     // currently SVQ3 decoder expect full STSD header - so let's fake it
 770     // this should be fixed and just SMI header should be passed
 771     av_free(st->codec->extradata);
 772     st->codec->extradata = av_mallocz(atom.size + 0x5a + FF_INPUT_BUFFER_PADDING_SIZE);
 773     if (!st->codec->extradata)
 774         return AVERROR(ENOMEM);
 775     st->codec->extradata_size = 0x5a + atom.size;
 776     memcpy(st->codec->extradata, "SVQ3", 4); // fake
 777     avio_read(pb, st->codec->extradata + 0x5a, atom.size);
 778     av_dlog(c->fc, "Reading SMI %"PRId64"  %s\n", atom.size, st->codec->extradata + 0x5a);
 779     return 0;
 780 }
 781
 782 static int mov_read_enda(MOVContext *c, AVIOContext *pb, MOVAtom atom)
 783 {
 784     AVStream *st;
 785     int little_endian;
 786
 787     if (c->fc->nb_streams < 1)
 788         return 0;
 789     st = c->fc->streams[c->fc->nb_streams-1];
 790
 791     little_endian = avio_rb16(pb);
 792     av_dlog(c->fc, "enda %d\n", little_endian);
 793     if (little_endian == 1) {
 794         switch (st->codec->codec_id) {
 795         case CODEC_ID_PCM_S24BE:
 796             st->codec->codec_id = CODEC_ID_PCM_S24LE;
 797             break;
 798         case CODEC_ID_PCM_S32BE:
 799             st->codec->codec_id = CODEC_ID_PCM_S32LE;
 800             break;
 801         case CODEC_ID_PCM_F32BE:
 802             st->codec->codec_id = CODEC_ID_PCM_F32LE;
 803             break;
 804         case CODEC_ID_PCM_F64BE:
 805             st->codec->codec_id = CODEC_ID_PCM_F64LE;
 806             break;
 807         default:
 808             break;
 809         }
 810     }
 811     return 0;
 812 }
 813
 814 /* FIXME modify qdm2/svq3/h264 decoders to take full atom as extradata */
 815 static int mov_read_extradata(MOVContext *c, AVIOContext *pb, MOVAtom atom)
 816 {
 817     AVStream *st;
 818     uint64_t size;
 819     uint8_t *buf;
 820
 821     if (c->fc->nb_streams < 1) // will happen with jp2 files
 822         return 0;
 823     st= c->fc->streams[c->fc->nb_streams-1];
 824     size= (uint64_t)st->codec->extradata_size + atom.size + 8 + FF_INPUT_BUFFER_PADDING_SIZE;
 825     if (size > INT_MAX || (uint64_t)atom.size > INT_MAX)
 826         return -1;
 827     buf= av_realloc(st->codec->extradata, size);
 828     if (!buf)
 829         return -1;
 830     st->codec->extradata= buf;
 831     buf+= st->codec->extradata_size;
 832     st->codec->extradata_size= size - FF_INPUT_BUFFER_PADDING_SIZE;
 833     AV_WB32(       buf    , atom.size + 8);
 834     AV_WL32(       buf + 4, atom.type);
 835     avio_read(pb, buf + 8, atom.size);
 836     return 0;
 837 }
 838
 839 static int mov_read_wave(MOVContext *c, AVIOContext *pb, MOVAtom atom)
 840 {
 841     AVStream *st;
 842
 843     if (c->fc->nb_streams < 1)
 844         return 0;
 845     st = c->fc->streams[c->fc->nb_streams-1];
 846
 847     if ((uint64_t)atom.size > (1<<30))
 848         return -1;
 849
 850     if (st->codec->codec_id == CODEC_ID_QDM2 || st->codec->codec_id == CODEC_ID_QDMC) {
 851         // pass all frma atom to codec, needed at least for QDMC and QDM2
 852         av_free(st->codec->extradata);
 853         st->codec->extradata = av_mallocz(atom.size + FF_INPUT_BUFFER_PADDING_SIZE);
 854         if (!st->codec->extradata)
 855             return AVERROR(ENOMEM);
 856         st->codec->extradata_size = atom.size;
 857         avio_read(pb, st->codec->extradata, atom.size);
 858     } else if (atom.size > 8) { /* to read frma, esds atoms */
 859         if (mov_read_default(c, pb, atom) < 0)
 860             return -1;
 861     } else
 862         avio_skip(pb, atom.size);
 863     return 0;
 864 }
 865
 866 /**
 867  * This function reads atom content and puts data in extradata without tag
 868  * nor size unlike mov_read_extradata.
 869  */
 870 static int mov_read_glbl(MOVContext *c, AVIOContext *pb, MOVAtom atom)
 871 {
 872     AVStream *st;
 873
 874     if (c->fc->nb_streams < 1)
 875         return 0;
 876     st = c->fc->streams[c->fc->nb_streams-1];
 877
 878     if ((uint64_t)atom.size > (1<<30))
 879         return -1;
 880
 881     av_free(st->codec->extradata);
 882     st->codec->extradata = av_mallocz(atom.size + FF_INPUT_BUFFER_PADDING_SIZE);
 883     if (!st->codec->extradata)
 884         return AVERROR(ENOMEM);
 885     st->codec->extradata_size = atom.size;
 886     avio_read(pb, st->codec->extradata, atom.size);
 887     return 0;
 888 }
 889
 890 /**
 891  * An strf atom is a BITMAPINFOHEADER struct. This struct is 40 bytes itself,
 892  * but can have extradata appended at the end after the 40 bytes belonging
 893  * to the struct.
 894  */
 895 static int mov_read_strf(MOVContext *c, AVIOContext *pb, MOVAtom atom)
 896 {
 897     AVStream *st;
 898
 899     if (c->fc->nb_streams < 1)
 900         return 0;
 901     if (atom.size <= 40)
 902         return 0;
 903     st = c->fc->streams[c->fc->nb_streams-1];
 904
 905     if ((uint64_t)atom.size > (1<<30))
 906         return -1;
 907
 908     av_free(st->codec->extradata);
 909     st->codec->extradata = av_mallocz(atom.size - 40 + FF_INPUT_BUFFER_PADDING_SIZE);
 910     if (!st->codec->extradata)
 911         return AVERROR(ENOMEM);
 912     st->codec->extradata_size = atom.size - 40;
 913     avio_skip(pb, 40);
 914     avio_read(pb, st->codec->extradata, atom.size - 40);
 915     return 0;
 916 }
 917
 918 static int mov_read_stco(MOVContext *c, AVIOContext *pb, MOVAtom atom)
 919 {
 920     AVStream *st;
 921     MOVStreamContext *sc;
 922     unsigned int i, entries;
 923
 924     if (c->fc->nb_streams < 1)
 925         return 0;
 926     st = c->fc->streams[c->fc->nb_streams-1];
 927     sc = st->priv_data;
 928
 929     avio_r8(pb); /* version */
 930     avio_rb24(pb); /* flags */
 931
 932     entries = avio_rb32(pb);
 933
 934     if (entries >= UINT_MAX/sizeof(int64_t))
 935         return -1;
 936
 937     sc->chunk_offsets = av_malloc(entries * sizeof(int64_t));
 938     if (!sc->chunk_offsets)
 939         return AVERROR(ENOMEM);
 940     sc->chunk_count = entries;
 941
 942     if      (atom.type == MKTAG('s','t','c','o'))
 943         for (i=0; i<entries; i++)
 944             sc->chunk_offsets[i] = avio_rb32(pb);
 945     else if (atom.type == MKTAG('c','o','6','4'))
 946         for (i=0; i<entries; i++)
 947             sc->chunk_offsets[i] = avio_rb64(pb);
 948     else
 949         return -1;
 950
 951     return 0;
 952 }
 953
 954 /**
 955  * Compute codec id for 'lpcm' tag.
 956  * See CoreAudioTypes and AudioStreamBasicDescription at Apple.
 957  */
 958 enum CodecID ff_mov_get_lpcm_codec_id(int bps, int flags)
 959 {
 960     if (flags & 1) { // floating point
 961         if (flags & 2) { // big endian
 962             if      (bps == 32) return CODEC_ID_PCM_F32BE;
 963             else if (bps == 64) return CODEC_ID_PCM_F64BE;
 964         } else {
 965             if      (bps == 32) return CODEC_ID_PCM_F32LE;
 966             else if (bps == 64) return CODEC_ID_PCM_F64LE;
 967         }
 968     } else {
 969         if (flags & 2) {
 970             if      (bps == 8)
 971                 // signed integer
 972                 if (flags & 4)  return CODEC_ID_PCM_S8;
 973                 else            return CODEC_ID_PCM_U8;
 974             else if (bps == 16) return CODEC_ID_PCM_S16BE;
 975             else if (bps == 24) return CODEC_ID_PCM_S24BE;
 976             else if (bps == 32) return CODEC_ID_PCM_S32BE;
 977         } else {
 978             if      (bps == 8)
 979                 if (flags & 4)  return CODEC_ID_PCM_S8;
 980                 else            return CODEC_ID_PCM_U8;
 981             else if (bps == 16) return CODEC_ID_PCM_S16LE;
 982             else if (bps == 24) return CODEC_ID_PCM_S24LE;
 983             else if (bps == 32) return CODEC_ID_PCM_S32LE;
 984         }
 985     }
 986     return CODEC_ID_NONE;
 987 }
 988
 989 int ff_mov_read_stsd_entries(MOVContext *c, AVIOContext *pb, int entries)
 990 {
 991     AVStream *st;
 992     MOVStreamContext *sc;
 993     int j, pseudo_stream_id;
 994
 995     if (c->fc->nb_streams < 1)
 996         return 0;
 997     st = c->fc->streams[c->fc->nb_streams-1];
 998     sc = st->priv_data;
 999
1000     for (pseudo_stream_id=0; pseudo_stream_id<entries; pseudo_stream_id++) {
1001         //Parsing Sample description table
1002         enum CodecID id;
1003         int dref_id = 1;
1004         MOVAtom a = { AV_RL32("stsd") };
1005         int64_t start_pos = avio_tell(pb);
1006         int size = avio_rb32(pb); /* size */
1007         uint32_t format = avio_rl32(pb); /* data format */
1008
1009         if (size >= 16) {
1010             avio_rb32(pb); /* reserved */
1011             avio_rb16(pb); /* reserved */
1012             dref_id = avio_rb16(pb);
1013         }
1014
1015         if (st->codec->codec_tag &&
1016             st->codec->codec_tag != format &&
1017             (c->fc->video_codec_id ? ff_codec_get_id(codec_movvideo_tags, format) != c->fc->video_codec_id
1018                                    : st->codec->codec_tag != MKTAG('j','p','e','g'))
1019            ){
1020             /* Multiple fourcc, we skip JPEG. This is not correct, we should
1021              * export it as a separate AVStream but this needs a few changes
1022              * in the MOV demuxer, patch welcome. */
1023         multiple_stsd:
1024             av_log(c->fc, AV_LOG_WARNING, "multiple fourcc not supported\n");
1025             avio_skip(pb, size - (avio_tell(pb) - start_pos));
1026             continue;
1027         }
1028         /* we cannot demux concatenated h264 streams because of different extradata */
1029         if (st->codec->codec_tag && st->codec->codec_tag == AV_RL32("avc1"))
1030             goto multiple_stsd;
1031         sc->pseudo_stream_id = st->codec->codec_tag ? -1 : pseudo_stream_id;
1032         sc->dref_id= dref_id;
1033
1034         st->codec->codec_tag = format;
1035         id = ff_codec_get_id(codec_movaudio_tags, format);
1036         if (id<=0 && ((format&0xFFFF) == 'm'+('s'<<8) || (format&0xFFFF) == 'T'+('S'<<8)))
1037             id = ff_codec_get_id(ff_codec_wav_tags, av_bswap32(format)&0xFFFF);
1038
1039         if (st->codec->codec_type != AVMEDIA_TYPE_VIDEO && id > 0) {
1040             st->codec->codec_type = AVMEDIA_TYPE_AUDIO;
1041         } else if (st->codec->codec_type != AVMEDIA_TYPE_AUDIO && /* do not overwrite codec type */
1042                    format && format != MKTAG('m','p','4','s')) { /* skip old asf mpeg4 tag */
1043             id = ff_codec_get_id(codec_movvideo_tags, format);
1044             if (id <= 0)
1045                 id = ff_codec_get_id(ff_codec_bmp_tags, format);
1046             if (id > 0)
1047                 st->codec->codec_type = AVMEDIA_TYPE_VIDEO;
1048             else if (st->codec->codec_type == AVMEDIA_TYPE_DATA){
1049                 id = ff_codec_get_id(ff_codec_movsubtitle_tags, format);
1050                 if (id > 0)
1051                     st->codec->codec_type = AVMEDIA_TYPE_SUBTITLE;
1052             }
1053         }
1054
1055         av_dlog(c->fc, "size=%d 4CC= %c%c%c%c codec_type=%d\n", size,
1056                 (format >> 0) & 0xff, (format >> 8) & 0xff, (format >> 16) & 0xff,
1057                 (format >> 24) & 0xff, st->codec->codec_type);
1058
1059         if (st->codec->codec_type==AVMEDIA_TYPE_VIDEO) {
1060             unsigned int color_depth, len;
1061             int color_greyscale;
1062
1063             st->codec->codec_id = id;
1064             avio_rb16(pb); /* version */
1065             avio_rb16(pb); /* revision level */
1066             avio_rb32(pb); /* vendor */
1067             avio_rb32(pb); /* temporal quality */
1068             avio_rb32(pb); /* spatial quality */
1069
1070             st->codec->width = avio_rb16(pb); /* width */
1071             st->codec->height = avio_rb16(pb); /* height */
1072
1073             avio_rb32(pb); /* horiz resolution */
1074             avio_rb32(pb); /* vert resolution */
1075             avio_rb32(pb); /* data size, always 0 */
1076             avio_rb16(pb); /* frames per samples */
1077
1078             len = avio_r8(pb); /* codec name, pascal string */
1079             if (len > 31)
1080                 len = 31;
1081             mov_read_mac_string(c, pb, len, st->codec->codec_name, 32);
1082             if (len < 31)
1083                 avio_skip(pb, 31 - len);
1084             /* codec_tag YV12 triggers an UV swap in rawdec.c */
1085             if (!memcmp(st->codec->codec_name, "Planar Y'CbCr 8-bit 4:2:0", 25))
1086                 st->codec->codec_tag=MKTAG('I', '4', '2', '0');
1087
1088             st->codec->bits_per_coded_sample = avio_rb16(pb); /* depth */
1089             st->codec->color_table_id = avio_rb16(pb); /* colortable id */
1090             av_dlog(c->fc, "depth %d, ctab id %d\n",
1091                    st->codec->bits_per_coded_sample, st->codec->color_table_id);
1092             /* figure out the palette situation */
1093             color_depth = st->codec->bits_per_coded_sample & 0x1F;
1094             color_greyscale = st->codec->bits_per_coded_sample & 0x20;
1095
1096             /* if the depth is 2, 4, or 8 bpp, file is palettized */
1097             if ((color_depth == 2) || (color_depth == 4) ||
1098                 (color_depth == 8)) {
1099                 /* for palette traversal */
1100                 unsigned int color_start, color_count, color_end;
1101                 unsigned char r, g, b;
1102
1103                 if (color_greyscale) {
1104                     int color_index, color_dec;
1105                     /* compute the greyscale palette */
1106                     st->codec->bits_per_coded_sample = color_depth;
1107                     color_count = 1 << color_depth;
1108                     color_index = 255;
1109                     color_dec = 256 / (color_count - 1);
1110                     for (j = 0; j < color_count; j++) {
1111                         r = g = b = color_index;
1112                         sc->palette[j] =
1113                             (r << 16) | (g << 8) | (b);
1114                         color_index -= color_dec;
1115                         if (color_index < 0)
1116                             color_index = 0;
1117                     }
1118                 } else if (st->codec->color_table_id) {
1119                     const uint8_t *color_table;
1120                     /* if flag bit 3 is set, use the default palette */
1121                     color_count = 1 << color_depth;
1122                     if (color_depth == 2)
1123                         color_table = ff_qt_default_palette_4;
1124                     else if (color_depth == 4)
1125                         color_table = ff_qt_default_palette_16;
1126                     else
1127                         color_table = ff_qt_default_palette_256;
1128
1129                     for (j = 0; j < color_count; j++) {
1130                         r = color_table[j * 3 + 0];
1131                         g = color_table[j * 3 + 1];
1132                         b = color_table[j * 3 + 2];
1133                         sc->palette[j] =
1134                             (r << 16) | (g << 8) | (b);
1135                     }
1136                 } else {
1137                     /* load the palette from the file */
1138                     color_start = avio_rb32(pb);
1139                     color_count = avio_rb16(pb);
1140                     color_end = avio_rb16(pb);
1141                     if ((color_start <= 255) &&
1142                         (color_end <= 255)) {
1143                         for (j = color_start; j <= color_end; j++) {
1144                             /* each R, G, or B component is 16 bits;
1145                              * only use the top 8 bits; skip alpha bytes
1146                              * up front */
1147                             avio_r8(pb);
1148                             avio_r8(pb);
1149                             r = avio_r8(pb);
1150                             avio_r8(pb);
1151                             g = avio_r8(pb);
1152                             avio_r8(pb);
1153                             b = avio_r8(pb);
1154                             avio_r8(pb);
1155                             sc->palette[j] =
1156                                 (r << 16) | (g << 8) | (b);
1157                         }
1158                     }
1159                 }
1160                 sc->has_palette = 1;
1161             }
1162         } else if (st->codec->codec_type==AVMEDIA_TYPE_AUDIO) {
1163             int bits_per_sample, flags;
1164             uint16_t version = avio_rb16(pb);
1165
1166             st->codec->codec_id = id;
1167             avio_rb16(pb); /* revision level */
1168             avio_rb32(pb); /* vendor */
1169
1170             st->codec->channels = avio_rb16(pb);             /* channel count */
1171             av_dlog(c->fc, "audio channels %d\n", st->codec->channels);
1172             st->codec->bits_per_coded_sample = avio_rb16(pb);      /* sample size */
1173
1174             sc->audio_cid = avio_rb16(pb);
1175             avio_rb16(pb); /* packet size = 0 */
1176
1177             st->codec->sample_rate = ((avio_rb32(pb) >> 16));
1178
1179             //Read QT version 1 fields. In version 0 these do not exist.
1180             av_dlog(c->fc, "version =%d, isom =%d\n",version,c->isom);
1181             if (!c->isom) {
1182                 if (version==1) {
1183                     sc->samples_per_frame = avio_rb32(pb);
1184                     avio_rb32(pb); /* bytes per packet */
1185                     sc->bytes_per_frame = avio_rb32(pb);
1186                     avio_rb32(pb); /* bytes per sample */
1187                 } else if (version==2) {
1188                     avio_rb32(pb); /* sizeof struct only */
1189                     st->codec->sample_rate = av_int2dbl(avio_rb64(pb)); /* float 64 */
1190                     st->codec->channels = avio_rb32(pb);
1191                     avio_rb32(pb); /* always 0x7F000000 */
1192                     st->codec->bits_per_coded_sample = avio_rb32(pb); /* bits per channel if sound is uncompressed */
1193                     flags = avio_rb32(pb); /* lpcm format specific flag */
1194                     sc->bytes_per_frame = avio_rb32(pb); /* bytes per audio packet if constant */
1195                     sc->samples_per_frame = avio_rb32(pb); /* lpcm frames per audio packet if constant */
1196                     if (format == MKTAG('l','p','c','m'))
1197                         st->codec->codec_id = ff_mov_get_lpcm_codec_id(st->codec->bits_per_coded_sample, flags);
1198                 }
1199             }
1200
1201             switch (st->codec->codec_id) {
1202             case CODEC_ID_PCM_S8:
1203             case CODEC_ID_PCM_U8:
1204                 if (st->codec->bits_per_coded_sample == 16)
1205                     st->codec->codec_id = CODEC_ID_PCM_S16BE;
1206                 break;
1207             case CODEC_ID_PCM_S16LE:
1208             case CODEC_ID_PCM_S16BE:
1209                 if (st->codec->bits_per_coded_sample == 8)
1210                     st->codec->codec_id = CODEC_ID_PCM_S8;
1211                 else if (st->codec->bits_per_coded_sample == 24)
1212                     st->codec->codec_id =
1213                         st->codec->codec_id == CODEC_ID_PCM_S16BE ?
1214                         CODEC_ID_PCM_S24BE : CODEC_ID_PCM_S24LE;
1215                 break;
1216             /* set values for old format before stsd version 1 appeared */
1217             case CODEC_ID_MACE3:
1218                 sc->samples_per_frame = 6;
1219                 sc->bytes_per_frame = 2*st->codec->channels;
1220                 break;
1221             case CODEC_ID_MACE6:
1222                 sc->samples_per_frame = 6;
1223                 sc->bytes_per_frame = 1*st->codec->channels;
1224                 break;
1225             case CODEC_ID_ADPCM_IMA_QT:
1226                 sc->samples_per_frame = 64;
1227                 sc->bytes_per_frame = 34*st->codec->channels;
1228                 break;
1229             case CODEC_ID_GSM:
1230                 sc->samples_per_frame = 160;
1231                 sc->bytes_per_frame = 33;
1232                 break;
1233             default:
1234                 break;
1235             }
1236
1237             bits_per_sample = av_get_bits_per_sample(st->codec->codec_id);
1238             if (bits_per_sample) {
1239                 st->codec->bits_per_coded_sample = bits_per_sample;
1240                 sc->sample_size = (bits_per_sample >> 3) * st->codec->channels;
1241             }
1242         } else if (st->codec->codec_type==AVMEDIA_TYPE_SUBTITLE){
1243             // ttxt stsd contains display flags, justification, background
1244             // color, fonts, and default styles, so fake an atom to read it
1245             MOVAtom fake_atom = { .size = size - (avio_tell(pb) - start_pos) };
1246             if (format != AV_RL32("mp4s")) // mp4s contains a regular esds atom
1247                 mov_read_glbl(c, pb, fake_atom);
1248             st->codec->codec_id= id;
1249             st->codec->width = sc->width;
1250             st->codec->height = sc->height;
1251         } else {
1252             /* other codec type, just skip (rtp, mp4s, tmcd ...) */
1253             avio_skip(pb, size - (avio_tell(pb) - start_pos));
1254         }
1255         /* this will read extra atoms at the end (wave, alac, damr, avcC, SMI ...) */
1256         a.size = size - (avio_tell(pb) - start_pos);
1257         if (a.size > 8) {
1258             if (mov_read_default(c, pb, a) < 0)
1259                 return -1;
1260         } else if (a.size > 0)
1261             avio_skip(pb, a.size);
1262     }
1263
1264     if (st->codec->codec_type==AVMEDIA_TYPE_AUDIO && st->codec->sample_rate==0 && sc->time_scale>1)
1265         st->codec->sample_rate= sc->time_scale;
1266
1267     /* special codec parameters handling */
1268     switch (st->codec->codec_id) {
1269 #if CONFIG_DV_DEMUXER
1270     case CODEC_ID_DVAUDIO:
1271         c->dv_fctx = avformat_alloc_context();
1272         c->dv_demux = avpriv_dv_init_demux(c->dv_fctx);
1273         if (!c->dv_demux) {
1274             av_log(c->fc, AV_LOG_ERROR, "dv demux context init error\n");
1275             return -1;
1276         }
1277         sc->dv_audio_container = 1;
1278         st->codec->codec_id = CODEC_ID_PCM_S16LE;
1279         break;
1280 #endif
1281     /* no ifdef since parameters are always those */
1282     case CODEC_ID_QCELP:
1283         // force sample rate for qcelp when not stored in mov
1284         if (st->codec->codec_tag != MKTAG('Q','c','l','p'))
1285             st->codec->sample_rate = 8000;
1286         st->codec->frame_size= 160;
1287         st->codec->channels= 1; /* really needed */
1288         break;
1289     case CODEC_ID_AMR_NB:
1290     case CODEC_ID_AMR_WB:
1291         st->codec->frame_size= sc->samples_per_frame;
1292         st->codec->channels= 1; /* really needed */
1293         /* force sample rate for amr, stsd in 3gp does not store sample rate */
1294         if (st->codec->codec_id == CODEC_ID_AMR_NB)
1295             st->codec->sample_rate = 8000;
1296         else if (st->codec->codec_id == CODEC_ID_AMR_WB)
1297             st->codec->sample_rate = 16000;
1298         break;
1299     case CODEC_ID_MP2:
1300     case CODEC_ID_MP3:
1301         st->codec->codec_type = AVMEDIA_TYPE_AUDIO; /* force type after stsd for m1a hdlr */
1302         st->need_parsing = AVSTREAM_PARSE_FULL;
1303         break;
1304     case CODEC_ID_GSM:
1305     case CODEC_ID_ADPCM_MS:
1306     case CODEC_ID_ADPCM_IMA_WAV:
1307         st->codec->frame_size = sc->samples_per_frame;
1308         st->codec->block_align = sc->bytes_per_frame;
1309         break;
1310     case CODEC_ID_ALAC:
1311         if (st->codec->extradata_size == 36) {
1312             st->codec->frame_size = AV_RB32(st->codec->extradata+12);
1313             st->codec->channels   = AV_RB8 (st->codec->extradata+21);
1314             st->codec->sample_rate = AV_RB32(st->codec->extradata+32);
1315         }
1316         break;
1317     default:
1318         break;
1319     }
1320
1321     return 0;
1322 }
1323
1324 static int mov_read_stsd(MOVContext *c, AVIOContext *pb, MOVAtom atom)
1325 {
1326     int entries;
1327
1328     avio_r8(pb); /* version */
1329     avio_rb24(pb); /* flags */
1330     entries = avio_rb32(pb);
1331
1332     return ff_mov_read_stsd_entries(c, pb, entries);
1333 }
1334
1335 static int mov_read_stsc(MOVContext *c, AVIOContext *pb, MOVAtom atom)
1336 {
1337     AVStream *st;
1338     MOVStreamContext *sc;
1339     unsigned int i, entries;
1340
1341     if (c->fc->nb_streams < 1)
1342         return 0;
1343     st = c->fc->streams[c->fc->nb_streams-1];
1344     sc = st->priv_data;
1345
1346     avio_r8(pb); /* version */
1347     avio_rb24(pb); /* flags */
1348
1349     entries = avio_rb32(pb);
1350
1351     av_dlog(c->fc, "track[%i].stsc.entries = %i\n", c->fc->nb_streams-1, entries);
1352
1353     if (entries >= UINT_MAX / sizeof(*sc->stsc_data))
1354         return -1;
1355     sc->stsc_data = av_malloc(entries * sizeof(*sc->stsc_data));
1356     if (!sc->stsc_data)
1357         return AVERROR(ENOMEM);
1358     sc->stsc_count = entries;
1359
1360     for (i=0; i<entries; i++) {
1361         sc->stsc_data[i].first = avio_rb32(pb);
1362         sc->stsc_data[i].count = avio_rb32(pb);
1363         sc->stsc_data[i].id = avio_rb32(pb);
1364     }
1365     return 0;
1366 }
1367
1368 static int mov_read_stps(MOVContext *c, AVIOContext *pb, MOVAtom atom)
1369 {
1370     AVStream *st;
1371     MOVStreamContext *sc;
1372     unsigned i, entries;
1373
1374     if (c->fc->nb_streams < 1)
1375         return 0;
1376     st = c->fc->streams[c->fc->nb_streams-1];
1377     sc = st->priv_data;
1378
1379     avio_rb32(pb); // version + flags
1380
1381     entries = avio_rb32(pb);
1382     if (entries >= UINT_MAX / sizeof(*sc->stps_data))
1383         return -1;
1384     sc->stps_data = av_malloc(entries * sizeof(*sc->stps_data));
1385     if (!sc->stps_data)
1386         return AVERROR(ENOMEM);
1387     sc->stps_count = entries;
1388
1389     for (i = 0; i < entries; i++) {
1390         sc->stps_data[i] = avio_rb32(pb);
1391         //av_dlog(c->fc, "stps %d\n", sc->stps_data[i]);
1392     }
1393
1394     return 0;
1395 }
1396
1397 static int mov_read_stss(MOVContext *c, AVIOContext *pb, MOVAtom atom)
1398 {
1399     AVStream *st;
1400     MOVStreamContext *sc;
1401     unsigned int i, entries;
1402
1403     if (c->fc->nb_streams < 1)
1404         return 0;
1405     st = c->fc->streams[c->fc->nb_streams-1];
1406     sc = st->priv_data;
1407
1408     avio_r8(pb); /* version */
1409     avio_rb24(pb); /* flags */
1410
1411     entries = avio_rb32(pb);
1412
1413     av_dlog(c->fc, "keyframe_count = %d\n", entries);
1414
1415     if (entries >= UINT_MAX / sizeof(int))
1416         return -1;
1417     sc->keyframes = av_malloc(entries * sizeof(int));
1418     if (!sc->keyframes)
1419         return AVERROR(ENOMEM);
1420     sc->keyframe_count = entries;
1421
1422     for (i=0; i<entries; i++) {
1423         sc->keyframes[i] = avio_rb32(pb);
1424         //av_dlog(c->fc, "keyframes[]=%d\n", sc->keyframes[i]);
1425     }
1426     return 0;
1427 }
1428
1429 static int mov_read_stsz(MOVContext *c, AVIOContext *pb, MOVAtom atom)
1430 {
1431     AVStream *st;
1432     MOVStreamContext *sc;
1433     unsigned int i, entries, sample_size, field_size, num_bytes;
1434     GetBitContext gb;
1435     unsigned char* buf;
1436
1437     if (c->fc->nb_streams < 1)
1438         return 0;
1439     st = c->fc->streams[c->fc->nb_streams-1];
1440     sc = st->priv_data;
1441
1442     avio_r8(pb); /* version */
1443     avio_rb24(pb); /* flags */
1444
1445     if (atom.type == MKTAG('s','t','s','z')) {
1446         sample_size = avio_rb32(pb);
1447         if (!sc->sample_size) /* do not overwrite value computed in stsd */
1448             sc->sample_size = sample_size;
1449         field_size = 32;
1450     } else {
1451         sample_size = 0;
1452         avio_rb24(pb); /* reserved */
1453         field_size = avio_r8(pb);
1454     }
1455     entries = avio_rb32(pb);
1456
1457     av_dlog(c->fc, "sample_size = %d sample_count = %d\n", sc->sample_size, entries);
1458
1459     sc->sample_count = entries;
1460     if (sample_size)
1461         return 0;
1462
1463     if (field_size != 4 && field_size != 8 && field_size != 16 && field_size != 32) {
1464         av_log(c->fc, AV_LOG_ERROR, "Invalid sample field size %d\n", field_size);
1465         return -1;
1466     }
1467
1468     if (entries >= UINT_MAX / sizeof(int) || entries >= (UINT_MAX - 4) / field_size)
1469         return -1;
1470     sc->sample_sizes = av_malloc(entries * sizeof(int));
1471     if (!sc->sample_sizes)
1472         return AVERROR(ENOMEM);
1473
1474     num_bytes = (entries*field_size+4)>>3;
1475
1476     buf = av_malloc(num_bytes+FF_INPUT_BUFFER_PADDING_SIZE);
1477     if (!buf) {
1478         av_freep(&sc->sample_sizes);
1479         return AVERROR(ENOMEM);
1480     }
1481
1482     if (avio_read(pb, buf, num_bytes) < num_bytes) {
1483         av_freep(&sc->sample_sizes);
1484         av_free(buf);
1485         return -1;
1486     }
1487
1488     init_get_bits(&gb, buf, 8*num_bytes);
1489
1490     for (i=0; i<entries; i++)
1491         sc->sample_sizes[i] = get_bits_long(&gb, field_size);
1492
1493     av_free(buf);
1494     return 0;
1495 }
1496
1497 static int mov_read_stts(MOVContext *c, AVIOContext *pb, MOVAtom atom)
1498 {
1499     AVStream *st;
1500     MOVStreamContext *sc;
1501     unsigned int i, entries;
1502     int64_t duration=0;
1503     int64_t total_sample_count=0;
1504
1505     if (c->fc->nb_streams < 1)
1506         return 0;
1507     st = c->fc->streams[c->fc->nb_streams-1];
1508     sc = st->priv_data;
1509
1510     avio_r8(pb); /* version */
1511     avio_rb24(pb); /* flags */
1512     entries = avio_rb32(pb);
1513
1514     av_dlog(c->fc, "track[%i].stts.entries = %i\n",
1515             c->fc->nb_streams-1, entries);
1516
1517     if (!entries || entries >= UINT_MAX / sizeof(*sc->stts_data))
1518         return AVERROR(EINVAL);
1519
1520     sc->stts_data = av_malloc(entries * sizeof(*sc->stts_data));
1521     if (!sc->stts_data)
1522         return AVERROR(ENOMEM);
1523
1524     sc->stts_count = entries;
1525
1526     for (i=0; i<entries; i++) {
1527         int sample_duration;
1528         int sample_count;
1529
1530         sample_count=avio_rb32(pb);
1531         sample_duration = avio_rb32(pb);
1532         sc->stts_data[i].count= sample_count;
1533         sc->stts_data[i].duration= sample_duration;
1534
1535         av_dlog(c->fc, "sample_count=%d, sample_duration=%d\n",
1536                 sample_count, sample_duration);
1537
1538         duration+=(int64_t)sample_duration*sample_count;
1539         total_sample_count+=sample_count;
1540     }
1541
1542     st->nb_frames= total_sample_count;
1543     if (duration)
1544         st->duration= duration;
1545     return 0;
1546 }
1547
1548 static int mov_read_ctts(MOVContext *c, AVIOContext *pb, MOVAtom atom)
1549 {
1550     AVStream *st;
1551     MOVStreamContext *sc;
1552     unsigned int i, entries;
1553
1554     if (c->fc->nb_streams < 1)
1555         return 0;
1556     st = c->fc->streams[c->fc->nb_streams-1];
1557     sc = st->priv_data;
1558
1559     avio_r8(pb); /* version */
1560     avio_rb24(pb); /* flags */
1561     entries = avio_rb32(pb);
1562
1563     av_dlog(c->fc, "track[%i].ctts.entries = %i\n", c->fc->nb_streams-1, entries);
1564
1565     if (entries >= UINT_MAX / sizeof(*sc->ctts_data))
1566         return -1;
1567     sc->ctts_data = av_malloc(entries * sizeof(*sc->ctts_data));
1568     if (!sc->ctts_data)
1569         return AVERROR(ENOMEM);
1570     sc->ctts_count = entries;
1571
1572     for (i=0; i<entries; i++) {
1573         int count    =avio_rb32(pb);
1574         int duration =avio_rb32(pb);
1575
1576         sc->ctts_data[i].count   = count;
1577         sc->ctts_data[i].duration= duration;
1578         if (duration < 0)
1579             sc->dts_shift = FFMAX(sc->dts_shift, -duration);
1580     }
1581
1582     av_dlog(c->fc, "dts shift %d\n", sc->dts_shift);
1583
1584     return 0;
1585 }
1586
1587 static void mov_build_index(MOVContext *mov, AVStream *st)
1588 {
1589     MOVStreamContext *sc = st->priv_data;
1590     int64_t current_offset;
1591     int64_t current_dts = 0;
1592     unsigned int stts_index = 0;
1593     unsigned int stsc_index = 0;
1594     unsigned int stss_index = 0;
1595     unsigned int stps_index = 0;
1596     unsigned int i, j;
1597     uint64_t stream_size = 0;
1598
1599     /* adjust first dts according to edit list */
1600     if (sc->time_offset && mov->time_scale > 0) {
1601         if (sc->time_offset < 0)
1602             sc->time_offset = av_rescale(sc->time_offset, sc->time_scale, mov->time_scale);
1603         current_dts = -sc->time_offset;
1604         if (sc->ctts_data && sc->stts_data &&
1605             sc->ctts_data[0].duration / sc->stts_data[0].duration > 16) {
1606             /* more than 16 frames delay, dts are likely wrong
1607                this happens with files created by iMovie */
1608             sc->wrong_dts = 1;
1609             st->codec->has_b_frames = 1;
1610         }
1611     }
1612
1613     /* only use old uncompressed audio chunk demuxing when stts specifies it */
1614     if (!(st->codec->codec_type == AVMEDIA_TYPE_AUDIO &&
1615           sc->stts_count == 1 && sc->stts_data[0].duration == 1)) {
1616         unsigned int current_sample = 0;
1617         unsigned int stts_sample = 0;
1618         unsigned int sample_size;
1619         unsigned int distance = 0;
1620         int key_off = sc->keyframes && sc->keyframes[0] == 1;
1621
1622         current_dts -= sc->dts_shift;
1623
1624         if (sc->sample_count >= UINT_MAX / sizeof(*st->index_entries))
1625             return;
1626         st->index_entries = av_malloc(sc->sample_count*sizeof(*st->index_entries));
1627         if (!st->index_entries)
1628             return;
1629         st->index_entries_allocated_size = sc->sample_count*sizeof(*st->index_entries);
1630
1631         for (i = 0; i < sc->chunk_count; i++) {
1632             current_offset = sc->chunk_offsets[i];
1633             while (stsc_index + 1 < sc->stsc_count &&
1634                 i + 1 == sc->stsc_data[stsc_index + 1].first)
1635                 stsc_index++;
1636             for (j = 0; j < sc->stsc_data[stsc_index].count; j++) {
1637                 int keyframe = 0;
1638                 if (current_sample >= sc->sample_count) {
1639                     av_log(mov->fc, AV_LOG_ERROR, "wrong sample count\n");
1640                     return;
1641                 }
1642
1643                 if (!sc->keyframe_count || current_sample+key_off == sc->keyframes[stss_index]) {
1644                     keyframe = 1;
1645                     if (stss_index + 1 < sc->keyframe_count)
1646                         stss_index++;
1647                 } else if (sc->stps_count && current_sample+key_off == sc->stps_data[stps_index]) {
1648                     keyframe = 1;
1649                     if (stps_index + 1 < sc->stps_count)
1650                         stps_index++;
1651                 }
1652                 if (keyframe)
1653                     distance = 0;
1654                 sample_size = sc->sample_size > 0 ? sc->sample_size : sc->sample_sizes[current_sample];
1655                 if (sc->pseudo_stream_id == -1 ||
1656                    sc->stsc_data[stsc_index].id - 1 == sc->pseudo_stream_id) {
1657                     AVIndexEntry *e = &st->index_entries[st->nb_index_entries++];
1658                     e->pos = current_offset;
1659                     e->timestamp = current_dts;
1660                     e->size = sample_size;
1661                     e->min_distance = distance;
1662                     e->flags = keyframe ? AVINDEX_KEYFRAME : 0;
1663                     av_dlog(mov->fc, "AVIndex stream %d, sample %d, offset %"PRIx64", dts %"PRId64", "
1664                             "size %d, distance %d, keyframe %d\n", st->index, current_sample,
1665                             current_offset, current_dts, sample_size, distance, keyframe);
1666                 }
1667
1668                 current_offset += sample_size;
1669                 stream_size += sample_size;
1670                 current_dts += sc->stts_data[stts_index].duration;
1671                 distance++;
1672                 stts_sample++;
1673                 current_sample++;
1674                 if (stts_index + 1 < sc->stts_count && stts_sample == sc->stts_data[stts_index].count) {
1675                     stts_sample = 0;
1676                     stts_index++;
1677                 }
1678             }
1679         }
1680         if (st->duration > 0)
1681             st->codec->bit_rate = stream_size*8*sc->time_scale/st->duration;
1682     } else {
1683         unsigned chunk_samples, total = 0;
1684
1685         // compute total chunk count
1686         for (i = 0; i < sc->stsc_count; i++) {
1687             unsigned count, chunk_count;
1688
1689             chunk_samples = sc->stsc_data[i].count;
1690             if (sc->samples_per_frame && chunk_samples % sc->samples_per_frame) {
1691                 av_log(mov->fc, AV_LOG_ERROR, "error unaligned chunk\n");
1692                 return;
1693             }
1694
1695             if (sc->samples_per_frame >= 160) { // gsm
1696                 count = chunk_samples / sc->samples_per_frame;
1697             } else if (sc->samples_per_frame > 1) {
1698                 unsigned samples = (1024/sc->samples_per_frame)*sc->samples_per_frame;
1699                 count = (chunk_samples+samples-1) / samples;
1700             } else {
1701                 count = (chunk_samples+1023) / 1024;
1702             }
1703
1704             if (i < sc->stsc_count - 1)
1705                 chunk_count = sc->stsc_data[i+1].first - sc->stsc_data[i].first;
1706             else
1707                 chunk_count = sc->chunk_count - (sc->stsc_data[i].first - 1);
1708             total += chunk_count * count;
1709         }
1710
1711         av_dlog(mov->fc, "chunk count %d\n", total);
1712         if (total >= UINT_MAX / sizeof(*st->index_entries))
1713             return;
1714         st->index_entries = av_malloc(total*sizeof(*st->index_entries));
1715         if (!st->index_entries)
1716             return;
1717         st->index_entries_allocated_size = total*sizeof(*st->index_entries);
1718
1719         // populate index
1720         for (i = 0; i < sc->chunk_count; i++) {
1721             current_offset = sc->chunk_offsets[i];
1722             if (stsc_index + 1 < sc->stsc_count &&
1723                 i + 1 == sc->stsc_data[stsc_index + 1].first)
1724                 stsc_index++;
1725             chunk_samples = sc->stsc_data[stsc_index].count;
1726
1727             while (chunk_samples > 0) {
1728                 AVIndexEntry *e;
1729                 unsigned size, samples;
1730
1731                 if (sc->samples_per_frame >= 160) { // gsm
1732                     samples = sc->samples_per_frame;
1733                     size = sc->bytes_per_frame;
1734                 } else {
1735                     if (sc->samples_per_frame > 1) {
1736                         samples = FFMIN((1024 / sc->samples_per_frame)*
1737                                         sc->samples_per_frame, chunk_samples);
1738                         size = (samples / sc->samples_per_frame) * sc->bytes_per_frame;
1739                     } else {
1740                         samples = FFMIN(1024, chunk_samples);
1741                         size = samples * sc->sample_size;
1742                     }
1743                 }
1744
1745                 if (st->nb_index_entries >= total) {
1746                     av_log(mov->fc, AV_LOG_ERROR, "wrong chunk count %d\n", total);
1747                     return;
1748                 }
1749                 e = &st->index_entries[st->nb_index_entries++];
1750                 e->pos = current_offset;
1751                 e->timestamp = current_dts;
1752                 e->size = size;
1753                 e->min_distance = 0;
1754                 e->flags = AVINDEX_KEYFRAME;
1755                 av_dlog(mov->fc, "AVIndex stream %d, chunk %d, offset %"PRIx64", dts %"PRId64", "
1756                         "size %d, duration %d\n", st->index, i, current_offset, current_dts,
1757                         size, samples);
1758
1759                 current_offset += size;
1760                 current_dts += samples;
1761                 chunk_samples -= samples;
1762             }
1763         }
1764     }
1765 }
1766
1767 static int mov_open_dref(AVIOContext **pb, char *src, MOVDref *ref)
1768 {
1769     /* try relative path, we do not try the absolute because it can leak information about our
1770        system to an attacker */
1771     if (ref->nlvl_to > 0 && ref->nlvl_from > 0) {
1772         char filename[1024];
1773         char *src_path;
1774         int i, l;
1775
1776         /* find a source dir */
1777         src_path = strrchr(src, '/');
1778         if (src_path)
1779             src_path++;
1780         else
1781             src_path = src;
1782
1783         /* find a next level down to target */
1784         for (i = 0, l = strlen(ref->path) - 1; l >= 0; l--)
1785             if (ref->path[l] == '/') {
1786                 if (i == ref->nlvl_to - 1)
1787                     break;
1788                 else
1789                     i++;
1790             }
1791
1792         /* compose filename if next level down to target was found */
1793         if (i == ref->nlvl_to - 1 && src_path - src  < sizeof(filename)) {
1794             memcpy(filename, src, src_path - src);
1795             filename[src_path - src] = 0;
1796
1797             for (i = 1; i < ref->nlvl_from; i++)
1798                 av_strlcat(filename, "../", 1024);
1799
1800             av_strlcat(filename, ref->path + l + 1, 1024);
1801
1802             if (!avio_open(pb, filename, AVIO_FLAG_READ))
1803                 return 0;
1804         }
1805     }
1806
1807     return AVERROR(ENOENT);
1808 }
1809
1810 static int mov_read_trak(MOVContext *c, AVIOContext *pb, MOVAtom atom)
1811 {
1812     AVStream *st;
1813     MOVStreamContext *sc;
1814     int ret;
1815
1816     st = avformat_new_stream(c->fc, NULL);
1817     if (!st) return AVERROR(ENOMEM);
1818     st->id = c->fc->nb_streams;
1819     sc = av_mallocz(sizeof(MOVStreamContext));
1820     if (!sc) return AVERROR(ENOMEM);
1821
1822     st->priv_data = sc;
1823     st->codec->codec_type = AVMEDIA_TYPE_DATA;
1824     sc->ffindex = st->index;
1825
1826     if ((ret = mov_read_default(c, pb, atom)) < 0)
1827         return ret;
1828
1829     /* sanity checks */
1830     if (sc->chunk_count && (!sc->stts_count || !sc->stsc_count ||
1831                             (!sc->sample_size && !sc->sample_count))) {
1832         av_log(c->fc, AV_LOG_ERROR, "stream %d, missing mandatory atoms, broken header\n",
1833                st->index);
1834         return 0;
1835     }
1836
1837     if (sc->time_scale <= 0) {
1838         av_log(c->fc, AV_LOG_WARNING, "stream %d, timescale not set\n", st->index);
1839         sc->time_scale = c->time_scale;
1840         if (sc->time_scale <= 0)
1841             sc->time_scale = 1;
1842     }
1843
1844     av_set_pts_info(st, 64, 1, sc->time_scale);
1845
1846     if (st->codec->codec_type == AVMEDIA_TYPE_AUDIO &&
1847         !st->codec->frame_size && sc->stts_count == 1) {
1848         st->codec->frame_size = av_rescale(sc->stts_data[0].duration,
1849                                            st->codec->sample_rate, sc->time_scale);
1850         av_dlog(c->fc, "frame size %d\n", st->codec->frame_size);
1851     }
1852
1853     mov_build_index(c, st);
1854
1855     if (sc->dref_id-1 < sc->drefs_count && sc->drefs[sc->dref_id-1].path) {
1856         MOVDref *dref = &sc->drefs[sc->dref_id - 1];
1857         if (mov_open_dref(&sc->pb, c->fc->filename, dref) < 0)
1858             av_log(c->fc, AV_LOG_ERROR,
1859                    "stream %d, error opening alias: path='%s', dir='%s', "
1860                    "filename='%s', volume='%s', nlvl_from=%d, nlvl_to=%d\n",
1861                    st->index, dref->path, dref->dir, dref->filename,
1862                    dref->volume, dref->nlvl_from, dref->nlvl_to);
1863     } else
1864         sc->pb = c->fc->pb;
1865
1866     if (st->codec->codec_type == AVMEDIA_TYPE_VIDEO) {
1867         if (!st->sample_aspect_ratio.num &&
1868             (st->codec->width != sc->width || st->codec->height != sc->height)) {
1869             st->sample_aspect_ratio = av_d2q(((double)st->codec->height * sc->width) /
1870                                              ((double)st->codec->width * sc->height), INT_MAX);
1871         }
1872
1873         av_reduce(&st->avg_frame_rate.num, &st->avg_frame_rate.den,
1874                   sc->time_scale*st->nb_frames, st->duration, INT_MAX);
1875
1876         if (sc->stts_count == 1 || (sc->stts_count == 2 && sc->stts_data[1].count == 1))
1877             av_reduce(&st->r_frame_rate.num, &st->r_frame_rate.den,
1878                       sc->time_scale, sc->stts_data[0].duration, INT_MAX);
1879     }
1880
1881     switch (st->codec->codec_id) {
1882 #if CONFIG_H261_DECODER
1883     case CODEC_ID_H261:
1884 #endif
1885 #if CONFIG_H263_DECODER
1886     case CODEC_ID_H263:
1887 #endif
1888 #if CONFIG_H264_DECODER
1889     case CODEC_ID_H264:
1890 #endif
1891 #if CONFIG_MPEG4_DECODER
1892     case CODEC_ID_MPEG4:
1893 #endif
1894         st->codec->width = 0; /* let decoder init width/height */
1895         st->codec->height= 0;
1896         break;
1897     }
1898
1899     /* Do not need those anymore. */
1900     av_freep(&sc->chunk_offsets);
1901     av_freep(&sc->stsc_data);
1902     av_freep(&sc->sample_sizes);
1903     av_freep(&sc->keyframes);
1904     av_freep(&sc->stts_data);
1905     av_freep(&sc->stps_data);
1906
1907     return 0;
1908 }
1909
1910 static int mov_read_ilst(MOVContext *c, AVIOContext *pb, MOVAtom atom)
1911 {
1912     int ret;
1913     c->itunes_metadata = 1;
1914     ret = mov_read_default(c, pb, atom);
1915     c->itunes_metadata = 0;
1916     return ret;
1917 }
1918
1919 static int mov_read_meta(MOVContext *c, AVIOContext *pb, MOVAtom atom)
1920 {
1921     while (atom.size > 8) {
1922         uint32_t tag = avio_rl32(pb);
1923         atom.size -= 4;
1924         if (tag == MKTAG('h','d','l','r')) {
1925             avio_seek(pb, -8, SEEK_CUR);
1926             atom.size += 8;
1927             return mov_read_default(c, pb, atom);
1928         }
1929     }
1930     return 0;
1931 }
1932
1933 static int mov_read_tkhd(MOVContext *c, AVIOContext *pb, MOVAtom atom)
1934 {
1935     int i;
1936     int width;
1937     int height;
1938     int64_t disp_transform[2];
1939     int display_matrix[3][2];
1940     AVStream *st;
1941     MOVStreamContext *sc;
1942     int version;
1943
1944     if (c->fc->nb_streams < 1)
1945         return 0;
1946     st = c->fc->streams[c->fc->nb_streams-1];
1947     sc = st->priv_data;
1948
1949     version = avio_r8(pb);
1950     avio_rb24(pb); /* flags */
1951     /*
1952     MOV_TRACK_ENABLED 0x0001
1953     MOV_TRACK_IN_MOVIE 0x0002
1954     MOV_TRACK_IN_PREVIEW 0x0004
1955     MOV_TRACK_IN_POSTER 0x0008
1956     */
1957
1958     if (version == 1) {
1959         avio_rb64(pb);
1960         avio_rb64(pb);
1961     } else {
1962         avio_rb32(pb); /* creation time */
1963         avio_rb32(pb); /* modification time */
1964     }
1965     st->id = (int)avio_rb32(pb); /* track id (NOT 0 !)*/
1966     avio_rb32(pb); /* reserved */
1967
1968     /* highlevel (considering edits) duration in movie timebase */
1969     (version == 1) ? avio_rb64(pb) : avio_rb32(pb);
1970     avio_rb32(pb); /* reserved */
1971     avio_rb32(pb); /* reserved */
1972
1973     avio_rb16(pb); /* layer */
1974     avio_rb16(pb); /* alternate group */
1975     avio_rb16(pb); /* volume */
1976     avio_rb16(pb); /* reserved */
1977
1978     //read in the display matrix (outlined in ISO 14496-12, Section 6.2.2)
1979     // they're kept in fixed point format through all calculations
1980     // ignore u,v,z b/c we don't need the scale factor to calc aspect ratio
1981     for (i = 0; i < 3; i++) {
1982         display_matrix[i][0] = avio_rb32(pb);   // 16.16 fixed point
1983         display_matrix[i][1] = avio_rb32(pb);   // 16.16 fixed point
1984         avio_rb32(pb);           // 2.30 fixed point (not used)
1985     }
1986
1987     width = avio_rb32(pb);       // 16.16 fixed point track width
1988     height = avio_rb32(pb);      // 16.16 fixed point track height
1989     sc->width = width >> 16;
1990     sc->height = height >> 16;
1991
1992     // transform the display width/height according to the matrix
1993     // skip this if the display matrix is the default identity matrix
1994     // or if it is rotating the picture, ex iPhone 3GS
1995     // to keep the same scale, use [width height 1<<16]
1996     if (width && height &&
1997         ((display_matrix[0][0] != 65536  ||
1998           display_matrix[1][1] != 65536) &&
1999          !display_matrix[0][1] &&
2000          !display_matrix[1][0] &&
2001          !display_matrix[2][0] && !display_matrix[2][1])) {
2002         for (i = 0; i < 2; i++)
2003             disp_transform[i] =
2004                 (int64_t)  width  * display_matrix[0][i] +
2005                 (int64_t)  height * display_matrix[1][i] +
2006                 ((int64_t) display_matrix[2][i] << 16);
2007
2008         //sample aspect ratio is new width/height divided by old width/height
2009         st->sample_aspect_ratio = av_d2q(
2010             ((double) disp_transform[0] * height) /
2011             ((double) disp_transform[1] * width), INT_MAX);
2012     }
2013     return 0;
2014 }
2015
2016 static int mov_read_tfhd(MOVContext *c, AVIOContext *pb, MOVAtom atom)
2017 {
2018     MOVFragment *frag = &c->fragment;
2019     MOVTrackExt *trex = NULL;
2020     int flags, track_id, i;
2021
2022     avio_r8(pb); /* version */
2023     flags = avio_rb24(pb);
2024
2025     track_id = avio_rb32(pb);
2026     if (!track_id)
2027         return -1;
2028     frag->track_id = track_id;
2029     for (i = 0; i < c->trex_count; i++)
2030         if (c->trex_data[i].track_id == frag->track_id) {
2031             trex = &c->trex_data[i];
2032             break;
2033         }
2034     if (!trex) {
2035         av_log(c->fc, AV_LOG_ERROR, "could not find corresponding trex\n");
2036         return -1;
2037     }
2038
2039     if (flags & 0x01) frag->base_data_offset = avio_rb64(pb);
2040     else              frag->base_data_offset = frag->moof_offset;
2041     if (flags & 0x02) frag->stsd_id          = avio_rb32(pb);
2042     else              frag->stsd_id          = trex->stsd_id;
2043
2044     frag->duration = flags & 0x08 ? avio_rb32(pb) : trex->duration;
2045     frag->size     = flags & 0x10 ? avio_rb32(pb) : trex->size;
2046     frag->flags    = flags & 0x20 ? avio_rb32(pb) : trex->flags;
2047     av_dlog(c->fc, "frag flags 0x%x\n", frag->flags);
2048     return 0;
2049 }
2050
2051 static int mov_read_chap(MOVContext *c, AVIOContext *pb, MOVAtom atom)
2052 {
2053     c->chapter_track = avio_rb32(pb);
2054     return 0;
2055 }
2056
2057 static int mov_read_trex(MOVContext *c, AVIOContext *pb, MOVAtom atom)
2058 {
2059     MOVTrackExt *trex;
2060
2061     if ((uint64_t)c->trex_count+1 >= UINT_MAX / sizeof(*c->trex_data))
2062         return -1;
2063     trex = av_realloc(c->trex_data, (c->trex_count+1)*sizeof(*c->trex_data));
2064     if (!trex)
2065         return AVERROR(ENOMEM);
2066     c->trex_data = trex;
2067     trex = &c->trex_data[c->trex_count++];
2068     avio_r8(pb); /* version */
2069     avio_rb24(pb); /* flags */
2070     trex->track_id = avio_rb32(pb);
2071     trex->stsd_id  = avio_rb32(pb);
2072     trex->duration = avio_rb32(pb);
2073     trex->size     = avio_rb32(pb);
2074     trex->flags    = avio_rb32(pb);
2075     return 0;
2076 }
2077
2078 static int mov_read_trun(MOVContext *c, AVIOContext *pb, MOVAtom atom)
2079 {
2080     MOVFragment *frag = &c->fragment;
2081     AVStream *st = NULL;
2082     MOVStreamContext *sc;
2083     MOVStts *ctts_data;
2084     uint64_t offset;
2085     int64_t dts;
2086     int data_offset = 0;
2087     unsigned entries, first_sample_flags = frag->flags;
2088     int flags, distance, i;
2089
2090     for (i = 0; i < c->fc->nb_streams; i++) {
2091         if (c->fc->streams[i]->id == frag->track_id) {
2092             st = c->fc->streams[i];
2093             break;
2094         }
2095     }
2096     if (!st) {
2097         av_log(c->fc, AV_LOG_ERROR, "could not find corresponding track id %d\n", frag->track_id);
2098         return -1;
2099     }
2100     sc = st->priv_data;
2101     if (sc->pseudo_stream_id+1 != frag->stsd_id)
2102         return 0;
2103     avio_r8(pb); /* version */
2104     flags = avio_rb24(pb);
2105     entries = avio_rb32(pb);
2106     av_dlog(c->fc, "flags 0x%x entries %d\n", flags, entries);
2107
2108     /* Always assume the presence of composition time offsets.
2109      * Without this assumption, for instance, we cannot deal with a track in fragmented movies that meet the following.
2110      *  1) in the initial movie, there are no samples.
2111      *  2) in the first movie fragment, there is only one sample without composition time offset.
2112      *  3) in the subsequent movie fragments, there are samples with composition time offset. */
2113     if (!sc->ctts_count && sc->sample_count)
2114     {
2115         /* Complement ctts table if moov atom doesn't have ctts atom. */
2116         ctts_data = av_malloc(sizeof(*sc->ctts_data));
2117         if (!ctts_data)
2118             return AVERROR(ENOMEM);
2119         sc->ctts_data = ctts_data;
2120         sc->ctts_data[sc->ctts_count].count = sc->sample_count;
2121         sc->ctts_data[sc->ctts_count].duration = 0;
2122         sc->ctts_count++;
2123     }
2124     if ((uint64_t)entries+sc->ctts_count >= UINT_MAX/sizeof(*sc->ctts_data))
2125         return -1;
2126     ctts_data = av_realloc(sc->ctts_data,
2127                            (entries+sc->ctts_count)*sizeof(*sc->ctts_data));
2128     if (!ctts_data)
2129         return AVERROR(ENOMEM);
2130     sc->ctts_data = ctts_data;
2131
2132     if (flags & 0x001) data_offset        = avio_rb32(pb);
2133     if (flags & 0x004) first_sample_flags = avio_rb32(pb);
2134     dts = st->duration - sc->time_offset;
2135     offset = frag->base_data_offset + data_offset;
2136     distance = 0;
2137     av_dlog(c->fc, "first sample flags 0x%x\n", first_sample_flags);
2138     for (i = 0; i < entries; i++) {
2139         unsigned sample_size = frag->size;
2140         int sample_flags = i ? frag->flags : first_sample_flags;
2141         unsigned sample_duration = frag->duration;
2142         int keyframe;
2143
2144         if (flags & 0x100) sample_duration = avio_rb32(pb);
2145         if (flags & 0x200) sample_size     = avio_rb32(pb);
2146         if (flags & 0x400) sample_flags    = avio_rb32(pb);
2147         sc->ctts_data[sc->ctts_count].count = 1;
2148         sc->ctts_data[sc->ctts_count].duration = (flags & 0x800) ? avio_rb32(pb) : 0;
2149         sc->ctts_count++;
2150         if ((keyframe = st->codec->codec_type == AVMEDIA_TYPE_AUDIO ||
2151              (flags & 0x004 && !i && !sample_flags) || sample_flags & 0x2000000))
2152             distance = 0;
2153         av_add_index_entry(st, offset, dts, sample_size, distance,
2154                            keyframe ? AVINDEX_KEYFRAME : 0);
2155         av_dlog(c->fc, "AVIndex stream %d, sample %d, offset %"PRIx64", dts %"PRId64", "
2156                 "size %d, distance %d, keyframe %d\n", st->index, sc->sample_count+i,
2157                 offset, dts, sample_size, distance, keyframe);
2158         distance++;
2159         dts += sample_duration;
2160         offset += sample_size;
2161     }
2162     frag->moof_offset = offset;
2163     st->duration = dts + sc->time_offset;
2164     return 0;
2165 }
2166
2167 /* this atom should be null (from specs), but some buggy files put the 'moov' atom inside it... */
2168 /* like the files created with Adobe Premiere 5.0, for samples see */
2169 /* http://graphics.tudelft.nl/~wouter/publications/soundtests/ */
2170 static int mov_read_wide(MOVContext *c, AVIOContext *pb, MOVAtom atom)
2171 {
2172     int err;
2173
2174     if (atom.size < 8)
2175         return 0; /* continue */
2176     if (avio_rb32(pb) != 0) { /* 0 sized mdat atom... use the 'wide' atom size */
2177         avio_skip(pb, atom.size - 4);
2178         return 0;
2179     }
2180     atom.type = avio_rl32(pb);
2181     atom.size -= 8;
2182     if (atom.type != MKTAG('m','d','a','t')) {
2183         avio_skip(pb, atom.size);
2184         return 0;
2185     }
2186     err = mov_read_mdat(c, pb, atom);
2187     return err;
2188 }
2189
2190 static int mov_read_cmov(MOVContext *c, AVIOContext *pb, MOVAtom atom)
2191 {
2192 #if CONFIG_ZLIB
2193     AVIOContext ctx;
2194     uint8_t *cmov_data;
2195     uint8_t *moov_data; /* uncompressed data */
2196     long cmov_len, moov_len;
2197     int ret = -1;
2198
2199     avio_rb32(pb); /* dcom atom */
2200     if (avio_rl32(pb) != MKTAG('d','c','o','m'))
2201         return -1;
2202     if (avio_rl32(pb) != MKTAG('z','l','i','b')) {
2203         av_log(c->fc, AV_LOG_ERROR, "unknown compression for cmov atom !");
2204         return -1;
2205     }
2206     avio_rb32(pb); /* cmvd atom */
2207     if (avio_rl32(pb) != MKTAG('c','m','v','d'))
2208         return -1;
2209     moov_len = avio_rb32(pb); /* uncompressed size */
2210     cmov_len = atom.size - 6 * 4;
2211
2212     cmov_data = av_malloc(cmov_len);
2213     if (!cmov_data)
2214         return AVERROR(ENOMEM);
2215     moov_data = av_malloc(moov_len);
2216     if (!moov_data) {
2217         av_free(cmov_data);
2218         return AVERROR(ENOMEM);
2219     }
2220     avio_read(pb, cmov_data, cmov_len);
2221     if (uncompress (moov_data, (uLongf *) &moov_len, (const Bytef *)cmov_data, cmov_len) != Z_OK)
2222         goto free_and_return;
2223     if (ffio_init_context(&ctx, moov_data, moov_len, 0, NULL, NULL, NULL, NULL) != 0)
2224         goto free_and_return;
2225     atom.type = MKTAG('m','o','o','v');
2226     atom.size = moov_len;
2227     ret = mov_read_default(c, &ctx, atom);
2228 free_and_return:
2229     av_free(moov_data);
2230     av_free(cmov_data);
2231     return ret;
2232 #else
2233     av_log(c->fc, AV_LOG_ERROR, "this file requires zlib support compiled in\n");
2234     return -1;
2235 #endif
2236 }
2237
2238 /* edit list atom */
2239 static int mov_read_elst(MOVContext *c, AVIOContext *pb, MOVAtom atom)
2240 {
2241     MOVStreamContext *sc;
2242     int i, edit_count, version;
2243
2244     if (c->fc->nb_streams < 1)
2245         return 0;
2246     sc = c->fc->streams[c->fc->nb_streams-1]->priv_data;
2247
2248     version = avio_r8(pb); /* version */
2249     avio_rb24(pb); /* flags */
2250     edit_count = avio_rb32(pb); /* entries */
2251
2252     if ((uint64_t)edit_count*12+8 > atom.size)
2253         return -1;
2254
2255     for (i=0; i<edit_count; i++){
2256         int64_t time;
2257         int64_t duration;
2258         if (version == 1) {
2259             duration = avio_rb64(pb);
2260             time     = avio_rb64(pb);
2261         } else {
2262             duration = avio_rb32(pb); /* segment duration */
2263             time     = (int32_t)avio_rb32(pb); /* media time */
2264         }
2265         avio_rb32(pb); /* Media rate */
2266         if (i == 0 && time >= -1) {
2267             sc->time_offset = time != -1 ? time : -duration;
2268         }
2269     }
2270
2271     if (edit_count > 1)
2272         av_log(c->fc, AV_LOG_WARNING, "multiple edit list entries, "
2273                "a/v desync might occur, patch welcome\n");
2274
2275     av_dlog(c->fc, "track[%i].edit_count = %i\n", c->fc->nb_streams-1, edit_count);
2276     return 0;
2277 }
2278
2279 static const MOVParseTableEntry mov_default_parse_table[] = {
2280 { MKTAG('a','v','s','s'), mov_read_extradata },
2281 { MKTAG('c','h','p','l'), mov_read_chpl },
2282 { MKTAG('c','o','6','4'), mov_read_stco },
2283 { MKTAG('c','t','t','s'), mov_read_ctts }, /* composition time to sample */
2284 { MKTAG('d','i','n','f'), mov_read_default },
2285 { MKTAG('d','r','e','f'), mov_read_dref },
2286 { MKTAG('e','d','t','s'), mov_read_default },
2287 { MKTAG('e','l','s','t'), mov_read_elst },
2288 { MKTAG('e','n','d','a'), mov_read_enda },
2289 { MKTAG('f','i','e','l'), mov_read_extradata },
2290 { MKTAG('f','t','y','p'), mov_read_ftyp },
2291 { MKTAG('g','l','b','l'), mov_read_glbl },
2292 { MKTAG('h','d','l','r'), mov_read_hdlr },
2293 { MKTAG('i','l','s','t'), mov_read_ilst },
2294 { MKTAG('j','p','2','h'), mov_read_extradata },
2295 { MKTAG('m','d','a','t'), mov_read_mdat },
2296 { MKTAG('m','d','h','d'), mov_read_mdhd },
2297 { MKTAG('m','d','i','a'), mov_read_default },
2298 { MKTAG('m','e','t','a'), mov_read_meta },
2299 { MKTAG('m','i','n','f'), mov_read_default },
2300 { MKTAG('m','o','o','f'), mov_read_moof },
2301 { MKTAG('m','o','o','v'), mov_read_moov },
2302 { MKTAG('m','v','e','x'), mov_read_default },
2303 { MKTAG('m','v','h','d'), mov_read_mvhd },
2304 { MKTAG('S','M','I',' '), mov_read_smi }, /* Sorenson extension ??? */
2305 { MKTAG('a','l','a','c'), mov_read_extradata }, /* alac specific atom */
2306 { MKTAG('a','v','c','C'), mov_read_glbl },
2307 { MKTAG('p','a','s','p'), mov_read_pasp },
2308 { MKTAG('s','t','b','l'), mov_read_default },
2309 { MKTAG('s','t','c','o'), mov_read_stco },
2310 { MKTAG('s','t','p','s'), mov_read_stps },
2311 { MKTAG('s','t','r','f'), mov_read_strf },
2312 { MKTAG('s','t','s','c'), mov_read_stsc },
2313 { MKTAG('s','t','s','d'), mov_read_stsd }, /* sample description */
2314 { MKTAG('s','t','s','s'), mov_read_stss }, /* sync sample */
2315 { MKTAG('s','t','s','z'), mov_read_stsz }, /* sample size */
2316 { MKTAG('s','t','t','s'), mov_read_stts },
2317 { MKTAG('s','t','z','2'), mov_read_stsz }, /* compact sample size */
2318 { MKTAG('t','k','h','d'), mov_read_tkhd }, /* track header */
2319 { MKTAG('t','f','h','d'), mov_read_tfhd }, /* track fragment header */
2320 { MKTAG('t','r','a','k'), mov_read_trak },
2321 { MKTAG('t','r','a','f'), mov_read_default },
2322 { MKTAG('t','r','e','f'), mov_read_default },
2323 { MKTAG('c','h','a','p'), mov_read_chap },
2324 { MKTAG('t','r','e','x'), mov_read_trex },
2325 { MKTAG('t','r','u','n'), mov_read_trun },
2326 { MKTAG('u','d','t','a'), mov_read_default },
2327 { MKTAG('w','a','v','e'), mov_read_wave },
2328 { MKTAG('e','s','d','s'), mov_read_esds },
2329 { MKTAG('d','a','c','3'), mov_read_dac3 }, /* AC-3 info */
2330 { MKTAG('w','i','d','e'), mov_read_wide }, /* place holder */
2331 { MKTAG('w','f','e','x'), mov_read_wfex },
2332 { MKTAG('c','m','o','v'), mov_read_cmov },
2333 { 0, NULL }
2334 };
2335
2336 static int mov_probe(AVProbeData *p)
2337 {
2338     unsigned int offset;
2339     uint32_t tag;
2340     int score = 0;
2341
2342     /* check file header */
2343     offset = 0;
2344     for (;;) {
2345         /* ignore invalid offset */
2346         if ((offset + 8) > (unsigned int)p->buf_size)
2347             return score;
2348         tag = AV_RL32(p->buf + offset + 4);
2349         switch(tag) {
2350         /* check for obvious tags */
2351         case MKTAG('j','P',' ',' '): /* jpeg 2000 signature */
2352         case MKTAG('m','o','o','v'):
2353         case MKTAG('m','d','a','t'):
2354         case MKTAG('p','n','o','t'): /* detect movs with preview pics like ew.mov and april.mov */
2355         case MKTAG('u','d','t','a'): /* Packet Video PVAuthor adds this and a lot of more junk */
2356         case MKTAG('f','t','y','p'):
2357             return AVPROBE_SCORE_MAX;
2358         /* those are more common words, so rate then a bit less */
2359         case MKTAG('e','d','i','w'): /* xdcam files have reverted first tags */
2360         case MKTAG('w','i','d','e'):
2361         case MKTAG('f','r','e','e'):
2362         case MKTAG('j','u','n','k'):
2363         case MKTAG('p','i','c','t'):
2364             return AVPROBE_SCORE_MAX - 5;
2365         case MKTAG(0x82,0x82,0x7f,0x7d):
2366         case MKTAG('s','k','i','p'):
2367         case MKTAG('u','u','i','d'):
2368         case MKTAG('p','r','f','l'):
2369             offset = AV_RB32(p->buf+offset) + offset;
2370             /* if we only find those cause probedata is too small at least rate them */
2371             score = AVPROBE_SCORE_MAX - 50;
2372             break;
2373         default:
2374             /* unrecognized tag */
2375             return score;
2376         }
2377     }
2378 }
2379
2380 // must be done after parsing all trak because there's no order requirement
2381 static void mov_read_chapters(AVFormatContext *s)
2382 {
2383     MOVContext *mov = s->priv_data;
2384     AVStream *st = NULL;
2385     MOVStreamContext *sc;
2386     int64_t cur_pos;
2387     int i;
2388
2389     for (i = 0; i < s->nb_streams; i++)
2390         if (s->streams[i]->id == mov->chapter_track) {
2391             st = s->streams[i];
2392             break;
2393         }
2394     if (!st) {
2395         av_log(s, AV_LOG_ERROR, "Referenced QT chapter track not found\n");
2396         return;
2397     }
2398
2399     st->discard = AVDISCARD_ALL;
2400     sc = st->priv_data;
2401     cur_pos = avio_tell(sc->pb);
2402
2403     for (i = 0; i < st->nb_index_entries; i++) {
2404         AVIndexEntry *sample = &st->index_entries[i];
2405         int64_t end = i+1 < st->nb_index_entries ? st->index_entries[i+1].timestamp : st->duration;
2406         uint8_t *title;
2407         uint16_t ch;
2408         int len, title_len;
2409
2410         if (avio_seek(sc->pb, sample->pos, SEEK_SET) != sample->pos) {
2411             av_log(s, AV_LOG_ERROR, "Chapter %d not found in file\n", i);
2412             goto finish;
2413         }
2414
2415         // the first two bytes are the length of the title
2416         len = avio_rb16(sc->pb);
2417         if (len > sample->size-2)
2418             continue;
2419         title_len = 2*len + 1;
2420         if (!(title = av_mallocz(title_len)))
2421             goto finish;
2422
2423         // The samples could theoretically be in any encoding if there's an encd
2424         // atom following, but in practice are only utf-8 or utf-16, distinguished
2425         // instead by the presence of a BOM
2426         if (!len) {
2427             title[0] = 0;
2428         } else {
2429             ch = avio_rb16(sc->pb);
2430             if (ch == 0xfeff)
2431                 avio_get_str16be(sc->pb, len, title, title_len);
2432             else if (ch == 0xfffe)
2433                 avio_get_str16le(sc->pb, len, title, title_len);
2434             else {
2435                 AV_WB16(title, ch);
2436                 if (len == 1 || len == 2)
2437                     title[len] = 0;
2438                 else
2439                     avio_get_str(sc->pb, len - 2, title + 2, title_len - 2);
2440             }
2441         }
2442
2443         avpriv_new_chapter(s, i, st->time_base, sample->timestamp, end, title);
2444         av_freep(&title);
2445     }
2446 finish:
2447     avio_seek(sc->pb, cur_pos, SEEK_SET);
2448 }
2449
2450 static int mov_read_header(AVFormatContext *s, AVFormatParameters *ap)
2451 {
2452     MOVContext *mov = s->priv_data;
2453     AVIOContext *pb = s->pb;
2454     int err;
2455     MOVAtom atom = { AV_RL32("root") };
2456
2457     mov->fc = s;
2458     /* .mov and .mp4 aren't streamable anyway (only progressive download if moov is before mdat) */
2459     if (pb->seekable)
2460         atom.size = avio_size(pb);
2461     else
2462         atom.size = INT64_MAX;
2463
2464     /* check MOV header */
2465     if ((err = mov_read_default(mov, pb, atom)) < 0) {
2466         av_log(s, AV_LOG_ERROR, "error reading header: %d\n", err);
2467         return err;
2468     }
2469     if (!mov->found_moov) {
2470         av_log(s, AV_LOG_ERROR, "moov atom not found\n");
2471         return -1;
2472     }
2473     av_dlog(mov->fc, "on_parse_exit_offset=%"PRId64"\n", avio_tell(pb));
2474
2475     if (pb->seekable && mov->chapter_track > 0)
2476         mov_read_chapters(s);
2477
2478     return 0;
2479 }
2480
2481 static AVIndexEntry *mov_find_next_sample(AVFormatContext *s, AVStream **st)
2482 {
2483     AVIndexEntry *sample = NULL;
2484     int64_t best_dts = INT64_MAX;
2485     int i;
2486     for (i = 0; i < s->nb_streams; i++) {
2487         AVStream *avst = s->streams[i];
2488         MOVStreamContext *msc = avst->priv_data;
2489         if (msc->pb && msc->current_sample < avst->nb_index_entries) {
2490             AVIndexEntry *current_sample = &avst->index_entries[msc->current_sample];
2491             int64_t dts = av_rescale(current_sample->timestamp, AV_TIME_BASE, msc->time_scale);
2492             av_dlog(s, "stream %d, sample %d, dts %"PRId64"\n", i, msc->current_sample, dts);
2493             if (!sample || (!s->pb->seekable && current_sample->pos < sample->pos) ||
2494                 (s->pb->seekable &&
2495                  ((msc->pb != s->pb && dts < best_dts) || (msc->pb == s->pb &&
2496                  ((FFABS(best_dts - dts) <= AV_TIME_BASE && current_sample->pos < sample->pos) ||
2497                   (FFABS(best_dts - dts) > AV_TIME_BASE && dts < best_dts)))))) {
2498                 sample = current_sample;
2499                 best_dts = dts;
2500                 *st = avst;
2501             }
2502         }
2503     }
2504     return sample;
2505 }
2506
2507 static int mov_read_packet(AVFormatContext *s, AVPacket *pkt)
2508 {
2509     MOVContext *mov = s->priv_data;
2510     MOVStreamContext *sc;
2511     AVIndexEntry *sample;
2512     AVStream *st = NULL;
2513     int ret;
2514  retry:
2515     sample = mov_find_next_sample(s, &st);
2516     if (!sample) {
2517         mov->found_mdat = 0;
2518         if (s->pb->seekable||
2519             mov_read_default(mov, s->pb, (MOVAtom){ AV_RL32("root"), INT64_MAX }) < 0 ||
2520             s->pb->eof_reached)
2521             return AVERROR_EOF;
2522         av_dlog(s, "read fragments, offset 0x%"PRIx64"\n", avio_tell(s->pb));
2523         goto retry;
2524     }
2525     sc = st->priv_data;
2526     /* must be done just before reading, to avoid infinite loop on sample */
2527     sc->current_sample++;
2528
2529     if (st->discard != AVDISCARD_ALL) {
2530         if (avio_seek(sc->pb, sample->pos, SEEK_SET) != sample->pos) {
2531             av_log(mov->fc, AV_LOG_ERROR, "stream %d, offset 0x%"PRIx64": partial file\n",
2532                    sc->ffindex, sample->pos);
2533             return -1;
2534         }
2535         ret = av_get_packet(sc->pb, pkt, sample->size);
2536         if (ret < 0)
2537             return ret;
2538         if (sc->has_palette) {
2539             uint8_t *pal;
2540
2541             pal = av_packet_new_side_data(pkt, AV_PKT_DATA_PALETTE, AVPALETTE_SIZE);
2542             if (!pal) {
2543                 av_log(mov->fc, AV_LOG_ERROR, "Cannot append palette to packet\n");
2544             } else {
2545                 memcpy(pal, sc->palette, AVPALETTE_SIZE);
2546                 sc->has_palette = 0;
2547             }
2548         }
2549 #if CONFIG_DV_DEMUXER
2550         if (mov->dv_demux && sc->dv_audio_container) {
2551             avpriv_dv_produce_packet(mov->dv_demux, pkt, pkt->data, pkt->size);
2552             av_free(pkt->data);
2553             pkt->size = 0;
2554             ret = avpriv_dv_get_packet(mov->dv_demux, pkt);
2555             if (ret < 0)
2556                 return ret;
2557         }
2558 #endif
2559     }
2560
2561     pkt->stream_index = sc->ffindex;
2562     pkt->dts = sample->timestamp;
2563     if (sc->ctts_data) {
2564         pkt->pts = pkt->dts + sc->dts_shift + sc->ctts_data[sc->ctts_index].duration;
2565         /* update ctts context */
2566         sc->ctts_sample++;
2567         if (sc->ctts_index < sc->ctts_count &&
2568             sc->ctts_data[sc->ctts_index].count == sc->ctts_sample) {
2569             sc->ctts_index++;
2570             sc->ctts_sample = 0;
2571         }
2572         if (sc->wrong_dts)
2573             pkt->dts = AV_NOPTS_VALUE;
2574     } else {
2575         int64_t next_dts = (sc->current_sample < st->nb_index_entries) ?
2576             st->index_entries[sc->current_sample].timestamp : st->duration;
2577         pkt->duration = next_dts - pkt->dts;
2578         pkt->pts = pkt->dts;
2579     }
2580     if (st->discard == AVDISCARD_ALL)
2581         goto retry;
2582     pkt->flags |= sample->flags & AVINDEX_KEYFRAME ? AV_PKT_FLAG_KEY : 0;
2583     pkt->pos = sample->pos;
2584     av_dlog(s, "stream %d, pts %"PRId64", dts %"PRId64", pos 0x%"PRIx64", duration %d\n",
2585             pkt->stream_index, pkt->pts, pkt->dts, pkt->pos, pkt->duration);
2586     return 0;
2587 }
2588
2589 static int mov_seek_stream(AVFormatContext *s, AVStream *st, int64_t timestamp, int flags)
2590 {
2591     MOVStreamContext *sc = st->priv_data;
2592     int sample, time_sample;
2593     int i;
2594
2595     sample = av_index_search_timestamp(st, timestamp, flags);
2596     av_dlog(s, "stream %d, timestamp %"PRId64", sample %d\n", st->index, timestamp, sample);
2597     if (sample < 0 && st->nb_index_entries && timestamp < st->index_entries[0].timestamp)
2598         sample = 0;
2599     if (sample < 0) /* not sure what to do */
2600         return -1;
2601     sc->current_sample = sample;
2602     av_dlog(s, "stream %d, found sample %d\n", st->index, sc->current_sample);
2603     /* adjust ctts index */
2604     if (sc->ctts_data) {
2605         time_sample = 0;
2606         for (i = 0; i < sc->ctts_count; i++) {
2607             int next = time_sample + sc->ctts_data[i].count;
2608             if (next > sc->current_sample) {
2609                 sc->ctts_index = i;
2610                 sc->ctts_sample = sc->current_sample - time_sample;
2611                 break;
2612             }
2613             time_sample = next;
2614         }
2615     }
2616     return sample;
2617 }
2618
2619 static int mov_read_seek(AVFormatContext *s, int stream_index, int64_t sample_time, int flags)
2620 {
2621     AVStream *st;
2622     int64_t seek_timestamp, timestamp;
2623     int sample;
2624     int i;
2625
2626     if (stream_index >= s->nb_streams)
2627         return -1;
2628     if (sample_time < 0)
2629         sample_time = 0;
2630
2631     st = s->streams[stream_index];
2632     sample = mov_seek_stream(s, st, sample_time, flags);
2633     if (sample < 0)
2634         return -1;
2635
2636     /* adjust seek timestamp to found sample timestamp */
2637     seek_timestamp = st->index_entries[sample].timestamp;
2638
2639     for (i = 0; i < s->nb_streams; i++) {
2640         st = s->streams[i];
2641         if (stream_index == i)
2642             continue;
2643
2644         timestamp = av_rescale_q(seek_timestamp, s->streams[stream_index]->time_base, st->time_base);
2645         mov_seek_stream(s, st, timestamp, flags);
2646     }
2647     return 0;
2648 }
2649
2650 static int mov_read_close(AVFormatContext *s)
2651 {
2652     MOVContext *mov = s->priv_data;
2653     int i, j;
2654
2655     for (i = 0; i < s->nb_streams; i++) {
2656         AVStream *st = s->streams[i];
2657         MOVStreamContext *sc = st->priv_data;
2658
2659         av_freep(&sc->ctts_data);
2660         for (j = 0; j < sc->drefs_count; j++) {
2661             av_freep(&sc->drefs[j].path);
2662             av_freep(&sc->drefs[j].dir);
2663         }
2664         av_freep(&sc->drefs);
2665         if (sc->pb && sc->pb != s->pb)
2666             avio_close(sc->pb);
2667     }
2668
2669     if (mov->dv_demux) {
2670         for (i = 0; i < mov->dv_fctx->nb_streams; i++) {
2671             av_freep(&mov->dv_fctx->streams[i]->codec);
2672             av_freep(&mov->dv_fctx->streams[i]);
2673         }
2674         av_freep(&mov->dv_fctx);
2675         av_freep(&mov->dv_demux);
2676     }
2677
2678     av_freep(&mov->trex_data);
2679
2680     return 0;
2681 }
2682
2683 AVInputFormat ff_mov_demuxer = {
2684     .name           = "mov,mp4,m4a,3gp,3g2,mj2",
2685     .long_name      = NULL_IF_CONFIG_SMALL("QuickTime/MPEG-4/Motion JPEG 2000 format"),
2686     .priv_data_size = sizeof(MOVContext),
2687     .read_probe     = mov_probe,
2688     .read_header    = mov_read_header,
2689     .read_packet    = mov_read_packet,
2690     .read_close     = mov_read_close,
2691     .read_seek      = mov_read_seek,
2692 };