git.sesse.net Git - ffmpeg/blob - libavformat/westwood.c

   1 /*
   2  * Westwood Studios Multimedia Formats Demuxer (VQA, AUD)
   3  * Copyright (c) 2003 The ffmpeg Project
   4  *
   5  * This file is part of FFmpeg.
   6  *
   7  * FFmpeg is free software; you can redistribute it and/or
   8  * modify it under the terms of the GNU Lesser General Public
   9  * License as published by the Free Software Foundation; either
  10  * version 2.1 of the License, or (at your option) any later version.
  11  *
  12  * FFmpeg is distributed in the hope that it will be useful,
  13  * but WITHOUT ANY WARRANTY; without even the implied warranty of
  14  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
  15  * Lesser General Public License for more details.
  16  *
  17  * You should have received a copy of the GNU Lesser General Public
  18  * License along with FFmpeg; if not, write to the Free Software
  19  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  20  */
  21
  22 /**
  23  * @file westwood.c
  24  * Westwood Studios VQA & AUD file demuxers
  25  * by Mike Melanson (melanson@pcisys.net)
  26  * for more information on the Westwood file formats, visit:
  27  *   http://www.pcisys.net/~melanson/codecs/
  28  *   http://www.geocities.com/SiliconValley/8682/aud3.txt
  29  *
  30  * Implementation note: There is no definite file signature for AUD files.
  31  * The demuxer uses a probabilistic strategy for content detection. This
  32  * entails performing sanity checks on certain header values in order to
  33  * qualify a file. Refer to wsaud_probe() for the precise parameters.
  34  */
  35
  36 #include "avformat.h"
  37
  38 #define AUD_HEADER_SIZE 12
  39 #define AUD_CHUNK_PREAMBLE_SIZE 8
  40 #define AUD_CHUNK_SIGNATURE 0x0000DEAF
  41
  42 #define FORM_TAG MKBETAG('F', 'O', 'R', 'M')
  43 #define WVQA_TAG MKBETAG('W', 'V', 'Q', 'A')
  44 #define VQHD_TAG MKBETAG('V', 'Q', 'H', 'D')
  45 #define FINF_TAG MKBETAG('F', 'I', 'N', 'F')
  46 #define SND0_TAG MKBETAG('S', 'N', 'D', '0')
  47 #define SND1_TAG MKBETAG('S', 'N', 'D', '1')
  48 #define SND2_TAG MKBETAG('S', 'N', 'D', '2')
  49 #define VQFR_TAG MKBETAG('V', 'Q', 'F', 'R')
  50
  51 /* don't know what these tags are for, but acknowledge their existence */
  52 #define CINF_TAG MKBETAG('C', 'I', 'N', 'F')
  53 #define CINH_TAG MKBETAG('C', 'I', 'N', 'H')
  54 #define CIND_TAG MKBETAG('C', 'I', 'N', 'D')
  55 #define PINF_TAG MKBETAG('P', 'I', 'N', 'F')
  56 #define PINH_TAG MKBETAG('P', 'I', 'N', 'H')
  57 #define PIND_TAG MKBETAG('P', 'I', 'N', 'D')
  58 #define CMDS_TAG MKBETAG('C', 'M', 'D', 'S')
  59
  60 #define VQA_HEADER_SIZE 0x2A
  61 #define VQA_FRAMERATE 15
  62 #define VQA_VIDEO_PTS_INC (90000 / VQA_FRAMERATE)
  63 #define VQA_PREAMBLE_SIZE 8
  64
  65 typedef struct WsAudDemuxContext {
  66     int audio_samplerate;
  67     int audio_channels;
  68     int audio_bits;
  69     int audio_type;
  70     int audio_stream_index;
  71     int64_t audio_frame_counter;
  72 } WsAudDemuxContext;
  73
  74 typedef struct WsVqaDemuxContext {
  75     int audio_samplerate;
  76     int audio_channels;
  77     int audio_bits;
  78
  79     int audio_stream_index;
  80     int video_stream_index;
  81
  82     int64_t audio_frame_counter;
  83     int64_t video_pts;
  84 } WsVqaDemuxContext;
  85
  86 static int wsaud_probe(AVProbeData *p)
  87 {
  88     int field;
  89
  90     /* Probabilistic content detection strategy: There is no file signature
  91      * so perform sanity checks on various header parameters:
  92      *   8000 <= sample rate (16 bits) <= 48000  ==> 40001 acceptable numbers
  93      *   compression type (8 bits) = 1 or 99     ==> 2 acceptable numbers
  94      * There is a total of 24 bits. The number space contains 2^24 =
  95      * 16777216 numbers. There are 40001 * 2 = 80002 acceptable combinations
  96      * of numbers. There is a 80002/16777216 = 0.48% chance of a false
  97      * positive.
  98      */
  99
 100     if (p->buf_size < AUD_HEADER_SIZE)
 101         return 0;
 102
 103     /* check sample rate */
 104     field = LE_16(&p->buf[0]);
 105     if ((field < 8000) || (field > 48000))
 106         return 0;
 107
 108     /* note: only check for WS IMA (type 99) right now since there is no
 109      * support for type 1 */
 110     if (p->buf[11] != 99)
 111         return 0;
 112
 113     /* return 1/2 certainty since this file check is a little sketchy */
 114     return AVPROBE_SCORE_MAX / 2;
 115 }
 116
 117 static int wsaud_read_header(AVFormatContext *s,
 118                              AVFormatParameters *ap)
 119 {
 120     WsAudDemuxContext *wsaud = (WsAudDemuxContext *)s->priv_data;
 121     ByteIOContext *pb = &s->pb;
 122     AVStream *st;
 123     unsigned char header[AUD_HEADER_SIZE];
 124
 125     if (get_buffer(pb, header, AUD_HEADER_SIZE) != AUD_HEADER_SIZE)
 126         return AVERROR_IO;
 127     wsaud->audio_samplerate = LE_16(&header[0]);
 128     if (header[11] == 99)
 129         wsaud->audio_type = CODEC_ID_ADPCM_IMA_WS;
 130     else
 131         return AVERROR_INVALIDDATA;
 132
 133     /* flag 0 indicates stereo */
 134     wsaud->audio_channels = (header[10] & 0x1) + 1;
 135     /* flag 1 indicates 16 bit audio */
 136     wsaud->audio_bits = (((header[10] & 0x2) >> 1) + 1) * 8;
 137
 138     /* initialize the audio decoder stream */
 139     st = av_new_stream(s, 0);
 140     if (!st)
 141         return AVERROR_NOMEM;
 142     av_set_pts_info(st, 33, 1, wsaud->audio_samplerate);
 143     st->codec->codec_type = CODEC_TYPE_AUDIO;
 144     st->codec->codec_id = wsaud->audio_type;
 145     st->codec->codec_tag = 0;  /* no tag */
 146     st->codec->channels = wsaud->audio_channels;
 147     st->codec->sample_rate = wsaud->audio_samplerate;
 148     st->codec->bits_per_sample = wsaud->audio_bits;
 149     st->codec->bit_rate = st->codec->channels * st->codec->sample_rate *
 150         st->codec->bits_per_sample / 4;
 151     st->codec->block_align = st->codec->channels * st->codec->bits_per_sample;
 152
 153     wsaud->audio_stream_index = st->index;
 154     wsaud->audio_frame_counter = 0;
 155
 156     return 0;
 157 }
 158
 159 static int wsaud_read_packet(AVFormatContext *s,
 160                              AVPacket *pkt)
 161 {
 162     WsAudDemuxContext *wsaud = (WsAudDemuxContext *)s->priv_data;
 163     ByteIOContext *pb = &s->pb;
 164     unsigned char preamble[AUD_CHUNK_PREAMBLE_SIZE];
 165     unsigned int chunk_size;
 166     int ret = 0;
 167
 168     if (get_buffer(pb, preamble, AUD_CHUNK_PREAMBLE_SIZE) !=
 169         AUD_CHUNK_PREAMBLE_SIZE)
 170         return AVERROR_IO;
 171
 172     /* validate the chunk */
 173     if (LE_32(&preamble[4]) != AUD_CHUNK_SIGNATURE)
 174         return AVERROR_INVALIDDATA;
 175
 176     chunk_size = LE_16(&preamble[0]);
 177     ret= av_get_packet(pb, pkt, chunk_size);
 178     if (ret != chunk_size)
 179         return AVERROR_IO;
 180     pkt->stream_index = wsaud->audio_stream_index;
 181     pkt->pts = wsaud->audio_frame_counter;
 182     pkt->pts /= wsaud->audio_samplerate;
 183
 184     /* 2 samples/byte, 1 or 2 samples per frame depending on stereo */
 185     wsaud->audio_frame_counter += (chunk_size * 2) / wsaud->audio_channels;
 186
 187     return ret;
 188 }
 189
 190 static int wsaud_read_close(AVFormatContext *s)
 191 {
 192 //    WsAudDemuxContext *wsaud = (WsAudDemuxContext *)s->priv_data;
 193
 194     return 0;
 195 }
 196
 197
 198 static int wsvqa_probe(AVProbeData *p)
 199 {
 200     /* need 12 bytes to qualify */
 201     if (p->buf_size < 12)
 202         return 0;
 203
 204     /* check for the VQA signatures */
 205     if ((BE_32(&p->buf[0]) != FORM_TAG) ||
 206         (BE_32(&p->buf[8]) != WVQA_TAG))
 207         return 0;
 208
 209     return AVPROBE_SCORE_MAX;
 210 }
 211
 212 static int wsvqa_read_header(AVFormatContext *s,
 213                              AVFormatParameters *ap)
 214 {
 215     WsVqaDemuxContext *wsvqa = (WsVqaDemuxContext *)s->priv_data;
 216     ByteIOContext *pb = &s->pb;
 217     AVStream *st;
 218     unsigned char *header;
 219     unsigned char scratch[VQA_PREAMBLE_SIZE];
 220     unsigned int chunk_tag;
 221     unsigned int chunk_size;
 222
 223     /* initialize the video decoder stream */
 224     st = av_new_stream(s, 0);
 225     if (!st)
 226         return AVERROR_NOMEM;
 227     av_set_pts_info(st, 33, 1, 90000);
 228     wsvqa->video_stream_index = st->index;
 229     st->codec->codec_type = CODEC_TYPE_VIDEO;
 230     st->codec->codec_id = CODEC_ID_WS_VQA;
 231     st->codec->codec_tag = 0;  /* no fourcc */
 232
 233     /* skip to the start of the VQA header */
 234     url_fseek(pb, 20, SEEK_SET);
 235
 236     /* the VQA header needs to go to the decoder */
 237     st->codec->extradata_size = VQA_HEADER_SIZE;
 238     st->codec->extradata = av_mallocz(VQA_HEADER_SIZE + FF_INPUT_BUFFER_PADDING_SIZE);
 239     header = (unsigned char *)st->codec->extradata;
 240     if (get_buffer(pb, st->codec->extradata, VQA_HEADER_SIZE) !=
 241         VQA_HEADER_SIZE) {
 242         av_free(st->codec->extradata);
 243         return AVERROR_IO;
 244     }
 245     st->codec->width = LE_16(&header[6]);
 246     st->codec->height = LE_16(&header[8]);
 247
 248     st->codec->time_base.num = 1;
 249     st->codec->time_base.den = VQA_FRAMERATE;
 250
 251     /* initialize the audio decoder stream for VQA v1 or nonzero samplerate */
 252     if (LE_16(&header[24]) || (LE_16(&header[0]) == 1)) {
 253         st = av_new_stream(s, 0);
 254         if (!st)
 255             return AVERROR_NOMEM;
 256         av_set_pts_info(st, 33, 1, 90000);
 257         st->codec->codec_type = CODEC_TYPE_AUDIO;
 258         if (LE_16(&header[0]) == 1)
 259             st->codec->codec_id = CODEC_ID_WESTWOOD_SND1;
 260         else
 261             st->codec->codec_id = CODEC_ID_ADPCM_IMA_WS;
 262         st->codec->codec_tag = 0;  /* no tag */
 263         st->codec->sample_rate = LE_16(&header[24]);
 264         if (!st->codec->sample_rate)
 265             st->codec->sample_rate = 22050;
 266         st->codec->channels = header[26];
 267         if (!st->codec->channels)
 268             st->codec->channels = 1;
 269         st->codec->bits_per_sample = 16;
 270         st->codec->bit_rate = st->codec->channels * st->codec->sample_rate *
 271             st->codec->bits_per_sample / 4;
 272         st->codec->block_align = st->codec->channels * st->codec->bits_per_sample;
 273
 274         wsvqa->audio_stream_index = st->index;
 275         wsvqa->audio_samplerate = st->codec->sample_rate;
 276         wsvqa->audio_channels = st->codec->channels;
 277         wsvqa->audio_frame_counter = 0;
 278     }
 279
 280     /* there are 0 or more chunks before the FINF chunk; iterate until
 281      * FINF has been skipped and the file will be ready to be demuxed */
 282     do {
 283         if (get_buffer(pb, scratch, VQA_PREAMBLE_SIZE) != VQA_PREAMBLE_SIZE) {
 284             av_free(st->codec->extradata);
 285             return AVERROR_IO;
 286         }
 287         chunk_tag = BE_32(&scratch[0]);
 288         chunk_size = BE_32(&scratch[4]);
 289
 290         /* catch any unknown header tags, for curiousity */
 291         switch (chunk_tag) {
 292         case CINF_TAG:
 293         case CINH_TAG:
 294         case CIND_TAG:
 295         case PINF_TAG:
 296         case PINH_TAG:
 297         case PIND_TAG:
 298         case FINF_TAG:
 299         case CMDS_TAG:
 300             break;
 301
 302         default:
 303             av_log (s, AV_LOG_ERROR, " note: unknown chunk seen (%c%c%c%c)\n",
 304                 scratch[0], scratch[1],
 305                 scratch[2], scratch[3]);
 306             break;
 307         }
 308
 309         url_fseek(pb, chunk_size, SEEK_CUR);
 310     } while (chunk_tag != FINF_TAG);
 311
 312     wsvqa->video_pts = wsvqa->audio_frame_counter = 0;
 313
 314     return 0;
 315 }
 316
 317 static int wsvqa_read_packet(AVFormatContext *s,
 318                              AVPacket *pkt)
 319 {
 320     WsVqaDemuxContext *wsvqa = (WsVqaDemuxContext *)s->priv_data;
 321     ByteIOContext *pb = &s->pb;
 322     int ret = -1;
 323     unsigned char preamble[VQA_PREAMBLE_SIZE];
 324     unsigned int chunk_type;
 325     unsigned int chunk_size;
 326     int skip_byte;
 327
 328     while (get_buffer(pb, preamble, VQA_PREAMBLE_SIZE) == VQA_PREAMBLE_SIZE) {
 329         chunk_type = BE_32(&preamble[0]);
 330         chunk_size = BE_32(&preamble[4]);
 331         skip_byte = chunk_size & 0x01;
 332
 333         if ((chunk_type == SND1_TAG) || (chunk_type == SND2_TAG) || (chunk_type == VQFR_TAG)) {
 334
 335             if (av_new_packet(pkt, chunk_size))
 336                 return AVERROR_IO;
 337             ret = get_buffer(pb, pkt->data, chunk_size);
 338             if (ret != chunk_size) {
 339                 av_free_packet(pkt);
 340                 return AVERROR_IO;
 341             }
 342
 343             if (chunk_type == SND2_TAG) {
 344                 pkt->stream_index = wsvqa->audio_stream_index;
 345
 346                 pkt->pts = 90000;
 347                 pkt->pts *= wsvqa->audio_frame_counter;
 348                 pkt->pts /= wsvqa->audio_samplerate;
 349
 350                 /* 2 samples/byte, 1 or 2 samples per frame depending on stereo */
 351                 wsvqa->audio_frame_counter += (chunk_size * 2) / wsvqa->audio_channels;
 352             } else if(chunk_type == SND1_TAG) {
 353                 pkt->stream_index = wsvqa->audio_stream_index;
 354
 355                 pkt->pts = 90000;
 356                 pkt->pts *= wsvqa->audio_frame_counter;
 357                 pkt->pts /= wsvqa->audio_samplerate;
 358
 359                 /* unpacked size is stored in header */
 360                 wsvqa->audio_frame_counter += LE_16(pkt->data) / wsvqa->audio_channels;
 361             } else {
 362                 pkt->stream_index = wsvqa->video_stream_index;
 363                 pkt->pts = wsvqa->video_pts;
 364                 wsvqa->video_pts += VQA_VIDEO_PTS_INC;
 365             }
 366             /* stay on 16-bit alignment */
 367             if (skip_byte)
 368                 url_fseek(pb, 1, SEEK_CUR);
 369
 370             return ret;
 371         } else {
 372             switch(chunk_type){
 373             case CMDS_TAG:
 374             case SND0_TAG:
 375                 break;
 376             default:
 377                 av_log(s, AV_LOG_INFO, "Skipping unknown chunk 0x%08X\n", chunk_type);
 378             }
 379             url_fseek(pb, chunk_size + skip_byte, SEEK_CUR);
 380         }
 381     }
 382
 383     return ret;
 384 }
 385
 386 static int wsvqa_read_close(AVFormatContext *s)
 387 {
 388 //    WsVqaDemuxContext *wsvqa = (WsVqaDemuxContext *)s->priv_data;
 389
 390     return 0;
 391 }
 392
 393 #ifdef CONFIG_WSAUD_DEMUXER
 394 AVInputFormat wsaud_demuxer = {
 395     "wsaud",
 396     "Westwood Studios audio format",
 397     sizeof(WsAudDemuxContext),
 398     wsaud_probe,
 399     wsaud_read_header,
 400     wsaud_read_packet,
 401     wsaud_read_close,
 402 };
 403 #endif
 404 #ifdef CONFIG_WSVQA_DEMUXER
 405 AVInputFormat wsvqa_demuxer = {
 406     "wsvqa",
 407     "Westwood Studios VQA format",
 408     sizeof(WsVqaDemuxContext),
 409     wsvqa_probe,
 410     wsvqa_read_header,
 411     wsvqa_read_packet,
 412     wsvqa_read_close,
 413 };
 414 #endif