2 * WAV encoder and decoder
3 * Copyright (c) 2001, 2002 Fabrice Bellard.
5 * This library is free software; you can redistribute it and/or
6 * modify it under the terms of the GNU Lesser General Public
7 * License as published by the Free Software Foundation; either
8 * version 2 of the License, or (at your option) any later version.
10 * This library is distributed in the hope that it will be useful,
11 * but WITHOUT ANY WARRANTY; without even the implied warranty of
12 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
13 * Lesser General Public License for more details.
15 * You should have received a copy of the GNU Lesser General Public
16 * License along with this library; if not, write to the Free Software
17 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
20 #include "allformats.h"
/* Table pairing codec IDs with WAV format tags. It is searched by
 * codec_get_tag() when a header is written and by codec_get_id() when one is
 * read (both calls appear further down in this file).
 * Several codec IDs share one tag: 0x01 for the linear PCM variants and
 * 0x2048 for both Sonic codecs. wav_codec_get_id() tells the PCM variants
 * apart by bits per sample.
 * NOTE(review): the terminating entry and closing brace of the table are not
 * visible in this listing -- confirm against the full file. */
23 const CodecTag codec_wav_tags[] = {
24 { CODEC_ID_MP2, 0x50 },
25 { CODEC_ID_MP3, 0x55 },
26 { CODEC_ID_AC3, 0x2000 },
27 { CODEC_ID_DTS, 0x2001 },
28 { CODEC_ID_PCM_S16LE, 0x01 },
29 { CODEC_ID_PCM_U8, 0x01 }, /* must come after s16le in this list */
30 { CODEC_ID_PCM_S24LE, 0x01 },
31 { CODEC_ID_PCM_S32LE, 0x01 },
32 { CODEC_ID_PCM_ALAW, 0x06 },
33 { CODEC_ID_PCM_MULAW, 0x07 },
34 { CODEC_ID_ADPCM_MS, 0x02 },
35 { CODEC_ID_ADPCM_IMA_WAV, 0x11 },
36 { CODEC_ID_ADPCM_YAMAHA, 0x20 },
37 { CODEC_ID_ADPCM_G726, 0x45 },
38 { CODEC_ID_ADPCM_IMA_DK4, 0x61 }, /* rogue format number */
39 { CODEC_ID_ADPCM_IMA_DK3, 0x62 }, /* rogue format number */
40 { CODEC_ID_WMAV1, 0x160 },
41 { CODEC_ID_WMAV2, 0x161 },
42 { CODEC_ID_AAC, 0x706d },
43 { CODEC_ID_VORBIS, ('V'<<8)+'o' }, //HACK/FIXME, does vorbis in WAV/AVI have an (in)official id?
44 { CODEC_ID_SONIC, 0x2048 },
45 { CODEC_ID_SONIC_LS, 0x2048 },
46 { CODEC_ID_ADPCM_CT, 0x200 },
47 { CODEC_ID_ADPCM_SWF, ('S'<<8)+'F' },
48 { CODEC_ID_TRUESPEECH, 0x22 },
50 // for NuppelVideo (nuv.c)
51 { CODEC_ID_PCM_S16LE, MKTAG('R', 'A', 'W', 'A') },
52 { CODEC_ID_MP3, MKTAG('L', 'A', 'M', 'E') },
57 /* WAVEFORMATEX header */
58 /* returns the size or -1 on error */
/* Writes to pb, in this order: format tag, channel count, sample rate,
 * bytes per second, block align and bits per sample, followed by a
 * codec-specific extra-data section.
 * NOTE(review): this listing omits several lines of the function (the values
 * assigned to bps, the declaration and most updates of hdrsize, and the
 * return statements) -- confirm details against the full file. */
59 int put_wav_header(ByteIOContext *pb, AVCodecContext *enc)
61 int bps, blkalign, bytespersec;
/* Look the tag up in codec_wav_tags when none is set, or when the current
 * one is larger than 0xffff (it is written with put_le16() below). */
64 if(!enc->codec_tag || enc->codec_tag > 0xffff)
65 enc->codec_tag = codec_get_tag(codec_wav_tags, enc->codec_id);
69 put_le16(pb, enc->codec_tag);
70 put_le16(pb, enc->channels);
71 put_le32(pb, enc->sample_rate);
/* Select bits per sample by codec family. The value assigned in each branch
 * is not visible in this listing. */
72 if (enc->codec_id == CODEC_ID_PCM_U8 ||
73 enc->codec_id == CODEC_ID_PCM_ALAW ||
74 enc->codec_id == CODEC_ID_PCM_MULAW) {
76 } else if (enc->codec_id == CODEC_ID_MP2 || enc->codec_id == CODEC_ID_MP3) {
78 } else if (enc->codec_id == CODEC_ID_ADPCM_IMA_WAV || enc->codec_id == CODEC_ID_ADPCM_MS || enc->codec_id == CODEC_ID_ADPCM_G726 || enc->codec_id == CODEC_ID_ADPCM_YAMAHA) { //
80 } else if (enc->codec_id == CODEC_ID_PCM_S24LE) {
82 } else if (enc->codec_id == CODEC_ID_PCM_S32LE) {
/* Block align: MP2/MP3 use frame_size (see the remark on that line); a
 * non-zero enc->block_align is used as-is; the remaining visible assignment
 * computes (channels * bps) >> 3. The G726 branch body is not visible. */
88 if (enc->codec_id == CODEC_ID_MP2 || enc->codec_id == CODEC_ID_MP3) {
89 blkalign = enc->frame_size; //this is wrong, but seems many demuxers don't work if this is set correctly
90 //blkalign = 144 * enc->bit_rate/enc->sample_rate;
91 } else if (enc->codec_id == CODEC_ID_ADPCM_G726) { //
93 } else if (enc->block_align != 0) { /* specified by the codec */
94 blkalign = enc->block_align;
96 blkalign = enc->channels*bps >> 3;
/* Byte rate: sample_rate * blkalign for the linear PCM codecs listed here,
 * bit_rate / 8 in the other visible assignment. */
97 if (enc->codec_id == CODEC_ID_PCM_U8 ||
98 enc->codec_id == CODEC_ID_PCM_S24LE ||
99 enc->codec_id == CODEC_ID_PCM_S32LE ||
100 enc->codec_id == CODEC_ID_PCM_S16LE) {
101 bytespersec = enc->sample_rate * blkalign;
103 bytespersec = enc->bit_rate / 8;
105 put_le32(pb, bytespersec); /* bytes per second */
106 put_le16(pb, blkalign); /* block align */
107 put_le16(pb, bps); /* bits per sample */
/* Codec-specific extra data. Each branch first writes a 16-bit size
 * (12 for MP3, 22 for MP2, 2 for IMA WAV, extradata_size otherwise) and then
 * the payload. */
108 if (enc->codec_id == CODEC_ID_MP3) {
109 put_le16(pb, 12); /* wav_extra_size */
111 put_le16(pb, 1); /* wID */
112 put_le32(pb, 2); /* fdwFlags */
113 put_le16(pb, 1152); /* nBlockSize */
114 put_le16(pb, 1); /* nFramesPerBlock */
115 put_le16(pb, 1393); /* nCodecDelay */
116 } else if (enc->codec_id == CODEC_ID_MP2) {
117 put_le16(pb, 22); /* wav_extra_size */
119 put_le16(pb, 2); /* fwHeadLayer */
120 put_le32(pb, enc->bit_rate); /* dwHeadBitrate */
121 put_le16(pb, enc->channels == 2 ? 1 : 8); /* fwHeadMode */
122 put_le16(pb, 0); /* fwHeadModeExt */
123 put_le16(pb, 1); /* wHeadEmphasis */
124 put_le16(pb, 16); /* fwHeadFlags */
125 put_le32(pb, 0); /* dwPTSLow */
126 put_le32(pb, 0); /* dwPTSHigh */
127 } else if (enc->codec_id == CODEC_ID_ADPCM_IMA_WAV) {
128 put_le16(pb, 2); /* wav_extra_size */
/* Samples per block are derived from block_align and the channel count. */
130 put_le16(pb, ((enc->block_align - 4 * enc->channels) / (4 * enc->channels)) * 8 + 1); /* wSamplesPerBlock */
131 } else if(enc->extradata_size){
/* Generic case: copy the codec's extradata verbatim after its size. */
132 put_le16(pb, enc->extradata_size);
133 put_buffer(pb, enc->extradata, enc->extradata_size);
134 hdrsize += enc->extradata_size;
145 #endif //CONFIG_MUXERS
147 /* We could be given one of three possible structures here:
148 * WAVEFORMAT, PCMWAVEFORMAT or WAVEFORMATEX. Each structure
149 * is an expansion of the previous one with the fields added
150 * at the bottom. PCMWAVEFORMAT adds 'WORD wBitsPerSample' and
151 * WAVEFORMATEX adds 'WORD cbSize' and basically makes itself
152 * an open-ended structure.
/* Reads a `size`-byte wave-format header from pb and fills *codec: codec
 * type and tag, channels, sample rate, bit rate, block align, bits per
 * sample, codec id and, for headers larger than 16 bytes, extradata.
 * NOTE(review): the local declarations and the read that sets `id` are not
 * visible in this listing -- confirm against the full file. */
154 void get_wav_header(ByteIOContext *pb, AVCodecContext *codec, int size)
159 codec->codec_type = CODEC_TYPE_AUDIO;
160 codec->codec_tag = id;
161 codec->channels = get_le16(pb);
162 codec->sample_rate = get_le32(pb);
/* The stored field is multiplied by 8 to obtain bit_rate. */
163 codec->bit_rate = get_le32(pb) * 8;
164 codec->block_align = get_le16(pb);
/* A 14-byte header has no bits-per-sample field, so 8 is assumed. */
165 if (size == 14) { /* We're dealing with plain vanilla WAVEFORMAT */
166 codec->bits_per_sample = 8;
168 codec->bits_per_sample = get_le16(pb);
169 codec->codec_id = wav_codec_get_id(id, codec->bits_per_sample);
171 if (size > 16) { /* We're obviously dealing with WAVEFORMATEX */
172 codec->extradata_size = get_le16(pb);
173 if (codec->extradata_size > 0) {
/* Clamp the declared extradata size to size - 18.
 * NOTE(review): for size == 17 the clamp yields size - 18 == -1, and the
 * av_mallocz() result is handed to get_buffer() with no NULL check visible
 * here -- confirm whether omitted lines guard against either case. */
174 if (codec->extradata_size > size - 18)
175 codec->extradata_size = size - 18;
176 codec->extradata = av_mallocz(codec->extradata_size + FF_INPUT_BUFFER_PADDING_SIZE);
177 get_buffer(pb, codec->extradata, codec->extradata_size);
179 codec->extradata_size = 0;
181 /* It is possible for the chunk to contain garbage at the end */
182 if (size - codec->extradata_size - 18 > 0)
183 url_fskip(pb, size - codec->extradata_size - 18);
/* Maps a WAV format tag to a codec id through codec_wav_tags, then refines
 * a CODEC_ID_PCM_S16LE result by bits per sample: 8 -> PCM_U8,
 * 24 -> PCM_S24LE, 32 -> PCM_S32LE.
 * NOTE(review): the declaration of `id`, any early exit after the lookup and
 * the return statement are not visible in this listing. */
188 int wav_codec_get_id(unsigned int tag, int bps)
191 id = codec_get_id(codec_wav_tags, tag);
194 /* handle specific u8 codec */
195 if (id == CODEC_ID_PCM_S16LE && bps == 8)
196 id = CODEC_ID_PCM_U8;
/* same tag, wider linear PCM sample sizes */
197 if (id == CODEC_ID_PCM_S16LE && bps == 24)
198 id = CODEC_ID_PCM_S24LE;
199 if (id == CODEC_ID_PCM_S16LE && bps == 32)
200 id = CODEC_ID_PCM_S32LE;
/* Muxer header callback. The visible lines write a zero file-length
 * placeholder, emit the "fmt " chunk via put_wav_header() for stream 0,
 * open the "data" chunk and flush.
 * NOTE(review): the leading tag write, the error path of the
 * put_wav_header() check and the closing of the "fmt " tag are not visible
 * in this listing. */
210 static int wav_write_header(AVFormatContext *s)
212 WAVContext *wav = s->priv_data;
213 ByteIOContext *pb = &s->pb;
/* Written as 0 here; wav_write_trailer() later writes a 32-bit size at file
 * offset 4 when the output is not streamed. */
217 put_le32(pb, 0); /* file length */
221 fmt = start_tag(pb, "fmt ");
222 if (put_wav_header(pb, s->streams[0]->codec) < 0) {
/* Presumably sets a 1/sample_rate time base with 64-bit timestamps --
 * TODO confirm against av_set_pts_info()'s parameter order. */
228 av_set_pts_info(s->streams[0], 64, 1, s->streams[0]->codec->sample_rate);
/* Keep the value returned for the "data" tag; wav_write_trailer() passes it
 * to end_tag(). */
231 wav->data = start_tag(pb, "data");
233 put_flush_packet(pb);
/* Muxer packet callback: writes the packet's pkt->size bytes from pkt->data
 * to the output unchanged.
 * NOTE(review): the return statement is not visible in this listing. */
238 static int wav_write_packet(AVFormatContext *s, AVPacket *pkt)
240 ByteIOContext *pb = &s->pb;
241 put_buffer(pb, pkt->data, pkt->size);
/* Muxer trailer callback. When the output is not streamed it closes the
 * "data" tag and writes the final size over the placeholder near the start
 * of the file.
 * NOTE(review): the declaration of file_size and the return statement are
 * not visible in this listing. */
245 static int wav_write_trailer(AVFormatContext *s)
247 ByteIOContext *pb = &s->pb;
248 WAVContext *wav = s->priv_data;
/* Patching needs url_fseek(), so it is skipped for streamed output. */
251 if (!url_is_streamed(&s->pb)) {
252 end_tag(pb, wav->data);
254 /* update file size */
255 file_size = url_ftell(pb);
/* Offset 4 receives file_size - 8, truncated to 32 bits by the cast. */
256 url_fseek(pb, 4, SEEK_SET);
257 put_le32(pb, (uint32_t)(file_size - 8));
/* Return to the end of the file before flushing. */
258 url_fseek(pb, file_size, SEEK_SET);
260 put_flush_packet(pb);
264 #endif //CONFIG_MUXERS
266 /* return the size of the found tag */
/* NOTE(review): only the signature and one statement are visible in this
 * listing. The visible statement skips `size` bytes forward from the current
 * position, presumably to step over chunks whose tag is not tag1 -- confirm
 * against the full file, including what is returned when the tag is absent. */
268 static int find_tag(ByteIOContext *pb, uint32_t tag1)
280 url_fseek(pb, size, SEEK_CUR);
/* Probe callback: reports AVPROBE_SCORE_MAX when the buffer holds "RIFF" at
 * bytes 0-3 and "WAVE" at bytes 8-11.
 * NOTE(review): the results returned for short buffers and for a mismatch
 * are not visible in this listing. */
287 static int wav_probe(AVProbeData *p)
289 /* check file header */
/* Buffers of 32 bytes or fewer take the (omitted) early-exit branch. */
290 if (p->buf_size <= 32)
292 if (p->buf[0] == 'R' && p->buf[1] == 'I' &&
293 p->buf[2] == 'F' && p->buf[3] == 'F' &&
294 p->buf[8] == 'W' && p->buf[9] == 'A' &&
295 p->buf[10] == 'V' && p->buf[11] == 'E')
296 return AVPROBE_SCORE_MAX;
/* Demuxer header callback. It checks the RIFF and WAVE tags, locates the
 * "fmt " chunk, creates one stream and fills its codec parameters via
 * get_wav_header(), then locates the "data" chunk and records where it ends.
 * NOTE(review): the local declarations, the reads that set `tag`, the error
 * returns and the checks on find_tag()'s results are not visible in this
 * listing. */
302 static int wav_read_header(AVFormatContext *s,
303 AVFormatParameters *ap)
307 ByteIOContext *pb = &s->pb;
309 WAVContext *wav = s->priv_data;
311 /* check RIFF header */
314 if (tag != MKTAG('R', 'I', 'F', 'F'))
/* The size field is read and discarded. */
316 get_le32(pb); /* file size */
318 if (tag != MKTAG('W', 'A', 'V', 'E'))
321 /* parse fmt header */
322 size = find_tag(pb, MKTAG('f', 'm', 't', ' '));
325 st = av_new_stream(s, 0);
327 return AVERROR_NOMEM;
329 get_wav_header(pb, st->codec, size);
330 st->need_parsing = 1;
/* Presumably sets a 1/sample_rate time base with 64-bit timestamps --
 * TODO confirm against av_set_pts_info()'s parameter order. */
332 av_set_pts_info(st, 64, 1, st->codec->sample_rate);
334 size = find_tag(pb, MKTAG('d', 'a', 't', 'a'));
/* Position just past the data chunk; wav_read_packet() uses it to compute
 * how many bytes remain. */
337 wav->data_end= url_ftell(pb) + size;
/* NOTE(review): no use of MAX_SIZE is visible in this listing; presumably it
 * is the initial packet size in wav_read_packet() -- confirm. */
341 #define MAX_SIZE 4096
/* Demuxer packet callback: reads the next run of bytes from the current
 * "data" chunk into pkt for stream 0.
 * NOTE(review): the remaining parameters, the local declarations, the initial
 * value of `size`, the conditions around the second find_tag() call and all
 * return statements are not visible in this listing. */
343 static int wav_read_packet(AVFormatContext *s,
348 WAVContext *wav = s->priv_data;
350 if (url_feof(&s->pb))
/* Bytes remaining before the recorded end of the data chunk. */
354 left= wav->data_end - url_ftell(&s->pb);
/* Look for another "data" chunk and record its end; the guarding condition
 * is among the omitted lines. */
356 left = find_tag(&(s->pb), MKTAG('d', 'a', 't', 'a'));
360 wav->data_end= url_ftell(&s->pb) + left;
/* Make the request a whole number of blocks, and at least one block. */
364 if (st->codec->block_align > 1) {
365 if (size < st->codec->block_align)
366 size = st->codec->block_align;
367 size = (size / st->codec->block_align) * st->codec->block_align;
/* Do not request more than what is left of the data chunk. */
369 size= FFMIN(size, left);
370 if (av_new_packet(pkt, size))
372 pkt->stream_index = 0;
374 ret = get_buffer(&s->pb, pkt->data, pkt->size);
377 /* note: we need to modify the packet size here to handle the last
/* NOTE(review): only the signature is visible in this listing; presumably
 * the demuxer's close callback -- confirm its body against the full file. */
383 static int wav_read_close(AVFormatContext *s)
/* Seek callback: dispatches on the stream's codec id. Per the comment inside
 * the switch, some codecs rely on generic index-based seeking; the visible
 * return delegates to pcm_read_seek().
 * NOTE(review): the case labels, the value returned for the generic-seeking
 * codecs and the definition of `st` are not visible in this listing. */
388 static int wav_read_seek(AVFormatContext *s,
389 int stream_index, int64_t timestamp, int flags)
394 switch(st->codec->codec_id) {
399 /* use generic seeking with dynamically generated indexes */
404 return pcm_read_seek(s, stream_index, timestamp, flags);
/* Input-format descriptor passed to av_register_input_format() in
 * ff_wav_init().
 * NOTE(review): its initializer fields are not visible in this listing. */
408 static AVInputFormat wav_demuxer = {
/* Output-format descriptor passed to av_register_output_format() in
 * ff_wav_init().
 * NOTE(review): its initializer fields are not visible in this listing. */
420 static AVOutputFormat wav_muxer = {
432 #endif //CONFIG_MUXERS
/* Registers the WAV demuxer and the WAV muxer. The trailing #endif suggests
 * the muxer registration is conditional on CONFIG_MUXERS.
 * NOTE(review): the matching #ifdef and the return statement are not visible
 * in this listing. */
434 int ff_wav_init(void)
436 av_register_input_format(&wav_demuxer);
438 av_register_output_format(&wav_muxer);
439 #endif //CONFIG_MUXERS