2 * MP3 muxer and demuxer
3 * Copyright (c) 2003 Fabrice Bellard
5 * This file is part of FFmpeg.
7 * FFmpeg is free software; you can redistribute it and/or
8 * modify it under the terms of the GNU Lesser General Public
9 * License as published by the Free Software Foundation; either
10 * version 2.1 of the License, or (at your option) any later version.
12 * FFmpeg is distributed in the hope that it will be useful,
13 * but WITHOUT ANY WARRANTY; without even the implied warranty of
14 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
15 * Lesser General Public License for more details.
17 * You should have received a copy of the GNU Lesser General Public
18 * License along with FFmpeg; if not, write to the Free Software
19 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
23 #include "libavutil/avstring.h"
24 #include "libavcodec/mpegaudio.h"
25 #include "libavcodec/mpegaudiodecheader.h"
/* Size in bytes of an ID3v1 tag; the tag buffers in this file are declared with this length. */
29 #define ID3v1_TAG_SIZE 128
/* Highest genre index present in id3v1_genre_str (the table has ID3v1_GENRE_MAX + 1 slots). */
31 #define ID3v1_GENRE_MAX 125
/*
 * Genre names indexed by numeric genre code.
 * Used in both directions: the tag readers turn a numeric genre into its
 * name, and id3v1_create_tag() searches the table case-insensitively for a
 * name to find its index.
 */
33 static const char * const id3v1_genre_str[ID3v1_GENRE_MAX + 1] = {
67 [33] = "Instrumental",
80 [46] = "Instrumental Pop",
81 [47] = "Instrumental Rock",
85 [51] = "Techno-Industrial",
90 [56] = "Southern Rock",
95 [61] = "Christian Rap",
98 [64] = "Native American",
/* NOTE(review): spelled differently from entry 93 ("Psychedelic Rock"). The
 * string is emitted as metadata and matched when muxing, so confirm against
 * the ID3v1 genre list before touching it. */
101 [67] = "Psychadelic",
112 [78] = "Rock & Roll",
116 [82] = "National Folk",
118 [84] = "Fast Fusion",
125 [91] = "Gothic Rock",
126 [92] = "Progressive Rock",
127 [93] = "Psychedelic Rock",
128 [94] = "Symphonic Rock",
132 [98] = "Easy Listening",
138 [104] = "Chamber Music",
141 [107] = "Booty Bass",
143 [109] = "Porn Groove",
151 [117] = "Power Ballad",
152 [118] = "Rhythmic Soul",
158 [124] = "Euro-House",
159 [125] = "Dance Hall",
/*
 * Read a size field from the stream, 7 bits per byte.
 * Each byte contributes only its low 7 bits; bytes read earlier end up in
 * the more significant positions.
 * NOTE(review): the loop over 'len' bytes and the return statement are not
 * visible in this excerpt; callers in this file pass len = 4 or len = 3.
 */
162 static unsigned int id3v2_get_size(ByteIOContext *s, int len)
/* shift the value accumulated so far up by 7 bits and append the next byte's low 7 bits */
166 v= (v<<7) + (get_byte(s)&0x7F);
/*
 * Read one ID3v2 text frame payload from s->pb and store it in s->metadata
 * under 'key'.
 *
 * s      - format context; data is read from s->pb
 * taglen - payload length in bytes, including the leading encoding byte
 * key    - metadata key to store the decoded text under
 *
 * The text is assembled in the local buffer 'dst'; input that does not fit
 * is not stored.
 */
170 static void id3v2_read_ttag(AVFormatContext *s, int taglen, const char *key)
/* dstlen is the usable size of dst, leaving one byte spare */
173 int len, dstlen = sizeof(dst) - 1;
180 taglen--; /* account for encoding type byte */
182 switch(get_byte(s->pb)) { /* encoding type */
184 case 0: /* ISO-8859-1 (0 - 255 maps directly into unicode) */
/* convert each input byte to UTF-8; output bytes are written only while room remains in dst */
188 PUT_UTF8(get_byte(s->pb), tmp, if (q - dst < dstlen - 1) *q++ = tmp;)
/* raw copy path: the bytes are taken as-is, clamped to the buffer size
 * (which encoding case this belongs to is not visible in this excerpt) */
194 len = FFMIN(taglen, dstlen-1);
195 get_buffer(s->pb, dst, len);
/* A genre given as a number, either "(N)" or "N", is replaced by its name
 * from id3v1_genre_str when N does not exceed ID3v1_GENRE_MAX.
 * NOTE(review): only the upper bound is checked here; the declaration of
 * 'genre' is not visible - confirm it cannot be negative when used as index. */
200 if (!strcmp(key, "genre")
201 && (sscanf(dst, "(%d)", &genre) == 1 || sscanf(dst, "%d", &genre) == 1)
202 && genre <= ID3v1_GENRE_MAX)
203 av_strlcpy(dst, id3v1_genre_str[genre], sizeof(dst));
206 av_metadata_set(&s->metadata, key, dst);
212 * Handles ID3v2.2, 2.3 and 2.4.
/*
 * Walk the frames of an ID3v2 tag and store the recognised text frames
 * (title, author, album, genre, copyright, track) in s->metadata.
 *
 * s       - format context; the stream s->pb is read from the current position
 * len     - number of tag bytes left to consume
 * version - ID3v2 version number, as used in the log message and footer check
 * flags   - tag header flags; bit 0x40 = extended header, bit 0x10 = footer
 *
 * When the tag uses a feature this parser cannot handle, the reason is
 * logged and the remaining 'len' bytes are skipped.
 */
216 static void id3v2_parse(AVFormatContext *s, int len, uint8_t version, uint8_t flags)
/* 'reason' is the text inserted into the "tag skipped" log message below */
227 reason = "compression";
246 reason = "unsynchronization";
250 if(isv34 && flags & 0x40) /* Extended header present, just skip over it */
251 url_fskip(s->pb, id3v2_get_size(s->pb, 4));
/* process frames for as long as a complete frame header still fits in the remaining bytes */
253 while(len >= taghdrlen) {
/* frame header form with a 4-byte id, 4-byte size and 2 flag bytes */
255 tag = get_be32(s->pb);
256 tlen = id3v2_get_size(s->pb, 4);
257 get_be16(s->pb); /* flags */
/* frame header form with a 3-byte id and 3-byte size (ids of this form are matched with a leading 0 below) */
259 tag = get_be24(s->pb);
260 tlen = id3v2_get_size(s->pb, 3);
/* account for both the frame header and its payload */
262 len -= taghdrlen + tlen;
/* absolute stream position of the end of this frame; sought to after the frame is handled */
267 next = url_ftell(s->pb) + tlen;
270 case MKBETAG('T', 'I', 'T', '2'):
271 case MKBETAG(0, 'T', 'T', '2'):
272 id3v2_read_ttag(s, tlen, "title");
274 case MKBETAG('T', 'P', 'E', '1'):
275 case MKBETAG(0, 'T', 'P', '1'):
276 id3v2_read_ttag(s, tlen, "author");
278 case MKBETAG('T', 'A', 'L', 'B'):
279 case MKBETAG(0, 'T', 'A', 'L'):
280 id3v2_read_ttag(s, tlen, "album");
282 case MKBETAG('T', 'C', 'O', 'N'):
283 case MKBETAG(0, 'T', 'C', 'O'):
284 id3v2_read_ttag(s, tlen, "genre");
286 case MKBETAG('T', 'C', 'O', 'P'):
287 case MKBETAG(0, 'T', 'C', 'R'):
288 id3v2_read_ttag(s, tlen, "copyright");
290 case MKBETAG('T', 'R', 'C', 'K'):
291 case MKBETAG(0, 'T', 'R', 'K'):
292 id3v2_read_ttag(s, tlen, "track");
295 /* padding, skip to end */
296 url_fskip(s->pb, len);
300 /* Skip to end of tag */
301 url_fseek(s->pb, next, SEEK_SET);
304 if(version == 4 && flags & 0x10) /* Footer present, always 10 bytes, skip over it */
305 url_fskip(s->pb, 10);
/* unsupported tag: report why and skip the rest of it */
309 av_log(s, AV_LOG_INFO, "ID3v2.%d tag skipped, cannot handle %s\n", version, reason);
310 url_fskip(s->pb, len);
/*
 * Copy one fixed-width ID3v1 text field into a local string and store it in
 * s->metadata under 'key'.
 *
 * s        - format context receiving the metadata
 * key      - metadata key
 * buf      - start of the field inside the tag
 * buf_size - width of the field in bytes
 *
 * NOTE(review): the per-character handling inside the loop is not visible
 * in this excerpt.
 */
313 static void id3v1_get_string(AVFormatContext *s, const char *key,
314 const uint8_t *buf, int buf_size)
/* scan at most buf_size input bytes */
320 for(i = 0; i < buf_size; i++) {
/* output limit check that keeps one byte of 'str' spare */
324 if ((q - str) >= sizeof(str) - 1)
331 av_metadata_set(&s->metadata, key, str);
/*
 * Decode an ID3v1 tag held in 'buf' into s->metadata.
 * 'buf' must be ID3v1_TAG_SIZE bytes long.
 */
335 static int id3v1_parse_tag(AVFormatContext *s, const uint8_t *buf)
/* signature check on the first bytes of the tag (only the first comparison is visible here) */
340 if (!(buf[0] == 'T' &&
/* fixed-width text fields, given as offset and width within the tag */
344 id3v1_get_string(s, "title", buf + 3, 30);
345 id3v1_get_string(s, "author", buf + 33, 30);
346 id3v1_get_string(s, "album", buf + 63, 30);
347 id3v1_get_string(s, "year", buf + 93, 4);
348 id3v1_get_string(s, "comment", buf + 97, 30);
/* a zero at offset 125 followed by a non-zero byte means byte 126 holds the track number */
349 if (buf[125] == 0 && buf[126] != 0) {
350 snprintf(str, sizeof(str), "%d", buf[126]);
351 av_metadata_set(&s->metadata, "track", str);
/* store the genre name only when the numeric genre is within the table */
354 if (genre <= ID3v1_GENRE_MAX)
355 av_metadata_set(&s->metadata, "genre", id3v1_genre_str[genre]);
/*
 * Score how likely the probe buffer is to contain MPEG audio.
 * From each candidate start position it counts how many frame headers
 * follow one another, then turns the counts into a probe score.
 */
361 static int mp3_read_probe(AVProbeData *p)
/* max_frames: best run found anywhere; first_frames: a run recorded separately
 * (the condition under which it is recorded is not visible in this excerpt) */
363 int max_frames, first_frames = 0;
364 int fsize, frames, sample_rate;
366 uint8_t *buf, *buf0, *buf2, *end;
367 AVCodecContext avctx;
/* step over a leading ID3v2 tag so that scanning starts after it */
370 if(ff_id3v2_match(buf0)) {
371 buf0 += ff_id3v2_tag_len(buf0);
/* stop early enough that a 32-bit header can still be read at the last position */
376 end = p->buf + p->buf_size - sizeof(uint32_t);
378 for(; buf < end; buf= buf2+1) {
/* count frame headers starting from this position */
381 for(frames = 0; buf2 < end; frames++) {
382 header = AV_RB32(buf2);
/* the same variable is passed for every output argument; only fsize is kept */
383 fsize = ff_mpa_decode_header(&avctx, header, &sample_rate, &sample_rate, &sample_rate, &sample_rate);
388 max_frames = FFMAX(max_frames, frames);
390 first_frames= frames;
/* Scoring, best first: at least 3 frames in first_frames; more than 500 in
 * the best run; at least 3 in the best run; an ID3v2 tag was skipped
 * (buf0 moved); at least one frame found. */
392 if (first_frames>=3) return AVPROBE_SCORE_MAX/2+1;
393 else if(max_frames>500)return AVPROBE_SCORE_MAX/2;
394 else if(max_frames>=3) return AVPROBE_SCORE_MAX/4;
395 else if(buf0!=p->buf) return AVPROBE_SCORE_MAX/4-1;
396 else if(max_frames>=1) return 1;
401 * Try to find Xing/Info/VBRI tags and compute duration from info therein
/*
 * Look for a Xing/Info or VBRI tag in the frame at 'base' and, using the
 * frame count it carries, set st->duration.
 *
 * s    - format context; s->pb is read and repositioned
 * st   - stream whose duration is set
 * base - stream offset of the frame header to inspect
 *
 * NOTE(review): the return statements are not visible in this excerpt; the
 * caller treats a negative return as "no tag parsed".
 */
403 static int mp3_parse_vbr_tags(AVFormatContext *s, AVStream *st, int64_t base)
406 int frames = -1; /* Total number of frames in file */
/* offsets used to seek to the Xing/Info tag, indexed [c.lsf == 1][c.nb_channels == 1] */
407 const int64_t xing_offtbl[2][2] = {{32, 17}, {17,9}};
/* validate the 32-bit header word first */
412 if(ff_mpa_check_header(v) < 0)
/* on a successful decode, the size of this frame is remembered so it can be skipped later */
415 if (ff_mpegaudio_decode_header(&c, v) == 0)
416 vbrtag_size = c.frame_size;
420 /* Check for Xing / Info tag */
421 url_fseek(s->pb, xing_offtbl[c.lsf == 1][c.nb_channels == 1], SEEK_CUR);
423 if(v == MKBETAG('X', 'i', 'n', 'g') || v == MKBETAG('I', 'n', 'f', 'o')) {
426 frames = get_be32(s->pb);
429 /* Check for VBRI tag (always 32 bytes after end of mpegaudio header) */
430 url_fseek(s->pb, base + 4 + 32, SEEK_SET);
432 if(v == MKBETAG('V', 'B', 'R', 'I')) {
433 /* Check tag version */
434 if(get_be16(s->pb) == 1) {
435 /* skip delay, quality and total bytes */
436 url_fseek(s->pb, 8, SEEK_CUR);
437 frames = get_be32(s->pb);
444 /* Skip the vbr tag frame */
445 url_fseek(s->pb, base + vbrtag_size, SEEK_SET);
447 spf = c.lsf ? 576 : 1152; /* Samples per frame, layer 3 */
/* duration = frames * spf / sample_rate, rescaled (the target time base argument is on an elided line) */
448 st->duration = av_rescale_q(frames, (AVRational){spf, c.sample_rate},
/*
 * Demuxer header callback: create the single audio stream, collect ID3v1
 * and ID3v2 metadata when present, and position the stream for packet
 * reading (after any ID3v2 tag and VBR tag frame).
 */
453 static int mp3_read_header(AVFormatContext *s,
454 AVFormatParameters *ap)
/* scratch buffer, used for the ID3v1 tag and then for the ID3v2 header */
457 uint8_t buf[ID3v1_TAG_SIZE];
458 int len, ret, filesize;
461 st = av_new_stream(s, 0);
/* stream allocation failure path (the check itself is on an elided line) */
463 return AVERROR(ENOMEM);
465 st->codec->codec_type = CODEC_TYPE_AUDIO;
466 st->codec->codec_id = CODEC_ID_MP3;
467 st->need_parsing = AVSTREAM_PARSE_FULL;
470 /* try to get the TAG */
/* the ID3v1 tag sits at the end of the file, so this needs a seekable input */
471 if (!url_is_streamed(s->pb)) {
472 /* XXX: change that */
473 filesize = url_fsize(s->pb);
/* NOTE(review): the literal 128 here has the same value as ID3v1_TAG_SIZE */
474 if (filesize > 128) {
475 url_fseek(s->pb, filesize - 128, SEEK_SET);
476 ret = get_buffer(s->pb, buf, ID3v1_TAG_SIZE);
/* parse only when the whole tag could be read */
477 if (ret == ID3v1_TAG_SIZE) {
478 id3v1_parse_tag(s, buf);
/* return to the start of the file for the ID3v2 check */
480 url_fseek(s->pb, 0, SEEK_SET);
484 /* if ID3v2 header found, skip it */
485 ret = get_buffer(s->pb, buf, ID3v2_HEADER_SIZE);
486 if (ret != ID3v2_HEADER_SIZE)
488 if (ff_id3v2_match(buf)) {
489 /* parse ID3v2 header */
/* tag length is assembled from 7 bits of each header byte, most significant first */
490 len = ((buf[6] & 0x7f) << 21) |
491 ((buf[7] & 0x7f) << 14) |
492 ((buf[8] & 0x7f) << 7) |
/* buf[3] is passed as the version and buf[5] as the flags */
494 id3v2_parse(s, len, buf[3], buf[5]);
/* rewind to the start (presumably the no-ID3v2 branch; the 'else' is not visible here) */
496 url_fseek(s->pb, 0, SEEK_SET);
/* remember the position; if no VBR tag was parsed, go back to it */
499 off = url_ftell(s->pb);
500 if (mp3_parse_vbr_tags(s, st, off) < 0)
501 url_fseek(s->pb, off, SEEK_SET);
503 /* the parameters will be extracted from the compressed bitstream */
/* Number of bytes requested from the input for each packet. */
507 #define MP3_PACKET_SIZE 1024
/*
 * Demuxer packet callback: read the next MP3_PACKET_SIZE-byte chunk of the
 * input into 'pkt' and assign it to stream 0.
 * NOTE(review): the handling of 'ret' is not visible in this excerpt.
 */
509 static int mp3_read_packet(AVFormatContext *s, AVPacket *pkt)
512 // AVStream *st = s->streams[0];
514 size= MP3_PACKET_SIZE;
516 ret= av_get_packet(s->pb, pkt, size);
518 pkt->stream_index = 0;
522 /* note: we need to modify the packet size here to handle the last
528 #if CONFIG_MP2_MUXER || CONFIG_MP3_MUXER
/*
 * Copy the metadata value stored under 'key' into a fixed-width ID3v1 field.
 *
 * s        - format context holding the metadata
 * key      - metadata key to look up
 * buf      - destination field inside the tag buffer
 * buf_size - width of the field in bytes
 *
 * The return value is summed by id3v1_create_tag(); the return statements
 * themselves are not visible in this excerpt.
 */
529 static int id3v1_set_string(AVFormatContext *s, const char *key,
530 uint8_t *buf, int buf_size)
533 if ((tag = av_metadata_get(s->metadata, key, NULL, 0)))
/* strncpy fills at most buf_size bytes and adds no terminator when the value is that long or longer */
534 strncpy(buf, tag->value, buf_size);
/*
 * Build an ID3v1 tag in 'buf' (ID3v1_TAG_SIZE bytes) from s->metadata.
 * 'count' accumulates the results of the per-field helpers; the caller
 * writes the tag only when this function returns a value greater than 0.
 * NOTE(review): the return statement is not visible in this excerpt.
 */
538 static int id3v1_create_tag(AVFormatContext *s, uint8_t *buf)
543 memset(buf, 0, ID3v1_TAG_SIZE); /* fail safe */
/* fixed-width text fields, given as offset and width within the tag */
547 count += id3v1_set_string(s, "title", buf + 3, 30);
548 count += id3v1_set_string(s, "author", buf + 33, 30);
549 count += id3v1_set_string(s, "album", buf + 63, 30);
550 count += id3v1_set_string(s, "year", buf + 93, 4);
551 count += id3v1_set_string(s, "comment", buf + 97, 30);
552 if ((tag = av_metadata_get(s->metadata, "track", NULL, 0))) {
/* the track number goes into byte 126; atoi() does no error checking and the value is narrowed to one byte */
554 buf[126] = atoi(tag->value);
557 if ((tag = av_metadata_get(s->metadata, "genre", NULL, 0))) {
/* case-insensitive search of the genre table for the metadata value */
558 for(i = 0; i <= ID3v1_GENRE_MAX; i++) {
559 if (!strcasecmp(tag->value, id3v1_genre_str[i])) {
/*
 * Write 'size' to s->pb as four bytes carrying 7 bits each, most
 * significant group first. Only the low 28 bits of 'size' are emitted.
 */
571 static void id3v2_put_size(AVFormatContext *s, int size)
573 put_byte(s->pb, size >> 21 & 0x7f);
574 put_byte(s->pb, size >> 14 & 0x7f);
575 put_byte(s->pb, size >> 7 & 0x7f);
576 put_byte(s->pb, size & 0x7f);
/*
 * Write one ID3v2 text frame to s->pb.
 *
 * s      - format context; output goes to s->pb
 * string - NUL-terminated text to store (the terminator is not written)
 * tag    - four-character frame id, packed big-endian
 */
579 static void id3v2_put_ttag(AVFormatContext *s, const char *string, uint32_t tag)
581 int len = strlen(string);
582 put_be32(s->pb, tag);
/* frame size = text length plus one byte for the encoding marker */
583 id3v2_put_size(s, len + 1);
585 put_byte(s->pb, 3); /* UTF-8 */
586 put_buffer(s->pb, string, len);
591 * Write an ID3v2.4 header at beginning of stream
/*
 * Muxer header callback: emit an ID3v2.4 tag built from the metadata
 * entries title, author, album, genre, copyright, track and year.
 * The total tag length is computed first, then the tag header and one text
 * frame per entry that is present are written.
 */
594 static int mp3_write_header(struct AVFormatContext *s)
596 AVMetadataTag *title, *author, *album, *genre, *copyright, *track, *year;
599 title = av_metadata_get(s->metadata, "title", NULL, 0);
600 author = av_metadata_get(s->metadata, "author", NULL, 0);
601 album = av_metadata_get(s->metadata, "album", NULL, 0);
602 genre = av_metadata_get(s->metadata, "genre", NULL, 0);
603 copyright = av_metadata_get(s->metadata, "copyright", NULL, 0);
604 track = av_metadata_get(s->metadata, "track", NULL, 0);
605 year = av_metadata_get(s->metadata, "year", NULL, 0);
/* each frame is counted as 11 bytes of overhead plus the length of its text */
607 if(title) totlen += 11 + strlen(title->value);
608 if(author) totlen += 11 + strlen(author->value);
609 if(album) totlen += 11 + strlen(album->value);
610 if(genre) totlen += 11 + strlen(genre->value);
611 if(copyright) totlen += 11 + strlen(copyright->value);
612 if(track) totlen += 11 + strlen(track->value);
613 if(year) totlen += 11 + strlen(year->value);
/* the library identification frame is left out when bit-exact output is requested on stream 0 */
614 if(!(s->streams[0]->codec->flags & CODEC_FLAG_BITEXACT))
615 totlen += strlen(LIBAVFORMAT_IDENT) + 11;
620 put_be32(s->pb, MKBETAG('I', 'D', '3', 0x04)); /* ID3v2.4 */
622 put_byte(s->pb, 0); /* flags */
624 id3v2_put_size(s, totlen);
/* frames are written in the same order as they were counted above */
626 if(title) id3v2_put_ttag(s, title->value, MKBETAG('T', 'I', 'T', '2'));
627 if(author) id3v2_put_ttag(s, author->value, MKBETAG('T', 'P', 'E', '1'));
628 if(album) id3v2_put_ttag(s, album->value, MKBETAG('T', 'A', 'L', 'B'));
629 if(genre) id3v2_put_ttag(s, genre->value, MKBETAG('T', 'C', 'O', 'N'));
630 if(copyright) id3v2_put_ttag(s, copyright->value, MKBETAG('T', 'C', 'O', 'P'));
631 if(track) id3v2_put_ttag(s, track->value, MKBETAG('T', 'R', 'C', 'K'));
/* NOTE(review): TYER is written into a tag declared as v2.4 - confirm this frame id is valid for that version */
632 if(year) id3v2_put_ttag(s, year->value, MKBETAG('T', 'Y', 'E', 'R'));
633 if(!(s->streams[0]->codec->flags & CODEC_FLAG_BITEXACT))
634 id3v2_put_ttag(s, LIBAVFORMAT_IDENT, MKBETAG('T', 'E', 'N', 'C'));
/*
 * Muxer packet callback: write the packet payload to s->pb unchanged and
 * flush the output after every packet.
 */
638 static int mp3_write_packet(struct AVFormatContext *s, AVPacket *pkt)
640 put_buffer(s->pb, pkt->data, pkt->size);
641 put_flush_packet(s->pb);
/*
 * Muxer trailer callback: append an ID3v1 tag to the output when
 * id3v1_create_tag() reports a positive result.
 */
645 static int mp3_write_trailer(struct AVFormatContext *s)
647 uint8_t buf[ID3v1_TAG_SIZE];
649 /* write the id3v1 tag */
650 if (id3v1_create_tag(s, buf) > 0) {
651 put_buffer(s->pb, buf, ID3v1_TAG_SIZE);
652 put_flush_packet(s->pb);
656 #endif /* CONFIG_MP2_MUXER || CONFIG_MP3_MUXER */
658 #if CONFIG_MP3_DEMUXER
/* Input format descriptor for the MP3 demuxer; only part of the initializer is visible in this excerpt. */
659 AVInputFormat mp3_demuxer = {
/* descriptive name, wrapped in NULL_IF_CONFIG_SMALL */
661 NULL_IF_CONFIG_SMALL("MPEG audio layer 2/3"),
666 .flags= AVFMT_GENERIC_INDEX,
667 .extensions = "mp2,mp3,m2a", /* XXX: use probe */
/* Output format descriptor for the MP2 muxer; only part of the initializer is visible in this excerpt. */
671 AVOutputFormat mp2_muxer = {
/* descriptive name, wrapped in NULL_IF_CONFIG_SMALL */
673 NULL_IF_CONFIG_SMALL("MPEG audio layer 2"),
685 AVOutputFormat mp3_muxer = {
687 NULL_IF_CONFIG_SMALL("MPEG audio layer 3"),