3 * Copyright (c) 2003 Fabrice Bellard
5 * This file is part of FFmpeg.
7 * FFmpeg is free software; you can redistribute it and/or
8 * modify it under the terms of the GNU Lesser General Public
9 * License as published by the Free Software Foundation; either
10 * version 2.1 of the License, or (at your option) any later version.
12 * FFmpeg is distributed in the hope that it will be useful,
13 * but WITHOUT ANY WARRANTY; without even the implied warranty of
14 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
15 * Lesser General Public License for more details.
17 * You should have received a copy of the GNU Lesser General Public
18 * License along with FFmpeg; if not, write to the Free Software
19 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
24 #include "libavutil/avstring.h"
25 #include "libavutil/intreadwrite.h"
/*
 * Check whether buf starts with an ID3v2 header carrying the given magic.
 *
 * Only part of the condition is visible in this excerpt: the first byte
 * must equal magic[0], and bytes 6..8 must have their top bit clear.
 * ff_id3v2_tag_len() masks those same bytes with 0x7f when it assembles
 * the tag length.
 *
 * NOTE(review): the remaining terms of the expression are not shown
 * here; confirm them against the full file before relying on this summary.
 */
27 int ff_id3v2_match(const uint8_t *buf, const char * magic)
29 return buf[0] == magic[0] &&
/* bytes 6..8 must each have bit 7 clear */
34 (buf[6] & 0x80) == 0 &&
35 (buf[7] & 0x80) == 0 &&
36 (buf[8] & 0x80) == 0 &&
/*
 * Compute a tag length from the header bytes in buf.
 *
 * The low 7 bits of buf[6], buf[7] and buf[8] are shifted by 21, 14 and
 * 7 bits respectively and summed, then ID3v2_HEADER_SIZE is added.
 *
 * NOTE(review): the final summand and the return statement are not
 * visible in this excerpt; presumably buf[9] supplies the low 7 bits and
 * len is returned -- confirm.
 */
40 int ff_id3v2_tag_len(const uint8_t * buf)
42 int len = ((buf[6] & 0x7f) << 21) +
43 ((buf[7] & 0x7f) << 14) +
44 ((buf[8] & 0x7f) << 7) +
/* include the header itself in the reported length */
48 len += ID3v2_HEADER_SIZE;
/*
 * Read an ID3v2 header from s->pb and, if it matches magic, parse the tag.
 *
 * ID3v2_HEADER_SIZE bytes are read into a local buffer. When
 * ff_id3v2_match() accepts them, the length is assembled from the low
 * 7 bits of buf[6..8] (plus a final term not visible here) and
 * ff_id3v2_parse() is called with buf[3] as the version and buf[5] as
 * the flags.
 *
 * NOTE(review): the length is built inline with '|' here while
 * ff_id3v2_tag_len() builds the same fields with '+'; the two could
 * share one helper.
 */
52 void ff_id3v2_read(AVFormatContext *s, const char *magic)
55 uint8_t buf[ID3v2_HEADER_SIZE];
57 ret = get_buffer(s->pb, buf, ID3v2_HEADER_SIZE);
/* short read: the action taken is not visible in this excerpt */
58 if (ret != ID3v2_HEADER_SIZE)
60 if (ff_id3v2_match(buf, magic)) {
61 /* parse ID3v2 header */
62 len = ((buf[6] & 0x7f) << 21) |
63 ((buf[7] & 0x7f) << 14) |
64 ((buf[8] & 0x7f) << 7) |
66 ff_id3v2_parse(s, len, buf[3], buf[5]);
/* rewind to offset 0; presumably the no-match path -- the enclosing branch is not visible */
68 url_fseek(s->pb, 0, SEEK_SET);
/*
 * Read an integer from s that is stored 7 bits per byte.
 *
 * Each step shifts the accumulator left by 7 and adds the low 7 bits of
 * the next byte read from s.
 *
 * NOTE(review): the loop header and return are not visible in this
 * excerpt; presumably the step runs len times and v is returned -- confirm.
 */
72 static unsigned int get_size(ByteIOContext *s, int len)
76 v = (v << 7) + (get_byte(s) & 0x7F);
/*
 * Read one text frame of taglen bytes from pb, convert it into the local
 * buffer dst and store it in s->metadata under key.
 *
 * The first byte of the frame selects the text encoding; the visible
 * cases are 0 (ISO-8859-1), 1 (UTF-16 with BOM) and 2 (UTF-16BE without
 * BOM), plus a raw copy path and a fallback that logs a warning.
 *
 * Two keys get special handling afterwards:
 *  - "TCON"/"TCO": if dst parses as "(N)" or "N" and N is at most
 *    ID3v1_GENRE_MAX, the value becomes ff_id3v1_genre_str[N].
 *  - "TXXX"/"TXX": dst holds two 0-terminated strings and the value is
 *    taken from an offset inside dst.
 *
 * NOTE(review): several declarations and branch bodies are not visible
 * in this excerpt (dst, q, tmp, ch, genre, the BOM cases); the notes
 * below are limited to what the visible lines show.
 */
80 static void read_ttag(AVFormatContext *s, ByteIOContext *pb, int taglen, const char *key)
83 const char *val = NULL;
/* dstlen leaves one byte of dst spare, presumably for a terminator */
84 int len, dstlen = sizeof(dst) - 1;
/* 16-bit reader used for UTF-16 data; starts as big-endian and is presumably switched by the BOM handling (not visible) */
86 unsigned int (*get)(ByteIOContext*) = get_be16;
92 taglen--; /* account for encoding type byte */
94 switch (get_byte(pb)) { /* encoding type */
96 case 0: /* ISO-8859-1 (0 - 255 maps directly into unicode) */
/* stop while 7 bytes of headroom remain in dst -- presumably room for one encoded character */
98 while (taglen-- && q - dst < dstlen - 7) {
100 PUT_UTF8(get_byte(pb), tmp, *q++ = tmp;)
105 case 1: /* UTF-16 with BOM */
/* the BOM itself is read as a big-endian 16-bit value */
107 switch (get_be16(pb)) {
113 av_log(s, AV_LOG_ERROR, "Incorrect BOM value in tag %s.\n", key);
118 case 2: /* UTF-16BE without BOM */
120 while (taglen > 1 && q - dst < dstlen - 7) {
/* the reader expression yields 0 instead of reading once taglen is exhausted */
124 GET_UTF16(ch, ((taglen -= 2) >= 0 ? get(pb) : 0), break;)
125 PUT_UTF8(ch, tmp, *q++ = tmp;)
/* raw copy path: at most dstlen bytes are taken as-is */
131 len = FFMIN(taglen, dstlen);
/* NOTE(review): the return value of get_buffer() is ignored here */
132 get_buffer(pb, dst, len);
/* NOTE(review): the message ends in "\n." -- the period after the newline looks misplaced; fixing it changes a runtime string */
136 av_log(s, AV_LOG_WARNING, "Unknown encoding in tag %s\n.", key);
/*
 * Genre frames: accept "(N)" or a bare "N".
 * NOTE(review): only an upper bound on genre is checked on the visible
 * lines; whether a negative value can reach the table index depends on
 * the declaration of genre, which is not shown -- confirm.
 */
139 if (!(strcmp(key, "TCON") && strcmp(key, "TCO"))
140 && (sscanf(dst, "(%d)", &genre) == 1 || sscanf(dst, "%d", &genre) == 1)
141 && genre <= ID3v1_GENRE_MAX)
142 val = ff_id3v1_genre_str[genre];
143 else if (!(strcmp(key, "TXXX") && strcmp(key, "TXX"))) {
144 /* dst now contains two 0-terminated strings */
/* value starts after the first string, clamped so the pointer stays within dst */
148 val = dst + FFMIN(len + 1, dstlen);
154 av_metadata_set2(&s->metadata, key, val, 0);
/*
 * Parse the body of an ID3v2 tag of len bytes from s->pb.
 *
 * version and flags come from the tag header. Bit 0x80 of flags selects
 * tag-wide unsynchronisation; with isv34 set, bit 0x40 means an extended
 * header is present and it is skipped. Frames are then read while at
 * least taghdrlen bytes remain, and text frames are handed to read_ttag().
 * Any remaining bytes are skipped, and for version 4 with flag bit 0x10
 * set a 10-byte footer is skipped as well.
 *
 * If the tag cannot be handled, a message naming the reason is logged
 * and the whole tag is skipped.
 *
 * NOTE(review): many lines of this function are not visible in this
 * excerpt (version dispatch, taghdrlen/isv34 setup, the frame-id tests,
 * cleanup of buffer); the notes below cover the visible lines only.
 */
157 void ff_id3v2_parse(AVFormatContext *s, int len, uint8_t version, uint8_t flags)
159 int isv34, tlen, unsync;
/* scratch buffer for frames that need de-unsynchronisation; grown on demand */
165 unsigned char *buffer = NULL;
171 reason = "compression";
189 unsync = flags & 0x80;
191 if (isv34 && flags & 0x40) /* Extended header present, just skip over it */
192 url_fskip(s->pb, get_size(s->pb, 4));
194 while (len >= taghdrlen) {
/* frame header with a 4-byte id: size is read either as plain big-endian 32-bit or via get_size(), then 16 bits of frame flags */
199 get_buffer(s->pb, tag, 4);
202 tlen = get_be32(s->pb);
204 tlen = get_size(s->pb, 4);
205 tflags = get_be16(s->pb);
/* per-frame unsynchronisation flag */
206 tunsync = tflags & 0x02;
/* frame header with a 3-byte id and a 24-bit size */
208 get_buffer(s->pb, tag, 3);
210 tlen = get_be24(s->pb);
/* NOTE(review): tlen comes straight from the stream; no range check is visible before it is used below -- confirm */
212 len -= taghdrlen + tlen;
/* remember where this frame ends so the position can be restored afterwards */
217 next = url_ftell(s->pb) + tlen;
220 if (unsync || tunsync) {
/* NOTE(review): no check of the av_fast_malloc() result is visible before buffer is written */
222 av_fast_malloc(&buffer, &buffer_size, tlen);
/* copy the frame into buffer; j counts the bytes kept */
223 for (i = 0, j = 0; i < tlen; i++, j++) {
224 buffer[j] = get_byte(s->pb);
225 if (j > 0 && !buffer[j] && buffer[j - 1] == 0xff) {
226 /* Unsynchronised byte, skip it */
/* read the text frame from the j decoded bytes through a local ByteIOContext set up over buffer */
230 init_put_byte(&pb, buffer, j, 0, NULL, NULL, NULL, NULL);
231 read_ttag(s, &pb, j, tag);
/* no unsynchronisation: read the frame directly from the stream */
233 read_ttag(s, s->pb, tlen, tag);
/* NOTE(review): this message has no trailing newline, unlike the other av_log() calls in this file */
238 av_log(s, AV_LOG_WARNING, "invalid frame id, assuming padding");
239 url_fskip(s->pb, tlen);
242 /* Skip to end of tag */
243 url_fseek(s->pb, next, SEEK_SET);
/* skip whatever is left of the tag body */
248 url_fskip(s->pb, len);
250 if (version == 4 && flags & 0x10) /* Footer present, always 10 bytes, skip over it */
251 url_fskip(s->pb, 10);
/* unsupported tag: report why and skip all len bytes */
257 av_log(s, AV_LOG_INFO, "ID3v2.%d tag skipped, cannot handle %s\n", version, reason);
258 url_fskip(s->pb, len);
/*
 * Table pairing ID3v2 text frame identifiers with metadata key names.
 *
 * Both four-character and three-character identifiers appear, and the
 * two forms of a frame map to the same key (e.g. "TENC" and "TEN" both
 * give "encoded_by").
 *
 * NOTE(review): only some entries are visible in this excerpt and the
 * end of the initializer is not shown.
 */
262 const AVMetadataConv ff_id3v2_metadata_conv[] = {
265 { "TCOM", "composer"},
268 { "TCOP", "copyright"},
271 { "TENC", "encoded_by"},
272 { "TEN", "encoded_by"},
275 { "TLAN", "language"},
278 { "TPE2", "album_artist"},
279 { "TP2", "album_artist"},
280 { "TPE3", "performer"},
281 { "TP3", "performer"},
283 { "TPUB", "publisher"},
286 { "TSOA", "album-sort"},
287 { "TSOP", "artist-sort"},
288 { "TSOT", "title-sort"},
289 { "TSSE", "encoder"},
293 const char ff_id3v2_tags[][4] = {
294 "TALB", "TBPM", "TCOM", "TCON", "TCOP", "TDEN", "TDLY", "TDOR", "TDRC",
295 "TDRL", "TDTG", "TENC", "TEXT", "TFLT", "TIPL", "TIT1", "TIT2", "TIT3",
296 "TKEY", "TLAN", "TLEN", "TMCL", "TMED", "TMOO", "TOAL", "TOFN", "TOLY",
297 "TOPE", "TOWN", "TPE1", "TPE2", "TPE3", "TPE4", "TPOS", "TPRO", "TPUB",
298 "TRCK", "TRSN", "TRSO", "TSOA", "TSOP", "TSOT", "TSRC", "TSSE", "TSST",