3 * Copyright (c) 2003 Fabrice Bellard
5 * This file is part of FFmpeg.
7 * FFmpeg is free software; you can redistribute it and/or
8 * modify it under the terms of the GNU Lesser General Public
9 * License as published by the Free Software Foundation; either
10 * version 2.1 of the License, or (at your option) any later version.
12 * FFmpeg is distributed in the hope that it will be useful,
13 * but WITHOUT ANY WARRANTY; without even the implied warranty of
14 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
15 * Lesser General Public License for more details.
17 * You should have received a copy of the GNU Lesser General Public
18 * License along with FFmpeg; if not, write to the Free Software
19 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
24 #include "libavutil/avstring.h"
/*
 * Test whether buf starts with what looks like an ID3v2 tag header.
 *
 * Conditions visible in this listing: buf[0] must be 'I', and bit 7 of
 * buf[6], buf[7] and buf[8] must be clear. The && chain has further terms
 * that are not shown here.
 *
 * NOTE(review): buf is indexed at least up to buf[8]; presumably callers
 * must supply ID3v2_HEADER_SIZE readable bytes -- confirm.
 *
 * buf: candidate header bytes.
 * Returns nonzero when every condition of the chain holds, 0 otherwise.
 */
26 int ff_id3v2_match(const uint8_t *buf)
28 return buf[0] == 'I' &&
/* These bytes are masked with 0x7f when the tag length is decoded
 * (see ff_id3v2_tag_len), so a set top bit disqualifies the header. */
33 (buf[6] & 0x80) == 0 &&
34 (buf[7] & 0x80) == 0 &&
35 (buf[8] & 0x80) == 0 &&
/*
 * Compute a tag length from the bytes of an ID3v2 header.
 *
 * The low 7 bits of buf[6], buf[7] and buf[8] are shifted left by 21, 14
 * and 7 bits respectively and summed; the sum continues past the lines
 * shown in this listing.
 *
 * NOTE(review): the statement `len += ID3v2_HEADER_SIZE` enlarges the
 * result by one header size; whether it is guarded by a condition is not
 * visible here -- confirm.
 *
 * buf: header bytes; indexed at least up to buf[8].
 */
39 int ff_id3v2_tag_len(const uint8_t * buf)
/* each size byte carries 7 payload bits, most significant group first */
41 int len = ((buf[6] & 0x7f) << 21) +
42 ((buf[7] & 0x7f) << 14) +
43 ((buf[8] & 0x7f) << 7) +
47 len += ID3v2_HEADER_SIZE;
/*
 * Read ID3v2_HEADER_SIZE bytes from s->pb and, when ff_id3v2_match()
 * accepts them, decode the tag length and hand the tag to
 * ff_id3v2_parse().
 *
 * s: format context whose s->pb stream is read.
 */
51 void ff_id3v2_read(AVFormatContext *s)
54 uint8_t buf[ID3v2_HEADER_SIZE];
56 ret = get_buffer(s->pb, buf, ID3v2_HEADER_SIZE);
/* short read: fewer bytes than a full header were obtained
 * (the action taken is not shown in this listing) */
57 if (ret != ID3v2_HEADER_SIZE)
59 if (ff_id3v2_match(buf)) {
60 /* parse ID3v2 header */
/* 7 payload bits per size byte, most significant group first.
 * NOTE(review): this repeats the decoding done in ff_id3v2_tag_len,
 * using | instead of +. */
61 len = ((buf[6] & 0x7f) << 21) |
62 ((buf[7] & 0x7f) << 14) |
63 ((buf[8] & 0x7f) << 7) |
/* buf[3] and buf[5] are passed as the version and flags arguments */
65 ff_id3v2_parse(s, len, buf[3], buf[5]);
/* Seek back to offset 0 of the stream.
 * NOTE(review): presumably this is the no-match path, undoing the
 * header read -- the surrounding branch is not visible; confirm. */
67 url_fseek(s->pb, 0, SEEK_SET);
/*
 * Read an integer from s in which every byte contributes its low 7 bits.
 *
 * Each step shifts the accumulator v left by 7 bits and adds
 * (get_byte(s) & 0x7F).
 *
 * NOTE(review): the loop header, the declaration of v and the return
 * statement are not shown in this listing; presumably len is the number
 * of bytes consumed and v is returned -- confirm.
 */
71 static unsigned int get_size(ByteIOContext *s, int len)
75 v = (v << 7) + (get_byte(s) & 0x7F);
/*
 * Read one text frame from s->pb, convert its payload to a string in the
 * local buffer dst and store it in s->metadata.
 *
 * The first payload byte selects the text encoding:
 *   0  ISO-8859-1, each byte re-encoded through PUT_UTF8
 *   1  UTF-16 preceded by a byte order mark
 *   2  UTF-16BE without a byte order mark
 * A further path copies the payload into dst unchanged (presumably the
 * UTF-8 case; its case label is not shown in this listing). Any other
 * value is reported with a warning.
 *
 * s:      format context; input is read from s->pb.
 * taglen: payload size in bytes, including the encoding byte.
 * key:    frame identifier. "TCON"/"TCO" and "TXXX"/"TXX" get special
 *         treatment, see below.
 */
79 static void read_ttag(AVFormatContext *s, int taglen, const char *key)
82 const char *val = NULL;
/* dstlen keeps one byte of dst in reserve (presumably for the
 * terminator -- confirm) */
83 int len, dstlen = sizeof(dst) - 1;
/* reader for 16-bit code units; big-endian unless changed later */
85 unsigned int (*get)(ByteIOContext*) = get_be16;
91 taglen--; /* account for encoding type byte */
93 switch (get_byte(s->pb)) { /* encoding type */
95 case 0: /* ISO-8859-1 (0 - 255 maps directly into unicode) */
/* stop 7 bytes short of dstlen: presumably headroom for the multi-byte
 * sequence PUT_UTF8 may emit for one character -- confirm */
97 while (taglen-- && q - dst < dstlen - 7) {
99 PUT_UTF8(get_byte(s->pb), tmp, *q++ = tmp;)
104 case 1: /* UTF-16 with BOM */
/* The first 16-bit unit is the byte order mark. The accepted values are
 * not shown in this listing; anything else is rejected below. */
106 switch (get_be16(s->pb)) {
112 av_log(s, AV_LOG_ERROR, "Incorrect BOM value in tag %s.\n", key);
117 case 2: /* UTF-16BE without BOM */
119 while (taglen > 1 && q - dst < dstlen - 7) {
/* feed 0 instead of reading past the end of the frame when a surrogate
 * pair would need more bytes than taglen still allows */
123 GET_UTF16(ch, ((taglen -= 2) >= 0 ? get(s->pb) : 0), break;)
124 PUT_UTF8(ch, tmp, *q++ = tmp;)
/* raw copy, clamped so it cannot exceed dstlen bytes */
130 len = FFMIN(taglen, dstlen);
131 get_buffer(s->pb, dst, len);
/* The full stop belongs before the newline; the original "%s\n." pushed
 * it onto the start of the following log line. */
135 av_log(s, AV_LOG_WARNING, "Unknown encoding in tag %s.\n", key);
/* Genre frames: a numeric genre written as "(N)" or "N" is replaced by
 * the name ff_id3v1_genre_str[N] when N <= ID3v1_GENRE_MAX.
 * NOTE(review): the declaration of genre is not visible here. If it is
 * signed, a negative value passes the <= test and indexes before the
 * table; if it is unsigned, "%d" does not match its type -- confirm. */
138 if (!(strcmp(key, "TCON") && strcmp(key, "TCO"))
139 && (sscanf(dst, "(%d)", &genre) == 1 || sscanf(dst, "%d", &genre) == 1)
140 && genre <= ID3v1_GENRE_MAX)
141 val = ff_id3v1_genre_str[genre];
142 else if (!(strcmp(key, "TXXX") && strcmp(key, "TXX"))) {
143 /* dst now contains two 0-terminated strings */
/* val points just past the first string, clamped to stay inside dst.
 * NOTE(review): the assignment that sets len for this branch is not
 * shown -- presumably the length of the first string; confirm. */
147 val = dst + FFMIN(len + 1, dstlen);
/* NOTE(review): any guard on val being non-NULL is not visible here */
153 av_metadata_set2(&s->metadata, key, val, 0);
/*
 * Walk the frames of an ID3v2 tag read from s->pb and pass frames to
 * read_ttag(); tags that cannot be handled are skipped with a log message.
 *
 * s:       format context; input is read from s->pb.
 * len:     number of tag bytes remaining after the header.
 * version: version byte taken from the tag header.
 * flags:   flags byte taken from the tag header. Bit 0x40 announces an
 *          extended header, bit 0x10 a footer (checked for version 4 only).
 */
156 void ff_id3v2_parse(AVFormatContext *s, int len, uint8_t version, uint8_t flags)
/* reason names the unsupported feature reported by the final av_log();
 * the conditions selecting each value are not shown in this listing */
167 reason = "compression";
186 reason = "unsynchronization";
190 if (isv34 && flags & 0x40) /* Extended header present, just skip over it */
191 url_fskip(s->pb, get_size(s->pb, 4));
193 while (len >= taghdrlen) {
/* Three frame header layouts are read below: a 4-byte id with a plain
 * 32-bit size, a size made of 7-bit groups (get_size), and a 3-byte id
 * with a 24-bit size. NOTE(review): the branch conditions are not shown;
 * presumably they select on version -- confirm. */
195 get_buffer(s->pb, tag, 4);
198 tlen = get_be32(s->pb);
200 tlen = get_size(s->pb, 4);
201 get_be16(s->pb); /* flags */
203 get_buffer(s->pb, tag, 3);
205 tlen = get_be24(s->pb);
/* NOTE(review): tlen comes straight from the file. A check that len
 * stays non-negative is not visible here -- confirm one exists before
 * len is handed to url_fskip(). */
207 len -= taghdrlen + tlen;
/* remember where this frame ends so the loop can resynchronise */
212 next = url_ftell(s->pb) + tlen;
215 read_ttag(s, tlen, tag);
/* log messages need a terminating newline; without it the next message
 * is appended to this line */
218 av_log(s, AV_LOG_WARNING, "invalid frame id, assuming padding\n");
219 url_fskip(s->pb, len);
222 /* Skip to end of tag */
223 url_fseek(s->pb, next, SEEK_SET);
226 if (version == 4 && flags & 0x10) /* Footer present, always 10 bytes, skip over it */
227 url_fskip(s->pb, 10);
/* unsupported tag: report why and skip the remaining len bytes */
231 av_log(s, AV_LOG_INFO, "ID3v2.%d tag skipped, cannot handle %s\n", version, reason);
232 url_fskip(s->pb, len);
/*
 * Conversion table pairing ID3v2 frame identifiers with metadata key
 * names. Both four-character ids (e.g. "TENC") and three-character ids
 * (e.g. "TEN") appear, mapped to the same key.
 *
 * NOTE(review): only part of the table is shown in this listing; the
 * remaining entries and the terminator are not visible.
 */
235 const AVMetadataConv ff_id3v2_metadata_conv[] = {
238 { "TCOM", "composer"},
241 { "TCOP", "copyright"},
244 { "TENC", "encoded_by"},
245 { "TEN", "encoded_by"},
248 { "TLAN", "language"},
251 { "TPE2", "album_artist"},
252 { "TP2", "album_artist"},
253 { "TPE3", "performer"},
254 { "TP3", "performer"},
256 { "TPUB", "publisher"},
/* sort-order and encoder frames; only four-character ids are visible */
259 { "TSOA", "album-sort"},
260 { "TSOP", "artist-sort"},
261 { "TSOT", "title-sort"},
262 { "TSSE", "encoder"},
266 const char ff_id3v2_tags[][4] = {
267 "TALB", "TBPM", "TCOM", "TCON", "TCOP", "TDEN", "TDLY", "TDOR", "TDRC",
268 "TDRL", "TDTG", "TENC", "TEXT", "TFLT", "TIPL", "TIT1", "TIT2", "TIT3",
269 "TKEY", "TLAN", "TLEN", "TMCL", "TMED", "TMOO", "TOAL", "TOFN", "TOLY",
270 "TOPE", "TOWN", "TPE1", "TPE2", "TPE3", "TPE4", "TPOS", "TPRO", "TPUB",
271 "TRCK", "TRSN", "TRSO", "TSOA", "TSOP", "TSOT", "TSRC", "TSSE", "TSST",