Accept FS#8469 by Bryan Childs with a few adjustments: Remove duplicate strip_extensi...
[Rockbox.git] / firmware / id3.c
blob1820078469e1b799a8b95819fcbebf7273121459
1 /***************************************************************************
2 * __________ __ ___.
3 * Open \______ \ ____ ____ | | _\_ |__ _______ ___
4 * Source | _// _ \_/ ___\| |/ /| __ \ / _ \ \/ /
5 * Jukebox | | ( <_> ) \___| < | \_\ ( <_> > < <
6 * Firmware |____|_ /\____/ \___ >__|_ \|___ /\____/__/\_ \
7 * \/ \/ \/ \/ \/
8 * $Id$
10 * Copyright (C) 2002 by Daniel Stenberg
12 * All files in this archive are subject to the GNU General Public License.
13 * See the file COPYING in the source tree root for full license agreement.
15 * This software is distributed on an "AS IS" basis, WITHOUT WARRANTY OF ANY
16 * KIND, either express or implied.
18 ****************************************************************************/
20 * Parts of this code have been stolen from the Ample project and were written
21 * by David Härdeman. It has since been extended and enhanced pretty much by
22 * all sorts of friendly Rockbox people.
26 /* tagResolver and associated code copyright 2003 Thomas Paul Diffenbach
29 #include <stdio.h>
30 #include <stdlib.h>
31 #include <string.h>
32 #include <errno.h>
33 #include <stdbool.h>
34 #include <stddef.h>
35 #include <ctype.h>
36 #include "config.h"
37 #include "file.h"
38 #include "logf.h"
39 #include "atoi.h"
41 #include "id3.h"
42 #include "mp3data.h"
43 #include "system.h"
44 #include "replaygain.h"
45 #include "rbunicode.h"
/** Database of audio formats **/
/* Indexed by the AFMT_* codec id.
 * NOTE(review): AFMT_ENTRY is defined outside this file; judging by the
 * values below its arguments appear to be (display label, decoder codec
 * name, encoder codec name, extension list) - confirm against id3.h.
 * The extension list packs several extensions into one string literal,
 * separated by "\0". */
const struct afmt_entry audio_formats[AFMT_NUM_CODECS] =
{
    /* Unknown file format */
    [AFMT_UNKNOWN] =
        AFMT_ENTRY("???", NULL, NULL, NULL ),

    /* MPEG Audio layer 1 */
    [AFMT_MPA_L1] =
        AFMT_ENTRY("MP1", "mpa", NULL, "mp1\0" ),
    /* MPEG Audio layer 2 */
    [AFMT_MPA_L2] =
        AFMT_ENTRY("MP2", "mpa", NULL, "mpa\0mp2\0" ),
    /* MPEG Audio layer 3 */
    [AFMT_MPA_L3] =
        AFMT_ENTRY("MP3", "mpa", "mp3_enc", "mp3\0" ),

    /* The remaining formats are only available with software codecs */
#if CONFIG_CODEC == SWCODEC
    /* Audio Interchange File Format */
    [AFMT_AIFF] =
        AFMT_ENTRY("AIFF", "aiff", "aiff_enc", "aiff\0aif\0"),
    /* Uncompressed PCM in a WAV file */
    [AFMT_PCM_WAV] =
        AFMT_ENTRY("WAV", "wav", "wav_enc", "wav\0" ),
    /* Ogg Vorbis */
    [AFMT_OGG_VORBIS] =
        AFMT_ENTRY("Ogg", "vorbis", NULL, "ogg\0" ),
    /* FLAC */
    [AFMT_FLAC] =
        AFMT_ENTRY("FLAC", "flac", NULL, "flac\0" ),
    /* Musepack */
    [AFMT_MPC] =
        AFMT_ENTRY("MPC", "mpc", NULL, "mpc\0" ),
    /* A/52 (aka AC3) audio */
    [AFMT_A52] =
        AFMT_ENTRY("AC3", "a52", NULL, "a52\0ac3\0" ),
    /* WavPack */
    [AFMT_WAVPACK] =
        AFMT_ENTRY("WV", "wavpack", "wavpack_enc", "wv\0" ),
    /* Apple Lossless Audio Codec */
    [AFMT_ALAC] =
        AFMT_ENTRY("ALAC", "alac", NULL, "m4a\0m4b\0" ),
    /* Advanced Audio Coding in M4A container */
    [AFMT_AAC] =
        AFMT_ENTRY("AAC", "aac", NULL, "mp4\0" ),
    /* Shorten */
    [AFMT_SHN] =
        AFMT_ENTRY("SHN", "shorten", NULL, "shn\0" ),
    /* SID File Format */
    [AFMT_SID] =
        AFMT_ENTRY("SID", "sid", NULL, "sid\0" ),
    /* ADX File Format */
    [AFMT_ADX] =
        AFMT_ENTRY("ADX", "adx", NULL, "adx\0" ),
    /* NESM (NES Sound Format) */
    [AFMT_NSF] =
        AFMT_ENTRY("NSF", "nsf", NULL, "nsf\0nsfe\0" ),
    /* Speex File Format */
    [AFMT_SPEEX] =
        AFMT_ENTRY("Speex","speex", NULL, "spx\0" ),
    /* SPC700 Save State */
    [AFMT_SPC] =
        AFMT_ENTRY("SPC", "spc", NULL, "spc\0" ),
    /* APE (Monkey's Audio) */
    [AFMT_APE] =
        AFMT_ENTRY("APE", "ape", NULL, "ape\0mac\0" ),
    /* WMA (WMAV1/V2 in ASF) */
    [AFMT_WMA] =
        AFMT_ENTRY("WMA", "wma", NULL, "wma\0wmv\0asf\0" ),
#endif
};
#if CONFIG_CODEC == SWCODEC && defined (HAVE_RECORDING)
/* get REC_FORMAT_* corresponding AFMT_* */
/* Lookup table indexed by REC_FORMAT_*; every slot is first filled with
 * AFMT_UNKNOWN through a range designator and the known formats are then
 * overridden individually. */
const int rec_format_afmt[REC_NUM_FORMATS] =
{
    /* give AFMT_UNKNOWN by default */
    [0 ... REC_NUM_FORMATS-1] = AFMT_UNKNOWN,
    /* add new entries below this line */
    [REC_FORMAT_AIFF] = AFMT_AIFF,
    [REC_FORMAT_MPA_L3] = AFMT_MPA_L3,
    [REC_FORMAT_WAVPACK] = AFMT_WAVPACK,
    [REC_FORMAT_PCM_WAV] = AFMT_PCM_WAV,
};

/* get AFMT_* corresponding REC_FORMAT_* */
/* Inverse lookup table indexed by AFMT_*; -1 marks codecs that have no
 * recording format. */
const int afmt_rec_format[AFMT_NUM_CODECS] =
{
    /* give -1 by default */
    [0 ... AFMT_NUM_CODECS-1] = -1,
    /* add new entries below this line */
    [AFMT_AIFF] = REC_FORMAT_AIFF,
    [AFMT_MPA_L3] = REC_FORMAT_MPA_L3,
    [AFMT_WAVPACK] = REC_FORMAT_WAVPACK,
    [AFMT_PCM_WAV] = REC_FORMAT_PCM_WAV,
};
#endif /* CONFIG_CODEC == SWCODEC && defined (HAVE_RECORDING) */
144 /****/
/* Decode a 28-bit "synchsafe" integer as used by ID3v2 size fields.
 *
 * Only the low 7 bits of each argument are used; b0 supplies the most
 * significant group and b3 the least significant one.
 *
 * Returns the combined value.
 */
unsigned long unsync(unsigned long b0,
                     unsigned long b1,
                     unsigned long b2,
                     unsigned long b3)
{
    long value = 0;

    value |= (long)(b0 & 0x7F) << 21;
    value |= (long)(b1 & 0x7F) << 14;
    value |= (long)(b2 & 0x7F) << 7;
    value |= (long)(b3 & 0x7F);

    return value;
}
/* Names of the numeric ID3 genres; the array index is the genre number. */
static const char* const genres[] = {
    "Blues", "Classic Rock", "Country", "Dance", "Disco", "Funk", "Grunge",
    "Hip-Hop", "Jazz", "Metal", "New Age", "Oldies", "Other", "Pop", "R&B",
    "Rap", "Reggae", "Rock", "Techno", "Industrial", "Alternative", "Ska",
    "Death Metal", "Pranks", "Soundtrack", "Euro-Techno", "Ambient", "Trip-Hop",
    "Vocal", "Jazz+Funk", "Fusion", "Trance", "Classical", "Instrumental",
    "Acid", "House", "Game", "Sound Clip", "Gospel", "Noise", "AlternRock",
    "Bass", "Soul", "Punk", "Space", "Meditative", "Instrumental Pop",
    "Instrumental Rock", "Ethnic", "Gothic", "Darkwave", "Techno-Industrial",
    "Electronic", "Pop-Folk", "Eurodance", "Dream", "Southern Rock", "Comedy",
    "Cult", "Gangsta", "Top 40", "Christian Rap", "Pop/Funk", "Jungle",
    "Native American", "Cabaret", "New Wave", "Psychadelic", "Rave",
    "Showtunes", "Trailer", "Lo-Fi", "Tribal", "Acid Punk", "Acid Jazz",
    "Polka", "Retro", "Musical", "Rock & Roll", "Hard Rock",

    /* winamp extensions */
    "Folk", "Folk-Rock", "National Folk", "Swing", "Fast Fusion", "Bebob",
    "Latin", "Revival", "Celtic", "Bluegrass", "Avantgarde", "Gothic Rock",
    "Progressive Rock", "Psychedelic Rock", "Symphonic Rock", "Slow Rock",
    "Big Band", "Chorus", "Easy Listening", "Acoustic", "Humour", "Speech",
    "Chanson", "Opera", "Chamber Music", "Sonata", "Symphony", "Booty Bass",
    "Primus", "Porn Groove", "Satire", "Slow Jam", "Club", "Tango", "Samba",
    "Folklore", "Ballad", "Power Ballad", "Rhythmic Soul", "Freestyle",
    "Duet", "Punk Rock", "Drum Solo", "A capella", "Euro-House", "Dance Hall",
    "Goa", "Drum & Bass", "Club-House", "Hardcore", "Terror", "Indie",
    "BritPop", "Negerpunk", "Polsk Punk", "Beat", "Christian Gangsta Rap",
    "Heavy Metal", "Black Metal", "Crossover", "Contemporary Christian",
    "Christian Rock", "Merengue", "Salsa", "Thrash Metal", "Anime", "Jpop",
    "Synthpop"
};

/* Look up the name of a numeric genre.
 *
 * Arguments: genre_num - index into the "genres" table
 *
 * Returns:   pointer to the (read-only) genre name, or NULL when genre_num
 *            is outside the table
 */
char* id3_get_num_genre(const unsigned int genre_num)
{
    if (genre_num < sizeof(genres)/sizeof(genres[0]))
        return (char*)genres[genre_num];
    return NULL;
}

/* True if the string is from the "genres" array.
 *
 * The test is on pointer identity, not on string contents.  Each table
 * entry is compared for equality instead of range-checking against the
 * first and last entries: ordering comparisons between pointers to
 * different string literals are undefined, and nothing guarantees that
 * the literals are laid out in table order.
 */
static bool id3_is_genre_string(const char *string)
{
    size_t i;

    for (i = 0; i < sizeof(genres)/sizeof(genres[0]); i++) {
        if (string == genres[i])
            return true;
    }

    return false;
}
202 char* id3_get_codec(const struct mp3entry* id3)
204 if (id3->codectype < AFMT_NUM_CODECS) {
205 return (char*)audio_formats[id3->codectype].label;
206 } else {
207 return NULL;
212 HOW TO ADD ADDITIONAL ID3 VERSION 2 TAGS
213 Code and comments by Thomas Paul Diffenbach
215 To add another ID3v2 Tag, do the following:
216 1. add a char* named for the tag to struct mp3entry in id3.h,
217 (I (tpd) prefer to use char* rather than ints, even for what seems like
218 numerical values, for cases where a number won't do, e.g.,
219 YEAR: "circa 1765", "1790/1977" (composed/performed), "28 Feb 1969"
220 TRACK: "1/12", "1 of 12", GENRE: "Freeform genre name"
221 Text is more flexible, and as the main use of id3 data is to
222 display it, converting it to an int just means reconverting to
223 display it, at a runtime cost.)
225 2. If any special processing beyond copying the tag value from the Id3
226 block to the struct mp3entry is required (such as converting to an
227 int), write a function to perform this special processing.
229 This function's prototype must match that of
230 typedef tagPostProcessFunc, that is it must be:
231 int func( struct mp3entry*, char* tag, int bufferpos )
232 the first argument is a pointer to the current mp3entry structure the
233 second argument is a pointer to the null terminated string value of the
234 tag found the third argument is the offset of the next free byte in the
235 mp3entry's buffer your function should return the corrected offset; if
236 you don't lengthen or shorten the tag string, you can return the third
237 argument unchanged.
239 Unless you have a good reason not to, make the function static.
240 TO JUST COPY THE TAG NO SPECIAL PROCESSING FUNCTION IS NEEDED.
242 3. add one or more entries to the tagList array, using the format:
243 char* ID3 Tag symbolic name -- see the ID3 specification for these,
244 sizeof() that name minus 1,
245 offsetof( struct mp3entry, variable_name_in_struct_mp3entry ),
246 pointer to your special processing function or NULL
247 if you need no special processing
248 flag indicating if this tag is binary or textual
249 Many ID3 symbolic names come in more than one form. You can add both
250 forms, each referencing the same variable in struct mp3entry.
251 If both forms are present, the last found will be used.
252 Note that the offset can be zero, in which case no entry will be set
253 in the mp3entry struct; the frame is still read into the buffer and
254 the special processing function is called (several times, if there
255 are several frames with the same name).
257 4. Alternately, use the TAG_LIST_ENTRY macro with
258 ID3 tag symbolic name,
259 variable in struct mp3entry,
260 special processing function address
262 5. Add code to wps-display.c function get_tag to assign a printf-like
263 format specifier for the tag */
/* Structure for ID3 Tag extraction information */
struct tag_resolver {
    /* ID3v2 frame name, e.g. "TIT2" */
    const char* tag;
    /* Length of the frame name (3 or 4 characters in the table below) */
    int tag_length;
    /* offsetof() the destination char* in struct mp3entry; 0 means no
       field is set and only ppFunc is called */
    size_t offset;
    /* Optional post-processing function; receives the entry, the
       nul-terminated tag value and the offset of the next free byte in
       the entry's buffer, and returns the corrected offset */
    int (*ppFunc)(struct mp3entry*, char* tag, int bufferpos);
    /* True if the frame holds binary data rather than text */
    bool binary;
};

/* Carries the "previous byte was 0xff" state between successive
   read_unsynched()/skip_unsynched() calls; reset by setid3v2title() */
static bool global_ff_found;
/* Undo ID3v2 unsynchronization in place.
 *
 * Every zero byte that directly follows a 0xff byte is dropped; all other
 * bytes are kept.
 *
 * Arguments: tag      - buffer to decode in place
 *            len      - number of bytes in the buffer
 *            ff_found - in: true if the byte preceding the buffer was 0xff
 *                       out: true if the last byte of the buffer was an
 *                       0xff that did not itself follow an 0xff
 *
 * Returns:   the number of bytes remaining after decoding
 */
static int unsynchronize(char* tag, int len, bool *ff_found)
{
    unsigned char *src = (unsigned char *)tag;
    unsigned char *dst = src;
    int left;

    for (left = len; left > 0; left--) {
        const unsigned char byte = *src++;
        const bool after_ff = *ff_found;

        /* Always store the byte; it only becomes part of the output if
           the write position is advanced below */
        *dst = byte;
        *ff_found = !after_ff && (byte == 0xff);

        if (!after_ff || byte != 0)
            dst++;
    }

    return (int)(dst - (unsigned char *)tag);
}
/* Undo unsynchronization on one complete frame held in memory.  The 0xff
 * state always starts out cleared, so nothing carries over from one frame
 * to the next.  Returns the decoded length. */
static int unsynchronize_frame(char* tag, int len)
{
    bool pending_ff = false;
    const int decoded_len = unsynchronize(tag, len, &pending_ff);

    return decoded_len;
}
311 static int read_unsynched(int fd, void *buf, int len)
313 int i;
314 int rc;
315 int remaining = len;
316 char *wp;
317 char *rp;
319 wp = buf;
321 while(remaining) {
322 rp = wp;
323 rc = read(fd, rp, remaining);
324 if(rc <= 0)
325 return rc;
327 i = unsynchronize(wp, remaining, &global_ff_found);
328 remaining -= i;
329 wp += i;
332 return len;
335 static int skip_unsynched(int fd, int len)
337 int rc;
338 int remaining = len;
339 int rlen;
340 char buf[32];
342 while(remaining) {
343 rlen = MIN(sizeof(buf), (unsigned int)remaining);
344 rc = read(fd, buf, rlen);
345 if(rc <= 0)
346 return rc;
348 remaining -= unsynchronize(buf, rlen, &global_ff_found);
351 return len;
354 /* parse numeric value from string */
355 static int parsetracknum( struct mp3entry* entry, char* tag, int bufferpos )
357 entry->tracknum = atoi( tag );
358 return bufferpos;
361 /* parse numeric value from string */
362 static int parsediscnum( struct mp3entry* entry, char* tag, int bufferpos )
364 entry->discnum = atoi( tag );
365 return bufferpos;
368 /* parse numeric value from string */
369 static int parseyearnum( struct mp3entry* entry, char* tag, int bufferpos )
371 entry->year = atoi( tag );
372 return bufferpos;
375 /* parse numeric genre from string, version 2.2 and 2.3 */
376 static int parsegenre( struct mp3entry* entry, char* tag, int bufferpos )
378 if(entry->id3version >= ID3_VER_2_4) {
379 /* In version 2.4 and up, there are no parentheses, and the genre frame
380 is a list of strings, either numbers or text. */
382 /* Is it a number? */
383 if(isdigit(tag[0])) {
384 entry->genre_string = id3_get_num_genre(atoi( tag ));
385 return tag - entry->id3v2buf;
386 } else {
387 entry->genre_string = tag;
388 return bufferpos;
390 } else {
391 if( tag[0] == '(' && tag[1] != '(' ) {
392 entry->genre_string = id3_get_num_genre(atoi( tag + 1 ));
393 return tag - entry->id3v2buf;
395 else {
396 entry->genre_string = tag;
397 return bufferpos;
402 #if CONFIG_CODEC == SWCODEC
403 /* parse user defined text, looking for replaygain information. */
404 static int parseuser( struct mp3entry* entry, char* tag, int bufferpos )
406 char* value = NULL;
407 int desc_len = strlen(tag);
408 int value_len = 0;
410 if ((tag - entry->id3v2buf + desc_len + 2) < bufferpos) {
411 /* At least part of the value was read, so we can safely try to
412 * parse it
414 value = tag + desc_len + 1;
415 value_len = parse_replaygain(tag, value, entry, tag,
416 bufferpos - (tag - entry->id3v2buf));
419 return tag - entry->id3v2buf + value_len;
422 /* parse RVA2 binary data and convert to replaygain information. */
423 static int parserva2( struct mp3entry* entry, char* tag, int bufferpos )
425 int desc_len = strlen(tag);
426 int end_pos = tag - entry->id3v2buf + desc_len + 5;
427 int value_len = 0;
428 unsigned char* value = tag + desc_len + 1;
430 /* Only parse RVA2 replaygain tags if tag version == 2.4 and channel
431 * type is master volume.
433 if (entry->id3version == ID3_VER_2_4 && end_pos < bufferpos
434 && *value++ == 1) {
435 long gain = 0;
436 long peak = 0;
437 long peakbits;
438 long peakbytes;
439 bool album = false;
441 /* The RVA2 specification is unclear on some things (id string and
442 * peak volume), but this matches how Quod Libet use them.
445 gain = (int16_t) ((value[0] << 8) | value[1]);
446 value += 2;
447 peakbits = *value++;
448 peakbytes = (peakbits + 7) / 8;
450 /* Only use the topmost 24 bits for peak volume */
451 if (peakbytes > 3) {
452 peakbytes = 3;
455 /* Make sure the peak bits were read */
456 if (end_pos + peakbytes < bufferpos) {
457 long shift = ((8 - (peakbits & 7)) & 7) + (3 - peakbytes) * 8;
459 for ( ; peakbytes; peakbytes--) {
460 peak <<= 8;
461 peak += *value++;
464 peak <<= shift;
466 if (peakbits > 24) {
467 peak += *value >> (8 - shift);
471 if (strcasecmp(tag, "album") == 0) {
472 album = true;
473 } else if (strcasecmp(tag, "track") != 0) {
474 gain = 0;
477 value_len = parse_replaygain_int(album, gain, peak * 2, entry,
478 tag, sizeof(entry->id3v2buf) - (tag - entry->id3v2buf));
481 return tag - entry->id3v2buf + value_len;
483 #endif
/* Table of the ID3v2 frames that are extracted.  Each row gives the frame
 * name, its length, the destination field in struct mp3entry (0 = none),
 * an optional post-processing function and whether the frame is binary.
 * Three-character names are the ID3v2.2 forms of the frames. */
static const struct tag_resolver taglist[] = {
    { "TPE1", 4, offsetof(struct mp3entry, artist), NULL, false },
    { "TP1", 3, offsetof(struct mp3entry, artist), NULL, false },
    { "TIT2", 4, offsetof(struct mp3entry, title), NULL, false },
    { "TT2", 3, offsetof(struct mp3entry, title), NULL, false },
    { "TALB", 4, offsetof(struct mp3entry, album), NULL, false },
    { "TAL", 3, offsetof(struct mp3entry, album), NULL, false },
    { "TRK", 3, offsetof(struct mp3entry, track_string), &parsetracknum, false },
    { "TPOS", 4, offsetof(struct mp3entry, disc_string), &parsediscnum, false },
    { "TRCK", 4, offsetof(struct mp3entry, track_string), &parsetracknum, false },
    { "TDRC", 4, offsetof(struct mp3entry, year_string), &parseyearnum, false },
    { "TYER", 4, offsetof(struct mp3entry, year_string), &parseyearnum, false },
    { "TYE", 3, offsetof(struct mp3entry, year_string), &parseyearnum, false },
    { "TCOM", 4, offsetof(struct mp3entry, composer), NULL, false },
    { "TPE2", 4, offsetof(struct mp3entry, albumartist), NULL, false },
    { "TP2", 3, offsetof(struct mp3entry, albumartist), NULL, false },
    { "TIT1", 4, offsetof(struct mp3entry, grouping), NULL, false },
    { "TT1", 3, offsetof(struct mp3entry, grouping), NULL, false },
    { "COMM", 4, offsetof(struct mp3entry, comment), NULL, false },
    { "TCON", 4, offsetof(struct mp3entry, genre_string), &parsegenre, false },
    { "TCO", 3, offsetof(struct mp3entry, genre_string), &parsegenre, false },
#if CONFIG_CODEC == SWCODEC
    /* No destination field: these frames are only fed to their parser */
    { "TXXX", 4, 0, &parseuser, false },
    { "RVA2", 4, 0, &parserva2, true },
#endif
};

/* Number of rows in taglist */
#define TAGLIST_SIZE ((int)(sizeof(taglist) / sizeof(taglist[0])))
/* Get the length of an ID3 string in the given encoding.
 *
 * Encodings 0x01 and 0x02 are scanned two bytes at a time for a 16-bit
 * nil; every other encoding value is treated as a byte string.
 *
 * Returns the length in bytes, including the end nil.
 */
static int unicode_len(char encoding, const void* string)
{
    const char *start = string;
    const char *p = start;

    if (encoding != 0x01 && encoding != 0x02)
        return strlen(start) + 1;

    /* string might be unaligned, so it is read byte by byte; using short*
       can crash on ARM and SH1 */
    while (p[0] != 0 || p[1] != 0)
        p += 2;

    /* Count the terminating pair as well */
    return (p + 2) - start;
}
/* Convert the text of an ID3v2 frame to UTF-8.
 *
 * The first byte of the frame selects the encoding: 0x00 is ISO 8859-1,
 * 0x01 and 0x02 are 16-bit Unicode (with or without BOM), 0x03 is UTF-8.
 * Any other value is treated as the first character of a plain string in
 * the default codepage.
 *
 * Arguments: string  - frame contents, starting with the encoding byte
 *            utf8buf - destination buffer; the caller sizes it as
 *                      3 * (*len) + 1 bytes
 *            len     - in: number of bytes in string
 *                      out: number of bytes stored in utf8buf, not
 *                      counting the final terminator
 *
 * Returns:   always 0
 */
static int unicode_munge(char* string, char* utf8buf, int *len) {
    long tmp;
    bool le = false;
    int i = 0;
    unsigned char *str = (unsigned char *)string;
    int templen = 0;
    unsigned char* utf8 = (unsigned char *)utf8buf;

    /* An empty frame has no encoding byte to look at; without this check
       the length would go negative below */
    if (*len <= 0) {
        utf8buf[0] = 0;
        *len = 0;
        return 0;
    }

    switch (str[0]) {
        case 0x00: /* Type 0x00 is ordinary ISO 8859-1 */
            str++;
            (*len)--;
            utf8 = iso_decode(str, utf8, -1, *len);
            *utf8 = 0;
            *len = utf8 - (unsigned char *)utf8buf;
            break;

        case 0x01: /* Unicode with or without BOM */
        case 0x02:
            (*len)--;
            str++;

            /* Not even one complete 16-bit unit: treat as empty string */
            if (*len < 2) {
                *utf8 = 0;
                *len = 0;
                break;
            }

            /* Handle frames with more than one string
               (needed for TXXX frames).*/
            do {
                tmp = bytes2int(0, 0, str[0], str[1]);

                /* Now check if there is a BOM
                   (zero-width non-breaking space, 0xfeff)
                   and if it is in little or big endian format */
                if(tmp == 0xfffe) { /* Little endian? */
                    le = true;
                    str += 2;
                    (*len)-=2;
                } else if(tmp == 0xfeff) { /* Big endian? */
                    /* Do not inherit the byte order of a previous string */
                    le = false;
                    str += 2;
                    (*len)-=2;
                } else
                /* If there is no BOM (which is a specification violation),
                   let's try to guess it. If one of the bytes is 0x00, it is
                   probably the most significant one. */
                    if(str[1] == 0)
                        le = true;

                do {
                    if(le)
                        utf8 = utf16LEdecode(str, utf8, 1);
                    else
                        utf8 = utf16BEdecode(str, utf8, 1);

                    str+=2;
                    i += 2;
                } while((str[0] || str[1]) && (i < *len));

                *utf8++ = 0; /* Terminate the string */
                templen += (strlen(&utf8buf[templen]) + 1);
                str += 2;
                i+=2;
            } while(i < *len);
            *len = templen - 1;
            break;

        case 0x03: /* UTF-8 encoded string */
            /* Copy everything behind the encoding byte, and nothing more */
            (*len)--;
            memcpy(utf8, str + 1, *len);
            utf8[*len] = 0;
            break;

        default: /* Plain old string */
            utf8 = iso_decode(str, utf8, -1, *len);
            *utf8 = 0;
            *len = utf8 - (unsigned char *)utf8buf;
            break;
    }
    return 0;
}
618 * Sets the title of an MP3 entry based on its ID3v1 tag.
620 * Arguments: file - the MP3 file to scen for a ID3v1 tag
621 * entry - the entry to set the title in
623 * Returns: true if a title was found and created, else false
625 static bool setid3v1title(int fd, struct mp3entry *entry)
627 unsigned char buffer[128];
628 static const char offsets[] = {3, 33, 63, 97, 93, 125, 127};
629 int i, j;
630 unsigned char* utf8;
632 if (-1 == lseek(fd, -128, SEEK_END))
633 return false;
635 if (read(fd, buffer, sizeof buffer) != sizeof buffer)
636 return false;
638 if (strncmp((char *)buffer, "TAG", 3))
639 return false;
641 entry->id3v1len = 128;
642 entry->id3version = ID3_VER_1_0;
644 for (i=0; i < (int)sizeof offsets; i++) {
645 unsigned char* ptr = (unsigned char *)buffer + offsets[i];
647 switch(i) {
648 case 0:
649 case 1:
650 case 2:
651 /* kill trailing space in strings */
652 for (j=29; j && (ptr[j]==0 || ptr[j]==' '); j--)
653 ptr[j] = 0;
654 /* convert string to utf8 */
655 utf8 = (unsigned char *)entry->id3v1buf[i];
656 utf8 = iso_decode(ptr, utf8, -1, 30);
657 /* make sure string is terminated */
658 *utf8 = 0;
659 break;
661 case 3:
662 /* kill trailing space in strings */
663 for (j=27; j && (ptr[j]==0 || ptr[j]==' '); j--)
664 ptr[j] = 0;
665 /* convert string to utf8 */
666 utf8 = (unsigned char *)entry->id3v1buf[3];
667 utf8 = iso_decode(ptr, utf8, -1, 28);
668 /* make sure string is terminated */
669 *utf8 = 0;
670 break;
672 case 4:
673 ptr[4] = 0;
674 entry->year = atoi((char *)ptr);
675 break;
677 case 5:
678 /* id3v1.1 uses last two bytes of comment field for track
679 number: first must be 0 and second is track num */
680 if (!ptr[0] && ptr[1]) {
681 entry->tracknum = ptr[1];
682 entry->id3version = ID3_VER_1_1;
684 break;
686 case 6:
687 /* genre */
688 entry->genre_string = id3_get_num_genre(ptr[0]);
689 break;
693 entry->title = entry->id3v1buf[0];
694 entry->artist = entry->id3v1buf[1];
695 entry->album = entry->id3v1buf[2];
696 entry->comment = entry->id3v1buf[3];
698 return true;
703 * Sets the title of an MP3 entry based on its ID3v2 tag.
705 * Arguments: file - the MP3 file to scan for a ID3v2 tag
706 * entry - the entry to set the title in
708 * Returns: true if a title was found and created, else false
710 static void setid3v2title(int fd, struct mp3entry *entry)
712 int minframesize;
713 int size;
714 long bufferpos = 0, totframelen, framelen;
715 char header[10];
716 char tmp[4];
717 unsigned char version;
718 char *buffer = entry->id3v2buf;
719 int bytesread = 0;
720 int buffersize = sizeof(entry->id3v2buf);
721 unsigned char global_flags;
722 int flags;
723 int skip;
724 bool global_unsynch = false;
725 bool unsynch = false;
726 int data_length_ind;
727 int i, j;
728 int rc;
730 global_ff_found = false;
732 /* Bail out if the tag is shorter than 10 bytes */
733 if(entry->id3v2len < 10)
734 return;
736 /* Read the ID3 tag version from the header */
737 lseek(fd, 0, SEEK_SET);
738 if(10 != read(fd, header, 10))
739 return;
741 /* Get the total ID3 tag size */
742 size = entry->id3v2len - 10;
744 version = header[3];
745 switch ( version ) {
746 case 2:
747 version = ID3_VER_2_2;
748 minframesize = 8;
749 break;
751 case 3:
752 version = ID3_VER_2_3;
753 minframesize = 12;
754 break;
756 case 4:
757 version = ID3_VER_2_4;
758 minframesize = 12;
759 break;
761 default:
762 /* unsupported id3 version */
763 return;
765 entry->id3version = version;
766 entry->tracknum = entry->year = entry->discnum = 0;
767 entry->title = entry->artist = entry->album = NULL; /* FIXME incomplete */
769 global_flags = header[5];
771 /* Skip the extended header if it is present */
772 if(global_flags & 0x40) {
773 if(version == ID3_VER_2_3) {
774 if(10 != read(fd, header, 10))
775 return;
776 /* The 2.3 extended header size doesn't include the header size
777 field itself. Also, it is not unsynched. */
778 framelen =
779 bytes2int(header[0], header[1], header[2], header[3]) + 4;
781 /* Skip the rest of the header */
782 lseek(fd, framelen - 10, SEEK_CUR);
785 if(version >= ID3_VER_2_4) {
786 if(4 != read(fd, header, 4))
787 return;
789 /* The 2.4 extended header size does include the entire header,
790 so here we can just skip it. This header is unsynched. */
791 framelen = unsync(header[0], header[1],
792 header[2], header[3]);
794 lseek(fd, framelen - 4, SEEK_CUR);
798 /* Is unsynchronization applied? */
799 if(global_flags & 0x80) {
800 global_unsynch = true;
804 * We must have at least minframesize bytes left for the
805 * remaining frames to be interesting
807 while (size >= minframesize && bufferpos < buffersize - 1) {
808 flags = 0;
810 /* Read frame header and check length */
811 if(version >= ID3_VER_2_3) {
812 if(global_unsynch && version <= ID3_VER_2_3)
813 rc = read_unsynched(fd, header, 10);
814 else
815 rc = read(fd, header, 10);
816 if(rc != 10)
817 return;
818 /* Adjust for the 10 bytes we read */
819 size -= 10;
821 flags = bytes2int(0, 0, header[8], header[9]);
823 if (version >= ID3_VER_2_4) {
824 framelen = unsync(header[4], header[5],
825 header[6], header[7]);
826 } else {
827 /* version .3 files don't use synchsafe ints for
828 * size */
829 framelen = bytes2int(header[4], header[5],
830 header[6], header[7]);
832 } else {
833 if(6 != read(fd, header, 6))
834 return;
835 /* Adjust for the 6 bytes we read */
836 size -= 6;
838 framelen = bytes2int(0, header[3], header[4], header[5]);
841 logf("framelen = %ld", framelen);
842 if(framelen == 0){
843 if (header[0] == 0 && header[1] == 0 && header[2] == 0)
844 return;
845 else
846 continue;
849 unsynch = false;
850 data_length_ind = 0;
852 if(flags)
854 skip = 0;
856 if (version >= ID3_VER_2_4) {
857 if(flags & 0x0040) { /* Grouping identity */
858 lseek(fd, 1, SEEK_CUR); /* Skip 1 byte */
859 framelen--;
861 } else {
862 if(flags & 0x0020) { /* Grouping identity */
863 lseek(fd, 1, SEEK_CUR); /* Skip 1 byte */
864 framelen--;
868 if(flags & 0x000c) /* Compression or encryption */
870 /* Skip it */
871 size -= framelen;
872 lseek(fd, framelen, SEEK_CUR);
873 continue;
876 if(flags & 0x0002) /* Unsynchronization */
877 unsynch = true;
879 if (version >= ID3_VER_2_4) {
880 if(flags & 0x0001) { /* Data length indicator */
881 if(4 != read(fd, tmp, 4))
882 return;
884 data_length_ind = unsync(tmp[0], tmp[1], tmp[2], tmp[3]);
885 framelen -= 4;
890 /* Keep track of the remaining frame size */
891 totframelen = framelen;
893 /* If the frame is larger than the remaining buffer space we try
894 to read as much as would fit in the buffer */
895 if(framelen >= buffersize - bufferpos)
896 framelen = buffersize - bufferpos - 1;
898 logf("id3v2 frame: %.4s", header);
900 /* Check for certain frame headers
902 'size' is the amount of frame bytes remaining. We decrement it by
903 the amount of bytes we read. If we fail to read as many bytes as
904 we expect, we assume that we can't read from this file, and bail
905 out.
907 For each frame. we will iterate over the list of supported tags,
908 and read the tag into entry's buffer. All tags will be kept as
909 strings, for cases where a number won't do, e.g., YEAR: "circa
910 1765", "1790/1977" (composed/performed), "28 Feb 1969" TRACK:
911 "1/12", "1 of 12", GENRE: "Freeform genre name" Text is more
912 flexible, and as the main use of id3 data is to display it,
913 converting it to an int just means reconverting to display it, at a
914 runtime cost.
916 For tags that the current code does convert to ints, a post
917 processing function will be called via a pointer to function. */
919 for (i=0; i<TAGLIST_SIZE; i++) {
920 const struct tag_resolver* tr = &taglist[i];
921 char** ptag = tr->offset ? (char**) (((char*)entry) + tr->offset)
922 : NULL;
923 char* tag;
925 /* Only ID3_VER_2_2 uses frames with three-character names. */
926 if (((version == ID3_VER_2_2) && (tr->tag_length != 3))
927 || ((version > ID3_VER_2_2) && (tr->tag_length != 4))) {
928 continue;
931 /* Note that parser functions sometimes set *ptag to NULL, so
932 * the "!*ptag" check here doesn't always have the desired
933 * effect. Should the parser functions (parsegenre in
934 * particular) be updated to handle the case of being called
935 * multiple times, or should the "*ptag" check be removed?
937 if( (!ptag || !*ptag) && !memcmp( header, tr->tag, tr->tag_length ) ) {
939 /* found a tag matching one in tagList, and not yet filled */
940 tag = buffer + bufferpos;
942 if(global_unsynch && version <= ID3_VER_2_3)
943 bytesread = read_unsynched(fd, tag, framelen);
944 else
945 bytesread = read(fd, tag, framelen);
947 if( bytesread != framelen )
948 return;
950 size -= bytesread;
952 if(unsynch || (global_unsynch && version >= ID3_VER_2_4))
953 bytesread = unsynchronize_frame(tag, bytesread);
955 /* the COMM frame has a 3 char field to hold an ISO-639-1
956 * language string and an optional short description;
957 * remove them so unicode_munge can work correctly
960 if(!memcmp( header, "COMM", 4 )) {
961 int offset;
962 /* ignore comments with iTunes 7 soundcheck/gapless data */
963 if(!strncmp(tag+4, "iTun", 4))
964 break;
965 offset = 3 + unicode_len(*tag, tag + 4);
966 if(bytesread > offset) {
967 bytesread -= offset;
968 memmove(tag + 1, tag + 1 + offset, bytesread - 1);
972 /* Attempt to parse Unicode string only if the tag contents
973 aren't binary */
974 if(!tr->binary) {
975 /* UTF-8 could potentially be 3 times larger */
976 /* so we need to create a new buffer */
977 char utf8buf[(3 * bytesread) + 1];
979 unicode_munge( tag, utf8buf, &bytesread );
981 if(bytesread >= buffersize - bufferpos)
982 bytesread = buffersize - bufferpos - 1;
984 for (j = 0; j < bytesread; j++)
985 tag[j] = utf8buf[j];
987 /* remove trailing spaces */
988 while ( bytesread > 0 && isspace(tag[bytesread-1]))
989 bytesread--;
992 tag[bytesread] = 0;
993 bufferpos += bytesread + 1;
995 if (ptag)
996 *ptag = tag;
998 if( tr->ppFunc )
999 bufferpos = tr->ppFunc(entry, tag, bufferpos);
1001 /* Seek to the next frame */
1002 if(framelen < totframelen)
1003 lseek(fd, totframelen - framelen, SEEK_CUR);
1004 break;
1008 if( i == TAGLIST_SIZE ) {
1009 /* no tag in tagList was found, or it was a repeat.
1010 skip it using the total size */
1012 if(global_unsynch && version <= ID3_VER_2_3) {
1013 size -= skip_unsynched(fd, totframelen);
1014 } else {
1015 if(data_length_ind)
1016 totframelen = data_length_ind;
1018 size -= totframelen;
1019 if( lseek(fd, totframelen, SEEK_CUR) == -1 )
1020 return;
1027 * Calculates the size of the ID3v2 tag.
1029 * Arguments: file - the file to search for a tag.
1031 * Returns: the size of the tag or 0 if none was found
1033 int getid3v2len(int fd)
1035 char buf[6];
1036 int offset;
1038 /* Make sure file has a ID3 tag */
1039 if((-1 == lseek(fd, 0, SEEK_SET)) ||
1040 (read(fd, buf, 6) != 6) ||
1041 (strncmp(buf, "ID3", strlen("ID3")) != 0))
1042 offset = 0;
1044 /* Now check what the ID3v2 size field says */
1045 else
1046 if(read(fd, buf, 4) != 4)
1047 offset = 0;
1048 else
1049 offset = unsync(buf[0], buf[1], buf[2], buf[3]) + 10;
1051 logf("ID3V2 Length: 0x%x", offset);
1052 return offset;
1056 * Calculates the length (in milliseconds) of an MP3 file.
1058 * Modified to only use integers.
1060 * Arguments: file - the file to calculate the length upon
1061 * entry - the entry to update with the length
1063 * Returns: the song length in milliseconds,
1064 * 0 means that it couldn't be calculated
1066 static int getsonglength(int fd, struct mp3entry *entry)
1068 unsigned long filetime = 0;
1069 struct mp3info info;
1070 long bytecount;
1072 /* Start searching after ID3v2 header */
1073 if(-1 == lseek(fd, entry->id3v2len, SEEK_SET))
1074 return 0;
1076 bytecount = get_mp3file_info(fd, &info);
1078 logf("Space between ID3V2 tag and first audio frame: 0x%lx bytes",
1079 bytecount);
1081 if(bytecount < 0)
1082 return -1;
1084 bytecount += entry->id3v2len;
1086 /* Validate byte count, in case the file has been edited without
1087 * updating the header.
1089 if (info.byte_count)
1091 const unsigned long expected = entry->filesize - entry->id3v1len
1092 - entry->id3v2len;
1093 const unsigned long diff = MAX(10240, info.byte_count / 20);
1095 if ((info.byte_count > expected + diff)
1096 || (info.byte_count < expected - diff))
1098 logf("Note: info.byte_count differs from expected value by "
1099 "%ld bytes", labs((long) (expected - info.byte_count)));
1100 info.byte_count = 0;
1101 info.frame_count = 0;
1102 info.file_time = 0;
1103 info.enc_padding = 0;
1105 /* Even if the bitrate was based on "known bad" values, it
1106 * should still be better for VBR files than using the bitrate
1107 * of the first audio frame.
1112 entry->bitrate = info.bitrate;
1113 entry->frequency = info.frequency;
1114 entry->version = info.version;
1115 entry->layer = info.layer;
1116 switch(entry->layer) {
1117 #if CONFIG_CODEC==SWCODEC
1118 case 0:
1119 entry->codectype=AFMT_MPA_L1;
1120 break;
1121 #endif
1122 case 1:
1123 entry->codectype=AFMT_MPA_L2;
1124 break;
1125 case 2:
1126 entry->codectype=AFMT_MPA_L3;
1127 break;
1130 /* If the file time hasn't been established, this may be a fixed
1131 rate MP3, so just use the default formula */
1133 filetime = info.file_time;
1135 if(filetime == 0)
1137 /* Prevent a division by zero */
1138 if (info.bitrate < 8)
1139 filetime = 0;
1140 else
1141 filetime = (entry->filesize - bytecount) / (info.bitrate / 8);
1142 /* bitrate is in kbps so this delivers milliseconds. Doing bitrate / 8
1143 * instead of filesize * 8 is exact, because mpeg audio bitrates are
1144 * always multiples of 8, and it avoids overflows. */
1147 entry->frame_count = info.frame_count;
1149 entry->vbr = info.is_vbr;
1150 entry->has_toc = info.has_toc;
1152 #if CONFIG_CODEC==SWCODEC
1153 entry->lead_trim = info.enc_delay;
1154 entry->tail_trim = info.enc_padding;
1155 #endif
1157 memcpy(entry->toc, info.toc, sizeof(info.toc));
1159 entry->vbr_header_pos = info.vbr_header_pos;
1161 /* Update the seek point for the first playable frame */
1162 entry->first_frame_offset = bytecount;
1163 logf("First frame is at %lx", entry->first_frame_offset);
1165 return filetime;
1169 * Checks all relevant information (such as ID3v1 tag, ID3v2 tag, length etc)
1170 * about an MP3 file and updates it's entry accordingly.
1172 Note, that this returns true for successful, false for error! */
1173 bool get_mp3_metadata(int fd, struct mp3entry *entry, const char *filename)
1175 #if CONFIG_CODEC != SWCODEC
1176 memset(entry, 0, sizeof(struct mp3entry));
1177 #endif
1179 strncpy(entry->path, filename, sizeof(entry->path));
1181 entry->title = NULL;
1182 entry->filesize = filesize(fd);
1183 entry->id3v2len = getid3v2len(fd);
1184 entry->tracknum = 0;
1185 entry->discnum = 0;
1187 if (entry->id3v2len)
1188 setid3v2title(fd, entry);
1189 int len = getsonglength(fd, entry);
1190 if (len < 0)
1191 return false;
1192 entry->length = len;
1194 /* Subtract the meta information from the file size to get
1195 the true size of the MP3 stream */
1196 entry->filesize -= entry->first_frame_offset;
1198 /* only seek to end of file if no id3v2 tags were found */
1199 if (!entry->id3v2len) {
1200 setid3v1title(fd, entry);
1203 if(!entry->length || (entry->filesize < 8 ))
1204 /* no song length or less than 8 bytes is hereby considered to be an
1205 invalid mp3 and won't be played by us! */
1206 return false;
1208 return true;
/*
 * Opens the named file read-only, collects its metadata into entry via
 * get_mp3_metadata() and closes the file again.
 *
 * Note the inverted convention compared to get_mp3_metadata():
 * this returns false for success and true for error!
 */
bool mp3info(struct mp3entry *entry, const char *filename)
{
    const int fd = open(filename, O_RDONLY);

    /* Could not open the file at all */
    if (fd < 0)
        return true;

    const bool failed = !get_mp3_metadata(fd, entry, filename);

    close(fd);

    return failed;
}
1228 void adjust_mp3entry(struct mp3entry *entry, void *dest, void *orig)
1230 long offset;
1231 if (orig > dest)
1232 offset = - ((size_t)orig - (size_t)dest);
1233 else
1234 offset = (size_t)dest - (size_t)orig;
1236 if (entry->title)
1237 entry->title += offset;
1238 if (entry->artist)
1239 entry->artist += offset;
1240 if (entry->album)
1241 entry->album += offset;
1242 if (entry->genre_string && !id3_is_genre_string(entry->genre_string))
1243 /* Don't adjust that if it points to an entry of the "genres" array */
1244 entry->genre_string += offset;
1245 if (entry->track_string)
1246 entry->track_string += offset;
1247 if (entry->disc_string)
1248 entry->disc_string += offset;
1249 if (entry->year_string)
1250 entry->year_string += offset;
1251 if (entry->composer)
1252 entry->composer += offset;
1253 if (entry->comment)
1254 entry->comment += offset;
1255 if (entry->albumartist)
1256 entry->albumartist += offset;
1257 if (entry->grouping)
1258 entry->grouping += offset;
1259 #if CONFIG_CODEC == SWCODEC
1260 if (entry->track_gain_string)
1261 entry->track_gain_string += offset;
1262 if (entry->album_gain_string)
1263 entry->album_gain_string += offset;
1264 #endif
1267 void copy_mp3entry(struct mp3entry *dest, struct mp3entry *orig)
1269 memcpy(dest, orig, sizeof(struct mp3entry));
1270 adjust_mp3entry(dest, dest, orig);
1273 #ifdef DEBUG_STANDALONE
/*
 * Formats a duration given in milliseconds as "M:SS.T" (minutes, two-digit
 * seconds, tenths of a second).
 *
 * Returns a pointer to a static buffer that is overwritten by the next call.
 */
char *secs2str(int ms)
{
    static char text[32];
    const int whole_secs = ms / 1000;
    const int tenths = (ms % 1000) / 100;

    snprintf(text, sizeof(text), "%d:%02d.%d",
             whole_secs / 60, whole_secs % 60, tenths);

    return text;
}
1284 int main(int argc, char **argv)
1286 int i;
1287 for(i=1; i<argc; i++) {
1288 struct mp3entry mp3;
1289 mp3.album = "Bogus";
1290 if(mp3info(&mp3, argv[i], false)) {
1291 printf("Failed to get %s\n", argv[i]);
1292 return 0;
1295 printf("****** File: %s\n"
1296 " Title: %s\n"
1297 " Artist: %s\n"
1298 " Album: %s\n"
1299 " Genre: %s (%d) \n"
1300 " Composer: %s\n"
1301 " Year: %s (%d)\n"
1302 " Track: %s (%d)\n"
1303 " Length: %s / %d s\n"
1304 " Bitrate: %d\n"
1305 " Frequency: %d\n",
1306 argv[i],
1307 mp3.title?mp3.title:"<blank>",
1308 mp3.artist?mp3.artist:"<blank>",
1309 mp3.album?mp3.album:"<blank>",
1310 mp3.genre_string?mp3.genre_string:"<blank>",
1311 mp3.genre,
1312 mp3.composer?mp3.composer:"<blank>",
1313 mp3.year_string?mp3.year_string:"<blank>",
1314 mp3.year,
1315 mp3.track_string?mp3.track_string:"<blank>",
1316 mp3.tracknum,
1317 secs2str(mp3.length),
1318 mp3.length/1000,
1319 mp3.bitrate,
1320 mp3.frequency);
1323 return 0;
1326 #endif