Fix FS#8196 - Gather Runtime Data > User Rating not working
[Rockbox.git] / firmware / id3.c
blobe2f45468b224bdb0b43d207fc0a3717edac1d442
1 /***************************************************************************
2 * __________ __ ___.
3 * Open \______ \ ____ ____ | | _\_ |__ _______ ___
4 * Source | _// _ \_/ ___\| |/ /| __ \ / _ \ \/ /
5 * Jukebox | | ( <_> ) \___| < | \_\ ( <_> > < <
6 * Firmware |____|_ /\____/ \___ >__|_ \|___ /\____/__/\_ \
7 * \/ \/ \/ \/ \/
8 * $Id$
10 * Copyright (C) 2002 by Daniel Stenberg
12 * All files in this archive are subject to the GNU General Public License.
13 * See the file COPYING in the source tree root for full license agreement.
15 * This software is distributed on an "AS IS" basis, WITHOUT WARRANTY OF ANY
16 * KIND, either express or implied.
18 ****************************************************************************/
20 * Parts of this code have been stolen from the Ample project and were written
21 * by David Härdeman. It has since been extended and enhanced pretty much by
22 * all sorts of friendly Rockbox people.
26 /* tagResolver and associated code copyright 2003 Thomas Paul Diffenbach
29 #include <stdio.h>
30 #include <stdlib.h>
31 #include <string.h>
32 #include <errno.h>
33 #include <stdbool.h>
34 #include <stddef.h>
35 #include <ctype.h>
36 #include "config.h"
37 #include "file.h"
38 #include "logf.h"
39 #include "atoi.h"
41 #include "id3.h"
42 #include "mp3data.h"
43 #include "system.h"
44 #include "replaygain.h"
45 #include "rbunicode.h"
47 /** Database of audio formats **/
48 const struct afmt_entry audio_formats[AFMT_NUM_CODECS] =
50 /* Unknown file format */
51 [AFMT_UNKNOWN] =
52 AFMT_ENTRY("???", NULL, NULL, NULL ),
54 /* MPEG Audio layer 1 */
55 [AFMT_MPA_L1] =
56 AFMT_ENTRY("MP1", "mpa", NULL, "mp1\0" ),
57 /* MPEG Audio layer 2 */
58 [AFMT_MPA_L2] =
59 AFMT_ENTRY("MP2", "mpa", NULL, "mpa\0mp2\0" ),
60 /* MPEG Audio layer 3 */
61 [AFMT_MPA_L3] =
62 AFMT_ENTRY("MP3", "mpa", "mp3_enc", "mp3\0" ),
64 #if CONFIG_CODEC == SWCODEC
65 /* Audio Interchange File Format */
66 [AFMT_AIFF] =
67 AFMT_ENTRY("AIFF", "aiff", "aiff_enc", "aiff\0aif\0"),
68 /* Uncompressed PCM in a WAV file */
69 [AFMT_PCM_WAV] =
70 AFMT_ENTRY("WAV", "wav", "wav_enc", "wav\0" ),
71 /* Ogg Vorbis */
72 [AFMT_OGG_VORBIS] =
73 AFMT_ENTRY("Ogg", "vorbis", NULL, "ogg\0" ),
74 /* FLAC */
75 [AFMT_FLAC] =
76 AFMT_ENTRY("FLAC", "flac", NULL, "flac\0" ),
77 /* Musepack */
78 [AFMT_MPC] =
79 AFMT_ENTRY("MPC", "mpc", NULL, "mpc\0" ),
80 /* A/52 (aka AC3) audio */
81 [AFMT_A52] =
82 AFMT_ENTRY("AC3", "a52", NULL, "a52\0ac3\0" ),
83 /* WavPack */
84 [AFMT_WAVPACK] =
85 AFMT_ENTRY("WV", "wavpack", "wavpack_enc", "wv\0" ),
86 /* Apple Lossless Audio Codec */
87 [AFMT_ALAC] =
88 AFMT_ENTRY("ALAC", "alac", NULL, "m4a\0m4b\0" ),
89 /* Advanced Audio Coding in M4A container */
90 [AFMT_AAC] =
91 AFMT_ENTRY("AAC", "aac", NULL, "mp4\0" ),
92 /* Shorten */
93 [AFMT_SHN] =
94 AFMT_ENTRY("SHN", "shorten", NULL, "shn\0" ),
95 /* SID File Format */
96 [AFMT_SID] =
97 AFMT_ENTRY("SID", "sid", NULL, "sid\0" ),
98 /* ADX File Format */
99 [AFMT_ADX] =
100 AFMT_ENTRY("ADX", "adx", NULL, "adx\0" ),
101 /* NESM (NES Sound Format) */
102 [AFMT_NSF] =
103 AFMT_ENTRY("NSF", "nsf", NULL, "nsf\0nsfe\0" ),
104 /* Speex File Format */
105 [AFMT_SPEEX] =
106 AFMT_ENTRY("Speex","speex", NULL, "spx\0" ),
107 /* SPC700 Save State */
108 [AFMT_SPC] =
109 AFMT_ENTRY("SPC", "spc", NULL, "spc\0" ),
110 /* APE (Monkey's Audio) */
111 [AFMT_APE] =
112 AFMT_ENTRY("APE", "ape", NULL, "ape\0mac\0" ),
113 /* WMA (WMAV1/V2 in ASF) */
114 [AFMT_WMA] =
115 AFMT_ENTRY("WMA", "wma", NULL, "wma\0wmv\0asf\0" ),
116 #endif
119 #if CONFIG_CODEC == SWCODEC && defined (HAVE_RECORDING)
120 /* get REC_FORMAT_* corresponding AFMT_* */
121 const int rec_format_afmt[REC_NUM_FORMATS] =
123 /* give AFMT_UNKNOWN by default */
124 [0 ... REC_NUM_FORMATS-1] = AFMT_UNKNOWN,
125 /* add new entries below this line */
126 [REC_FORMAT_AIFF] = AFMT_AIFF,
127 [REC_FORMAT_MPA_L3] = AFMT_MPA_L3,
128 [REC_FORMAT_WAVPACK] = AFMT_WAVPACK,
129 [REC_FORMAT_PCM_WAV] = AFMT_PCM_WAV,
132 /* get AFMT_* corresponding REC_FORMAT_* */
133 const int afmt_rec_format[AFMT_NUM_CODECS] =
135 /* give -1 by default */
136 [0 ... AFMT_NUM_CODECS-1] = -1,
137 /* add new entries below this line */
138 [AFMT_AIFF] = REC_FORMAT_AIFF,
139 [AFMT_MPA_L3] = REC_FORMAT_MPA_L3,
140 [AFMT_WAVPACK] = REC_FORMAT_WAVPACK,
141 [AFMT_PCM_WAV] = REC_FORMAT_PCM_WAV,
143 #endif /* CONFIG_CODEC == SWCODEC && defined (HAVE_RECORDING) */
144 /****/
/*
 * Combines four bytes into one 28-bit value, taking only the low 7 bits of
 * each byte (the top bit of every byte is ignored).
 *
 * Arguments: b0 - most significant byte
 *            b1, b2 - middle bytes
 *            b3 - least significant byte
 *
 * Returns: (b0 & 0x7F) << 21 | (b1 & 0x7F) << 14 | (b2 & 0x7F) << 7 |
 *          (b3 & 0x7F)
 */
unsigned long unsync(unsigned long b0,
                     unsigned long b1,
                     unsigned long b2,
                     unsigned long b3)
{
    /* Stay in unsigned arithmetic; the result never exceeds 28 bits */
    return ((b0 & 0x7F) << (3*7)) |
           ((b1 & 0x7F) << (2*7)) |
           ((b2 & 0x7F) << (1*7)) |
           ((b3 & 0x7F) << (0*7));
}
/* Genre names, indexed by numeric genre id (see id3_get_num_genre()). */
static const char* const genres[] = {
    "Blues", "Classic Rock", "Country", "Dance", "Disco", "Funk", "Grunge",
    "Hip-Hop", "Jazz", "Metal", "New Age", "Oldies", "Other", "Pop", "R&B",
    "Rap", "Reggae", "Rock", "Techno", "Industrial", "Alternative", "Ska",
    "Death Metal", "Pranks", "Soundtrack", "Euro-Techno", "Ambient", "Trip-Hop",
    "Vocal", "Jazz+Funk", "Fusion", "Trance", "Classical", "Instrumental",
    "Acid", "House", "Game", "Sound Clip", "Gospel", "Noise", "AlternRock",
    "Bass", "Soul", "Punk", "Space", "Meditative", "Instrumental Pop",
    "Instrumental Rock", "Ethnic", "Gothic", "Darkwave", "Techno-Industrial",
    "Electronic", "Pop-Folk", "Eurodance", "Dream", "Southern Rock", "Comedy",
    "Cult", "Gangsta", "Top 40", "Christian Rap", "Pop/Funk", "Jungle",
    "Native American", "Cabaret", "New Wave", "Psychadelic", "Rave",
    "Showtunes", "Trailer", "Lo-Fi", "Tribal", "Acid Punk", "Acid Jazz",
    "Polka", "Retro", "Musical", "Rock & Roll", "Hard Rock",

    /* winamp extensions */
    "Folk", "Folk-Rock", "National Folk", "Swing", "Fast Fusion", "Bebob",
    "Latin", "Revival", "Celtic", "Bluegrass", "Avantgarde", "Gothic Rock",
    "Progressive Rock", "Psychedelic Rock", "Symphonic Rock", "Slow Rock",
    "Big Band", "Chorus", "Easy Listening", "Acoustic", "Humour", "Speech",
    "Chanson", "Opera", "Chamber Music", "Sonata", "Symphony", "Booty Bass",
    "Primus", "Porn Groove", "Satire", "Slow Jam", "Club", "Tango", "Samba",
    "Folklore", "Ballad", "Power Ballad", "Rhythmic Soul", "Freestyle",
    "Duet", "Punk Rock", "Drum Solo", "A capella", "Euro-House", "Dance Hall",
    "Goa", "Drum & Bass", "Club-House", "Hardcore", "Terror", "Indie",
    "BritPop", "Negerpunk", "Polsk Punk", "Beat", "Christian Gangsta Rap",
    "Heavy Metal", "Black Metal", "Crossover", "Contemporary Christian",
    "Christian Rock", "Merengue", "Salsa", "Thrash Metal", "Anime", "Jpop",
    "Synthpop"
};
188 char* id3_get_num_genre(const unsigned int genre_num)
190 if (genre_num < sizeof(genres)/sizeof(char*))
191 return (char*)genres[genre_num];
192 return NULL;
195 /* True if the string is from the "genres" array */
196 static bool id3_is_genre_string(const char *string)
198 return ( string >= genres[0] &&
199 string <= genres[sizeof(genres)/sizeof(char*) - 1] );
202 char* id3_get_codec(const struct mp3entry* id3)
204 if (id3->codectype < AFMT_NUM_CODECS) {
205 return (char*)audio_formats[id3->codectype].label;
206 } else {
207 return NULL;
212 HOW TO ADD ADDITIONAL ID3 VERSION 2 TAGS
213 Code and comments by Thomas Paul Diffenbach
215 To add another ID3v2 Tag, do the following:
216 1. add a char* named for the tag to struct mp3entry in id3.h,
217 (I (tpd) prefer to use char* rather than ints, even for what seems like
218 numerical values, for cases where a number won't do, e.g.,
219 YEAR: "circa 1765", "1790/1977" (composed/performed), "28 Feb 1969"
220 TRACK: "1/12", "1 of 12", GENRE: "Freeform genre name"
221 Text is more flexible, and as the main use of id3 data is to
222 display it, converting it to an int just means reconverting to
223 display it, at a runtime cost.)
225 2. If any special processing beyond copying the tag value from the Id3
226 block to the struct mp3entry is required (such as converting to an
227 int), write a function to perform this special processing.
229 This function's prototype must match that of
230 typedef tagPostProcessFunc, that is it must be:
231 int func( struct mp3entry*, char* tag, int bufferpos )
232 the first argument is a pointer to the current mp3entry structure the
233 second argument is a pointer to the null terminated string value of the
234 tag found the third argument is the offset of the next free byte in the
235 mp3entry's buffer your function should return the corrected offset; if
236 you don't lengthen or shorten the tag string, you can return the third
237 argument unchanged.
239 Unless you have a good reason not to, make the function static.
240 TO JUST COPY THE TAG NO SPECIAL PROCESSING FUNCTION IS NEEDED.
242 3. add one or more entries to the tagList array, using the format:
243 char* ID3 Tag symbolic name -- see the ID3 specification for these,
244 sizeof() that name minus 1,
245 offsetof( struct mp3entry, variable_name_in_struct_mp3entry ),
246 pointer to your special processing function or NULL
247 if you need no special processing
248 flag indicating if this tag is binary or textual
249 Many ID3 symbolic names come in more than one form. You can add both
250 forms, each referencing the same variable in struct mp3entry.
251 If both forms are present, the last found will be used.
252 Note that the offset can be zero, in which case no entry will be set
253 in the mp3entry struct; the frame is still read into the buffer and
254 the special processing function is called (several times, if there
255 are several frames with the same name).
257 4. Alternately, use the TAG_LIST_ENTRY macro with
258 ID3 tag symbolic name,
259 variable in struct mp3entry,
260 special processing function address
262 5. Add code to wps-display.c function get_tag to assign a printf-like
263 format specifier for the tag */
/* Structure for ID3 Tag extraction information */
struct tag_resolver {
    /* Frame identifier as it appears in the file, e.g. "TIT2" */
    const char* tag;
    /* Number of identifier characters to compare (3 or 4 in taglist) */
    int tag_length;
    /* Byte offset of the char* member in struct mp3entry that receives the
       string, or 0 if no member is to be set */
    size_t offset;
    /* Optional post-processing hook; returns the new buffer position */
    int (*ppFunc)(struct mp3entry*, char* tag, int bufferpos);
    /* True if the frame body is binary and must not be text-converted */
    bool binary;
};
/* Unsynchronization state shared by read_unsynched() and skip_unsynched():
 * true when the last byte handled was 0xFF, so that a 0xFF/0x00 pair split
 * across two reads is still recognised. Reset by setid3v2title(). */
static bool global_ff_found;
/*
 * Reverses ID3v2 unsynchronization in place: every 0x00 byte that directly
 * follows a 0xFF byte is dropped and the rest of the data is moved down.
 *
 * Arguments: tag - buffer to filter in place
 *            len - number of bytes in the buffer
 *            ff_found - in/out state: true if the byte preceding this
 *                       buffer was 0xFF; updated for the next call
 *
 * Returns: the number of bytes left in the buffer after filtering
 */
static int unsynchronize(char* tag, int len, bool *ff_found)
{
    unsigned char *rp = (unsigned char *)tag;   /* read position */
    unsigned char *wp = rp;                     /* write position */
    int i;

    for (i = 0; i < len; i++) {
        /* Read the next byte and write it back, but don't increment the
           write pointer yet */
        unsigned char c = *rp++;
        *wp = c;

        if (*ff_found) {
            /* Keep the byte unless it completes an unsynch pattern */
            if (c != 0)
                wp++;
            *ff_found = false;
        } else {
            if (c == 0xff)
                *ff_found = true;
            wp++;
        }
    }

    /* Pointer difference instead of casting pointers to long */
    return (int)(wp - (unsigned char *)tag);
}
/*
 * Reverses unsynchronization on one self-contained frame, i.e. with no
 * 0xFF carried over from earlier data.
 *
 * Returns: the number of bytes left in the buffer after filtering
 */
static int unsynchronize_frame(char* tag, int len)
{
    bool ff_found = false;

    return unsynchronize(tag, len, &ff_found);
}
311 static int read_unsynched(int fd, void *buf, int len)
313 int i;
314 int rc;
315 int remaining = len;
316 char *wp;
317 char *rp;
319 wp = buf;
321 while(remaining) {
322 rp = wp;
323 rc = read(fd, rp, remaining);
324 if(rc <= 0)
325 return rc;
327 i = unsynchronize(wp, remaining, &global_ff_found);
328 remaining -= i;
329 wp += i;
332 return len;
335 static int skip_unsynched(int fd, int len)
337 int rc;
338 int remaining = len;
339 int rlen;
340 char buf[32];
342 while(remaining) {
343 rlen = MIN(sizeof(buf), (unsigned int)remaining);
344 rc = read(fd, buf, rlen);
345 if(rc <= 0)
346 return rc;
348 remaining -= unsynchronize(buf, rlen, &global_ff_found);
351 return len;
354 /* parse numeric value from string */
355 static int parsetracknum( struct mp3entry* entry, char* tag, int bufferpos )
357 entry->tracknum = atoi( tag );
358 return bufferpos;
361 /* parse numeric value from string */
362 static int parsediscnum( struct mp3entry* entry, char* tag, int bufferpos )
364 entry->discnum = atoi( tag );
365 return bufferpos;
368 /* parse numeric value from string */
369 static int parseyearnum( struct mp3entry* entry, char* tag, int bufferpos )
371 entry->year = atoi( tag );
372 return bufferpos;
375 /* parse numeric genre from string, version 2.2 and 2.3 */
376 static int parsegenre( struct mp3entry* entry, char* tag, int bufferpos )
378 if(entry->id3version >= ID3_VER_2_4) {
379 /* In version 2.4 and up, there are no parentheses, and the genre frame
380 is a list of strings, either numbers or text. */
382 /* Is it a number? */
383 if(isdigit(tag[0])) {
384 entry->genre_string = id3_get_num_genre(atoi( tag ));
385 return tag - entry->id3v2buf;
386 } else {
387 entry->genre_string = tag;
388 return bufferpos;
390 } else {
391 if( tag[0] == '(' && tag[1] != '(' ) {
392 entry->genre_string = id3_get_num_genre(atoi( tag + 1 ));
393 return tag - entry->id3v2buf;
395 else {
396 entry->genre_string = tag;
397 return bufferpos;
402 #if CONFIG_CODEC == SWCODEC
403 /* parse user defined text, looking for replaygain information. */
404 static int parseuser( struct mp3entry* entry, char* tag, int bufferpos )
406 char* value = NULL;
407 int desc_len = strlen(tag);
408 int value_len = 0;
410 if ((tag - entry->id3v2buf + desc_len + 2) < bufferpos) {
411 /* At least part of the value was read, so we can safely try to
412 * parse it
414 value = tag + desc_len + 1;
415 value_len = parse_replaygain(tag, value, entry, tag,
416 bufferpos - (tag - entry->id3v2buf));
419 return tag - entry->id3v2buf + value_len;
422 /* parse RVA2 binary data and convert to replaygain information. */
423 static int parserva2( struct mp3entry* entry, char* tag, int bufferpos )
425 int desc_len = strlen(tag);
426 int end_pos = tag - entry->id3v2buf + desc_len + 5;
427 int value_len = 0;
428 unsigned char* value = tag + desc_len + 1;
430 /* Only parse RVA2 replaygain tags if tag version == 2.4 and channel
431 * type is master volume.
433 if (entry->id3version == ID3_VER_2_4 && end_pos < bufferpos
434 && *value++ == 1) {
435 long gain = 0;
436 long peak = 0;
437 long peakbits;
438 long peakbytes;
439 bool album = false;
441 /* The RVA2 specification is unclear on some things (id string and
442 * peak volume), but this matches how Quod Libet use them.
445 gain = (int16_t) ((value[0] << 8) | value[1]);
446 value += 2;
447 peakbits = *value++;
448 peakbytes = (peakbits + 7) / 8;
450 /* Only use the topmost 24 bits for peak volume */
451 if (peakbytes > 3) {
452 peakbytes = 3;
455 /* Make sure the peak bits were read */
456 if (end_pos + peakbytes < bufferpos) {
457 long shift = ((8 - (peakbits & 7)) & 7) + (3 - peakbytes) * 8;
459 for ( ; peakbytes; peakbytes--) {
460 peak <<= 8;
461 peak += *value++;
464 peak <<= shift;
466 if (peakbits > 24) {
467 peak += *value >> (8 - shift);
471 if (strcasecmp(tag, "album") == 0) {
472 album = true;
473 } else if (strcasecmp(tag, "track") != 0) {
474 gain = 0;
477 value_len = parse_replaygain_int(album, gain, peak * 2, entry,
478 tag, sizeof(entry->id3v2buf) - (tag - entry->id3v2buf));
481 return tag - entry->id3v2buf + value_len;
483 #endif
485 static const struct tag_resolver taglist[] = {
486 { "TPE1", 4, offsetof(struct mp3entry, artist), NULL, false },
487 { "TP1", 3, offsetof(struct mp3entry, artist), NULL, false },
488 { "TIT2", 4, offsetof(struct mp3entry, title), NULL, false },
489 { "TT2", 3, offsetof(struct mp3entry, title), NULL, false },
490 { "TALB", 4, offsetof(struct mp3entry, album), NULL, false },
491 { "TAL", 3, offsetof(struct mp3entry, album), NULL, false },
492 { "TRK", 3, offsetof(struct mp3entry, track_string), &parsetracknum, false },
493 { "TPOS", 4, offsetof(struct mp3entry, disc_string), &parsediscnum, false },
494 { "TRCK", 4, offsetof(struct mp3entry, track_string), &parsetracknum, false },
495 { "TDRC", 4, offsetof(struct mp3entry, year_string), &parseyearnum, false },
496 { "TYER", 4, offsetof(struct mp3entry, year_string), &parseyearnum, false },
497 { "TYE", 3, offsetof(struct mp3entry, year_string), &parseyearnum, false },
498 { "TCOM", 4, offsetof(struct mp3entry, composer), NULL, false },
499 { "TPE2", 4, offsetof(struct mp3entry, albumartist), NULL, false },
500 { "TP2", 3, offsetof(struct mp3entry, albumartist), NULL, false },
501 { "TIT1", 4, offsetof(struct mp3entry, grouping), NULL, false },
502 { "TT1", 3, offsetof(struct mp3entry, grouping), NULL, false },
503 { "COMM", 4, offsetof(struct mp3entry, comment), NULL, false },
504 { "TCON", 4, offsetof(struct mp3entry, genre_string), &parsegenre, false },
505 { "TCO", 3, offsetof(struct mp3entry, genre_string), &parsegenre, false },
506 #if CONFIG_CODEC == SWCODEC
507 { "TXXX", 4, 0, &parseuser, false },
508 { "RVA2", 4, 0, &parserva2, true },
509 #endif
512 #define TAGLIST_SIZE ((int)(sizeof(taglist) / sizeof(taglist[0])))
/* Get the length of an ID3 string in the given encoding. Returns the length
 * in bytes, including the terminator.
 *
 * Encodings 0x01 and 0x02 are scanned two bytes at a time and end at a pair
 * of zero bytes; every other encoding value is treated as a plain
 * NUL-terminated byte string. The string must be terminated accordingly;
 * no bound is applied.
 */
static int unicode_len(char encoding, const void* string)
{
    const char *s = string;

    if (encoding != 0x01 && encoding != 0x02)
        return (int)strlen(s) + 1;

    /* string might be unaligned, so using short* can crash on ARM and SH1;
       read the two bytes of each character separately instead */
    for (;;) {
        char first = *s++;
        char second = *s++;

        if ((first | second) == 0)
            break;
    }

    return (int)(s - (const char *)string);
}
/* Converts the text of an ID3v2 frame to UTF-8.
 *
 * The first byte of string selects the source encoding:
 *   0x00        8-bit text, converted with iso_decode()
 *   0x01, 0x02  16-bit text, with or without byte order mark; the frame may
 *               hold several terminated strings (needed for TXXX frames)
 *   0x03        UTF-8, copied as it is
 *   other       the whole buffer is treated as 8-bit text
 *
 * Arguments: string - frame data, starting with the encoding byte
 *            utf8buf - receives the converted text
 *            len - in: number of bytes in string
 *                  out: number of bytes the caller should take from utf8buf
 *
 * Returns: always 0
 */
static int unicode_munge(char* string, char* utf8buf, int *len) {
    long tmp;
    bool le = false;
    int i = 0;
    unsigned char *str = (unsigned char *)string;
    int templen = 0;
    unsigned char* utf8 = (unsigned char *)utf8buf;

    switch (str[0]) {
        case 0x00: /* Type 0x00 is ordinary ISO 8859-1 */
            str++;
            (*len)--;
            utf8 = iso_decode(str, utf8, -1, *len);
            *utf8 = 0;
            *len = utf8 - (unsigned char *)utf8buf;
            break;

        case 0x01: /* Unicode with or without BOM */
        case 0x02:
            (*len)--;
            str++;

            /* Handle frames with more than one string
               (needed for TXXX frames).*/
            do {
                tmp = bytes2int(0, 0, str[0], str[1]);

                /* Now check if there is a BOM
                   (zero-width non-breaking space, 0xfeff)
                   and if it is in little or big endian format */
                if(tmp == 0xfffe) { /* Little endian? */
                    le = true;
                    str += 2;
                    (*len)-=2;
                } else if(tmp == 0xfeff) { /* Big endian? */
                    /* An explicit BOM overrides whatever byte order an
                       earlier string in the same frame used */
                    le = false;
                    str += 2;
                    (*len)-=2;
                } else
                /* If there is no BOM (which is a specification violation),
                   let's try to guess it. If one of the bytes is 0x00, it is
                   probably the most significant one. */
                    if(str[1] == 0)
                        le = true;

                do {
                    if(le)
                        utf8 = utf16LEdecode(str, utf8, 1);
                    else
                        utf8 = utf16BEdecode(str, utf8, 1);

                    str+=2;
                    i += 2;
                } while((str[0] || str[1]) && (i < *len));

                *utf8++ = 0; /* Terminate the string */
                templen += (strlen(&utf8buf[templen]) + 1);
                /* Step over the 16-bit terminator */
                str += 2;
                i+=2;
            } while(i < *len);
            *len = templen - 1;
            break;

        case 0x03: /* UTF-8 encoded string */
            /* Drop the encoding byte first so that only bytes belonging to
               the frame are copied */
            (*len)--;
            for(i=0; i < *len; i++)
                utf8[i] = str[i+1];
            break;

        default: /* Plain old string */
            utf8 = iso_decode(str, utf8, -1, *len);
            *utf8 = 0;
            *len = utf8 - (unsigned char *)utf8buf;
            break;
    }
    return 0;
}
618 * Sets the title of an MP3 entry based on its ID3v1 tag.
620 * Arguments: file - the MP3 file to scen for a ID3v1 tag
621 * entry - the entry to set the title in
623 * Returns: true if a title was found and created, else false
625 static bool setid3v1title(int fd, struct mp3entry *entry)
627 unsigned char buffer[128];
628 static const char offsets[] = {3, 33, 63, 97, 93, 125, 127};
629 int i, j;
630 unsigned char* utf8;
632 if (-1 == lseek(fd, -128, SEEK_END))
633 return false;
635 if (read(fd, buffer, sizeof buffer) != sizeof buffer)
636 return false;
638 if (strncmp((char *)buffer, "TAG", 3))
639 return false;
641 entry->id3v1len = 128;
642 entry->id3version = ID3_VER_1_0;
644 for (i=0; i < (int)sizeof offsets; i++) {
645 unsigned char* ptr = (unsigned char *)buffer + offsets[i];
647 switch(i) {
648 case 0:
649 case 1:
650 case 2:
651 /* kill trailing space in strings */
652 for (j=29; j && (ptr[j]==0 || ptr[j]==' '); j--)
653 ptr[j] = 0;
654 /* convert string to utf8 */
655 utf8 = (unsigned char *)entry->id3v1buf[i];
656 utf8 = iso_decode(ptr, utf8, -1, 30);
657 /* make sure string is terminated */
658 *utf8 = 0;
659 break;
661 case 3:
662 /* kill trailing space in strings */
663 for (j=27; j && (ptr[j]==0 || ptr[j]==' '); j--)
664 ptr[j] = 0;
665 /* convert string to utf8 */
666 utf8 = (unsigned char *)entry->id3v1buf[3];
667 utf8 = iso_decode(ptr, utf8, -1, 28);
668 /* make sure string is terminated */
669 *utf8 = 0;
670 break;
672 case 4:
673 ptr[4] = 0;
674 entry->year = atoi((char *)ptr);
675 break;
677 case 5:
678 /* id3v1.1 uses last two bytes of comment field for track
679 number: first must be 0 and second is track num */
680 if (!ptr[0] && ptr[1]) {
681 entry->tracknum = ptr[1];
682 entry->id3version = ID3_VER_1_1;
684 break;
686 case 6:
687 /* genre */
688 entry->genre_string = id3_get_num_genre(ptr[0]);
689 break;
693 entry->title = entry->id3v1buf[0];
694 entry->artist = entry->id3v1buf[1];
695 entry->album = entry->id3v1buf[2];
696 entry->comment = entry->id3v1buf[3];
698 return true;
703 * Sets the title of an MP3 entry based on its ID3v2 tag.
705 * Arguments: file - the MP3 file to scan for a ID3v2 tag
706 * entry - the entry to set the title in
708 * Returns: true if a title was found and created, else false
710 static void setid3v2title(int fd, struct mp3entry *entry)
712 int minframesize;
713 int size;
714 long bufferpos = 0, totframelen, framelen;
715 char header[10];
716 char tmp[4];
717 unsigned char version;
718 char *buffer = entry->id3v2buf;
719 int bytesread = 0;
720 int buffersize = sizeof(entry->id3v2buf);
721 unsigned char global_flags;
722 int flags;
723 int skip;
724 bool global_unsynch = false;
725 bool unsynch = false;
726 int data_length_ind;
727 int i, j;
728 int rc;
730 global_ff_found = false;
732 /* Bail out if the tag is shorter than 10 bytes */
733 if(entry->id3v2len < 10)
734 return;
736 /* Read the ID3 tag version from the header */
737 lseek(fd, 0, SEEK_SET);
738 if(10 != read(fd, header, 10))
739 return;
741 /* Get the total ID3 tag size */
742 size = entry->id3v2len - 10;
744 version = header[3];
745 switch ( version ) {
746 case 2:
747 version = ID3_VER_2_2;
748 minframesize = 8;
749 break;
751 case 3:
752 version = ID3_VER_2_3;
753 minframesize = 12;
754 break;
756 case 4:
757 version = ID3_VER_2_4;
758 minframesize = 12;
759 break;
761 default:
762 /* unsupported id3 version */
763 return;
765 entry->id3version = version;
766 entry->tracknum = entry->year = entry->discnum = 0;
767 entry->title = entry->artist = entry->album = NULL; /* FIXME incomplete */
769 global_flags = header[5];
771 /* Skip the extended header if it is present */
772 if(global_flags & 0x40) {
773 if(version == ID3_VER_2_3) {
774 if(10 != read(fd, header, 10))
775 return;
776 /* The 2.3 extended header size doesn't include the header size
777 field itself. Also, it is not unsynched. */
778 framelen =
779 bytes2int(header[0], header[1], header[2], header[3]) + 4;
781 /* Skip the rest of the header */
782 lseek(fd, framelen - 10, SEEK_CUR);
785 if(version >= ID3_VER_2_4) {
786 if(4 != read(fd, header, 4))
787 return;
789 /* The 2.4 extended header size does include the entire header,
790 so here we can just skip it. This header is unsynched. */
791 framelen = unsync(header[0], header[1],
792 header[2], header[3]);
794 lseek(fd, framelen - 4, SEEK_CUR);
798 /* Is unsynchronization applied? */
799 if(global_flags & 0x80) {
800 global_unsynch = true;
804 * We must have at least minframesize bytes left for the
805 * remaining frames to be interesting
807 while (size >= minframesize && bufferpos < buffersize - 1) {
808 flags = 0;
810 /* Read frame header and check length */
811 if(version >= ID3_VER_2_3) {
812 if(global_unsynch && version <= ID3_VER_2_3)
813 rc = read_unsynched(fd, header, 10);
814 else
815 rc = read(fd, header, 10);
816 if(rc != 10)
817 return;
818 /* Adjust for the 10 bytes we read */
819 size -= 10;
821 flags = bytes2int(0, 0, header[8], header[9]);
823 if (version >= ID3_VER_2_4) {
824 framelen = unsync(header[4], header[5],
825 header[6], header[7]);
826 } else {
827 /* version .3 files don't use synchsafe ints for
828 * size */
829 framelen = bytes2int(header[4], header[5],
830 header[6], header[7]);
832 } else {
833 if(6 != read(fd, header, 6))
834 return;
835 /* Adjust for the 6 bytes we read */
836 size -= 6;
838 framelen = bytes2int(0, header[3], header[4], header[5]);
841 /* Keep track of the total size */
842 totframelen = framelen;
844 logf("framelen = %ld", framelen);
845 if(framelen == 0){
846 if (header[0] == 0 && header[1] == 0 && header[2] == 0)
847 return;
848 else
849 continue;
852 unsynch = false;
853 data_length_ind = 0;
855 if(flags)
857 skip = 0;
859 if (version >= ID3_VER_2_4) {
860 if(flags & 0x0040) { /* Grouping identity */
861 lseek(fd, 1, SEEK_CUR); /* Skip 1 byte */
862 framelen--;
864 } else {
865 if(flags & 0x0020) { /* Grouping identity */
866 lseek(fd, 1, SEEK_CUR); /* Skip 1 byte */
867 framelen--;
871 if(flags & 0x000c) /* Compression or encryption */
873 /* Skip it using the total size in case
874 it was truncated */
875 size -= totframelen;
876 lseek(fd, totframelen, SEEK_CUR);
877 continue;
880 if(flags & 0x0002) /* Unsynchronization */
881 unsynch = true;
883 if (version >= ID3_VER_2_4) {
884 if(flags & 0x0001) { /* Data length indicator */
885 if(4 != read(fd, tmp, 4))
886 return;
888 data_length_ind = unsync(tmp[0], tmp[1], tmp[2], tmp[3]);
889 framelen -= 4;
894 /* If the frame is larger than the remaining buffer space we try
895 to read as much as would fit in the buffer */
896 if(framelen >= buffersize - bufferpos)
897 framelen = buffersize - bufferpos - 1;
899 logf("id3v2 frame: %.4s", header);
901 /* Check for certain frame headers
903 'size' is the amount of frame bytes remaining. We decrement it by
904 the amount of bytes we read. If we fail to read as many bytes as
905 we expect, we assume that we can't read from this file, and bail
906 out.
908 For each frame. we will iterate over the list of supported tags,
909 and read the tag into entry's buffer. All tags will be kept as
910 strings, for cases where a number won't do, e.g., YEAR: "circa
911 1765", "1790/1977" (composed/performed), "28 Feb 1969" TRACK:
912 "1/12", "1 of 12", GENRE: "Freeform genre name" Text is more
913 flexible, and as the main use of id3 data is to display it,
914 converting it to an int just means reconverting to display it, at a
915 runtime cost.
917 For tags that the current code does convert to ints, a post
918 processing function will be called via a pointer to function. */
920 for (i=0; i<TAGLIST_SIZE; i++) {
921 const struct tag_resolver* tr = &taglist[i];
922 char** ptag = tr->offset ? (char**) (((char*)entry) + tr->offset)
923 : NULL;
924 char* tag;
926 /* Only ID3_VER_2_2 uses frames with three-character names. */
927 if (((version == ID3_VER_2_2) && (tr->tag_length != 3))
928 || ((version > ID3_VER_2_2) && (tr->tag_length != 4))) {
929 continue;
932 /* Note that parser functions sometimes set *ptag to NULL, so
933 * the "!*ptag" check here doesn't always have the desired
934 * effect. Should the parser functions (parsegenre in
935 * particular) be updated to handle the case of being called
936 * multiple times, or should the "*ptag" check be removed?
938 if( (!ptag || !*ptag) && !memcmp( header, tr->tag, tr->tag_length ) ) {
940 /* found a tag matching one in tagList, and not yet filled */
941 tag = buffer + bufferpos;
943 if(global_unsynch && version <= ID3_VER_2_3)
944 bytesread = read_unsynched(fd, tag, framelen);
945 else
946 bytesread = read(fd, tag, framelen);
948 if( bytesread != framelen )
949 return;
951 size -= bytesread;
953 if(unsynch || (global_unsynch && version >= ID3_VER_2_4))
954 bytesread = unsynchronize_frame(tag, bytesread);
956 /* the COMM frame has a 3 char field to hold an ISO-639-1
957 * language string and an optional short description;
958 * remove them so unicode_munge can work correctly
961 if(!memcmp( header, "COMM", 4 )) {
962 int offset;
963 /* ignore comments with iTunes 7 soundcheck/gapless data */
964 if(!strncmp(tag+4, "iTun", 4))
965 break;
966 offset = 3 + unicode_len(*tag, tag + 4);
967 if(bytesread > offset) {
968 bytesread -= offset;
969 memmove(tag + 1, tag + 1 + offset, bytesread - 1);
973 /* Attempt to parse Unicode string only if the tag contents
974 aren't binary */
975 if(!tr->binary) {
976 /* UTF-8 could potentially be 3 times larger */
977 /* so we need to create a new buffer */
978 char utf8buf[(3 * bytesread) + 1];
980 unicode_munge( tag, utf8buf, &bytesread );
982 if(bytesread >= buffersize - bufferpos)
983 bytesread = buffersize - bufferpos - 1;
985 for (j = 0; j < bytesread; j++)
986 tag[j] = utf8buf[j];
988 /* remove trailing spaces */
989 while ( bytesread > 0 && isspace(tag[bytesread-1]))
990 bytesread--;
993 tag[bytesread] = 0;
994 bufferpos += bytesread + 1;
996 if (ptag)
997 *ptag = tag;
999 if( tr->ppFunc )
1000 bufferpos = tr->ppFunc(entry, tag, bufferpos);
1002 /* Seek to the next frame */
1003 if(framelen < totframelen)
1004 lseek(fd, totframelen - framelen, SEEK_CUR);
1005 break;
1009 if( i == TAGLIST_SIZE ) {
1010 /* no tag in tagList was found, or it was a repeat.
1011 skip it using the total size */
1013 if(global_unsynch && version <= ID3_VER_2_3) {
1014 size -= skip_unsynched(fd, totframelen);
1015 } else {
1016 if(data_length_ind)
1017 totframelen = data_length_ind;
1019 size -= totframelen;
1020 if( lseek(fd, totframelen, SEEK_CUR) == -1 )
1021 return;
1028 * Calculates the size of the ID3v2 tag.
1030 * Arguments: file - the file to search for a tag.
1032 * Returns: the size of the tag or 0 if none was found
1034 int getid3v2len(int fd)
1036 char buf[6];
1037 int offset;
1039 /* Make sure file has a ID3 tag */
1040 if((-1 == lseek(fd, 0, SEEK_SET)) ||
1041 (read(fd, buf, 6) != 6) ||
1042 (strncmp(buf, "ID3", strlen("ID3")) != 0))
1043 offset = 0;
1045 /* Now check what the ID3v2 size field says */
1046 else
1047 if(read(fd, buf, 4) != 4)
1048 offset = 0;
1049 else
1050 offset = unsync(buf[0], buf[1], buf[2], buf[3]) + 10;
1052 logf("ID3V2 Length: 0x%x", offset);
1053 return offset;
1057 * Calculates the length (in milliseconds) of an MP3 file.
1059 * Modified to only use integers.
1061 * Arguments: file - the file to calculate the length upon
1062 * entry - the entry to update with the length
1064 * Returns: the song length in milliseconds,
1065 * 0 means that it couldn't be calculated
1067 static int getsonglength(int fd, struct mp3entry *entry)
1069 unsigned long filetime = 0;
1070 struct mp3info info;
1071 long bytecount;
1073 /* Start searching after ID3v2 header */
1074 if(-1 == lseek(fd, entry->id3v2len, SEEK_SET))
1075 return 0;
1077 bytecount = get_mp3file_info(fd, &info);
1079 logf("Space between ID3V2 tag and first audio frame: 0x%lx bytes",
1080 bytecount);
1082 if(bytecount < 0)
1083 return -1;
1085 bytecount += entry->id3v2len;
1087 /* Validate byte count, in case the file has been edited without
1088 * updating the header.
1090 if (info.byte_count)
1092 const unsigned long expected = entry->filesize - entry->id3v1len
1093 - entry->id3v2len;
1094 const unsigned long diff = MAX(10240, info.byte_count / 20);
1096 if ((info.byte_count > expected + diff)
1097 || (info.byte_count < expected - diff))
1099 logf("Note: info.byte_count differs from expected value by "
1100 "%ld bytes", labs((long) (expected - info.byte_count)));
1101 info.byte_count = 0;
1102 info.frame_count = 0;
1103 info.file_time = 0;
1104 info.enc_padding = 0;
1106 /* Even if the bitrate was based on "known bad" values, it
1107 * should still be better for VBR files than using the bitrate
1108 * of the first audio frame.
1113 entry->bitrate = info.bitrate;
1114 entry->frequency = info.frequency;
1115 entry->version = info.version;
1116 entry->layer = info.layer;
1117 switch(entry->layer) {
1118 #if CONFIG_CODEC==SWCODEC
1119 case 0:
1120 entry->codectype=AFMT_MPA_L1;
1121 break;
1122 #endif
1123 case 1:
1124 entry->codectype=AFMT_MPA_L2;
1125 break;
1126 case 2:
1127 entry->codectype=AFMT_MPA_L3;
1128 break;
1131 /* If the file time hasn't been established, this may be a fixed
1132 rate MP3, so just use the default formula */
1134 filetime = info.file_time;
1136 if(filetime == 0)
1138 /* Prevent a division by zero */
1139 if (info.bitrate < 8)
1140 filetime = 0;
1141 else
1142 filetime = (entry->filesize - bytecount) / (info.bitrate / 8);
1143 /* bitrate is in kbps so this delivers milliseconds. Doing bitrate / 8
1144 * instead of filesize * 8 is exact, because mpeg audio bitrates are
1145 * always multiples of 8, and it avoids overflows. */
1148 entry->frame_count = info.frame_count;
1150 entry->vbr = info.is_vbr;
1151 entry->has_toc = info.has_toc;
1153 #if CONFIG_CODEC==SWCODEC
1154 entry->lead_trim = info.enc_delay;
1155 entry->tail_trim = info.enc_padding;
1156 #endif
1158 memcpy(entry->toc, info.toc, sizeof(info.toc));
1160 entry->vbr_header_pos = info.vbr_header_pos;
1162 /* Update the seek point for the first playable frame */
1163 entry->first_frame_offset = bytecount;
1164 logf("First frame is at %lx", entry->first_frame_offset);
1166 return filetime;
1170 * Checks all relevant information (such as ID3v1 tag, ID3v2 tag, length etc)
1171 * about an MP3 file and updates it's entry accordingly.
1173 Note, that this returns true for successful, false for error! */
1174 bool get_mp3_metadata(int fd, struct mp3entry *entry, const char *filename)
1176 #if CONFIG_CODEC != SWCODEC
1177 memset(entry, 0, sizeof(struct mp3entry));
1178 #endif
1180 strncpy(entry->path, filename, sizeof(entry->path));
1182 entry->title = NULL;
1183 entry->filesize = filesize(fd);
1184 entry->id3v2len = getid3v2len(fd);
1185 entry->tracknum = 0;
1186 entry->discnum = 0;
1188 if (entry->id3v2len)
1189 setid3v2title(fd, entry);
1190 int len = getsonglength(fd, entry);
1191 if (len < 0)
1192 return false;
1193 entry->length = len;
1195 /* Subtract the meta information from the file size to get
1196 the true size of the MP3 stream */
1197 entry->filesize -= entry->first_frame_offset;
1199 /* only seek to end of file if no id3v2 tags were found */
1200 if (!entry->id3v2len) {
1201 setid3v1title(fd, entry);
1204 if(!entry->length || (entry->filesize < 8 ))
1205 /* no song length or less than 8 bytes is hereby considered to be an
1206 invalid mp3 and won't be played by us! */
1207 return false;
1209 return true;
/* Opens filename read-only, lets get_mp3_metadata() fill in entry and
   closes the file again.
   Note, that this returns false for successful, true for error! */
bool mp3info(struct mp3entry *entry, const char *filename)
{
    const int fd = open(filename, O_RDONLY);
    bool failed;

    if (fd < 0)
        return true;

    /* get_mp3_metadata() reports success as true, so invert it here */
    failed = !get_mp3_metadata(fd, entry, filename);
    close(fd);

    return failed;
}
1229 void adjust_mp3entry(struct mp3entry *entry, void *dest, void *orig)
1231 long offset;
1232 if (orig > dest)
1233 offset = - ((size_t)orig - (size_t)dest);
1234 else
1235 offset = (size_t)dest - (size_t)orig;
1237 if (entry->title)
1238 entry->title += offset;
1239 if (entry->artist)
1240 entry->artist += offset;
1241 if (entry->album)
1242 entry->album += offset;
1243 if (entry->genre_string && !id3_is_genre_string(entry->genre_string))
1244 /* Don't adjust that if it points to an entry of the "genres" array */
1245 entry->genre_string += offset;
1246 if (entry->track_string)
1247 entry->track_string += offset;
1248 if (entry->disc_string)
1249 entry->disc_string += offset;
1250 if (entry->year_string)
1251 entry->year_string += offset;
1252 if (entry->composer)
1253 entry->composer += offset;
1254 if (entry->comment)
1255 entry->comment += offset;
1256 if (entry->albumartist)
1257 entry->albumartist += offset;
1258 if (entry->grouping)
1259 entry->grouping += offset;
1260 #if CONFIG_CODEC == SWCODEC
1261 if (entry->track_gain_string)
1262 entry->track_gain_string += offset;
1263 if (entry->album_gain_string)
1264 entry->album_gain_string += offset;
1265 #endif
1268 void copy_mp3entry(struct mp3entry *dest, struct mp3entry *orig)
1270 memcpy(dest, orig, sizeof(struct mp3entry));
1271 adjust_mp3entry(dest, dest, orig);
1274 #ifdef DEBUG_STANDALONE
/*
 * Formats a duration given in milliseconds as "M:SS.T" (minutes, two-digit
 * seconds, tenths of a second). The result lives in a static buffer that
 * is overwritten by the next call.
 */
char *secs2str(int ms)
{
    static char text[32];
    const int total_secs = ms / 1000;
    const int tenths = (ms % 1000) / 100;

    snprintf(text, sizeof(text), "%d:%02d.%d",
             total_secs / 60, total_secs % 60, tenths);
    return text;
}
1285 int main(int argc, char **argv)
1287 int i;
1288 for(i=1; i<argc; i++) {
1289 struct mp3entry mp3;
1290 mp3.album = "Bogus";
1291 if(mp3info(&mp3, argv[i], false)) {
1292 printf("Failed to get %s\n", argv[i]);
1293 return 0;
1296 printf("****** File: %s\n"
1297 " Title: %s\n"
1298 " Artist: %s\n"
1299 " Album: %s\n"
1300 " Genre: %s (%d) \n"
1301 " Composer: %s\n"
1302 " Year: %s (%d)\n"
1303 " Track: %s (%d)\n"
1304 " Length: %s / %d s\n"
1305 " Bitrate: %d\n"
1306 " Frequency: %d\n",
1307 argv[i],
1308 mp3.title?mp3.title:"<blank>",
1309 mp3.artist?mp3.artist:"<blank>",
1310 mp3.album?mp3.album:"<blank>",
1311 mp3.genre_string?mp3.genre_string:"<blank>",
1312 mp3.genre,
1313 mp3.composer?mp3.composer:"<blank>",
1314 mp3.year_string?mp3.year_string:"<blank>",
1315 mp3.year,
1316 mp3.track_string?mp3.track_string:"<blank>",
1317 mp3.tracknum,
1318 secs2str(mp3.length),
1319 mp3.length/1000,
1320 mp3.bitrate,
1321 mp3.frequency);
1324 return 0;
1327 #endif