Do the clamping a little better.
[kugel-rb.git] / firmware / id3.c
blobeaaf2a9ecd899052e4069c5c1c80aa117ad2521e
1 /***************************************************************************
2 * __________ __ ___.
3 * Open \______ \ ____ ____ | | _\_ |__ _______ ___
4 * Source | _// _ \_/ ___\| |/ /| __ \ / _ \ \/ /
5 * Jukebox | | ( <_> ) \___| < | \_\ ( <_> > < <
6 * Firmware |____|_ /\____/ \___ >__|_ \|___ /\____/__/\_ \
7 * \/ \/ \/ \/ \/
8 * $Id$
10 * Copyright (C) 2002 by Daniel Stenberg
12 * All files in this archive are subject to the GNU General Public License.
13 * See the file COPYING in the source tree root for full license agreement.
15 * This software is distributed on an "AS IS" basis, WITHOUT WARRANTY OF ANY
16 * KIND, either express or implied.
18 ****************************************************************************/
20 * Parts of this code have been stolen from the Ample project and were written
21 * by David Härdeman. It has since been extended and enhanced pretty much by
22 * all sorts of friendly Rockbox people.
26 /* tagResolver and associated code copyright 2003 Thomas Paul Diffenbach
29 #include <stdio.h>
30 #include <stdlib.h>
31 #include <string.h>
32 #include <errno.h>
33 #include <stdbool.h>
34 #include <stddef.h>
35 #include <ctype.h>
36 #include "config.h"
37 #include "file.h"
38 #include "debug.h"
39 #include "atoi.h"
41 #include "id3.h"
42 #include "mp3data.h"
43 #include "system.h"
44 #include "replaygain.h"
45 #include "rbunicode.h"
47 /** Database of audio formats **/
48 const struct afmt_entry audio_formats[AFMT_NUM_CODECS] =
50 /* Unknown file format */
51 [AFMT_UNKNOWN] =
52 AFMT_ENTRY("???", NULL, NULL, NULL ),
54 /* MPEG Audio layer 1 */
55 [AFMT_MPA_L1] =
56 AFMT_ENTRY("MP1", "mpa", NULL, "mp1\0" ),
57 /* MPEG Audio layer 2 */
58 [AFMT_MPA_L2] =
59 AFMT_ENTRY("MP2", "mpa", NULL, "mpa\0mp2\0" ),
60 /* MPEG Audio layer 3 */
61 [AFMT_MPA_L3] =
62 AFMT_ENTRY("MP3", "mpa", "mp3_enc", "mp3\0" ),
64 #if CONFIG_CODEC == SWCODEC
65 /* Audio Interchange File Format */
66 [AFMT_AIFF] =
67 AFMT_ENTRY("AIFF", "aiff", "aiff_enc", "aiff\0aif\0"),
68 /* Uncompressed PCM in a WAV file */
69 [AFMT_PCM_WAV] =
70 AFMT_ENTRY("WAV", "wav", "wav_enc", "wav\0" ),
71 /* Ogg Vorbis */
72 [AFMT_OGG_VORBIS] =
73 AFMT_ENTRY("Ogg", "vorbis", NULL, "ogg\0" ),
74 /* FLAC */
75 [AFMT_FLAC] =
76 AFMT_ENTRY("FLAC", "flac", NULL, "flac\0" ),
77 /* Musepack */
78 [AFMT_MPC] =
79 AFMT_ENTRY("MPC", "mpc", NULL, "mpc\0" ),
80 /* A/52 (aka AC3) audio */
81 [AFMT_A52] =
82 AFMT_ENTRY("AC3", "a52", NULL, "a52\0ac3\0" ),
83 /* WavPack */
84 [AFMT_WAVPACK] =
85 AFMT_ENTRY("WV", "wavpack", "wavpack_enc", "wv\0" ),
86 /* Apple Lossless Audio Codec */
87 [AFMT_ALAC] =
88 AFMT_ENTRY("ALAC", "alac", NULL, "m4a\0m4b\0" ),
89 /* Advanced Audio Coding in M4A container */
90 [AFMT_AAC] =
91 AFMT_ENTRY("AAC", "aac", NULL, "mp4\0" ),
92 /* Shorten */
93 [AFMT_SHN] =
94 AFMT_ENTRY("SHN", "shorten", NULL, "shn\0" ),
95 /* SID File Format */
96 [AFMT_SID] =
97 AFMT_ENTRY("SID", "sid", NULL, "sid\0" ),
98 /* ADX File Format */
99 [AFMT_ADX] =
100 AFMT_ENTRY("ADX", "adx", NULL, "adx\0" ),
101 /* NESM (NES Sound Format) */
102 [AFMT_NSF] =
103 AFMT_ENTRY("NSF", "nsf", NULL, "nsf\0nsfe\0" ),
104 /* Speex File Format */
105 [AFMT_SPEEX] =
106 AFMT_ENTRY("Speex","speex", NULL, "spx\0" ),
107 /* SPC700 Save State */
108 [AFMT_SPC] =
109 AFMT_ENTRY("SPC", "spc", NULL, "spc\0" ),
110 #endif
113 #if CONFIG_CODEC == SWCODEC && defined (HAVE_RECORDING)
114 /* get REC_FORMAT_* corresponding AFMT_* */
115 const int rec_format_afmt[REC_NUM_FORMATS] =
117 /* give AFMT_UNKNOWN by default */
118 [0 ... REC_NUM_FORMATS-1] = AFMT_UNKNOWN,
119 /* add new entries below this line */
120 [REC_FORMAT_AIFF] = AFMT_AIFF,
121 [REC_FORMAT_MPA_L3] = AFMT_MPA_L3,
122 [REC_FORMAT_WAVPACK] = AFMT_WAVPACK,
123 [REC_FORMAT_PCM_WAV] = AFMT_PCM_WAV,
126 /* get AFMT_* corresponding REC_FORMAT_* */
127 const int afmt_rec_format[AFMT_NUM_CODECS] =
129 /* give -1 by default */
130 [0 ... AFMT_NUM_CODECS-1] = -1,
131 /* add new entries below this line */
132 [AFMT_AIFF] = REC_FORMAT_AIFF,
133 [AFMT_MPA_L3] = REC_FORMAT_MPA_L3,
134 [AFMT_WAVPACK] = REC_FORMAT_WAVPACK,
135 [AFMT_PCM_WAV] = REC_FORMAT_PCM_WAV,
137 #endif /* CONFIG_CODEC == SWCODEC && defined (HAVE_RECORDING) */
138 /****/
/**
 * Assemble a 28-bit value from four bytes that each contribute only their
 * low 7 bits (the ID3v2 "synchsafe" integer layout).
 *
 * b0 is the most significant group, b3 the least significant one. The top
 * bit of every argument is ignored, as are any bits above bit 7.
 *
 * Returns the combined value, in the range 0 .. 0x0FFFFFFF.
 */
unsigned long unsync(unsigned long b0,
                     unsigned long b1,
                     unsigned long b2,
                     unsigned long b3)
{
    /* The arguments are already unsigned; no signed detour is needed. */
    return ((b0 & 0x7F) << (3*7)) |
           ((b1 & 0x7F) << (2*7)) |
           ((b2 & 0x7F) << (1*7)) |
           ((b3 & 0x7F) << (0*7));
}
/* Genre names indexed by numeric genre id; id3_get_num_genre() looks names
 * up here. The first group ends at "Hard Rock"; the remaining names are the
 * winamp extensions. The strings are reproduced exactly as they appear in
 * the original table, including their historical spellings. */
static const char* const genres[] = {
    "Blues", "Classic Rock", "Country", "Dance", "Disco", "Funk", "Grunge",
    "Hip-Hop", "Jazz", "Metal", "New Age", "Oldies", "Other", "Pop", "R&B",
    "Rap", "Reggae", "Rock", "Techno", "Industrial", "Alternative", "Ska",
    "Death Metal", "Pranks", "Soundtrack", "Euro-Techno", "Ambient", "Trip-Hop",
    "Vocal", "Jazz+Funk", "Fusion", "Trance", "Classical", "Instrumental",
    "Acid", "House", "Game", "Sound Clip", "Gospel", "Noise", "AlternRock",
    "Bass", "Soul", "Punk", "Space", "Meditative", "Instrumental Pop",
    "Instrumental Rock", "Ethnic", "Gothic", "Darkwave", "Techno-Industrial",
    "Electronic", "Pop-Folk", "Eurodance", "Dream", "Southern Rock", "Comedy",
    "Cult", "Gangsta", "Top 40", "Christian Rap", "Pop/Funk", "Jungle",
    "Native American", "Cabaret", "New Wave", "Psychadelic", "Rave",
    "Showtunes", "Trailer", "Lo-Fi", "Tribal", "Acid Punk", "Acid Jazz",
    "Polka", "Retro", "Musical", "Rock & Roll", "Hard Rock",

    /* winamp extensions */
    "Folk", "Folk-Rock", "National Folk", "Swing", "Fast Fusion", "Bebob",
    "Latin", "Revival", "Celtic", "Bluegrass", "Avantgarde", "Gothic Rock",
    "Progressive Rock", "Psychedelic Rock", "Symphonic Rock", "Slow Rock",
    "Big Band", "Chorus", "Easy Listening", "Acoustic", "Humour", "Speech",
    "Chanson", "Opera", "Chamber Music", "Sonata", "Symphony", "Booty Bass",
    "Primus", "Porn Groove", "Satire", "Slow Jam", "Club", "Tango", "Samba",
    "Folklore", "Ballad", "Power Ballad", "Rhythmic Soul", "Freestyle",
    "Duet", "Punk Rock", "Drum Solo", "A capella", "Euro-House", "Dance Hall",
    "Goa", "Drum & Bass", "Club-House", "Hardcore", "Terror", "Indie",
    "BritPop", "Negerpunk", "Polsk Punk", "Beat", "Christian Gangsta Rap",
    "Heavy Metal", "Black Metal", "Crossover", "Contemporary Christian",
    "Christian Rock", "Merengue", "Salsa", "Thrash Metal", "Anime", "Jpop",
    "Synthpop"
};
182 char* id3_get_num_genre(const unsigned int genre_num)
184 if (genre_num < sizeof(genres)/sizeof(char*))
185 return (char*)genres[genre_num];
186 return NULL;
189 char* id3_get_codec(const struct mp3entry* id3)
191 if (id3->codectype < AFMT_NUM_CODECS) {
192 return (char*)audio_formats[id3->codectype].label;
193 } else {
194 return NULL;
199 HOW TO ADD ADDITIONAL ID3 VERSION 2 TAGS
200 Code and comments by Thomas Paul Diffenbach
202 To add another ID3v2 Tag, do the following:
203 1. add a char* named for the tag to struct mp3entry in id3.h,
204 (I (tpd) prefer to use char* rather than ints, even for what seems like
205 numerical values, for cases where a number won't do, e.g.,
206 YEAR: "circa 1765", "1790/1977" (composed/performed), "28 Feb 1969"
207 TRACK: "1/12", "1 of 12", GENRE: "Freeform genre name"
208 Text is more flexible, and as the main use of id3 data is to
209 display it, converting it to an int just means reconverting to
210 display it, at a runtime cost.)
212 2. If any special processing beyond copying the tag value from the Id3
213 block to the struct mp3entry is required (such as converting to an
214 int), write a function to perform this special processing.
216 This function's prototype must match that of
217 typedef tagPostProcessFunc, that is it must be:
218 int func( struct mp3entry*, char* tag, int bufferpos )
219 the first argument is a pointer to the current mp3entry structure the
220 second argument is a pointer to the null terminated string value of the
221 tag found the third argument is the offset of the next free byte in the
222 mp3entry's buffer your function should return the corrected offset; if
223 you don't lengthen or shorten the tag string, you can return the third
224 argument unchanged.
226 Unless you have a good reason not to, make the function static.
227 TO JUST COPY THE TAG NO SPECIAL PROCESSING FUNCTION IS NEEDED.
229 3. add one or more entries to the tagList array, using the format:
230 char* ID3 Tag symbolic name -- see the ID3 specification for these,
231 sizeof() that name minus 1,
232 offsetof( struct mp3entry, variable_name_in_struct_mp3entry ),
233 pointer to your special processing function or NULL
234 if you need no special processing
235 flag indicating if this tag is binary or textual
236 Many ID3 symbolic names come in more than one form. You can add both
237 forms, each referencing the same variable in struct mp3entry.
238 If both forms are present, the last found will be used.
239 Note that the offset can be zero, in which case no entry will be set
240 in the mp3entry struct; the frame is still read into the buffer and
241 the special processing function is called (several times, if there
242 are several frames with the same name).
244 4. Alternately, use the TAG_LIST_ENTRY macro with
245 ID3 tag symbolic name,
246 variable in struct mp3entry,
247 special processing function address
249 5. Add code to wps-display.c function get_tag to assign a printf-like
250 format specifier for the tag */
/* Structure for ID3 Tag extraction information */
struct tag_resolver {
    const char* tag;    /* frame identifier to match against the frame header */
    int tag_length;     /* number of identifier bytes compared (3 or 4) */
    size_t offset;      /* offsetof() the char* member of struct mp3entry that
                           receives the value; 0 means "store nowhere" */
    /* optional post-processing hook; receives the NUL-terminated value and
       the next free buffer offset, returns the corrected buffer offset */
    int (*ppFunc)(struct mp3entry*, char* tag, int bufferpos);
    bool binary;        /* true: frame content is not text, skip the
                           character-set conversion */
};
/* "Previous byte was 0xFF" state that read_unsynched() and skip_unsynched()
 * hand to unsynchronize(), so an unsynchronization pattern split across two
 * reads is still recognised. setid3v2title() clears it before parsing. */
static bool global_ff_found;
/**
 * Undo ID3v2 unsynchronization in place: every 0x00 byte that directly
 * follows a 0xFF byte is dropped.
 *
 * tag      - buffer to process; rewritten in place.
 * len      - number of bytes in tag to process.
 * ff_found - in: whether the byte preceding tag[0] was 0xFF;
 *            out: whether the last processed byte left the "0xFF seen"
 *            state set, so a following call can continue seamlessly.
 *
 * Returns the number of bytes remaining in tag after the removal.
 */
static int unsynchronize(char* tag, int len, bool *ff_found)
{
    unsigned char *rp = (unsigned char *)tag;  /* read position  */
    unsigned char *wp = rp;                    /* write position */
    int i;

    for (i = 0; i < len; i++) {
        /* Read the next byte and write it back, but don't advance the
           write pointer yet */
        unsigned char c = *rp++;
        *wp = c;

        if (*ff_found) {
            /* Keep the byte unless it completes an unsynch pattern */
            if (c != 0)
                wp++;
            *ff_found = false;
        } else {
            if (c == 0xff)
                *ff_found = true;
            wp++;
        }
    }

    /* A pointer difference avoids squeezing addresses through 'long' */
    return (int)(wp - (unsigned char *)tag);
}
/**
 * Undo unsynchronization on one complete, self-contained frame.
 *
 * Starts with a fresh "0xFF seen" state, so nothing carries over from
 * earlier data. Returns the frame length after the removal.
 */
static int unsynchronize_frame(char* tag, int len)
{
    bool ff_found = false;

    return unsynchronize(tag, len, &ff_found);
}
298 static int read_unsynched(int fd, void *buf, int len)
300 int i;
301 int rc;
302 int remaining = len;
303 char *wp;
304 char *rp;
306 wp = buf;
308 while(remaining) {
309 rp = wp;
310 rc = read(fd, rp, remaining);
311 if(rc <= 0)
312 return rc;
314 i = unsynchronize(wp, remaining, &global_ff_found);
315 remaining -= i;
316 wp += i;
319 return len;
322 static int skip_unsynched(int fd, int len)
324 int rc;
325 int remaining = len;
326 int rlen;
327 char buf[32];
329 while(remaining) {
330 rlen = MIN(sizeof(buf), (unsigned int)remaining);
331 rc = read(fd, buf, rlen);
332 if(rc <= 0)
333 return rc;
335 remaining -= unsynchronize(buf, rlen, &global_ff_found);
338 return len;
341 /* parse numeric value from string */
342 static int parsetracknum( struct mp3entry* entry, char* tag, int bufferpos )
344 entry->tracknum = atoi( tag );
345 return bufferpos;
348 /* parse numeric value from string */
349 static int parseyearnum( struct mp3entry* entry, char* tag, int bufferpos )
351 entry->year = atoi( tag );
352 return bufferpos;
355 /* parse numeric genre from string, version 2.2 and 2.3 */
356 static int parsegenre( struct mp3entry* entry, char* tag, int bufferpos )
358 if(entry->id3version >= ID3_VER_2_4) {
359 /* In version 2.4 and up, there are no parentheses, and the genre frame
360 is a list of strings, either numbers or text. */
362 /* Is it a number? */
363 if(isdigit(tag[0])) {
364 entry->genre_string = id3_get_num_genre(atoi( tag ));
365 return tag - entry->id3v2buf;
366 } else {
367 entry->genre_string = tag;
368 return bufferpos;
370 } else {
371 if( tag[0] == '(' && tag[1] != '(' ) {
372 entry->genre_string = id3_get_num_genre(atoi( tag + 1 ));
373 return tag - entry->id3v2buf;
375 else {
376 entry->genre_string = tag;
377 return bufferpos;
382 #if CONFIG_CODEC == SWCODEC
383 /* parse user defined text, looking for replaygain information. */
384 static int parseuser( struct mp3entry* entry, char* tag, int bufferpos )
386 char* value = NULL;
387 int desc_len = strlen(tag);
388 int value_len = 0;
390 /* Note: for ID3v2.4, parse_replaygain will not overwrite replaygain
391 values already parsed from RVA2 tags */
392 if ((tag - entry->id3v2buf + desc_len + 2) < bufferpos) {
393 /* At least part of the value was read, so we can safely try to
394 * parse it
396 value = tag + desc_len + 1;
397 value_len = parse_replaygain(tag, value, entry, tag,
398 bufferpos - (tag - entry->id3v2buf));
401 if (value_len) {
402 bufferpos = tag - entry->id3v2buf + value_len;
403 } else {
404 bufferpos = tag - entry->id3v2buf;
407 return bufferpos;
410 /* parse RVA2 binary data and convert to replaygain information. */
411 static int parserva2( struct mp3entry* entry, char* tag, int bufferpos )
413 char* value = NULL;
414 int desc_len = strlen(tag);
415 int value_len = 0;
417 /* Only parse RVA2 replaygain tags if tag version == 2.4 */
418 if (entry->id3version == ID3_VER_2_4 &&
419 (tag - entry->id3v2buf + desc_len + 2) < bufferpos) {
420 value = tag + desc_len + 1;
421 value_len = parse_replaygain_rva(tag, value, entry, tag,
422 bufferpos - (tag - entry->id3v2buf));
425 if (value_len) {
426 bufferpos = tag - entry->id3v2buf + value_len;
427 } else {
428 bufferpos = tag - entry->id3v2buf;
431 return bufferpos;
433 #endif
435 static const struct tag_resolver taglist[] = {
436 { "TPE1", 4, offsetof(struct mp3entry, artist), NULL, false },
437 { "TP1", 3, offsetof(struct mp3entry, artist), NULL, false },
438 { "TIT2", 4, offsetof(struct mp3entry, title), NULL, false },
439 { "TT2", 3, offsetof(struct mp3entry, title), NULL, false },
440 { "TALB", 4, offsetof(struct mp3entry, album), NULL, false },
441 { "TAL", 3, offsetof(struct mp3entry, album), NULL, false },
442 { "TRK", 3, offsetof(struct mp3entry, track_string), &parsetracknum, false },
443 { "TRCK", 4, offsetof(struct mp3entry, track_string), &parsetracknum, false },
444 { "TDRC", 4, offsetof(struct mp3entry, year_string), &parseyearnum, false },
445 { "TYER", 4, offsetof(struct mp3entry, year_string), &parseyearnum, false },
446 { "TYE", 3, offsetof(struct mp3entry, year_string), &parseyearnum, false },
447 { "TCOM", 4, offsetof(struct mp3entry, composer), NULL, false },
448 { "TPE2", 4, offsetof(struct mp3entry, albumartist), NULL, false },
449 { "TP2", 3, offsetof(struct mp3entry, albumartist), NULL, false },
450 { "COMM", 4, offsetof(struct mp3entry, comment), NULL, false },
451 { "TCON", 4, offsetof(struct mp3entry, genre_string), &parsegenre, false },
452 { "TCO", 3, offsetof(struct mp3entry, genre_string), &parsegenre, false },
453 #if CONFIG_CODEC == SWCODEC
454 { "TXXX", 4, 0, &parseuser, false },
455 { "RVA2", 4, 0, &parserva2, true },
456 #endif
459 #define TAGLIST_SIZE ((int)(sizeof(taglist) / sizeof(taglist[0])))
/**
 * Convert the text of an ID3v2 frame to UTF-8.
 *
 * The first byte of the frame selects the source encoding:
 *   0x00        ISO 8859-1
 *   0x01, 0x02  16-bit Unicode, with or without a byte order mark; the
 *               frame may hold several NUL-separated strings
 *   0x03        already UTF-8, copied as is
 *   other       treated as a plain string in the default codepage,
 *               including that first byte
 *
 * string  - frame content, starting with the encoding byte.
 * utf8buf - receives the converted text; must be large enough for the
 *           expansion (the caller in this file provides 3 * len + 1 bytes).
 * len     - in: number of bytes in string, encoding byte included;
 *           out: number of bytes of converted text in utf8buf.
 *
 * Always returns 0.
 */
static int unicode_munge(char* string, char* utf8buf, int *len) {
    long tmp;
    bool le = false;
    int i = 0;
    unsigned char *str = (unsigned char *)string;
    int templen = 0;
    unsigned char* utf8 = (unsigned char *)utf8buf;

    switch (str[0]) {
        case 0x00: /* Type 0x00 is ordinary ISO 8859-1 */
            str++;
            (*len)--;
            utf8 = iso_decode(str, utf8, -1, *len);
            *utf8 = 0;
            /* pointer difference instead of casting addresses to integers */
            *len = (int)((char *)utf8 - utf8buf);
            break;

        case 0x01: /* Unicode with or without BOM */
        case 0x02:
            (*len)--;
            str++;

            /* Handle frames with more than one string
               (needed for TXXX frames).*/
            do {
                tmp = bytes2int(0, 0, str[0], str[1]);

                /* Now check if there is a BOM
                   (zero-width non-breaking space, 0xfeff)
                   and if it is in little or big endian format */
                if(tmp == 0xfffe) { /* Little endian? */
                    le = true;
                    str += 2;
                    (*len)-=2;
                } else if(tmp == 0xfeff) { /* Big endian? */
                    str += 2;
                    (*len)-=2;
                } else
                    /* If there is no BOM (which is a specification violation),
                       let's try to guess it. If one of the bytes is 0x00, it is
                       probably the most significant one. */
                    if(str[1] == 0)
                        le = true;

                /* Decode one 16-bit unit at a time until the terminating
                   0x0000 or the end of the frame */
                do {
                    if(le)
                        utf8 = utf16LEdecode(str, utf8, 1);
                    else
                        utf8 = utf16BEdecode(str, utf8, 1);

                    str+=2;
                    i += 2;
                } while((str[0] || str[1]) && (i < *len));

                *utf8++ = 0; /* Terminate the string */
                templen += (strlen(&utf8buf[templen]) + 1);
                /* step over the 16-bit terminator */
                str += 2;
                i+=2;
            } while(i < *len);
            /* total of all strings and their separators, minus the final
               terminator */
            *len = templen - 1;
            break;

        case 0x03: /* UTF-8 encoded string */
            for(i=0; i < *len; i++)
                utf8[i] = str[i+1];
            (*len)--;
            break;

        default: /* Plain old string */
            utf8 = iso_decode(str, utf8, -1, *len);
            *utf8 = 0;
            /* pointer difference instead of casting addresses to integers */
            *len = (int)((char *)utf8 - utf8buf);
            break;
    }
    return 0;
}
542 * Sets the title of an MP3 entry based on its ID3v1 tag.
544 * Arguments: file - the MP3 file to scen for a ID3v1 tag
545 * entry - the entry to set the title in
547 * Returns: true if a title was found and created, else false
549 static bool setid3v1title(int fd, struct mp3entry *entry)
551 unsigned char buffer[128];
552 static const char offsets[] = {3, 33, 63, 97, 93, 125, 127};
553 int i, j;
554 unsigned char* utf8;
556 if (-1 == lseek(fd, -128, SEEK_END))
557 return false;
559 if (read(fd, buffer, sizeof buffer) != sizeof buffer)
560 return false;
562 if (strncmp((char *)buffer, "TAG", 3))
563 return false;
565 entry->id3v1len = 128;
566 entry->id3version = ID3_VER_1_0;
568 for (i=0; i < (int)sizeof offsets; i++) {
569 unsigned char* ptr = (unsigned char *)buffer + offsets[i];
571 switch(i) {
572 case 0:
573 case 1:
574 case 2:
575 /* kill trailing space in strings */
576 for (j=29; j && (ptr[j]==0 || ptr[j]==' '); j--)
577 ptr[j] = 0;
578 /* convert string to utf8 */
579 utf8 = (unsigned char *)entry->id3v1buf[i];
580 utf8 = iso_decode(ptr, utf8, -1, 30);
581 /* make sure string is terminated */
582 *utf8 = 0;
583 break;
585 case 3:
586 /* kill trailing space in strings */
587 for (j=27; j && (ptr[j]==0 || ptr[j]==' '); j--)
588 ptr[j] = 0;
589 /* convert string to utf8 */
590 utf8 = (unsigned char *)entry->id3v1buf[3];
591 utf8 = iso_decode(ptr, utf8, -1, 28);
592 /* make sure string is terminated */
593 *utf8 = 0;
594 break;
596 case 4:
597 ptr[4] = 0;
598 entry->year = atoi((char *)ptr);
599 break;
601 case 5:
602 /* id3v1.1 uses last two bytes of comment field for track
603 number: first must be 0 and second is track num */
604 if (!ptr[0] && ptr[1]) {
605 entry->tracknum = ptr[1];
606 entry->id3version = ID3_VER_1_1;
608 break;
610 case 6:
611 /* genre */
612 entry->genre_string = id3_get_num_genre(ptr[0]);
613 break;
617 entry->title = entry->id3v1buf[0];
618 entry->artist = entry->id3v1buf[1];
619 entry->album = entry->id3v1buf[2];
620 entry->comment = entry->id3v1buf[3];
622 return true;
627 * Sets the title of an MP3 entry based on its ID3v2 tag.
629 * Arguments: file - the MP3 file to scan for a ID3v2 tag
630 * entry - the entry to set the title in
632 * Returns: true if a title was found and created, else false
634 static void setid3v2title(int fd, struct mp3entry *entry)
636 int minframesize;
637 int size;
638 long bufferpos = 0, totframelen, framelen;
639 char header[10];
640 char tmp[4];
641 unsigned char version;
642 char *buffer = entry->id3v2buf;
643 int bytesread = 0;
644 int buffersize = sizeof(entry->id3v2buf);
645 unsigned char global_flags;
646 int flags;
647 int skip;
648 bool global_unsynch = false;
649 bool unsynch = false;
650 int data_length_ind;
651 int i, j;
652 int rc;
654 global_ff_found = false;
656 /* Bail out if the tag is shorter than 10 bytes */
657 if(entry->id3v2len < 10)
658 return;
660 /* Read the ID3 tag version from the header */
661 lseek(fd, 0, SEEK_SET);
662 if(10 != read(fd, header, 10))
663 return;
665 /* Get the total ID3 tag size */
666 size = entry->id3v2len - 10;
668 version = header[3];
669 switch ( version ) {
670 case 2:
671 version = ID3_VER_2_2;
672 minframesize = 8;
673 break;
675 case 3:
676 version = ID3_VER_2_3;
677 minframesize = 12;
678 break;
680 case 4:
681 version = ID3_VER_2_4;
682 minframesize = 12;
683 break;
685 default:
686 /* unsupported id3 version */
687 return;
689 entry->id3version = version;
690 entry->tracknum = entry->year = 0;
691 entry->title = entry->artist = entry->album = NULL; /* FIXME incomplete */
693 global_flags = header[5];
695 /* Skip the extended header if it is present */
696 if(global_flags & 0x40) {
697 if(version == ID3_VER_2_3) {
698 if(10 != read(fd, header, 10))
699 return;
700 /* The 2.3 extended header size doesn't include the header size
701 field itself. Also, it is not unsynched. */
702 framelen =
703 bytes2int(header[0], header[1], header[2], header[3]) + 4;
705 /* Skip the rest of the header */
706 lseek(fd, framelen - 10, SEEK_CUR);
709 if(version >= ID3_VER_2_4) {
710 if(4 != read(fd, header, 4))
711 return;
713 /* The 2.4 extended header size does include the entire header,
714 so here we can just skip it. This header is unsynched. */
715 framelen = unsync(header[0], header[1],
716 header[2], header[3]);
718 lseek(fd, framelen - 4, SEEK_CUR);
722 /* Is unsynchronization applied? */
723 if(global_flags & 0x80) {
724 global_unsynch = true;
728 * We must have at least minframesize bytes left for the
729 * remaining frames to be interesting
731 while (size >= minframesize && bufferpos < buffersize - 1) {
732 flags = 0;
734 /* Read frame header and check length */
735 if(version >= ID3_VER_2_3) {
736 if(global_unsynch && version <= ID3_VER_2_3)
737 rc = read_unsynched(fd, header, 10);
738 else
739 rc = read(fd, header, 10);
740 if(rc != 10)
741 return;
742 /* Adjust for the 10 bytes we read */
743 size -= 10;
745 flags = bytes2int(0, 0, header[8], header[9]);
747 if (version >= ID3_VER_2_4) {
748 framelen = unsync(header[4], header[5],
749 header[6], header[7]);
750 } else {
751 /* version .3 files don't use synchsafe ints for
752 * size */
753 framelen = bytes2int(header[4], header[5],
754 header[6], header[7]);
756 } else {
757 if(6 != read(fd, header, 6))
758 return;
759 /* Adjust for the 6 bytes we read */
760 size -= 6;
762 framelen = bytes2int(0, header[3], header[4], header[5]);
765 /* Keep track of the total size */
766 totframelen = framelen;
768 DEBUGF("framelen = %ld\n", framelen);
769 if(framelen == 0){
770 if (header[0] == 0 && header[1] == 0 && header[2] == 0)
771 return;
772 else
773 continue;
776 unsynch = false;
777 data_length_ind = 0;
779 if(flags)
781 skip = 0;
783 if (version >= ID3_VER_2_4) {
784 if(flags & 0x0040) { /* Grouping identity */
785 lseek(fd, 1, SEEK_CUR); /* Skip 1 byte */
786 framelen--;
788 } else {
789 if(flags & 0x0020) { /* Grouping identity */
790 lseek(fd, 1, SEEK_CUR); /* Skip 1 byte */
791 framelen--;
795 if(flags & 0x000c) /* Compression or encryption */
797 /* Skip it using the total size in case
798 it was truncated */
799 size -= totframelen;
800 lseek(fd, totframelen, SEEK_CUR);
801 continue;
804 if(flags & 0x0002) /* Unsynchronization */
805 unsynch = true;
807 if (version >= ID3_VER_2_4) {
808 if(flags & 0x0001) { /* Data length indicator */
809 if(4 != read(fd, tmp, 4))
810 return;
812 data_length_ind = unsync(tmp[0], tmp[1], tmp[2], tmp[3]);
813 framelen -= 4;
818 /* If the frame is larger than the remaining buffer space we try
819 to read as much as would fit in the buffer */
820 if(framelen >= buffersize - bufferpos)
821 framelen = buffersize - bufferpos - 1;
823 DEBUGF("id3v2 frame: %.4s\n", header);
825 /* Check for certain frame headers
827 'size' is the amount of frame bytes remaining. We decrement it by
828 the amount of bytes we read. If we fail to read as many bytes as
829 we expect, we assume that we can't read from this file, and bail
830 out.
832 For each frame. we will iterate over the list of supported tags,
833 and read the tag into entry's buffer. All tags will be kept as
834 strings, for cases where a number won't do, e.g., YEAR: "circa
835 1765", "1790/1977" (composed/performed), "28 Feb 1969" TRACK:
836 "1/12", "1 of 12", GENRE: "Freeform genre name" Text is more
837 flexible, and as the main use of id3 data is to display it,
838 converting it to an int just means reconverting to display it, at a
839 runtime cost.
841 For tags that the current code does convert to ints, a post
842 processing function will be called via a pointer to function. */
844 for (i=0; i<TAGLIST_SIZE; i++) {
845 const struct tag_resolver* tr = &taglist[i];
846 char** ptag = tr->offset ? (char**) (((char*)entry) + tr->offset)
847 : NULL;
848 char* tag;
849 int comm_offset=0;
851 /* Only ID3_VER_2_2 uses frames with three-character names. */
852 if (((version == ID3_VER_2_2) && (tr->tag_length != 3))
853 || ((version > ID3_VER_2_2) && (tr->tag_length != 4))) {
854 continue;
857 /* Note that parser functions sometimes set *ptag to NULL, so
858 * the "!*ptag" check here doesn't always have the desired
859 * effect. Should the parser functions (parsegenre in
860 * particular) be updated to handle the case of being called
861 * multiple times, or should the "*ptag" check be removed?
863 if( (!ptag || !*ptag) && !memcmp( header, tr->tag, tr->tag_length ) ) {
865 /* found a tag matching one in tagList, and not yet filled */
866 tag = buffer + bufferpos;
868 if(global_unsynch && version <= ID3_VER_2_3)
869 bytesread = read_unsynched(fd, tag, framelen);
870 else
871 bytesread = read(fd, tag, framelen);
873 if( bytesread != framelen )
874 return;
876 size -= bytesread;
878 if(unsynch || (global_unsynch && version >= ID3_VER_2_4))
879 bytesread = unsynchronize_frame(tag, bytesread);
881 /* the COMM frame has a 3 char field to hold an ISO-639-1
882 * language string and an optional short description;
883 * remove them so unicode_munge can work correctly
886 if(!memcmp( header, "COMM", 4 )) {
887 comm_offset = 3 + strlen(tag+4) + 1;
888 if(bytesread>comm_offset) {
889 bytesread-=comm_offset;
890 memmove(tag+1, tag+comm_offset+1, bytesread-1);
894 /* Attempt to parse Unicode string only if the tag contents
895 aren't binary */
896 if(!tr->binary) {
897 /* UTF-8 could potentially be 3 times larger */
898 /* so we need to create a new buffer */
899 char utf8buf[(3 * bytesread) + 1];
901 unicode_munge( tag, utf8buf, &bytesread );
903 if(bytesread >= buffersize - bufferpos)
904 bytesread = buffersize - bufferpos - 1;
906 for (j = 0; j < bytesread; j++)
907 tag[j] = utf8buf[j];
909 /* remove trailing spaces */
910 while ( bytesread > 0 && isspace(tag[bytesread-1]))
911 bytesread--;
914 tag[bytesread] = 0;
915 bufferpos += bytesread + 1;
917 if (ptag)
918 *ptag = tag;
920 if( tr->ppFunc )
921 bufferpos = tr->ppFunc(entry, tag, bufferpos);
923 /* Seek to the next frame */
924 if(framelen < totframelen)
925 lseek(fd, totframelen - framelen, SEEK_CUR);
926 break;
930 if( i == TAGLIST_SIZE ) {
931 /* no tag in tagList was found, or it was a repeat.
932 skip it using the total size */
934 if(global_unsynch && version <= ID3_VER_2_3) {
935 size -= skip_unsynched(fd, totframelen);
936 } else {
937 if(data_length_ind)
938 totframelen = data_length_ind;
940 size -= totframelen;
941 if( lseek(fd, totframelen, SEEK_CUR) == -1 )
942 return;
/*
 * Calculates the size of the ID3v2 tag.
 *
 * Arguments: fd - the file to search for a tag. The file position is
 *                 changed by this call.
 *
 * Returns: the size of the tag (size field plus the 10-byte tag header),
 *          or 0 if none was found or the header could not be read
 */
int getid3v2len(int fd)
{
    char buf[6];
    int offset;

    /* Make sure file has a ID3 tag */
    if((-1 == lseek(fd, 0, SEEK_SET)) ||
       (read(fd, buf, 6) != 6) ||
       (strncmp(buf, "ID3", strlen("ID3")) != 0))
        offset = 0;

    /* Now check what the ID3v2 size field says */
    else if(read(fd, buf, 4) != 4)
        offset = 0;
    else
        offset = unsync(buf[0], buf[1], buf[2], buf[3]) + 10;

    DEBUGF("ID3V2 Length: 0x%x\n", offset);
    return offset;
}
978 * Calculates the length (in milliseconds) of an MP3 file.
980 * Modified to only use integers.
982 * Arguments: file - the file to calculate the length upon
983 * entry - the entry to update with the length
985 * Returns: the song length in milliseconds,
986 * 0 means that it couldn't be calculated
988 static int getsonglength(int fd, struct mp3entry *entry)
990 unsigned long filetime = 0;
991 struct mp3info info;
992 long bytecount;
994 /* Start searching after ID3v2 header */
995 if(-1 == lseek(fd, entry->id3v2len, SEEK_SET))
996 return 0;
998 bytecount = get_mp3file_info(fd, &info);
1000 DEBUGF("Space between ID3V2 tag and first audio frame: 0x%lx bytes\n",
1001 bytecount);
1003 if(bytecount < 0)
1004 return -1;
1006 bytecount += entry->id3v2len;
1008 /* Validate byte count, in case the file has been edited without
1009 * updating the header.
1011 if (info.byte_count)
1013 const unsigned long expected = entry->filesize - entry->id3v1len
1014 - entry->id3v2len;
1015 const unsigned long diff = MAX(10240, info.byte_count / 20);
1017 if ((info.byte_count > expected + diff)
1018 || (info.byte_count < expected - diff))
1020 DEBUGF("Note: info.byte_count differs from expected value by "
1021 "%ld bytes\n", labs((long) (expected - info.byte_count)));
1022 info.byte_count = 0;
1023 info.frame_count = 0;
1024 info.file_time = 0;
1025 info.enc_padding = 0;
1027 /* Even if the bitrate was based on "known bad" values, it
1028 * should still be better for VBR files than using the bitrate
1029 * of the first audio frame.
1034 entry->bitrate = info.bitrate;
1035 entry->frequency = info.frequency;
1036 entry->version = info.version;
1037 entry->layer = info.layer;
1038 switch(entry->layer) {
1039 #if CONFIG_CODEC==SWCODEC
1040 case 0:
1041 entry->codectype=AFMT_MPA_L1;
1042 break;
1043 #endif
1044 case 1:
1045 entry->codectype=AFMT_MPA_L2;
1046 break;
1047 case 2:
1048 entry->codectype=AFMT_MPA_L3;
1049 break;
1052 /* If the file time hasn't been established, this may be a fixed
1053 rate MP3, so just use the default formula */
1055 filetime = info.file_time;
1057 if(filetime == 0)
1059 /* Prevent a division by zero */
1060 if (info.bitrate < 8)
1061 filetime = 0;
1062 else
1063 filetime = (entry->filesize - bytecount) / (info.bitrate / 8);
1064 /* bitrate is in kbps so this delivers milliseconds. Doing bitrate / 8
1065 * instead of filesize * 8 is exact, because mpeg audio bitrates are
1066 * always multiples of 8, and it avoids overflows. */
1069 entry->frame_count = info.frame_count;
1071 entry->vbr = info.is_vbr;
1072 entry->has_toc = info.has_toc;
1074 #if CONFIG_CODEC==SWCODEC
1075 entry->lead_trim = info.enc_delay;
1076 entry->tail_trim = info.enc_padding;
1077 #endif
1079 memcpy(entry->toc, info.toc, sizeof(info.toc));
1081 entry->vbr_header_pos = info.vbr_header_pos;
1083 /* Update the seek point for the first playable frame */
1084 entry->first_frame_offset = bytecount;
1085 DEBUGF("First frame is at %lx\n", entry->first_frame_offset);
1087 return filetime;
1091 * Checks all relevant information (such as ID3v1 tag, ID3v2 tag, length etc)
1092 * about an MP3 file and updates it's entry accordingly.
1094 Note, that this returns true for successful, false for error! */
1095 bool get_mp3_metadata(int fd, struct mp3entry *entry, const char *filename, bool v1first)
1097 int v1found = false;
1099 #if CONFIG_CODEC != SWCODEC
1100 memset(entry, 0, sizeof(struct mp3entry));
1101 #endif
1103 strncpy(entry->path, filename, sizeof(entry->path));
1105 entry->title = NULL;
1106 entry->filesize = filesize(fd);
1107 entry->id3v2len = getid3v2len(fd);
1108 entry->tracknum = 0;
1110 if(v1first)
1111 v1found = setid3v1title(fd, entry);
1113 if (!v1found && entry->id3v2len)
1114 setid3v2title(fd, entry);
1115 entry->length = getsonglength(fd, entry);
1117 /* Subtract the meta information from the file size to get
1118 the true size of the MP3 stream */
1119 entry->filesize -= entry->first_frame_offset;
1121 /* only seek to end of file if no id3v2 tags were found,
1122 and we already haven't looked for a v1 tag */
1123 if (!v1first && !entry->id3v2len) {
1124 setid3v1title(fd, entry);
1127 if(!entry->length || (entry->filesize < 8 ))
1128 /* no song length or less than 8 bytes is hereby considered to be an
1129 invalid mp3 and won't be played by us! */
1130 return false;
1132 return true;
/*
 * Opens filename read-only, collects its metadata into entry with
 * get_mp3_metadata() and closes the file again.
 *
 * Note, that this returns false for successful, true for error!
 * (the opposite of get_mp3_metadata) */
bool mp3info(struct mp3entry *entry, const char *filename, bool v1first)
{
    int fd;
    bool result;

    fd = open(filename, O_RDONLY);
    if (fd < 0)
        return true;

    result = !get_mp3_metadata(fd, entry, filename, v1first);

    close(fd);

    return result;
}
1152 void adjust_mp3entry(struct mp3entry *entry, void *dest, void *orig)
1154 long offset;
1155 if (orig > dest)
1156 offset = - ((size_t)orig - (size_t)dest);
1157 else
1158 offset = (size_t)dest - (size_t)orig;
1160 if (entry->title)
1161 entry->title += offset;
1162 if (entry->artist)
1163 entry->artist += offset;
1164 if (entry->album)
1165 entry->album += offset;
1166 if (entry->genre_string)
1167 entry->genre_string += offset;
1168 if (entry->track_string)
1169 entry->track_string += offset;
1170 if (entry->year_string)
1171 entry->year_string += offset;
1172 if (entry->composer)
1173 entry->composer += offset;
1174 if (entry->comment)
1175 entry->comment += offset;
1176 if (entry->albumartist)
1177 entry->albumartist += offset;
1178 #if CONFIG_CODEC == SWCODEC
1179 if (entry->track_gain_string)
1180 entry->track_gain_string += offset;
1181 if (entry->album_gain_string)
1182 entry->album_gain_string += offset;
1183 #endif
1186 void copy_mp3entry(struct mp3entry *dest, struct mp3entry *orig)
1188 memcpy(dest, orig, sizeof(struct mp3entry));
1189 adjust_mp3entry(dest, dest, orig);
1192 #ifdef DEBUG_STANDALONE
/**
 * Format a duration given in milliseconds as "M:SS.T" (minutes, two-digit
 * seconds, tenths of a second).
 *
 * Returns a pointer to a static buffer that is overwritten by the next
 * call.
 */
char *secs2str(int ms)
{
    static char buffer[32];
    int secs = ms/1000;
    ms %= 1000;
    snprintf(buffer, sizeof(buffer), "%d:%02d.%d", secs/60, secs%60, ms/100);
    return buffer;
}
1203 int main(int argc, char **argv)
1205 int i;
1206 for(i=1; i<argc; i++) {
1207 struct mp3entry mp3;
1208 mp3.album = "Bogus";
1209 if(mp3info(&mp3, argv[i], false)) {
1210 printf("Failed to get %s\n", argv[i]);
1211 return 0;
1214 printf("****** File: %s\n"
1215 " Title: %s\n"
1216 " Artist: %s\n"
1217 " Album: %s\n"
1218 " Genre: %s (%d) \n"
1219 " Composer: %s\n"
1220 " Year: %s (%d)\n"
1221 " Track: %s (%d)\n"
1222 " Length: %s / %d s\n"
1223 " Bitrate: %d\n"
1224 " Frequency: %d\n",
1225 argv[i],
1226 mp3.title?mp3.title:"<blank>",
1227 mp3.artist?mp3.artist:"<blank>",
1228 mp3.album?mp3.album:"<blank>",
1229 mp3.genre_string?mp3.genre_string:"<blank>",
1230 mp3.genre,
1231 mp3.composer?mp3.composer:"<blank>",
1232 mp3.year_string?mp3.year_string:"<blank>",
1233 mp3.year,
1234 mp3.track_string?mp3.track_string:"<blank>",
1235 mp3.tracknum,
1236 secs2str(mp3.length),
1237 mp3.length/1000,
1238 mp3.bitrate,
1239 mp3.frequency);
1242 return 0;
1245 #endif