/* rockbox/apps/metadata.c (715 lines, 23 KiB, C) */

/***************************************************************************
 *             __________               __   ___.
 *   Open      \______   \ ____   ____ |  | _\_ |__   _______  ___
 *   Source     |       _//  _ \_/ ___\|  |/ /| __ \ /  _ \  \/  /
 *   Jukebox    |    |   (  <_> )  \___|    < | \_\ (  <_> > <  <
 *   Firmware   |____|_  /\____/ \___  >__|_ \|___  /\____/__/\_ \
 *                     \/            \/     \/    \/            \/
* $Id$
*
* Copyright (C) 2005 Dave Chapman
*
* All files in this archive are subject to the GNU General Public License.
* See the file COPYING in the source tree root for full license agreement.
*
* This software is distributed on an "AS IS" basis, WITHOUT WARRANTY OF ANY
* KIND, either express or implied.
*
****************************************************************************/
#include <stdio.h>
#include <string.h>
#include <stdlib.h>
#include <ctype.h>
#include "metadata.h"
#include "mp3_playback.h"
#include "mp3data.h"
#include "logf.h"
#include "atoi.h"
/* Guess the audio format of a file purely from its filename extension.
 *
 * filename: path or name of the file; only the text after the last '.' is
 *           examined, and the comparison ignores case.
 *
 * Returns the matching AFMT_* code, or AFMT_UNKNOWN when the name has no
 * '.' or the extension is not in the table below.
 */
int probe_file_format(const char *filename)
{
    /* Extension -> format map, searched in order. */
    static const struct {
        const char *extension;
        int format;
    } known_formats[] = {
        { "mp1",  AFMT_MPA_L1 },
        { "mp2",  AFMT_MPA_L2 },
        { "mpa",  AFMT_MPA_L2 },
        { "mp3",  AFMT_MPA_L3 },
        { "ogg",  AFMT_OGG_VORBIS },
        { "wav",  AFMT_PCM_WAV },
        { "flac", AFMT_FLAC },
        { "mpc",  AFMT_MPC },
        { "aac",  AFMT_AAC },
        { "ape",  AFMT_APE },
        { "wma",  AFMT_WMA },
        { "a52",  AFMT_A52 },
        { "ac3",  AFMT_A52 },
        { "rm",   AFMT_REAL },
        { "wv",   AFMT_WAVPACK },
    };
    const char *dot = strrchr(filename, '.');
    unsigned int idx;

    if (dot == NULL)
        return AFMT_UNKNOWN;

    for (idx = 0; idx < sizeof(known_formats) / sizeof(known_formats[0]); idx++) {
        if (strcasecmp(known_formats[idx].extension, dot + 1) == 0)
            return known_formats[idx].format;
    }

    return AFMT_UNKNOWN;
}
/* A52/AC3 bitrate table. get_metadata() indexes it with the masked frame
   size code shifted right by one and stores the value in id3.bitrate
   (presumably kbit/s, like the other codecs handled in this file).
   There are 19 entries, so the index must not exceed 18. */
unsigned short a52_bitrates[]={32,40,48,56,64,80,96,
112,128,160,192,224,256,320,
384,448,512,576,640};
/* A52 frame sizes for 44.1KHz streams; get_metadata() uses an entry directly
   as the number of bytes per frame, indexed by the frame size code.
   Only 44.1KHz needs a table - for the other sample rates the frame size is
   simply a multiple of the bitrate. There are 38 entries. */
unsigned short a52_441framesizes[]=
{69*2,70*2,87*2,88*2,104*2,105*2,121*2,122*2,
139*2,140*2,174*2,175*2,208*2,209*2,243*2,244*2,
278*2,279*2,348*2,349*2,417*2,418*2,487*2,488*2,
557*2,558*2,696*2,697*2,835*2,836*2,975*2,976*2,
1114*2,1115*2,1253*2,1254*2,1393*2,1394*2};
/* Sample rates selectable by the 4-bit sample rate index in a WavPack block
   header. get_metadata() stores the chosen entry in id3.frequency. The table
   has 15 entries (indices 0..14); index 15 is handled separately by the
   caller, which falls back to 44100. */
const long wavpack_sample_rates [] = { 6000, 8000, 9600, 11025, 12000, 16000,
22050, 24000, 32000, 44100, 48000, 64000, 88200, 96000, 192000 };
static bool get_apetag_info (struct mp3entry *entry, int fd);

/* Assemble a 32-bit little-endian value from four bytes. Done in unsigned
   long so that a top byte >= 0x80 is never shifted into the sign bit of an
   int. */
static unsigned long metadata_get_le32(const unsigned char *p)
{
    return (unsigned long)p[0] |
           ((unsigned long)p[1] << 8) |
           ((unsigned long)p[2] << 16) |
           ((unsigned long)p[3] << 24);
}

/* Copy the track's filename into id3.path. strncpy() does not terminate the
   destination when the source fills it completely, so terminate explicitly. */
static void metadata_store_path(struct track_info *track, const char *trackname)
{
    strncpy(track->id3.path, trackname, sizeof(track->id3.path));
    track->id3.path[sizeof(track->id3.path) - 1] = '\0';
}

/* Get metadata for track - return false if parsing showed problems with the
   file that would prevent playback.

   track     - entry to fill in; track->id3.codectype selects the parser
   fd        - open file descriptor of the track; it is rewound to the start
               of the file on every successful path
   trackname - filename, stored in track->id3.path
   v1first   - passed through to mp3info() for MPEG audio files

   For every format except MPEG audio, track->id3.path doubles as a scratch
   buffer while the headers are parsed and is overwritten with the filename
   at the end. */
bool get_metadata(struct track_info* track, int fd, const char* trackname,
                  bool v1first)
{
    unsigned long totalsamples, bytespersample, channels, bitspersample, numbytes;
    int bytesperframe;
    unsigned char *buf;
    int i, j, eof;
    int rc;

    /* Load codec specific track tag information. */
    switch (track->id3.codectype) {
    case AFMT_MPA_L1:
    case AFMT_MPA_L2:
    case AFMT_MPA_L3:
        /* Should check the return value. */
        mp3info(&track->id3, trackname, v1first);
        lseek(fd, 0, SEEK_SET);

        /* This is too slow to execute on some files. */
        get_mp3file_info(fd, &track->mp3data);
        lseek(fd, 0, SEEK_SET);

        /*
        logf("T:%s", track->id3.title);
        logf("L:%d", track->id3.length);
        logf("O:%d", track->id3.first_frame_offset);
        logf("F:%d", track->id3.frequency);
        */
        track->taginfo_ready = true;
        break;

    case AFMT_PCM_WAV:
        /* Use the trackname part of the id3 structure as a temporary buffer */
        buf = (unsigned char *)track->id3.path;

        lseek(fd, 0, SEEK_SET);

        rc = read(fd, buf, 44);
        if (rc < 44) {
            return false;
        }

        if ((memcmp(buf, "RIFF", 4) != 0) ||
            (memcmp(&buf[8], "WAVEfmt", 7) != 0)) {
            logf("%s is not a WAV file\n", trackname);
            return false;
        }

        /* FIX: Correctly parse WAV header - we assume canonical
           44-byte header */
        bitspersample = buf[34];
        channels = buf[22];

        if ((bitspersample != 16) || (channels != 2)) {
            /* The values are single bytes, so the casts to match %d are
               lossless. */
            logf("Unsupported WAV file - %d bitspersample, %d channels\n",
                 (int)bitspersample, (int)channels);
            return false;
        }

        bytespersample = ((bitspersample / 8) * channels);
        numbytes = metadata_get_le32(&buf[40]);
        totalsamples = numbytes / bytespersample;

        track->id3.vbr = false; /* All WAV files are CBR */
        track->id3.filesize = filesize(fd);
        track->id3.frequency = metadata_get_le32(&buf[24]);
        if (track->id3.frequency == 0) {
            /* A zero sample rate is unplayable and would divide by zero */
            return false;
        }

        /* Calculate track length (in ms) and estimate the bitrate (in kbit/s) */
        track->id3.length = (totalsamples / track->id3.frequency) * 1000;
        track->id3.bitrate = (track->id3.frequency * bytespersample) / (1000 / 8);

        lseek(fd, 0, SEEK_SET);
        metadata_store_path(track, trackname);
        track->taginfo_ready = true;
        break;

    case AFMT_FLAC:
        /* A simple parser to read vital metadata from a FLAC file - length,
           frequency, bitrate etc. */
        /* This code should either be moved to a separate file, or discarded
           in favour of the libFLAC code */
        /* The FLAC stream specification can be found at
           http://flac.sourceforge.net/format.html#stream */

        /* Use the trackname part of the id3 structure as a temporary buffer */
        buf = (unsigned char *)track->id3.path;

        lseek(fd, 0, SEEK_SET);

        rc = read(fd, buf, 4);
        if (rc < 4) {
            return false;
        }

        if (memcmp(buf, "fLaC", 4) != 0) {
            logf("%s is not a FLAC file\n", trackname);
            return false;
        }

        while (1) {
            bool last_block;
            int block_type;

            rc = read(fd, buf, 4);
            if (rc < 4) {
                /* Ran out of file before the last metadata block */
                return false;
            }

            /* Remember the header fields now: reading STREAMINFO below
               reuses buf and would otherwise lose the last-block flag. */
            last_block = (buf[0] & 0x80) != 0;
            block_type = buf[0] & 0x7f;
            i = (buf[1] << 16) | (buf[2] << 8) | buf[3]; /* The length of the block */

            if (block_type == 0) { /* 0 is the STREAMINFO block */
                /* The length comes from the file: it must cover the fields
                   read below (up to buf[17]) and fit the scratch buffer. */
                if ((i < 18) || (i > (int)sizeof(track->id3.path))) {
                    return false;
                }

                rc = read(fd, buf, i);
                if (rc < i) {
                    return false;
                }

                track->id3.vbr = true; /* All FLAC files are VBR */
                track->id3.filesize = filesize(fd);

                track->id3.frequency = (buf[10] << 12) | (buf[11] << 4) |
                                       ((buf[12] & 0xf0) >> 4);
                if (track->id3.frequency == 0) {
                    return false;
                }

                /* NOT NEEDED: bitspersample=(((buf[12]&0x01)<<4)|((buf[13]&0xf0)>>4))+1; */

                /* totalsamples is a 36-bit field, but we assume <= 32 bits are used */
                totalsamples = metadata_get_le32(&buf[14]);
                /* The field is big-endian, so swap the byte order back */
                totalsamples = ((totalsamples & 0x000000ffUL) << 24) |
                               ((totalsamples & 0x0000ff00UL) << 8) |
                               ((totalsamples & 0x00ff0000UL) >> 8) |
                               ((totalsamples & 0xff000000UL) >> 24);

                /* Calculate track length (in ms) and estimate the bitrate (in kbit/s) */
                track->id3.length = (totalsamples / track->id3.frequency) * 1000;
                if (track->id3.length > 0) {
                    track->id3.bitrate = (filesize(fd) * 8) / track->id3.length;
                } else {
                    /* Less than one second of audio: no usable estimate */
                    track->id3.bitrate = 0;
                }
            } else {
                /* VORBIS_COMMENT (type 4) and every other block type are
                   just skipped for now. */
                lseek(fd, i, SEEK_CUR);
            }

            if (last_block) {
                break;
            }
        }

        lseek(fd, 0, SEEK_SET);
        metadata_store_path(track, trackname);
        track->taginfo_ready = true;
        break;

    case AFMT_OGG_VORBIS:
        /* A simple parser to read vital metadata from an Ogg Vorbis file */

        /* An Ogg File is split into pages, each starting with the string
           "OggS". Each page has a timestamp (in PCM samples) referred to as
           the "granule position".

           An Ogg Vorbis has the following structure:
           1) Identification header (containing samplerate, numchannels, etc)
           2) Comment header - containing the Vorbis Comments
           3) Setup header - containing codec setup information
           4) Many audio packets...
        */

        /* Use the trackname part of the id3 structure as a temporary buffer */
        buf = (unsigned char *)track->id3.path;

        lseek(fd, 0, SEEK_SET);

        /* All 58 bytes are needed: the fields used below reach buf[43] */
        rc = read(fd, buf, 58);
        if (rc < 58) {
            return false;
        }

        if ((memcmp(buf, "OggS", 4) != 0) || (memcmp(&buf[29], "vorbis", 6) != 0)) {
            logf("%s is not an Ogg Vorbis file\n", trackname);
            return false;
        }

        /* Ogg stores integers in little-endian format. */
        track->id3.filesize = filesize(fd);
        track->id3.frequency = metadata_get_le32(&buf[40]);
        if (track->id3.frequency == 0) {
            return false;
        }

        /* We now need to search for the last page in the file - identified by
           ('O','g','g','S',0) and retrieve totalsamples */
        lseek(fd, -32*1024, SEEK_END);
        eof = 0;
        j = 0; /* The number of bytes currently in buffer */
        totalsamples = 0;

        while (!eof) {
            rc = read(fd, &buf[j], sizeof(track->id3.path) - j);
            if (rc <= 0) {
                eof = 1;
            } else {
                j += rc;
            }

            /* Inefficient (but simple) search */
            i = 0;
            while (i < (j - 5)) {
                if (memcmp(&buf[i], "OggS", 5) == 0) {
                    if (i < (j - 10)) {
                        /* Low 32 bits of the granule position */
                        totalsamples = metadata_get_le32(&buf[i + 6]);
                        /* Keep scanning - a later page may start in the
                           same buffer */
                        i += 5;
                    } else {
                        /* The page header continues in the next read */
                        break;
                    }
                } else {
                    i++;
                }
            }

            /* Carry the unscanned tail (at most 10 bytes) over to the next
               read so that a header split across two reads is still found */
            if (i < j) {
                memmove(buf, &buf[i], j - i);
                j -= i;
            } else {
                j = 0;
            }
        }

        track->id3.length = (totalsamples / track->id3.frequency) * 1000;

        /* The following calculation should use datasize, not filesize
           (i.e. exclude comments etc) */
        if (track->id3.length > 0) {
            track->id3.bitrate = (filesize(fd) * 8) / track->id3.length;
        } else {
            /* Less than one second of audio: no usable estimate */
            track->id3.bitrate = 0;
        }
        track->id3.vbr = true;

        lseek(fd, 0, SEEK_SET);
        metadata_store_path(track, trackname);
        track->taginfo_ready = true;
        break;

    case AFMT_WAVPACK:
        /* A simple parser to read basic information from a WavPack file.
         * This will fail on WavPack files that don't have the WavPack header
         * as the first thing (i.e. self-extracting WavPack files) or WavPack
         * files that have so much extra RIFF data stored in the first block
         * that they don't have samples (very rare, I would think).
         */

        /* Use the trackname part of the id3 structure as a temporary buffer */
        buf = (unsigned char *)track->id3.path;

        lseek(fd, 0, SEEK_SET);

        rc = read(fd, buf, 32);
        if (rc < 32) {
            return false;
        }

        if (memcmp (buf, "wvpk", 4) != 0 || buf [9] != 4 || buf [8] < 2) {
            logf ("%s is not a WavPack file\n", trackname);
            return false;
        }

        track->id3.vbr = true; /* All WavPack files are VBR */
        track->id3.filesize = filesize (fd);

        if ((buf [20] | buf [21] | buf [22] | buf [23]) &&
            (buf [12] & buf [13] & buf [14] & buf [15]) != 0xff) {
            int srindx = ((buf [26] >> 7) & 1) + ((buf [27] << 1) & 14);

            if (srindx == 15)
                track->id3.frequency = 44100;
            else
                track->id3.frequency = wavpack_sample_rates [srindx];

            totalsamples = metadata_get_le32(&buf[12]);
            track->id3.length = totalsamples / (track->id3.frequency / 100) * 10;

            if ((track->id3.length / 8) > 0) {
                track->id3.bitrate = filesize (fd) / (track->id3.length / 8);
            } else {
                /* Track shorter than 8 ms: no usable estimate */
                track->id3.bitrate = 0;
            }
        }

        get_apetag_info (&track->id3, fd); /* use any apetag info we find */
        lseek (fd, 0, SEEK_SET);
        metadata_store_path(track, trackname);
        track->taginfo_ready = true;
        break;

    case AFMT_A52:
        /* Use the trackname part of the id3 structure as a temporary buffer */
        buf = (unsigned char *)track->id3.path;

        lseek(fd, 0, SEEK_SET);

        /* We just need the first 5 bytes */
        rc = read(fd, buf, 5);
        if (rc < 5) {
            return false;
        }

        if ((buf[0] != 0x0b) || (buf[1] != 0x77)) {
            logf("%s is not an A52/AC3 file\n", trackname);
            return false;
        }

        i = buf[4] & 0x3e;
        if (i > 36) {
            logf("A52: Invalid frmsizecod: %d\n", i);
            return false;
        }

        track->id3.bitrate = a52_bitrates[i >> 1];
        track->id3.vbr = false;
        track->id3.filesize = filesize (fd);

        switch (buf[4] & 0xc0) {
        case 0x00:
            track->id3.frequency = 48000;
            bytesperframe = track->id3.bitrate * 2 * 2;
            break;

        case 0x40:
            track->id3.frequency = 44100;
            bytesperframe = a52_441framesizes[i];
            break;

        case 0x80:
            track->id3.frequency = 32000;
            bytesperframe = track->id3.bitrate * 3 * 2;
            break;

        default:
            logf("A52: Invalid samplerate code: 0x%02x\n", buf[4] & 0xc0);
            return false;
        }

        /* One A52 frame contains 6 blocks, each containing 256 samples */
        totalsamples = (track->filesize / bytesperframe) * 6 * 256;
        track->id3.length = (totalsamples / track->id3.frequency) * 1000;

        lseek(fd, 0, SEEK_SET);
        metadata_store_path(track, trackname);
        track->taginfo_ready = true;
        break;

    /* If we don't know how to read the metadata, just store the filename */
    default:
        metadata_store_path(track, trackname);
        track->taginfo_ready = true;
        break;
    }

    return true;
}
/************************* APE TAG HANDLING CODE ****************************/
/*
* This is a first pass at APEv2 tag handling. I'm not sure if this should
* reside here, but I wanted to modify as little as possible since I don't
* have a feel for the complete system. It may be that APEv2 tags should be
* added to the ID3 handling code in the firmware directory. APEv2 tags are
* used in WavPack files and Musepack files by default, however they are
* also used in MP3 files sometimes (by Foobar2000). Also, WavPack files can
* also use ID3v1 tags (but not ID3v2), so it seems like some universal tag
* handler might be a reasonable approach.
*
* This code does not currently handle APEv1 tags, but I believe that this
* is not a problem because they were only used in Monkey's Audio files which
* will probably never be playable in RockBox (and certainly not by this CPU).
*/
/* Format string handed to little_endian_to_native() for the tag header:
   skip 8 bytes, then convert four 4-byte little-endian words. */
#define APETAG_HEADER_FORMAT "8LLLL"
/* Number of bytes read from the file into struct apetag_header. */
#define APETAG_HEADER_LENGTH 32
/* Size of the in-memory item buffer; load_apetag() refuses any tag whose
   length field is not below this limit. */
#define APETAG_DATA_LIMIT 4096
/*
 * In-memory image of the APEv2 tag header/footer. The structure is filled by
 * reading APETAG_HEADER_LENGTH (32) raw bytes from the file and is then
 * converted in place using APETAG_HEADER_FORMAT, so its layout must match
 * the file exactly: 8 id bytes, four 32-bit words, 8 reserved bytes.
 *
 * The numeric fields are therefore declared as int (32 bits on every
 * supported target) rather than long, which is 64 bits wide on LP64 hosts
 * and would stretch the structure to 48 bytes.
 */
struct apetag_header {
    char id [8];            /* "APETAGEX" when a tag is present */
    int version;            /* load_apetag() accepts only 2000 */
    int length;             /* counts the item data plus these 32 bytes */
    int item_count;         /* number of items in the tag */
    int flags;
    char res [8];           /* not used by this file */
};
/* An APEv2 tag as held in memory: the header/footer followed by the raw item
   data read from the file. temp_apetag is the single static instance used as
   scratch space while get_apetag_info() extracts the fields it wants. */
static struct apetag {
struct apetag_header header;
char data [APETAG_DATA_LIMIT];
} temp_apetag;
/* Forward declarations of the APE tag helpers defined further down. */
static int get_apetag_item (struct apetag *tag,
const char *item,
char *value,
int size);
static int load_apetag (int fd, struct apetag *tag);
static void UTF8ToAnsi (unsigned char *pUTF8);
/*
 * Helper for get_apetag_info(): fetch the named string item from temp_apetag
 * into the free space at *cursor, convert it from UTF-8, and mark the space
 * it occupies (terminator included) as used by advancing *cursor and
 * shrinking *space. Returns the stored string, or NULL when no room is left
 * or the item is not present.
 */
static char *apetag_claim_string (const char *item, char **cursor, int *space)
{
    char *text = *cursor;
    int used;

    if (*space <= 1 || !get_apetag_item (&temp_apetag, item, text, *space))
        return NULL;

    UTF8ToAnsi ((unsigned char *) text);
    used = strlen (text) + 1;
    *cursor += used;
    *space -= used;
    return text;
}

/*
 * Look for an APEv2 tag in the given file and copy what it provides into the
 * mp3entry: year and track number as integers, and artist, title, album,
 * genre and composer as strings. The tag itself is parsed in a temporary
 * static buffer; the strings that must outlive this call are packed one after
 * another into the entry's "id3v2buf" field (which should not be used for any
 * file that has an APEv2 tag). The combined length of those strings is
 * therefore limited by the size of that buffer (300 characters according to
 * the original author's note).
 *
 * Returns false if id3v2buf is too small to be useful or no tag could be
 * loaded, true otherwise.
 */
static bool get_apetag_info (struct mp3entry *entry, int fd)
{
    char *free_ptr = entry->id3v2buf;
    int free_len = sizeof (entry->id3v2buf);
    char *text;

    if (free_len <= 1)
        return false;

    if (!load_apetag (fd, &temp_apetag))
        return false;

    /* Numeric items only borrow the start of the free area as scratch */
    if (get_apetag_item (&temp_apetag, "year", free_ptr, free_len))
        entry->year = atoi (free_ptr);

    if (get_apetag_item (&temp_apetag, "track", free_ptr, free_len))
        entry->tracknum = atoi (free_ptr);

    /* String items are kept, each one consuming part of the free area */
    text = apetag_claim_string ("artist", &free_ptr, &free_len);
    if (text != NULL)
        entry->artist = text;

    text = apetag_claim_string ("title", &free_ptr, &free_len);
    if (text != NULL)
        entry->title = text;

    text = apetag_claim_string ("album", &free_ptr, &free_len);
    if (text != NULL)
        entry->album = text;

    text = apetag_claim_string ("genre", &free_ptr, &free_len);
    if (text != NULL)
        entry->genre_string = text;

    text = apetag_claim_string ("composer", &free_ptr, &free_len);
    if (text != NULL)
        entry->composer = text;

    return true;
}
/* Compile-time checks: the conversions below rely on these exact widths. */
typedef char le2n_int_must_be_4_bytes [(sizeof (unsigned int) == 4) ? 1 : -1];
typedef char le2n_short_must_be_2_bytes [(sizeof (unsigned short) == 2) ? 1 : -1];

/*
 * Helper function to convert little-endian structures to easily usable native
 * format using a format string (this does nothing on a little-endian machine).
 *
 * data   - start of the packed little-endian data, converted in place
 * format - one character per field, processed left to right:
 *            'L'       4-byte word
 *            'S'       2-byte word
 *            '0'-'9'   skip that many bytes unchanged
 *          any other character is ignored
 *
 * Exactly 4 (or 2) bytes are rewritten per field, and they are written with
 * memcpy() so the data needs no particular alignment and nothing beyond the
 * field is touched, whatever the width of long on the host.
 */
static void little_endian_to_native (void *data, const char *format)
{
    unsigned char *cp = (unsigned char *) data;

    for (; *format; format++) {
        switch (*format) {
            case 'L': {
                unsigned int word = (unsigned int) cp [0] |
                                    ((unsigned int) cp [1] << 8) |
                                    ((unsigned int) cp [2] << 16) |
                                    ((unsigned int) cp [3] << 24);

                memcpy (cp, &word, sizeof (word));
                cp += 4;
                break;
            }

            case 'S': {
                unsigned short half = (unsigned short) (cp [0] | (cp [1] << 8));

                memcpy (cp, &half, sizeof (half));
                cp += 2;
                break;
            }

            default:
                if (*format >= '0' && *format <= '9')
                    cp += *format - '0';

                break;
        }
    }
}
/* Read a 32-bit little-endian word from possibly unaligned tag data. */
static long apetag_item_le32 (const unsigned char *p)
{
    return (long) ((unsigned long) p [0] |
                   ((unsigned long) p [1] << 8) |
                   ((unsigned long) p [2] << 16) |
                   ((unsigned long) p [3] << 24));
}

/*
 * Attempt to obtain the named string-type item from the specified APEv2 tag.
 * The tag value will be copied to "value" (including an appended terminating
 * NUL) and the length of the string (including the NUL) will be returned.
 * If the data will not fit in the specified "size" then it will be truncated
 * early (but still terminated). If the specified item is not found then 0 is
 * returned and written to the first character of "value". If "value" is
 * passed in as NULL (or "size" is not positive), then nothing is copied and
 * the actual size required to store the value is returned.
 *
 * Note that this function does not work on binary tag data; only UTF-8
 * encoded strings. However, numeric data (like ReplayGain) is usually stored
 * as strings.
 *
 * Also, APEv2 tags may have multiple values for a given item and these will
 * all be copied to "value" with NUL separators (this is why the total data
 * size is returned). Of course, it is possible to ignore any additional
 * values by simply using up to the first NUL.
 *
 * The tag data comes straight from the file, so every length is checked
 * against the end of the loaded data before it is used; the search stops at
 * the first item that does not fit.
 */
static int get_apetag_item (struct apetag *tag,
                            const char *item,
                            char *value,
                            int size)
{
    const char *p, *end;
    int i;

    if (value && size > 0)
        *value = 0;

    if (tag->header.id [0] != 'A')
        return 0;

    p = tag->data;
    end = p + tag->header.length - APETAG_HEADER_LENGTH;

    for (i = 0; i < tag->header.item_count; ++i) {
        const char *key_end;
        long vsize, flags, isize;

        /* Each item starts with two 32-bit words: value size and flags */
        if (end - p < 8)
            break;

        vsize = apetag_item_le32 ((const unsigned char *) p);
        flags = apetag_item_le32 ((const unsigned char *) p + 4);
        p += 8;

        /* The key is NUL terminated; never look for the NUL past the data */
        key_end = memchr (p, 0, end - p);

        if (!key_end)
            break;

        isize = key_end - p;

        /* The value follows the key's NUL and must fit as well */
        if (vsize < 0 || vsize > (end - key_end) - 1)
            break;

        /* Bits 1-2 of the flags must be clear, otherwise the item is not
           treated as a text string */
        if (isize && vsize && !strcasecmp (item, p) && !(flags & 6)) {
            if (value && size > 0) {
                if (vsize + 1 > size)
                    vsize = size - 1;

                memcpy (value, key_end + 1, vsize);
                value [vsize] = 0;
            }

            return (int) (vsize + 1);
        }

        p = key_end + 1 + vsize;
    }

    return 0;
}
/*
 * Try to read an APEv2 tag from the end of the given file into "tag".
 *
 * The last APETAG_HEADER_LENGTH bytes of the file are read and must start
 * with "APETAGEX". After conversion to native byte order the header must
 * report version 2000, at least one item, and a length greater than
 * APETAG_HEADER_LENGTH but below APETAG_DATA_LIMIT; the item data is then
 * read from "length" bytes before the end of the file.
 *
 * Returns TRUE on success. On any failure the first byte of the header id is
 * cleared, which marks the tag as empty, and FALSE is returned.
 */
static int load_apetag (int fd, struct apetag *tag)
{
    int payload_size;

    /* Locate and identify the tag footer */
    if (lseek (fd, -APETAG_HEADER_LENGTH, SEEK_END) == -1)
        goto no_tag;

    if (read (fd, &tag->header, APETAG_HEADER_LENGTH) != APETAG_HEADER_LENGTH)
        goto no_tag;

    if (strncmp (tag->header.id, "APETAGEX", 8) != 0)
        goto no_tag;

    little_endian_to_native (&tag->header, APETAG_HEADER_FORMAT);

    /* Only non-empty APEv2 tags that fit our buffer are accepted */
    if (tag->header.version != 2000 || !tag->header.item_count)
        goto no_tag;

    if (tag->header.length <= APETAG_HEADER_LENGTH ||
        tag->header.length >= APETAG_DATA_LIMIT)
        goto no_tag;

    /* Fetch the items that precede the footer */
    payload_size = tag->header.length - APETAG_HEADER_LENGTH;

    if (lseek (fd, -tag->header.length, SEEK_END) == -1)
        goto no_tag;

    if (read (fd, tag->data, payload_size) != payload_size)
        goto no_tag;

    return true;

no_tag:
    tag->header.id [0] = 0;
    return false;
}
/*
 * This is a *VERY* simple attempt to convert UTF-8 unicode character
 * strings to ANSI. Characters in the range 0x01-0xFF are mapped directly to
 * an 8-bit value and all the rest are turned into question marks. This can
 * be done "in-place" because the resulting string can only get smaller.
 *
 * pUTF8 - NUL terminated UTF-8 string, overwritten with the converted text
 *
 * Handling of unusual input:
 *  - code points are accumulated in an unsigned long, so 4-byte sequences
 *    (above U+FFFF) become '?' instead of being truncated to 16 bits
 *  - a multi-byte sequence that is cut short (by an ASCII byte, by another
 *    lead byte or by the end of the string) yields one '?', and the byte that
 *    interrupted it is then processed normally
 *  - an encoded NUL (overlong form) yields '?' rather than a terminator in
 *    the middle of the output
 *  - continuation bytes that do not belong to any sequence are dropped
 */
static void UTF8ToAnsi (unsigned char *pUTF8)
{
    unsigned char *pAnsi = pUTF8;
    unsigned long widechar = 0;
    int trail_bytes = 0;     /* continuation bytes still expected */

    while (*pUTF8) {
        unsigned char ch = *pUTF8++;

        /* Anything other than a continuation byte ends a pending sequence */
        if (trail_bytes && (ch & 0xc0) != 0x80) {
            trail_bytes = 0;
            *pAnsi++ = '?';
        }

        if (!(ch & 0x80)) {
            /* Plain ASCII */
            *pAnsi++ = ch;
        }
        else if (ch & 0x40) {
            /* Lead byte: the number of leading 1 bits is the total length
               of the sequence, the remaining low bits start the code point */
            unsigned char temp = ch;

            while (temp & 0x80) {
                trail_bytes++;
                temp <<= 1;
            }

            widechar = temp >> trail_bytes;
            trail_bytes--;
        }
        else if (trail_bytes) {
            /* Continuation byte: contributes six more bits */
            widechar = (widechar << 6) | (ch & 0x3f);

            if (!--trail_bytes)
                *pAnsi++ = (widechar > 0 && widechar < 0x100) ?
                           (unsigned char) widechar : '?';
        }
    }

    /* String ended in the middle of a sequence */
    if (trail_bytes)
        *pAnsi++ = '?';

    *pAnsi = 0;
}