WMA Voice now plays and seeks in the sim. The code is still in floating point and is not added to the main build. There is still a bug in the decoder in its current state: it outputs fewer samples than ffmpeg's decoder does.

git-svn-id: svn://svn.rockbox.org/rockbox/trunk@27744 a1c6a512-1295-4272-9138-f99709370657
2010-08-07 17:55:02 +00:00 · 2010-08-07 17:55:02 +00:00 · 4ff2cf4f0c
commit 4ff2cf4f0c
parent eb369699c6
9 changed files with 296 additions and 7 deletions
--- a/apps/codecs/libasf/asf.h
+++ b/apps/codecs/libasf/asf.h
@ -7,6 +7,7 @@
 #define ASF_CODEC_ID_WMAV1      0x160
 #define ASF_CODEC_ID_WMAV2      0x161
 #define ASF_CODEC_ID_WMAPRO     0x162
+#define ASF_CODEC_ID_WMAVOICE   0x00A

 enum asf_error_e {
    ASF_ERROR_INTERNAL       = -1,  /* incorrect input to API calls */
@ -33,7 +34,7 @@ struct asf_waveformatex_s {
    uint16_t bitspersample;
    uint16_t datalen;
    uint16_t numpackets;
-    uint8_t data[18];
+    uint8_t data[46];
 };
 typedef struct asf_waveformatex_s asf_waveformatex_t;

--- a/apps/codecs/libwmavoice/SOURCES
+++ b/apps/codecs/libwmavoice/SOURCES
@ -0,0 +1,17 @@
+acelp_filters.c
+acelp_vectors.c
+avfft.c
+bitstream.c
+celp_filters.c
+celp_math.c
+dct.c
+fft.c
+lsp.c
+mdct.c
+rdft.c
+utils.c
+wmavoice.c
+libavutil/log.c
+libavutil/lzo.c
+libavutil/mem.c
+libavutil/mathematics.c
--- a/apps/codecs/libwmavoice/libwmavoice.make
+++ b/apps/codecs/libwmavoice/libwmavoice.make
@ -0,0 +1,37 @@
+#             __________               __   ___.
+#   Open      \______   \ ____   ____ |  | _\_ |__   _______  ___
+#   Source     |       _//  _ \_/ ___\|  |/ /| __ \ /  _ \  \/  /
+#   Jukebox    |    |   (  <_> )  \___|    < | \_\ (  <_> > <  <
+#   Firmware   |____|_  /\____/ \___  >__|_ \|___  /\____/__/\_ \
+#                     \/            \/     \/    \/            \/
+# $Id: libwmavoice.make 27586 2010-07-27 06:48:15Z nls $
+#
+
+# libwmavoice
+# Static library assembled from the files listed in libwmavoice/SOURCES.
+WMAVOICELIB := $(CODECDIR)/libwmavoice.a
+WMAVOICELIB_SRC := $(call preprocess, $(APPSDIR)/codecs/libwmavoice/SOURCES)
+WMAVOICELIB_OBJ := $(call c2obj, $(WMAVOICELIB_SRC))
+OTHER_SRC += $(WMAVOICELIB_SRC)
+
+# Archive rule: any existing archive is removed first, then ar creates it
+# from all of the library's object files.
+$(WMAVOICELIB): $(WMAVOICELIB_OBJ)
+	$(SILENT)$(shell rm -f $@)
+	$(call PRINTS,AR $(@F))$(AR) rcs $@ $^ >/dev/null
+
+# Codec flags with every -O<level> option filtered out, plus the libwmavoice
+# include path; the optimisation level is appended below.
+WMAVOICEFLAGS = -I$(APPSDIR)/codecs/libwmavoice $(filter-out -O%,$(CODECFLAGS))
+
+# -O2 on Coldfire, -O1 on every other CPU.
+ifeq ($(CPU),coldfire)
+	WMAVOICEFLAGS += -O2
+else
+	WMAVOICEFLAGS += -O1
+endif
+
+# Simulator-only link rule: links the codec's objects and archives into
+# wmavoice.elf with -lgcc -lm, then copies the .elf to the .codec target.
+ifeq ($(APP_TYPE),sdl-sim)
+# wmavoice needs libm in the simulator
+$(CODECDIR)/wmavoice.codec: $(CODECDIR)/wmavoice.o
+	$(call PRINTS,LD $(@F))$(CC) $(CODECFLAGS) -o $(CODECDIR)/wmavoice.elf \
+	$(filter %.o, $^) \
+	$(filter %.a, $+) \
+	-lgcc -lm $(CODECLDFLAGS)
+	$(SILENT)cp $(CODECDIR)/wmavoice.elf $@
+endif
+
--- a/apps/codecs/libwmavoice/wmavoice.c
+++ b/apps/codecs/libwmavoice/wmavoice.c
@ -26,7 +26,7 @@
 */

 #include <math.h>
-#include "avcodec.h"
+#include "wmavoice.h"
 #include "get_bits.h"
 #include "put_bits.h"
 #include "wmavoice_data.h"
@ -286,6 +286,10 @@ typedef struct {
     */
 } WMAVoiceContext;

+/* global decode context */
+static WMAVoiceContext globWMAVoiceCtx;
+
+
 /**
 * Set up the variable bit mode (VBM) tree from container extradata.
 * @param gb bit I/O context.
@ -330,9 +334,10 @@ static av_cold int decode_vbmtree(GetBitContext *gb, int8_t vbm_tree[25])
 /**
 * Set up decoder with parameters from demuxer (extradata etc.).
 */
-static av_cold int wmavoice_decode_init(AVCodecContext *ctx)
+av_cold int wmavoice_decode_init(AVCodecContext *ctx)
 {
    int n, flags, pitch_range, lsp16_flag;
+    ctx->priv_data = &globWMAVoiceCtx;
    WMAVoiceContext *s = ctx->priv_data;

    /**
@ -1743,7 +1748,7 @@ static int synth_superframe(AVCodecContext *ctx,
     * the wild yet. */
    if (!get_bits1(gb)) {
        av_log_missing_feature(ctx, "WMAPro-in-WMAVoice support", 1);
-        return -1;
+        return ERROR_WMAPRO_IN_WMAVOICE;
    }

    /* (optional) nr. of samples in superframe; always <= 480 and >= 0 */
@ -1893,7 +1898,7 @@ static void copy_bits(PutBitContext *pb,
 *
 * For more information about frames, see #synth_superframe().
 */
-static int wmavoice_decode_packet(AVCodecContext *ctx, void *data,
+int wmavoice_decode_packet(AVCodecContext *ctx, void *data,
                                  int *data_size, AVPacket *avpkt)
 {
    WMAVoiceContext *s = ctx->priv_data;
@ -1936,6 +1941,15 @@ static int wmavoice_decode_packet(AVCodecContext *ctx, void *data,
                s->sframe_cache_size += s->spillover_nbits;
                if ((res = synth_superframe(ctx, data, data_size)) == 0 &&
                    *data_size > 0) {
+                    /* convert the float values to int32 for rockbox */
+                    int i;
+                    int32_t *iptr = data;
+                    float   *fptr = data;
+                    for(i = 0; i < *data_size/sizeof(float); i++)
+                    {
+                        fptr[i] *= (float)(INT32_MAX);
+                        iptr[i] = (int32_t)fptr[i];
+                    }
                    cnt += s->spillover_nbits;
                    s->skip_bits_next = cnt & 7;
                    return cnt >> 3;
@ -1957,12 +1971,21 @@ static int wmavoice_decode_packet(AVCodecContext *ctx, void *data,
    } else if (*data_size > 0) {
        int cnt = get_bits_count(gb);
        s->skip_bits_next = cnt & 7;
+        /* convert the float values to int32 for rockbox */
+        int i;
+        int32_t *iptr = data;
+        float   *fptr = data;
+        for(i = 0; i < *data_size/sizeof(float); i++)
+        {
+            fptr[i] *= (float)(INT32_MAX);
+            iptr[i] = (int32_t)fptr[i];
+        }
        return cnt >> 3;
    } else if ((s->sframe_cache_size = pos) > 0) {
        /* rewind bit reader to start of last (incomplete) superframe... */
        init_get_bits(gb, avpkt->data, size << 3);
        skip_bits_long(gb, (size << 3) - pos);
-        assert(get_bits_left(gb) == pos);
+        //assert(get_bits_left(gb) == pos);

        /* ...and cache it for spillover in next packet */
        init_put_bits(&s->pb, s->sframe_cache, SFRAME_CACHE_MAXSIZE);
--- a/apps/codecs/libwmavoice/wmavoice.h
+++ b/apps/codecs/libwmavoice/wmavoice.h
@ -0,0 +1,7 @@
+#ifndef LIBWMAVOICE_WMAVOICE_H
+#define LIBWMAVOICE_WMAVOICE_H
+
+#include "avcodec.h"
+
+/* Error code returned by synth_superframe() when a superframe signals
+ * WMAPro-coded data inside the WMA Voice stream, which is not supported.
+ * The codec front end checks for this value on the result of
+ * wmavoice_decode_packet() so that it can skip the packet instead of
+ * aborting.  Parenthesised so the negative constant expands safely inside
+ * any expression. */
+#define ERROR_WMAPRO_IN_WMAVOICE (-0x162)
+
+/* Set up the decoder with parameters from the demuxer (extradata etc.).
+ * The decoder state is a single file-scope context that is attached to
+ * ctx->priv_data by this call.  Callers treat a negative return value as
+ * failure. */
+av_cold int wmavoice_decode_init(AVCodecContext *ctx);
+
+/* Decode data from one packet.
+ *   data       output buffer; decoded samples are stored as int32_t
+ *   data_size  in: size of the output buffer in bytes,
+ *              out: number of bytes written to it
+ *   avpkt      packet to read from
+ * A negative return value is an error; otherwise the caller advances the
+ * packet position by the returned number of bytes. */
+int wmavoice_decode_packet(AVCodecContext *ctx, void *data,
+                                  int *data_size, AVPacket *avpkt);
+
+#endif /* LIBWMAVOICE_WMAVOICE_H */
--- a/apps/codecs/wmavoice.c
+++ b/apps/codecs/wmavoice.c
@ -0,0 +1,195 @@
+/***************************************************************************
+ *             __________               __   ___.
+ *   Open      \______   \ ____   ____ |  | _\_ |__   _______  ___
+ *   Source     |       _//  _ \_/ ___\|  |/ /| __ \ /  _ \  \/  /
+ *   Jukebox    |    |   (  <_> )  \___|    < | \_\ (  <_> > <  <
+ *   Firmware   |____|_  /\____/ \___  >__|_ \|___  /\____/__/\_ \
+ *                     \/            \/     \/    \/            \/
+ * $Id$
+ *
+ * Copyright (C) 2010 Mohamed Tarek
+ *
+ * This program is free software; you can redistribute it and/or
+ * modify it under the terms of the GNU General Public License
+ * as published by the Free Software Foundation; either version 2
+ * of the License, or (at your option) any later version.
+ *
+ * This software is distributed on an "AS IS" basis, WITHOUT WARRANTY OF ANY
+ * KIND, either express or implied.
+ *
+ ****************************************************************************/
+
+#include "codeclib.h"
+#include "libasf/asf.h"
+#include "libwmavoice/wmavoice.h"
+
+CODEC_HEADER
+
+static AVCodecContext avctx;
+static AVPacket avpkt;
+
+#define MAX_FRAMES           3   /*maximum number of frames per superframe*/
+#define MAX_FRAMESIZE        160 /* maximum number of samples per frame */
+#define BUFSIZE              MAX_FRAMES*MAX_FRAMESIZE
+static int32_t decoded[BUFSIZE] IBSS_ATTR;
+
+
+/* This function initialises AVCodecContext with the data needed for the
+ * wmavoice decoder to work. The required data is taken from
+ * asf_waveformatex_t because that's what the rockbox asf metadata parser
+ * fills/works with. In the future, when the codec is being optimised for
+ * on-target playback this function should not be needed.
+ *
+ * avctx  context to fill in; extradata, extradata_size, block_align,
+ *        sample_rate and channels are written.
+ * wfx    stream properties to copy from.
+ *
+ * The extradata is kept in static storage rather than on the heap: this
+ * function runs once per track start/restart, and a fresh malloc() each
+ * time was never freed (and never checked for NULL). */
+static void init_codec_ctx(AVCodecContext *avctx, asf_waveformatex_t *wfx)
+{
+    static uint8_t extradata[sizeof(wfx->data)];
+    size_t len = wfx->datalen;
+
+    /* datalen comes from the file; never read past the end of wfx->data */
+    if (len > sizeof(extradata))
+        len = sizeof(extradata);
+
+    /* Copy the extra-data */
+    memcpy(extradata, wfx->data, len);
+    avctx->extradata      = extradata;
+    avctx->extradata_size = (int)len;
+
+    avctx->block_align = wfx->blockalign;
+    avctx->sample_rate = wfx->rate;
+    avctx->channels    = wfx->channels;
+}
+
+/* This is the codec entry point.
+ *
+ * For each track: waits for the metadata, initialises the decoder from the
+ * ASF wave format stored in the id3 TOC field, then reads ASF packets one by
+ * one, decodes them and hands the PCM to the playback buffer, servicing seek
+ * requests between packets. When a track ends (or fails) the next track is
+ * requested and the whole sequence is repeated.
+ *
+ * Returns CODEC_ERROR when codec/decoder initialisation fails or the stream
+ * properties are unusable, CODEC_OK otherwise. Note that packet read and
+ * decode errors end the track but leave the return value at CODEC_OK.
+ *
+ * Resuming from a stored file offset is not implemented; playback always
+ * starts at the first frame. */
+enum codec_status codec_main(void)
+{
+    uint32_t elapsedtime;
+    int retval;
+    asf_waveformatex_t wfx;     /* Holds the stream properties */
+    int res;                    /* Return values from asf_read_packet() and decode_packet() */
+    uint8_t* audiobuf;          /* Pointer to the payload of one WMA Voice packet */
+    int audiobufsize;           /* Payload size */
+    int packetlength = 0;       /* Logical packet size (minus the header size) */
+    int outlen = 0;             /* Number of bytes written to the output buffer */
+    int pktcnt = 0;             /* Count of the packets played in this track */
+
+    /* Generic codec initialisation */
+    ci->configure(DSP_SET_SAMPLE_DEPTH, 31);
+
+next_track:
+
+    /* Wait for the metadata to be read */
+    while (!*ci->taginfo_ready && !ci->stop_codec)
+        ci->sleep(1);
+
+    retval = CODEC_OK;
+
+restart_track:
+    /* A new track and a restart both begin at the first packet again, so the
+       packet counter must not carry over from earlier playback; otherwise
+       the decoding loop below would stop early or never run. */
+    pktcnt = 0;
+
+    if (codec_init()) {
+        LOGF("(WMA Voice) Error: Error initialising codec\n");
+        retval = CODEC_ERROR;
+        goto done;
+    }
+
+    /* Copy the format metadata we've stored in the id3 TOC field.  This
+       saves us from parsing it again here. */
+    memcpy(&wfx, ci->id3->toc, sizeof(wfx));
+    memset(&avctx, 0, sizeof(AVCodecContext));
+    memset(&avpkt, 0, sizeof(AVPacket));
+
+    /* The elapsed-time update below divides by wfx.rate/100; reject sample
+       rates that would turn that divisor into zero. */
+    if (wfx.rate < 100) {
+        LOGF("(WMA Voice) Error: Invalid sample rate\n");
+        retval = CODEC_ERROR;
+        goto done;
+    }
+
+    ci->configure(DSP_SWITCH_FREQUENCY, wfx.rate);
+    ci->configure(DSP_SET_STEREO_MODE, wfx.channels == 1 ?
+                  STEREO_MONO : STEREO_INTERLEAVED);
+    codec_set_replaygain(ci->id3);
+
+    /* Initialise the AVCodecContext */
+    init_codec_ctx(&avctx, &wfx);
+
+    if (wmavoice_decode_init(&avctx) < 0) {
+        LOGF("(WMA Voice) Error: Unsupported or corrupt file\n");
+        retval = CODEC_ERROR;
+        goto done;
+    }
+
+    /* Now advance the file position to the first frame */
+    ci->seek_buffer(ci->id3->first_frame_offset);
+
+    elapsedtime = 0;
+
+    /* The main decoding loop */
+
+    while (pktcnt < wfx.numpackets)
+    {
+        ci->yield();
+        if (ci->stop_codec || ci->new_track) {
+            goto done;
+        }
+
+        /* Deal with any pending seek requests */
+        if (ci->seek_time){
+
+            /* A seek time of 1 is handled as "restart the track" */
+            if (ci->seek_time == 1) {
+                ci->seek_complete();
+                goto restart_track; /* Pretend you never saw this... */
+            }
+
+            elapsedtime = asf_seek(ci->seek_time, &wfx);
+            if (elapsedtime < 1){
+                ci->seek_complete();
+                goto next_track;
+            }
+
+            ci->set_elapsed(elapsedtime);
+            ci->seek_complete();
+        }
+
+new_packet:
+        res = asf_read_packet(&audiobuf, &audiobufsize, &packetlength, &wfx);
+
+        if (res < 0) {
+            LOGF("(WMA Voice) read_packet error %d\n",res);
+            goto done;
+        } else {
+            avpkt.data = audiobuf;
+            avpkt.size = audiobufsize;
+            pktcnt++;
+
+            /* Keep decoding until the whole payload has been consumed */
+            while(avpkt.size > 0)
+            {
+                /* wmavoice_decode_packet checks for the output buffer size to
+                   avoid overflows */
+                outlen = BUFSIZE*sizeof(int32_t);
+
+                res = wmavoice_decode_packet(&avctx, decoded, &outlen, &avpkt);
+                if(res < 0) {
+                    LOGF("(WMA Voice) Error: decode_packet returned %d", res);
+                    if(res == ERROR_WMAPRO_IN_WMAVOICE){
+                    /* Just skip this packet */
+                        ci->advance_buffer(packetlength);
+                        goto new_packet;
+                    }
+                    else
+                        goto done;
+                }
+                /* res is the number of input bytes the decoder consumed */
+                avpkt.data += res;
+                avpkt.size -= res;
+                if(outlen) {
+                    ci->yield ();
+                    /* Convert the byte count into a sample count */
+                    outlen /= sizeof(int32_t);
+                    ci->pcmbuf_insert(decoded, NULL, outlen);
+                    /* samples -> milliseconds */
+                    elapsedtime += outlen*10/(wfx.rate/100);
+                    ci->set_elapsed(elapsedtime);
+                    ci->yield ();
+                }
+            }
+
+        }
+
+        /* Advance to the next logical packet */
+        ci->advance_buffer(packetlength);
+    }
+    retval = CODEC_OK;
+
+done:
+    if (ci->request_next_track())
+        goto next_track;
+
+    return retval;
+}
+
--- a/apps/metadata.c
+++ b/apps/metadata.c
@ -182,6 +182,9 @@ const struct afmt_entry audio_formats[AFMT_NUM_CODECS] =
    /* True Audio */
    [AFMT_TTA] =
        AFMT_ENTRY("TTA",  "tta",   NULL,          "tta\0"      ),
+    /* WMA Voice in ASF */
+    [AFMT_WMAVOICE] =
+        AFMT_ENTRY("WMAVoice",  "wmavoice",     NULL,    "wma\0wmv\0asf\0"   ),
 #endif
 };

@ -297,7 +300,7 @@ bool get_metadata(struct mp3entry* id3, int fd, const char* trackname)
        }

        break;
-
+    
    case AFMT_WMA:
        if (!get_asf_metadata(fd, id3))
        {
--- a/apps/metadata.h
+++ b/apps/metadata.h
@ -84,6 +84,7 @@ enum
    AFMT_VOX,          /* VOX */
    AFMT_WAVE64,       /* Wave64 */
    AFMT_TTA,          /* True Audio */
+    AFMT_WMAVOICE,     /* WMA Voice in ASF */
 #endif

    /* add new formats at any index above this line to have a sensible order -
--- a/apps/metadata/asf.c
+++ b/apps/metadata/asf.c
@ -357,6 +357,11 @@ static int asf_parse_header(int fd, struct mp3entry* id3,
                            wfx->audiostream = flags&0x7f;
                            /* Correct codectype to redirect playback to the proper .codec */
                            id3->codectype = AFMT_WMAPRO;
+                        } else if (wfx->codec_id == ASF_CODEC_ID_WMAVOICE) {
+                            read(fd, wfx->data, wfx->datalen);
+                            lseek(fd,current.size - 24 - 72 - wfx->datalen,SEEK_CUR);
+                            wfx->audiostream = flags&0x7f;
+                            id3->codectype = AFMT_WMAVOICE;
                        } else {
                            DEBUGF("Unsupported WMA codec (Lossless, Voice, etc)\n");
                            lseek(fd,current.size - 24 - 72,SEEK_CUR);