1657 lines
50 KiB
C
1657 lines
50 KiB
C
|
/* Copyright (C) 2002-2006 Jean-Marc Valin
|
||
|
File: sb_celp.c
|
||
|
|
||
|
Redistribution and use in source and binary forms, with or without
|
||
|
modification, are permitted provided that the following conditions
|
||
|
are met:
|
||
|
|
||
|
- Redistributions of source code must retain the above copyright
|
||
|
notice, this list of conditions and the following disclaimer.
|
||
|
|
||
|
- Redistributions in binary form must reproduce the above copyright
|
||
|
notice, this list of conditions and the following disclaimer in the
|
||
|
documentation and/or other materials provided with the distribution.
|
||
|
|
||
|
- Neither the name of the Xiph.org Foundation nor the names of its
|
||
|
contributors may be used to endorse or promote products derived from
|
||
|
this software without specific prior written permission.
|
||
|
|
||
|
THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
|
||
|
``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
|
||
|
LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
|
||
|
A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE FOUNDATION OR
|
||
|
CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
|
||
|
EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
|
||
|
PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
|
||
|
PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
|
||
|
LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
|
||
|
NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
|
||
|
SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
|
||
|
*/
|
||
|
|
||
|
#ifdef HAVE_CONFIG_H
|
||
|
#include "config.h"
|
||
|
#endif
|
||
|
|
||
|
#include <math_approx.h>
|
||
|
#include "sb_celp.h"
|
||
|
#include "stdlib.h"
|
||
|
#include "filters.h"
|
||
|
#include "lpc.h"
|
||
|
#include "lsp.h"
|
||
|
#include "stack_alloc.h"
|
||
|
#include "cb_search.h"
|
||
|
#include "quant_lsp.h"
|
||
|
#include "vq.h"
|
||
|
#include "ltp.h"
|
||
|
#include "misc.h"
|
||
|
|
||
|
/* Default size for the encoder and decoder stack (can be changed at compile time).
|
||
|
This does not apply when using variable-size arrays or alloca. */
|
||
|
#ifndef SB_ENC_STACK
|
||
|
#define SB_ENC_STACK (10000*sizeof(spx_sig_t))
|
||
|
#endif
|
||
|
|
||
|
#ifndef SB_DEC_STACK
|
||
|
#define SB_DEC_STACK (6000*sizeof(spx_sig_t))
|
||
|
#endif
|
||
|
|
||
|
|
||
|
#ifdef DISABLE_WIDEBAND
|
||
|
void *sb_encoder_init(const SpeexMode *m)
|
||
|
{
|
||
|
speex_error("Wideband and Ultra-wideband are disabled");
|
||
|
return NULL;
|
||
|
}
|
||
|
void sb_encoder_destroy(void *state)
|
||
|
{
|
||
|
speex_error("Wideband and Ultra-wideband are disabled");
|
||
|
}
|
||
|
int sb_encode(void *state, void *vin, SpeexBits *bits)
|
||
|
{
|
||
|
speex_error("Wideband and Ultra-wideband are disabled");
|
||
|
return -2;
|
||
|
}
|
||
|
void *sb_decoder_init(const SpeexMode *m)
|
||
|
{
|
||
|
speex_error("Wideband and Ultra-wideband are disabled");
|
||
|
return NULL;
|
||
|
}
|
||
|
void sb_decoder_destroy(void *state)
|
||
|
{
|
||
|
speex_error("Wideband and Ultra-wideband are disabled");
|
||
|
}
|
||
|
int sb_decode(void *state, SpeexBits *bits, void *vout)
|
||
|
{
|
||
|
speex_error("Wideband and Ultra-wideband are disabled");
|
||
|
return -2;
|
||
|
}
|
||
|
int sb_encoder_ctl(void *state, int request, void *ptr)
|
||
|
{
|
||
|
speex_error("Wideband and Ultra-wideband are disabled");
|
||
|
return -2;
|
||
|
}
|
||
|
int sb_decoder_ctl(void *state, int request, void *ptr)
|
||
|
{
|
||
|
speex_error("Wideband and Ultra-wideband are disabled");
|
||
|
return -2;
|
||
|
}
|
||
|
#else
|
||
|
|
||
|
|
||
|
#ifndef M_PI
|
||
|
#define M_PI 3.14159265358979323846 /* pi */
|
||
|
#endif
|
||
|
|
||
|
#define sqr(x) ((x)*(x))
|
||
|
|
||
|
#define SUBMODE(x) st->submodes[st->submodeID]->x
|
||
|
|
||
|
#ifdef FIXED_POINT
|
||
|
static const spx_word16_t gc_quant_bound[16] = {125, 164, 215, 282, 370, 484, 635, 832, 1090, 1428, 1871, 2452, 3213, 4210, 5516, 7228};
|
||
|
#define LSP_MARGIN 410
|
||
|
#define LSP_DELTA1 6553
|
||
|
#define LSP_DELTA2 1638
|
||
|
|
||
|
#else
|
||
|
|
||
|
#define LSP_MARGIN .05
|
||
|
#define LSP_DELTA1 .2
|
||
|
#define LSP_DELTA2 .05
|
||
|
|
||
|
#endif
|
||
|
|
||
|
#define QMF_ORDER 64
|
||
|
|
||
|
#ifdef FIXED_POINT
|
||
|
static const spx_word16_t h0[64] = {2, -7, -7, 18, 15, -39, -25, 75, 35, -130, -41, 212, 38, -327, -17, 483, -32, -689, 124, 956, -283, -1307, 543, 1780, -973, -2467, 1733, 3633, -3339, -6409, 9059, 30153, 30153, 9059, -6409, -3339, 3633, 1733, -2467, -973, 1780, 543, -1307, -283, 956, 124, -689, -32, 483, -17, -327, 38, 212, -41, -130, 35, 75, -25, -39, 15, 18, -7, -7, 2};
|
||
|
|
||
|
static const spx_word16_t h1[64] = {2, 7, -7, -18, 15, 39, -25, -75, 35, 130, -41, -212, 38, 327, -17, -483, -32, 689, 124, -956, -283, 1307, 543, -1780, -973, 2467, 1733, -3633, -3339, 6409, 9059, -30153, 30153, -9059, -6409, 3339, 3633, -1733, -2467, 973, 1780, -543, -1307, 283, 956, -124, -689, 32, 483, 17, -327, -38, 212, 41, -130, -35, 75, 25, -39, -15, 18, 7, -7, -2};
|
||
|
|
||
|
/*To generate (ruby code): (0...33).each { |idx| puts Math.exp((idx-10) / 8.0).to_s + "," } */
|
||
|
static const float spx_exp_lookup_int[33]={0.28650479686019,0.32465246735835,0.367879441171442,0.416862019678508,0.472366552741015,0.53526142851899,0.606530659712633,0.687289278790972,0.778800783071405,0.882496902584595,1.0,1.13314845306683,1.28402541668774,1.4549914146182,1.64872127070013,1.86824595743222,2.11700001661267,2.3988752939671,2.71828182845905,3.08021684891803,3.49034295746184,3.95507672292058,4.48168907033806,5.07841903718008,5.75460267600573,6.52081912033011,7.38905609893065,8.37289748812726,9.48773583635853,10.7510131860764,12.1824939607035,13.8045741860671,15.6426318841882};
|
||
|
|
||
|
|
||
|
#else
|
||
|
static const float h0[64] = {
|
||
|
3.596189e-05f, -0.0001123515f,
|
||
|
-0.0001104587f, 0.0002790277f,
|
||
|
0.0002298438f, -0.0005953563f,
|
||
|
-0.0003823631f, 0.00113826f,
|
||
|
0.0005308539f, -0.001986177f,
|
||
|
-0.0006243724f, 0.003235877f,
|
||
|
0.0005743159f, -0.004989147f,
|
||
|
-0.0002584767f, 0.007367171f,
|
||
|
-0.0004857935f, -0.01050689f,
|
||
|
0.001894714f, 0.01459396f,
|
||
|
-0.004313674f, -0.01994365f,
|
||
|
0.00828756f, 0.02716055f,
|
||
|
-0.01485397f, -0.03764973f,
|
||
|
0.026447f, 0.05543245f,
|
||
|
-0.05095487f, -0.09779096f,
|
||
|
0.1382363f, 0.4600981f,
|
||
|
0.4600981f, 0.1382363f,
|
||
|
-0.09779096f, -0.05095487f,
|
||
|
0.05543245f, 0.026447f,
|
||
|
-0.03764973f, -0.01485397f,
|
||
|
0.02716055f, 0.00828756f,
|
||
|
-0.01994365f, -0.004313674f,
|
||
|
0.01459396f, 0.001894714f,
|
||
|
-0.01050689f, -0.0004857935f,
|
||
|
0.007367171f, -0.0002584767f,
|
||
|
-0.004989147f, 0.0005743159f,
|
||
|
0.003235877f, -0.0006243724f,
|
||
|
-0.001986177f, 0.0005308539f,
|
||
|
0.00113826f, -0.0003823631f,
|
||
|
-0.0005953563f, 0.0002298438f,
|
||
|
0.0002790277f, -0.0001104587f,
|
||
|
-0.0001123515f, 3.596189e-05f
|
||
|
};
|
||
|
|
||
|
static const float h1[64] = {
|
||
|
3.596189e-05f, 0.0001123515f,
|
||
|
-0.0001104587f, -0.0002790277f,
|
||
|
0.0002298438f, 0.0005953563f,
|
||
|
-0.0003823631f, -0.00113826f,
|
||
|
0.0005308539f, 0.001986177f,
|
||
|
-0.0006243724f, -0.003235877f,
|
||
|
0.0005743159f, 0.004989147f,
|
||
|
-0.0002584767f, -0.007367171f,
|
||
|
-0.0004857935f, 0.01050689f,
|
||
|
0.001894714f, -0.01459396f,
|
||
|
-0.004313674f, 0.01994365f,
|
||
|
0.00828756f, -0.02716055f,
|
||
|
-0.01485397f, 0.03764973f,
|
||
|
0.026447f, -0.05543245f,
|
||
|
-0.05095487f, 0.09779096f,
|
||
|
0.1382363f, -0.4600981f,
|
||
|
0.4600981f, -0.1382363f,
|
||
|
-0.09779096f, 0.05095487f,
|
||
|
0.05543245f, -0.026447f,
|
||
|
-0.03764973f, 0.01485397f,
|
||
|
0.02716055f, -0.00828756f,
|
||
|
-0.01994365f, 0.004313674f,
|
||
|
0.01459396f, -0.001894714f,
|
||
|
-0.01050689f, 0.0004857935f,
|
||
|
0.007367171f, 0.0002584767f,
|
||
|
-0.004989147f, -0.0005743159f,
|
||
|
0.003235877f, 0.0006243724f,
|
||
|
-0.001986177f, -0.0005308539f,
|
||
|
0.00113826f, 0.0003823631f,
|
||
|
-0.0005953563f, -0.0002298438f,
|
||
|
0.0002790277f, 0.0001104587f,
|
||
|
-0.0001123515f, -3.596189e-05f
|
||
|
};
|
||
|
#endif
|
||
|
|
||
|
extern const spx_word16_t lpc_window[];
|
||
|
|
||
|
static void mix_and_saturate(spx_word32_t *x0, spx_word32_t *x1, spx_word16_t *out, int len)
|
||
|
{
|
||
|
int i;
|
||
|
for (i=0;i<len;i++)
|
||
|
{
|
||
|
spx_word32_t tmp;
|
||
|
#ifdef FIXED_POINT
|
||
|
tmp=PSHR(x0[i]-x1[i],SIG_SHIFT-1);
|
||
|
#else
|
||
|
tmp=2*(x0[i]-x1[i]);
|
||
|
#endif
|
||
|
if (tmp>32767)
|
||
|
out[i] = 32767;
|
||
|
else if (tmp<-32767)
|
||
|
out[i] = -32767;
|
||
|
else
|
||
|
out[i] = tmp;
|
||
|
}
|
||
|
}
|
||
|
|
||
|
void *sb_encoder_init(const SpeexMode *m)
|
||
|
{
|
||
|
int i;
|
||
|
SBEncState *st;
|
||
|
const SpeexSBMode *mode;
|
||
|
|
||
|
st = (SBEncState*)speex_alloc(sizeof(SBEncState));
|
||
|
if (!st)
|
||
|
return NULL;
|
||
|
#if defined(VAR_ARRAYS) || defined (USE_ALLOCA)
|
||
|
st->stack = NULL;
|
||
|
#else
|
||
|
st->stack = (char*)speex_alloc_scratch(SB_ENC_STACK);
|
||
|
#endif
|
||
|
st->mode = m;
|
||
|
mode = (const SpeexSBMode*)m->mode;
|
||
|
|
||
|
|
||
|
st->st_low = speex_encoder_init(mode->nb_mode);
|
||
|
st->full_frame_size = 2*mode->frameSize;
|
||
|
st->frame_size = mode->frameSize;
|
||
|
st->subframeSize = mode->subframeSize;
|
||
|
st->nbSubframes = mode->frameSize/mode->subframeSize;
|
||
|
st->windowSize = st->frame_size+st->subframeSize;
|
||
|
st->lpcSize=mode->lpcSize;
|
||
|
st->bufSize=mode->bufSize;
|
||
|
|
||
|
st->encode_submode = 1;
|
||
|
st->submodes=mode->submodes;
|
||
|
st->submodeSelect = st->submodeID=mode->defaultSubmode;
|
||
|
|
||
|
i=9;
|
||
|
speex_encoder_ctl(st->st_low, SPEEX_SET_QUALITY, &i);
|
||
|
i=1;
|
||
|
speex_encoder_ctl(st->st_low, SPEEX_SET_WIDEBAND, &i);
|
||
|
|
||
|
st->lag_factor = mode->lag_factor;
|
||
|
st->lpc_floor = mode->lpc_floor;
|
||
|
st->gamma1=mode->gamma1;
|
||
|
st->gamma2=mode->gamma2;
|
||
|
st->first=1;
|
||
|
|
||
|
st->x0d=(spx_sig_t*)speex_alloc((st->frame_size)*sizeof(spx_sig_t));
|
||
|
st->x1d=(spx_sig_t*)speex_alloc((st->frame_size)*sizeof(spx_sig_t));
|
||
|
st->high=(spx_sig_t*)speex_alloc((st->full_frame_size)*sizeof(spx_sig_t));
|
||
|
st->y0=(spx_sig_t*)speex_alloc((st->full_frame_size)*sizeof(spx_sig_t));
|
||
|
st->y1=(spx_sig_t*)speex_alloc((st->full_frame_size)*sizeof(spx_sig_t));
|
||
|
|
||
|
st->h0_mem=(spx_word16_t*)speex_alloc((QMF_ORDER)*sizeof(spx_word16_t));
|
||
|
st->h1_mem=(spx_word16_t*)speex_alloc((QMF_ORDER)*sizeof(spx_word16_t));
|
||
|
st->g0_mem=(spx_word32_t*)speex_alloc((QMF_ORDER)*sizeof(spx_word32_t));
|
||
|
st->g1_mem=(spx_word32_t*)speex_alloc((QMF_ORDER)*sizeof(spx_word32_t));
|
||
|
|
||
|
st->excBuf=(spx_sig_t*)speex_alloc((st->bufSize)*sizeof(spx_sig_t));
|
||
|
st->exc = st->excBuf + st->bufSize - st->windowSize;
|
||
|
|
||
|
st->res=(spx_sig_t*)speex_alloc((st->frame_size)*sizeof(spx_sig_t));
|
||
|
st->sw=(spx_sig_t*)speex_alloc((st->frame_size)*sizeof(spx_sig_t));
|
||
|
st->window= lpc_window;
|
||
|
|
||
|
st->lagWindow = (spx_word16_t*)speex_alloc((st->lpcSize+1)*sizeof(spx_word16_t));
|
||
|
for (i=0;i<st->lpcSize+1;i++)
|
||
|
st->lagWindow[i]=16384*exp(-.5*sqr(2*M_PI*st->lag_factor*i));
|
||
|
|
||
|
st->autocorr = (spx_word16_t*)speex_alloc((st->lpcSize+1)*sizeof(spx_word16_t));
|
||
|
st->lpc = (spx_coef_t*)speex_alloc(st->lpcSize*sizeof(spx_coef_t));
|
||
|
st->bw_lpc1 = (spx_coef_t*)speex_alloc(st->lpcSize*sizeof(spx_coef_t));
|
||
|
st->bw_lpc2 = (spx_coef_t*)speex_alloc(st->lpcSize*sizeof(spx_coef_t));
|
||
|
st->lsp = (spx_lsp_t*)speex_alloc(st->lpcSize*sizeof(spx_lsp_t));
|
||
|
st->qlsp = (spx_lsp_t*)speex_alloc(st->lpcSize*sizeof(spx_lsp_t));
|
||
|
st->old_lsp = (spx_lsp_t*)speex_alloc(st->lpcSize*sizeof(spx_lsp_t));
|
||
|
st->old_qlsp = (spx_lsp_t*)speex_alloc(st->lpcSize*sizeof(spx_lsp_t));
|
||
|
st->interp_lsp = (spx_lsp_t*)speex_alloc(st->lpcSize*sizeof(spx_lsp_t));
|
||
|
st->interp_qlsp = (spx_lsp_t*)speex_alloc(st->lpcSize*sizeof(spx_lsp_t));
|
||
|
st->interp_lpc = (spx_coef_t*)speex_alloc(st->lpcSize*sizeof(spx_coef_t));
|
||
|
st->interp_qlpc = (spx_coef_t*)speex_alloc(st->lpcSize*sizeof(spx_coef_t));
|
||
|
st->pi_gain = (spx_word32_t*)speex_alloc((st->nbSubframes)*sizeof(spx_word32_t));
|
||
|
st->low_innov = (spx_word32_t*)speex_alloc((st->frame_size)*sizeof(spx_word32_t));
|
||
|
speex_encoder_ctl(st->st_low, SPEEX_SET_INNOVATION_SAVE, st->low_innov);
|
||
|
st->innov_save = NULL;
|
||
|
|
||
|
st->mem_sp = (spx_mem_t*)speex_alloc((st->lpcSize)*sizeof(spx_mem_t));
|
||
|
st->mem_sp2 = (spx_mem_t*)speex_alloc((st->lpcSize)*sizeof(spx_mem_t));
|
||
|
st->mem_sw = (spx_mem_t*)speex_alloc((st->lpcSize)*sizeof(spx_mem_t));
|
||
|
|
||
|
st->vbr_quality = 8;
|
||
|
st->vbr_enabled = 0;
|
||
|
st->vbr_max = 0;
|
||
|
st->vbr_max_high = 20000; /* We just need a big value here */
|
||
|
st->vad_enabled = 0;
|
||
|
st->abr_enabled = 0;
|
||
|
st->relative_quality=0;
|
||
|
|
||
|
st->complexity=2;
|
||
|
speex_encoder_ctl(st->st_low, SPEEX_GET_SAMPLING_RATE, &st->sampling_rate);
|
||
|
st->sampling_rate*=2;
|
||
|
#ifdef ENABLE_VALGRIND
|
||
|
VALGRIND_MAKE_READABLE(st, (st->stack-(char*)st));
|
||
|
#endif
|
||
|
return st;
|
||
|
}
|
||
|
|
||
|
void sb_encoder_destroy(void *state)
|
||
|
{
|
||
|
SBEncState *st=(SBEncState*)state;
|
||
|
|
||
|
speex_encoder_destroy(st->st_low);
|
||
|
#if !(defined(VAR_ARRAYS) || defined (USE_ALLOCA))
|
||
|
speex_free_scratch(st->stack);
|
||
|
#endif
|
||
|
|
||
|
speex_free(st->x0d);
|
||
|
speex_free(st->x1d);
|
||
|
speex_free(st->high);
|
||
|
speex_free(st->y0);
|
||
|
speex_free(st->y1);
|
||
|
|
||
|
speex_free(st->h0_mem);
|
||
|
speex_free(st->h1_mem);
|
||
|
speex_free(st->g0_mem);
|
||
|
speex_free(st->g1_mem);
|
||
|
|
||
|
speex_free(st->excBuf);
|
||
|
speex_free(st->res);
|
||
|
speex_free(st->sw);
|
||
|
speex_free(st->lagWindow);
|
||
|
|
||
|
speex_free(st->autocorr);
|
||
|
speex_free(st->lpc);
|
||
|
speex_free(st->bw_lpc1);
|
||
|
speex_free(st->bw_lpc2);
|
||
|
speex_free(st->lsp);
|
||
|
speex_free(st->qlsp);
|
||
|
speex_free(st->old_lsp);
|
||
|
speex_free(st->old_qlsp);
|
||
|
speex_free(st->interp_lsp);
|
||
|
speex_free(st->interp_qlsp);
|
||
|
speex_free(st->interp_lpc);
|
||
|
speex_free(st->interp_qlpc);
|
||
|
speex_free(st->pi_gain);
|
||
|
speex_free(st->low_innov);
|
||
|
|
||
|
speex_free(st->mem_sp);
|
||
|
speex_free(st->mem_sp2);
|
||
|
speex_free(st->mem_sw);
|
||
|
|
||
|
|
||
|
speex_free(st);
|
||
|
}
|
||
|
|
||
|
|
||
|
int sb_encode(void *state, void *vin, SpeexBits *bits)
|
||
|
{
|
||
|
SBEncState *st;
|
||
|
int i, roots, sub;
|
||
|
char *stack;
|
||
|
VARDECL(spx_mem_t *mem);
|
||
|
VARDECL(spx_sig_t *innov);
|
||
|
VARDECL(spx_word16_t *target);
|
||
|
VARDECL(spx_word16_t *syn_resp);
|
||
|
VARDECL(spx_word32_t *low_pi_gain);
|
||
|
VARDECL(spx_word16_t *low_exc);
|
||
|
const SpeexSBMode *mode;
|
||
|
int dtx;
|
||
|
spx_word16_t *in = (spx_word16_t*)vin;
|
||
|
|
||
|
st = (SBEncState*)state;
|
||
|
stack=st->stack;
|
||
|
mode = (const SpeexSBMode*)(st->mode->mode);
|
||
|
|
||
|
{
|
||
|
VARDECL(spx_word16_t *low);
|
||
|
ALLOC(low, st->frame_size, spx_word16_t);
|
||
|
|
||
|
/* Compute the two sub-bands by filtering with h0 and h1*/
|
||
|
qmf_decomp(in, h0, st->x0d, st->x1d, st->full_frame_size, QMF_ORDER, st->h0_mem, stack);
|
||
|
|
||
|
for (i=0;i<st->frame_size;i++)
|
||
|
low[i] = SATURATE(PSHR(st->x0d[i],SIG_SHIFT),32767);
|
||
|
|
||
|
/* Encode the narrowband part*/
|
||
|
speex_encode_native(st->st_low, low, bits);
|
||
|
|
||
|
for (i=0;i<st->frame_size;i++)
|
||
|
st->x0d[i] = SHL(low[i],SIG_SHIFT);
|
||
|
}
|
||
|
/* High-band buffering / sync with low band */
|
||
|
for (i=0;i<st->windowSize-st->frame_size;i++)
|
||
|
st->high[i] = st->high[st->frame_size+i];
|
||
|
for (i=0;i<st->frame_size;i++)
|
||
|
st->high[st->windowSize-st->frame_size+i]=SATURATE(st->x1d[i],536854528);
|
||
|
|
||
|
speex_move(st->excBuf, st->excBuf+st->frame_size, (st->bufSize-st->frame_size)*sizeof(spx_sig_t));
|
||
|
|
||
|
|
||
|
ALLOC(low_pi_gain, st->nbSubframes, spx_word32_t);
|
||
|
ALLOC(low_exc, st->frame_size, spx_word16_t);
|
||
|
speex_encoder_ctl(st->st_low, SPEEX_GET_PI_GAIN, low_pi_gain);
|
||
|
speex_encoder_ctl(st->st_low, SPEEX_GET_EXC, low_exc);
|
||
|
|
||
|
speex_encoder_ctl(st->st_low, SPEEX_GET_LOW_MODE, &dtx);
|
||
|
|
||
|
if (dtx==0)
|
||
|
dtx=1;
|
||
|
else
|
||
|
dtx=0;
|
||
|
|
||
|
{
|
||
|
VARDECL(spx_word16_t *w_sig);
|
||
|
ALLOC(w_sig, st->windowSize, spx_word16_t);
|
||
|
/* Window for analysis */
|
||
|
for (i=0;i<st->windowSize;i++)
|
||
|
w_sig[i] = SHR(MULT16_16(SHR((spx_word32_t)(st->high[i]),SIG_SHIFT),st->window[i]),SIG_SHIFT);
|
||
|
|
||
|
/* Compute auto-correlation */
|
||
|
_spx_autocorr(w_sig, st->autocorr, st->lpcSize+1, st->windowSize);
|
||
|
}
|
||
|
st->autocorr[0] = ADD16(st->autocorr[0],MULT16_16_Q15(st->autocorr[0],st->lpc_floor)); /* Noise floor in auto-correlation domain */
|
||
|
|
||
|
/* Lag windowing: equivalent to filtering in the power-spectrum domain */
|
||
|
for (i=0;i<st->lpcSize+1;i++)
|
||
|
st->autocorr[i] = MULT16_16_Q14(st->autocorr[i],st->lagWindow[i]);
|
||
|
|
||
|
/* Levinson-Durbin */
|
||
|
_spx_lpc(st->lpc, st->autocorr, st->lpcSize);
|
||
|
|
||
|
/* LPC to LSPs (x-domain) transform */
|
||
|
roots=lpc_to_lsp (st->lpc, st->lpcSize, st->lsp, 10, LSP_DELTA1, stack);
|
||
|
if (roots!=st->lpcSize)
|
||
|
{
|
||
|
roots = lpc_to_lsp (st->lpc, st->lpcSize, st->lsp, 10, LSP_DELTA2, stack);
|
||
|
if (roots!=st->lpcSize) {
|
||
|
/*If we can't find all LSP's, do some damage control and use a flat filter*/
|
||
|
for (i=0;i<st->lpcSize;i++)
|
||
|
{
|
||
|
st->lsp[i]=LSP_SCALING*M_PI*((float)(i+1))/(st->lpcSize+1);
|
||
|
}
|
||
|
}
|
||
|
}
|
||
|
|
||
|
/* VBR code */
|
||
|
if ((st->vbr_enabled || st->vad_enabled) && !dtx)
|
||
|
{
|
||
|
float e_low=0, e_high=0;
|
||
|
float ratio;
|
||
|
if (st->abr_enabled)
|
||
|
{
|
||
|
float qual_change=0;
|
||
|
if (st->abr_drift2 * st->abr_drift > 0)
|
||
|
{
|
||
|
/* Only adapt if long-term and short-term drift are the same sign */
|
||
|
qual_change = -.00001*st->abr_drift/(1+st->abr_count);
|
||
|
if (qual_change>.1)
|
||
|
qual_change=.1;
|
||
|
if (qual_change<-.1)
|
||
|
qual_change=-.1;
|
||
|
}
|
||
|
st->vbr_quality += qual_change;
|
||
|
if (st->vbr_quality>10)
|
||
|
st->vbr_quality=10;
|
||
|
if (st->vbr_quality<0)
|
||
|
st->vbr_quality=0;
|
||
|
}
|
||
|
|
||
|
|
||
|
/*FIXME: Are the two signals (low, high) in sync? */
|
||
|
e_low = compute_rms(st->x0d, st->frame_size);
|
||
|
e_high = compute_rms(st->high, st->frame_size);
|
||
|
ratio = 2*log((1+e_high)/(1+e_low));
|
||
|
|
||
|
speex_encoder_ctl(st->st_low, SPEEX_GET_RELATIVE_QUALITY, &st->relative_quality);
|
||
|
if (ratio<-4)
|
||
|
ratio=-4;
|
||
|
if (ratio>2)
|
||
|
ratio=2;
|
||
|
/*if (ratio>-2)*/
|
||
|
if (st->vbr_enabled)
|
||
|
{
|
||
|
int modeid;
|
||
|
modeid = mode->nb_modes-1;
|
||
|
st->relative_quality+=1.0*(ratio+2);
|
||
|
if (st->relative_quality<-1)
|
||
|
st->relative_quality=-1;
|
||
|
while (modeid)
|
||
|
{
|
||
|
int v1;
|
||
|
float thresh;
|
||
|
v1=(int)floor(st->vbr_quality);
|
||
|
if (v1==10)
|
||
|
thresh = mode->vbr_thresh[modeid][v1];
|
||
|
else
|
||
|
thresh = (st->vbr_quality-v1) * mode->vbr_thresh[modeid][v1+1] +
|
||
|
(1+v1-st->vbr_quality) * mode->vbr_thresh[modeid][v1];
|
||
|
if (st->relative_quality >= thresh && st->sampling_rate*st->submodes[modeid]->bits_per_frame/st->full_frame_size <= st->vbr_max_high)
|
||
|
break;
|
||
|
modeid--;
|
||
|
}
|
||
|
speex_encoder_ctl(state, SPEEX_SET_HIGH_MODE, &modeid);
|
||
|
if (st->abr_enabled)
|
||
|
{
|
||
|
int bitrate;
|
||
|
speex_encoder_ctl(state, SPEEX_GET_BITRATE, &bitrate);
|
||
|
st->abr_drift+=(bitrate-st->abr_enabled);
|
||
|
st->abr_drift2 = .95*st->abr_drift2 + .05*(bitrate-st->abr_enabled);
|
||
|
st->abr_count += 1.0;
|
||
|
}
|
||
|
|
||
|
} else {
|
||
|
/* VAD only */
|
||
|
int modeid;
|
||
|
if (st->relative_quality<2.0)
|
||
|
modeid=1;
|
||
|
else
|
||
|
modeid=st->submodeSelect;
|
||
|
/*speex_encoder_ctl(state, SPEEX_SET_MODE, &mode);*/
|
||
|
st->submodeID=modeid;
|
||
|
|
||
|
}
|
||
|
/*fprintf (stderr, "%f %f\n", ratio, low_qual);*/
|
||
|
}
|
||
|
|
||
|
if (st->encode_submode)
|
||
|
{
|
||
|
speex_bits_pack(bits, 1, 1);
|
||
|
if (dtx)
|
||
|
speex_bits_pack(bits, 0, SB_SUBMODE_BITS);
|
||
|
else
|
||
|
speex_bits_pack(bits, st->submodeID, SB_SUBMODE_BITS);
|
||
|
}
|
||
|
|
||
|
/* If null mode (no transmission), just set a couple things to zero*/
|
||
|
if (dtx || st->submodes[st->submodeID] == NULL)
|
||
|
{
|
||
|
for (i=0;i<st->frame_size;i++)
|
||
|
st->exc[i]=st->sw[i]=VERY_SMALL;
|
||
|
|
||
|
for (i=0;i<st->lpcSize;i++)
|
||
|
st->mem_sw[i]=0;
|
||
|
st->first=1;
|
||
|
|
||
|
/* Final signal synthesis from excitation */
|
||
|
iir_mem2(st->exc, st->interp_qlpc, st->high, st->frame_size, st->lpcSize, st->mem_sp);
|
||
|
|
||
|
#ifdef RESYNTH
|
||
|
/* Reconstruct the original */
|
||
|
fir_mem_up(st->x0d, h0, st->y0, st->full_frame_size, QMF_ORDER, st->g0_mem, stack);
|
||
|
fir_mem_up(st->high, h1, st->y1, st->full_frame_size, QMF_ORDER, st->g1_mem, stack);
|
||
|
|
||
|
for (i=0;i<st->full_frame_size;i++)
|
||
|
in[i]=SHR(st->y0[i]-st->y1[i], SIG_SHIFT-1);
|
||
|
#endif
|
||
|
|
||
|
if (dtx)
|
||
|
return 0;
|
||
|
else
|
||
|
return 1;
|
||
|
}
|
||
|
|
||
|
|
||
|
/* LSP quantization */
|
||
|
SUBMODE(lsp_quant)(st->lsp, st->qlsp, st->lpcSize, bits);
|
||
|
|
||
|
if (st->first)
|
||
|
{
|
||
|
for (i=0;i<st->lpcSize;i++)
|
||
|
st->old_lsp[i] = st->lsp[i];
|
||
|
for (i=0;i<st->lpcSize;i++)
|
||
|
st->old_qlsp[i] = st->qlsp[i];
|
||
|
}
|
||
|
|
||
|
ALLOC(mem, st->lpcSize, spx_mem_t);
|
||
|
ALLOC(syn_resp, st->subframeSize, spx_word16_t);
|
||
|
ALLOC(innov, st->subframeSize, spx_sig_t);
|
||
|
ALLOC(target, st->subframeSize, spx_word16_t);
|
||
|
|
||
|
for (sub=0;sub<st->nbSubframes;sub++)
|
||
|
{
|
||
|
spx_sig_t *exc, *sp, *res, *sw, *innov_save=NULL;
|
||
|
spx_word16_t filter_ratio;
|
||
|
int offset;
|
||
|
spx_word32_t rl, rh;
|
||
|
spx_word16_t eh=0;
|
||
|
|
||
|
offset = st->subframeSize*sub;
|
||
|
sp=st->high+offset;
|
||
|
exc=st->exc+offset;
|
||
|
res=st->res+offset;
|
||
|
sw=st->sw+offset;
|
||
|
/* Pointer for saving innovation */
|
||
|
if (st->innov_save)
|
||
|
{
|
||
|
innov_save = st->innov_save+2*offset;
|
||
|
for (i=0;i<2*st->subframeSize;i++)
|
||
|
innov_save[i]=0;
|
||
|
}
|
||
|
|
||
|
/* LSP interpolation (quantized and unquantized) */
|
||
|
lsp_interpolate(st->old_lsp, st->lsp, st->interp_lsp, st->lpcSize, sub, st->nbSubframes);
|
||
|
lsp_interpolate(st->old_qlsp, st->qlsp, st->interp_qlsp, st->lpcSize, sub, st->nbSubframes);
|
||
|
|
||
|
lsp_enforce_margin(st->interp_lsp, st->lpcSize, LSP_MARGIN);
|
||
|
lsp_enforce_margin(st->interp_qlsp, st->lpcSize, LSP_MARGIN);
|
||
|
|
||
|
lsp_to_lpc(st->interp_lsp, st->interp_lpc, st->lpcSize,stack);
|
||
|
lsp_to_lpc(st->interp_qlsp, st->interp_qlpc, st->lpcSize, stack);
|
||
|
|
||
|
bw_lpc(st->gamma1, st->interp_lpc, st->bw_lpc1, st->lpcSize);
|
||
|
bw_lpc(st->gamma2, st->interp_lpc, st->bw_lpc2, st->lpcSize);
|
||
|
|
||
|
/* Compute mid-band (4000 Hz for wideband) response of low-band and high-band
|
||
|
filters */
|
||
|
st->pi_gain[sub]=LPC_SCALING;
|
||
|
rh = LPC_SCALING;
|
||
|
for (i=0;i<st->lpcSize;i+=2)
|
||
|
{
|
||
|
rh += st->interp_qlpc[i+1] - st->interp_qlpc[i];
|
||
|
st->pi_gain[sub] += st->interp_qlpc[i] + st->interp_qlpc[i+1];
|
||
|
}
|
||
|
|
||
|
rl = low_pi_gain[sub];
|
||
|
#ifdef FIXED_POINT
|
||
|
filter_ratio=PDIV32_16(SHL(rl+82,2),SHR(82+rh,5));
|
||
|
#else
|
||
|
filter_ratio=(rl+.01)/(rh+.01);
|
||
|
#endif
|
||
|
|
||
|
/* Compute "real excitation" */
|
||
|
fir_mem2(sp, st->interp_qlpc, exc, st->subframeSize, st->lpcSize, st->mem_sp2);
|
||
|
/* Compute energy of low-band and high-band excitation */
|
||
|
|
||
|
eh = compute_rms(exc, st->subframeSize);
|
||
|
|
||
|
if (!SUBMODE(innovation_quant)) {/* 1 for spectral folding excitation, 0 for stochastic */
|
||
|
float g;
|
||
|
spx_word16_t el;
|
||
|
el = compute_rms(st->low_innov+offset, st->subframeSize);
|
||
|
|
||
|
/* Gain to use if we want to use the low-band excitation for high-band */
|
||
|
g=eh/(1.+el);
|
||
|
|
||
|
#if 0
|
||
|
{
|
||
|
char *tmp_stack=stack;
|
||
|
float *tmp_sig;
|
||
|
float g2;
|
||
|
ALLOC(tmp_sig, st->subframeSize, spx_sig_t);
|
||
|
for (i=0;i<st->lpcSize;i++)
|
||
|
mem[i]=st->mem_sp[i];
|
||
|
iir_mem2(st->low_innov+offset, st->interp_qlpc, tmp_sig, st->subframeSize, st->lpcSize, mem);
|
||
|
g2 = compute_rms(sp, st->subframeSize)/(.01+compute_rms(tmp_sig, st->subframeSize));
|
||
|
/*fprintf (stderr, "gains: %f %f\n", g, g2);*/
|
||
|
g = g2;
|
||
|
stack = tmp_stack;
|
||
|
}
|
||
|
#endif
|
||
|
|
||
|
#ifdef FIXED_POINT
|
||
|
g *= filter_ratio/128.;
|
||
|
#else
|
||
|
g *= filter_ratio;
|
||
|
#endif
|
||
|
/*print_vec(&g, 1, "gain factor");*/
|
||
|
/* Gain quantization */
|
||
|
{
|
||
|
int quant = (int) floor(.5 + 10 + 8.0 * log((g+.0001)));
|
||
|
/*speex_warning_int("tata", quant);*/
|
||
|
if (quant<0)
|
||
|
quant=0;
|
||
|
if (quant>31)
|
||
|
quant=31;
|
||
|
speex_bits_pack(bits, quant, 5);
|
||
|
}
|
||
|
|
||
|
} else {
|
||
|
spx_word16_t gc;
|
||
|
spx_word32_t scale;
|
||
|
spx_word16_t el;
|
||
|
el = compute_rms16(low_exc+offset, st->subframeSize);
|
||
|
|
||
|
gc = PDIV32_16(MULT16_16(filter_ratio,1+eh),1+el);
|
||
|
|
||
|
/* This is a kludge that cleans up a historical bug */
|
||
|
if (st->subframeSize==80)
|
||
|
gc *= 0.70711;
|
||
|
/*printf ("%f %f %f %f\n", el, eh, filter_ratio, gc);*/
|
||
|
#ifdef FIXED_POINT
|
||
|
{
|
||
|
int qgc = scal_quant(gc, gc_quant_bound, 16);
|
||
|
speex_bits_pack(bits, qgc, 4);
|
||
|
gc = MULT16_32_Q15(28626,gc_quant_bound[qgc]);
|
||
|
}
|
||
|
#else
|
||
|
{
|
||
|
int qgc = (int)floor(.5+3.7*(log(gc)+0.15556));
|
||
|
if (qgc<0)
|
||
|
qgc=0;
|
||
|
if (qgc>15)
|
||
|
qgc=15;
|
||
|
speex_bits_pack(bits, qgc, 4);
|
||
|
gc = exp((1/3.7)*qgc-0.15556);
|
||
|
}
|
||
|
#endif
|
||
|
if (st->subframeSize==80)
|
||
|
gc *= 1.4142;
|
||
|
|
||
|
scale = SHL32(MULT16_16(PDIV32_16(SHL32(EXTEND32(gc),SIG_SHIFT-6),filter_ratio),(1+el)),6);
|
||
|
|
||
|
compute_impulse_response(st->interp_qlpc, st->bw_lpc1, st->bw_lpc2, syn_resp, st->subframeSize, st->lpcSize, stack);
|
||
|
|
||
|
|
||
|
/* Reset excitation */
|
||
|
for (i=0;i<st->subframeSize;i++)
|
||
|
exc[i]=VERY_SMALL;
|
||
|
|
||
|
/* Compute zero response (ringing) of A(z/g1) / ( A(z/g2) * Aq(z) ) */
|
||
|
for (i=0;i<st->lpcSize;i++)
|
||
|
mem[i]=st->mem_sp[i];
|
||
|
iir_mem2(exc, st->interp_qlpc, exc, st->subframeSize, st->lpcSize, mem);
|
||
|
|
||
|
for (i=0;i<st->lpcSize;i++)
|
||
|
mem[i]=st->mem_sw[i];
|
||
|
filter_mem2(exc, st->bw_lpc1, st->bw_lpc2, res, st->subframeSize, st->lpcSize, mem);
|
||
|
|
||
|
/* Compute weighted signal */
|
||
|
for (i=0;i<st->lpcSize;i++)
|
||
|
mem[i]=st->mem_sw[i];
|
||
|
filter_mem2(sp, st->bw_lpc1, st->bw_lpc2, sw, st->subframeSize, st->lpcSize, mem);
|
||
|
|
||
|
/* Compute target signal */
|
||
|
for (i=0;i<st->subframeSize;i++)
|
||
|
target[i]=PSHR32(sw[i]-res[i],SIG_SHIFT);
|
||
|
|
||
|
for (i=0;i<st->subframeSize;i++)
|
||
|
exc[i]=0;
|
||
|
|
||
|
signal_div(target, target, scale, st->subframeSize);
|
||
|
|
||
|
/* Reset excitation */
|
||
|
for (i=0;i<st->subframeSize;i++)
|
||
|
innov[i]=0;
|
||
|
|
||
|
/*print_vec(target, st->subframeSize, "\ntarget");*/
|
||
|
SUBMODE(innovation_quant)(target, st->interp_qlpc, st->bw_lpc1, st->bw_lpc2,
|
||
|
SUBMODE(innovation_params), st->lpcSize, st->subframeSize,
|
||
|
innov, syn_resp, bits, stack, st->complexity, SUBMODE(double_codebook));
|
||
|
/*print_vec(target, st->subframeSize, "after");*/
|
||
|
|
||
|
signal_mul(innov, innov, scale, st->subframeSize);
|
||
|
|
||
|
for (i=0;i<st->subframeSize;i++)
|
||
|
exc[i] = ADD32(exc[i], innov[i]);
|
||
|
|
||
|
if (st->innov_save)
|
||
|
{
|
||
|
for (i=0;i<st->subframeSize;i++)
|
||
|
innov_save[2*i]=innov[i];
|
||
|
}
|
||
|
|
||
|
if (SUBMODE(double_codebook)) {
|
||
|
char *tmp_stack=stack;
|
||
|
VARDECL(spx_sig_t *innov2);
|
||
|
ALLOC(innov2, st->subframeSize, spx_sig_t);
|
||
|
for (i=0;i<st->subframeSize;i++)
|
||
|
innov2[i]=0;
|
||
|
for (i=0;i<st->subframeSize;i++)
|
||
|
target[i]*=2.5;
|
||
|
SUBMODE(innovation_quant)(target, st->interp_qlpc, st->bw_lpc1, st->bw_lpc2,
|
||
|
SUBMODE(innovation_params), st->lpcSize, st->subframeSize,
|
||
|
innov2, syn_resp, bits, stack, st->complexity, 0);
|
||
|
for (i=0;i<st->subframeSize;i++)
|
||
|
innov2[i]*=scale*(1/2.5)/SIG_SCALING;
|
||
|
for (i=0;i<st->subframeSize;i++)
|
||
|
exc[i] = ADD32(exc[i],innov2[i]);
|
||
|
stack = tmp_stack;
|
||
|
}
|
||
|
|
||
|
}
|
||
|
|
||
|
/*Keep the previous memory*/
|
||
|
for (i=0;i<st->lpcSize;i++)
|
||
|
mem[i]=st->mem_sp[i];
|
||
|
/* Final signal synthesis from excitation */
|
||
|
iir_mem2(exc, st->interp_qlpc, sp, st->subframeSize, st->lpcSize, st->mem_sp);
|
||
|
|
||
|
/* Compute weighted signal again, from synthesized speech (not sure it's the right thing) */
|
||
|
filter_mem2(sp, st->bw_lpc1, st->bw_lpc2, sw, st->subframeSize, st->lpcSize, st->mem_sw);
|
||
|
}
|
||
|
|
||
|
|
||
|
#ifdef RESYNTH
|
||
|
/* Reconstruct the original */
|
||
|
fir_mem_up(st->x0d, h0, st->y0, st->full_frame_size, QMF_ORDER, st->g0_mem, stack);
|
||
|
fir_mem_up(st->high, h1, st->y1, st->full_frame_size, QMF_ORDER, st->g1_mem, stack);
|
||
|
|
||
|
for (i=0;i<st->full_frame_size;i++)
|
||
|
in[i]=SHR(st->y0[i]-st->y1[i], SIG_SHIFT-1);
|
||
|
#endif
|
||
|
for (i=0;i<st->lpcSize;i++)
|
||
|
st->old_lsp[i] = st->lsp[i];
|
||
|
for (i=0;i<st->lpcSize;i++)
|
||
|
st->old_qlsp[i] = st->qlsp[i];
|
||
|
|
||
|
st->first=0;
|
||
|
|
||
|
return 1;
|
||
|
}
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
void *sb_decoder_init(const SpeexMode *m)
|
||
|
{
|
||
|
int tmp;
|
||
|
SBDecState *st;
|
||
|
const SpeexSBMode *mode;
|
||
|
st = (SBDecState*)speex_alloc(sizeof(SBDecState));
|
||
|
if (!st)
|
||
|
return NULL;
|
||
|
#if defined(VAR_ARRAYS) || defined (USE_ALLOCA)
|
||
|
st->stack = NULL;
|
||
|
#else
|
||
|
st->stack = (char*)speex_alloc_scratch(SB_DEC_STACK);
|
||
|
#endif
|
||
|
st->mode = m;
|
||
|
mode=(const SpeexSBMode*)m->mode;
|
||
|
|
||
|
st->encode_submode = 1;
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
st->st_low = speex_decoder_init(mode->nb_mode);
|
||
|
st->full_frame_size = 2*mode->frameSize;
|
||
|
st->frame_size = mode->frameSize;
|
||
|
st->subframeSize = mode->subframeSize;
|
||
|
st->nbSubframes = mode->frameSize/mode->subframeSize;
|
||
|
st->lpcSize=mode->lpcSize;
|
||
|
speex_decoder_ctl(st->st_low, SPEEX_GET_SAMPLING_RATE, &st->sampling_rate);
|
||
|
st->sampling_rate*=2;
|
||
|
tmp=1;
|
||
|
speex_decoder_ctl(st->st_low, SPEEX_SET_WIDEBAND, &tmp);
|
||
|
|
||
|
st->submodes=mode->submodes;
|
||
|
st->submodeID=mode->defaultSubmode;
|
||
|
|
||
|
st->first=1;
|
||
|
|
||
|
|
||
|
st->x0d = (spx_sig_t*)speex_alloc((st->frame_size)*sizeof(spx_sig_t));
|
||
|
st->x1d = (spx_sig_t*)speex_alloc((st->frame_size)*sizeof(spx_sig_t));
|
||
|
st->high = (spx_sig_t*)speex_alloc((st->full_frame_size)*sizeof(spx_sig_t));
|
||
|
st->y0 = (spx_sig_t*)speex_alloc((st->full_frame_size)*sizeof(spx_sig_t));
|
||
|
st->y1 = (spx_sig_t*)speex_alloc((st->full_frame_size)*sizeof(spx_sig_t));
|
||
|
|
||
|
st->g0_mem = (spx_word32_t*)speex_alloc((QMF_ORDER)*sizeof(spx_word32_t));
|
||
|
st->g1_mem = (spx_word32_t*)speex_alloc((QMF_ORDER)*sizeof(spx_word32_t));
|
||
|
|
||
|
st->exc = (spx_sig_t*)speex_alloc((st->frame_size)*sizeof(spx_sig_t));
|
||
|
st->excBuf = (spx_sig_t*)speex_alloc((st->subframeSize)*sizeof(spx_sig_t));
|
||
|
|
||
|
st->qlsp = (spx_lsp_t*)speex_alloc((st->lpcSize)*sizeof(spx_lsp_t));
|
||
|
st->old_qlsp = (spx_lsp_t*)speex_alloc((st->lpcSize)*sizeof(spx_lsp_t));
|
||
|
st->interp_qlsp = (spx_lsp_t*)speex_alloc(st->lpcSize*sizeof(spx_lsp_t));
|
||
|
st->interp_qlpc = (spx_coef_t*)speex_alloc(st->lpcSize*sizeof(spx_coef_t));
|
||
|
|
||
|
st->pi_gain = (spx_word32_t*)speex_alloc((st->nbSubframes)*sizeof(spx_word32_t));
|
||
|
st->mem_sp = (spx_mem_t*)speex_alloc((2*st->lpcSize)*sizeof(spx_mem_t));
|
||
|
|
||
|
st->low_innov = (spx_word32_t*)speex_alloc((st->frame_size)*sizeof(spx_word32_t));
|
||
|
speex_decoder_ctl(st->st_low, SPEEX_SET_INNOVATION_SAVE, st->low_innov);
|
||
|
st->innov_save = NULL;
|
||
|
|
||
|
|
||
|
st->lpc_enh_enabled=0;
|
||
|
st->seed = 1000;
|
||
|
|
||
|
#ifdef ENABLE_VALGRIND
|
||
|
VALGRIND_MAKE_READABLE(st, (st->stack-(char*)st));
|
||
|
#endif
|
||
|
return st;
|
||
|
}
|
||
|
|
||
|
void sb_decoder_destroy(void *state)
|
||
|
{
|
||
|
SBDecState *st;
|
||
|
st = (SBDecState*)state;
|
||
|
speex_decoder_destroy(st->st_low);
|
||
|
#if !(defined(VAR_ARRAYS) || defined (USE_ALLOCA))
|
||
|
speex_free_scratch(st->stack);
|
||
|
#endif
|
||
|
|
||
|
speex_free(st->x0d);
|
||
|
speex_free(st->x1d);
|
||
|
speex_free(st->high);
|
||
|
speex_free(st->y0);
|
||
|
speex_free(st->y1);
|
||
|
speex_free(st->g0_mem);
|
||
|
speex_free(st->g1_mem);
|
||
|
speex_free(st->exc);
|
||
|
speex_free(st->excBuf);
|
||
|
speex_free(st->qlsp);
|
||
|
speex_free(st->old_qlsp);
|
||
|
speex_free(st->interp_qlsp);
|
||
|
speex_free(st->interp_qlpc);
|
||
|
speex_free(st->pi_gain);
|
||
|
speex_free(st->low_innov);
|
||
|
speex_free(st->mem_sp);
|
||
|
|
||
|
speex_free(state);
|
||
|
}
|
||
|
|
||
|
static void sb_decode_lost(SBDecState *st, spx_word16_t *out, int dtx, char *stack)
|
||
|
{
|
||
|
int i;
|
||
|
int saved_modeid=0;
|
||
|
|
||
|
if (dtx)
|
||
|
{
|
||
|
saved_modeid=st->submodeID;
|
||
|
st->submodeID=1;
|
||
|
} else {
|
||
|
bw_lpc(GAMMA_SCALING*0.99, st->interp_qlpc, st->interp_qlpc, st->lpcSize);
|
||
|
}
|
||
|
|
||
|
st->first=1;
|
||
|
|
||
|
|
||
|
/* Final signal synthesis from excitation */
|
||
|
if (!dtx)
|
||
|
{
|
||
|
spx_word16_t low_ener;
|
||
|
low_ener = .9*compute_rms(st->exc, st->frame_size);
|
||
|
for (i=0;i<st->frame_size;i++)
|
||
|
st->exc[i] = speex_rand(low_ener, &st->seed);
|
||
|
}
|
||
|
|
||
|
for (i=0;i<st->frame_size;i++)
|
||
|
st->high[i]=st->exc[i];
|
||
|
|
||
|
iir_mem2(st->high, st->interp_qlpc, st->high, st->frame_size, st->lpcSize,
|
||
|
st->mem_sp);
|
||
|
|
||
|
|
||
|
/* Reconstruct the original */
|
||
|
fir_mem_up(st->x0d, h0, st->y0, st->full_frame_size, QMF_ORDER, st->g0_mem, stack);
|
||
|
fir_mem_up(st->high, h1, st->y1, st->full_frame_size, QMF_ORDER, st->g1_mem, stack);
|
||
|
|
||
|
mix_and_saturate(st->y0, st->y1, out, st->full_frame_size);
|
||
|
|
||
|
if (dtx)
|
||
|
{
|
||
|
st->submodeID=saved_modeid;
|
||
|
}
|
||
|
|
||
|
return;
|
||
|
}
|
||
|
|
||
|
int sb_decode(void *state, SpeexBits *bits, void *vout)
|
||
|
{
|
||
|
int i, sub;
|
||
|
SBDecState *st;
|
||
|
int wideband;
|
||
|
int ret;
|
||
|
char *stack;
|
||
|
VARDECL(spx_word32_t *low_pi_gain);
|
||
|
VARDECL(spx_word16_t *low_exc);
|
||
|
VARDECL(spx_coef_t *ak);
|
||
|
int dtx;
|
||
|
const SpeexSBMode *mode;
|
||
|
spx_word16_t *out = (spx_word16_t*)vout;
|
||
|
|
||
|
st = (SBDecState*)state;
|
||
|
stack=st->stack;
|
||
|
mode = (const SpeexSBMode*)(st->mode->mode);
|
||
|
|
||
|
{
|
||
|
VARDECL(spx_word16_t *low);
|
||
|
ALLOC(low, st->frame_size, spx_word16_t);
|
||
|
|
||
|
/* Decode the low-band */
|
||
|
ret = speex_decode_native(st->st_low, bits, low);
|
||
|
|
||
|
for (i=0;i<st->frame_size;i++)
|
||
|
st->x0d[i] = SHL((spx_sig_t)low[i], SIG_SHIFT);
|
||
|
}
|
||
|
|
||
|
speex_decoder_ctl(st->st_low, SPEEX_GET_DTX_STATUS, &dtx);
|
||
|
|
||
|
/* If error decoding the narrowband part, propagate error */
|
||
|
if (ret!=0)
|
||
|
{
|
||
|
return ret;
|
||
|
}
|
||
|
|
||
|
if (!bits)
|
||
|
{
|
||
|
sb_decode_lost(st, out, dtx, stack);
|
||
|
return 0;
|
||
|
}
|
||
|
|
||
|
if (st->encode_submode)
|
||
|
{
|
||
|
|
||
|
/*Check "wideband bit"*/
|
||
|
if (speex_bits_remaining(bits)>0)
|
||
|
wideband = speex_bits_peek(bits);
|
||
|
else
|
||
|
wideband = 0;
|
||
|
if (wideband)
|
||
|
{
|
||
|
/*Regular wideband frame, read the submode*/
|
||
|
wideband = speex_bits_unpack_unsigned(bits, 1);
|
||
|
st->submodeID = speex_bits_unpack_unsigned(bits, SB_SUBMODE_BITS);
|
||
|
} else
|
||
|
{
|
||
|
/*Was a narrowband frame, set "null submode"*/
|
||
|
st->submodeID = 0;
|
||
|
}
|
||
|
if (st->submodeID != 0 && st->submodes[st->submodeID] == NULL)
|
||
|
{
|
||
|
speex_warning("Invalid mode encountered: corrupted stream?");
|
||
|
return -2;
|
||
|
}
|
||
|
}
|
||
|
|
||
|
/* If null mode (no transmission), just set a couple things to zero*/
|
||
|
if (st->submodes[st->submodeID] == NULL)
|
||
|
{
|
||
|
if (dtx)
|
||
|
{
|
||
|
sb_decode_lost(st, out, 1, stack);
|
||
|
return 0;
|
||
|
}
|
||
|
|
||
|
for (i=0;i<st->frame_size;i++)
|
||
|
st->exc[i]=VERY_SMALL;
|
||
|
|
||
|
st->first=1;
|
||
|
|
||
|
/* Final signal synthesis from excitation */
|
||
|
iir_mem2(st->exc, st->interp_qlpc, st->high, st->frame_size, st->lpcSize, st->mem_sp);
|
||
|
|
||
|
fir_mem_up(st->x0d, h0, st->y0, st->full_frame_size, QMF_ORDER, st->g0_mem, stack);
|
||
|
fir_mem_up(st->high, h1, st->y1, st->full_frame_size, QMF_ORDER, st->g1_mem, stack);
|
||
|
|
||
|
mix_and_saturate(st->y0, st->y1, out, st->full_frame_size);
|
||
|
|
||
|
return 0;
|
||
|
|
||
|
}
|
||
|
|
||
|
for (i=0;i<st->frame_size;i++)
|
||
|
st->exc[i]=0;
|
||
|
|
||
|
ALLOC(low_pi_gain, st->nbSubframes, spx_word32_t);
|
||
|
ALLOC(low_exc, st->frame_size, spx_word16_t);
|
||
|
speex_decoder_ctl(st->st_low, SPEEX_GET_PI_GAIN, low_pi_gain);
|
||
|
speex_decoder_ctl(st->st_low, SPEEX_GET_EXC, low_exc);
|
||
|
|
||
|
SUBMODE(lsp_unquant)(st->qlsp, st->lpcSize, bits);
|
||
|
|
||
|
if (st->first)
|
||
|
{
|
||
|
for (i=0;i<st->lpcSize;i++)
|
||
|
st->old_qlsp[i] = st->qlsp[i];
|
||
|
}
|
||
|
|
||
|
ALLOC(ak, st->lpcSize, spx_coef_t);
|
||
|
|
||
|
for (sub=0;sub<st->nbSubframes;sub++)
|
||
|
{
|
||
|
spx_sig_t *exc, *sp, *innov_save=NULL;
|
||
|
spx_word16_t filter_ratio;
|
||
|
spx_word16_t el=0;
|
||
|
int offset;
|
||
|
spx_word32_t rl=0,rh=0;
|
||
|
|
||
|
offset = st->subframeSize*sub;
|
||
|
sp=st->high+offset;
|
||
|
exc=st->exc+offset;
|
||
|
/* Pointer for saving innovation */
|
||
|
if (st->innov_save)
|
||
|
{
|
||
|
innov_save = st->innov_save+2*offset;
|
||
|
for (i=0;i<2*st->subframeSize;i++)
|
||
|
innov_save[i]=0;
|
||
|
}
|
||
|
|
||
|
/* LSP interpolation */
|
||
|
lsp_interpolate(st->old_qlsp, st->qlsp, st->interp_qlsp, st->lpcSize, sub, st->nbSubframes);
|
||
|
|
||
|
lsp_enforce_margin(st->interp_qlsp, st->lpcSize, LSP_MARGIN);
|
||
|
|
||
|
/* LSP to LPC */
|
||
|
lsp_to_lpc(st->interp_qlsp, ak, st->lpcSize, stack);
|
||
|
|
||
|
/* Calculate reponse ratio between the low and high filter in the middle
|
||
|
of the band (4000 Hz) */
|
||
|
|
||
|
st->pi_gain[sub]=LPC_SCALING;
|
||
|
rh = LPC_SCALING;
|
||
|
for (i=0;i<st->lpcSize;i+=2)
|
||
|
{
|
||
|
rh += st->interp_qlpc[i+1] - st->interp_qlpc[i];
|
||
|
st->pi_gain[sub] += st->interp_qlpc[i] + st->interp_qlpc[i+1];
|
||
|
}
|
||
|
|
||
|
rl = low_pi_gain[sub];
|
||
|
#ifdef FIXED_POINT
|
||
|
filter_ratio=PDIV32_16(SHL(rl+82,2),SHR(82+rh,5));
|
||
|
#else
|
||
|
filter_ratio=(rl+.01)/(rh+.01);
|
||
|
#endif
|
||
|
|
||
|
for (i=0;i<st->subframeSize;i++)
|
||
|
exc[i]=0;
|
||
|
if (!SUBMODE(innovation_unquant))
|
||
|
{
|
||
|
float g;
|
||
|
int quant;
|
||
|
|
||
|
quant = speex_bits_unpack_unsigned(bits, 5);
|
||
|
#ifdef FIXED_POINT
|
||
|
g= spx_exp_lookup_int[quant];
|
||
|
#else
|
||
|
g= exp(((float)quant-10)/8.0);
|
||
|
#endif
|
||
|
|
||
|
#ifdef FIXED_POINT
|
||
|
g /= filter_ratio/128.;
|
||
|
#else
|
||
|
g /= filter_ratio;
|
||
|
#endif
|
||
|
/* High-band excitation using the low-band excitation and a gain */
|
||
|
|
||
|
#if 0
|
||
|
for (i=0;i<st->subframeSize;i++)
|
||
|
exc[i]=mode->folding_gain*g*st->low_innov[offset+i];
|
||
|
#else
|
||
|
{
|
||
|
float tmp=1;
|
||
|
/*static tmp1=0,tmp2=0;
|
||
|
static int seed=1;
|
||
|
el = compute_rms(low_innov+offset, st->subframeSize);*/
|
||
|
for (i=0;i<st->subframeSize;i++)
|
||
|
{
|
||
|
float e=tmp*g*mode->folding_gain*st->low_innov[offset+i];
|
||
|
tmp *= -1;
|
||
|
exc[i] = e;
|
||
|
/*float r = speex_rand(g*el,&seed);
|
||
|
exc[i] = .5*(r+tmp2 + e-tmp1);
|
||
|
tmp1 = e;
|
||
|
tmp2 = r;*/
|
||
|
}
|
||
|
|
||
|
}
|
||
|
|
||
|
#endif
|
||
|
} else {
|
||
|
spx_word16_t gc;
|
||
|
spx_word32_t scale;
|
||
|
int qgc = speex_bits_unpack_unsigned(bits, 4);
|
||
|
|
||
|
el = compute_rms16(low_exc+offset, st->subframeSize);
|
||
|
|
||
|
#ifdef FIXED_POINT
|
||
|
gc = MULT16_32_Q15(28626,gc_quant_bound[qgc]);
|
||
|
#else
|
||
|
gc = exp((1/3.7)*qgc-0.15556);
|
||
|
#endif
|
||
|
|
||
|
if (st->subframeSize==80)
|
||
|
gc *= 1.4142;
|
||
|
|
||
|
scale = SHL(MULT16_16(PDIV32_16(SHL(gc,SIG_SHIFT-6),filter_ratio),(1+el)),6);
|
||
|
|
||
|
SUBMODE(innovation_unquant)(exc, SUBMODE(innovation_params), st->subframeSize,
|
||
|
bits, stack, &st->seed);
|
||
|
|
||
|
signal_mul(exc,exc,scale,st->subframeSize);
|
||
|
|
||
|
if (SUBMODE(double_codebook)) {
|
||
|
char *tmp_stack=stack;
|
||
|
VARDECL(spx_sig_t *innov2);
|
||
|
ALLOC(innov2, st->subframeSize, spx_sig_t);
|
||
|
for (i=0;i<st->subframeSize;i++)
|
||
|
innov2[i]=0;
|
||
|
SUBMODE(innovation_unquant)(innov2, SUBMODE(innovation_params), st->subframeSize,
|
||
|
bits, stack, &st->seed);
|
||
|
for (i=0;i<st->subframeSize;i++)
|
||
|
innov2[i]*=scale/(float)SIG_SCALING*(1/2.5);
|
||
|
for (i=0;i<st->subframeSize;i++)
|
||
|
exc[i] = ADD32(exc[i],innov2[i]);
|
||
|
stack = tmp_stack;
|
||
|
}
|
||
|
|
||
|
}
|
||
|
|
||
|
if (st->innov_save)
|
||
|
{
|
||
|
for (i=0;i<st->subframeSize;i++)
|
||
|
innov_save[2*i]=exc[i];
|
||
|
}
|
||
|
|
||
|
for (i=0;i<st->subframeSize;i++)
|
||
|
sp[i]=st->excBuf[i];
|
||
|
iir_mem2(sp, st->interp_qlpc, sp, st->subframeSize, st->lpcSize,
|
||
|
st->mem_sp);
|
||
|
for (i=0;i<st->subframeSize;i++)
|
||
|
st->excBuf[i]=exc[i];
|
||
|
for (i=0;i<st->lpcSize;i++)
|
||
|
st->interp_qlpc[i] = ak[i];
|
||
|
|
||
|
}
|
||
|
|
||
|
fir_mem_up(st->x0d, h0, st->y0, st->full_frame_size, QMF_ORDER, st->g0_mem, stack);
|
||
|
fir_mem_up(st->high, h1, st->y1, st->full_frame_size, QMF_ORDER, st->g1_mem, stack);
|
||
|
|
||
|
mix_and_saturate(st->y0, st->y1, out, st->full_frame_size);
|
||
|
|
||
|
for (i=0;i<st->lpcSize;i++)
|
||
|
st->old_qlsp[i] = st->qlsp[i];
|
||
|
|
||
|
st->first=0;
|
||
|
|
||
|
return 0;
|
||
|
}
|
||
|
|
||
|
|
||
|
int sb_encoder_ctl(void *state, int request, void *ptr)
|
||
|
{
|
||
|
SBEncState *st;
|
||
|
st=(SBEncState*)state;
|
||
|
switch(request)
|
||
|
{
|
||
|
case SPEEX_GET_FRAME_SIZE:
|
||
|
(*(int*)ptr) = st->full_frame_size;
|
||
|
break;
|
||
|
case SPEEX_SET_HIGH_MODE:
|
||
|
st->submodeSelect = st->submodeID = (*(int*)ptr);
|
||
|
break;
|
||
|
case SPEEX_SET_LOW_MODE:
|
||
|
speex_encoder_ctl(st->st_low, SPEEX_SET_LOW_MODE, ptr);
|
||
|
break;
|
||
|
case SPEEX_SET_DTX:
|
||
|
speex_encoder_ctl(st->st_low, SPEEX_SET_DTX, ptr);
|
||
|
break;
|
||
|
case SPEEX_GET_DTX:
|
||
|
speex_encoder_ctl(st->st_low, SPEEX_GET_DTX, ptr);
|
||
|
break;
|
||
|
case SPEEX_GET_LOW_MODE:
|
||
|
speex_encoder_ctl(st->st_low, SPEEX_GET_LOW_MODE, ptr);
|
||
|
break;
|
||
|
case SPEEX_SET_MODE:
|
||
|
speex_encoder_ctl(st, SPEEX_SET_QUALITY, ptr);
|
||
|
break;
|
||
|
case SPEEX_SET_VBR:
|
||
|
st->vbr_enabled = (*(int*)ptr);
|
||
|
speex_encoder_ctl(st->st_low, SPEEX_SET_VBR, ptr);
|
||
|
break;
|
||
|
case SPEEX_GET_VBR:
|
||
|
(*(int*)ptr) = st->vbr_enabled;
|
||
|
break;
|
||
|
case SPEEX_SET_VAD:
|
||
|
st->vad_enabled = (*(int*)ptr);
|
||
|
speex_encoder_ctl(st->st_low, SPEEX_SET_VAD, ptr);
|
||
|
break;
|
||
|
case SPEEX_GET_VAD:
|
||
|
(*(int*)ptr) = st->vad_enabled;
|
||
|
break;
|
||
|
case SPEEX_SET_VBR_QUALITY:
|
||
|
{
|
||
|
int q;
|
||
|
float qual = (*(float*)ptr)+.6;
|
||
|
st->vbr_quality = (*(float*)ptr);
|
||
|
if (qual>10)
|
||
|
qual=10;
|
||
|
q=(int)floor(.5+*(float*)ptr);
|
||
|
if (q>10)
|
||
|
q=10;
|
||
|
speex_encoder_ctl(st->st_low, SPEEX_SET_VBR_QUALITY, &qual);
|
||
|
speex_encoder_ctl(state, SPEEX_SET_QUALITY, &q);
|
||
|
break;
|
||
|
}
|
||
|
case SPEEX_GET_VBR_QUALITY:
|
||
|
(*(float*)ptr) = st->vbr_quality;
|
||
|
break;
|
||
|
case SPEEX_SET_ABR:
|
||
|
st->abr_enabled = (*(spx_int32_t*)ptr);
|
||
|
st->vbr_enabled = st->abr_enabled!=0;
|
||
|
speex_encoder_ctl(st->st_low, SPEEX_SET_VBR, &st->vbr_enabled);
|
||
|
if (st->vbr_enabled)
|
||
|
{
|
||
|
int i=10, rate, target;
|
||
|
float vbr_qual;
|
||
|
target = (*(spx_int32_t*)ptr);
|
||
|
while (i>=0)
|
||
|
{
|
||
|
speex_encoder_ctl(st, SPEEX_SET_QUALITY, &i);
|
||
|
speex_encoder_ctl(st, SPEEX_GET_BITRATE, &rate);
|
||
|
if (rate <= target)
|
||
|
break;
|
||
|
i--;
|
||
|
}
|
||
|
vbr_qual=i;
|
||
|
if (vbr_qual<0)
|
||
|
vbr_qual=0;
|
||
|
speex_encoder_ctl(st, SPEEX_SET_VBR_QUALITY, &vbr_qual);
|
||
|
st->abr_count=0;
|
||
|
st->abr_drift=0;
|
||
|
st->abr_drift2=0;
|
||
|
}
|
||
|
|
||
|
break;
|
||
|
case SPEEX_GET_ABR:
|
||
|
(*(spx_int32_t*)ptr) = st->abr_enabled;
|
||
|
break;
|
||
|
case SPEEX_SET_QUALITY:
|
||
|
{
|
||
|
int nb_qual;
|
||
|
int quality = (*(int*)ptr);
|
||
|
if (quality < 0)
|
||
|
quality = 0;
|
||
|
if (quality > 10)
|
||
|
quality = 10;
|
||
|
st->submodeSelect = st->submodeID = ((const SpeexSBMode*)(st->mode->mode))->quality_map[quality];
|
||
|
nb_qual = ((const SpeexSBMode*)(st->mode->mode))->low_quality_map[quality];
|
||
|
speex_encoder_ctl(st->st_low, SPEEX_SET_MODE, &nb_qual);
|
||
|
}
|
||
|
break;
|
||
|
case SPEEX_SET_COMPLEXITY:
|
||
|
speex_encoder_ctl(st->st_low, SPEEX_SET_COMPLEXITY, ptr);
|
||
|
st->complexity = (*(int*)ptr);
|
||
|
if (st->complexity<1)
|
||
|
st->complexity=1;
|
||
|
break;
|
||
|
case SPEEX_GET_COMPLEXITY:
|
||
|
(*(int*)ptr) = st->complexity;
|
||
|
break;
|
||
|
case SPEEX_SET_BITRATE:
|
||
|
{
|
||
|
int i=10;
|
||
|
spx_int32_t rate, target;
|
||
|
target = (*(spx_int32_t*)ptr);
|
||
|
while (i>=0)
|
||
|
{
|
||
|
speex_encoder_ctl(st, SPEEX_SET_QUALITY, &i);
|
||
|
speex_encoder_ctl(st, SPEEX_GET_BITRATE, &rate);
|
||
|
if (rate <= target)
|
||
|
break;
|
||
|
i--;
|
||
|
}
|
||
|
}
|
||
|
break;
|
||
|
case SPEEX_GET_BITRATE:
|
||
|
speex_encoder_ctl(st->st_low, request, ptr);
|
||
|
/*fprintf (stderr, "before: %d\n", (*(int*)ptr));*/
|
||
|
if (st->submodes[st->submodeID])
|
||
|
(*(spx_int32_t*)ptr) += st->sampling_rate*SUBMODE(bits_per_frame)/st->full_frame_size;
|
||
|
else
|
||
|
(*(spx_int32_t*)ptr) += st->sampling_rate*(SB_SUBMODE_BITS+1)/st->full_frame_size;
|
||
|
/*fprintf (stderr, "after: %d\n", (*(int*)ptr));*/
|
||
|
break;
|
||
|
case SPEEX_SET_SAMPLING_RATE:
|
||
|
{
|
||
|
spx_int32_t tmp=(*(spx_int32_t*)ptr);
|
||
|
st->sampling_rate = tmp;
|
||
|
tmp>>=1;
|
||
|
speex_encoder_ctl(st->st_low, SPEEX_SET_SAMPLING_RATE, &tmp);
|
||
|
}
|
||
|
break;
|
||
|
case SPEEX_GET_SAMPLING_RATE:
|
||
|
(*(spx_int32_t*)ptr)=st->sampling_rate;
|
||
|
break;
|
||
|
case SPEEX_RESET_STATE:
|
||
|
{
|
||
|
int i;
|
||
|
st->first = 1;
|
||
|
for (i=0;i<st->lpcSize;i++)
|
||
|
st->lsp[i]=(M_PI*((float)(i+1)))/(st->lpcSize+1);
|
||
|
for (i=0;i<st->lpcSize;i++)
|
||
|
st->mem_sw[i]=st->mem_sp[i]=st->mem_sp2[i]=0;
|
||
|
for (i=0;i<st->bufSize;i++)
|
||
|
st->excBuf[i]=0;
|
||
|
for (i=0;i<QMF_ORDER;i++)
|
||
|
st->h0_mem[i]=st->h1_mem[i]=st->g0_mem[i]=st->g1_mem[i]=0;
|
||
|
}
|
||
|
break;
|
||
|
case SPEEX_SET_SUBMODE_ENCODING:
|
||
|
st->encode_submode = (*(int*)ptr);
|
||
|
speex_encoder_ctl(st->st_low, SPEEX_SET_SUBMODE_ENCODING, &ptr);
|
||
|
break;
|
||
|
case SPEEX_GET_SUBMODE_ENCODING:
|
||
|
(*(int*)ptr) = st->encode_submode;
|
||
|
break;
|
||
|
case SPEEX_GET_LOOKAHEAD:
|
||
|
speex_encoder_ctl(st->st_low, SPEEX_GET_LOOKAHEAD, ptr);
|
||
|
(*(int*)ptr) = 2*(*(int*)ptr) + QMF_ORDER - 1;
|
||
|
break;
|
||
|
case SPEEX_SET_PLC_TUNING:
|
||
|
speex_encoder_ctl(st->st_low, SPEEX_SET_PLC_TUNING, ptr);
|
||
|
break;
|
||
|
case SPEEX_GET_PLC_TUNING:
|
||
|
speex_encoder_ctl(st->st_low, SPEEX_GET_PLC_TUNING, ptr);
|
||
|
break;
|
||
|
case SPEEX_SET_VBR_MAX_BITRATE:
|
||
|
{
|
||
|
st->vbr_max = (*(spx_int32_t*)ptr);
|
||
|
if (SPEEX_SET_VBR_MAX_BITRATE<1)
|
||
|
{
|
||
|
speex_encoder_ctl(st->st_low, SPEEX_SET_VBR_MAX_BITRATE, &st->vbr_max);
|
||
|
st->vbr_max_high = 17600;
|
||
|
} else {
|
||
|
spx_int32_t low_rate;
|
||
|
if (st->vbr_max >= 42200)
|
||
|
{
|
||
|
st->vbr_max_high = 17600;
|
||
|
} else if (st->vbr_max >= 27800)
|
||
|
{
|
||
|
st->vbr_max_high = 9600;
|
||
|
} else if (st->vbr_max > 20600)
|
||
|
{
|
||
|
st->vbr_max_high = 5600;
|
||
|
} else {
|
||
|
st->vbr_max_high = 1800;
|
||
|
}
|
||
|
if (st->subframeSize==80)
|
||
|
st->vbr_max_high = 1800;
|
||
|
low_rate = st->vbr_max - st->vbr_max_high;
|
||
|
speex_encoder_ctl(st->st_low, SPEEX_SET_VBR_MAX_BITRATE, &low_rate);
|
||
|
}
|
||
|
}
|
||
|
break;
|
||
|
case SPEEX_GET_VBR_MAX_BITRATE:
|
||
|
(*(spx_int32_t*)ptr) = st->vbr_max;
|
||
|
break;
|
||
|
case SPEEX_SET_HIGHPASS:
|
||
|
speex_encoder_ctl(st->st_low, SPEEX_SET_HIGHPASS, ptr);
|
||
|
break;
|
||
|
case SPEEX_GET_HIGHPASS:
|
||
|
speex_encoder_ctl(st->st_low, SPEEX_GET_HIGHPASS, ptr);
|
||
|
break;
|
||
|
|
||
|
|
||
|
/* This is all internal stuff past this point */
|
||
|
case SPEEX_GET_PI_GAIN:
|
||
|
{
|
||
|
int i;
|
||
|
spx_word32_t *g = (spx_word32_t*)ptr;
|
||
|
for (i=0;i<st->nbSubframes;i++)
|
||
|
g[i]=st->pi_gain[i];
|
||
|
}
|
||
|
break;
|
||
|
case SPEEX_GET_EXC:
|
||
|
{
|
||
|
int i;
|
||
|
spx_sig_t *e = (spx_sig_t*)ptr;
|
||
|
for (i=0;i<st->full_frame_size;i++)
|
||
|
e[i]=0;
|
||
|
for (i=0;i<st->frame_size;i++)
|
||
|
e[2*i]=2*st->exc[i];
|
||
|
}
|
||
|
break;
|
||
|
case SPEEX_GET_INNOV:
|
||
|
{
|
||
|
int i;
|
||
|
spx_sig_t *e = (spx_sig_t*)ptr;
|
||
|
for (i=0;i<st->full_frame_size;i++)
|
||
|
e[i]=0;
|
||
|
for (i=0;i<st->frame_size;i++)
|
||
|
e[2*i]=2*st->exc[i];
|
||
|
}
|
||
|
break;
|
||
|
case SPEEX_GET_RELATIVE_QUALITY:
|
||
|
(*(float*)ptr)=st->relative_quality;
|
||
|
break;
|
||
|
case SPEEX_SET_INNOVATION_SAVE:
|
||
|
st->innov_save = (spx_sig_t*)ptr;
|
||
|
break;
|
||
|
case SPEEX_SET_WIDEBAND:
|
||
|
speex_encoder_ctl(st->st_low, SPEEX_SET_WIDEBAND, ptr);
|
||
|
break;
|
||
|
|
||
|
default:
|
||
|
speex_warning_int("Unknown nb_ctl request: ", request);
|
||
|
return -1;
|
||
|
}
|
||
|
return 0;
|
||
|
}
|
||
|
|
||
|
int sb_decoder_ctl(void *state, int request, void *ptr)
|
||
|
{
|
||
|
SBDecState *st;
|
||
|
st=(SBDecState*)state;
|
||
|
switch(request)
|
||
|
{
|
||
|
case SPEEX_SET_HIGH_MODE:
|
||
|
st->submodeID = (*(int*)ptr);
|
||
|
break;
|
||
|
case SPEEX_SET_LOW_MODE:
|
||
|
speex_decoder_ctl(st->st_low, SPEEX_SET_LOW_MODE, ptr);
|
||
|
break;
|
||
|
case SPEEX_GET_LOW_MODE:
|
||
|
speex_decoder_ctl(st->st_low, SPEEX_GET_LOW_MODE, ptr);
|
||
|
break;
|
||
|
case SPEEX_GET_FRAME_SIZE:
|
||
|
(*(int*)ptr) = st->full_frame_size;
|
||
|
break;
|
||
|
case SPEEX_SET_ENH:
|
||
|
speex_decoder_ctl(st->st_low, request, ptr);
|
||
|
st->lpc_enh_enabled = *((int*)ptr);
|
||
|
break;
|
||
|
case SPEEX_GET_ENH:
|
||
|
*((int*)ptr) = st->lpc_enh_enabled;
|
||
|
break;
|
||
|
case SPEEX_SET_MODE:
|
||
|
case SPEEX_SET_QUALITY:
|
||
|
{
|
||
|
int nb_qual;
|
||
|
int quality = (*(int*)ptr);
|
||
|
if (quality < 0)
|
||
|
quality = 0;
|
||
|
if (quality > 10)
|
||
|
quality = 10;
|
||
|
st->submodeID = ((const SpeexSBMode*)(st->mode->mode))->quality_map[quality];
|
||
|
nb_qual = ((const SpeexSBMode*)(st->mode->mode))->low_quality_map[quality];
|
||
|
speex_decoder_ctl(st->st_low, SPEEX_SET_MODE, &nb_qual);
|
||
|
}
|
||
|
break;
|
||
|
case SPEEX_GET_BITRATE:
|
||
|
speex_decoder_ctl(st->st_low, request, ptr);
|
||
|
if (st->submodes[st->submodeID])
|
||
|
(*(spx_int32_t*)ptr) += st->sampling_rate*SUBMODE(bits_per_frame)/st->full_frame_size;
|
||
|
else
|
||
|
(*(spx_int32_t*)ptr) += st->sampling_rate*(SB_SUBMODE_BITS+1)/st->full_frame_size;
|
||
|
break;
|
||
|
case SPEEX_SET_SAMPLING_RATE:
|
||
|
{
|
||
|
spx_int32_t tmp=(*(spx_int32_t*)ptr);
|
||
|
st->sampling_rate = tmp;
|
||
|
tmp>>=1;
|
||
|
speex_decoder_ctl(st->st_low, SPEEX_SET_SAMPLING_RATE, &tmp);
|
||
|
}
|
||
|
break;
|
||
|
case SPEEX_GET_SAMPLING_RATE:
|
||
|
(*(spx_int32_t*)ptr)=st->sampling_rate;
|
||
|
break;
|
||
|
case SPEEX_SET_HANDLER:
|
||
|
speex_decoder_ctl(st->st_low, SPEEX_SET_HANDLER, ptr);
|
||
|
break;
|
||
|
case SPEEX_SET_USER_HANDLER:
|
||
|
speex_decoder_ctl(st->st_low, SPEEX_SET_USER_HANDLER, ptr);
|
||
|
break;
|
||
|
case SPEEX_RESET_STATE:
|
||
|
{
|
||
|
int i;
|
||
|
for (i=0;i<2*st->lpcSize;i++)
|
||
|
st->mem_sp[i]=0;
|
||
|
for (i=0;i<QMF_ORDER;i++)
|
||
|
st->g0_mem[i]=st->g1_mem[i]=0;
|
||
|
}
|
||
|
break;
|
||
|
case SPEEX_SET_SUBMODE_ENCODING:
|
||
|
st->encode_submode = (*(int*)ptr);
|
||
|
speex_decoder_ctl(st->st_low, SPEEX_SET_SUBMODE_ENCODING, &ptr);
|
||
|
break;
|
||
|
case SPEEX_GET_SUBMODE_ENCODING:
|
||
|
(*(int*)ptr) = st->encode_submode;
|
||
|
break;
|
||
|
case SPEEX_GET_LOOKAHEAD:
|
||
|
speex_decoder_ctl(st->st_low, SPEEX_GET_LOOKAHEAD, ptr);
|
||
|
(*(int*)ptr) = 2*(*(int*)ptr);
|
||
|
break;
|
||
|
case SPEEX_SET_HIGHPASS:
|
||
|
speex_decoder_ctl(st->st_low, SPEEX_SET_HIGHPASS, ptr);
|
||
|
break;
|
||
|
case SPEEX_GET_HIGHPASS:
|
||
|
speex_decoder_ctl(st->st_low, SPEEX_GET_HIGHPASS, ptr);
|
||
|
break;
|
||
|
|
||
|
case SPEEX_GET_PI_GAIN:
|
||
|
{
|
||
|
int i;
|
||
|
spx_word32_t *g = (spx_word32_t*)ptr;
|
||
|
for (i=0;i<st->nbSubframes;i++)
|
||
|
g[i]=st->pi_gain[i];
|
||
|
}
|
||
|
break;
|
||
|
case SPEEX_GET_EXC:
|
||
|
{
|
||
|
int i;
|
||
|
spx_sig_t *e = (spx_sig_t*)ptr;
|
||
|
for (i=0;i<st->full_frame_size;i++)
|
||
|
e[i]=0;
|
||
|
for (i=0;i<st->frame_size;i++)
|
||
|
e[2*i]=2*st->exc[i];
|
||
|
}
|
||
|
break;
|
||
|
case SPEEX_GET_INNOV:
|
||
|
{
|
||
|
int i;
|
||
|
spx_sig_t *e = (spx_sig_t*)ptr;
|
||
|
for (i=0;i<st->full_frame_size;i++)
|
||
|
e[i]=0;
|
||
|
for (i=0;i<st->frame_size;i++)
|
||
|
e[2*i]=2*st->exc[i];
|
||
|
}
|
||
|
break;
|
||
|
case SPEEX_GET_DTX_STATUS:
|
||
|
speex_decoder_ctl(st->st_low, SPEEX_GET_DTX_STATUS, ptr);
|
||
|
break;
|
||
|
case SPEEX_SET_INNOVATION_SAVE:
|
||
|
st->innov_save = (spx_sig_t*)ptr;
|
||
|
break;
|
||
|
case SPEEX_SET_WIDEBAND:
|
||
|
speex_decoder_ctl(st->st_low, SPEEX_SET_WIDEBAND, ptr);
|
||
|
break;
|
||
|
|
||
|
default:
|
||
|
speex_warning_int("Unknown nb_ctl request: ", request);
|
||
|
return -1;
|
||
|
}
|
||
|
return 0;
|
||
|
}
|
||
|
|
||
|
#endif
|
||
|
|