| /* Copyright (C) 2002 Jean-Marc Valin |
| File: sb_celp.c |
| |
| Redistribution and use in source and binary forms, with or without |
| modification, are permitted provided that the following conditions |
| are met: |
| |
| - Redistributions of source code must retain the above copyright |
| notice, this list of conditions and the following disclaimer. |
| |
| - Redistributions in binary form must reproduce the above copyright |
| notice, this list of conditions and the following disclaimer in the |
| documentation and/or other materials provided with the distribution. |
| |
| - Neither the name of the Xiph.org Foundation nor the names of its |
| contributors may be used to endorse or promote products derived from |
| this software without specific prior written permission. |
| |
| THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS |
| ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT |
| LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR |
| A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE FOUNDATION OR |
| CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, |
| EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, |
| PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR |
| PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF |
| LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING |
| NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS |
| SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. |
| */ |
| |
| #ifdef HAVE_CONFIG_H |
| #include "config.h" |
| #endif |
| |
| #include <math.h> |
| #include "sb_celp.h" |
| #include "stdlib.h" |
| #include "filters.h" |
| #include "lpc.h" |
| #include "lsp.h" |
| #include "stack_alloc.h" |
| #include "cb_search.h" |
| #include "quant_lsp.h" |
| #include "vq.h" |
| #include "ltp.h" |
| #include "misc.h" |
| |
| /* Default size for the encoder and decoder stack (can be changed at compile time). |
| This does not apply when using variable-size arrays or alloca. */ |
| #ifndef SB_ENC_STACK |
| #define SB_ENC_STACK (10000*sizeof(spx_sig_t)) |
| #endif |
| |
| #ifndef SB_DEC_STACK |
| #define SB_DEC_STACK (6000*sizeof(spx_sig_t)) |
| #endif |
| |
| |
| #ifdef DISABLE_WIDEBAND |
| void *sb_encoder_init(const SpeexMode *m) |
| { |
| speex_error("Wideband and Ultra-wideband are disabled"); |
| return NULL; |
| } |
| void sb_encoder_destroy(void *state) |
| { |
| speex_error("Wideband and Ultra-wideband are disabled"); |
| } |
| int sb_encode(void *state, void *vin, SpeexBits *bits) |
| { |
| speex_error("Wideband and Ultra-wideband are disabled"); |
| return -2; |
| } |
| void *sb_decoder_init(const SpeexMode *m) |
| { |
| speex_error("Wideband and Ultra-wideband are disabled"); |
| return NULL; |
| } |
| void sb_decoder_destroy(void *state) |
| { |
| speex_error("Wideband and Ultra-wideband are disabled"); |
| } |
| int sb_decode(void *state, SpeexBits *bits, void *vout) |
| { |
| speex_error("Wideband and Ultra-wideband are disabled"); |
| return -2; |
| } |
| int sb_encoder_ctl(void *state, int request, void *ptr) |
| { |
| speex_error("Wideband and Ultra-wideband are disabled"); |
| return -2; |
| } |
| int sb_decoder_ctl(void *state, int request, void *ptr) |
| { |
| speex_error("Wideband and Ultra-wideband are disabled"); |
| return -2; |
| } |
| #else |
| |
| |
| #ifndef M_PI |
| #define M_PI 3.14159265358979323846 /* pi */ |
| #endif |
| |
| #define sqr(x) ((x)*(x)) |
| |
| #define SUBMODE(x) st->submodes[st->submodeID]->x |
| |
| #ifdef FIXED_POINT |
| static const spx_word16_t gc_quant_bound[16] = {125, 164, 215, 282, 370, 484, 635, 832, 1090, 1428, 1871, 2452, 3213, 4210, 5516, 7228}; |
| #define LSP_MARGIN 410 |
| #define LSP_DELTA1 6553 |
| #define LSP_DELTA2 1638 |
| |
| #else |
| |
| #define LSP_MARGIN .05 |
| #define LSP_DELTA1 .2 |
| #define LSP_DELTA2 .05 |
| |
| #endif |
| |
| #define QMF_ORDER 64 |
| |
| #ifdef FIXED_POINT |
| static const spx_word16_t h0[64] = {2, -7, -7, 18, 15, -39, -25, 75, 35, -130, -41, 212, 38, -327, -17, 483, -32, -689, 124, 956, -283, -1307, 543, 1780, -973, -2467, 1733, 3633, -3339, -6409, 9059, 30153, 30153, 9059, -6409, -3339, 3633, 1733, -2467, -973, 1780, 543, -1307, -283, 956, 124, -689, -32, 483, -17, -327, 38, 212, -41, -130, 35, 75, -25, -39, 15, 18, -7, -7, 2}; |
| |
| static const spx_word16_t h1[64] = {2, 7, -7, -18, 15, 39, -25, -75, 35, 130, -41, -212, 38, 327, -17, -483, -32, 689, 124, -956, -283, 1307, 543, -1780, -973, 2467, 1733, -3633, -3339, 6409, 9059, -30153, 30153, -9059, -6409, 3339, 3633, -1733, -2467, 973, 1780, -543, -1307, 283, 956, -124, -689, 32, 483, 17, -327, -38, 212, 41, -130, -35, 75, 25, -39, -15, 18, 7, -7, -2}; |
| |
| |
| #else |
| static const float h0[64] = { |
| 3.596189e-05, -0.0001123515, |
| -0.0001104587, 0.0002790277, |
| 0.0002298438, -0.0005953563, |
| -0.0003823631, 0.00113826, |
| 0.0005308539, -0.001986177, |
| -0.0006243724, 0.003235877, |
| 0.0005743159, -0.004989147, |
| -0.0002584767, 0.007367171, |
| -0.0004857935, -0.01050689, |
| 0.001894714, 0.01459396, |
| -0.004313674, -0.01994365, |
| 0.00828756, 0.02716055, |
| -0.01485397, -0.03764973, |
| 0.026447, 0.05543245, |
| -0.05095487, -0.09779096, |
| 0.1382363, 0.4600981, |
| 0.4600981, 0.1382363, |
| -0.09779096, -0.05095487, |
| 0.05543245, 0.026447, |
| -0.03764973, -0.01485397, |
| 0.02716055, 0.00828756, |
| -0.01994365, -0.004313674, |
| 0.01459396, 0.001894714, |
| -0.01050689, -0.0004857935, |
| 0.007367171, -0.0002584767, |
| -0.004989147, 0.0005743159, |
| 0.003235877, -0.0006243724, |
| -0.001986177, 0.0005308539, |
| 0.00113826, -0.0003823631, |
| -0.0005953563, 0.0002298438, |
| 0.0002790277, -0.0001104587, |
| -0.0001123515, 3.596189e-05 |
| }; |
| |
| static const float h1[64] = { |
| 3.596189e-05, 0.0001123515, |
| -0.0001104587, -0.0002790277, |
| 0.0002298438, 0.0005953563, |
| -0.0003823631, -0.00113826, |
| 0.0005308539, 0.001986177, |
| -0.0006243724, -0.003235877, |
| 0.0005743159, 0.004989147, |
| -0.0002584767, -0.007367171, |
| -0.0004857935, 0.01050689, |
| 0.001894714, -0.01459396, |
| -0.004313674, 0.01994365, |
| 0.00828756, -0.02716055, |
| -0.01485397, 0.03764973, |
| 0.026447, -0.05543245, |
| -0.05095487, 0.09779096, |
| 0.1382363, -0.4600981, |
| 0.4600981, -0.1382363, |
| -0.09779096, 0.05095487, |
| 0.05543245, -0.026447, |
| -0.03764973, 0.01485397, |
| 0.02716055, -0.00828756, |
| -0.01994365, 0.004313674, |
| 0.01459396, -0.001894714, |
| -0.01050689, 0.0004857935, |
| 0.007367171, 0.0002584767, |
| -0.004989147, -0.0005743159, |
| 0.003235877, 0.0006243724, |
| -0.001986177, -0.0005308539, |
| 0.00113826, 0.0003823631, |
| -0.0005953563, -0.0002298438, |
| 0.0002790277, 0.0001104587, |
| -0.0001123515, -3.596189e-05 |
| }; |
| #endif |
| |
| extern const spx_word16_t lpc_window[]; |
| |
| static void mix_and_saturate(spx_word32_t *x0, spx_word32_t *x1, spx_word16_t *out, int len) |
| { |
| int i; |
| for (i=0;i<len;i++) |
| { |
| spx_word32_t tmp; |
| #ifdef FIXED_POINT |
| tmp=PSHR(x0[i]-x1[i],SIG_SHIFT-1); |
| #else |
| tmp=2*(x0[i]-x1[i]); |
| #endif |
| if (tmp>32767) |
| out[i] = 32767; |
| else if (tmp<-32767) |
| out[i] = -32767; |
| else |
| out[i] = tmp; |
| } |
| } |
| |
| void *sb_encoder_init(const SpeexMode *m) |
| { |
| int i; |
| SBEncState *st; |
| const SpeexSBMode *mode; |
| |
| st = (SBEncState*)speex_alloc(sizeof(SBEncState)); |
| if (!st) |
| return NULL; |
| #if defined(VAR_ARRAYS) || defined (USE_ALLOCA) |
| st->stack = NULL; |
| #else |
| st->stack = (char*)speex_alloc_scratch(SB_ENC_STACK); |
| #endif |
| st->mode = m; |
| mode = (const SpeexSBMode*)m->mode; |
| |
| |
| st->st_low = speex_encoder_init(mode->nb_mode); |
| st->full_frame_size = 2*mode->frameSize; |
| st->frame_size = mode->frameSize; |
| st->subframeSize = mode->subframeSize; |
| st->nbSubframes = mode->frameSize/mode->subframeSize; |
| st->windowSize = st->frame_size+st->subframeSize; |
| st->lpcSize=mode->lpcSize; |
| st->bufSize=mode->bufSize; |
| |
| st->encode_submode = 1; |
| st->submodes=mode->submodes; |
| st->submodeSelect = st->submodeID=mode->defaultSubmode; |
| |
| i=9; |
| speex_encoder_ctl(st->st_low, SPEEX_SET_QUALITY, &i); |
| |
| st->lag_factor = mode->lag_factor; |
| st->lpc_floor = mode->lpc_floor; |
| st->gamma1=mode->gamma1; |
| st->gamma2=mode->gamma2; |
| st->first=1; |
| |
| st->x0d=speex_alloc((st->frame_size)*sizeof(spx_sig_t)); |
| st->x1d=speex_alloc((st->frame_size)*sizeof(spx_sig_t)); |
| st->high=speex_alloc((st->full_frame_size)*sizeof(spx_sig_t)); |
| st->y0=speex_alloc((st->full_frame_size)*sizeof(spx_sig_t)); |
| st->y1=speex_alloc((st->full_frame_size)*sizeof(spx_sig_t)); |
| |
| st->h0_mem=speex_alloc((QMF_ORDER)*sizeof(spx_word16_t)); |
| st->h1_mem=speex_alloc((QMF_ORDER)*sizeof(spx_word16_t)); |
| st->g0_mem=speex_alloc((QMF_ORDER)*sizeof(spx_word32_t)); |
| st->g1_mem=speex_alloc((QMF_ORDER)*sizeof(spx_word32_t)); |
| |
| st->excBuf=speex_alloc((st->bufSize)*sizeof(spx_sig_t)); |
| st->exc = st->excBuf + st->bufSize - st->windowSize; |
| |
| st->res=speex_alloc((st->frame_size)*sizeof(spx_sig_t)); |
| st->sw=speex_alloc((st->frame_size)*sizeof(spx_sig_t)); |
| st->window= lpc_window; |
| |
| st->lagWindow = speex_alloc((st->lpcSize+1)*sizeof(spx_word16_t)); |
| for (i=0;i<st->lpcSize+1;i++) |
| st->lagWindow[i]=16384*exp(-.5*sqr(2*M_PI*st->lag_factor*i)); |
| |
| st->autocorr = speex_alloc((st->lpcSize+1)*sizeof(spx_word16_t)); |
| st->lpc = speex_alloc(st->lpcSize*sizeof(spx_coef_t)); |
| st->bw_lpc1 = speex_alloc(st->lpcSize*sizeof(spx_coef_t)); |
| st->bw_lpc2 = speex_alloc(st->lpcSize*sizeof(spx_coef_t)); |
| st->lsp = speex_alloc(st->lpcSize*sizeof(spx_lsp_t)); |
| st->qlsp = speex_alloc(st->lpcSize*sizeof(spx_lsp_t)); |
| st->old_lsp = speex_alloc(st->lpcSize*sizeof(spx_lsp_t)); |
| st->old_qlsp = speex_alloc(st->lpcSize*sizeof(spx_lsp_t)); |
| st->interp_lsp = speex_alloc(st->lpcSize*sizeof(spx_lsp_t)); |
| st->interp_qlsp = speex_alloc(st->lpcSize*sizeof(spx_lsp_t)); |
| st->interp_lpc = speex_alloc(st->lpcSize*sizeof(spx_coef_t)); |
| st->interp_qlpc = speex_alloc(st->lpcSize*sizeof(spx_coef_t)); |
| st->pi_gain = speex_alloc((st->nbSubframes)*sizeof(spx_word32_t)); |
| st->low_innov = speex_alloc((st->frame_size)*sizeof(spx_word32_t)); |
| speex_encoder_ctl(st->st_low, SPEEX_SET_INNOVATION_SAVE, st->low_innov); |
| st->innov_save = NULL; |
| |
| st->mem_sp = speex_alloc((st->lpcSize)*sizeof(spx_mem_t)); |
| st->mem_sp2 = speex_alloc((st->lpcSize)*sizeof(spx_mem_t)); |
| st->mem_sw = speex_alloc((st->lpcSize)*sizeof(spx_mem_t)); |
| |
| st->vbr_quality = 8; |
| st->vbr_enabled = 0; |
| st->vbr_max = 0; |
| st->vad_enabled = 0; |
| st->abr_enabled = 0; |
| st->relative_quality=0; |
| |
| st->complexity=2; |
| speex_encoder_ctl(st->st_low, SPEEX_GET_SAMPLING_RATE, &st->sampling_rate); |
| st->sampling_rate*=2; |
| #ifdef ENABLE_VALGRIND |
| VALGRIND_MAKE_READABLE(st, (st->stack-(char*)st)); |
| #endif |
| return st; |
| } |
| |
| void sb_encoder_destroy(void *state) |
| { |
| SBEncState *st=(SBEncState*)state; |
| |
| speex_encoder_destroy(st->st_low); |
| #if !(defined(VAR_ARRAYS) || defined (USE_ALLOCA)) |
| speex_free_scratch(st->stack); |
| #endif |
| |
| speex_free(st->x0d); |
| speex_free(st->x1d); |
| speex_free(st->high); |
| speex_free(st->y0); |
| speex_free(st->y1); |
| |
| speex_free(st->h0_mem); |
| speex_free(st->h1_mem); |
| speex_free(st->g0_mem); |
| speex_free(st->g1_mem); |
| |
| speex_free(st->excBuf); |
| speex_free(st->res); |
| speex_free(st->sw); |
| speex_free(st->lagWindow); |
| |
| speex_free(st->autocorr); |
| speex_free(st->lpc); |
| speex_free(st->bw_lpc1); |
| speex_free(st->bw_lpc2); |
| speex_free(st->lsp); |
| speex_free(st->qlsp); |
| speex_free(st->old_lsp); |
| speex_free(st->old_qlsp); |
| speex_free(st->interp_lsp); |
| speex_free(st->interp_qlsp); |
| speex_free(st->interp_lpc); |
| speex_free(st->interp_qlpc); |
| speex_free(st->pi_gain); |
| |
| speex_free(st->mem_sp); |
| speex_free(st->mem_sp2); |
| speex_free(st->mem_sw); |
| |
| |
| speex_free(st); |
| } |
| |
| |
| int sb_encode(void *state, void *vin, SpeexBits *bits) |
| { |
| SBEncState *st; |
| int i, roots, sub; |
| char *stack; |
| VARDECL(spx_mem_t *mem); |
| VARDECL(spx_sig_t *innov); |
| VARDECL(spx_word16_t *target); |
| VARDECL(spx_word16_t *syn_resp); |
| VARDECL(spx_word32_t *low_pi_gain); |
| VARDECL(spx_word16_t *low_exc); |
| const SpeexSBMode *mode; |
| int dtx; |
| spx_word16_t *in = vin; |
| |
| st = (SBEncState*)state; |
| stack=st->stack; |
| mode = (const SpeexSBMode*)(st->mode->mode); |
| |
| { |
| VARDECL(spx_word16_t *low); |
| ALLOC(low, st->frame_size, spx_word16_t); |
| |
| /* Compute the two sub-bands by filtering with h0 and h1*/ |
| qmf_decomp(in, h0, st->x0d, st->x1d, st->full_frame_size, QMF_ORDER, st->h0_mem, stack); |
| |
| for (i=0;i<st->frame_size;i++) |
| low[i] = SATURATE(PSHR(st->x0d[i],SIG_SHIFT),32767); |
| |
| /* Encode the narrowband part*/ |
| speex_encode_native(st->st_low, low, bits); |
| |
| for (i=0;i<st->frame_size;i++) |
| st->x0d[i] = SHL(low[i],SIG_SHIFT); |
| } |
| /* High-band buffering / sync with low band */ |
| for (i=0;i<st->windowSize-st->frame_size;i++) |
| st->high[i] = st->high[st->frame_size+i]; |
| for (i=0;i<st->frame_size;i++) |
| st->high[st->windowSize-st->frame_size+i]=SATURATE(st->x1d[i],536854528); |
| |
| speex_move(st->excBuf, st->excBuf+st->frame_size, (st->bufSize-st->frame_size)*sizeof(spx_sig_t)); |
| |
| |
| ALLOC(low_pi_gain, st->nbSubframes, spx_word32_t); |
| ALLOC(low_exc, st->frame_size, spx_word16_t); |
| speex_encoder_ctl(st->st_low, SPEEX_GET_PI_GAIN, low_pi_gain); |
| speex_encoder_ctl(st->st_low, SPEEX_GET_EXC, low_exc); |
| |
| speex_encoder_ctl(st->st_low, SPEEX_GET_LOW_MODE, &dtx); |
| |
| if (dtx==0) |
| dtx=1; |
| else |
| dtx=0; |
| |
| { |
| VARDECL(spx_word16_t *w_sig); |
| ALLOC(w_sig, st->windowSize, spx_word16_t); |
| /* Window for analysis */ |
| for (i=0;i<st->windowSize;i++) |
| w_sig[i] = SHR(MULT16_16(SHR((spx_word32_t)(st->high[i]),SIG_SHIFT),st->window[i]),SIG_SHIFT); |
| |
| /* Compute auto-correlation */ |
| _spx_autocorr(w_sig, st->autocorr, st->lpcSize+1, st->windowSize); |
| } |
| st->autocorr[0] = ADD16(st->autocorr[0],MULT16_16_Q15(st->autocorr[0],st->lpc_floor)); /* Noise floor in auto-correlation domain */ |
| |
| /* Lag windowing: equivalent to filtering in the power-spectrum domain */ |
| for (i=0;i<st->lpcSize+1;i++) |
| st->autocorr[i] = MULT16_16_Q14(st->autocorr[i],st->lagWindow[i]); |
| |
| /* Levinson-Durbin */ |
| _spx_lpc(st->lpc, st->autocorr, st->lpcSize); |
| |
| /* LPC to LSPs (x-domain) transform */ |
| roots=lpc_to_lsp (st->lpc, st->lpcSize, st->lsp, 10, LSP_DELTA1, stack); |
| if (roots!=st->lpcSize) |
| { |
| roots = lpc_to_lsp (st->lpc, st->lpcSize, st->lsp, 10, LSP_DELTA2, stack); |
| if (roots!=st->lpcSize) { |
| /*If we can't find all LSP's, do some damage control and use a flat filter*/ |
| for (i=0;i<st->lpcSize;i++) |
| { |
| st->lsp[i]=LSP_SCALING*M_PI*((float)(i+1))/(st->lpcSize+1); |
| } |
| } |
| } |
| |
| /* VBR code */ |
| if ((st->vbr_enabled || st->vad_enabled) && !dtx) |
| { |
| float e_low=0, e_high=0; |
| float ratio; |
| if (st->abr_enabled) |
| { |
| float qual_change=0; |
| if (st->abr_drift2 * st->abr_drift > 0) |
| { |
| /* Only adapt if long-term and short-term drift are the same sign */ |
| qual_change = -.00001*st->abr_drift/(1+st->abr_count); |
| if (qual_change>.1) |
| qual_change=.1; |
| if (qual_change<-.1) |
| qual_change=-.1; |
| } |
| st->vbr_quality += qual_change; |
| if (st->vbr_quality>10) |
| st->vbr_quality=10; |
| if (st->vbr_quality<0) |
| st->vbr_quality=0; |
| } |
| |
| |
| /*FIXME: Are the two signals (low, high) in sync? */ |
| e_low = compute_rms(st->x0d, st->frame_size); |
| e_high = compute_rms(st->high, st->frame_size); |
| ratio = 2*log((1+e_high)/(1+e_low)); |
| |
| speex_encoder_ctl(st->st_low, SPEEX_GET_RELATIVE_QUALITY, &st->relative_quality); |
| if (ratio<-4) |
| ratio=-4; |
| if (ratio>2) |
| ratio=2; |
| /*if (ratio>-2)*/ |
| if (st->vbr_enabled) |
| { |
| int modeid; |
| modeid = mode->nb_modes-1; |
| st->relative_quality+=1.0*(ratio+2); |
| if (st->relative_quality<-1) |
| st->relative_quality=-1; |
| while (modeid) |
| { |
| int v1; |
| float thresh; |
| v1=(int)floor(st->vbr_quality); |
| if (v1==10) |
| thresh = mode->vbr_thresh[modeid][v1]; |
| else |
| thresh = (st->vbr_quality-v1) * mode->vbr_thresh[modeid][v1+1] + |
| (1+v1-st->vbr_quality) * mode->vbr_thresh[modeid][v1]; |
| if (st->relative_quality >= thresh) |
| break; |
| modeid--; |
| } |
| speex_encoder_ctl(state, SPEEX_SET_HIGH_MODE, &modeid); |
| if (st->abr_enabled) |
| { |
| int bitrate; |
| speex_encoder_ctl(state, SPEEX_GET_BITRATE, &bitrate); |
| st->abr_drift+=(bitrate-st->abr_enabled); |
| st->abr_drift2 = .95*st->abr_drift2 + .05*(bitrate-st->abr_enabled); |
| st->abr_count += 1.0; |
| } |
| |
| } else { |
| /* VAD only */ |
| int modeid; |
| if (st->relative_quality<2.0) |
| modeid=1; |
| else |
| modeid=st->submodeSelect; |
| /*speex_encoder_ctl(state, SPEEX_SET_MODE, &mode);*/ |
| st->submodeID=modeid; |
| |
| } |
| /*fprintf (stderr, "%f %f\n", ratio, low_qual);*/ |
| } |
| |
| if (st->encode_submode) |
| { |
| speex_bits_pack(bits, 1, 1); |
| if (dtx) |
| speex_bits_pack(bits, 0, SB_SUBMODE_BITS); |
| else |
| speex_bits_pack(bits, st->submodeID, SB_SUBMODE_BITS); |
| } |
| |
| /* If null mode (no transmission), just set a couple things to zero*/ |
| if (dtx || st->submodes[st->submodeID] == NULL) |
| { |
| for (i=0;i<st->frame_size;i++) |
| st->exc[i]=st->sw[i]=VERY_SMALL; |
| |
| for (i=0;i<st->lpcSize;i++) |
| st->mem_sw[i]=0; |
| st->first=1; |
| |
| /* Final signal synthesis from excitation */ |
| iir_mem2(st->exc, st->interp_qlpc, st->high, st->frame_size, st->lpcSize, st->mem_sp); |
| |
| #ifdef RESYNTH |
| /* Reconstruct the original */ |
| fir_mem_up(st->x0d, h0, st->y0, st->full_frame_size, QMF_ORDER, st->g0_mem, stack); |
| fir_mem_up(st->high, h1, st->y1, st->full_frame_size, QMF_ORDER, st->g1_mem, stack); |
| |
| for (i=0;i<st->full_frame_size;i++) |
| in[i]=SHR(st->y0[i]-st->y1[i], SIG_SHIFT-1); |
| #endif |
| |
| if (dtx) |
| return 0; |
| else |
| return 1; |
| } |
| |
| |
| /* LSP quantization */ |
| SUBMODE(lsp_quant)(st->lsp, st->qlsp, st->lpcSize, bits); |
| |
| if (st->first) |
| { |
| for (i=0;i<st->lpcSize;i++) |
| st->old_lsp[i] = st->lsp[i]; |
| for (i=0;i<st->lpcSize;i++) |
| st->old_qlsp[i] = st->qlsp[i]; |
| } |
| |
| ALLOC(mem, st->lpcSize, spx_mem_t); |
| ALLOC(syn_resp, st->subframeSize, spx_word16_t); |
| ALLOC(innov, st->subframeSize, spx_sig_t); |
| ALLOC(target, st->subframeSize, spx_word16_t); |
| |
| for (sub=0;sub<st->nbSubframes;sub++) |
| { |
| spx_sig_t *exc, *sp, *res, *sw, *innov_save=NULL; |
| spx_word16_t filter_ratio; |
| int offset; |
| spx_word32_t rl, rh; |
| spx_word16_t eh=0; |
| |
| offset = st->subframeSize*sub; |
| sp=st->high+offset; |
| exc=st->exc+offset; |
| res=st->res+offset; |
| sw=st->sw+offset; |
| /* Pointer for saving innovation */ |
| if (st->innov_save) |
| { |
| innov_save = st->innov_save+2*offset; |
| for (i=0;i<2*st->subframeSize;i++) |
| innov_save[i]=0; |
| } |
| |
| /* LSP interpolation (quantized and unquantized) */ |
| lsp_interpolate(st->old_lsp, st->lsp, st->interp_lsp, st->lpcSize, sub, st->nbSubframes); |
| lsp_interpolate(st->old_qlsp, st->qlsp, st->interp_qlsp, st->lpcSize, sub, st->nbSubframes); |
| |
| lsp_enforce_margin(st->interp_lsp, st->lpcSize, LSP_MARGIN); |
| lsp_enforce_margin(st->interp_qlsp, st->lpcSize, LSP_MARGIN); |
| |
| lsp_to_lpc(st->interp_lsp, st->interp_lpc, st->lpcSize,stack); |
| lsp_to_lpc(st->interp_qlsp, st->interp_qlpc, st->lpcSize, stack); |
| |
| bw_lpc(st->gamma1, st->interp_lpc, st->bw_lpc1, st->lpcSize); |
| bw_lpc(st->gamma2, st->interp_lpc, st->bw_lpc2, st->lpcSize); |
| |
| /* Compute mid-band (4000 Hz for wideband) response of low-band and high-band |
| filters */ |
| st->pi_gain[sub]=LPC_SCALING; |
| rh = LPC_SCALING; |
| for (i=0;i<st->lpcSize;i+=2) |
| { |
| rh += st->interp_qlpc[i+1] - st->interp_qlpc[i]; |
| st->pi_gain[sub] += st->interp_qlpc[i] + st->interp_qlpc[i+1]; |
| } |
| |
| rl = low_pi_gain[sub]; |
| #ifdef FIXED_POINT |
| filter_ratio=PDIV32_16(SHL(rl+82,2),SHR(82+rh,5)); |
| #else |
| filter_ratio=(rl+.01)/(rh+.01); |
| #endif |
| |
| /* Compute "real excitation" */ |
| fir_mem2(sp, st->interp_qlpc, exc, st->subframeSize, st->lpcSize, st->mem_sp2); |
| /* Compute energy of low-band and high-band excitation */ |
| |
| eh = compute_rms(exc, st->subframeSize); |
| |
| if (!SUBMODE(innovation_quant)) {/* 1 for spectral folding excitation, 0 for stochastic */ |
| float g; |
| spx_word16_t el; |
| el = compute_rms(st->low_innov+offset, st->subframeSize); |
| |
| /* Gain to use if we want to use the low-band excitation for high-band */ |
| g=eh/(1.+el); |
| |
| #if 0 |
| { |
| char *tmp_stack=stack; |
| float *tmp_sig; |
| float g2; |
| ALLOC(tmp_sig, st->subframeSize, spx_sig_t); |
| for (i=0;i<st->lpcSize;i++) |
| mem[i]=st->mem_sp[i]; |
| iir_mem2(st->low_innov+offset, st->interp_qlpc, tmp_sig, st->subframeSize, st->lpcSize, mem); |
| g2 = compute_rms(sp, st->subframeSize)/(.01+compute_rms(tmp_sig, st->subframeSize)); |
| /*fprintf (stderr, "gains: %f %f\n", g, g2);*/ |
| g = g2; |
| stack = tmp_stack; |
| } |
| #endif |
| |
| #ifdef FIXED_POINT |
| g *= filter_ratio/128.; |
| #else |
| g *= filter_ratio; |
| #endif |
| /*print_vec(&g, 1, "gain factor");*/ |
| /* Gain quantization */ |
| { |
| int quant = (int) floor(.5 + 10 + 8.0 * log((g+.0001))); |
| /*speex_warning_int("tata", quant);*/ |
| if (quant<0) |
| quant=0; |
| if (quant>31) |
| quant=31; |
| speex_bits_pack(bits, quant, 5); |
| } |
| |
| } else { |
| spx_word16_t gc; |
| spx_word32_t scale; |
| spx_word16_t el; |
| el = compute_rms16(low_exc+offset, st->subframeSize); |
| |
| gc = PDIV32_16(MULT16_16(filter_ratio,1+eh),1+el); |
| |
| /* This is a kludge that cleans up a historical bug */ |
| if (st->subframeSize==80) |
| gc *= 0.70711; |
| /*printf ("%f %f %f %f\n", el, eh, filter_ratio, gc);*/ |
| #ifdef FIXED_POINT |
| { |
| int qgc = scal_quant(gc, gc_quant_bound, 16); |
| speex_bits_pack(bits, qgc, 4); |
| gc = MULT16_32_Q15(28626,gc_quant_bound[qgc]); |
| } |
| #else |
| { |
| int qgc = (int)floor(.5+3.7*(log(gc)+0.15556)); |
| if (qgc<0) |
| qgc=0; |
| if (qgc>15) |
| qgc=15; |
| speex_bits_pack(bits, qgc, 4); |
| gc = exp((1/3.7)*qgc-0.15556); |
| } |
| #endif |
| if (st->subframeSize==80) |
| gc *= 1.4142; |
| |
| scale = SHL32(MULT16_16(PDIV32_16(SHL32(EXTEND32(gc),SIG_SHIFT-6),filter_ratio),(1+el)),6); |
| |
| compute_impulse_response(st->interp_qlpc, st->bw_lpc1, st->bw_lpc2, syn_resp, st->subframeSize, st->lpcSize, stack); |
| |
| |
| /* Reset excitation */ |
| for (i=0;i<st->subframeSize;i++) |
| exc[i]=VERY_SMALL; |
| |
| /* Compute zero response (ringing) of A(z/g1) / ( A(z/g2) * Aq(z) ) */ |
| for (i=0;i<st->lpcSize;i++) |
| mem[i]=st->mem_sp[i]; |
| iir_mem2(exc, st->interp_qlpc, exc, st->subframeSize, st->lpcSize, mem); |
| |
| for (i=0;i<st->lpcSize;i++) |
| mem[i]=st->mem_sw[i]; |
| filter_mem2(exc, st->bw_lpc1, st->bw_lpc2, res, st->subframeSize, st->lpcSize, mem); |
| |
| /* Compute weighted signal */ |
| for (i=0;i<st->lpcSize;i++) |
| mem[i]=st->mem_sw[i]; |
| filter_mem2(sp, st->bw_lpc1, st->bw_lpc2, sw, st->subframeSize, st->lpcSize, mem); |
| |
| /* Compute target signal */ |
| for (i=0;i<st->subframeSize;i++) |
| target[i]=PSHR32(sw[i]-res[i],SIG_SHIFT); |
| |
| for (i=0;i<st->subframeSize;i++) |
| exc[i]=0; |
| |
| signal_div(target, target, scale, st->subframeSize); |
| |
| /* Reset excitation */ |
| for (i=0;i<st->subframeSize;i++) |
| innov[i]=0; |
| |
| /*print_vec(target, st->subframeSize, "\ntarget");*/ |
| SUBMODE(innovation_quant)(target, st->interp_qlpc, st->bw_lpc1, st->bw_lpc2, |
| SUBMODE(innovation_params), st->lpcSize, st->subframeSize, |
| innov, syn_resp, bits, stack, (st->complexity+1)>>1, SUBMODE(double_codebook)); |
| /*print_vec(target, st->subframeSize, "after");*/ |
| |
| signal_mul(innov, innov, scale, st->subframeSize); |
| |
| for (i=0;i<st->subframeSize;i++) |
| exc[i] = ADD32(exc[i], innov[i]); |
| |
| if (st->innov_save) |
| { |
| for (i=0;i<st->subframeSize;i++) |
| innov_save[2*i]=innov[i]; |
| } |
| |
| if (SUBMODE(double_codebook)) { |
| char *tmp_stack=stack; |
| VARDECL(spx_sig_t *innov2); |
| ALLOC(innov2, st->subframeSize, spx_sig_t); |
| for (i=0;i<st->subframeSize;i++) |
| innov2[i]=0; |
| for (i=0;i<st->subframeSize;i++) |
| target[i]*=2.5; |
| SUBMODE(innovation_quant)(target, st->interp_qlpc, st->bw_lpc1, st->bw_lpc2, |
| SUBMODE(innovation_params), st->lpcSize, st->subframeSize, |
| innov2, syn_resp, bits, stack, (st->complexity+1)>>1, 0); |
| for (i=0;i<st->subframeSize;i++) |
| innov2[i]*=scale*(1/2.5)/SIG_SCALING; |
| for (i=0;i<st->subframeSize;i++) |
| exc[i] = ADD32(exc[i],innov2[i]); |
| stack = tmp_stack; |
| } |
| |
| } |
| |
| /*Keep the previous memory*/ |
| for (i=0;i<st->lpcSize;i++) |
| mem[i]=st->mem_sp[i]; |
| /* Final signal synthesis from excitation */ |
| iir_mem2(exc, st->interp_qlpc, sp, st->subframeSize, st->lpcSize, st->mem_sp); |
| |
| /* Compute weighted signal again, from synthesized speech (not sure it's the right thing) */ |
| filter_mem2(sp, st->bw_lpc1, st->bw_lpc2, sw, st->subframeSize, st->lpcSize, st->mem_sw); |
| } |
| |
| |
| #ifdef RESYNTH |
| /* Reconstruct the original */ |
| fir_mem_up(st->x0d, h0, st->y0, st->full_frame_size, QMF_ORDER, st->g0_mem, stack); |
| fir_mem_up(st->high, h1, st->y1, st->full_frame_size, QMF_ORDER, st->g1_mem, stack); |
| |
| for (i=0;i<st->full_frame_size;i++) |
| in[i]=SHR(st->y0[i]-st->y1[i], SIG_SHIFT-1); |
| #endif |
| for (i=0;i<st->lpcSize;i++) |
| st->old_lsp[i] = st->lsp[i]; |
| for (i=0;i<st->lpcSize;i++) |
| st->old_qlsp[i] = st->qlsp[i]; |
| |
| st->first=0; |
| |
| return 1; |
| } |
| |
| |
| |
| |
| |
| void *sb_decoder_init(const SpeexMode *m) |
| { |
| SBDecState *st; |
| const SpeexSBMode *mode; |
| st = (SBDecState*)speex_alloc(sizeof(SBDecState)); |
| if (!st) |
| return NULL; |
| #if defined(VAR_ARRAYS) || defined (USE_ALLOCA) |
| st->stack = NULL; |
| #else |
| st->stack = (char*)speex_alloc_scratch(SB_DEC_STACK); |
| #endif |
| st->mode = m; |
| mode=(const SpeexSBMode*)m->mode; |
| |
| st->encode_submode = 1; |
| |
| |
| |
| |
| st->st_low = speex_decoder_init(mode->nb_mode); |
| st->full_frame_size = 2*mode->frameSize; |
| st->frame_size = mode->frameSize; |
| st->subframeSize = mode->subframeSize; |
| st->nbSubframes = mode->frameSize/mode->subframeSize; |
| st->lpcSize=mode->lpcSize; |
| speex_decoder_ctl(st->st_low, SPEEX_GET_SAMPLING_RATE, &st->sampling_rate); |
| st->sampling_rate*=2; |
| |
| st->submodes=mode->submodes; |
| st->submodeID=mode->defaultSubmode; |
| |
| st->first=1; |
| |
| |
| st->x0d=speex_alloc((st->frame_size)*sizeof(spx_sig_t)); |
| st->x1d=speex_alloc((st->frame_size)*sizeof(spx_sig_t)); |
| st->high=speex_alloc((st->full_frame_size)*sizeof(spx_sig_t)); |
| st->y0=speex_alloc((st->full_frame_size)*sizeof(spx_sig_t)); |
| st->y1=speex_alloc((st->full_frame_size)*sizeof(spx_sig_t)); |
| |
| st->g0_mem=speex_alloc((QMF_ORDER)*sizeof(spx_word32_t)); |
| st->g1_mem=speex_alloc((QMF_ORDER)*sizeof(spx_word32_t)); |
| |
| st->exc=speex_alloc((st->frame_size)*sizeof(spx_sig_t)); |
| st->excBuf=speex_alloc((st->subframeSize)*sizeof(spx_sig_t)); |
| |
| st->qlsp = speex_alloc((st->lpcSize)*sizeof(spx_lsp_t)); |
| st->old_qlsp = speex_alloc((st->lpcSize)*sizeof(spx_lsp_t)); |
| st->interp_qlsp = speex_alloc(st->lpcSize*sizeof(spx_lsp_t)); |
| st->interp_qlpc = speex_alloc(st->lpcSize*sizeof(spx_coef_t)); |
| |
| st->pi_gain = speex_alloc((st->nbSubframes)*sizeof(spx_word32_t)); |
| st->mem_sp = speex_alloc((2*st->lpcSize)*sizeof(spx_mem_t)); |
| |
| st->low_innov = speex_alloc((st->frame_size)*sizeof(spx_word32_t)); |
| speex_decoder_ctl(st->st_low, SPEEX_SET_INNOVATION_SAVE, st->low_innov); |
| st->innov_save = NULL; |
| |
| |
| st->lpc_enh_enabled=0; |
| st->seed = 1000; |
| |
| #ifdef ENABLE_VALGRIND |
| VALGRIND_MAKE_READABLE(st, (st->stack-(char*)st)); |
| #endif |
| return st; |
| } |
| |
| void sb_decoder_destroy(void *state) |
| { |
| SBDecState *st; |
| st = (SBDecState*)state; |
| speex_decoder_destroy(st->st_low); |
| #if !(defined(VAR_ARRAYS) || defined (USE_ALLOCA)) |
| speex_free_scratch(st->stack); |
| #endif |
| |
| speex_free(st->x0d); |
| speex_free(st->x1d); |
| speex_free(st->high); |
| speex_free(st->y0); |
| speex_free(st->y1); |
| speex_free(st->g0_mem); |
| speex_free(st->g1_mem); |
| speex_free(st->exc); |
| speex_free(st->excBuf); |
| speex_free(st->qlsp); |
| speex_free(st->old_qlsp); |
| speex_free(st->interp_qlsp); |
| speex_free(st->interp_qlpc); |
| speex_free(st->pi_gain); |
| speex_free(st->mem_sp); |
| |
| speex_free(state); |
| } |
| |
| static void sb_decode_lost(SBDecState *st, spx_word16_t *out, int dtx, char *stack) |
| { |
| int i; |
| int saved_modeid=0; |
| |
| if (dtx) |
| { |
| saved_modeid=st->submodeID; |
| st->submodeID=1; |
| } else { |
| bw_lpc(GAMMA_SCALING*0.99, st->interp_qlpc, st->interp_qlpc, st->lpcSize); |
| } |
| |
| st->first=1; |
| |
| |
| /* Final signal synthesis from excitation */ |
| if (!dtx) |
| { |
| spx_word16_t low_ener; |
| low_ener = .9*compute_rms(st->exc, st->frame_size); |
| for (i=0;i<st->frame_size;i++) |
| st->exc[i] = speex_rand(low_ener, &st->seed); |
| } |
| |
| for (i=0;i<st->frame_size;i++) |
| st->high[i]=st->exc[i]; |
| |
| iir_mem2(st->high, st->interp_qlpc, st->high, st->frame_size, st->lpcSize, |
| st->mem_sp); |
| |
| |
| /* Reconstruct the original */ |
| fir_mem_up(st->x0d, h0, st->y0, st->full_frame_size, QMF_ORDER, st->g0_mem, stack); |
| fir_mem_up(st->high, h1, st->y1, st->full_frame_size, QMF_ORDER, st->g1_mem, stack); |
| |
| mix_and_saturate(st->y0, st->y1, out, st->full_frame_size); |
| |
| if (dtx) |
| { |
| st->submodeID=saved_modeid; |
| } |
| |
| return; |
| } |
| |
| int sb_decode(void *state, SpeexBits *bits, void *vout) |
| { |
| int i, sub; |
| SBDecState *st; |
| int wideband; |
| int ret; |
| char *stack; |
| VARDECL(spx_word32_t *low_pi_gain); |
| VARDECL(spx_word16_t *low_exc); |
| VARDECL(spx_coef_t *ak); |
| int dtx; |
| const SpeexSBMode *mode; |
| spx_word16_t *out = vout; |
| |
| st = (SBDecState*)state; |
| stack=st->stack; |
| mode = (const SpeexSBMode*)(st->mode->mode); |
| |
| { |
| VARDECL(spx_word16_t *low); |
| ALLOC(low, st->frame_size, spx_word16_t); |
| |
| /* Decode the low-band */ |
| ret = speex_decode_native(st->st_low, bits, low); |
| |
| for (i=0;i<st->frame_size;i++) |
| st->x0d[i] = SHL((spx_sig_t)low[i], SIG_SHIFT); |
| } |
| |
| speex_decoder_ctl(st->st_low, SPEEX_GET_DTX_STATUS, &dtx); |
| |
| /* If error decoding the narrowband part, propagate error */ |
| if (ret!=0) |
| { |
| return ret; |
| } |
| |
| if (!bits) |
| { |
| sb_decode_lost(st, out, dtx, stack); |
| return 0; |
| } |
| |
| if (st->encode_submode) |
| { |
| |
| /*Check "wideband bit"*/ |
| if (speex_bits_remaining(bits)>0) |
| wideband = speex_bits_peek(bits); |
| else |
| wideband = 0; |
| if (wideband) |
| { |
| /*Regular wideband frame, read the submode*/ |
| wideband = speex_bits_unpack_unsigned(bits, 1); |
| st->submodeID = speex_bits_unpack_unsigned(bits, SB_SUBMODE_BITS); |
| } else |
| { |
| /*Was a narrowband frame, set "null submode"*/ |
| st->submodeID = 0; |
| } |
| if (st->submodeID != 0 && st->submodes[st->submodeID] == NULL) |
| { |
| speex_warning("Invalid mode encountered: corrupted stream?"); |
| return -2; |
| } |
| } |
| |
| /* If null mode (no transmission), just set a couple things to zero*/ |
| if (st->submodes[st->submodeID] == NULL) |
| { |
| if (dtx) |
| { |
| sb_decode_lost(st, out, 1, stack); |
| return 0; |
| } |
| |
| for (i=0;i<st->frame_size;i++) |
| st->exc[i]=VERY_SMALL; |
| |
| st->first=1; |
| |
| /* Final signal synthesis from excitation */ |
| iir_mem2(st->exc, st->interp_qlpc, st->high, st->frame_size, st->lpcSize, st->mem_sp); |
| |
| fir_mem_up(st->x0d, h0, st->y0, st->full_frame_size, QMF_ORDER, st->g0_mem, stack); |
| fir_mem_up(st->high, h1, st->y1, st->full_frame_size, QMF_ORDER, st->g1_mem, stack); |
| |
| mix_and_saturate(st->y0, st->y1, out, st->full_frame_size); |
| |
| return 0; |
| |
| } |
| |
| for (i=0;i<st->frame_size;i++) |
| st->exc[i]=0; |
| |
| ALLOC(low_pi_gain, st->nbSubframes, spx_word32_t); |
| ALLOC(low_exc, st->frame_size, spx_word16_t); |
| speex_decoder_ctl(st->st_low, SPEEX_GET_PI_GAIN, low_pi_gain); |
| speex_decoder_ctl(st->st_low, SPEEX_GET_EXC, low_exc); |
| |
| SUBMODE(lsp_unquant)(st->qlsp, st->lpcSize, bits); |
| |
| if (st->first) |
| { |
| for (i=0;i<st->lpcSize;i++) |
| st->old_qlsp[i] = st->qlsp[i]; |
| } |
| |
| ALLOC(ak, st->lpcSize, spx_coef_t); |
| |
| for (sub=0;sub<st->nbSubframes;sub++) |
| { |
| spx_sig_t *exc, *sp, *innov_save=NULL; |
| spx_word16_t filter_ratio; |
| spx_word16_t el=0; |
| int offset; |
| spx_word32_t rl=0,rh=0; |
| |
| offset = st->subframeSize*sub; |
| sp=st->high+offset; |
| exc=st->exc+offset; |
| /* Pointer for saving innovation */ |
| if (st->innov_save) |
| { |
| innov_save = st->innov_save+2*offset; |
| for (i=0;i<2*st->subframeSize;i++) |
| innov_save[i]=0; |
| } |
| |
| /* LSP interpolation */ |
| lsp_interpolate(st->old_qlsp, st->qlsp, st->interp_qlsp, st->lpcSize, sub, st->nbSubframes); |
| |
| lsp_enforce_margin(st->interp_qlsp, st->lpcSize, LSP_MARGIN); |
| |
| /* LSP to LPC */ |
| lsp_to_lpc(st->interp_qlsp, ak, st->lpcSize, stack); |
| |
| /* Calculate reponse ratio between the low and high filter in the middle |
| of the band (4000 Hz) */ |
| |
| st->pi_gain[sub]=LPC_SCALING; |
| rh = LPC_SCALING; |
| for (i=0;i<st->lpcSize;i+=2) |
| { |
| rh += st->interp_qlpc[i+1] - st->interp_qlpc[i]; |
| st->pi_gain[sub] += st->interp_qlpc[i] + st->interp_qlpc[i+1]; |
| } |
| |
| rl = low_pi_gain[sub]; |
| #ifdef FIXED_POINT |
| filter_ratio=PDIV32_16(SHL(rl+82,2),SHR(82+rh,5)); |
| #else |
| filter_ratio=(rl+.01)/(rh+.01); |
| #endif |
| |
| for (i=0;i<st->subframeSize;i++) |
| exc[i]=0; |
| if (!SUBMODE(innovation_unquant)) |
| { |
| float g; |
| int quant; |
| |
| quant = speex_bits_unpack_unsigned(bits, 5); |
| g= exp(((float)quant-10)/8.0); |
| |
| #ifdef FIXED_POINT |
| g /= filter_ratio/128.; |
| #else |
| g /= filter_ratio; |
| #endif |
| /* High-band excitation using the low-band excitation and a gain */ |
| |
| #if 0 |
| for (i=0;i<st->subframeSize;i++) |
| exc[i]=mode->folding_gain*g*st->low_innov[offset+i]; |
| #else |
| { |
| float tmp=1; |
| /*static tmp1=0,tmp2=0; |
| static int seed=1; |
| el = compute_rms(low_innov+offset, st->subframeSize);*/ |
| for (i=0;i<st->subframeSize;i++) |
| { |
| float e=tmp*g*mode->folding_gain*st->low_innov[offset+i]; |
| tmp *= -1; |
| exc[i] = e; |
| /*float r = speex_rand(g*el,&seed); |
| exc[i] = .5*(r+tmp2 + e-tmp1); |
| tmp1 = e; |
| tmp2 = r;*/ |
| } |
| |
| } |
| |
| #endif |
| } else { |
| spx_word16_t gc; |
| spx_word32_t scale; |
| int qgc = speex_bits_unpack_unsigned(bits, 4); |
| |
| el = compute_rms16(low_exc+offset, st->subframeSize); |
| |
| #ifdef FIXED_POINT |
| gc = MULT16_32_Q15(28626,gc_quant_bound[qgc]); |
| #else |
| gc = exp((1/3.7)*qgc-0.15556); |
| #endif |
| |
| if (st->subframeSize==80) |
| gc *= 1.4142; |
| |
| scale = SHL(MULT16_16(PDIV32_16(SHL(gc,SIG_SHIFT-6),filter_ratio),(1+el)),6); |
| |
| SUBMODE(innovation_unquant)(exc, SUBMODE(innovation_params), st->subframeSize, |
| bits, stack); |
| |
| signal_mul(exc,exc,scale,st->subframeSize); |
| |
| if (SUBMODE(double_codebook)) { |
| char *tmp_stack=stack; |
| VARDECL(spx_sig_t *innov2); |
| ALLOC(innov2, st->subframeSize, spx_sig_t); |
| for (i=0;i<st->subframeSize;i++) |
| innov2[i]=0; |
| SUBMODE(innovation_unquant)(innov2, SUBMODE(innovation_params), st->subframeSize, |
| bits, stack); |
| for (i=0;i<st->subframeSize;i++) |
| innov2[i]*=scale/(float)SIG_SCALING*(1/2.5); |
| for (i=0;i<st->subframeSize;i++) |
| exc[i] = ADD32(exc[i],innov2[i]); |
| stack = tmp_stack; |
| } |
| |
| } |
| |
| if (st->innov_save) |
| { |
| for (i=0;i<st->subframeSize;i++) |
| innov_save[2*i]=exc[i]; |
| } |
| |
| for (i=0;i<st->subframeSize;i++) |
| sp[i]=st->excBuf[i]; |
| iir_mem2(sp, st->interp_qlpc, sp, st->subframeSize, st->lpcSize, |
| st->mem_sp); |
| for (i=0;i<st->subframeSize;i++) |
| st->excBuf[i]=exc[i]; |
| for (i=0;i<st->lpcSize;i++) |
| st->interp_qlpc[i] = ak[i]; |
| |
| } |
| |
| fir_mem_up(st->x0d, h0, st->y0, st->full_frame_size, QMF_ORDER, st->g0_mem, stack); |
| fir_mem_up(st->high, h1, st->y1, st->full_frame_size, QMF_ORDER, st->g1_mem, stack); |
| |
| mix_and_saturate(st->y0, st->y1, out, st->full_frame_size); |
| |
| for (i=0;i<st->lpcSize;i++) |
| st->old_qlsp[i] = st->qlsp[i]; |
| |
| st->first=0; |
| |
| return 0; |
| } |
| |
| |
| int sb_encoder_ctl(void *state, int request, void *ptr) |
| { |
| SBEncState *st; |
| st=(SBEncState*)state; |
| switch(request) |
| { |
| case SPEEX_GET_FRAME_SIZE: |
| (*(int*)ptr) = st->full_frame_size; |
| break; |
| case SPEEX_SET_HIGH_MODE: |
| st->submodeSelect = st->submodeID = (*(int*)ptr); |
| break; |
| case SPEEX_SET_LOW_MODE: |
| speex_encoder_ctl(st->st_low, SPEEX_SET_LOW_MODE, ptr); |
| break; |
| case SPEEX_SET_DTX: |
| speex_encoder_ctl(st->st_low, SPEEX_SET_DTX, ptr); |
| break; |
| case SPEEX_GET_DTX: |
| speex_encoder_ctl(st->st_low, SPEEX_GET_DTX, ptr); |
| break; |
| case SPEEX_GET_LOW_MODE: |
| speex_encoder_ctl(st->st_low, SPEEX_GET_LOW_MODE, ptr); |
| break; |
| case SPEEX_SET_MODE: |
| speex_encoder_ctl(st, SPEEX_SET_QUALITY, ptr); |
| break; |
| case SPEEX_SET_VBR: |
| st->vbr_enabled = (*(int*)ptr); |
| speex_encoder_ctl(st->st_low, SPEEX_SET_VBR, ptr); |
| break; |
| case SPEEX_GET_VBR: |
| (*(int*)ptr) = st->vbr_enabled; |
| break; |
| case SPEEX_SET_VAD: |
| st->vad_enabled = (*(int*)ptr); |
| speex_encoder_ctl(st->st_low, SPEEX_SET_VAD, ptr); |
| break; |
| case SPEEX_GET_VAD: |
| (*(int*)ptr) = st->vad_enabled; |
| break; |
| case SPEEX_SET_VBR_QUALITY: |
| { |
| int q; |
| float qual = (*(float*)ptr)+.6; |
| st->vbr_quality = (*(float*)ptr); |
| if (qual>10) |
| qual=10; |
| q=(int)floor(.5+*(float*)ptr); |
| if (q>10) |
| q=10; |
| speex_encoder_ctl(st->st_low, SPEEX_SET_VBR_QUALITY, &qual); |
| speex_encoder_ctl(state, SPEEX_SET_QUALITY, &q); |
| break; |
| } |
| case SPEEX_GET_VBR_QUALITY: |
| (*(float*)ptr) = st->vbr_quality; |
| break; |
| case SPEEX_SET_ABR: |
| st->abr_enabled = (*(spx_int32_t*)ptr); |
| st->vbr_enabled = st->abr_enabled!=0; |
| speex_encoder_ctl(st->st_low, SPEEX_SET_VBR, &st->vbr_enabled); |
| if (st->vbr_enabled) |
| { |
| int i=10, rate, target; |
| float vbr_qual; |
| target = (*(spx_int32_t*)ptr); |
| while (i>=0) |
| { |
| speex_encoder_ctl(st, SPEEX_SET_QUALITY, &i); |
| speex_encoder_ctl(st, SPEEX_GET_BITRATE, &rate); |
| if (rate <= target) |
| break; |
| i--; |
| } |
| vbr_qual=i; |
| if (vbr_qual<0) |
| vbr_qual=0; |
| speex_encoder_ctl(st, SPEEX_SET_VBR_QUALITY, &vbr_qual); |
| st->abr_count=0; |
| st->abr_drift=0; |
| st->abr_drift2=0; |
| } |
| |
| break; |
| case SPEEX_GET_ABR: |
| (*(spx_int32_t*)ptr) = st->abr_enabled; |
| break; |
| case SPEEX_SET_QUALITY: |
| { |
| int nb_qual; |
| int quality = (*(int*)ptr); |
| if (quality < 0) |
| quality = 0; |
| if (quality > 10) |
| quality = 10; |
| st->submodeSelect = st->submodeID = ((const SpeexSBMode*)(st->mode->mode))->quality_map[quality]; |
| nb_qual = ((const SpeexSBMode*)(st->mode->mode))->low_quality_map[quality]; |
| speex_encoder_ctl(st->st_low, SPEEX_SET_MODE, &nb_qual); |
| } |
| break; |
| case SPEEX_SET_COMPLEXITY: |
| speex_encoder_ctl(st->st_low, SPEEX_SET_COMPLEXITY, ptr); |
| st->complexity = (*(int*)ptr); |
| if (st->complexity<1) |
| st->complexity=1; |
| break; |
| case SPEEX_GET_COMPLEXITY: |
| (*(int*)ptr) = st->complexity; |
| break; |
| case SPEEX_SET_BITRATE: |
| { |
| int i=10; |
| spx_int32_t rate, target; |
| target = (*(spx_int32_t*)ptr); |
| while (i>=0) |
| { |
| speex_encoder_ctl(st, SPEEX_SET_QUALITY, &i); |
| speex_encoder_ctl(st, SPEEX_GET_BITRATE, &rate); |
| if (rate <= target) |
| break; |
| i--; |
| } |
| } |
| break; |
| case SPEEX_GET_BITRATE: |
| speex_encoder_ctl(st->st_low, request, ptr); |
| /*fprintf (stderr, "before: %d\n", (*(int*)ptr));*/ |
| if (st->submodes[st->submodeID]) |
| (*(spx_int32_t*)ptr) += st->sampling_rate*SUBMODE(bits_per_frame)/st->full_frame_size; |
| else |
| (*(spx_int32_t*)ptr) += st->sampling_rate*(SB_SUBMODE_BITS+1)/st->full_frame_size; |
| /*fprintf (stderr, "after: %d\n", (*(int*)ptr));*/ |
| break; |
| case SPEEX_SET_SAMPLING_RATE: |
| { |
| spx_int32_t tmp=(*(spx_int32_t*)ptr); |
| st->sampling_rate = tmp; |
| tmp>>=1; |
| speex_encoder_ctl(st->st_low, SPEEX_SET_SAMPLING_RATE, &tmp); |
| } |
| break; |
| case SPEEX_GET_SAMPLING_RATE: |
| (*(spx_int32_t*)ptr)=st->sampling_rate; |
| break; |
| case SPEEX_RESET_STATE: |
| { |
| int i; |
| st->first = 1; |
| for (i=0;i<st->lpcSize;i++) |
| st->lsp[i]=(M_PI*((float)(i+1)))/(st->lpcSize+1); |
| for (i=0;i<st->lpcSize;i++) |
| st->mem_sw[i]=st->mem_sp[i]=st->mem_sp2[i]=0; |
| for (i=0;i<st->bufSize;i++) |
| st->excBuf[i]=0; |
| for (i=0;i<QMF_ORDER;i++) |
| st->h0_mem[i]=st->h1_mem[i]=st->g0_mem[i]=st->g1_mem[i]=0; |
| } |
| break; |
| case SPEEX_SET_SUBMODE_ENCODING: |
| st->encode_submode = (*(int*)ptr); |
| speex_encoder_ctl(st->st_low, SPEEX_SET_SUBMODE_ENCODING, &ptr); |
| break; |
| case SPEEX_GET_SUBMODE_ENCODING: |
| (*(int*)ptr) = st->encode_submode; |
| break; |
| case SPEEX_GET_LOOKAHEAD: |
| speex_encoder_ctl(st->st_low, SPEEX_GET_LOOKAHEAD, ptr); |
| (*(int*)ptr) = 2*(*(int*)ptr) + QMF_ORDER - 1; |
| break; |
| case SPEEX_SET_PLC_TUNING: |
| speex_encoder_ctl(st->st_low, SPEEX_SET_PLC_TUNING, ptr); |
| break; |
| case SPEEX_GET_PLC_TUNING: |
| speex_encoder_ctl(st->st_low, SPEEX_GET_PLC_TUNING, ptr); |
| break; |
| case SPEEX_SET_VBR_MAX_BITRATE: |
| { |
| int high_mode; |
| spx_int32_t high_rate; |
| st->vbr_max = (*(spx_int32_t*)ptr); |
| if (SPEEX_SET_VBR_MAX_BITRATE<1) |
| speex_encoder_ctl(st->st_low, SPEEX_SET_VBR_MAX_BITRATE, &st->vbr_max); |
| else { |
| if (st->vbr_max > 42200) |
| { |
| high_mode = 4; |
| } else if (st->vbr_max > 27800) |
| { |
| high_mode = 3; |
| } else if (st->vbr_max > 20600) |
| { |
| high_mode = 2; |
| } else high_mode = 1; |
| high_rate = st->sampling_rate*st->submodes[high_mode]->bits_per_frame/st->full_frame_size; |
| high_rate = st->vbr_max - high_rate; |
| speex_encoder_ctl(st->st_low, SPEEX_SET_VBR_MAX_BITRATE, &high_rate); |
| } |
| } |
| break; |
| case SPEEX_GET_VBR_MAX_BITRATE: |
| (*(spx_int32_t*)ptr) = st->vbr_max; |
| break; |
| |
| |
| /* This is all internal stuff past this point */ |
| case SPEEX_GET_PI_GAIN: |
| { |
| int i; |
| spx_word32_t *g = (spx_word32_t*)ptr; |
| for (i=0;i<st->nbSubframes;i++) |
| g[i]=st->pi_gain[i]; |
| } |
| break; |
| case SPEEX_GET_EXC: |
| { |
| int i; |
| spx_sig_t *e = (spx_sig_t*)ptr; |
| for (i=0;i<st->full_frame_size;i++) |
| e[i]=0; |
| for (i=0;i<st->frame_size;i++) |
| e[2*i]=2*st->exc[i]; |
| } |
| break; |
| case SPEEX_GET_INNOV: |
| { |
| int i; |
| spx_sig_t *e = (spx_sig_t*)ptr; |
| for (i=0;i<st->full_frame_size;i++) |
| e[i]=0; |
| for (i=0;i<st->frame_size;i++) |
| e[2*i]=2*st->exc[i]; |
| } |
| break; |
| case SPEEX_GET_RELATIVE_QUALITY: |
| (*(float*)ptr)=st->relative_quality; |
| break; |
| case SPEEX_SET_INNOVATION_SAVE: |
| st->innov_save = ptr; |
| break; |
| default: |
| speex_warning_int("Unknown nb_ctl request: ", request); |
| return -1; |
| } |
| return 0; |
| } |
| |
| int sb_decoder_ctl(void *state, int request, void *ptr) |
| { |
| SBDecState *st; |
| st=(SBDecState*)state; |
| switch(request) |
| { |
| case SPEEX_SET_HIGH_MODE: |
| st->submodeID = (*(int*)ptr); |
| break; |
| case SPEEX_SET_LOW_MODE: |
| speex_decoder_ctl(st->st_low, SPEEX_SET_LOW_MODE, ptr); |
| break; |
| case SPEEX_GET_LOW_MODE: |
| speex_decoder_ctl(st->st_low, SPEEX_GET_LOW_MODE, ptr); |
| break; |
| case SPEEX_GET_FRAME_SIZE: |
| (*(int*)ptr) = st->full_frame_size; |
| break; |
| case SPEEX_SET_ENH: |
| speex_decoder_ctl(st->st_low, request, ptr); |
| st->lpc_enh_enabled = *((int*)ptr); |
| break; |
| case SPEEX_GET_ENH: |
| *((int*)ptr) = st->lpc_enh_enabled; |
| break; |
| case SPEEX_SET_MODE: |
| case SPEEX_SET_QUALITY: |
| { |
| int nb_qual; |
| int quality = (*(int*)ptr); |
| if (quality < 0) |
| quality = 0; |
| if (quality > 10) |
| quality = 10; |
| st->submodeID = ((const SpeexSBMode*)(st->mode->mode))->quality_map[quality]; |
| nb_qual = ((const SpeexSBMode*)(st->mode->mode))->low_quality_map[quality]; |
| speex_decoder_ctl(st->st_low, SPEEX_SET_MODE, &nb_qual); |
| } |
| break; |
| case SPEEX_GET_BITRATE: |
| speex_decoder_ctl(st->st_low, request, ptr); |
| if (st->submodes[st->submodeID]) |
| (*(spx_int32_t*)ptr) += st->sampling_rate*SUBMODE(bits_per_frame)/st->full_frame_size; |
| else |
| (*(spx_int32_t*)ptr) += st->sampling_rate*(SB_SUBMODE_BITS+1)/st->full_frame_size; |
| break; |
| case SPEEX_SET_SAMPLING_RATE: |
| { |
| spx_int32_t tmp=(*(spx_int32_t*)ptr); |
| st->sampling_rate = tmp; |
| tmp>>=1; |
| speex_decoder_ctl(st->st_low, SPEEX_SET_SAMPLING_RATE, &tmp); |
| } |
| break; |
| case SPEEX_GET_SAMPLING_RATE: |
| (*(spx_int32_t*)ptr)=st->sampling_rate; |
| break; |
| case SPEEX_SET_HANDLER: |
| speex_decoder_ctl(st->st_low, SPEEX_SET_HANDLER, ptr); |
| break; |
| case SPEEX_SET_USER_HANDLER: |
| speex_decoder_ctl(st->st_low, SPEEX_SET_USER_HANDLER, ptr); |
| break; |
| case SPEEX_RESET_STATE: |
| { |
| int i; |
| for (i=0;i<2*st->lpcSize;i++) |
| st->mem_sp[i]=0; |
| for (i=0;i<QMF_ORDER;i++) |
| st->g0_mem[i]=st->g1_mem[i]=0; |
| } |
| break; |
| case SPEEX_SET_SUBMODE_ENCODING: |
| st->encode_submode = (*(int*)ptr); |
| speex_decoder_ctl(st->st_low, SPEEX_SET_SUBMODE_ENCODING, &ptr); |
| break; |
| case SPEEX_GET_SUBMODE_ENCODING: |
| (*(int*)ptr) = st->encode_submode; |
| break; |
| case SPEEX_GET_LOOKAHEAD: |
| speex_decoder_ctl(st->st_low, SPEEX_GET_LOOKAHEAD, ptr); |
| (*(int*)ptr) = 2*(*(int*)ptr); |
| break; |
| case SPEEX_GET_PI_GAIN: |
| { |
| int i; |
| spx_word32_t *g = (spx_word32_t*)ptr; |
| for (i=0;i<st->nbSubframes;i++) |
| g[i]=st->pi_gain[i]; |
| } |
| break; |
| case SPEEX_GET_EXC: |
| { |
| int i; |
| spx_sig_t *e = (spx_sig_t*)ptr; |
| for (i=0;i<st->full_frame_size;i++) |
| e[i]=0; |
| for (i=0;i<st->frame_size;i++) |
| e[2*i]=2*st->exc[i]; |
| } |
| break; |
| case SPEEX_GET_INNOV: |
| { |
| int i; |
| spx_sig_t *e = (spx_sig_t*)ptr; |
| for (i=0;i<st->full_frame_size;i++) |
| e[i]=0; |
| for (i=0;i<st->frame_size;i++) |
| e[2*i]=2*st->exc[i]; |
| } |
| break; |
| case SPEEX_GET_DTX_STATUS: |
| speex_decoder_ctl(st->st_low, SPEEX_GET_DTX_STATUS, ptr); |
| break; |
| case SPEEX_SET_INNOVATION_SAVE: |
| st->innov_save = ptr; |
| break; |
| default: |
| speex_warning_int("Unknown nb_ctl request: ", request); |
| return -1; |
| } |
| return 0; |
| } |
| |
| #endif |
| |