12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
71278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440144114421443 |
- /* Copyright (C) 2002-2006 Jean-Marc Valin
- File: sb_celp.c
- Redistribution and use in source and binary forms, with or without
- modification, are permitted provided that the following conditions
- are met:
- - Redistributions of source code must retain the above copyright
- notice, this list of conditions and the following disclaimer.
- - Redistributions in binary form must reproduce the above copyright
- notice, this list of conditions and the following disclaimer in the
- documentation and/or other materials provided with the distribution.
- - Neither the name of the Xiph.org Foundation nor the names of its
- contributors may be used to endorse or promote products derived from
- this software without specific prior written permission.
- THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
- ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
- LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
- A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE FOUNDATION OR
- CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
- EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
- PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
- PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
- LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
- NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
- SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
- */
- #ifdef HAVE_CONFIG_H
- #include "config.h"
- #endif
- #include <math.h>
- #include "sb_celp.h"
- #include "filters.h"
- #include "lpc.h"
- #include "lsp.h"
- #include "stack_alloc.h"
- #include "cb_search.h"
- #include "quant_lsp.h"
- #include "vq.h"
- #include "ltp.h"
- #include "arch.h"
- #include "math_approx.h"
- #include "os_support.h"
- #ifndef NULL
- #define NULL 0
- #endif
- /* Default size for the encoder and decoder stack (can be changed at compile time).
- This does not apply when using variable-size arrays or alloca. */
/* NOTE(review): in the part of the file reviewed, SB_ENC_STACK and SB_DEC_STACK
   are referenced only from commented-out scratch allocations; the working stack
   is obtained from the low-band codec via SPEEX_GET_STACK instead. */
- #ifndef SB_ENC_STACK
- #define SB_ENC_STACK (10000*sizeof(spx_sig_t))
- #endif
- #ifndef SB_DEC_STACK
- #define SB_DEC_STACK (6000*sizeof(spx_sig_t))
- #endif
- #ifndef DISABLE_WIDEBAND
/* Shorthand for field x of the currently selected high-band submode.
   It expands against a variable literally named `st`, so it can only be used
   where such a state pointer is in scope. The selected st->submodes[] entry may
   be NULL; the users in this file test for that before applying the macro. */
- #define SUBMODE(x) st->submodes[st->submodeID]->x
- #ifdef FIXED_POINT
/* Decision boundaries handed to scal_quant() for the 4-bit high-band gain
   index written by sb_encode() (16 entries). The fixed-point values match the
   floating-point table below multiplied by 128, consistent with the Q7 note on
   the quantised gain variable. */
- static const spx_word16_t gc_quant_bound[16] = {125, 164, 215, 282, 370, 484, 635, 832, 1090, 1428, 1871, 2452, 3213, 4210, 5516, 7228};
/* Decision boundaries handed to scal_quant() for the 5-bit gain index used when
   the submode has no innovation quantiser (32 entries); same x128 relationship
   to the floating-point table. */
- static const spx_word16_t fold_quant_bound[32] = {
- 39, 44, 50, 57, 64, 73, 83, 94,
- 106, 120, 136, 154, 175, 198, 225, 255,
- 288, 327, 370, 420, 476, 539, 611, 692,
- 784, 889, 1007, 1141, 1293, 1465, 1660, 1881};
/* LSP_MARGIN is the last argument of lsp_interpolate(); LSP_DELTA1 is the step
   argument of the first lpc_to_lsp() attempt and LSP_DELTA2 the smaller one
   used for the retry. */
- #define LSP_MARGIN 410
- #define LSP_DELTA1 6553
- #define LSP_DELTA2 1638
- #else
/* Floating-point build: same three groups of constants as above. */
- static const spx_word16_t gc_quant_bound[16] = {
- 0.97979, 1.28384, 1.68223, 2.20426, 2.88829, 3.78458, 4.95900, 6.49787,
- 8.51428, 11.15642, 14.61846, 19.15484, 25.09895, 32.88761, 43.09325, 56.46588};
- static const spx_word16_t fold_quant_bound[32] = {
- 0.30498, 0.34559, 0.39161, 0.44375, 0.50283, 0.56979, 0.64565, 0.73162,
- 0.82903, 0.93942, 1.06450, 1.20624, 1.36685, 1.54884, 1.75506, 1.98875,
- 2.25355, 2.55360, 2.89361, 3.27889, 3.71547, 4.21018, 4.77076, 5.40598,
- 6.12577, 6.94141, 7.86565, 8.91295, 10.09969, 11.44445, 12.96826, 14.69497};
- #define LSP_MARGIN .05
- #define LSP_DELTA1 .2
- #define LSP_DELTA2 .05
- #endif
/* Number of taps in the QMF prototype filter h0; also the length of the
   per-state filter memories allocated with it (h0_mem, g0_mem, g1_mem). */
- #define QMF_ORDER 64
/* QMF prototype filter passed to qmf_decomp() to split the input into the low
   and high sub-bands. The 64 coefficients are symmetric about the centre
   (h0[i] == h0[63-i]). The fixed-point table matches the floating-point one
   multiplied by 65536 and rounded. */
- #ifdef FIXED_POINT
- static const spx_word16_t h0[64] = {2, -7, -7, 18, 15, -39, -25, 75, 35, -130, -41, 212, 38, -327, -17, 483, -32, -689, 124, 956, -283, -1307, 543, 1780, -973, -2467, 1733, 3633, -3339, -6409, 9059, 30153, 30153, 9059, -6409, -3339, 3633, 1733, -2467, -973, 1780, 543, -1307, -283, 956, 124, -689, -32, 483, -17, -327, 38, 212, -41, -130, 35, 75, -25, -39, 15, 18, -7, -7, 2};
- #else
- static const float h0[64] = {
- 3.596189e-05f, -0.0001123515f,
- -0.0001104587f, 0.0002790277f,
- 0.0002298438f, -0.0005953563f,
- -0.0003823631f, 0.00113826f,
- 0.0005308539f, -0.001986177f,
- -0.0006243724f, 0.003235877f,
- 0.0005743159f, -0.004989147f,
- -0.0002584767f, 0.007367171f,
- -0.0004857935f, -0.01050689f,
- 0.001894714f, 0.01459396f,
- -0.004313674f, -0.01994365f,
- 0.00828756f, 0.02716055f,
- -0.01485397f, -0.03764973f,
- 0.026447f, 0.05543245f,
- -0.05095487f, -0.09779096f,
- 0.1382363f, 0.4600981f,
- 0.4600981f, 0.1382363f,
- -0.09779096f, -0.05095487f,
- 0.05543245f, 0.026447f,
- -0.03764973f, -0.01485397f,
- 0.02716055f, 0.00828756f,
- -0.01994365f, -0.004313674f,
- 0.01459396f, 0.001894714f,
- -0.01050689f, -0.0004857935f,
- 0.007367171f, -0.0002584767f,
- -0.004989147f, 0.0005743159f,
- 0.003235877f, -0.0006243724f,
- -0.001986177f, 0.0005308539f,
- 0.00113826f, -0.0003823631f,
- -0.0005953563f, 0.0002298438f,
- 0.0002790277f, -0.0001104587f,
- -0.0001123515f, 3.596189e-05f
- };
- #endif
/* Window tables defined in another translation unit. sb_encoder_init() stores
   them in the encoder state (st->lagWindow and st->window); sb_encode() applies
   st->window to the high-band signal and st->lagWindow to its autocorrelation. */
- extern const spx_word16_t lag_window[];
- extern const spx_word16_t lpc_window[];
- #ifndef DISABLE_ENCODER
- void *sb_encoder_init(const SpeexMode *m)
- {
- int i;
- spx_int32_t tmp;
- SBEncState *st;
- const SpeexSBMode *mode;
- st = (SBEncState*)speex_alloc(sizeof(SBEncState));
- if (!st)
- return NULL;
- st->mode = m;
- mode = (const SpeexSBMode*)m->mode;
- st->st_low = speex_encoder_init(mode->nb_mode);
- #if defined(VAR_ARRAYS) || defined (USE_ALLOCA)
- st->stack = NULL;
- #else
- /*st->stack = (char*)speex_alloc_scratch(SB_ENC_STACK);*/
- speex_encoder_ctl(st->st_low, SPEEX_GET_STACK, &st->stack);
- #endif
- st->full_frame_size = 2*mode->frameSize;
- st->frame_size = mode->frameSize;
- st->subframeSize = mode->subframeSize;
- st->nbSubframes = mode->frameSize/mode->subframeSize;
- st->windowSize = st->frame_size+st->subframeSize;
- st->lpcSize=mode->lpcSize;
- st->encode_submode = 1;
- st->submodes=mode->submodes;
- st->submodeSelect = st->submodeID=mode->defaultSubmode;
- tmp=9;
- speex_encoder_ctl(st->st_low, SPEEX_SET_QUALITY, &tmp);
- tmp=1;
- speex_encoder_ctl(st->st_low, SPEEX_SET_WIDEBAND, &tmp);
- st->lpc_floor = mode->lpc_floor;
- st->gamma1=mode->gamma1;
- st->gamma2=mode->gamma2;
- st->first=1;
- st->high=(spx_word16_t*)speex_alloc((st->windowSize-st->frame_size)*sizeof(spx_word16_t));
- st->h0_mem=(spx_word16_t*)speex_alloc((QMF_ORDER)*sizeof(spx_word16_t));
- st->window= lpc_window;
- st->lagWindow = lag_window;
- st->old_lsp = (spx_lsp_t*)speex_alloc(st->lpcSize*sizeof(spx_lsp_t));
- st->old_qlsp = (spx_lsp_t*)speex_alloc(st->lpcSize*sizeof(spx_lsp_t));
- st->interp_qlpc = (spx_coef_t*)speex_alloc(st->lpcSize*sizeof(spx_coef_t));
- st->pi_gain = (spx_word32_t*)speex_alloc((st->nbSubframes)*sizeof(spx_word32_t));
- st->exc_rms = (spx_word16_t*)speex_alloc((st->nbSubframes)*sizeof(spx_word16_t));
- st->innov_rms_save = NULL;
- st->mem_sp = (spx_mem_t*)speex_alloc((st->lpcSize)*sizeof(spx_mem_t));
- st->mem_sp2 = (spx_mem_t*)speex_alloc((st->lpcSize)*sizeof(spx_mem_t));
- st->mem_sw = (spx_mem_t*)speex_alloc((st->lpcSize)*sizeof(spx_mem_t));
- for (i=0;i<st->lpcSize;i++)
- st->old_lsp[i]= DIV32(MULT16_16(QCONST16(3.1415927f, LSP_SHIFT), i+1), st->lpcSize+1);
- #ifndef DISABLE_VBR
- st->vbr_quality = 8;
- st->vbr_enabled = 0;
- st->vbr_max = 0;
- st->vbr_max_high = 20000; /* We just need a big value here */
- st->vad_enabled = 0;
- st->abr_enabled = 0;
- st->relative_quality=0;
- #endif /* #ifndef DISABLE_VBR */
- st->complexity=2;
- speex_encoder_ctl(st->st_low, SPEEX_GET_SAMPLING_RATE, &st->sampling_rate);
- st->sampling_rate*=2;
- #ifdef ENABLE_VALGRIND
- VALGRIND_MAKE_MEM_DEFINED(st, (st->stack-(char*)st));
- #endif
- return st;
- }
- void sb_encoder_destroy(void *state)
- {
- SBEncState *st=(SBEncState*)state;
- speex_encoder_destroy(st->st_low);
- #if !(defined(VAR_ARRAYS) || defined (USE_ALLOCA))
- /*speex_free_scratch(st->stack);*/
- #endif
- speex_free(st->high);
- speex_free(st->h0_mem);
- speex_free(st->old_lsp);
- speex_free(st->old_qlsp);
- speex_free(st->interp_qlpc);
- speex_free(st->pi_gain);
- speex_free(st->exc_rms);
- speex_free(st->mem_sp);
- speex_free(st->mem_sp2);
- speex_free(st->mem_sw);
- speex_free(st);
- }
- int sb_encoder_ctl(void *state, int request, void *ptr)
- {
- SBEncState *st;
- st=(SBEncState*)state;
- switch(request)
- {
- case SPEEX_GET_FRAME_SIZE:
- (*(spx_int32_t*)ptr) = st->full_frame_size;
- break;
- case SPEEX_SET_HIGH_MODE:
- st->submodeSelect = st->submodeID = (*(spx_int32_t*)ptr);
- break;
- case SPEEX_SET_LOW_MODE:
- speex_encoder_ctl(st->st_low, SPEEX_SET_LOW_MODE, ptr);
- break;
- case SPEEX_SET_DTX:
- speex_encoder_ctl(st->st_low, SPEEX_SET_DTX, ptr);
- break;
- case SPEEX_GET_DTX:
- speex_encoder_ctl(st->st_low, SPEEX_GET_DTX, ptr);
- break;
- case SPEEX_GET_LOW_MODE:
- speex_encoder_ctl(st->st_low, SPEEX_GET_LOW_MODE, ptr);
- break;
- case SPEEX_SET_MODE:
- speex_encoder_ctl(st, SPEEX_SET_QUALITY, ptr);
- break;
- #ifndef DISABLE_VBR
- case SPEEX_SET_VBR:
- st->vbr_enabled = (*(spx_int32_t*)ptr);
- speex_encoder_ctl(st->st_low, SPEEX_SET_VBR, ptr);
- break;
- case SPEEX_GET_VBR:
- (*(spx_int32_t*)ptr) = st->vbr_enabled;
- break;
- case SPEEX_SET_VAD:
- st->vad_enabled = (*(spx_int32_t*)ptr);
- speex_encoder_ctl(st->st_low, SPEEX_SET_VAD, ptr);
- break;
- case SPEEX_GET_VAD:
- (*(spx_int32_t*)ptr) = st->vad_enabled;
- break;
- #endif /* #ifndef DISABLE_VBR */
- #if !defined(DISABLE_VBR) && !defined(DISABLE_FLOAT_API)
- case SPEEX_SET_VBR_QUALITY:
- {
- spx_int32_t q;
- float qual = (*(float*)ptr)+.6;
- st->vbr_quality = (*(float*)ptr);
- if (qual>10)
- qual=10;
- q=(int)floor(.5+*(float*)ptr);
- if (q>10)
- q=10;
- speex_encoder_ctl(st->st_low, SPEEX_SET_VBR_QUALITY, &qual);
- speex_encoder_ctl(state, SPEEX_SET_QUALITY, &q);
- break;
- }
- case SPEEX_GET_VBR_QUALITY:
- (*(float*)ptr) = st->vbr_quality;
- break;
- #endif /* #if !defined(DISABLE_VBR) && !defined(DISABLE_FLOAT_API) */
- #ifndef DISABLE_VBR
- case SPEEX_SET_ABR:
- st->abr_enabled = (*(spx_int32_t*)ptr);
- st->vbr_enabled = st->abr_enabled!=0;
- speex_encoder_ctl(st->st_low, SPEEX_SET_VBR, &st->vbr_enabled);
- if (st->vbr_enabled)
- {
- spx_int32_t i=10, rate, target;
- float vbr_qual;
- target = (*(spx_int32_t*)ptr);
- while (i>=0)
- {
- speex_encoder_ctl(st, SPEEX_SET_QUALITY, &i);
- speex_encoder_ctl(st, SPEEX_GET_BITRATE, &rate);
- if (rate <= target)
- break;
- i--;
- }
- vbr_qual=i;
- if (vbr_qual<0)
- vbr_qual=0;
- speex_encoder_ctl(st, SPEEX_SET_VBR_QUALITY, &vbr_qual);
- st->abr_count=0;
- st->abr_drift=0;
- st->abr_drift2=0;
- }
- break;
- case SPEEX_GET_ABR:
- (*(spx_int32_t*)ptr) = st->abr_enabled;
- break;
- #endif /* #ifndef DISABLE_VBR */
- case SPEEX_SET_QUALITY:
- {
- spx_int32_t nb_qual;
- int quality = (*(spx_int32_t*)ptr);
- if (quality < 0)
- quality = 0;
- if (quality > 10)
- quality = 10;
- st->submodeSelect = st->submodeID = ((const SpeexSBMode*)(st->mode->mode))->quality_map[quality];
- nb_qual = ((const SpeexSBMode*)(st->mode->mode))->low_quality_map[quality];
- speex_encoder_ctl(st->st_low, SPEEX_SET_MODE, &nb_qual);
- }
- break;
- case SPEEX_SET_COMPLEXITY:
- speex_encoder_ctl(st->st_low, SPEEX_SET_COMPLEXITY, ptr);
- st->complexity = (*(spx_int32_t*)ptr);
- if (st->complexity<1)
- st->complexity=1;
- break;
- case SPEEX_GET_COMPLEXITY:
- (*(spx_int32_t*)ptr) = st->complexity;
- break;
- case SPEEX_SET_BITRATE:
- {
- spx_int32_t i=10;
- spx_int32_t rate, target;
- target = (*(spx_int32_t*)ptr);
- while (i>=0)
- {
- speex_encoder_ctl(st, SPEEX_SET_QUALITY, &i);
- speex_encoder_ctl(st, SPEEX_GET_BITRATE, &rate);
- if (rate <= target)
- break;
- i--;
- }
- }
- break;
- case SPEEX_GET_BITRATE:
- speex_encoder_ctl(st->st_low, request, ptr);
- /*fprintf (stderr, "before: %d\n", (*(int*)ptr));*/
- if (st->submodes[st->submodeID])
- (*(spx_int32_t*)ptr) += st->sampling_rate*SUBMODE(bits_per_frame)/st->full_frame_size;
- else
- (*(spx_int32_t*)ptr) += st->sampling_rate*(SB_SUBMODE_BITS+1)/st->full_frame_size;
- /*fprintf (stderr, "after: %d\n", (*(int*)ptr));*/
- break;
- case SPEEX_SET_SAMPLING_RATE:
- {
- spx_int32_t tmp=(*(spx_int32_t*)ptr);
- st->sampling_rate = tmp;
- tmp>>=1;
- speex_encoder_ctl(st->st_low, SPEEX_SET_SAMPLING_RATE, &tmp);
- }
- break;
- case SPEEX_GET_SAMPLING_RATE:
- (*(spx_int32_t*)ptr)=st->sampling_rate;
- break;
- case SPEEX_RESET_STATE:
- {
- int i;
- st->first = 1;
- for (i=0;i<st->lpcSize;i++)
- st->old_lsp[i]= DIV32(MULT16_16(QCONST16(3.1415927f, LSP_SHIFT), i+1), st->lpcSize+1);
- for (i=0;i<st->lpcSize;i++)
- st->mem_sw[i]=st->mem_sp[i]=st->mem_sp2[i]=0;
- for (i=0;i<QMF_ORDER;i++)
- st->h0_mem[i]=0;
- }
- break;
- case SPEEX_SET_SUBMODE_ENCODING:
- st->encode_submode = (*(spx_int32_t*)ptr);
- speex_encoder_ctl(st->st_low, SPEEX_SET_SUBMODE_ENCODING, ptr);
- break;
- case SPEEX_GET_SUBMODE_ENCODING:
- (*(spx_int32_t*)ptr) = st->encode_submode;
- break;
- case SPEEX_GET_LOOKAHEAD:
- speex_encoder_ctl(st->st_low, SPEEX_GET_LOOKAHEAD, ptr);
- (*(spx_int32_t*)ptr) = 2*(*(spx_int32_t*)ptr) + QMF_ORDER - 1;
- break;
- case SPEEX_SET_PLC_TUNING:
- speex_encoder_ctl(st->st_low, SPEEX_SET_PLC_TUNING, ptr);
- break;
- case SPEEX_GET_PLC_TUNING:
- speex_encoder_ctl(st->st_low, SPEEX_GET_PLC_TUNING, ptr);
- break;
- #ifndef DISABLE_VBR
- case SPEEX_SET_VBR_MAX_BITRATE:
- {
- st->vbr_max = (*(spx_int32_t*)ptr);
- if (SPEEX_SET_VBR_MAX_BITRATE<1)
- {
- speex_encoder_ctl(st->st_low, SPEEX_SET_VBR_MAX_BITRATE, &st->vbr_max);
- st->vbr_max_high = 17600;
- } else {
- spx_int32_t low_rate;
- if (st->vbr_max >= 42200)
- {
- st->vbr_max_high = 17600;
- } else if (st->vbr_max >= 27800)
- {
- st->vbr_max_high = 9600;
- } else if (st->vbr_max > 20600)
- {
- st->vbr_max_high = 5600;
- } else {
- st->vbr_max_high = 1800;
- }
- if (st->subframeSize==80)
- st->vbr_max_high = 1800;
- low_rate = st->vbr_max - st->vbr_max_high;
- speex_encoder_ctl(st->st_low, SPEEX_SET_VBR_MAX_BITRATE, &low_rate);
- }
- }
- break;
- case SPEEX_GET_VBR_MAX_BITRATE:
- (*(spx_int32_t*)ptr) = st->vbr_max;
- break;
- #endif /* #ifndef DISABLE_VBR */
- case SPEEX_SET_HIGHPASS:
- speex_encoder_ctl(st->st_low, SPEEX_SET_HIGHPASS, ptr);
- break;
- case SPEEX_GET_HIGHPASS:
- speex_encoder_ctl(st->st_low, SPEEX_GET_HIGHPASS, ptr);
- break;
- /* This is all internal stuff past this point */
- case SPEEX_GET_PI_GAIN:
- {
- int i;
- spx_word32_t *g = (spx_word32_t*)ptr;
- for (i=0;i<st->nbSubframes;i++)
- g[i]=st->pi_gain[i];
- }
- break;
- case SPEEX_GET_EXC:
- {
- int i;
- for (i=0;i<st->nbSubframes;i++)
- ((spx_word16_t*)ptr)[i] = st->exc_rms[i];
- }
- break;
- #ifndef DISABLE_VBR
- case SPEEX_GET_RELATIVE_QUALITY:
- (*(float*)ptr)=st->relative_quality;
- break;
- #endif /* #ifndef DISABLE_VBR */
- case SPEEX_SET_INNOVATION_SAVE:
- st->innov_rms_save = (spx_word16_t*)ptr;
- break;
- case SPEEX_SET_WIDEBAND:
- speex_encoder_ctl(st->st_low, SPEEX_SET_WIDEBAND, ptr);
- break;
- case SPEEX_GET_STACK:
- *((char**)ptr) = st->stack;
- break;
- default:
- speex_warning_int("Unknown nb_ctl request: ", request);
- return -1;
- }
- return 0;
- }
/* Encode one wideband frame into `bits`.
 *
 * state: sub-band encoder state from sb_encoder_init().
 * vin:   input samples, accessed as spx_word16_t; st->full_frame_size samples
 *        are read. The buffer is used as work space and is overwritten: the
 *        QMF split writes the low band at `in` and the high band at
 *        `in + st->frame_size`, and later stages modify it further.
 * bits:  bit-stream the low-band and high-band parameters are packed into.
 *
 * The low band is encoded by the embedded low-band encoder; the high band is
 * then described by quantised LSPs plus, per subframe, either a single gain
 * (submodes without an innovation quantiser) or a gain and innovation
 * codebook indices.
 *
 * Returns 0 when the low-band encoder reports submode 0 for this frame (the
 * `dtx` flag below) and 1 otherwise.
 */
- int sb_encode(void *state, void *vin, SpeexBits *bits)
- {
- SBEncState *st;
- int i, roots, sub;
- char *stack;
- VARDECL(spx_mem_t *mem);
- VARDECL(spx_sig_t *innov);
- VARDECL(spx_word16_t *target);
- VARDECL(spx_word16_t *syn_resp);
- VARDECL(spx_word32_t *low_pi_gain);
- spx_word16_t *low;
- spx_word16_t *high;
- VARDECL(spx_word16_t *low_exc_rms);
- VARDECL(spx_word16_t *low_innov_rms);
- const SpeexSBMode *mode;
- spx_int32_t dtx;
- spx_word16_t *in = (spx_word16_t*)vin;
- spx_word16_t e_low=0, e_high=0;
- VARDECL(spx_coef_t *lpc);
- VARDECL(spx_coef_t *interp_lpc);
- VARDECL(spx_coef_t *bw_lpc1);
- VARDECL(spx_coef_t *bw_lpc2);
- VARDECL(spx_lsp_t *lsp);
- VARDECL(spx_lsp_t *qlsp);
- VARDECL(spx_lsp_t *interp_lsp);
- VARDECL(spx_lsp_t *interp_qlsp);
- st = (SBEncState*)state;
- stack=st->stack;
- mode = (const SpeexSBMode*)(st->mode->mode);
/* Both sub-band outputs live inside the caller's input buffer. */
- low = in;
- high = in+st->frame_size;
- /* High-band buffering / sync with low band */
- /* Compute the two sub-bands by filtering with QMF h0*/
- qmf_decomp(in, h0, low, high, st->full_frame_size, QMF_ORDER, st->h0_mem, stack);
- #ifndef DISABLE_VBR
- if (st->vbr_enabled || st->vad_enabled)
- {
- /* Need to compute things here before the signal is trashed by the encoder */
- /*FIXME: Are the two signals (low, high) in sync? */
- e_low = compute_rms16(low, st->frame_size);
- e_high = compute_rms16(high, st->frame_size);
- }
- #endif /* #ifndef DISABLE_VBR */
/* Have the low-band encoder report its per-subframe innovation RMS here. */
- ALLOC(low_innov_rms, st->nbSubframes, spx_word16_t);
- speex_encoder_ctl(st->st_low, SPEEX_SET_INNOVATION_SAVE, low_innov_rms);
- /* Encode the narrowband part*/
- speex_encode_native(st->st_low, low, bits);
/* Move `high` back by the overlap (windowSize-frame_size samples) so the
   analysis window can start with samples kept from the previous frame. This
   reuses the tail of the low-band area, which has already been encoded.
   Presumably SPEEX_COPY(dst, src, n): the first copy restores the saved
   samples, the second saves this frame's tail for the next call -- confirm
   the argument order against the macro definition. */
- high = high - (st->windowSize-st->frame_size);
- SPEEX_COPY(high, st->high, st->windowSize-st->frame_size);
- SPEEX_COPY(st->high, &high[st->frame_size], st->windowSize-st->frame_size);
- ALLOC(low_pi_gain, st->nbSubframes, spx_word32_t);
- ALLOC(low_exc_rms, st->nbSubframes, spx_word16_t);
- speex_encoder_ctl(st->st_low, SPEEX_GET_PI_GAIN, low_pi_gain);
- speex_encoder_ctl(st->st_low, SPEEX_GET_EXC, low_exc_rms);
- speex_encoder_ctl(st->st_low, SPEEX_GET_LOW_MODE, &dtx);
/* Turn the low-band submode into a flag: 1 when it is submode 0, else 0. */
- if (dtx==0)
- dtx=1;
- else
- dtx=0;
- ALLOC(lpc, st->lpcSize, spx_coef_t);
- ALLOC(interp_lpc, st->lpcSize, spx_coef_t);
- ALLOC(bw_lpc1, st->lpcSize, spx_coef_t);
- ALLOC(bw_lpc2, st->lpcSize, spx_coef_t);
- ALLOC(lsp, st->lpcSize, spx_lsp_t);
- ALLOC(qlsp, st->lpcSize, spx_lsp_t);
- ALLOC(interp_lsp, st->lpcSize, spx_lsp_t);
- ALLOC(interp_qlsp, st->lpcSize, spx_lsp_t);
/* High-band LPC analysis: window, autocorrelation, lag window, Levinson-Durbin. */
- {
- VARDECL(spx_word16_t *autocorr);
- VARDECL(spx_word16_t *w_sig);
- ALLOC(autocorr, st->lpcSize+1, spx_word16_t);
- ALLOC(w_sig, st->windowSize, spx_word16_t);
- /* Window for analysis */
- /* FIXME: This is a kludge */
/* With 80-sample subframes each window coefficient is used for two samples. */
- if (st->subframeSize==80)
- {
- for (i=0;i<st->windowSize;i++)
- w_sig[i] = EXTRACT16(SHR32(MULT16_16(high[i],st->window[i>>1]),SIG_SHIFT));
- } else {
- for (i=0;i<st->windowSize;i++)
- w_sig[i] = EXTRACT16(SHR32(MULT16_16(high[i],st->window[i]),SIG_SHIFT));
- }
- /* Compute auto-correlation */
- _spx_autocorr(w_sig, autocorr, st->lpcSize+1, st->windowSize);
- autocorr[0] = ADD16(autocorr[0],MULT16_16_Q15(autocorr[0],st->lpc_floor)); /* Noise floor in auto-correlation domain */
- /* Lag windowing: equivalent to filtering in the power-spectrum domain */
- for (i=0;i<st->lpcSize+1;i++)
- autocorr[i] = MULT16_16_Q14(autocorr[i],st->lagWindow[i]);
- /* Levinson-Durbin */
- _spx_lpc(lpc, autocorr, st->lpcSize);
- }
- /* LPC to LSPs (x-domain) transform */
- roots=lpc_to_lsp (lpc, st->lpcSize, lsp, 10, LSP_DELTA1, stack);
- if (roots!=st->lpcSize)
- {
/* Not all roots found: retry once with the smaller step LSP_DELTA2. */
- roots = lpc_to_lsp (lpc, st->lpcSize, lsp, 10, LSP_DELTA2, stack);
- if (roots!=st->lpcSize) {
- /*If we can't find all LSP's, do some damage control and use a flat filter*/
/* NOTE(review): despite the wording above, the fallback copies the previous
   frame's LSPs (st->old_lsp), not a flat filter. */
- for (i=0;i<st->lpcSize;i++)
- {
- lsp[i]=st->old_lsp[i];
- }
- }
- }
- #ifndef DISABLE_VBR
- /* VBR code */
- if ((st->vbr_enabled || st->vad_enabled) && !dtx)
- {
- float ratio;
- if (st->abr_enabled)
- {
/* ABR: nudge vbr_quality (by at most +/-0.1 per frame, kept within 0..10)
   against the accumulated bit-rate drift. */
- float qual_change=0;
- if (st->abr_drift2 * st->abr_drift > 0)
- {
- /* Only adapt if long-term and short-term drift are the same sign */
- qual_change = -.00001*st->abr_drift/(1+st->abr_count);
- if (qual_change>.1)
- qual_change=.1;
- if (qual_change<-.1)
- qual_change=-.1;
- }
- st->vbr_quality += qual_change;
- if (st->vbr_quality>10)
- st->vbr_quality=10;
- if (st->vbr_quality<0)
- st->vbr_quality=0;
- }
/* Log ratio of high-band to low-band RMS, clamped to [-4, 2] below. */
- ratio = 2*log((1.f+e_high)/(1.f+e_low));
- speex_encoder_ctl(st->st_low, SPEEX_GET_RELATIVE_QUALITY, &st->relative_quality);
- if (ratio<-4)
- ratio=-4;
- if (ratio>2)
- ratio=2;
- /*if (ratio>-2)*/
- if (st->vbr_enabled)
- {
- spx_int32_t modeid;
- modeid = mode->nb_modes-1;
- st->relative_quality+=1.0*(ratio+2);
- if (st->relative_quality<-1)
- st->relative_quality=-1;
/* Walk down from the highest submode and stop at the first one whose quality
   threshold (interpolated between the two integer vbr_quality levels) is met
   and whose bit-rate fits under vbr_max_high; falls through to submode 0. */
- while (modeid)
- {
- int v1;
- float thresh;
- v1=(int)floor(st->vbr_quality);
- if (v1==10)
- thresh = mode->vbr_thresh[modeid][v1];
- else
- thresh = (st->vbr_quality-v1) * mode->vbr_thresh[modeid][v1+1] +
- (1+v1-st->vbr_quality) * mode->vbr_thresh[modeid][v1];
- if (st->relative_quality >= thresh && st->sampling_rate*st->submodes[modeid]->bits_per_frame/st->full_frame_size <= st->vbr_max_high)
- break;
- modeid--;
- }
- speex_encoder_ctl(state, SPEEX_SET_HIGH_MODE, &modeid);
- if (st->abr_enabled)
- {
/* abr_enabled holds the target bit-rate set through SPEEX_SET_ABR. */
- spx_int32_t bitrate;
- speex_encoder_ctl(state, SPEEX_GET_BITRATE, &bitrate);
- st->abr_drift+=(bitrate-st->abr_enabled);
- st->abr_drift2 = .95*st->abr_drift2 + .05*(bitrate-st->abr_enabled);
- st->abr_count += 1.0;
- }
- } else {
- /* VAD only */
- int modeid;
- if (st->relative_quality<2.0)
- modeid=1;
- else
- modeid=st->submodeSelect;
- /*speex_encoder_ctl(state, SPEEX_SET_MODE, &mode);*/
- st->submodeID=modeid;
- }
- /*fprintf (stderr, "%f %f\n", ratio, low_qual);*/
- }
- #endif /* #ifndef DISABLE_VBR */
/* High-band header: one bit set to 1, then the submode id in SB_SUBMODE_BITS
   bits (0 is written when the dtx flag is set). */
- if (st->encode_submode)
- {
- speex_bits_pack(bits, 1, 1);
- if (dtx)
- speex_bits_pack(bits, 0, SB_SUBMODE_BITS);
- else
- speex_bits_pack(bits, st->submodeID, SB_SUBMODE_BITS);
- }
- /* If null mode (no transmission), just set a couple things to zero*/
- if (dtx || st->submodes[st->submodeID] == NULL)
- {
- for (i=0;i<st->frame_size;i++)
- high[i]=VERY_SMALL;
- for (i=0;i<st->lpcSize;i++)
- st->mem_sw[i]=0;
- st->first=1;
- /* Final signal synthesis from excitation */
- iir_mem16(high, st->interp_qlpc, high, st->frame_size, st->lpcSize, st->mem_sp, stack);
- if (dtx)
- return 0;
- else
- return 1;
- }
- /* LSP quantization */
- SUBMODE(lsp_quant)(lsp, qlsp, st->lpcSize, bits);
/* On the first frame after init/reset/null mode there is no usable history,
   so interpolate from the current LSPs. */
- if (st->first)
- {
- for (i=0;i<st->lpcSize;i++)
- st->old_lsp[i] = lsp[i];
- for (i=0;i<st->lpcSize;i++)
- st->old_qlsp[i] = qlsp[i];
- }
- ALLOC(mem, st->lpcSize, spx_mem_t);
- ALLOC(syn_resp, st->subframeSize, spx_word16_t);
- ALLOC(innov, st->subframeSize, spx_sig_t);
- ALLOC(target, st->subframeSize, spx_word16_t);
/* Per-subframe high-band coding. */
- for (sub=0;sub<st->nbSubframes;sub++)
- {
- VARDECL(spx_word16_t *exc);
- VARDECL(spx_word16_t *res);
- VARDECL(spx_word16_t *sw);
- spx_word16_t *sp;
- spx_word16_t filter_ratio; /*Q7*/
- int offset;
- spx_word32_t rl, rh; /*Q13*/
- spx_word16_t eh=0;
- offset = st->subframeSize*sub;
- sp=high+offset;
- ALLOC(exc, st->subframeSize, spx_word16_t);
- ALLOC(res, st->subframeSize, spx_word16_t);
- ALLOC(sw, st->subframeSize, spx_word16_t);
- /* LSP interpolation (quantized and unquantized) */
- lsp_interpolate(st->old_lsp, lsp, interp_lsp, st->lpcSize, sub, st->nbSubframes, LSP_MARGIN);
- lsp_interpolate(st->old_qlsp, qlsp, interp_qlsp, st->lpcSize, sub, st->nbSubframes, LSP_MARGIN);
- lsp_to_lpc(interp_lsp, interp_lpc, st->lpcSize,stack);
- lsp_to_lpc(interp_qlsp, st->interp_qlpc, st->lpcSize, stack);
/* Weighting-filter coefficients are derived from the unquantised LPCs. */
- bw_lpc(st->gamma1, interp_lpc, bw_lpc1, st->lpcSize);
- bw_lpc(st->gamma2, interp_lpc, bw_lpc2, st->lpcSize);
- /* Compute mid-band (4000 Hz for wideband) response of low-band and high-band
- filters */
/* pi_gain sums all coefficients; rh sums them with alternating sign. The loop
   reads coefficients in pairs (i, i+1). */
- st->pi_gain[sub]=LPC_SCALING;
- rh = LPC_SCALING;
- for (i=0;i<st->lpcSize;i+=2)
- {
- rh += st->interp_qlpc[i+1] - st->interp_qlpc[i];
- st->pi_gain[sub] += st->interp_qlpc[i] + st->interp_qlpc[i+1];
- }
- rl = low_pi_gain[sub];
/* Ratio of low-band to high-band response, with a small bias on both terms. */
- #ifdef FIXED_POINT
- filter_ratio=EXTRACT16(SATURATE(PDIV32(SHL32(ADD32(rl,82),7),ADD32(82,rh)),32767));
- #else
- filter_ratio=(rl+.01)/(rh+.01);
- #endif
- /* Compute "real excitation" */
- fir_mem16(sp, st->interp_qlpc, exc, st->subframeSize, st->lpcSize, st->mem_sp2, stack);
- /* Compute energy of low-band and high-band excitation */
- eh = compute_rms16(exc, st->subframeSize);
- if (!SUBMODE(innovation_quant)) {/* 1 for spectral folding excitation, 0 for stochastic */
/* No innovation quantiser in this submode: only a 5-bit gain is transmitted. */
- spx_word32_t g; /*Q7*/
- spx_word16_t el; /*Q0*/
- el = low_innov_rms[sub];
- /* Gain to use if we want to use the low-band excitation for high-band */
- g=PDIV32(MULT16_16(filter_ratio,eh),EXTEND32(ADD16(1,el)));
- #if 0
- {
- char *tmp_stack=stack;
- float *tmp_sig;
- float g2;
- ALLOC(tmp_sig, st->subframeSize, spx_sig_t);
- for (i=0;i<st->lpcSize;i++)
- mem[i]=st->mem_sp[i];
- iir_mem2(st->low_innov+offset, st->interp_qlpc, tmp_sig, st->subframeSize, st->lpcSize, mem);
- g2 = compute_rms(sp, st->subframeSize)/(.01+compute_rms(tmp_sig, st->subframeSize));
- /*fprintf (stderr, "gains: %f %f\n", g, g2);*/
- g = g2;
- stack = tmp_stack;
- }
- #endif
- /*print_vec(&g, 1, "gain factor");*/
- /* Gain quantization */
- {
- int quant = scal_quant(g, fold_quant_bound, 32);
- /*speex_warning_int("tata", quant);*/
- if (quant<0)
- quant=0;
- if (quant>31)
- quant=31;
- speex_bits_pack(bits, quant, 5);
- }
- if (st->innov_rms_save)
- {
- st->innov_rms_save[sub] = eh;
- }
- st->exc_rms[sub] = eh;
- } else {
/* Innovation-quantiser path: a 4-bit gain followed by codebook indices. */
- spx_word16_t gc; /*Q7*/
- spx_word32_t scale; /*Q14*/
- spx_word16_t el; /*Q0*/
- el = low_exc_rms[sub]; /*Q0*/
- gc = PDIV32_16(MULT16_16(filter_ratio,1+eh),1+el);
- /* This is a kludge that cleans up a historical bug */
- if (st->subframeSize==80)
- gc = MULT16_16_P15(QCONST16(0.70711f,15),gc);
- /*printf ("%f %f %f %f\n", el, eh, filter_ratio, gc);*/
- {
/* Transmit the gain index, then continue with the value derived from the
   table entry for that index. */
- int qgc = scal_quant(gc, gc_quant_bound, 16);
- speex_bits_pack(bits, qgc, 4);
- gc = MULT16_16_Q15(QCONST16(0.87360,15),gc_quant_bound[qgc]);
- }
- if (st->subframeSize==80)
- gc = MULT16_16_P14(QCONST16(1.4142f,14), gc);
- scale = SHL32(MULT16_16(PDIV32_16(SHL32(EXTEND32(gc),SIG_SHIFT-6),filter_ratio),(1+el)),6);
- compute_impulse_response(st->interp_qlpc, bw_lpc1, bw_lpc2, syn_resp, st->subframeSize, st->lpcSize, stack);
- /* Reset excitation */
- for (i=0;i<st->subframeSize;i++)
- res[i]=VERY_SMALL;
- /* Compute zero response (ringing) of A(z/g1) / ( A(z/g2) * Aq(z) ) */
/* Both filters run on copies of the memories so the real state is untouched. */
- for (i=0;i<st->lpcSize;i++)
- mem[i]=st->mem_sp[i];
- iir_mem16(res, st->interp_qlpc, res, st->subframeSize, st->lpcSize, mem, stack);
- for (i=0;i<st->lpcSize;i++)
- mem[i]=st->mem_sw[i];
- filter_mem16(res, bw_lpc1, bw_lpc2, res, st->subframeSize, st->lpcSize, mem, stack);
- /* Compute weighted signal */
- for (i=0;i<st->lpcSize;i++)
- mem[i]=st->mem_sw[i];
- filter_mem16(sp, bw_lpc1, bw_lpc2, sw, st->subframeSize, st->lpcSize, mem, stack);
- /* Compute target signal */
- for (i=0;i<st->subframeSize;i++)
- target[i]=SUB16(sw[i],res[i]);
/* The target is normalised by `scale` before the search; the chosen
   innovation is multiplied back by `scale` afterwards. */
- signal_div(target, target, scale, st->subframeSize);
- /* Reset excitation */
- SPEEX_MEMSET(innov, 0, st->subframeSize);
- /*print_vec(target, st->subframeSize, "\ntarget");*/
- SUBMODE(innovation_quant)(target, st->interp_qlpc, bw_lpc1, bw_lpc2,
- SUBMODE(innovation_params), st->lpcSize, st->subframeSize,
- innov, syn_resp, bits, stack, st->complexity, SUBMODE(double_codebook));
- /*print_vec(target, st->subframeSize, "after");*/
- signal_mul(innov, innov, scale, st->subframeSize);
- if (SUBMODE(double_codebook)) {
/* Second codebook pass on the target scaled by 2.5; its contribution is
   scaled by 0.4*scale and added to the first innovation. The stack pointer
   is restored afterwards to release innov2. */
- char *tmp_stack=stack;
- VARDECL(spx_sig_t *innov2);
- ALLOC(innov2, st->subframeSize, spx_sig_t);
- SPEEX_MEMSET(innov2, 0, st->subframeSize);
- for (i=0;i<st->subframeSize;i++)
- target[i]=MULT16_16_P13(QCONST16(2.5f,13), target[i]);
- SUBMODE(innovation_quant)(target, st->interp_qlpc, bw_lpc1, bw_lpc2,
- SUBMODE(innovation_params), st->lpcSize, st->subframeSize,
- innov2, syn_resp, bits, stack, st->complexity, 0);
- signal_mul(innov2, innov2, MULT16_32_P15(QCONST16(0.4f,15),scale), st->subframeSize);
- for (i=0;i<st->subframeSize;i++)
- innov[i] = ADD32(innov[i],innov2[i]);
- stack = tmp_stack;
- }
- for (i=0;i<st->subframeSize;i++)
- exc[i] = PSHR32(innov[i],SIG_SHIFT);
- if (st->innov_rms_save)
- {
- st->innov_rms_save[sub] = MULT16_16_Q15(QCONST16(.70711f, 15), compute_rms(innov, st->subframeSize));
- }
- st->exc_rms[sub] = compute_rms16(exc, st->subframeSize);
- }
- /*Keep the previous memory*/
- for (i=0;i<st->lpcSize;i++)
- mem[i]=st->mem_sp[i];
- /* Final signal synthesis from excitation */
- iir_mem16(exc, st->interp_qlpc, sp, st->subframeSize, st->lpcSize, st->mem_sp, stack);
- /* Compute weighted signal again, from synthesized speech (not sure it's the right thing) */
- filter_mem16(sp, bw_lpc1, bw_lpc2, sw, st->subframeSize, st->lpcSize, st->mem_sw, stack);
- }
/* Remember this frame's LSPs for interpolation in the next frame. */
- for (i=0;i<st->lpcSize;i++)
- st->old_lsp[i] = lsp[i];
- for (i=0;i<st->lpcSize;i++)
- st->old_qlsp[i] = qlsp[i];
- st->first=0;
- return 1;
- }
- #endif /* DISABLE_ENCODER */
- #ifndef DISABLE_DECODER
- /* Allocate and initialise a sub-band (wideband) decoder state for mode `m`.
-  *
-  * The state embeds a low-band decoder created from the `nb_mode` of the
-  * SpeexSBMode found in m->mode. Frame geometry (frame size, subframe size,
-  * LPC order, submode table, default submode) is copied from that same
-  * SpeexSBMode; the sampling rate is twice the rate reported by the low-band
-  * decoder.
-  *
-  * Returns the new state, or NULL when the state structure itself cannot be
-  * allocated.
-  *
-  * NOTE(review): the results of speex_decoder_init() and of the per-buffer
-  * speex_alloc() calls below are not checked in this function.
-  */
- void *sb_decoder_init(const SpeexMode *m)
- {
-    const SpeexSBMode *sb_mode;
-    SBDecState *dec;
-    spx_int32_t wideband_flag = 1;
-    dec = (SBDecState*)speex_alloc(sizeof(SBDecState));
-    if (dec == NULL)
-    {
-       return NULL;
-    }
-    sb_mode = (const SpeexSBMode*)m->mode;
-    dec->mode = m;
-    dec->encode_submode = 1;
-    /* Low-band decoder comes first: the scratch stack (when one is used) and
-       the sampling rate are both queried from it. */
-    dec->st_low = speex_decoder_init(sb_mode->nb_mode);
- #if defined(VAR_ARRAYS) || defined (USE_ALLOCA)
-    dec->stack = NULL;
- #else
-    /* Use the stack pointer reported by the low-band decoder instead of
-       allocating a separate scratch area. */
-    speex_decoder_ctl(dec->st_low, SPEEX_GET_STACK, &dec->stack);
- #endif
-    /* Frame geometry: the full frame is twice the per-band frame. */
-    dec->frame_size = sb_mode->frameSize;
-    dec->full_frame_size = 2*sb_mode->frameSize;
-    dec->subframeSize = sb_mode->subframeSize;
-    dec->nbSubframes = sb_mode->frameSize/sb_mode->subframeSize;
-    dec->lpcSize = sb_mode->lpcSize;
-    /* Output rate is double the low-band rate. */
-    speex_decoder_ctl(dec->st_low, SPEEX_GET_SAMPLING_RATE, &dec->sampling_rate);
-    dec->sampling_rate *= 2;
-    /* Tell the low-band decoder that it runs as part of a wideband decoder. */
-    speex_decoder_ctl(dec->st_low, SPEEX_SET_WIDEBAND, &wideband_flag);
-    dec->submodes = sb_mode->submodes;
-    dec->submodeID = sb_mode->defaultSubmode;
-    dec->first = 1;
-    /* QMF synthesis memories. */
-    dec->g0_mem = (spx_word16_t*)speex_alloc((QMF_ORDER)*sizeof(spx_word16_t));
-    dec->g1_mem = (spx_word16_t*)speex_alloc((QMF_ORDER)*sizeof(spx_word16_t));
-    /* Per-subframe excitation buffer and per-frame gain/energy records. */
-    dec->excBuf = (spx_word16_t*)speex_alloc((dec->subframeSize)*sizeof(spx_word16_t));
-    /* LSP/LPC history, each of length lpcSize. */
-    dec->old_qlsp = (spx_lsp_t*)speex_alloc((dec->lpcSize)*sizeof(spx_lsp_t));
-    dec->interp_qlpc = (spx_coef_t*)speex_alloc(dec->lpcSize*sizeof(spx_coef_t));
-    dec->pi_gain = (spx_word32_t*)speex_alloc((dec->nbSubframes)*sizeof(spx_word32_t));
-    dec->exc_rms = (spx_word16_t*)speex_alloc((dec->nbSubframes)*sizeof(spx_word16_t));
-    /* Synthesis filter memory is sized at twice the LPC order. */
-    dec->mem_sp = (spx_mem_t*)speex_alloc((2*dec->lpcSize)*sizeof(spx_mem_t));
-    dec->innov_save = NULL;
-    dec->lpc_enh_enabled = 0;
-    dec->seed = 1000;
- #ifdef ENABLE_VALGRIND
-    VALGRIND_MAKE_MEM_DEFINED(dec, (dec->stack-(char*)dec));
- #endif
-    return dec;
- }
- /* Destroy a sub-band decoder state.
-  *
-  * Destroys the embedded low-band decoder, then frees each buffer held by the
-  * state and finally the state structure itself. The `stack` member is not
-  * freed here.
-  */
- void sb_decoder_destroy(void *state)
- {
-    SBDecState *dec = (SBDecState*)state;
-    /* The embedded low-band decoder goes first. */
-    speex_decoder_destroy(dec->st_low);
-    /* QMF synthesis memories. */
-    speex_free(dec->g0_mem);
-    speex_free(dec->g1_mem);
-    /* Excitation, LSP/LPC history and per-subframe records. */
-    speex_free(dec->excBuf);
-    speex_free(dec->old_qlsp);
-    speex_free(dec->interp_qlpc);
-    speex_free(dec->pi_gain);
-    speex_free(dec->exc_rms);
-    speex_free(dec->mem_sp);
-    /* Finally the state block itself. */
-    speex_free(dec);
- }
- /* Handle a control request on a sub-band decoder state.
-  *
-  * state   : SBDecState to operate on.
-  * request : one of the SPEEX_* request codes handled in the switch below.
-  * ptr     : request-specific argument; most requests read or write a
-  *           spx_int32_t through it, a few treat it as an array or as a
-  *           pointer to a pointer (see the individual cases).
-  *
-  * Returns 0 for every recognised request and -1 (after emitting a warning)
-  * for an unrecognised one. Return values of the forwarded low-band calls are
-  * not inspected.
-  */
- int sb_decoder_ctl(void *state, int request, void *ptr)
- {
-    SBDecState *st = (SBDecState*)state;
-    switch (request)
-    {
-    /* Requests that are simply handed to the low-band decoder unchanged. */
-    case SPEEX_SET_LOW_MODE:
-    case SPEEX_GET_LOW_MODE:
-    case SPEEX_SET_HANDLER:
-    case SPEEX_SET_USER_HANDLER:
-    case SPEEX_SET_HIGHPASS:
-    case SPEEX_GET_HIGHPASS:
-    case SPEEX_GET_ACTIVITY:
-    case SPEEX_GET_DTX_STATUS:
-    case SPEEX_SET_WIDEBAND:
-       speex_decoder_ctl(st->st_low, request, ptr);
-       break;
-    case SPEEX_SET_HIGH_MODE:
-       st->submodeID = *(spx_int32_t*)ptr;
-       break;
-    case SPEEX_GET_FRAME_SIZE:
-       *(spx_int32_t*)ptr = st->full_frame_size;
-       break;
-    case SPEEX_SET_ENH:
-       /* Forward to the low band, and remember the setting locally too. */
-       speex_decoder_ctl(st->st_low, request, ptr);
-       st->lpc_enh_enabled = *(spx_int32_t*)ptr;
-       break;
-    case SPEEX_GET_ENH:
-       *(spx_int32_t*)ptr = st->lpc_enh_enabled;
-       break;
-    case SPEEX_SET_MODE:
-    case SPEEX_SET_QUALITY:
-    {
-       /* Both requests take a quality index, clamped to 0..10, and map it
-          to a high-band submode plus a low-band mode. */
-       const SpeexSBMode *sb_mode = (const SpeexSBMode*)(st->mode->mode);
-       spx_int32_t low_band_mode;
-       int q = *(spx_int32_t*)ptr;
-       q = (q < 0) ? 0 : q;
-       q = (q > 10) ? 10 : q;
-       st->submodeID = sb_mode->quality_map[q];
-       low_band_mode = sb_mode->low_quality_map[q];
-       speex_decoder_ctl(st->st_low, SPEEX_SET_MODE, &low_band_mode);
-       break;
-    }
-    case SPEEX_GET_BITRATE:
-    {
-       /* Start from the low-band bit-rate and add the high-band share. With
-          no active submode only the SB_SUBMODE_BITS+1 header bits count. */
-       spx_int32_t *rate = (spx_int32_t*)ptr;
-       speex_decoder_ctl(st->st_low, request, ptr);
-       if (st->submodes[st->submodeID] != NULL)
-       {
-          *rate += st->sampling_rate*SUBMODE(bits_per_frame)/st->full_frame_size;
-       } else {
-          *rate += st->sampling_rate*(SB_SUBMODE_BITS+1)/st->full_frame_size;
-       }
-       break;
-    }
-    case SPEEX_SET_SAMPLING_RATE:
-    {
-       /* The low band runs at half the requested rate. */
-       spx_int32_t rate = *(spx_int32_t*)ptr;
-       st->sampling_rate = rate;
-       rate >>= 1;
-       speex_decoder_ctl(st->st_low, SPEEX_SET_SAMPLING_RATE, &rate);
-       break;
-    }
-    case SPEEX_GET_SAMPLING_RATE:
-       *(spx_int32_t*)ptr = st->sampling_rate;
-       break;
-    case SPEEX_RESET_STATE:
-    {
-       /* Clear the synthesis filter memory, both QMF memories and the
-          stored excitation energy. */
-       int k;
-       for (k=0;k<2*st->lpcSize;k++)
-       {
-          st->mem_sp[k] = 0;
-       }
-       for (k=0;k<QMF_ORDER;k++)
-       {
-          st->g1_mem[k] = 0;
-          st->g0_mem[k] = 0;
-       }
-       st->last_ener = 0;
-       break;
-    }
-    case SPEEX_SET_SUBMODE_ENCODING:
-       st->encode_submode = *(spx_int32_t*)ptr;
-       speex_decoder_ctl(st->st_low, SPEEX_SET_SUBMODE_ENCODING, ptr);
-       break;
-    case SPEEX_GET_SUBMODE_ENCODING:
-       *(spx_int32_t*)ptr = st->encode_submode;
-       break;
-    case SPEEX_GET_LOOKAHEAD:
-       /* Report twice the low-band value. */
-       speex_decoder_ctl(st->st_low, SPEEX_GET_LOOKAHEAD, ptr);
-       *(spx_int32_t*)ptr = 2*(*(spx_int32_t*)ptr);
-       break;
-    case SPEEX_GET_PI_GAIN:
-    {
-       /* ptr receives nbSubframes spx_word32_t values. */
-       spx_word32_t *dst = (spx_word32_t*)ptr;
-       int k;
-       for (k=0;k<st->nbSubframes;k++)
-       {
-          dst[k] = st->pi_gain[k];
-       }
-       break;
-    }
-    case SPEEX_GET_EXC:
-    {
-       /* ptr receives nbSubframes spx_word16_t values. */
-       spx_word16_t *dst = (spx_word16_t*)ptr;
-       int k;
-       for (k=0;k<st->nbSubframes;k++)
-       {
-          dst[k] = st->exc_rms[k];
-       }
-       break;
-    }
-    case SPEEX_SET_INNOVATION_SAVE:
-       /* ptr itself is the buffer; it is stored, not dereferenced. */
-       st->innov_save = (spx_word16_t*)ptr;
-       break;
-    case SPEEX_GET_STACK:
-       *((char**)ptr) = st->stack;
-       break;
-    default:
-       speex_warning_int("Unknown nb_ctl request: ", request);
-       return -1;
-    }
-    return 0;
- }
- /* Synthesise the high band when no high-band data is decoded for a frame.
-  *
-  * st    : decoder state; mem_sp, g0_mem, g1_mem, seed and first are updated,
-  *         and (when dtx is 0) interp_qlpc and last_ener as well.
-  * out   : buffer of st->full_frame_size samples; the second half is filled
-  *         with values from speex_rand(st->last_ener, &st->seed), run through
-  *         iir_mem16 with st->interp_qlpc, and then qmf_synth combines both
-  *         halves in place.
-  * dtx   : when non-zero, st->submodeID is forced to 1 for the duration of the
-  *         call and restored afterwards. When zero, st->interp_qlpc is passed
-  *         through bw_lpc with factor 0.99 and st->last_ener is scaled by 0.9
-  *         before the noise is generated.
-  * stack : scratch stack handed on to the filter routines.
-  */
- static void sb_decode_lost(SBDecState *st, spx_word16_t *out, int dtx, char *stack)
- {
-    int n;
-    int prev_submode = 0;
-    spx_word16_t *high = out + st->frame_size;
-    if (dtx)
-    {
-       prev_submode = st->submodeID;
-       st->submodeID = 1;
-    } else {
-       bw_lpc(QCONST16(0.99f,15), st->interp_qlpc, st->interp_qlpc, st->lpcSize);
-       st->last_ener = MULT16_16_Q15(QCONST16(.9f,15),st->last_ener);
-    }
-    st->first = 1;
-    /* Noise excitation for the high band. */
-    for (n=0;n<st->frame_size;n++)
-    {
-       high[n] = speex_rand(st->last_ener, &st->seed);
-    }
-    /* Final signal synthesis from excitation */
-    iir_mem16(high, st->interp_qlpc, high, st->frame_size, st->lpcSize,
-              st->mem_sp, stack);
-    /* Reconstruct the original */
-    qmf_synth(out, high, h0, out, st->full_frame_size, QMF_ORDER, st->g0_mem, st->g1_mem, stack);
-    if (dtx)
-    {
-       st->submodeID = prev_submode;
-    }
- }
- int sb_decode(void *state, SpeexBits *bits, void *vout)
- { /* Decode one sub-band (wideband) frame from `bits` into `vout`.
-    *
-    * state : SBDecState for this stream.
-    * bits  : bit-stream positioned at the frame; when NULL (and the low-band
-    *         decoder returned 0) the high band is produced by sb_decode_lost().
-    * vout  : used as an array of spx_word16_t. The low-band decoder writes to
-    *         its start; the region from out+st->frame_size first receives the
-    *         low-band innovation (low_innov_alias) and is then overwritten,
-    *         subframe by subframe, with the high-band signal before qmf_synth()
-    *         combines both halves in place over st->full_frame_size samples.
-    *
-    * Returns the low-band decoder's return value when that is non-zero, -2
-    * when the submode read from the stream has no entry in st->submodes, and
-    * 0 otherwise.
-    */
- int i, sub;
- SBDecState *st;
- int wideband;
- int ret;
- char *stack;
- VARDECL(spx_word32_t *low_pi_gain);
- VARDECL(spx_word16_t *low_exc_rms);
- VARDECL(spx_coef_t *ak);
- VARDECL(spx_lsp_t *qlsp);
- VARDECL(spx_lsp_t *interp_qlsp);
- spx_int32_t dtx;
- const SpeexSBMode *mode;
- spx_word16_t *out = (spx_word16_t*)vout;
- spx_word16_t *low_innov_alias; /* points at out+frame_size, see below */
- spx_word32_t exc_ener_sum = 0; /* accumulates exc_rms[sub]^2 / nbSubframes */
- st = (SBDecState*)state;
- stack=st->stack;
- mode = (const SpeexSBMode*)(st->mode->mode);
- low_innov_alias = out+st->frame_size;
- speex_decoder_ctl(st->st_low, SPEEX_SET_INNOVATION_SAVE, low_innov_alias); /* low-band innovation is requested into the second half of out */
- /* Decode the low-band */
- ret = speex_decode_native(st->st_low, bits, out);
- speex_decoder_ctl(st->st_low, SPEEX_GET_DTX_STATUS, &dtx);
- /* If error decoding the narrowband part, propagate error */
- if (ret!=0)
- {
- return ret;
- }
- if (!bits) /* no bit-stream for this frame: let sb_decode_lost() fill the high band */
- {
- sb_decode_lost(st, out, dtx, stack);
- return 0;
- }
- if (st->encode_submode) /* submode information is carried in the stream */
- {
- /*Check "wideband bit"*/
- if (speex_bits_remaining(bits)>0)
- wideband = speex_bits_peek(bits);
- else
- wideband = 0;
- if (wideband)
- {
- /*Regular wideband frame, read the submode*/
- wideband = speex_bits_unpack_unsigned(bits, 1);
- st->submodeID = speex_bits_unpack_unsigned(bits, SB_SUBMODE_BITS);
- } else
- {
- /*Was a narrowband frame, set "null submode"*/
- st->submodeID = 0;
- }
- if (st->submodeID != 0 && st->submodes[st->submodeID] == NULL) /* non-zero ID without a table entry */
- {
- speex_notify("Invalid mode encountered. The stream is corrupted.");
- return -2;
- }
- }
- /* If null mode (no transmission), just set a couple things to zero*/
- if (st->submodes[st->submodeID] == NULL)
- {
- if (st->innov_save)
- SPEEX_MEMSET(st->innov_save, 0, st->full_frame_size);
- if (dtx) /* low band reports DTX: use the dtx path of sb_decode_lost() */
- {
- sb_decode_lost(st, out, 1, stack);
- return 0;
- }
- for (i=0;i<st->frame_size;i++)
- out[st->frame_size+i]=VERY_SMALL;
- st->first=1;
- /* Final signal synthesis from excitation */
- iir_mem16(out+st->frame_size, st->interp_qlpc, out+st->frame_size, st->frame_size, st->lpcSize, st->mem_sp, stack);
- qmf_synth(out, out+st->frame_size, h0, out, st->full_frame_size, QMF_ORDER, st->g0_mem, st->g1_mem, stack);
- return 0;
- }
- ALLOC(low_pi_gain, st->nbSubframes, spx_word32_t);
- ALLOC(low_exc_rms, st->nbSubframes, spx_word16_t);
- speex_decoder_ctl(st->st_low, SPEEX_GET_PI_GAIN, low_pi_gain); /* per-subframe values from the low band, used for filter_ratio */
- speex_decoder_ctl(st->st_low, SPEEX_GET_EXC, low_exc_rms); /* per-subframe values from the low band, used to scale the innovation */
- ALLOC(qlsp, st->lpcSize, spx_lsp_t);
- ALLOC(interp_qlsp, st->lpcSize, spx_lsp_t);
- SUBMODE(lsp_unquant)(qlsp, st->lpcSize, bits);
- if (st->first) /* st->first set: make old_qlsp equal to this frame's LSPs */
- {
- for (i=0;i<st->lpcSize;i++)
- st->old_qlsp[i] = qlsp[i];
- }
- ALLOC(ak, st->lpcSize, spx_coef_t);
- for (sub=0;sub<st->nbSubframes;sub++)
- {
- VARDECL(spx_word32_t *exc);
- spx_word16_t *innov_save=NULL;
- spx_word16_t *sp;
- spx_word16_t filter_ratio;
- spx_word16_t el=0;
- int offset;
- spx_word32_t rl=0,rh=0;
- offset = st->subframeSize*sub;
- sp=out+st->frame_size+offset; /* this subframe's slot in the high-band half of out */
- ALLOC(exc, st->subframeSize, spx_word32_t);
- /* Pointer for saving innovation: the caller's buffer is addressed with a
-    stride of two (2*offset here, innov_save[2*i] below), and the 2*subframeSize
-    span for this subframe is cleared first */
- if (st->innov_save)
- {
- innov_save = st->innov_save+2*offset;
- SPEEX_MEMSET(innov_save, 0, 2*st->subframeSize);
- }
- /* LSP interpolation */
- lsp_interpolate(st->old_qlsp, qlsp, interp_qlsp, st->lpcSize, sub, st->nbSubframes, LSP_MARGIN);
- /* LSP to LPC */
- lsp_to_lpc(interp_qlsp, ak, st->lpcSize, stack);
- /* Calculate response ratio between the low and high filter in the middle
- of the band (4000 Hz) */
- st->pi_gain[sub]=LPC_SCALING;
- rh = LPC_SCALING;
- for (i=0;i<st->lpcSize;i+=2) /* coefficients are consumed in pairs (ak[i], ak[i+1]) */
- {
- rh += ak[i+1] - ak[i];
- st->pi_gain[sub] += ak[i] + ak[i+1];
- }
- rl = low_pi_gain[sub];
- #ifdef FIXED_POINT
- filter_ratio=EXTRACT16(SATURATE(PDIV32(SHL32(ADD32(rl,82),7),ADD32(82,rh)),32767));
- #else
- filter_ratio=(rl+.01)/(rh+.01);
- #endif
- SPEEX_MEMSET(exc, 0, st->subframeSize);
- if (!SUBMODE(innovation_unquant)) /* submode has no innovation decoder: derive exc from the low-band innovation */
- {
- spx_word32_t g;
- int quant;
- quant = speex_bits_unpack_unsigned(bits, 5); /* 5-bit gain index */
- g= spx_exp(MULT16_16(QCONST16(.125f,11),(quant-10)));
- g = PDIV32(g, filter_ratio);
- for (i=0;i<st->subframeSize;i+=2) /* even samples keep their sign, odd samples are negated */
- {
- exc[i]=SHL32(MULT16_32_P15(MULT16_16_Q15(mode->folding_gain,low_innov_alias[offset+i]),SHL32(g,6)),SIG_SHIFT);
- exc[i+1]=NEG32(SHL32(MULT16_32_P15(MULT16_16_Q15(mode->folding_gain,low_innov_alias[offset+i+1]),SHL32(g,6)),SIG_SHIFT));
- }
- } else { /* submode provides innovation_unquant: read a gain index, then the innovation */
- spx_word16_t gc;
- spx_word32_t scale;
- int qgc = speex_bits_unpack_unsigned(bits, 4); /* 4-bit index into gc_quant_bound */
- el = low_exc_rms[sub];
- gc = MULT16_16_Q15(QCONST16(0.87360,15),gc_quant_bound[qgc]);
- if (st->subframeSize==80) /* extra 1.4142 factor applied only for 80-sample subframes */
- gc = MULT16_16_P14(QCONST16(1.4142f,14),gc);
- scale = SHL32(PDIV32(SHL32(MULT16_16(gc, el),3), filter_ratio),SIG_SHIFT-3);
- SUBMODE(innovation_unquant)(exc, SUBMODE(innovation_params), st->subframeSize,
- bits, stack, &st->seed);
- signal_mul(exc,exc,scale,st->subframeSize);
- if (SUBMODE(double_codebook)) { /* second innovation, weighted by 0.4*scale and added to exc */
- char *tmp_stack=stack; /* saved so that stack can be restored once innov2 is no longer needed */
- VARDECL(spx_sig_t *innov2);
- ALLOC(innov2, st->subframeSize, spx_sig_t);
- SPEEX_MEMSET(innov2, 0, st->subframeSize);
- SUBMODE(innovation_unquant)(innov2, SUBMODE(innovation_params), st->subframeSize,
- bits, stack, &st->seed);
- signal_mul(innov2, innov2, MULT16_32_P15(QCONST16(0.4f,15),scale), st->subframeSize);
- for (i=0;i<st->subframeSize;i++)
- exc[i] = ADD32(exc[i],innov2[i]);
- stack = tmp_stack;
- }
- }
- if (st->innov_save)
- {
- for (i=0;i<st->subframeSize;i++)
- innov_save[2*i]=EXTRACT16(PSHR32(exc[i],SIG_SHIFT));
- }
- iir_mem16(st->excBuf, st->interp_qlpc, sp, st->subframeSize, st->lpcSize, /* NOTE: runs on excBuf and interp_qlpc as they stand before this subframe's update just below */
- st->mem_sp, stack);
- for (i=0;i<st->subframeSize;i++)
- st->excBuf[i]=EXTRACT16(PSHR32(exc[i],SIG_SHIFT));
- for (i=0;i<st->lpcSize;i++)
- st->interp_qlpc[i] = ak[i];
- st->exc_rms[sub] = compute_rms16(st->excBuf, st->subframeSize);
- exc_ener_sum = ADD32(exc_ener_sum, DIV32(MULT16_16(st->exc_rms[sub],st->exc_rms[sub]), st->nbSubframes));
- }
- st->last_ener = spx_sqrt(exc_ener_sum); /* kept for sb_decode_lost(), which uses it as the noise level argument */
- qmf_synth(out, out+st->frame_size, h0, out, st->full_frame_size, QMF_ORDER, st->g0_mem, st->g1_mem, stack); /* combine both halves of out in place */
- for (i=0;i<st->lpcSize;i++)
- st->old_qlsp[i] = qlsp[i];
- st->first=0;
- return 0;
- }
- #endif /* DISABLE_DECODER */
- #endif
|