third_party/speex/libspeex/nb_celp.c

   1 /* Copyright (C) 2002-2006 Jean-Marc Valin
   2    File: nb_celp.c
   3
   4    Redistribution and use in source and binary forms, with or without
   5    modification, are permitted provided that the following conditions
   6    are met:
   7
   8    - Redistributions of source code must retain the above copyright
   9    notice, this list of conditions and the following disclaimer.
  10
  11    - Redistributions in binary form must reproduce the above copyright
  12    notice, this list of conditions and the following disclaimer in the
  13    documentation and/or other materials provided with the distribution.
  14
  15    - Neither the name of the Xiph.org Foundation nor the names of its
  16    contributors may be used to endorse or promote products derived from
  17    this software without specific prior written permission.
  18
  19    THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
  20    ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
  21    LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
  22    A PARTICULAR PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL THE FOUNDATION OR
  23    CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
  24    EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
  25    PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
  26    PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
  27    LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
  28    NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
  29    SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
  30 */
  31
  32 #ifdef HAVE_CONFIG_H
  33 #include "config.h"
  34 #endif
  35
  36 #include <math.h>
  37 #include "nb_celp.h"
  38 #include "lpc.h"
  39 #include "lsp.h"
  40 #include "ltp.h"
  41 #include "quant_lsp.h"
  42 #include "cb_search.h"
  43 #include "filters.h"
  44 #include "stack_alloc.h"
  45 #include "vq.h"
  46 #include <speex/speex_bits.h>
  47 #include "vbr.h"
  48 #include "arch.h"
  49 #include "math_approx.h"
  50 #include "os_support.h"
  51 #include <speex/speex_callbacks.h>
  52
  53 #ifdef VORBIS_PSYCHO
  54 #include "vorbis_psy.h"
  55 #endif
  56
  57 #ifndef M_PI
  58 #define M_PI           3.14159265358979323846  /* pi */
  59 #endif
  60
  61 #ifndef NULL
  62 #define NULL 0
  63 #endif
  64
  65 #define SUBMODE(x) st->submodes[st->submodeID]->x
  66
  67 /* Default size for the encoder and decoder stack (can be changed at compile time).
  68    This does not apply when using variable-size arrays or alloca. */
  69 #ifndef NB_ENC_STACK
  70 #define NB_ENC_STACK (8000*sizeof(spx_sig_t))
  71 #endif
  72
  73 #ifndef NB_DEC_STACK
  74 #define NB_DEC_STACK (4000*sizeof(spx_sig_t))
  75 #endif
  76
  77
  78 #ifdef FIXED_POINT
  79 const spx_word32_t ol_gain_table[32]={18900, 25150, 33468, 44536, 59265, 78865, 104946, 139653, 185838, 247297, 329081, 437913, 582736, 775454, 1031906, 1373169, 1827293, 2431601, 3235761, 4305867, 5729870, 7624808, 10146425, 13501971, 17967238, 23909222, 31816294, 42338330, 56340132, 74972501, 99766822, 132760927};
  80 const spx_word16_t exc_gain_quant_scal3_bound[7]={1841, 3883, 6051, 8062, 10444, 13580, 18560};
  81 const spx_word16_t exc_gain_quant_scal3[8]={1002, 2680, 5086, 7016, 9108, 11781, 15380, 21740};
  82 const spx_word16_t exc_gain_quant_scal1_bound[1]={14385};
  83 const spx_word16_t exc_gain_quant_scal1[2]={11546, 17224};
  84
  85 #define LSP_MARGIN 16
  86 #define LSP_DELTA1 6553
  87 #define LSP_DELTA2 1638
  88
  89 #else
  90
  91 const float exc_gain_quant_scal3_bound[7]={0.112338f, 0.236980f, 0.369316f, 0.492054f, 0.637471f, 0.828874f, 1.132784f};
  92 const float exc_gain_quant_scal3[8]={0.061130f, 0.163546f, 0.310413f, 0.428220f, 0.555887f, 0.719055f, 0.938694f, 1.326874f};
  93 const float exc_gain_quant_scal1_bound[1]={0.87798f};
  94 const float exc_gain_quant_scal1[2]={0.70469f, 1.05127f};
  95
  96 #define LSP_MARGIN .002f
  97 #define LSP_DELTA1 .2f
  98 #define LSP_DELTA2 .05f
  99
 100 #endif
 101
 102 #ifdef VORBIS_PSYCHO
 103 #define EXTRA_BUFFER 100
 104 #else
 105 #define EXTRA_BUFFER 0
 106 #endif
 107
 108
 109 #define sqr(x) ((x)*(x))
 110
 111 extern const spx_word16_t lag_window[];
 112 extern const spx_word16_t lpc_window[];
 113
 114 void *nb_encoder_init(const SpeexMode *m)
 115 {
 116    EncState *st;
 117    const SpeexNBMode *mode;
 118    int i;
 119
 120    mode=(const SpeexNBMode *)m->mode;
 121    st = (EncState*)speex_alloc(sizeof(EncState));
 122    if (!st)
 123       return NULL;
 124 #if defined(VAR_ARRAYS) || defined (USE_ALLOCA)
 125    st->stack = NULL;
 126 #else
 127    st->stack = (char*)speex_alloc_scratch(NB_ENC_STACK);
 128 #endif
 129
 130    st->mode=m;
 131
 132    st->frameSize = mode->frameSize;
 133    st->nbSubframes=mode->frameSize/mode->subframeSize;
 134    st->subframeSize=mode->subframeSize;
 135    st->windowSize = st->frameSize+st->subframeSize;
 136    st->lpcSize = mode->lpcSize;
 137    st->gamma1=mode->gamma1;
 138    st->gamma2=mode->gamma2;
 139    st->min_pitch=mode->pitchStart;
 140    st->max_pitch=mode->pitchEnd;
 141    st->lpc_floor = mode->lpc_floor;
 142
 143    st->submodes=mode->submodes;
 144    st->submodeID=st->submodeSelect=mode->defaultSubmode;
 145    st->bounded_pitch = 1;
 146
 147    st->encode_submode = 1;
 148
 149 #ifdef VORBIS_PSYCHO
 150    st->psy = vorbis_psy_init(8000, 256);
 151    st->curve = (float*)speex_alloc(128*sizeof(float));
 152    st->old_curve = (float*)speex_alloc(128*sizeof(float));
 153    st->psy_window = (float*)speex_alloc(256*sizeof(float));
 154 #endif
 155
 156    st->cumul_gain = 1024;
 157
 158    /* Allocating input buffer */
 159    st->winBuf = (spx_word16_t*)speex_alloc((st->windowSize-st->frameSize)*sizeof(spx_word16_t));
 160    /* Allocating excitation buffer */
 161    st->excBuf = (spx_word16_t*)speex_alloc((mode->frameSize+mode->pitchEnd+2)*sizeof(spx_word16_t));
 162    st->exc = st->excBuf + mode->pitchEnd + 2;
 163    st->swBuf = (spx_word16_t*)speex_alloc((mode->frameSize+mode->pitchEnd+2)*sizeof(spx_word16_t));
 164    st->sw = st->swBuf + mode->pitchEnd + 2;
 165
 166    st->window= lpc_window;
 167
 168    /* Create the window for autocorrelation (lag-windowing) */
 169    st->lagWindow = lag_window;
 170
 171    st->old_lsp = (spx_lsp_t*)speex_alloc((st->lpcSize)*sizeof(spx_lsp_t));
 172    st->old_qlsp = (spx_lsp_t*)speex_alloc((st->lpcSize)*sizeof(spx_lsp_t));
 173    st->first = 1;
 174    for (i=0;i<st->lpcSize;i++)
 175       st->old_lsp[i]= DIV32(MULT16_16(QCONST16(3.1415927f, LSP_SHIFT), i+1), st->lpcSize+1);
 176
 177    st->mem_sp = (spx_mem_t*)speex_alloc((st->lpcSize)*sizeof(spx_mem_t));
 178    st->mem_sw = (spx_mem_t*)speex_alloc((st->lpcSize)*sizeof(spx_mem_t));
 179    st->mem_sw_whole = (spx_mem_t*)speex_alloc((st->lpcSize)*sizeof(spx_mem_t));
 180    st->mem_exc = (spx_mem_t*)speex_alloc((st->lpcSize)*sizeof(spx_mem_t));
 181    st->mem_exc2 = (spx_mem_t*)speex_alloc((st->lpcSize)*sizeof(spx_mem_t));
 182
 183    st->pi_gain = (spx_word32_t*)speex_alloc((st->nbSubframes)*sizeof(spx_word32_t));
 184    st->innov_rms_save = NULL;
 185
 186    st->pitch = (int*)speex_alloc((st->nbSubframes)*sizeof(int));
 187
 188 #ifndef DISABLE_VBR
 189    st->vbr = (VBRState*)speex_alloc(sizeof(VBRState));
 190    vbr_init(st->vbr);
 191    st->vbr_quality = 8;
 192    st->vbr_enabled = 0;
 193    st->vbr_max = 0;
 194    st->vad_enabled = 0;
 195    st->dtx_enabled = 0;
 196    st->dtx_count=0;
 197    st->abr_enabled = 0;
 198    st->abr_drift = 0;
 199    st->abr_drift2 = 0;
 200 #endif /* #ifndef DISABLE_VBR */
 201
 202    st->plc_tuning = 2;
 203    st->complexity=2;
 204    st->sampling_rate=8000;
 205    st->isWideband = 0;
 206    st->highpass_enabled = 1;
 207
 208 #ifdef ENABLE_VALGRIND
 209    VALGRIND_MAKE_READABLE(st, NB_ENC_STACK);
 210 #endif
 211    return st;
 212 }
 213
 214 void nb_encoder_destroy(void *state)
 215 {
 216    EncState *st=(EncState *)state;
 217    /* Free all allocated memory */
 218 #if !(defined(VAR_ARRAYS) || defined (USE_ALLOCA))
 219    speex_free_scratch(st->stack);
 220 #endif
 221
 222    speex_free (st->winBuf);
 223    speex_free (st->excBuf);
 224    speex_free (st->old_qlsp);
 225    speex_free (st->swBuf);
 226
 227    speex_free (st->old_lsp);
 228    speex_free (st->mem_sp);
 229    speex_free (st->mem_sw);
 230    speex_free (st->mem_sw_whole);
 231    speex_free (st->mem_exc);
 232    speex_free (st->mem_exc2);
 233    speex_free (st->pi_gain);
 234    speex_free (st->pitch);
 235
 236 #ifndef DISABLE_VBR
 237    vbr_destroy(st->vbr);
 238    speex_free (st->vbr);
 239 #endif /* #ifndef DISABLE_VBR */
 240
 241 #ifdef VORBIS_PSYCHO
 242    vorbis_psy_destroy(st->psy);
 243    speex_free (st->curve);
 244    speex_free (st->old_curve);
 245    speex_free (st->psy_window);
 246 #endif
 247
 248    /*Free state memory... should be last*/
 249    speex_free(st);
 250 }
 251
 252 int nb_encode(void *state, void *vin, SpeexBits *bits)
 253 {
 254    EncState *st;
 255    int i, sub, roots;
 256    int ol_pitch;
 257    spx_word16_t ol_pitch_coef;
 258    spx_word32_t ol_gain;
 259    VARDECL(spx_word16_t *ringing);
 260    VARDECL(spx_word16_t *target);
 261    VARDECL(spx_sig_t *innov);
 262    VARDECL(spx_word32_t *exc32);
 263    VARDECL(spx_mem_t *mem);
 264    VARDECL(spx_coef_t *bw_lpc1);
 265    VARDECL(spx_coef_t *bw_lpc2);
 266    VARDECL(spx_coef_t *lpc);
 267    VARDECL(spx_lsp_t *lsp);
 268    VARDECL(spx_lsp_t *qlsp);
 269    VARDECL(spx_lsp_t *interp_lsp);
 270    VARDECL(spx_lsp_t *interp_qlsp);
 271    VARDECL(spx_coef_t *interp_lpc);
 272    VARDECL(spx_coef_t *interp_qlpc);
 273    char *stack;
 274    VARDECL(spx_word16_t *syn_resp);
 275    VARDECL(spx_word16_t *real_exc);
 276
 277    spx_word32_t ener=0;
 278    spx_word16_t fine_gain;
 279    spx_word16_t *in = (spx_word16_t*)vin;
 280
 281    st=(EncState *)state;
 282    stack=st->stack;
 283
 284    ALLOC(lpc, st->lpcSize, spx_coef_t);
 285    ALLOC(bw_lpc1, st->lpcSize, spx_coef_t);
 286    ALLOC(bw_lpc2, st->lpcSize, spx_coef_t);
 287    ALLOC(lsp, st->lpcSize, spx_lsp_t);
 288    ALLOC(qlsp, st->lpcSize, spx_lsp_t);
 289    ALLOC(interp_lsp, st->lpcSize, spx_lsp_t);
 290    ALLOC(interp_qlsp, st->lpcSize, spx_lsp_t);
 291    ALLOC(interp_lpc, st->lpcSize, spx_coef_t);
 292    ALLOC(interp_qlpc, st->lpcSize, spx_coef_t);
 293
 294    /* Move signals 1 frame towards the past */
 295    SPEEX_MOVE(st->excBuf, st->excBuf+st->frameSize, st->max_pitch+2);
 296    SPEEX_MOVE(st->swBuf, st->swBuf+st->frameSize, st->max_pitch+2);
 297
 298    if (st->highpass_enabled)
 299       highpass(in, in, st->frameSize, (st->isWideband?HIGHPASS_WIDEBAND:HIGHPASS_NARROWBAND)|HIGHPASS_INPUT, st->mem_hp);
 300
 301    {
 302       VARDECL(spx_word16_t *w_sig);
 303       VARDECL(spx_word16_t *autocorr);
 304       ALLOC(w_sig, st->windowSize, spx_word16_t);
 305       ALLOC(autocorr, st->lpcSize+1, spx_word16_t);
 306       /* Window for analysis */
 307       for (i=0;i<st->windowSize-st->frameSize;i++)
 308          w_sig[i] = EXTRACT16(SHR32(MULT16_16(st->winBuf[i],st->window[i]),SIG_SHIFT));
 309       for (;i<st->windowSize;i++)
 310          w_sig[i] = EXTRACT16(SHR32(MULT16_16(in[i-st->windowSize+st->frameSize],st->window[i]),SIG_SHIFT));
 311       /* Compute auto-correlation */
 312       _spx_autocorr(w_sig, autocorr, st->lpcSize+1, st->windowSize);
 313       autocorr[0] = ADD16(autocorr[0],MULT16_16_Q15(autocorr[0],st->lpc_floor)); /* Noise floor in auto-correlation domain */
 314
 315       /* Lag windowing: equivalent to filtering in the power-spectrum domain */
 316       for (i=0;i<st->lpcSize+1;i++)
 317          autocorr[i] = MULT16_16_Q14(autocorr[i],st->lagWindow[i]);
 318
 319       /* Levinson-Durbin */
 320       _spx_lpc(lpc, autocorr, st->lpcSize);
 321       /* LPC to LSPs (x-domain) transform */
 322       roots=lpc_to_lsp (lpc, st->lpcSize, lsp, 10, LSP_DELTA1, stack);
 323       /* Check if we found all the roots */
 324       if (roots!=st->lpcSize)
 325       {
 326          /*If we can't find all LSP's, do some damage control and use previous filter*/
 327          for (i=0;i<st->lpcSize;i++)
 328          {
 329             lsp[i]=st->old_lsp[i];
 330          }
 331       }
 332    }
 333
 334
 335
 336
 337    /* Whole frame analysis (open-loop estimation of pitch and excitation gain) */
 338    {
 339       int diff = st->windowSize-st->frameSize;
 340       if (st->first)
 341          for (i=0;i<st->lpcSize;i++)
 342             interp_lsp[i] = lsp[i];
 343       else
 344          lsp_interpolate(st->old_lsp, lsp, interp_lsp, st->lpcSize, st->nbSubframes, st->nbSubframes<<1);
 345
 346       lsp_enforce_margin(interp_lsp, st->lpcSize, LSP_MARGIN);
 347
 348       /* Compute interpolated LPCs (unquantized) for whole frame*/
 349       lsp_to_lpc(interp_lsp, interp_lpc, st->lpcSize,stack);
 350
 351
 352       /*Open-loop pitch*/
 353       if (!st->submodes[st->submodeID] || (st->complexity>2 && SUBMODE(have_subframe_gain)<3) || SUBMODE(forced_pitch_gain) || SUBMODE(lbr_pitch) != -1
 354 #ifndef DISABLE_VBR
 355            || st->vbr_enabled || st->vad_enabled
 356 #endif
 357                   )
 358       {
 359          int nol_pitch[6];
 360          spx_word16_t nol_pitch_coef[6];
 361
 362          bw_lpc(st->gamma1, interp_lpc, bw_lpc1, st->lpcSize);
 363          bw_lpc(st->gamma2, interp_lpc, bw_lpc2, st->lpcSize);
 364
 365          SPEEX_COPY(st->sw, st->winBuf, diff);
 366          SPEEX_COPY(st->sw+diff, in, st->frameSize-diff);
 367          filter_mem16(st->sw, bw_lpc1, bw_lpc2, st->sw, st->frameSize, st->lpcSize, st->mem_sw_whole, stack);
 368
 369          open_loop_nbest_pitch(st->sw, st->min_pitch, st->max_pitch, st->frameSize,
 370                                nol_pitch, nol_pitch_coef, 6, stack);
 371          ol_pitch=nol_pitch[0];
 372          ol_pitch_coef = nol_pitch_coef[0];
 373          /*Try to remove pitch multiples*/
 374          for (i=1;i<6;i++)
 375          {
 376 #ifdef FIXED_POINT
 377             if ((nol_pitch_coef[i]>MULT16_16_Q15(nol_pitch_coef[0],27853)) &&
 378 #else
 379             if ((nol_pitch_coef[i]>.85*nol_pitch_coef[0]) &&
 380 #endif
 381                 (ABS(2*nol_pitch[i]-ol_pitch)<=2 || ABS(3*nol_pitch[i]-ol_pitch)<=3 ||
 382                  ABS(4*nol_pitch[i]-ol_pitch)<=4 || ABS(5*nol_pitch[i]-ol_pitch)<=5))
 383             {
 384                /*ol_pitch_coef=nol_pitch_coef[i];*/
 385                ol_pitch = nol_pitch[i];
 386             }
 387          }
 388          /*if (ol_pitch>50)
 389            ol_pitch/=2;*/
 390          /*ol_pitch_coef = sqrt(ol_pitch_coef);*/
 391
 392       } else {
 393          ol_pitch=0;
 394          ol_pitch_coef=0;
 395       }
 396
 397       /*Compute "real" excitation*/
 398       SPEEX_COPY(st->exc, st->winBuf, diff);
 399       SPEEX_COPY(st->exc+diff, in, st->frameSize-diff);
 400       fir_mem16(st->exc, interp_lpc, st->exc, st->frameSize, st->lpcSize, st->mem_exc, stack);
 401
 402       /* Compute open-loop excitation gain */
 403       {
 404          spx_word16_t g = compute_rms16(st->exc, st->frameSize);
 405          if (st->submodeID!=1 && ol_pitch>0)
 406             ol_gain = MULT16_16(g, MULT16_16_Q14(QCONST16(1.1,14),
 407                                 spx_sqrt(QCONST32(1.,28)-MULT16_32_Q15(QCONST16(.8,15),SHL32(MULT16_16(ol_pitch_coef,ol_pitch_coef),16)))));
 408          else
 409             ol_gain = SHL32(EXTEND32(g),SIG_SHIFT);
 410       }
 411    }
 412
 413 #ifdef VORBIS_PSYCHO
 414    SPEEX_MOVE(st->psy_window, st->psy_window+st->frameSize, 256-st->frameSize);
 415    SPEEX_COPY(&st->psy_window[256-st->frameSize], in, st->frameSize);
 416    compute_curve(st->psy, st->psy_window, st->curve);
 417    /*print_vec(st->curve, 128, "curve");*/
 418    if (st->first)
 419       SPEEX_COPY(st->old_curve, st->curve, 128);
 420 #endif
 421
 422    /*VBR stuff*/
 423 #ifndef DISABLE_VBR
 424    if (st->vbr && (st->vbr_enabled||st->vad_enabled))
 425    {
 426       float lsp_dist=0;
 427       for (i=0;i<st->lpcSize;i++)
 428          lsp_dist += (st->old_lsp[i] - lsp[i])*(st->old_lsp[i] - lsp[i]);
 429       lsp_dist /= LSP_SCALING*LSP_SCALING;
 430
 431       if (st->abr_enabled)
 432       {
 433          float qual_change=0;
 434          if (st->abr_drift2 * st->abr_drift > 0)
 435          {
 436             /* Only adapt if long-term and short-term drift are the same sign */
 437             qual_change = -.00001*st->abr_drift/(1+st->abr_count);
 438             if (qual_change>.05)
 439                qual_change=.05;
 440             if (qual_change<-.05)
 441                qual_change=-.05;
 442          }
 443          st->vbr_quality += qual_change;
 444          if (st->vbr_quality>10)
 445             st->vbr_quality=10;
 446          if (st->vbr_quality<0)
 447             st->vbr_quality=0;
 448       }
 449
 450       st->relative_quality = vbr_analysis(st->vbr, in, st->frameSize, ol_pitch, GAIN_SCALING_1*ol_pitch_coef);
 451       /*if (delta_qual<0)*/
 452       /*  delta_qual*=.1*(3+st->vbr_quality);*/
 453       if (st->vbr_enabled)
 454       {
 455          spx_int32_t mode;
 456          int choice=0;
 457          float min_diff=100;
 458          mode = 8;
 459          while (mode)
 460          {
 461             int v1;
 462             float thresh;
 463             v1=(int)floor(st->vbr_quality);
 464             if (v1==10)
 465                thresh = vbr_nb_thresh[mode][v1];
 466             else
 467                thresh = (st->vbr_quality-v1)*vbr_nb_thresh[mode][v1+1] + (1+v1-st->vbr_quality)*vbr_nb_thresh[mode][v1];
 468             if (st->relative_quality > thresh &&
 469                 st->relative_quality-thresh<min_diff)
 470             {
 471                choice = mode;
 472                min_diff = st->relative_quality-thresh;
 473             }
 474             mode--;
 475          }
 476          mode=choice;
 477          if (mode==0)
 478          {
 479             if (st->dtx_count==0 || lsp_dist>.05 || !st->dtx_enabled || st->dtx_count>20)
 480             {
 481                mode=1;
 482                st->dtx_count=1;
 483             } else {
 484                mode=0;
 485                st->dtx_count++;
 486             }
 487          } else {
 488             st->dtx_count=0;
 489          }
 490
 491          speex_encoder_ctl(state, SPEEX_SET_MODE, &mode);
 492          if (st->vbr_max>0)
 493          {
 494             spx_int32_t rate;
 495             speex_encoder_ctl(state, SPEEX_GET_BITRATE, &rate);
 496             if (rate > st->vbr_max)
 497             {
 498                rate = st->vbr_max;
 499                speex_encoder_ctl(state, SPEEX_SET_BITRATE, &rate);
 500             }
 501          }
 502
 503          if (st->abr_enabled)
 504          {
 505             spx_int32_t bitrate;
 506             speex_encoder_ctl(state, SPEEX_GET_BITRATE, &bitrate);
 507             st->abr_drift+=(bitrate-st->abr_enabled);
 508             st->abr_drift2 = .95*st->abr_drift2 + .05*(bitrate-st->abr_enabled);
 509             st->abr_count += 1.0;
 510          }
 511
 512       } else {
 513          /*VAD only case*/
 514          int mode;
 515          if (st->relative_quality<2)
 516          {
 517             if (st->dtx_count==0 || lsp_dist>.05 || !st->dtx_enabled || st->dtx_count>20)
 518             {
 519                st->dtx_count=1;
 520                mode=1;
 521             } else {
 522                mode=0;
 523                st->dtx_count++;
 524             }
 525          } else {
 526             st->dtx_count = 0;
 527             mode=st->submodeSelect;
 528          }
 529          /*speex_encoder_ctl(state, SPEEX_SET_MODE, &mode);*/
 530          st->submodeID=mode;
 531       }
 532    } else {
 533       st->relative_quality = -1;
 534    }
 535 #endif /* #ifndef DISABLE_VBR */
 536
 537    if (st->encode_submode)
 538    {
 539       /* First, transmit a zero for narrowband */
 540       speex_bits_pack(bits, 0, 1);
 541
 542       /* Transmit the sub-mode we use for this frame */
 543       speex_bits_pack(bits, st->submodeID, NB_SUBMODE_BITS);
 544
 545    }
 546
 547    /* If null mode (no transmission), just set a couple things to zero*/
 548    if (st->submodes[st->submodeID] == NULL)
 549    {
 550       for (i=0;i<st->frameSize;i++)
 551          st->exc[i]=st->sw[i]=VERY_SMALL;
 552
 553       for (i=0;i<st->lpcSize;i++)
 554          st->mem_sw[i]=0;
 555       st->first=1;
 556       st->bounded_pitch = 1;
 557
 558       SPEEX_COPY(st->winBuf, in+2*st->frameSize-st->windowSize, st->windowSize-st->frameSize);
 559
 560       /* Clear memory (no need to really compute it) */
 561       for (i=0;i<st->lpcSize;i++)
 562          st->mem_sp[i] = 0;
 563       return 0;
 564
 565    }
 566
 567    /* LSP Quantization */
 568    if (st->first)
 569    {
 570       for (i=0;i<st->lpcSize;i++)
 571          st->old_lsp[i] = lsp[i];
 572    }
 573
 574
 575    /*Quantize LSPs*/
 576 #if 1 /*0 for unquantized*/
 577    SUBMODE(lsp_quant)(lsp, qlsp, st->lpcSize, bits);
 578 #else
 579    for (i=0;i<st->lpcSize;i++)
 580      qlsp[i]=lsp[i];
 581 #endif
 582
 583    /*If we use low bit-rate pitch mode, transmit open-loop pitch*/
 584    if (SUBMODE(lbr_pitch)!=-1)
 585    {
 586       speex_bits_pack(bits, ol_pitch-st->min_pitch, 7);
 587    }
 588
 589    if (SUBMODE(forced_pitch_gain))
 590    {
 591       int quant;
 592       /* This just damps the pitch a bit, because it tends to be too aggressive when forced */
 593       ol_pitch_coef = MULT16_16_Q15(QCONST16(.9,15), ol_pitch_coef);
 594 #ifdef FIXED_POINT
 595       quant = PSHR16(MULT16_16_16(15, ol_pitch_coef),GAIN_SHIFT);
 596 #else
 597       quant = (int)floor(.5+15*ol_pitch_coef*GAIN_SCALING_1);
 598 #endif
 599       if (quant>15)
 600          quant=15;
 601       if (quant<0)
 602          quant=0;
 603       speex_bits_pack(bits, quant, 4);
 604       ol_pitch_coef=MULT16_16_P15(QCONST16(0.066667,15),SHL16(quant,GAIN_SHIFT));
 605    }
 606
 607
 608    /*Quantize and transmit open-loop excitation gain*/
 609 #ifdef FIXED_POINT
 610    {
 611       int qe = scal_quant32(ol_gain, ol_gain_table, 32);
 612       /*ol_gain = exp(qe/3.5)*SIG_SCALING;*/
 613       ol_gain = MULT16_32_Q15(28406,ol_gain_table[qe]);
 614       speex_bits_pack(bits, qe, 5);
 615    }
 616 #else
 617    {
 618       int qe = (int)(floor(.5+3.5*log(ol_gain*1.0/SIG_SCALING)));
 619       if (qe<0)
 620          qe=0;
 621       if (qe>31)
 622          qe=31;
 623       ol_gain = exp(qe/3.5)*SIG_SCALING;
 624       speex_bits_pack(bits, qe, 5);
 625    }
 626 #endif
 627
 628
 629
 630    /* Special case for first frame */
 631    if (st->first)
 632    {
 633       for (i=0;i<st->lpcSize;i++)
 634          st->old_qlsp[i] = qlsp[i];
 635    }
 636
 637    /* Target signal */
 638    ALLOC(target, st->subframeSize, spx_word16_t);
 639    ALLOC(innov, st->subframeSize, spx_sig_t);
 640    ALLOC(exc32, st->subframeSize, spx_word32_t);
 641    ALLOC(ringing, st->subframeSize, spx_word16_t);
 642    ALLOC(syn_resp, st->subframeSize, spx_word16_t);
 643    ALLOC(real_exc, st->subframeSize, spx_word16_t);
 644    ALLOC(mem, st->lpcSize, spx_mem_t);
 645
 646    /* Loop on sub-frames */
 647    for (sub=0;sub<st->nbSubframes;sub++)
 648    {
 649       int   offset;
 650       spx_word16_t *sw;
 651       spx_word16_t *exc;
 652       int pitch;
 653       int response_bound = st->subframeSize;
 654
 655       /* Offset relative to start of frame */
 656       offset = st->subframeSize*sub;
 657       /* Excitation */
 658       exc=st->exc+offset;
 659       /* Weighted signal */
 660       sw=st->sw+offset;
 661
 662       /* LSP interpolation (quantized and unquantized) */
 663       lsp_interpolate(st->old_lsp, lsp, interp_lsp, st->lpcSize, sub, st->nbSubframes);
 664       lsp_interpolate(st->old_qlsp, qlsp, interp_qlsp, st->lpcSize, sub, st->nbSubframes);
 665
 666       /* Make sure the filters are stable */
 667       lsp_enforce_margin(interp_lsp, st->lpcSize, LSP_MARGIN);
 668       lsp_enforce_margin(interp_qlsp, st->lpcSize, LSP_MARGIN);
 669
 670       /* Compute interpolated LPCs (quantized and unquantized) */
 671       lsp_to_lpc(interp_lsp, interp_lpc, st->lpcSize,stack);
 672
 673       lsp_to_lpc(interp_qlsp, interp_qlpc, st->lpcSize, stack);
 674
 675       /* Compute analysis filter gain at w=pi (for use in SB-CELP) */
 676       {
 677          spx_word32_t pi_g=LPC_SCALING;
 678          for (i=0;i<st->lpcSize;i+=2)
 679          {
 680             /*pi_g += -st->interp_qlpc[i] +  st->interp_qlpc[i+1];*/
 681             pi_g = ADD32(pi_g, SUB32(EXTEND32(interp_qlpc[i+1]),EXTEND32(interp_qlpc[i])));
 682          }
 683          st->pi_gain[sub] = pi_g;
 684       }
 685
 686 #ifdef VORBIS_PSYCHO
 687       {
 688          float curr_curve[128];
 689          float fact = ((float)sub+1.0f)/st->nbSubframes;
 690          for (i=0;i<128;i++)
 691             curr_curve[i] = (1.0f-fact)*st->old_curve[i] + fact*st->curve[i];
 692          curve_to_lpc(st->psy, curr_curve, bw_lpc1, bw_lpc2, 10);
 693       }
 694 #else
 695       /* Compute bandwidth-expanded (unquantized) LPCs for perceptual weighting */
 696       bw_lpc(st->gamma1, interp_lpc, bw_lpc1, st->lpcSize);
 697       if (st->gamma2>=0)
 698          bw_lpc(st->gamma2, interp_lpc, bw_lpc2, st->lpcSize);
 699       else
 700       {
 701          for (i=0;i<st->lpcSize;i++)
 702             bw_lpc2[i]=0;
 703       }
 704       /*print_vec(st->bw_lpc1, 10, "bw_lpc");*/
 705 #endif
 706
 707       /*FIXME: This will break if we change the window size */
 708       speex_assert(st->windowSize-st->frameSize == st->subframeSize);
 709       if (sub==0)
 710       {
 711          for (i=0;i<st->subframeSize;i++)
 712             real_exc[i] = sw[i] = st->winBuf[i];
 713       } else {
 714          for (i=0;i<st->subframeSize;i++)
 715             real_exc[i] = sw[i] = in[i+((sub-1)*st->subframeSize)];
 716       }
 717       fir_mem16(real_exc, interp_qlpc, real_exc, st->subframeSize, st->lpcSize, st->mem_exc2, stack);
 718
 719       if (st->complexity==0)
 720          response_bound >>= 1;
 721       compute_impulse_response(interp_qlpc, bw_lpc1, bw_lpc2, syn_resp, response_bound, st->lpcSize, stack);
 722       for (i=response_bound;i<st->subframeSize;i++)
 723          syn_resp[i]=VERY_SMALL;
 724
 725       /* Compute zero response of A(z/g1) / ( A(z/g2) * A(z) ) */
 726       for (i=0;i<st->lpcSize;i++)
 727          mem[i]=SHL32(st->mem_sp[i],1);
 728       for (i=0;i<st->subframeSize;i++)
 729          ringing[i] = VERY_SMALL;
 730 #ifdef SHORTCUTS2
 731       iir_mem16(ringing, interp_qlpc, ringing, response_bound, st->lpcSize, mem, stack);
 732       for (i=0;i<st->lpcSize;i++)
 733          mem[i]=SHL32(st->mem_sw[i],1);
 734       filter_mem16(ringing, st->bw_lpc1, st->bw_lpc2, ringing, response_bound, st->lpcSize, mem, stack);
 735       SPEEX_MEMSET(&ringing[response_bound], 0, st->subframeSize-response_bound);
 736 #else
 737       iir_mem16(ringing, interp_qlpc, ringing, st->subframeSize, st->lpcSize, mem, stack);
 738       for (i=0;i<st->lpcSize;i++)
 739          mem[i]=SHL32(st->mem_sw[i],1);
 740       filter_mem16(ringing, bw_lpc1, bw_lpc2, ringing, st->subframeSize, st->lpcSize, mem, stack);
 741 #endif
 742
 743       /* Compute weighted signal */
 744       for (i=0;i<st->lpcSize;i++)
 745          mem[i]=st->mem_sw[i];
 746       filter_mem16(sw, bw_lpc1, bw_lpc2, sw, st->subframeSize, st->lpcSize, mem, stack);
 747
 748       if (st->complexity==0)
 749          for (i=0;i<st->lpcSize;i++)
 750             st->mem_sw[i]=mem[i];
 751
 752       /* Compute target signal (saturation prevents overflows on clipped input speech) */
 753       for (i=0;i<st->subframeSize;i++)
 754          target[i]=EXTRACT16(SATURATE(SUB32(sw[i],PSHR32(ringing[i],1)),32767));
 755
 756       /* Reset excitation */
 757       SPEEX_MEMSET(exc, 0, st->subframeSize);
 758
 759       /* If we have a long-term predictor (otherwise, something's wrong) */
 760       speex_assert (SUBMODE(ltp_quant));
 761       {
 762          int pit_min, pit_max;
 763          /* Long-term prediction */
 764          if (SUBMODE(lbr_pitch) != -1)
 765          {
 766             /* Low bit-rate pitch handling */
 767             int margin;
 768             margin = SUBMODE(lbr_pitch);
 769             if (margin)
 770             {
 771                if (ol_pitch < st->min_pitch+margin-1)
 772                   ol_pitch=st->min_pitch+margin-1;
 773                if (ol_pitch > st->max_pitch-margin)
 774                   ol_pitch=st->max_pitch-margin;
 775                pit_min = ol_pitch-margin+1;
 776                pit_max = ol_pitch+margin;
 777             } else {
 778                pit_min=pit_max=ol_pitch;
 779             }
 780          } else {
 781             pit_min = st->min_pitch;
 782             pit_max = st->max_pitch;
 783          }
 784
 785          /* Force pitch to use only the current frame if needed */
 786          if (st->bounded_pitch && pit_max>offset)
 787             pit_max=offset;
 788
 789          /* Perform pitch search */
 790          pitch = SUBMODE(ltp_quant)(target, sw, interp_qlpc, bw_lpc1, bw_lpc2,
 791                                     exc32, SUBMODE(ltp_params), pit_min, pit_max, ol_pitch_coef,
 792                                     st->lpcSize, st->subframeSize, bits, stack,
 793                                     exc, syn_resp, st->complexity, 0, st->plc_tuning, &st->cumul_gain);
 794
 795          st->pitch[sub]=pitch;
 796       }
 797       /* Quantization of innovation */
 798       SPEEX_MEMSET(innov, 0, st->subframeSize);
 799
 800       /* FIXME: Make sure this is save from overflows (so far so good) */
 801       for (i=0;i<st->subframeSize;i++)
 802          real_exc[i] = EXTRACT16(SUB32(EXTEND32(real_exc[i]), PSHR32(exc32[i],SIG_SHIFT-1)));
 803
 804       ener = SHL32(EXTEND32(compute_rms16(real_exc, st->subframeSize)),SIG_SHIFT);
 805
 806       /*FIXME: Should use DIV32_16 and make sure result fits in 16 bits */
 807 #ifdef FIXED_POINT
 808       {
 809          spx_word32_t f = PDIV32(ener,PSHR32(ol_gain,SIG_SHIFT));
 810          if (f<=32767)
 811             fine_gain = f;
 812          else
 813             fine_gain = 32767;
 814       }
 815 #else
 816       fine_gain = PDIV32_16(ener,PSHR32(ol_gain,SIG_SHIFT));
 817 #endif
 818       /* Calculate gain correction for the sub-frame (if any) */
 819       if (SUBMODE(have_subframe_gain))
 820       {
 821          int qe;
 822          if (SUBMODE(have_subframe_gain)==3)
 823          {
 824             qe = scal_quant(fine_gain, exc_gain_quant_scal3_bound, 8);
 825             speex_bits_pack(bits, qe, 3);
 826             ener=MULT16_32_Q14(exc_gain_quant_scal3[qe],ol_gain);
 827          } else {
 828             qe = scal_quant(fine_gain, exc_gain_quant_scal1_bound, 2);
 829             speex_bits_pack(bits, qe, 1);
 830             ener=MULT16_32_Q14(exc_gain_quant_scal1[qe],ol_gain);
 831          }
 832       } else {
 833          ener=ol_gain;
 834       }
 835
 836       /*printf ("%f %f\n", ener, ol_gain);*/
 837
 838       /* Normalize innovation */
 839       signal_div(target, target, ener, st->subframeSize);
 840
 841       /* Quantize innovation */
 842       speex_assert (SUBMODE(innovation_quant));
 843       {
 844          /* Codebook search */
 845          SUBMODE(innovation_quant)(target, interp_qlpc, bw_lpc1, bw_lpc2,
 846                   SUBMODE(innovation_params), st->lpcSize, st->subframeSize,
 847                   innov, syn_resp, bits, stack, st->complexity, SUBMODE(double_codebook));
 848
 849          /* De-normalize innovation and update excitation */
 850          signal_mul(innov, innov, ener, st->subframeSize);
 851
 852          for (i=0;i<st->subframeSize;i++)
 853             exc[i] = EXTRACT16(SATURATE32(PSHR32(ADD32(SHL32(exc32[i],1),innov[i]),SIG_SHIFT),32767));
 854
 855          /* In some (rare) modes, we do a second search (more bits) to reduce noise even more */
 856          if (SUBMODE(double_codebook)) {
 857             char *tmp_stack=stack;
 858             VARDECL(spx_sig_t *innov2);
 859             ALLOC(innov2, st->subframeSize, spx_sig_t);
 860             SPEEX_MEMSET(innov2, 0, st->subframeSize);
 861             for (i=0;i<st->subframeSize;i++)
 862                target[i]=MULT16_16_P13(QCONST16(2.2f,13), target[i]);
 863             SUBMODE(innovation_quant)(target, interp_qlpc, bw_lpc1, bw_lpc2,
 864                                       SUBMODE(innovation_params), st->lpcSize, st->subframeSize,
 865                                       innov2, syn_resp, bits, stack, st->complexity, 0);
 866             signal_mul(innov2, innov2, MULT16_32_Q15(QCONST16(0.454545f,15),ener), st->subframeSize);
 867             for (i=0;i<st->subframeSize;i++)
 868                innov[i] = ADD32(innov[i],innov2[i]);
 869             stack = tmp_stack;
 870          }
 871          for (i=0;i<st->subframeSize;i++)
 872             exc[i] = EXTRACT16(SATURATE32(PSHR32(ADD32(SHL32(exc32[i],1),innov[i]),SIG_SHIFT),32767));
 873          if (st->innov_rms_save)
 874          {
 875             st->innov_rms_save[sub] = compute_rms(innov, st->subframeSize);
 876          }
 877       }
 878
 879       /* Final signal synthesis from excitation */
 880       iir_mem16(exc, interp_qlpc, sw, st->subframeSize, st->lpcSize, st->mem_sp, stack);
 881
 882       /* Compute weighted signal again, from synthesized speech (not sure it's the right thing) */
 883       if (st->complexity!=0)
 884          filter_mem16(sw, bw_lpc1, bw_lpc2, sw, st->subframeSize, st->lpcSize, st->mem_sw, stack);
 885
 886    }
 887
 888    /* Store the LSPs for interpolation in the next frame */
 889    if (st->submodeID>=1)
 890    {
 891       for (i=0;i<st->lpcSize;i++)
 892          st->old_lsp[i] = lsp[i];
 893       for (i=0;i<st->lpcSize;i++)
 894          st->old_qlsp[i] = qlsp[i];
 895    }
 896
 897 #ifdef VORBIS_PSYCHO
 898    if (st->submodeID>=1)
 899       SPEEX_COPY(st->old_curve, st->curve, 128);
 900 #endif
 901
 902    if (st->submodeID==1)
 903    {
 904 #ifndef DISABLE_VBR
 905       if (st->dtx_count)
 906          speex_bits_pack(bits, 15, 4);
 907       else
 908 #endif
 909          speex_bits_pack(bits, 0, 4);
 910    }
 911
 912    /* The next frame will not be the first (Duh!) */
 913    st->first = 0;
 914    SPEEX_COPY(st->winBuf, in+2*st->frameSize-st->windowSize, st->windowSize-st->frameSize);
 915
 916    if (SUBMODE(innovation_quant) == noise_codebook_quant || st->submodeID==0)
 917       st->bounded_pitch = 1;
 918    else
 919       st->bounded_pitch = 0;
 920
 921    return 1;
 922 }
 923
 924 void *nb_decoder_init(const SpeexMode *m)
 925 {
 926    DecState *st;
 927    const SpeexNBMode *mode;
 928    int i;
 929
 930    mode=(const SpeexNBMode*)m->mode;
 931    st = (DecState *)speex_alloc(sizeof(DecState));
 932    if (!st)
 933       return NULL;
 934 #if defined(VAR_ARRAYS) || defined (USE_ALLOCA)
 935    st->stack = NULL;
 936 #else
 937    st->stack = (char*)speex_alloc_scratch(NB_DEC_STACK);
 938 #endif
 939
 940    st->mode=m;
 941
 942
 943    st->encode_submode = 1;
 944
 945    st->first=1;
 946    /* Codec parameters, should eventually have several "modes"*/
 947    st->frameSize = mode->frameSize;
 948    st->nbSubframes=mode->frameSize/mode->subframeSize;
 949    st->subframeSize=mode->subframeSize;
 950    st->lpcSize = mode->lpcSize;
 951    st->min_pitch=mode->pitchStart;
 952    st->max_pitch=mode->pitchEnd;
 953
 954    st->submodes=mode->submodes;
 955    st->submodeID=mode->defaultSubmode;
 956
 957    st->lpc_enh_enabled=1;
 958
 959    st->excBuf = (spx_word16_t*)speex_alloc((st->frameSize + 2*st->max_pitch + st->subframeSize + 12)*sizeof(spx_word16_t));
 960    st->exc = st->excBuf + 2*st->max_pitch + st->subframeSize + 6;
 961    SPEEX_MEMSET(st->excBuf, 0, st->frameSize + st->max_pitch);
 962
 963    st->interp_qlpc = (spx_coef_t*)speex_alloc(st->lpcSize*sizeof(spx_coef_t));
 964    st->old_qlsp = (spx_lsp_t*)speex_alloc(st->lpcSize*sizeof(spx_lsp_t));
 965    st->mem_sp = (spx_mem_t*)speex_alloc(st->lpcSize*sizeof(spx_mem_t));
 966    st->pi_gain = (spx_word32_t*)speex_alloc((st->nbSubframes)*sizeof(spx_word32_t));
 967    st->last_pitch = 40;
 968    st->count_lost=0;
 969    st->pitch_gain_buf[0] = st->pitch_gain_buf[1] = st->pitch_gain_buf[2] = 0;
 970    st->pitch_gain_buf_idx = 0;
 971    st->seed = 1000;
 972
 973    st->sampling_rate=8000;
 974    st->last_ol_gain = 0;
 975
 976    st->user_callback.func = &speex_default_user_handler;
 977    st->user_callback.data = NULL;
 978    for (i=0;i<16;i++)
 979       st->speex_callbacks[i].func = NULL;
 980
 981    st->voc_m1=st->voc_m2=st->voc_mean=0;
 982    st->voc_offset=0;
 983    st->dtx_enabled=0;
 984    st->isWideband = 0;
 985    st->highpass_enabled = 1;
 986
 987 #ifdef ENABLE_VALGRIND
 988    VALGRIND_MAKE_READABLE(st, NB_DEC_STACK);
 989 #endif
 990    return st;
 991 }
 992
 993 void nb_decoder_destroy(void *state)
 994 {
 995    DecState *st;
 996    st=(DecState*)state;
 997
 998 #if !(defined(VAR_ARRAYS) || defined (USE_ALLOCA))
 999    speex_free_scratch(st->stack);
1000 #endif
1001
1002    speex_free (st->excBuf);
1003    speex_free (st->interp_qlpc);
1004    speex_free (st->old_qlsp);
1005    speex_free (st->mem_sp);
1006    speex_free (st->pi_gain);
1007
1008    speex_free(state);
1009 }
1010
1011 #define median3(a, b, c)        ((a) < (b) ? ((b) < (c) ? (b) : ((a) < (c) ? (c) : (a))) : ((c) < (b) ? (b) : ((c) < (a) ? (c) : (a))))
1012
1013 #ifdef FIXED_POINT
1014 const spx_word16_t attenuation[10] = {32767, 31483, 27923, 22861, 17278, 12055, 7764, 4616, 2533, 1283};
1015 #else
1016 const spx_word16_t attenuation[10] = {1., 0.961, 0.852, 0.698, 0.527, 0.368, 0.237, 0.141, 0.077, 0.039};
1017
1018 #endif
1019
1020 static void nb_decode_lost(DecState *st, spx_word16_t *out, char *stack)
1021 {
1022    int i;
1023    int pitch_val;
1024    spx_word16_t pitch_gain;
1025    spx_word16_t fact;
1026    spx_word16_t gain_med;
1027    spx_word16_t innov_gain;
1028    spx_word16_t noise_gain;
1029
1030    if (st->count_lost<10)
1031       fact = attenuation[st->count_lost];
1032    else
1033       fact = 0;
1034
1035    gain_med = median3(st->pitch_gain_buf[0], st->pitch_gain_buf[1], st->pitch_gain_buf[2]);
1036    if (gain_med < st->last_pitch_gain)
1037       st->last_pitch_gain = gain_med;
1038
1039 #ifdef FIXED_POINT
1040    pitch_gain = st->last_pitch_gain;
1041    if (pitch_gain>54)
1042       pitch_gain = 54;
1043    pitch_gain = SHL16(pitch_gain, 9);
1044 #else
1045    pitch_gain = GAIN_SCALING_1*st->last_pitch_gain;
1046    if (pitch_gain>.85)
1047       pitch_gain=.85;
1048 #endif
1049    pitch_gain = MULT16_16_Q15(fact,pitch_gain) + VERY_SMALL;
1050    /* FIXME: This was rms of innovation (not exc) */
1051    innov_gain = compute_rms16(st->exc, st->frameSize);
1052    noise_gain = MULT16_16_Q15(innov_gain, MULT16_16_Q15(fact, SUB16(Q15ONE,MULT16_16_Q15(pitch_gain,pitch_gain))));
1053    /* Shift all buffers by one frame */
1054    SPEEX_MOVE(st->excBuf, st->excBuf+st->frameSize, 2*st->max_pitch + st->subframeSize + 12);
1055
1056
1057    pitch_val = st->last_pitch + SHR32((spx_int32_t)speex_rand(1+st->count_lost, &st->seed),SIG_SHIFT);
1058    if (pitch_val > st->max_pitch)
1059       pitch_val = st->max_pitch;
1060    if (pitch_val < st->min_pitch)
1061       pitch_val = st->min_pitch;
1062    for (i=0;i<st->frameSize;i++)
1063    {
1064       st->exc[i]= MULT16_16_Q15(pitch_gain, (st->exc[i-pitch_val]+VERY_SMALL)) +
1065             speex_rand(noise_gain, &st->seed);
1066    }
1067
1068    bw_lpc(QCONST16(.98,15), st->interp_qlpc, st->interp_qlpc, st->lpcSize);
1069    iir_mem16(&st->exc[-st->subframeSize], st->interp_qlpc, out, st->frameSize,
1070              st->lpcSize, st->mem_sp, stack);
1071    highpass(out, out, st->frameSize, HIGHPASS_NARROWBAND|HIGHPASS_OUTPUT, st->mem_hp);
1072
1073    st->first = 0;
1074    st->count_lost++;
1075    st->pitch_gain_buf[st->pitch_gain_buf_idx++] = PSHR16(pitch_gain,9);
1076    if (st->pitch_gain_buf_idx > 2) /* rollover */
1077       st->pitch_gain_buf_idx = 0;
1078 }
1079
1080 /* Just so we don't need to carry the complete wideband mode information */
1081 static const int wb_skip_table[8] = {0, 36, 112, 192, 352, 0, 0, 0};
1082
1083 int nb_decode(void *state, SpeexBits *bits, void *vout)
1084 {
1085    DecState *st;
1086    int i, sub;
1087    int pitch;
1088    spx_word16_t pitch_gain[3];
1089    spx_word32_t ol_gain=0;
1090    int ol_pitch=0;
1091    spx_word16_t ol_pitch_coef=0;
1092    int best_pitch=40;
1093    spx_word16_t best_pitch_gain=0;
1094    int wideband;
1095    int m;
1096    char *stack;
1097    VARDECL(spx_sig_t *innov);
1098    VARDECL(spx_word32_t *exc32);
1099    VARDECL(spx_coef_t *ak);
1100    VARDECL(spx_lsp_t *qlsp);
1101    spx_word16_t pitch_average=0;
1102
1103    spx_word16_t *out = (spx_word16_t*)vout;
1104    VARDECL(spx_lsp_t *interp_qlsp);
1105
1106    st=(DecState*)state;
1107    stack=st->stack;
1108
1109    /* Check if we're in DTX mode*/
1110    if (!bits && st->dtx_enabled)
1111    {
1112       st->submodeID=0;
1113    } else
1114    {
1115       /* If bits is NULL, consider the packet to be lost (what could we do anyway) */
1116       if (!bits)
1117       {
1118          nb_decode_lost(st, out, stack);
1119          return 0;
1120       }
1121
1122       if (st->encode_submode)
1123       {
1124
1125       /* Search for next narrowband block (handle requests, skip wideband blocks) */
1126       do {
1127          if (speex_bits_remaining(bits)<5)
1128             return -1;
1129          wideband = speex_bits_unpack_unsigned(bits, 1);
1130          if (wideband) /* Skip wideband block (for compatibility) */
1131          {
1132             int submode;
1133             int advance;
1134             advance = submode = speex_bits_unpack_unsigned(bits, SB_SUBMODE_BITS);
1135             /*speex_mode_query(&speex_wb_mode, SPEEX_SUBMODE_BITS_PER_FRAME, &advance);*/
1136             advance = wb_skip_table[submode];
1137             if (advance < 0)
1138             {
1139                speex_notify("Invalid mode encountered. The stream is corrupted.");
1140                return -2;
1141             }
1142             advance -= (SB_SUBMODE_BITS+1);
1143             speex_bits_advance(bits, advance);
1144
1145             if (speex_bits_remaining(bits)<5)
1146                return -1;
1147             wideband = speex_bits_unpack_unsigned(bits, 1);
1148             if (wideband)
1149             {
1150                advance = submode = speex_bits_unpack_unsigned(bits, SB_SUBMODE_BITS);
1151                /*speex_mode_query(&speex_wb_mode, SPEEX_SUBMODE_BITS_PER_FRAME, &advance);*/
1152                advance = wb_skip_table[submode];
1153                if (advance < 0)
1154                {
1155                   speex_notify("Invalid mode encountered. The stream is corrupted.");
1156                   return -2;
1157                }
1158                advance -= (SB_SUBMODE_BITS+1);
1159                speex_bits_advance(bits, advance);
1160                wideband = speex_bits_unpack_unsigned(bits, 1);
1161                if (wideband)
1162                {
1163                   speex_notify("More than two wideband layers found. The stream is corrupted.");
1164                   return -2;
1165                }
1166
1167             }
1168          }
1169          if (speex_bits_remaining(bits)<4)
1170             return -1;
1171          /* FIXME: Check for overflow */
1172          m = speex_bits_unpack_unsigned(bits, 4);
1173          if (m==15) /* We found a terminator */
1174          {
1175             return -1;
1176          } else if (m==14) /* Speex in-band request */
1177          {
1178             int ret = speex_inband_handler(bits, st->speex_callbacks, state);
1179             if (ret)
1180                return ret;
1181          } else if (m==13) /* User in-band request */
1182          {
1183             int ret = st->user_callback.func(bits, state, st->user_callback.data);
1184             if (ret)
1185                return ret;
1186          } else if (m>8) /* Invalid mode */
1187          {
1188             speex_notify("Invalid mode encountered. The stream is corrupted.");
1189             return -2;
1190          }
1191
1192       } while (m>8);
1193
1194       /* Get the sub-mode that was used */
1195       st->submodeID = m;
1196       }
1197
1198    }
1199
1200    /* Shift all buffers by one frame */
1201    SPEEX_MOVE(st->excBuf, st->excBuf+st->frameSize, 2*st->max_pitch + st->subframeSize + 12);
1202
1203    /* If null mode (no transmission), just set a couple things to zero*/
1204    if (st->submodes[st->submodeID] == NULL)
1205    {
1206       VARDECL(spx_coef_t *lpc);
1207       ALLOC(lpc, st->lpcSize, spx_coef_t);
1208       bw_lpc(QCONST16(0.93f,15), st->interp_qlpc, lpc, st->lpcSize);
1209       {
1210          spx_word16_t innov_gain=0;
1211          /* FIXME: This was innov, not exc */
1212          innov_gain = compute_rms16(st->exc, st->frameSize);
1213          for (i=0;i<st->frameSize;i++)
1214             st->exc[i]=speex_rand(innov_gain, &st->seed);
1215       }
1216
1217
1218       st->first=1;
1219
1220       /* Final signal synthesis from excitation */
1221       iir_mem16(st->exc, lpc, out, st->frameSize, st->lpcSize, st->mem_sp, stack);
1222
1223       st->count_lost=0;
1224       return 0;
1225    }
1226
1227    ALLOC(qlsp, st->lpcSize, spx_lsp_t);
1228
1229    /* Unquantize LSPs */
1230    SUBMODE(lsp_unquant)(qlsp, st->lpcSize, bits);
1231
1232    /*Damp memory if a frame was lost and the LSP changed too much*/
1233    if (st->count_lost)
1234    {
1235       spx_word16_t fact;
1236       spx_word32_t lsp_dist=0;
1237       for (i=0;i<st->lpcSize;i++)
1238          lsp_dist = ADD32(lsp_dist, EXTEND32(ABS(st->old_qlsp[i] - qlsp[i])));
1239 #ifdef FIXED_POINT
1240       fact = SHR16(19661,SHR32(lsp_dist,LSP_SHIFT+2));
1241 #else
1242       fact = .6*exp(-.2*lsp_dist);
1243 #endif
1244       for (i=0;i<st->lpcSize;i++)
1245          st->mem_sp[i] = MULT16_32_Q15(fact,st->mem_sp[i]);
1246    }
1247
1248
1249    /* Handle first frame and lost-packet case */
1250    if (st->first || st->count_lost)
1251    {
1252       for (i=0;i<st->lpcSize;i++)
1253          st->old_qlsp[i] = qlsp[i];
1254    }
1255
1256    /* Get open-loop pitch estimation for low bit-rate pitch coding */
1257    if (SUBMODE(lbr_pitch)!=-1)
1258    {
1259       ol_pitch = st->min_pitch+speex_bits_unpack_unsigned(bits, 7);
1260    }
1261
1262    if (SUBMODE(forced_pitch_gain))
1263    {
1264       int quant;
1265       quant = speex_bits_unpack_unsigned(bits, 4);
1266       ol_pitch_coef=MULT16_16_P15(QCONST16(0.066667,15),SHL16(quant,GAIN_SHIFT));
1267    }
1268
1269    /* Get global excitation gain */
1270    {
1271       int qe;
1272       qe = speex_bits_unpack_unsigned(bits, 5);
1273 #ifdef FIXED_POINT
1274       /* FIXME: Perhaps we could slightly lower the gain here when the output is going to saturate? */
1275       ol_gain = MULT16_32_Q15(28406,ol_gain_table[qe]);
1276 #else
1277       ol_gain = SIG_SCALING*exp(qe/3.5);
1278 #endif
1279    }
1280
1281    ALLOC(ak, st->lpcSize, spx_coef_t);
1282    ALLOC(innov, st->subframeSize, spx_sig_t);
1283    ALLOC(exc32, st->subframeSize, spx_word32_t);
1284
1285    if (st->submodeID==1)
1286    {
1287       int extra;
1288       extra = speex_bits_unpack_unsigned(bits, 4);
1289
1290       if (extra==15)
1291          st->dtx_enabled=1;
1292       else
1293          st->dtx_enabled=0;
1294    }
1295    if (st->submodeID>1)
1296       st->dtx_enabled=0;
1297
1298    /*Loop on subframes */
1299    for (sub=0;sub<st->nbSubframes;sub++)
1300    {
1301       int offset;
1302       spx_word16_t *exc;
1303       spx_word16_t *sp;
1304       spx_word16_t *innov_save = NULL;
1305       spx_word16_t tmp;
1306
1307       /* Offset relative to start of frame */
1308       offset = st->subframeSize*sub;
1309       /* Excitation */
1310       exc=st->exc+offset;
1311       /* Original signal */
1312       sp=out+offset;
1313       if (st->innov_save)
1314          innov_save = st->innov_save+offset;
1315
1316
1317       /* Reset excitation */
1318       SPEEX_MEMSET(exc, 0, st->subframeSize);
1319
1320       /*Adaptive codebook contribution*/
1321       speex_assert (SUBMODE(ltp_unquant));
1322       {
1323          int pit_min, pit_max;
1324          /* Handle pitch constraints if any */
1325          if (SUBMODE(lbr_pitch) != -1)
1326          {
1327             int margin;
1328             margin = SUBMODE(lbr_pitch);
1329             if (margin)
1330             {
1331 /* GT - need optimization?
1332                if (ol_pitch < st->min_pitch+margin-1)
1333                   ol_pitch=st->min_pitch+margin-1;
1334                if (ol_pitch > st->max_pitch-margin)
1335                   ol_pitch=st->max_pitch-margin;
1336                pit_min = ol_pitch-margin+1;
1337                pit_max = ol_pitch+margin;
1338 */
1339                pit_min = ol_pitch-margin+1;
1340                if (pit_min < st->min_pitch)
1341                   pit_min = st->min_pitch;
1342                pit_max = ol_pitch+margin;
1343                if (pit_max > st->max_pitch)
1344                   pit_max = st->max_pitch;
1345             } else {
1346                pit_min = pit_max = ol_pitch;
1347             }
1348          } else {
1349             pit_min = st->min_pitch;
1350             pit_max = st->max_pitch;
1351          }
1352
1353
1354
1355          SUBMODE(ltp_unquant)(exc, exc32, pit_min, pit_max, ol_pitch_coef, SUBMODE(ltp_params),
1356                  st->subframeSize, &pitch, &pitch_gain[0], bits, stack,
1357                  st->count_lost, offset, st->last_pitch_gain, 0);
1358
1359          /* Ensuring that things aren't blowing up as would happen if e.g. an encoder is
1360          crafting packets to make us produce NaNs and slow down the decoder (vague DoS threat).
1361          We can probably be even more aggressive and limit to 15000 or so. */
1362          sanitize_values32(exc32, NEG32(QCONST32(32000,SIG_SHIFT-1)), QCONST32(32000,SIG_SHIFT-1), st->subframeSize);
1363
1364          tmp = gain_3tap_to_1tap(pitch_gain);
1365
1366          pitch_average += tmp;
1367          if ((tmp>best_pitch_gain&&ABS(2*best_pitch-pitch)>=3&&ABS(3*best_pitch-pitch)>=4&&ABS(4*best_pitch-pitch)>=5)
1368               || (tmp>MULT16_16_Q15(QCONST16(.6,15),best_pitch_gain)&&(ABS(best_pitch-2*pitch)<3||ABS(best_pitch-3*pitch)<4||ABS(best_pitch-4*pitch)<5))
1369               || (MULT16_16_Q15(QCONST16(.67,15),tmp)>best_pitch_gain&&(ABS(2*best_pitch-pitch)<3||ABS(3*best_pitch-pitch)<4||ABS(4*best_pitch-pitch)<5)) )
1370          {
1371             best_pitch = pitch;
1372             if (tmp > best_pitch_gain)
1373                best_pitch_gain = tmp;
1374          }
1375       }
1376
1377       /* Unquantize the innovation */
1378       {
1379          int q_energy;
1380          spx_word32_t ener;
1381
1382          SPEEX_MEMSET(innov, 0, st->subframeSize);
1383
1384          /* Decode sub-frame gain correction */
1385          if (SUBMODE(have_subframe_gain)==3)
1386          {
1387             q_energy = speex_bits_unpack_unsigned(bits, 3);
1388             ener = MULT16_32_Q14(exc_gain_quant_scal3[q_energy],ol_gain);
1389          } else if (SUBMODE(have_subframe_gain)==1)
1390          {
1391             q_energy = speex_bits_unpack_unsigned(bits, 1);
1392             ener = MULT16_32_Q14(exc_gain_quant_scal1[q_energy],ol_gain);
1393          } else {
1394             ener = ol_gain;
1395          }
1396
1397          speex_assert (SUBMODE(innovation_unquant));
1398          {
1399             /*Fixed codebook contribution*/
1400             SUBMODE(innovation_unquant)(innov, SUBMODE(innovation_params), st->subframeSize, bits, stack, &st->seed);
1401             /* De-normalize innovation and update excitation */
1402
1403             signal_mul(innov, innov, ener, st->subframeSize);
1404
1405             /* Decode second codebook (only for some modes) */
1406             if (SUBMODE(double_codebook))
1407             {
1408                char *tmp_stack=stack;
1409                VARDECL(spx_sig_t *innov2);
1410                ALLOC(innov2, st->subframeSize, spx_sig_t);
1411                SPEEX_MEMSET(innov2, 0, st->subframeSize);
1412                SUBMODE(innovation_unquant)(innov2, SUBMODE(innovation_params), st->subframeSize, bits, stack, &st->seed);
1413                signal_mul(innov2, innov2, MULT16_32_Q15(QCONST16(0.454545f,15),ener), st->subframeSize);
1414                for (i=0;i<st->subframeSize;i++)
1415                   innov[i] = ADD32(innov[i], innov2[i]);
1416                stack = tmp_stack;
1417             }
1418             for (i=0;i<st->subframeSize;i++)
1419                exc[i]=EXTRACT16(SATURATE32(PSHR32(ADD32(SHL32(exc32[i],1),innov[i]),SIG_SHIFT),32767));
1420             /*print_vec(exc, 40, "innov");*/
1421             if (innov_save)
1422             {
1423                for (i=0;i<st->subframeSize;i++)
1424                   innov_save[i] = EXTRACT16(PSHR32(innov[i], SIG_SHIFT));
1425             }
1426          }
1427
1428          /*Vocoder mode*/
1429          if (st->submodeID==1)
1430          {
1431             spx_word16_t g=ol_pitch_coef;
1432             g=MULT16_16_P14(QCONST16(1.5f,14),(g-QCONST16(.2f,6)));
1433             if (g<0)
1434                g=0;
1435             if (g>GAIN_SCALING)
1436                g=GAIN_SCALING;
1437
1438             SPEEX_MEMSET(exc, 0, st->subframeSize);
1439             while (st->voc_offset<st->subframeSize)
1440             {
1441                /* exc[st->voc_offset]= g*sqrt(2*ol_pitch)*ol_gain;
1442                   Not quite sure why we need the factor of two in the sqrt */
1443                if (st->voc_offset>=0)
1444                   exc[st->voc_offset]=MULT16_16(spx_sqrt(MULT16_16_16(2,ol_pitch)),EXTRACT16(PSHR32(MULT16_16(g,PSHR32(ol_gain,SIG_SHIFT)),6)));
1445                st->voc_offset+=ol_pitch;
1446             }
1447             st->voc_offset -= st->subframeSize;
1448
1449             for (i=0;i<st->subframeSize;i++)
1450             {
1451                spx_word16_t exci=exc[i];
1452                exc[i]= ADD16(ADD16(MULT16_16_Q15(QCONST16(.7f,15),exc[i]) , MULT16_16_Q15(QCONST16(.3f,15),st->voc_m1)),
1453                              SUB16(MULT16_16_Q15(Q15_ONE-MULT16_16_16(QCONST16(.85f,9),g),EXTRACT16(PSHR32(innov[i],SIG_SHIFT))),
1454                                    MULT16_16_Q15(MULT16_16_16(QCONST16(.15f,9),g),EXTRACT16(PSHR32(st->voc_m2,SIG_SHIFT)))
1455                                   ));
1456                st->voc_m1 = exci;
1457                st->voc_m2=innov[i];
1458                st->voc_mean = EXTRACT16(PSHR32(ADD32(MULT16_16(QCONST16(.8f,15),st->voc_mean), MULT16_16(QCONST16(.2f,15),exc[i])), 15));
1459                exc[i]-=st->voc_mean;
1460             }
1461          }
1462
1463       }
1464    }
1465
1466    ALLOC(interp_qlsp, st->lpcSize, spx_lsp_t);
1467
1468    if (st->lpc_enh_enabled && SUBMODE(comb_gain)>0 && !st->count_lost)
1469    {
1470       multicomb(st->exc-st->subframeSize, out, st->interp_qlpc, st->lpcSize, 2*st->subframeSize, best_pitch, 40, SUBMODE(comb_gain), stack);
1471       multicomb(st->exc+st->subframeSize, out+2*st->subframeSize, st->interp_qlpc, st->lpcSize, 2*st->subframeSize, best_pitch, 40, SUBMODE(comb_gain), stack);
1472    } else {
1473       SPEEX_COPY(out, &st->exc[-st->subframeSize], st->frameSize);
1474    }
1475
1476    /* If the last packet was lost, re-scale the excitation to obtain the same energy as encoded in ol_gain */
1477    if (st->count_lost)
1478    {
1479       spx_word16_t exc_ener;
1480       spx_word32_t gain32;
1481       spx_word16_t gain;
1482       exc_ener = compute_rms16 (st->exc, st->frameSize);
1483       gain32 = PDIV32(ol_gain, ADD16(exc_ener,1));
1484 #ifdef FIXED_POINT
1485       if (gain32 > 32767)
1486          gain32 = 32767;
1487       gain = EXTRACT16(gain32);
1488 #else
1489       if (gain32 > 2)
1490          gain32=2;
1491       gain = gain32;
1492 #endif
1493       for (i=0;i<st->frameSize;i++)
1494       {
1495          st->exc[i] = MULT16_16_Q14(gain, st->exc[i]);
1496          out[i]=st->exc[i-st->subframeSize];
1497       }
1498    }
1499
1500    /*Loop on subframes */
1501    for (sub=0;sub<st->nbSubframes;sub++)
1502    {
1503       int offset;
1504       spx_word16_t *sp;
1505       spx_word16_t *exc;
1506       /* Offset relative to start of frame */
1507       offset = st->subframeSize*sub;
1508       /* Original signal */
1509       sp=out+offset;
1510       /* Excitation */
1511       exc=st->exc+offset;
1512
1513       /* LSP interpolation (quantized and unquantized) */
1514       lsp_interpolate(st->old_qlsp, qlsp, interp_qlsp, st->lpcSize, sub, st->nbSubframes);
1515
1516       /* Make sure the LSP's are stable */
1517       lsp_enforce_margin(interp_qlsp, st->lpcSize, LSP_MARGIN);
1518
1519       /* Compute interpolated LPCs (unquantized) */
1520       lsp_to_lpc(interp_qlsp, ak, st->lpcSize, stack);
1521
1522       /* Compute analysis filter at w=pi */
1523       {
1524          spx_word32_t pi_g=LPC_SCALING;
1525          for (i=0;i<st->lpcSize;i+=2)
1526          {
1527             /*pi_g += -st->interp_qlpc[i] +  st->interp_qlpc[i+1];*/
1528             pi_g = ADD32(pi_g, SUB32(EXTEND32(ak[i+1]),EXTEND32(ak[i])));
1529          }
1530          st->pi_gain[sub] = pi_g;
1531       }
1532
1533       iir_mem16(sp, st->interp_qlpc, sp, st->subframeSize, st->lpcSize,
1534                 st->mem_sp, stack);
1535
1536       for (i=0;i<st->lpcSize;i++)
1537          st->interp_qlpc[i] = ak[i];
1538
1539    }
1540
1541    if (st->highpass_enabled)
1542       highpass(out, out, st->frameSize, (st->isWideband?HIGHPASS_WIDEBAND:HIGHPASS_NARROWBAND)|HIGHPASS_OUTPUT, st->mem_hp);
1543    /*for (i=0;i<st->frameSize;i++)
1544      printf ("%d\n", (int)st->frame[i]);*/
1545
1546    /* Tracking output level */
1547    st->level = 1+PSHR32(ol_gain,SIG_SHIFT);
1548    st->max_level = MAX16(MULT16_16_Q15(QCONST16(.99f,15), st->max_level), st->level);
1549    st->min_level = MIN16(ADD16(1,MULT16_16_Q14(QCONST16(1.01f,14), st->min_level)), st->level);
1550    if (st->max_level < st->min_level+1)
1551       st->max_level = st->min_level+1;
1552    /*printf ("%f %f %f %d\n", og, st->min_level, st->max_level, update);*/
1553
1554    /* Store the LSPs for interpolation in the next frame */
1555    for (i=0;i<st->lpcSize;i++)
1556       st->old_qlsp[i] = qlsp[i];
1557
1558    /* The next frame will not be the first (Duh!) */
1559    st->first = 0;
1560    st->count_lost=0;
1561    st->last_pitch = best_pitch;
1562 #ifdef FIXED_POINT
1563    st->last_pitch_gain = PSHR16(pitch_average,2);
1564 #else
1565    st->last_pitch_gain = .25*pitch_average;
1566 #endif
1567    st->pitch_gain_buf[st->pitch_gain_buf_idx++] = st->last_pitch_gain;
1568    if (st->pitch_gain_buf_idx > 2) /* rollover */
1569       st->pitch_gain_buf_idx = 0;
1570
1571    st->last_ol_gain = ol_gain;
1572
1573    return 0;
1574 }
1575
1576 int nb_encoder_ctl(void *state, int request, void *ptr)
1577 {
1578    EncState *st;
1579    st=(EncState*)state;
1580    switch(request)
1581    {
1582    case SPEEX_GET_FRAME_SIZE:
1583       (*(spx_int32_t*)ptr) = st->frameSize;
1584       break;
1585    case SPEEX_SET_LOW_MODE:
1586    case SPEEX_SET_MODE:
1587       st->submodeSelect = st->submodeID = (*(spx_int32_t*)ptr);
1588       break;
1589    case SPEEX_GET_LOW_MODE:
1590    case SPEEX_GET_MODE:
1591       (*(spx_int32_t*)ptr) = st->submodeID;
1592       break;
1593 #ifndef DISABLE_VBR
1594       case SPEEX_SET_VBR:
1595       st->vbr_enabled = (*(spx_int32_t*)ptr);
1596       break;
1597    case SPEEX_GET_VBR:
1598       (*(spx_int32_t*)ptr) = st->vbr_enabled;
1599       break;
1600    case SPEEX_SET_VAD:
1601       st->vad_enabled = (*(spx_int32_t*)ptr);
1602       break;
1603    case SPEEX_GET_VAD:
1604       (*(spx_int32_t*)ptr) = st->vad_enabled;
1605       break;
1606    case SPEEX_SET_DTX:
1607       st->dtx_enabled = (*(spx_int32_t*)ptr);
1608       break;
1609    case SPEEX_GET_DTX:
1610       (*(spx_int32_t*)ptr) = st->dtx_enabled;
1611       break;
1612    case SPEEX_SET_ABR:
1613       st->abr_enabled = (*(spx_int32_t*)ptr);
1614       st->vbr_enabled = st->abr_enabled!=0;
1615       if (st->vbr_enabled)
1616       {
1617          spx_int32_t i=10;
1618          spx_int32_t rate, target;
1619          float vbr_qual;
1620          target = (*(spx_int32_t*)ptr);
1621          while (i>=0)
1622          {
1623             speex_encoder_ctl(st, SPEEX_SET_QUALITY, &i);
1624             speex_encoder_ctl(st, SPEEX_GET_BITRATE, &rate);
1625             if (rate <= target)
1626                break;
1627             i--;
1628          }
1629          vbr_qual=i;
1630          if (vbr_qual<0)
1631             vbr_qual=0;
1632          speex_encoder_ctl(st, SPEEX_SET_VBR_QUALITY, &vbr_qual);
1633          st->abr_count=0;
1634          st->abr_drift=0;
1635          st->abr_drift2=0;
1636       }
1637
1638       break;
1639    case SPEEX_GET_ABR:
1640       (*(spx_int32_t*)ptr) = st->abr_enabled;
1641       break;
1642 #endif /* #ifndef DISABLE_VBR */
1643 #if !defined(DISABLE_VBR) && !defined(DISABLE_FLOAT_API)
1644    case SPEEX_SET_VBR_QUALITY:
1645       st->vbr_quality = (*(float*)ptr);
1646       break;
1647    case SPEEX_GET_VBR_QUALITY:
1648       (*(float*)ptr) = st->vbr_quality;
1649       break;
1650 #endif /* !defined(DISABLE_VBR) && !defined(DISABLE_FLOAT_API) */
1651    case SPEEX_SET_QUALITY:
1652       {
1653          int quality = (*(spx_int32_t*)ptr);
1654          if (quality < 0)
1655             quality = 0;
1656          if (quality > 10)
1657             quality = 10;
1658          st->submodeSelect = st->submodeID = ((const SpeexNBMode*)(st->mode->mode))->quality_map[quality];
1659       }
1660       break;
1661    case SPEEX_SET_COMPLEXITY:
1662       st->complexity = (*(spx_int32_t*)ptr);
1663       if (st->complexity<0)
1664          st->complexity=0;
1665       break;
1666    case SPEEX_GET_COMPLEXITY:
1667       (*(spx_int32_t*)ptr) = st->complexity;
1668       break;
1669    case SPEEX_SET_BITRATE:
1670       {
1671          spx_int32_t i=10;
1672          spx_int32_t rate, target;
1673          target = (*(spx_int32_t*)ptr);
1674          while (i>=0)
1675          {
1676             speex_encoder_ctl(st, SPEEX_SET_QUALITY, &i);
1677             speex_encoder_ctl(st, SPEEX_GET_BITRATE, &rate);
1678             if (rate <= target)
1679                break;
1680             i--;
1681          }
1682       }
1683       break;
1684    case SPEEX_GET_BITRATE:
1685       if (st->submodes[st->submodeID])
1686          (*(spx_int32_t*)ptr) = st->sampling_rate*SUBMODE(bits_per_frame)/st->frameSize;
1687       else
1688          (*(spx_int32_t*)ptr) = st->sampling_rate*(NB_SUBMODE_BITS+1)/st->frameSize;
1689       break;
1690    case SPEEX_SET_SAMPLING_RATE:
1691       st->sampling_rate = (*(spx_int32_t*)ptr);
1692       break;
1693    case SPEEX_GET_SAMPLING_RATE:
1694       (*(spx_int32_t*)ptr)=st->sampling_rate;
1695       break;
1696    case SPEEX_RESET_STATE:
1697       {
1698          int i;
1699          st->bounded_pitch = 1;
1700          st->first = 1;
1701          for (i=0;i<st->lpcSize;i++)
1702             st->old_lsp[i]= DIV32(MULT16_16(QCONST16(3.1415927f, LSP_SHIFT), i+1), st->lpcSize+1);
1703          for (i=0;i<st->lpcSize;i++)
1704             st->mem_sw[i]=st->mem_sw_whole[i]=st->mem_sp[i]=st->mem_exc[i]=0;
1705          for (i=0;i<st->frameSize+st->max_pitch+1;i++)
1706             st->excBuf[i]=st->swBuf[i]=0;
1707          for (i=0;i<st->windowSize-st->frameSize;i++)
1708             st->winBuf[i]=0;
1709       }
1710       break;
1711    case SPEEX_SET_SUBMODE_ENCODING:
1712       st->encode_submode = (*(spx_int32_t*)ptr);
1713       break;
1714    case SPEEX_GET_SUBMODE_ENCODING:
1715       (*(spx_int32_t*)ptr) = st->encode_submode;
1716       break;
1717    case SPEEX_GET_LOOKAHEAD:
1718       (*(spx_int32_t*)ptr)=(st->windowSize-st->frameSize);
1719       break;
1720    case SPEEX_SET_PLC_TUNING:
1721       st->plc_tuning = (*(spx_int32_t*)ptr);
1722       if (st->plc_tuning>100)
1723          st->plc_tuning=100;
1724       break;
1725    case SPEEX_GET_PLC_TUNING:
1726       (*(spx_int32_t*)ptr)=(st->plc_tuning);
1727       break;
1728 #ifndef DISABLE_VBR
1729    case SPEEX_SET_VBR_MAX_BITRATE:
1730       st->vbr_max = (*(spx_int32_t*)ptr);
1731       break;
1732    case SPEEX_GET_VBR_MAX_BITRATE:
1733       (*(spx_int32_t*)ptr) = st->vbr_max;
1734       break;
1735 #endif /* #ifndef DISABLE_VBR */
1736    case SPEEX_SET_HIGHPASS:
1737       st->highpass_enabled = (*(spx_int32_t*)ptr);
1738       break;
1739    case SPEEX_GET_HIGHPASS:
1740       (*(spx_int32_t*)ptr) = st->highpass_enabled;
1741       break;
1742
1743    /* This is all internal stuff past this point */
1744    case SPEEX_GET_PI_GAIN:
1745       {
1746          int i;
1747          spx_word32_t *g = (spx_word32_t*)ptr;
1748          for (i=0;i<st->nbSubframes;i++)
1749             g[i]=st->pi_gain[i];
1750       }
1751       break;
1752    case SPEEX_GET_EXC:
1753       {
1754          int i;
1755          for (i=0;i<st->nbSubframes;i++)
1756             ((spx_word16_t*)ptr)[i] = compute_rms16(st->exc+i*st->subframeSize, st->subframeSize);
1757       }
1758       break;
1759 #ifndef DISABLE_VBR
1760    case SPEEX_GET_RELATIVE_QUALITY:
1761       (*(float*)ptr)=st->relative_quality;
1762       break;
1763 #endif /* #ifndef DISABLE_VBR */
1764    case SPEEX_SET_INNOVATION_SAVE:
1765       st->innov_rms_save = (spx_word16_t*)ptr;
1766       break;
1767    case SPEEX_SET_WIDEBAND:
1768       st->isWideband = *((spx_int32_t*)ptr);
1769       break;
1770    case SPEEX_GET_STACK:
1771       *((char**)ptr) = st->stack;
1772       break;
1773    default:
1774       speex_warning_int("Unknown nb_ctl request: ", request);
1775       return -1;
1776    }
1777    return 0;
1778 }
1779
1780 int nb_decoder_ctl(void *state, int request, void *ptr)
1781 {
1782    DecState *st;
1783    st=(DecState*)state;
1784    switch(request)
1785    {
1786    case SPEEX_SET_LOW_MODE:
1787    case SPEEX_SET_MODE:
1788       st->submodeID = (*(spx_int32_t*)ptr);
1789       break;
1790    case SPEEX_GET_LOW_MODE:
1791    case SPEEX_GET_MODE:
1792       (*(spx_int32_t*)ptr) = st->submodeID;
1793       break;
1794    case SPEEX_SET_ENH:
1795       st->lpc_enh_enabled = *((spx_int32_t*)ptr);
1796       break;
1797    case SPEEX_GET_ENH:
1798       *((spx_int32_t*)ptr) = st->lpc_enh_enabled;
1799       break;
1800    case SPEEX_GET_FRAME_SIZE:
1801       (*(spx_int32_t*)ptr) = st->frameSize;
1802       break;
1803    case SPEEX_GET_BITRATE:
1804       if (st->submodes[st->submodeID])
1805          (*(spx_int32_t*)ptr) = st->sampling_rate*SUBMODE(bits_per_frame)/st->frameSize;
1806       else
1807          (*(spx_int32_t*)ptr) = st->sampling_rate*(NB_SUBMODE_BITS+1)/st->frameSize;
1808       break;
1809    case SPEEX_SET_SAMPLING_RATE:
1810       st->sampling_rate = (*(spx_int32_t*)ptr);
1811       break;
1812    case SPEEX_GET_SAMPLING_RATE:
1813       (*(spx_int32_t*)ptr)=st->sampling_rate;
1814       break;
1815    case SPEEX_SET_HANDLER:
1816       {
1817          SpeexCallback *c = (SpeexCallback*)ptr;
1818          st->speex_callbacks[c->callback_id].func=c->func;
1819          st->speex_callbacks[c->callback_id].data=c->data;
1820          st->speex_callbacks[c->callback_id].callback_id=c->callback_id;
1821       }
1822       break;
1823    case SPEEX_SET_USER_HANDLER:
1824       {
1825          SpeexCallback *c = (SpeexCallback*)ptr;
1826          st->user_callback.func=c->func;
1827          st->user_callback.data=c->data;
1828          st->user_callback.callback_id=c->callback_id;
1829       }
1830       break;
1831    case SPEEX_RESET_STATE:
1832       {
1833          int i;
1834          for (i=0;i<st->lpcSize;i++)
1835             st->mem_sp[i]=0;
1836          for (i=0;i<st->frameSize + st->max_pitch + 1;i++)
1837             st->excBuf[i]=0;
1838       }
1839       break;
1840    case SPEEX_SET_SUBMODE_ENCODING:
1841       st->encode_submode = (*(spx_int32_t*)ptr);
1842       break;
1843    case SPEEX_GET_SUBMODE_ENCODING:
1844       (*(spx_int32_t*)ptr) = st->encode_submode;
1845       break;
1846    case SPEEX_GET_LOOKAHEAD:
1847       (*(spx_int32_t*)ptr)=st->subframeSize;
1848       break;
1849    case SPEEX_SET_HIGHPASS:
1850       st->highpass_enabled = (*(spx_int32_t*)ptr);
1851       break;
1852    case SPEEX_GET_HIGHPASS:
1853       (*(spx_int32_t*)ptr) = st->highpass_enabled;
1854       break;
1855       /* FIXME: Convert to fixed-point and re-enable even when float API is disabled */
1856 #ifndef DISABLE_FLOAT_API
1857    case SPEEX_GET_ACTIVITY:
1858    {
1859       float ret;
1860       ret = log(st->level/st->min_level)/log(st->max_level/st->min_level);
1861       if (ret>1)
1862          ret = 1;
1863       /* Done in a strange way to catch NaNs as well */
1864       if (!(ret > 0))
1865          ret = 0;
1866       /*printf ("%f %f %f %f\n", st->level, st->min_level, st->max_level, ret);*/
1867       (*(spx_int32_t*)ptr) = (int)(100*ret);
1868    }
1869    break;
1870 #endif
1871    case SPEEX_GET_PI_GAIN:
1872       {
1873          int i;
1874          spx_word32_t *g = (spx_word32_t*)ptr;
1875          for (i=0;i<st->nbSubframes;i++)
1876             g[i]=st->pi_gain[i];
1877       }
1878       break;
1879    case SPEEX_GET_EXC:
1880       {
1881          int i;
1882          for (i=0;i<st->nbSubframes;i++)
1883             ((spx_word16_t*)ptr)[i] = compute_rms16(st->exc+i*st->subframeSize, st->subframeSize);
1884       }
1885       break;
1886    case SPEEX_GET_DTX_STATUS:
1887       *((spx_int32_t*)ptr) = st->dtx_enabled;
1888       break;
1889    case SPEEX_SET_INNOVATION_SAVE:
1890       st->innov_save = (spx_word16_t*)ptr;
1891       break;
1892    case SPEEX_SET_WIDEBAND:
1893       st->isWideband = *((spx_int32_t*)ptr);
1894       break;
1895    case SPEEX_GET_STACK:
1896       *((char**)ptr) = st->stack;
1897       break;
1898    default:
1899       speex_warning_int("Unknown nb_ctl request: ", request);
1900       return -1;
1901    }
1902    return 0;
1903 }