nb_celp.cpp

来自「KphoneSI (kpsi) is a SIP (Session Initia」· C++ 代码 · 共 1,719 行 · 第 1/4 页
CPP
1,719 行
   /* First, transmit a zero for narrowband */   speex_bits_pack(bits, 0, 1);   /* Transmit the sub-mode we use for this frame */   speex_bits_pack(bits, st->submodeID, NB_SUBMODE_BITS);   /* If null mode (no transmission), just set a couple things to zero*/   if (st->submodes[st->submodeID] == NULL)   {      for (i=0;i<st->frameSize;i++)         st->exc[i]=st->exc2[i]=st->sw[i]=VERY_SMALL;      for (i=0;i<st->lpcSize;i++)         st->mem_sw[i]=0;      st->first=1;      st->bounded_pitch = 1;      /* Final signal synthesis from excitation */      iir_mem2(st->exc, st->interp_qlpc, st->frame, st->frameSize, st->lpcSize, st->mem_sp);      in[0] = st->frame[0] + st->preemph*st->pre_mem2;      for (i=1;i<st->frameSize;i++)         in[i]=st->frame[i] + st->preemph*in[i-1];      st->pre_mem2=in[st->frameSize-1];      return 0;   }   /* LSP Quantization */   if (st->first)   {      for (i=0;i<st->lpcSize;i++)         st->old_lsp[i] = st->lsp[i];   }   /*Quantize LSPs*/#if 1 /*0 for unquantized*/   SUBMODE(lsp_quant)(st->lsp, st->qlsp, st->lpcSize, bits);#else   for (i=0;i<st->lpcSize;i++)     st->qlsp[i]=st->lsp[i];#endif   /*If we use low bit-rate pitch mode, transmit open-loop pitch*/   if (SUBMODE(lbr_pitch)!=-1)   {      speex_bits_pack(bits, ol_pitch-st->min_pitch, 7);   }       if (SUBMODE(forced_pitch_gain))   {      int quant;      quant = (int)floor(.5+15*ol_pitch_coef);      if (quant>15)         quant=15;      if (quant<0)         quant=0;      speex_bits_pack(bits, quant, 4);      ol_pitch_coef=0.066667*quant;   }         /*Quantize and transmit open-loop excitation gain*/   {      int qe = (int)(floor(.5+3.5*log(ol_gain)));      if (qe<0)         qe=0;      if (qe>31)         qe=31;      ol_gain = exp(qe/3.5);      speex_bits_pack(bits, qe, 5);   }   /* Special case for first frame */   if (st->first)   {      for (i=0;i<st->lpcSize;i++)         st->old_qlsp[i] = st->qlsp[i];   }   /* Filter response */   res = PUSH(stack, st->subframeSize, float);   /* Target signal */   target = PUSH(stack, st->subframeSize, float);   syn_resp = PUSH(stack, st->subframeSize, float);   mem = PUSH(stack, st->lpcSize, float);   orig = PUSH(stack, st->frameSize, float);   for (i=0;i<st->frameSize;i++)      orig[i]=st->frame[i];   /* Loop on sub-frames */   for (sub=0;sub<st->nbSubframes;sub++)   {      float tmp;      int   offset;      float *sp, *sw, *exc, *exc2;      int pitch;      /* Offset relative to start of frame */      offset = st->subframeSize*sub;      /* Original signal */      sp=st->frame+offset;      /* Excitation */      exc=st->exc+offset;      /* Weighted signal */      sw=st->sw+offset;      exc2=st->exc2+offset;      /* LSP interpolation (quantized and unquantized) */      tmp = (1.0 + sub)/st->nbSubframes;      for (i=0;i<st->lpcSize;i++)         st->interp_lsp[i] = (1-tmp)*st->old_lsp[i] + tmp*st->lsp[i];      for (i=0;i<st->lpcSize;i++)         st->interp_qlsp[i] = (1-tmp)*st->old_qlsp[i] + tmp*st->qlsp[i];      /* Make sure the filters are stable */      lsp_enforce_margin(st->interp_lsp, st->lpcSize, .002);      lsp_enforce_margin(st->interp_qlsp, st->lpcSize, .002);      /* Compute interpolated LPCs (quantized and unquantized) */      for (i=0;i<st->lpcSize;i++)         st->interp_lsp[i] = cos(st->interp_lsp[i]);      lsp_to_lpc(st->interp_lsp, st->interp_lpc, st->lpcSize,stack);      for (i=0;i<st->lpcSize;i++)         st->interp_qlsp[i] = cos(st->interp_qlsp[i]);      lsp_to_lpc(st->interp_qlsp, st->interp_qlpc, st->lpcSize, stack);      /* Compute analysis filter gain at w=pi (for use in SB-CELP) */      tmp=1;      st->pi_gain[sub]=0;      for (i=0;i<=st->lpcSize;i++)      {         st->pi_gain[sub] += tmp*st->interp_qlpc[i];         tmp = -tmp;      }      /* Compute bandwidth-expanded (unquantized) LPCs for perceptual weighting */      bw_lpc(st->gamma1, st->interp_lpc, st->bw_lpc1, st->lpcSize);      if (st->gamma2>=0)         bw_lpc(st->gamma2, st->interp_lpc, st->bw_lpc2, st->lpcSize);      else      {         st->bw_lpc2[0]=1;         st->bw_lpc2[1]=-st->preemph;         for (i=2;i<=st->lpcSize;i++)            st->bw_lpc2[i]=0;      }      /* Compute impulse response of A(z/g1) / ( A(z)*A(z/g2) )*/      for (i=0;i<st->subframeSize;i++)         exc[i]=VERY_SMALL;      exc[0]=1;      syn_percep_zero(exc, st->interp_qlpc, st->bw_lpc1, st->bw_lpc2, syn_resp, st->subframeSize, st->lpcSize, stack);      /* Reset excitation */      for (i=0;i<st->subframeSize;i++)         exc[i]=VERY_SMALL;      for (i=0;i<st->subframeSize;i++)         exc2[i]=VERY_SMALL;      /* Compute zero response of A(z/g1) / ( A(z/g2) * A(z) ) */      for (i=0;i<st->lpcSize;i++)         mem[i]=st->mem_sp[i];      iir_mem2(exc, st->interp_qlpc, exc, st->subframeSize, st->lpcSize, mem);            for (i=0;i<st->lpcSize;i++)         mem[i]=st->mem_sw[i];      filter_mem2(exc, st->bw_lpc1, st->bw_lpc2, res, st->subframeSize, st->lpcSize, mem);            /* Compute weighted signal */      for (i=0;i<st->lpcSize;i++)         mem[i]=st->mem_sw[i];      filter_mem2(sp, st->bw_lpc1, st->bw_lpc2, sw, st->subframeSize, st->lpcSize, mem);            /* Compute target signal */      for (i=0;i<st->subframeSize;i++)         target[i]=sw[i]-res[i];      for (i=0;i<st->subframeSize;i++)         exc[i]=exc2[i]=0;      /* If we have a long-term predictor (otherwise, something's wrong) */      if (SUBMODE(ltp_quant))      {         int pit_min, pit_max;         /* Long-term prediction */         if (SUBMODE(lbr_pitch) != -1)         {            /* Low bit-rate pitch handling */            int margin;            margin = SUBMODE(lbr_pitch);            if (margin)            {               if (ol_pitch < st->min_pitch+margin-1)                  ol_pitch=st->min_pitch+margin-1;               if (ol_pitch > st->max_pitch-margin)                  ol_pitch=st->max_pitch-margin;               pit_min = ol_pitch-margin+1;               pit_max = ol_pitch+margin;            } else {               pit_min=pit_max=ol_pitch;            }         } else {            pit_min = st->min_pitch;            pit_max = st->max_pitch;         }                  /* Force pitch to use only the current frame if needed */         if (st->bounded_pitch && pit_max>offset)            pit_max=offset;         /* Perform pitch search */         pitch = SUBMODE(ltp_quant)(target, sw, st->interp_qlpc, st->bw_lpc1, st->bw_lpc2,                                    exc, SUBMODE(ltp_params), pit_min, pit_max, ol_pitch_coef,                                    st->lpcSize, st->subframeSize, bits, stack,                                     exc2, syn_resp, st->complexity);         st->pitch[sub]=pitch;      } else {         speex_error ("No pitch prediction, what's wrong");      }      /* Update target for adaptive codebook contribution */      syn_percep_zero(exc, st->interp_qlpc, st->bw_lpc1, st->bw_lpc2, res, st->subframeSize, st->lpcSize, stack);      for (i=0;i<st->subframeSize;i++)         target[i]-=res[i];      /* Quantization of innovation */      {         float *innov;         float ener=0, ener_1;         innov = st->innov+sub*st->subframeSize;         for (i=0;i<st->subframeSize;i++)            innov[i]=0;                  residue_percep_zero(target, st->interp_qlpc, st->bw_lpc1, st->bw_lpc2, st->buf2, st->subframeSize, st->lpcSize, stack);         for (i=0;i<st->subframeSize;i++)            ener+=st->buf2[i]*st->buf2[i];         ener=sqrt(.1+ener/st->subframeSize);         /*for (i=0;i<st->subframeSize;i++)            printf ("%f\n", st->buf2[i]/ener);         */                  ener /= ol_gain;         /* Calculate gain correction for the sub-frame (if any) */         if (SUBMODE(have_subframe_gain))          {            int qe;            ener=log(ener);            if (SUBMODE(have_subframe_gain)==3)            {               qe = vq_index(&ener, exc_gain_quant_scal3, 1, 8);               speex_bits_pack(bits, qe, 3);               ener=exc_gain_quant_scal3[qe];            } else {               qe = vq_index(&ener, exc_gain_quant_scal1, 1, 2);               speex_bits_pack(bits, qe, 1);               ener=exc_gain_quant_scal1[qe];                           }            ener=exp(ener);         } else {            ener=1;         }         ener*=ol_gain;         /*printf ("%f %f\n", ener, ol_gain);*/         ener_1 = 1/ener;         /* Normalize innovation */         for (i=0;i<st->subframeSize;i++)            target[i]*=ener_1;                  /* Quantize innovation */         if (SUBMODE(innovation_quant))         {            /* Codebook search */            SUBMODE(innovation_quant)(target, st->interp_qlpc, st->bw_lpc1, st->bw_lpc2,                                       SUBMODE(innovation_params), st->lpcSize, st->subframeSize,                                       innov, syn_resp, bits, stack, st->complexity);                        /* De-normalize innovation and update excitation */            for (i=0;i<st->subframeSize;i++)               innov[i]*=ener;            for (i=0;i<st->subframeSize;i++)               exc[i] += innov[i];         } else {            speex_error("No fixed codebook");         }         /* In some (rare) modes, we do a second search (more bits) to reduce noise even more */         if (SUBMODE(double_codebook)) {            char *tmp_stack=stack;            float *innov2 = PUSH(tmp_stack, st->subframeSize, float);            for (i=0;i<st->subframeSize;i++)               innov2[i]=0;            for (i=0;i<st->subframeSize;i++)               target[i]*=2.2;            SUBMODE(innovation_quant)(target, st->interp_qlpc, st->bw_lpc1, st->bw_lpc2,                                       SUBMODE(innovation_params), st->lpcSize, st->subframeSize,                                       innov2, syn_resp, bits, tmp_stack, st->complexity);            for (i=0;i<st->subframeSize;i++)               innov2[i]*=ener*(1/2.2);            for (i=0;i<st->subframeSize;i++)               exc[i] += innov2[i];         }         for (i=0;i<st->subframeSize;i++)            target[i]*=ener;      }      /*Keep the previous memory*/      for (i=0;i<st->lpcSize;i++)         mem[i]=st->mem_sp[i];      /* Final signal synthesis from excitation */      iir_mem2(exc, st->interp_qlpc, sp, st->subframeSize, st->lpcSize, st->mem_sp);      /* Compute weighted signal again, from synthesized speech (not sure it's the right thing) */      filter_mem2(sp, st->bw_lpc1, st->bw_lpc2, sw, st->subframeSize, st->lpcSize, st->mem_sw);      for (i=0;i<st->subframeSize;i++)         exc2[i]=exc[i];   }   /* Store the LSPs for interpolation in the next frame */   if (st->submodeID>=1)   {      for (i=0;i<st->lpcSize;i++)         st->old_lsp[i] = st->lsp[i];      for (i=0;i<st->lpcSize;i++)         st->old_qlsp[i] = st->qlsp[i];   }   if (st->submodeID==1)   {      if (st->dtx_count)         speex_bits_pack(bits, 15, 4);      else         speex_bits_pack(bits, 0, 4);   }   /* The next frame will not be the first (Duh!) */   st->first = 0;   {      float ener=0, err=0;      float snr;      for (i=0;i<st->frameSize;i++)      {         ener+=st->frame[i]*st->frame[i];         err += (st->frame[i]-orig[i])*(st->frame[i]-orig[i]);      }      snr = 10*log10((ener+1)/(err+1));      /*printf ("%f %f %f\n", snr, ener, err);*/   }   /* Replace input by synthesized speech */   in[0] = st->frame[0] + st->preemph*st->pre_mem2;   for (i=1;i<st->frameSize;i++)     in[i]=st->frame[i] + st->preemph*in[i-1];   st->pre_mem2=in[st->frameSize-1];   if (SUBMODE(innovation_quant) == noise_codebook_quant || st->submodeID==0)      st->bounded_pitch = 1;   else      st->bounded_pitch = 0;   return 1;}void *nb_decoder_init(SpeexMode *m){   DecState *st;   SpeexNBMode *mode;   int i;   mode=(SpeexNBMode*)m->mode;   st = (DecState *)speex_alloc(sizeof(DecState)+4000*sizeof(float));   st->mode=m;   st->stack = ((char*)st) + sizeof(DecState);   st->first=1;   /* Codec parameters, should eventually have several "modes"*/   st->frameSize = mode->frameSize;   st->windowSize = st->frameSize*3/2;   st->nbSubframes=mode->frameSize/mode->subframeSize;   st->subframeSize=mode->subframeSize;   st->lpcSize = mode->lpcSize;   st->bufSize = mode->bufSize;   st->gamma1=mode->gamma1;   st->gamma2=mode->gamma2;   st->min_pitch=mode->pitchStart;   st->max_pitch=mode->pitchEnd;   st->preemph = mode->preemph;   st->submodes=mode->submodes;   st->submodeID=mode->defaultSubmode;   st->pre_mem=0;   st->lpc_enh_enabled=0;   st->inBuf = PUSH(st->stack, st->bufSize, float);   st->frame = st->inBuf + st->bufSize - st->windowSize;   st->excBuf = PUSH(st->stack, st->bufSize, float);   st->exc = st->excBuf + st->bufSize - st->windowSize;   for (i=0;i<st->bufSize;i++)      st->inBuf[i]=0;   for (i=0;i<st->bufSize;i++)      st->excBuf[i]=0;   st->innov = PUSH(st->stack, st->frameSize, float);   st->interp_qlpc = PUSH(st->stack, st->lpcSize+1, float);   st->qlsp = PUSH(st->stack, st->lpcSize, float);   st->old_qlsp = PUSH(st->stack, st->lpcSize, float);   st->interp_qlsp = PUSH(st->stack, st->lpcSize, float);   st->mem_sp = PUSH(st->stack, 5*st->lpcSize, float);   st->comb_mem = PUSHS(st->stack, CombFilterMem);
nb_celp.cpp - 源码说明

本页面展示了「KphoneSI (kpsi) is a SIP (Session Initiation Protocol) user agent for Linux, with which you can in」中的 nb_celp.cpp 源码文件，采用 C++ 编程语言编写，共 1,719 行代码。您可以在线阅读完整代码内容，也可以返回资源详情页下载完整源码包进行本地学习和开发。
虫虫下载站收录了大量与Initiation相关的技术资源，包括源代码、技术文档、电路图等，是电子工程师和嵌入式开发者的专业学习平台。
⌨️ 快捷键说明

复制代码Ctrl + C
搜索代码Ctrl + F
全屏模式F11
增大字号Ctrl + =
减小字号Ctrl + -
显示快捷键?