📄 pitch.c

📁 具有浮点指令的g.729语音压缩编码
💻 C
字号:
/* ITU-T G.729 Software Package Release 2 (November 2006) */
/*
   ITU-T G.729 Annex C - Reference C code for floating point
                         implementation of G.729
                         Version 1.01 of 15.September.98
*/

/*
----------------------------------------------------------------------
                    COPYRIGHT NOTICE
----------------------------------------------------------------------
   ITU-T G.729 Annex C ANSI C source code
   Copyright (C) 1998, AT&T, France Telecom, NTT, University of
   Sherbrooke.  All rights reserved.

----------------------------------------------------------------------
*/

/*
 File : PITCH.C
 Used for the floating point version of G.729 main body
 (not for G.729A)
*/

/*****************************************************************************/
/*           Long Term Prediction Routines                                   */
/*****************************************************************************/
#include <math.h>
#include "typedef.h"
#include "ld8k.h"
#include "tab_ld8k.h"

/* prototypes for local functions */
static void  norm_corr(FLOAT exc[], FLOAT xn[], FLOAT h[], int l_subfr,
    int t_min, int t_max, FLOAT corr_norm[]);
static FLOAT interpol_3(FLOAT cor[], int frac);
static int   lag_max(FLOAT signal[],int L_frame,int pit_max,
                  int pit_min, FLOAT *cor_max);
static FLOAT inv_sqrt( FLOAT x  );

/*----------------------------------------------------------------------------
 * pitch_ol -  compute the open loop pitch lag
 *----------------------------------------------------------------------------
 */
int pitch_ol(           /* output: open-loop pitch lag */
 FLOAT signal[],        /* input : signal to compute pitch  */
                        /*         s[-PIT_MAX : l_frame-1]  */
   int pit_min,         /* input : minimum pitch lag                          */
   int pit_max,         /* input : maximum pitch lag                          */
   int l_frame          /* input : error minimization window */
)
{
    FLOAT  max1, max2, max3;
    int    p_max1, p_max2, p_max3;

   /*--------------------------------------------------------------------*
    *  The pitch lag search is divided in three sections.                *
    *  Each section cannot have a pitch multiple.                        *
    *  We find a maximum for each section.                               *
    *  We compare the maxima of each section by favoring small lag.      *
    *                                                                    *
    *  First section:  lag delay = PIT_MAX to 80                         *
    *  Second section: lag delay = 79 to 40                              *
    *  Third section:  lag delay = 39 to 20                              *
    *--------------------------------------------------------------------*/

    p_max1 = lag_max(signal, l_frame, pit_max, 80 , &max1);
    p_max2 = lag_max(signal, l_frame, 79     , 40 , &max2);
    p_max3 = lag_max(signal, l_frame, 39     , pit_min , &max3);

   /*--------------------------------------------------------------------*
    * Compare the 3 sections maxima, and favor small lag.                *
    *--------------------------------------------------------------------*/

    if ( max1 * THRESHPIT < max2 ) {
        max1 = max2;
        p_max1 = p_max2;
    }

    if ( max1 * THRESHPIT < max3 )  p_max1 = p_max3;

    return (p_max1);
}
/*----------------------------------------------------------------------------
 * lag_max - Find the lag that has maximum correlation
 *----------------------------------------------------------------------------
 */
static int lag_max(     /* output: lag found */
  FLOAT signal[],       /* input : Signal to compute the open loop pitch
                                   signal[-142:-1] should be known.       */
  int l_frame,          /* input : Length of frame to compute pitch       */
  int lagmax,           /* input : maximum lag                            */
  int lagmin,           /* input : minimum lag                            */
  FLOAT *cor_max        /* input : normalized correlation of selected lag */
)
{
    int    i, j;
    FLOAT  *p, *p1;
    FLOAT  max, t0;
    int    p_max;

    max = FLT_MIN_G729;

    for (i = lagmax; i >= lagmin; i--) {
        p  = signal;
        p1 = &signal[-i];
        t0 = (F)0.0;

        for (j=0; j<l_frame; j++) {
            t0 += *p++ * *p1++;
        }

        if (t0 >= max) {
            max    = t0;
            p_max = i;
        }
    }

    /* compute energy */

    t0 = (F)0.01;                  /* to avoid division by zero */
    p = &signal[-p_max];
    for(i=0; i<l_frame; i++, p++) {
        t0 += *p * *p;
    }
    t0 = inv_sqrt(t0);          /* 1/sqrt(energy)    */

    *cor_max = max * t0;        /* max/sqrt(energy)  */

    return(p_max);
}


/*----------------------------------------------------------------------------
 * pitch_fr3 - find the pitch period  with 1/3 subsample resolution
 *----------------------------------------------------------------------------
 */
int pitch_fr3(          /* output: integer part of pitch period        */
 FLOAT exc[],           /* input : excitation buffer                   */
 FLOAT xn[],            /* input : target vector                       */
 FLOAT h[],             /* input : impulse response of filters.        */
 int l_subfr,           /* input : Length of frame to compute pitch    */
 int t0_min,            /* input : minimum value in the searched range */
 int t0_max,            /* input : maximum value in the searched range */
 int i_subfr,           /* input : indicator for first subframe        */
 int *pit_frac          /* output: chosen fraction                     */
)
{
  int    i, frac;
  int    lag, t_min, t_max;
  FLOAT  max;
  FLOAT  corr_int;
  FLOAT  corr_v[10+2*L_INTER4];  /* size: 2*L_INTER4+t0_max-t0_min+1 */
  FLOAT  *corr;

  /* Find interval to compute normalized correlation */

  t_min = t0_min - L_INTER4;
  t_max = t0_max + L_INTER4;

  corr = &corr_v[-t_min];    /* corr[t_min:t_max] */

  /* Compute normalized correlation between target and filtered excitation */

  norm_corr(exc, xn, h, l_subfr, t_min, t_max, corr);

  /* find integer pitch */

  max = corr[t0_min];
  lag  = t0_min;

  for(i= t0_min+1; i<=t0_max; i++)
  {
    if( corr[i] >= max)
    {
      max = corr[i];
      lag = i;
    }
  }

  /* If first subframe and lag > 84 do not search fractionnal pitch */

  if( (i_subfr == 0) && (lag > 84) )
  {
    *pit_frac = 0;
    return(lag);
  }

  /* test the fractions around lag and choose the one which maximizes
     the interpolated normalized correlation */

  max  = interpol_3(&corr[lag], -2);
  frac = -2;

  for (i = -1; i <= 2; i++)
  {
    corr_int = interpol_3(&corr[lag], i);
    if(corr_int > max)
    {
      max = corr_int;
      frac = i;
    }
  }

  /* limit the fraction value in the interval [-1,0,1] */

  if (frac == -2)
  {
    frac = 1;
    lag -= 1;
  }
  if (frac == 2)
  {
    frac = -1;
    lag += 1;
  }

  *pit_frac = frac;

  return lag;
}

/*----------------------------------------------------------------------------
 * norm_corr - Find the normalized correlation between the target vector and
 *             the filtered past excitation.
 *----------------------------------------------------------------------------
 */
static void norm_corr(
 FLOAT exc[],           /* input : excitation buffer */
 FLOAT xn[],            /* input : target vector */
 FLOAT h[],             /* input : imp response of synth and weighting flt */
 int l_subfr,           /* input : Length of frame to compute pitch */
 int t_min,             /* input : minimum value of searched range */
 int t_max,             /* input : maximum value of search range */
 FLOAT corr_norm[]      /* output: normalized correlation (correlation between
                                   target and filtered excitation divided by
                                   the square root of energy of filtered
                                    excitation) */
)
{
 int    i, j, k;
 FLOAT excf[L_SUBFR];     /* filtered past excitation */
 FLOAT  alp, s, norm;

 k = -t_min;

 /* compute the filtered excitation for the first delay t_min */

 convolve(&exc[k], h, excf, l_subfr);

 /* loop for every possible period */

 for (i = t_min; i <= t_max; i++)
 {
   /* Compute 1/sqrt(energie of excf[]) */

   alp = (F)0.01;
   for (j = 0; j < l_subfr; j++)
     alp += excf[j]*excf[j];

   norm = inv_sqrt(alp);


   /* Compute correlation between xn[] and excf[] */

   s = (F)0.0;
   for (j = 0; j < l_subfr; j++)  s += xn[j]*excf[j];


   /* Normalize correlation = correlation * (1/sqrt(energie)) */

   corr_norm[i] = s*norm;

   /* modify the filtered excitation excf[] for the next iteration */

   if (i != t_max)
   {
     k--;
     for (j = l_subfr-1; j > 0; j--)
        excf[j] = excf[j-1] + exc[k]*h[j];
     excf[0] = exc[k];
   }
 }

 return;

}
/*----------------------------------------------------------------------------
 * g_pitch - compute adaptive codebook gain and compute <y1,y1> , -2<xn,y1>
 *----------------------------------------------------------------------------
 */

FLOAT g_pitch(          /* output: pitch gain */
 FLOAT xn[],            /* input : target vector */
 FLOAT y1[],            /* input : filtered adaptive codebook vector */
 FLOAT g_coeff[],       /* output: <y1,y1> and -2<xn,y1> */
 int l_subfr            /* input : vector dimension */
)
{
    FLOAT xy, yy, gain;
    int   i;

    xy = (F)0.0;
    for (i = 0; i < l_subfr; i++) {
        xy += xn[i] * y1[i];
    }
    yy = (F)0.01;
    for (i = 0; i < l_subfr; i++) {
        yy += y1[i] * y1[i];          /* energy of filtered excitation */
    }
    g_coeff[0] = yy;
    g_coeff[1] = (F)-2.0*xy +(F)0.01;

    /* find pitch gain and bound it by [0,1.2] */

    gain = xy/yy;

    if (gain<(F)0.0)  gain = (F)0.0;
    if (gain>GAIN_PIT_MAX) gain = GAIN_PIT_MAX;

    return gain;
}

/*----------------------------------------------------------------------*
 *    Function enc_lag3()                                               *
 *             ~~~~~~~~~~                                               *
 *   Encoding of fractional pitch lag with 1/3 resolution.              *
 *----------------------------------------------------------------------*
 * The pitch range for the first subframe is divided as follows:        *
 *   19 1/3  to   84 2/3   resolution 1/3                               *
 *   85      to   143      resolution 1                                 *
 *                                                                      *
 * The period in the first subframe is encoded with 8 bits.             *
 * For the range with fractions:                                        *
 *   index = (T-19)*3 + frac - 1;   where T=[19..85] and frac=[-1,0,1]  *
 * and for the integer only range                                       *
 *   index = (T - 85) + 197;        where T=[86..143]                   *
 *----------------------------------------------------------------------*
 * For the second subframe a resolution of 1/3 is always used, and the  *
 * search range is relative to the lag in the first subframe.           *
 * If t0 is the lag in the first subframe then                          *
 *  t_min=t0-5   and  t_max=t0+4   and  the range is given by           *
 *       t_min - 2/3   to  t_max + 2/3                                  *
 *                                                                      *
 * The period in the 2nd subframe is encoded with 5 bits:               *
 *   index = (T-(t_min-1))*3 + frac - 1;    where T[t_min-1 .. t_max+1] *
 *----------------------------------------------------------------------*/
int  enc_lag3(     /* output: Return index of encoding */
  int  T0,         /* input : Pitch delay              */
  int  T0_frac,    /* input : Fractional pitch delay   */
  int  *T0_min,    /* in/out: Minimum search delay     */
  int  *T0_max,    /* in/out: Maximum search delay     */
  int pit_min,     /* input : Minimum pitch delay      */
  int pit_max,     /* input : Maximum pitch delay      */
  int  pit_flag    /* input : Flag for 1st subframe    */
)
{
  int index;

  if (pit_flag == 0)   /* if 1st subframe */
  {
     /* encode pitch delay (with fraction) */

     if (T0 <= 85)
       index = T0*3 - 58 + T0_frac;
     else
       index = T0 + 112;

     /* find T0_min and T0_max for second subframe */

     *T0_min = T0 - 5;
     if (*T0_min < pit_min) *T0_min = pit_min;
     *T0_max = *T0_min + 9;
     if (*T0_max > pit_max)
     {
         *T0_max = pit_max;
         *T0_min = *T0_max - 9;
     }
  }

  else                    /* second subframe */
  {
     index = T0 - *T0_min;
     index = index*3 + 2 + T0_frac;
  }
  return index;
}

/*----------------------------------------------------------------------------
 * interpol_3 - For interpolating the normalized correlation
 *----------------------------------------------------------------------------
 */
static FLOAT interpol_3(   /* output: interpolated value */
 FLOAT *x,              /* input : function to be interpolated */
 int frac               /* input : fraction value to evaluate */
)
{
  int i;
  FLOAT s, *x1, *x2, *c1, *c2;


  if (frac < 0) {
    frac += UP_SAMP;
    x--;
  }
  x1 = &x[0];
  x2 = &x[1];
  c1 = &inter_3[frac];
  c2 = &inter_3[UP_SAMP-frac];

  s = (F)0.0;
  for(i=0; i< L_INTER4; i++, c1+=UP_SAMP, c2+=UP_SAMP)
     s+= (*x1--) * (*c1) + (*x2++) * (*c2);

  return s;
}

/*----------------------------------------------------------------------------
 * inv_sqrt - compute y = 1 / sqrt(x)
 *----------------------------------------------------------------------------
 */
static FLOAT inv_sqrt(         /* output: 1/sqrt(x) */
 FLOAT x                /* input : value of x */
)
{
   return ((F)1.0 / (FLOAT)sqrt((double)x) );
}
⌨️ 快捷键说明

复制代码 Ctrl + C
搜索代码 Ctrl + F
全屏模式 F11
切换主题 Ctrl + Shift + D
显示快捷键 ?
增大字号 Ctrl + =
减小字号 Ctrl + -