melp_syn.c

来自「melp谱的计算。本程序是语音编码melp的C程序实现」· C语言代码 · 共 484 行
484 行
/*2.4 kbps MELP Proposed Federal Standard speech coderversion 1.2Copyright (c) 1996, Texas Instruments, Inc.  Texas Instruments has intellectual property rights on the MELPalgorithm.  The Texas Instruments contact for licensing issues forcommercial and non-government use is William Gordon, Director,Government Contracts, Texas Instruments Incorporated, SemiconductorGroup (phone 972 480 7442).*//*    Name: melp_syn.c    Description: MELP synthesis      This program takes the new parameters for a speech      frame and synthesizes the output speech.  It keeps      an internal record of the previous frame parameters      to use for interpolation.			    Inputs:      *par - MELP parameter structure    Outputs:       speech[] - output speech signal    Returns: void*//* compiler include files */ #include <stdio.h>#include <math.h>#include "melp.h"#include "spbstd.h"#include "lpc.h"#include "mat.h"#include "vq.h"#include "fs.h"/* compiler constants */ #if (MIX_ORD > DISP_ORD)#define BEGIN MIX_ORD#else#define BEGIN DISP_ORD#endif#define TILT_ORD 1#define SYN_GAIN 1000.0#define	SCALEOVER	10#define PDEL SCALEOVER/* external memory references */ extern float bp_cof[NUM_BANDS][MIX_ORD+1];extern float disp_cof[DISP_ORD+1];extern float msvq_cb[];extern float fsvq_cb[];extern int fsvq_weighted;/* temporary memory */static float sigbuf[BEGIN+PITCHMAX];static float sig2[BEGIN+PITCHMAX];static float fs_real[PITCHMAX];/* permanent memory */ static int firstcall = 1; /* Just used for noise gain init */static int prev_gain_err;static float sigsave[PITCHMAX];static struct melp_param prev_par;static int syn_begin;static float prev_scale;static float noise_gain = MIN_NOISE;static float pulse_del[MIX_ORD],noise_del[MIX_ORD];static float lpc_del[LPC_ORD],ase_del[LPC_ORD],tilt_del[TILT_ORD];static float disp_del[DISP_ORD];static struct msvq_param vq_par;  /* MSVQ parameters */static struct msvq_param fs_vq_par;  /* Fourier series VQ parameters */static float w_fs_inv[NUM_HARM];/* these can be saved or recomputed */static float prev_pcof[MIX_ORD+1],prev_ncof[MIX_ORD+1];static float prev_tilt;static float prev_gain;void melp_syn(struct melp_param *par,float sp_out[]){    int i, gaincnt;    int erase;    int length;    float intfact, ifact, ifact_gain;    float gain,pulse_gain,pitch,jitter;    float curr_tilt,tilt_cof[TILT_ORD+1];    float temp,sig_prob;    float lsf[LPC_ORD+1];    float lpc[LPC_ORD+1];    float ase_num[LPC_ORD+1],ase_den[LPC_ORD+1];    float curr_pcof[MIX_ORD+1],curr_ncof[MIX_ORD+1];    float pulse_cof[MIX_ORD+1],noise_cof[MIX_ORD+1];        /* Copy previous period of processed speech to output array */    if (syn_begin > 0) {	if (syn_begin > FRAME) {	    v_equ(&sp_out[0],&sigsave[0],FRAME);	    /* past end: save remainder in sigsave[0] */	    v_equ(&sigsave[0],&sigsave[FRAME],syn_begin-FRAME);	}	else 	  v_equ(&sp_out[0],&sigsave[0],syn_begin);    }        erase = 0; /* no erasures yet */        /* Update MSVQ information */    par->msvq_stages = vq_par.num_stages;    par->msvq_bits = vq_par.num_bits;    par->msvq_levels = vq_par.num_levels;    par->msvq_index = vq_par.indices;    par->fsvq_index = fs_vq_par.indices;        /*	Read and decode channel input buffer	*/    erase = melp_chn_read(par,&prev_par);    if (par->uv_flag != 1 && !erase) { 	/* Un-weight Fourier magnitudes */	window(&par->fs_mag[0],w_fs_inv,&par->fs_mag[0],NUM_HARM);    }    /* Update adaptive noise level estimate based on last gain	*/    if (firstcall) {	firstcall = 0;	noise_gain = par->gain[NUM_GAINFR-1];    }        else if (!erase) {	for (i = 0; i < NUM_GAINFR; i++) {	    noise_est(par->gain[i],&noise_gain,UPCONST,DOWNCONST,		      MIN_NOISE,MAX_NOISE);	    /* Adjust gain based on noise level (noise suppression) */	    noise_sup(&par->gain[i],noise_gain,MAX_NS_SUP,MAX_NS_ATT,NFACT);	}	        }        /* Clamp LSP bandwidths to avoid sharp LPC filters */    lpc_clamp(par->lsf,BWMIN,LPC_ORD);        /* Calculate spectral tilt for current frame for spectral enhancement */    tilt_cof[0] = 1.0;    lpc_lsp2pred(par->lsf,lpc,LPC_ORD);    lpc_pred2refl(lpc,sig2,LPC_ORD);    if (sig2[1] < 0.0)      curr_tilt = 0.5*sig2[1];    else      curr_tilt = 0.0;        /* Disable pitch interpolation for high-pitched onsets */    if (par->pitch < 0.5*prev_par.pitch && 	par->gain[0] > 6.0 + prev_par.gain[NUM_GAINFR-1]) {		/* copy current pitch into previous */	prev_par.pitch = par->pitch;    }        /* Set pulse and noise coefficients based on voicing strengths */    v_zap(curr_pcof,MIX_ORD+1);    v_zap(curr_ncof,MIX_ORD+1);    for (i = 0; i < NUM_BANDS; i++) {	if (par->bpvc[i] > 0.5)	    v_add(curr_pcof,&bp_cof[i][0],MIX_ORD+1);	else	    v_add(curr_ncof,&bp_cof[i][0],MIX_ORD+1);    }	    /* Process each pitch period */        while (syn_begin < FRAME) {	/* interpolate previous and current parameters */	ifact = ((float) syn_begin ) / FRAME;				if (syn_begin >= GAINFR) {	    gaincnt = 2;	    ifact_gain = ((float) syn_begin-GAINFR) / GAINFR;	}	else {	    gaincnt = 1;	    ifact_gain = ((float) syn_begin) / GAINFR;	}		/* interpolate gain */	if (gaincnt > 1) {	    gain = ifact_gain*par->gain[gaincnt-1] + 		(1.0-ifact_gain)*par->gain[gaincnt-2];	}	else {	    gain = ifact_gain*par->gain[gaincnt-1] + 		(1.0-ifact_gain)*prev_par.gain[NUM_GAINFR-1];	}		/* Set overall interpolation path based on gain change */		temp = par->gain[NUM_GAINFR-1] - prev_par.gain[NUM_GAINFR-1];	if (fabs(temp) > 6) {	    /* Power surge: use gain adjusted interpolation */	    intfact = (gain - prev_par.gain[NUM_GAINFR-1]) / temp;	    if (intfact > 1.0)		intfact = 1.0;	    if (intfact < 0.0)		intfact = 0.0;	}	else	    /* Otherwise, linear interpolation */	    intfact = ((float) syn_begin) / FRAME;		/* interpolate LSF's and convert to LPC filter */	interp_array(prev_par.lsf,par->lsf,lsf,intfact,LPC_ORD+1);	lpc_lsp2pred(lsf,lpc,LPC_ORD);		/* Check signal probability for adaptive spectral enhancement filter */	sig_prob = lin_int_bnd(gain,noise_gain+12.0,noise_gain+30.0,			       0.0,1.0);	/* Calculate adaptive spectral enhancement filter coefficients */	ase_num[0] = 1.0;	lpc_bw_expand(lpc,ase_num,sig_prob*ASE_NUM_BW,LPC_ORD);	lpc_bw_expand(lpc,ase_den,sig_prob*ASE_DEN_BW,LPC_ORD);	tilt_cof[1] = sig_prob*(intfact*curr_tilt + 				(1.0-intfact)*prev_tilt);		/* interpolate pitch and pulse gain */	pitch = intfact*par->pitch + (1.0-intfact)*prev_par.pitch;	pulse_gain = SYN_GAIN*sqrt(pitch);		/* interpolate pulse and noise coefficients */	temp = sqrt(ifact);	interp_array(prev_pcof,curr_pcof,pulse_cof,temp,MIX_ORD+1);	interp_array(prev_ncof,curr_ncof,noise_cof,temp,MIX_ORD+1);		/* interpolate jitter */	jitter = ifact*par->jitter + 	    (1.0-ifact)*prev_par.jitter;		/* convert gain to linear */	gain = pow(10.0,0.05*gain);		/* Set period length based on pitch and jitter */	rand_num(&temp,1.0,1);	length = pitch * (1.0-jitter*temp) + 0.5;	if (length < PITCHMIN)	    length = PITCHMIN;	if (length > PITCHMAX)	    length = PITCHMAX;		/* Use inverse DFT for pulse excitation */	fill(fs_real,1.0,length);	fs_real[0] = 0.0;	interp_array(prev_par.fs_mag,par->fs_mag,&fs_real[1],intfact,		     NUM_HARM);	idft_real(fs_real,&sigbuf[BEGIN],length);		/* Delay overall signal by PDEL samples (circular shift) */	/* use fs_real as a scratch buffer */	v_equ(fs_real,&sigbuf[BEGIN],length);	v_equ(&sigbuf[BEGIN+PDEL],fs_real,length-PDEL);	v_equ(&sigbuf[BEGIN],&fs_real[length-PDEL],PDEL);		/* Scale by pulse gain */	v_scale(&sigbuf[BEGIN],pulse_gain,length);			/* Filter and scale pulse excitation */	v_equ(&sigbuf[BEGIN-MIX_ORD],pulse_del,MIX_ORD);	v_equ(pulse_del,&sigbuf[length+BEGIN-MIX_ORD],MIX_ORD);	zerflt(&sigbuf[BEGIN],pulse_cof,&sigbuf[BEGIN],MIX_ORD,length);		/* Get scaled noise excitation */	rand_num(&sig2[BEGIN],(1.732*SYN_GAIN),length);		/* Filter noise excitation */	v_equ(&sig2[BEGIN-MIX_ORD],noise_del,MIX_ORD);	v_equ(noise_del,&sig2[length+BEGIN-MIX_ORD],MIX_ORD);	zerflt(&sig2[BEGIN],noise_cof,&sig2[BEGIN],MIX_ORD,length);		/* Add two excitation signals (mixed excitation) */	v_add(&sigbuf[BEGIN],&sig2[BEGIN],length);		/* Adaptive spectral enhancement */	v_equ(&sigbuf[BEGIN-LPC_ORD],ase_del,LPC_ORD);	lpc_synthesis(&sigbuf[BEGIN],&sigbuf[BEGIN],ase_den,LPC_ORD,length);	v_equ(ase_del,&sigbuf[BEGIN+length-LPC_ORD],LPC_ORD);	zerflt(&sigbuf[BEGIN],ase_num,&sigbuf[BEGIN],LPC_ORD,length);	v_equ(&sigbuf[BEGIN-TILT_ORD],tilt_del,TILT_ORD);	v_equ(tilt_del,&sigbuf[length+BEGIN-TILT_ORD],TILT_ORD);	zerflt(&sigbuf[BEGIN],tilt_cof,&sigbuf[BEGIN],TILT_ORD,length);		/* Perform LPC synthesis filtering */	v_equ(&sigbuf[BEGIN-LPC_ORD],lpc_del,LPC_ORD);	lpc_synthesis(&sigbuf[BEGIN],&sigbuf[BEGIN],lpc,LPC_ORD,length);	v_equ(lpc_del,&sigbuf[length+BEGIN-LPC_ORD],LPC_ORD);			/* Adjust scaling of synthetic speech */	scale_adj(&sigbuf[BEGIN],gain,&prev_scale,length,SCALEOVER);	/* Implement pulse dispersion filter */	v_equ(&sigbuf[BEGIN-DISP_ORD],disp_del,DISP_ORD);	v_equ(disp_del,&sigbuf[length+BEGIN-DISP_ORD],DISP_ORD);	zerflt(&sigbuf[BEGIN],disp_cof,&sigbuf[BEGIN],DISP_ORD,length);			/* Copy processed speech to output array (not past frame end) */	if (syn_begin+length > FRAME) {	    v_equ(&sp_out[syn_begin],&sigbuf[BEGIN],FRAME-syn_begin);					    /* past end: save remainder in sigsave[0] */	    v_equ(&sigsave[0],&sigbuf[BEGIN+FRAME-syn_begin],		  length-(FRAME-syn_begin));	}				else	    v_equ(&sp_out[syn_begin],&sigbuf[BEGIN],length);			/* Update syn_begin for next period */	syn_begin += length;    }		    /* Save previous pulse and noise filters for next frame */    v_equ(prev_pcof,curr_pcof,MIX_ORD+1);    v_equ(prev_ncof,curr_ncof,MIX_ORD+1);        /* Copy current parameters to previous parameters for next time */    prev_par = *par;    prev_tilt = curr_tilt;        /* Update syn_begin for next frame */    syn_begin -= FRAME;    }/*  * * Subroutine melp_syn_init(): perform initialization for melp  *	synthesis * */void melp_syn_init(){    int i;    float w_fs[NUM_HARM];	    v_zap(prev_par.gain,NUM_GAINFR);    prev_par.pitch = UV_PITCH;    prev_par.lsf[0] = 0.0;    for (i = 1; i < LPC_ORD+1; i++)      prev_par.lsf[i] = prev_par.lsf[i-1] + (1.0/(LPC_ORD+1));    prev_par.jitter = 0.0;    v_zap(&prev_par.bpvc[0],NUM_BANDS);    prev_tilt=0.0;    prev_gain = 0.0;    prev_scale = 0.0;    syn_begin = 0;    noise_gain = MIN_NOISE;    firstcall = 1;    prev_gain_err = 0;    v_zap(pulse_del,MIX_ORD);    v_zap(noise_del,MIX_ORD);    v_zap(lpc_del,LPC_ORD);    v_zap(ase_del,LPC_ORD);    v_zap(tilt_del,TILT_ORD);    v_zap(disp_del,DISP_ORD);    v_zap(sig2,BEGIN+PITCHMAX);    v_zap(sigbuf,BEGIN+PITCHMAX);    v_zap(sigsave,PITCHMAX);    v_zap(prev_pcof,MIX_ORD+1);    v_zap(prev_ncof,MIX_ORD+1);    prev_ncof[MIX_ORD/2] = 1.0;	    fill(prev_par.fs_mag,1.0,NUM_HARM);    /*      * Initialize multi-stage vector quantization (read codebook)      */	     vq_par.num_best = MSVQ_M;    vq_par.num_stages = 4;    vq_par.dimension = 10;    /*      * Allocate memory for number of levels per stage and indices     * and for number of bits per stage      */     MEM_ALLOC(MALLOC,vq_par.num_levels,vq_par.num_stages,int);    MEM_ALLOC(MALLOC,vq_par.indices,vq_par.num_stages,int);    MEM_ALLOC(MALLOC,vq_par.num_bits,vq_par.num_stages,int);	    vq_par.num_levels[0] = 128;    vq_par.num_levels[1] = 64;    vq_par.num_levels[2] = 64;    vq_par.num_levels[3] = 64;	    vq_par.num_bits[0] = 7;    vq_par.num_bits[1] = 6;    vq_par.num_bits[2] = 6;    vq_par.num_bits[3] = 6;	    vq_par.cb = msvq_cb;	    /* Scale codebook to 0 to 1 */    if (fsvq_weighted == 0)      v_scale(vq_par.cb,(2.0/FSAMP),3200);    /*      * Initialize Fourier magnitude vector quantization (read codebook)      */	     fs_vq_par.num_best = 1;    fs_vq_par.num_stages = 1;    fs_vq_par.dimension = NUM_HARM;    /*      * Allocate memory for number of levels per stage and indices     * and for number of bits per stage      */     MEM_ALLOC(MALLOC,fs_vq_par.num_levels,fs_vq_par.num_stages,int);    MEM_ALLOC(MALLOC,fs_vq_par.indices,fs_vq_par.num_stages,int);    MEM_ALLOC(MALLOC,fs_vq_par.num_bits,fs_vq_par.num_stages,int);	    fs_vq_par.num_levels[0] = FS_LEVELS;	    fs_vq_par.num_bits[0] = FS_BITS;	    fs_vq_par.cb = fsvq_cb;	    /*      * Initialize fixed MSE weighting and inverse of weighting      */	    vq_fsw(w_fs, NUM_HARM, 60.0);    for (i = 0; i < NUM_HARM; i++)      w_fs_inv[i] = 1.0/w_fs[i];    /*      * Pre-weight codebook (assume single stage only)      */	    if (fsvq_weighted == 0)      {	  fsvq_weighted = 1;	  for (i = 0; i < fs_vq_par.num_levels[0]; i++)	    window(&fs_vq_par.cb[i*NUM_HARM],w_fs,&fs_vq_par.cb[i*NUM_HARM],		   NUM_HARM);      }	}
melp_syn.c - 源码说明

本页面展示了「melp谱的计算。本程序是语音编码melp的C程序实现」中的 melp_syn.c 源码文件，采用 C语言编程语言编写，共 484 行代码。您可以在线阅读完整代码内容，也可以返回资源详情页下载完整源码包进行本地学习和开发。
虫虫下载站收录了大量与melp相关的技术资源，包括源代码、技术文档、电路图等，是电子工程师和嵌入式开发者的专业学习平台。
⌨️ 快捷键说明

复制代码Ctrl + C
搜索代码Ctrl + F
全屏模式F11
增大字号Ctrl + =
减小字号Ctrl + -
显示快捷键?