首页 › 资源下载 › 网络 › julius version 4.12. › 源码查看

wav2mfcc.c

来自「julius version 4.12.about sound recognit」· C语言代码 · 共 178 行

178 行

/** * @file   wav2mfcc.c *  * <JA> * @brief  泼魔翁ベクトル(MFCC)废误の换叫∈润悸箕粗惹∷ * * 掐蜗された不兰侨妨から·泼魔ベクトル废误を藐叫します.  * Julius/Julianで藐叫できる泼魔ベクトルは·MFCC の扦罢肌傅眶のもので· * _0, _E, _D, _A, _Z, _N の扦罢の寥圭わせをサポ〖トします.  * そのほか·岭墓やフレ〖ムシフト·掠拌カットなどのパラメ〖タを回年できます.  * 千急箕には·不读モデルのヘッダとチェックが乖われ·CMNの铜痰など * が疯年されます.  *  * ここの簇眶は·バッファ惧に眠姥された不兰侨妨デ〖タを办刨に * 泼魔ベクトル废误に恃垂するもので·ファイル掐蜗などに脱いられます.  * マイク掐蜗などで·掐蜗と士乖に千急を乖う眷圭は·ここの簇眶ではなく· * realtime-1stpass.c 柒で乖われます.  * </JA> *  * <EN> * @brief  Calculate feature vector (MFCC) sequence (non on-the-fly ver.) * * Parameter vector sequence extraction of input speech is done * here.  The supported parameter is MFCC, with any combination of * all the qualifiers in HTK: _0, _E, _D, _A, _Z, _N.  Acoustic model * for recognition should be trained with the same parameter type. * You can specify other parameters such as window size, frame shift, * high/low frequency cut-off via runtime options.  At startup, Julius * will check for the parameter types of acoustic model if it conforms * the limitation, and determine whether other additional processing * is needed such as Cepstral Mean Normalization. * * Functions below are used to convert fully buffered whole sentence * utterance, and typically used for audio file input.  When input * is concurrently processed with recognition process at 1st pass,  * in case of microphone input, the MFCC computation will be done * within functions in realtime-1stpass.c instead of these. * </EN> *  * @author Akinobu Lee * @date   Sun Sep 18 19:40:34 2005 * * $Revision: 1.2 $ *  *//* * Copyright (c) 1991-2007 Kawahara Lab., Kyoto University * Copyright (c) 2000-2005 Shikano Lab., Nara Institute of Science and Technology * Copyright (c) 2005-2007 Julius project team, Nagoya Institute of Technology * All rights reserved */#include <julius/julius.h>#include <sys/stat.h>/**  * <JA> * 不兰侨妨デ〖タから MFCC パラメ〖タを藐叫する. * エンジンインスタンス柒の MFCC 纷换インスタンスごとにパラメ〖タ藐叫が * 乖われ·それぞれの mfcc->param に呈羌される.  *  * @param speech [in] 不兰侨妨デ〖タ * @param speechlen [in] @a speech の墓さ∈帽疤¨サンプル眶∷ * @param recog [in] エンジンインスタンス *  * @return 喇根箕 TRUE, エラ〖箕 FALSE を手す.  * </JA> * <EN> * Extract MFCC parameters with sentence CMN from given waveform. * Parameters will be computed for each MFCC calculation instance * in the engine instance, and stored in mfcc->param for each. *  * @param speech [in] buffer of speech waveform * @param speechlen [in] length of @a speech in samples * @param recog [in] engine instance *  * @return TRUE on success, FALSE on error. * </EN> * * @callgraph * @callergraph */booleanwav2mfcc(SP16 speech[], int speechlen, Recog *recog){  int framenum;  int len;  Value *para;  MFCCCalc *mfcc;  /* calculate frame length from speech length, frame size and frame shift */  framenum = (int)((speechlen - recog->jconf->input.framesize) / recog->jconf->input.frameshift) + 1;  if (framenum < 1) {    jlog("WARNING: input too short (%d samples), ignored\n", speechlen);    return FALSE;  }  for(mfcc=recog->mfcclist;mfcc;mfcc=mfcc->next) {    if (mfcc->frontend.ssload_filename) {      /* setup for spectral subtraction using file */      if (mfcc->frontend.ssbuf == NULL) {	/* load noise spectrum for spectral subtraction from file (once) */	if ((mfcc->frontend.ssbuf = new_SS_load_from_file(mfcc->frontend.ssload_filename, &(mfcc->frontend.sslen))) == NULL) {	  jlog("ERROR: wav2mfcc: failed to read noise spectrum from file \"%s\"\n", mfcc->frontend.ssload_filename);	  return FALSE;	}      }    }    if (mfcc->frontend.sscalc) {      /* compute noise spectrum from head silence for each input */      len = mfcc->frontend.sscalc_len * recog->jconf->input.sfreq / 1000;      if (len > speechlen) len = speechlen;#ifdef SSDEBUG      jlog("DEBUG: [%d]\n", len);#endif      mfcc->frontend.ssbuf = new_SS_calculate(speech, len, &(mfcc->frontend.sslen), mfcc->frontend.mfccwrk_ss, mfcc->para);    }  }  /* compute mfcc from speech file for each mfcc instances */  for(mfcc=recog->mfcclist;mfcc;mfcc=mfcc->next) {    para = mfcc->para;    /* malloc new param */    param_init_content(mfcc->param);    if (param_alloc(mfcc->param, framenum, para->veclen) == FALSE) {      jlog("ERROR: failed to allocate memory for converted parameter vectors\n");      return FALSE;    }    if (mfcc->frontend.ssload_filename || mfcc->frontend.sscalc) {      /* make link from mfccs to this buffer */      mfcc->wrk->ssbuf = mfcc->frontend.ssbuf;      mfcc->wrk->ssbuflen = mfcc->frontend.sslen;      mfcc->wrk->ss_alpha = mfcc->frontend.ss_alpha;      mfcc->wrk->ss_floor = mfcc->frontend.ss_floor;    }      /* make MFCC from speech data */    if (Wav2MFCC(speech, mfcc->param->parvec, para, speechlen, mfcc->wrk) == FALSE) {      jlog("ERROR: failed to compute MFCC from input speech\n");      if (mfcc->frontend.sscalc) {	free(mfcc->frontend.ssbuf);	mfcc->frontend.ssbuf = NULL;      }      return FALSE;    }    /* set miscellaneous parameters */    mfcc->param->header.samplenum = framenum;    mfcc->param->header.wshift = para->smp_period * para->frameshift;    mfcc->param->header.sampsize = para->veclen * sizeof(VECT); /* not compressed */    mfcc->param->header.samptype = F_MFCC;    if (para->delta) mfcc->param->header.samptype |= F_DELTA;    if (para->acc) mfcc->param->header.samptype |= F_ACCL;    if (para->energy) mfcc->param->header.samptype |= F_ENERGY;    if (para->c0) mfcc->param->header.samptype |= F_ZEROTH;    if (para->absesup) mfcc->param->header.samptype |= F_ENERGY_SUP;    if (para->cmn) mfcc->param->header.samptype |= F_CEPNORM;    mfcc->param->veclen = para->veclen;    mfcc->param->samplenum = framenum;    if (mfcc->frontend.sscalc) {      free(mfcc->frontend.ssbuf);      mfcc->frontend.ssbuf = NULL;    }  }  return TRUE;}/* end of file */

wav2mfcc.c - 源码说明

本页面展示了「julius version 4.12.about sound recognition.」中的 wav2mfcc.c 源码文件，采用 C语言编程语言编写，共 178 行代码。您可以在线阅读完整代码内容，也可以返回资源详情页下载完整源码包进行本地学习和开发。

虫虫下载站收录了大量与recognition相关的技术资源，包括源代码、技术文档、电路图等，是电子工程师和嵌入式开发者的专业学习平台。

⌨️ 快捷键说明

复制代码Ctrl + C

搜索代码Ctrl + F

全屏模式F11

增大字号Ctrl + =

减小字号Ctrl + -

显示快捷键?