📄 live_dump.c

📁 CMU大名鼎鼎的SPHINX－3大词汇量连续语音识别系统
💻 C
字号:
/* ==================================================================== * Copyright (c) 1999-2004 Carnegie Mellon University.  All rights * reserved. * * Redistribution and use in source and binary forms, with or without * modification, are permitted provided that the following conditions * are met: * * 1. Redistributions of source code must retain the above copyright *    notice, this list of conditions and the following disclaimer.  * * 2. Redistributions in binary form must reproduce the above copyright *    notice, this list of conditions and the following disclaimer in *    the documentation and/or other materials provided with the *    distribution. * * This work was supported in part by funding from the Defense Advanced  * Research Projects Agency and the National Science Foundation of the  * United States of America, and the CMU Sphinx Speech Consortium. * * THIS SOFTWARE IS PROVIDED BY CARNEGIE MELLON UNIVERSITY ``AS IS'' AND  * ANY EXPRESSED OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO,  * THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR * PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL CARNEGIE MELLON UNIVERSITY * NOR ITS EMPLOYEES BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT  * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,  * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY  * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT  * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE  * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. * * ==================================================================== * *//************************************************* * CMU ARPA Speech Project * * Copyright (c) 2000 Carnegie Mellon University. * ALL RIGHTS RESERVED. ************************************************* * * 13-Apr-2001  Ricky Houghton *              Added live_free_memory to clean up memory allocated locally. * * 01-Jan-2000  Rita Singh (rsingh@cs.cmu.edu) at Carnegie Mellon University *		Created a separate function live_get_partialhyp() to  *		generate partial hypotheses from the kb structure * * 31-Dec-2000  Rita Singh (rsingh@cs.cmu.edu) at Carnegie Mellon University * Created */#include <utt.h>#include <profile.h>#include <kb.h>#include <fe.h> #include "live_dump.h"#include "fe_dump.h"#include "feat_dump.h"#include "cmd_ln_args.h"static fe_t  *fe;static kb_t  *kb;static kbcore_t *kbcore;static FILE  *hmmdumpfp;static partialhyp_t *parthyp = NULL;static float32 *dummyframe;/* This routine initializes decoder variables for live mode decoding */void live_initialize_decoder(char *live_args){    static kb_t live_kb;    int32   maxcepvecs, maxhyplen, samprate, ceplen;    param_t *fe_param;    metricsStart("Loading");    parse_args_file(live_args);    unlimit();    kb_init(&live_kb);    kb = &live_kb;    kbcore = kb->kbcore;    hmmdumpfp = cmd_ln_int32("-hmmdump") ? stderr : NULL;    maxhyplen = cmd_ln_int32 ("-maxhyplen");    if (!parthyp)         parthyp  = (partialhyp_t *) ckd_calloc(maxhyplen, sizeof(partialhyp_t));    fe_param = (param_t *) ckd_calloc(1, sizeof(param_t));    samprate = cmd_ln_int32 ("-samprate");    if (samprate != 8000 && samprate != 16000)	E_FATAL("Sampling rate %s not supported. Must be 8000 or 16000\n",samprate);    fe_param->SAMPLING_RATE = (float32) samprate;    fe_param->LOWER_FILT_FREQ = cmd_ln_float32("-lowerf");    fe_param->UPPER_FILT_FREQ = cmd_ln_float32("-upperf");    fe_param->NUM_FILTERS = cmd_ln_int32("-nfilt");    fe_param->FRAME_RATE = cmd_ln_int32("-frate");    fe_param->PRE_EMPHASIS_ALPHA = cmd_ln_float32("-alpha");    fe_param->FFT_SIZE = cmd_ln_int32("-nfft");    fe_param->WINDOW_LENGTH = cmd_ln_float32("-wlen");    fe_param->doublebw = cmd_ln_int32("-doublebw");    fe_param->machine_endian = cmd_ln_int32("-machine_endian");    fe_param->input_endian = cmd_ln_int32("-input_endian");    fe = fe_init(fe_param);    if (!fe)	E_FATAL("Front end initialization fe_init() failed\n");    maxcepvecs = cmd_ln_int32 ("-maxcepvecs");    ceplen = kbcore->fcb->cepsize;    dummyframe = (float32*) ckd_calloc(1 * ceplen,sizeof(float32));	/*  */    metricsStop("Loading");}/* RAH Apr.13.2001: Memory was being held, Added Call fe_close to release memory held by fe and then release locally allocated memory */int32 live_free_memory (){    parse_args_free(); /* Free memory allocated during the argument parseing stage */    fe_close (fe);		/*  */    kb_free (kb);		/*  */    ckd_free ((void *) dummyframe); /*  */    ckd_free ((void *) parthyp);  /*  */    return (0);}/******************************************************************* * This routine retrieves the part hypothesis from the kb structure * at any stage in the decoding. The "endutt" flag is needed to know * whether the utterance is to be considered terminated or not * The function stores the partial hypothesis in the global array * "parthyp" and returns the number of words in the hypothesis *******************************************************************/int32 live_get_partialhyp(int32 endutt){    int32 id, nwds;    glist_t   hyp;    gnode_t   *gn;    hyp_t     *h;    dict_t    *dict;    dict = kbcore_dict (kb->kbcore);    if (endutt)        id = vithist_utt_end(kb->vithist, kb->kbcore);    else        id = vithist_partialutt_end(kb->vithist, kb->kbcore);    if (id > 0) {        hyp = vithist_backtrace(kb->vithist,id);        for (gn = hyp,nwds=0; gn; gn = gnode_next(gn),nwds++) {            h = (hyp_t *) gnode_ptr (gn);            if (parthyp[nwds].word != NULL) {                ckd_free(parthyp[nwds].word);                parthyp[nwds].word = NULL;            }            parthyp[nwds].word = strdup(dict_wordstr(dict, h->id));            parthyp[nwds].sf = h->sf;            parthyp[nwds].ef = h->ef;	    parthyp[nwds].ascr = h->ascr;	    parthyp[nwds].lscr = h->lscr;        }        if (parthyp[nwds].word != NULL){            ckd_free(parthyp[nwds].word);            parthyp[nwds].word = NULL;        }        /* Free hyplist */        for (gn = hyp; gn && (gnode_next(gn)); gn = gnode_next(gn)) {            h = (hyp_t *) gnode_ptr (gn);            ckd_free ((void *) h);        }        glist_free (hyp);    } else {        nwds = 0;        if (parthyp[nwds].word != NULL) {            ckd_free(parthyp[nwds].word);            parthyp[nwds].word = NULL;        }    }    return(nwds);}/* Routine to decode a block of incoming samples. A partial hypothesis * for the utterance upto the current block of samples is returned. * The calling routine has to inform the routine if the block of samples * being passed is the final block of samples for an utterance by * setting live_endutt to 1. On receipt of a live_endutt flag the routine * automatically assumes that the next block of samples is the beginning * of a new utterance  */int32 live_utt_decode_block (int16 *samples, int32 nsamples, 		      int32 live_endutt, partialhyp_t **ohyp){    static int32 live_begin_new_utt = 1;    static int32 frmno;    static float32 ***live_feat = NULL;    int32   live_nfr, live_nfeatvec;    int32   nwds;    float32 **mfcbuf;    metricsStart("Decode");    if(live_feat==NULL)      live_feat = feat_array_alloc (kbcore_fcb(kbcore), LIVEBUFBLOCKSIZE);    if (live_begin_new_utt){        kb->uttid = "bogus ID";        fe_start_utt(fe);	utt_begin (kb);	frmno = 0;	kb->nfr = 0;        kb->utt_hmm_eval = 0;        kb->utt_sen_eval = 0;        kb->utt_gau_eval = 0;        live_begin_new_utt = 0;    }    /* 10.jan.01 RAH, fe_process_utt now requires ***mfcbuf and it allocates the memory internally) */    mfcbuf = NULL;    metricsStart("FrontEnd");    live_nfr = fe_dump_process_utt(fe, samples, nsamples, &mfcbuf); /*  */    if (live_endutt) {        /* RAH, It seems that we shouldn't throw out this data */        fe_dump_end_utt(fe,dummyframe); /* Flush out the fe */    }    /* Compute feature vectors */    live_nfeatvec = feat_dump_s2mfc2feat_block(kbcore_fcb(kbcore), mfcbuf,                                               live_nfr, live_begin_new_utt,                                               live_endutt, live_feat);    metricsStop("FrontEnd");    /* decode the block */    metricsStart("ScorePrune");    if(live_nfeatvec>0){      utt_decode_block (live_feat, live_nfeatvec, &frmno, kb, 			hmmdumpfp);    }        metricsStop("ScorePrune");    metricsStop("Decode");    /* Pull out partial hypothesis */    metricsStart("ExtractHypothesis");    nwds =  live_get_partialhyp(live_endutt);    *ohyp = parthyp;    metricsStop("ExtractHypothesis");    /* Clean up */    metricsStart("Decode");    if (live_endutt) {	live_begin_new_utt = 1;	kb->tot_fr += kb->nfr;	utt_end(kb);    }    else {	live_begin_new_utt = 0;    }    metricsStop("Decode");    /* I'm starting to think that fe_process_utt should not be       allocating its memory,       that or it should allocate some max and just keep on going,        this idea of constantly allocating freeing       memory seems dangerous to me.       ckd_free_2d((void **) mfcbuf);       RAH, this must be freed since fe_process_utt allocates it       */    return(nwds);}/** * Routine to run the frontend on a block of samples. */int32 live_fe_process_block (int16 *samples, int32 nsamples, 			     int32 live_endutt, partialhyp_t **ohyp){    static int32 live_begin_new_utt = 1;    static int32 frmno;    float32 **live_feat;    int32   live_nfr, live_nfeatvec;    float32 **mfcbuf;    if (live_begin_new_utt) {        fe_start_utt(fe);	frmno = 0;	kb->nfr = 0;        kb->utt_hmm_eval = 0;        kb->utt_sen_eval = 0;        kb->utt_gau_eval = 0;        live_begin_new_utt = 0;    }    /* 10.jan.01 RAH, fe_process_utt now requires ***mfcbuf       and it allocates the memory internally) */    mfcbuf = NULL;    metricsStart("FrontEnd");    live_nfr = fe_dump_process_utt(fe, samples, nsamples, &mfcbuf); /*  */    if (live_endutt) /* RAH, It seems that we shouldn't throw out this data */        fe_dump_end_utt(fe,dummyframe); /* Flush out the fe */    /* Compute feature vectors */    live_nfeatvec = feat_dump_s2mfc2feat_block(kbcore_fcb(kbcore), mfcbuf,                                               live_nfr, live_begin_new_utt,                                               live_endutt, &live_feat);    metricsStop("FrontEnd");    /* E_INFO ("live_nfeatvec: %ld\n",live_nfeatvec); */    if (fe_dump) {        fe_dump2d_float_frame(fe_dumpfile, live_feat, live_nfeatvec,                              feat_stream_len(kbcore_fcb(kbcore), 0),                              "FEATURE_FRAME", "FEATURE");    }    /* Clean up */    if (live_endutt) {	live_begin_new_utt = 1;	kb->tot_fr += kb->nfr;    }    else {	live_begin_new_utt = 0;    }    ckd_free_2d((void **) mfcbuf);    return 0;}void live_print_profiles(FILE *file){    ptmr_print_all(file, &kb->tm_sen, (float64) 1);    ptmr_print_all(file, &kb->tm_srch, (float64) 1);}
⌨️ 快捷键说明

复制代码 Ctrl + C
搜索代码 Ctrl + F
全屏模式 F11
切换主题 Ctrl + Shift + D
显示快捷键 ?
增大字号 Ctrl + =
减小字号 Ctrl + -