jconf.h

来自「julius version 4.12.about sound recognit」· C头文件 代码 · 共 1,202 行 · 第 1/2 页

H
1,202
字号
    /**     * Length threshold to detect short-pause segment in frames     */    int sp_frame_duration;    /**     * name string of pause model     *      */    char *pausemodelname;#ifdef SPSEGMENT_NAIST    /**     * Backstep margin when speech trigger detected by NAIST short-pause     * detection system     *      */    int sp_margin;    /**     * Delay frame of speech trigger detection in NAIST short-pause     * detection system     *      */    int sp_delay;#endif  } successive;  /**   * Annotation to the output   *    */  struct {#ifdef CONFIDENCE_MEASURE    /**     * Scaling factor for confidence scoring (-cmalpha)     */    LOGPROB cm_alpha;#ifdef   CM_MULTIPLE_ALPHA    /**     * Begin value of alpha     */    LOGPROB cm_alpha_bgn;    /**     * End value of alpha     */    LOGPROB cm_alpha_end;    /**     * Number of test values (will be set from above values)     */    int cm_alpha_num;    /**     * Step value of alpha     */    LOGPROB cm_alpha_step;#endif#ifdef   CM_SEARCH_LIMIT    /**     * Cut-off threshold for generated hypo. for confidence decoding (-cmthres)     */    LOGPROB cm_cut_thres;#endif#ifdef   CM_SEARCH_LIMIT_POPO    /**     * Cut-off threshold for popped hypo. for confidence decoding (-cmthres2)     */    LOGPROB cm_cut_thres_pop;#endif#endif /* CONFIDENCE_MEASURE */    /**     * Forced alignment: per word (-walign)     */    boolean align_result_word_flag;    /**     * Forced alignment: per phoneme (-palign)     */    boolean align_result_phoneme_flag;    /**     * Forced alignment: per state (-salign)     */    boolean align_result_state_flag;  } annotate;  /**   * Output configurations   *    */  struct {    /**     * Result: number of sentence to output (-output) , also see @a nbest (-n).     */    int output_hypo_maxnum;    /**     * Result: output partial recognition result on the 1st pass (-progout)     */    boolean progout_flag;    /**     * Result: Progressive output interval on 1st pass in msec (-proginterval)     */    int progout_interval;    /**     * Result: INTERNAL: interval in number of frames     */    int progout_interval_frame;    /**     * Get results for all grammars independently on 2nd pass on DFA     * (-multigramout / -nomultigramout)     */    boolean multigramout_flag;  } output;  /**   * Misc. switches   *    */  struct {    /**     * Enter trellis interactive check routine after boot (-check trellis)     */    boolean trellis_check_flag;    /**     * Enter triphone existence check routine after boot (-check triphone)     */    boolean triphone_check_flag;    /**     * Enter lexicon structure consulting mode after boot (-check wchmm)     */    boolean wchmm_check_flag;    /**     * should be set to TRUE at startup when this process should start     * with inactive status     *      */    boolean start_inactive;    /**     * In case the 2nd pass search fails, this option specifies Julius     * to use the result of the previous 1st pass as final result.     * When this is TRUE, no RECOGFAIL occur.     *      */    boolean fallback_pass1_flag;      } sw;  /* pointer to next instance */  struct __jconf_search__ *next;} JCONF_SEARCH;/** * Configuration parameters (global) *  */typedef struct __Jconf__ {  /**   * Input source information, gathered from all AM conf.   */  struct {    /**     * Input source type. (waveform / mfc)     *      */    int type;    /**     * Input source.     *      */    int speech_input;    /**     * Input device.     *      */    int device;    /**     * id of the selected plug-in if using plugin     *      */    int plugin_source;    /**     * Sampling frequency     *      */    long sfreq;    /**     * Sampling period in 100ns units     *      */    long period;    /**     * Window size in samples, similar to WINDOWSIZE in HTK (unit is different)     *      */    int framesize;    /**     * Frame shift length in samples     *      */    int frameshift;    /**     * Use 48kHz input and perform down sampling to 16kHz (-48)     */    boolean use_ds48to16;    /**     * List of input files for rawfile / mfcfile input (-filelist)      */    char *inputlist_filename;    /**     * Port number for adinnet input (-adport)     */    int adinnet_port;#ifdef USE_NETAUDIO    /**     * Host/unit name for NetAudio/DatLink input (-NA)     */    char *netaudio_devname;#endif    /**     * Check input parameter type with header of the hmmdefs     * for parameter file input.  FALSE avoids the check.     */    boolean paramtype_check_flag;  } input;  /**   * Configurations for Voice activity detection   *    */  struct {    /**     * Input level threshold from 0 to 32767 (-lv)     */    int level_thres;    /**     * Head margin in msec (-headmargin)     */    int head_margin_msec;    /**     * Tail margin in msec (-tailmargin)     */    int tail_margin_msec;    /**     * Zero cross number threshold per a second (-zc)     */    int zero_cross_num;    /**     * Silence detection and cutting: 0=off, 1=on, 2=accept device default     * (-cutsilence / -nocutsilence)     */    int silence_cut;#ifdef GMM_VAD    /**     * (GMM_VAD) Backstep margin when speech trigger is detected.     *      */    int gmm_margin;    /**     * (GMM_VAD) Up trigger threshold of GMM likelihood, where GMM     * likelihood is defined as \[ \max_{m \in M_v} p(x|m) - \max_{m     * \in M_n} p(x|m) \] where $M_v$ is a set of voice GMM, and $M_n$     * is a set of noise GMM whose names are specified by     * "-gmmreject".  Julius calculate this value for each input     * frame, and average it for the last gmm_margin frames, and when     * the value gets higher than this value, Julius will start recognition.     */    float gmm_uptrigger_thres;    /**     * (GMM_VAD) Down trigger threshold of GMM likelihood, where GMM     * likelihood is defined as \[ \max_{m \in M_v} p(x|m) - \max_{m     * \in M_n} p(x|m) \] where $M_v$ is a set of voice GMM, and $M_n$     * is a set of noise GMM whose names are specified by     * "-gmmreject".  Julius calculate this value for each input     * frame, and average it for the last gmm_margin frames, and when     * the value gets lower than this value, Julius will stop recognition.     */    float gmm_downtrigger_thres;#endif  } detect;  /**   * Pre-processing parameters before frontends   *    */  struct {    /**     * Strip off zero samples (-nostrip to unset)     */    boolean strip_zero_sample;    /**     * Remove DC offset by zero mean (-zmean / -nozmean)     */    boolean use_zmean;  } preprocess;  /**   * Models and parameters for input rejection   *    */  struct {    /**     * GMM definition file (-gmm)     */    char *gmm_filename;    /**     * Number of Gaussians to be computed on GMM calculation (-gmmnum)     */    int gmm_gprune_num;    /**     * Comma-separated list of GMM model name to be rejected (-gmmreject)     */    char *gmm_reject_cmn_string;    /**     * Length threshold to reject input (-rejectshort)     */    int rejectshortlen;#ifdef POWER_REJECT    /**     * Rejection power threshold     *      */    float powerthres;#endif  } reject;  /**   * decoding parameters to control recognition process (global)   *    */  struct {    /**     * INTERNAL: do on-the-fly decoding if TRUE (value depends on     * device default and forced_realtime.     */    boolean realtime_flag;            /**     * INTERNAL: TRUE if either of "-realtime" or "-norealtime" is     * explicitly specified by user.  When TRUE, the user-specified value     * in forced_realtime will be applied to realtime_flag.     */    boolean force_realtime_flag;        /**     * Force on-the-fly decoding on 1st pass with audio input and     * MAP-CMN (-realtime / -norealtime)     */    boolean forced_realtime;        /**     * TRUE if a kind of speech segmentation is enabled     *      */    boolean segment;  } decodeopt;  /**   * Configurations for acoustic models (HMM, HMMList) and am-specific   * parameters   *    */  JCONF_AM *am_root;  /**   * Language models (N-gram / DFA), dictionary, and related parameters.   *    */  JCONF_LM *lm_root;  /**   * Search parameters (LM/AM independent), annotation,   * and output parameters   *    */  JCONF_SEARCH *search_root;  /**   * Current JCONF_AM for reading options   *    */  JCONF_LM *lmnow;  /**   * Current JCONF_AM for reading options   *    */  JCONF_AM *amnow;  /**   * Current JCONF_AM for reading options   *    */  JCONF_SEARCH *searchnow;  /**   * Config parameters for GMM computation.   * (only gmmconf->analysis.* is used)   *    */  JCONF_AM *gmm;  /**   * Current option declaration mode while loading options   *    */  short optsection;  /**   * Whether option sectioning ristriction should be applied or not   *    */  boolean optsectioning;} Jconf;enum {  JCONF_OPT_DEFAULT,  JCONF_OPT_GLOBAL,  JCONF_OPT_AM,  JCONF_OPT_LM,  JCONF_OPT_SR,  SIZEOF_JCONF_OPT};#endif /* __J_JCONF_H__ *//*=======================================================  An OLD variable name mapping from old global.h to common.h  These data are bogus, left here only for reference=======================================================result_reorder_flag -> DELETEDadinnet_port ->jconf.input.adinnet_portalign_result_phoneme_flag ->jconf.annotate.align_result_phoneme_flagalign_result_state_flag ->jconf.annotate.align_result_state_flagalign_result_word_flag ->jconf.annotate.align_result_word_flagbackmax ->recog.backmaxbacktrellis ->recog.backtrellisccd_flag ->jconf.am.ccd_flagccd_flag_force ->jconf.am.ccd_flag_forcecm_alpha ->jconf.annotate.cm_alphacm_alpha_bgn ->jconf.annotate.cm_alpha_bgncm_alpha_end ->jconf.annotate.cm_alpha_endcm_alpha_num ->jconf.annotate.cm_alpha_numcm_alpha_step ->jconf.annotate.cm_alpha_stepcm_cut_thres ->jconf.annotate.cm_cut_threscm_cut_thres_pop ->jconf.annotate.cm_cut_thres_popcmn_loaded ->recog.cmn_loadedcmn_map_weight ->jconf.frontend.cmn_map_weightcmn_update ->jconf.frontend.cmn_updatecmnload_filename ->jconf.frontend.cmnload_filenamecmnsave_filename ->jconf.frontend.cmnsave_filenamecompute_only_1pass ->jconf.sw.compute_only_1passdfa ->model.dfadfa_filename ->jconf.lm.dfa_filenamedictfilename ->jconf.lm.dictfilenameenable_iwsp ->jconf.lm.enable_iwspenable_iwspword ->jconf.lm.enable_iwspwordenveloped_bestfirst_width ->jconf.search.pass2.enveloped_bestfirst_widthforce_realtime_flag ->jconf.search.pass1.force_realtime_flagforced_realtime ->jconf.search.pass1.forced_realtimeforcedict_flag ->jconf.lm.forcedict_flagframemaxscore ->recog.framemaxscorefrom_code ->jconf.output.from_codegmm ->model.gmmgmm_filename ->jconf.reject.gmm_filenamegmm_gprune_num ->jconf.reject.gmm_gprune_numgmm_reject_cmn_string ->jconf.reject.gmm_reject_cmn_stringgprune_method ->jconf.am.gprune_methodgramlist ->model.grammarsgramlist_root ->jconf.lm.gramlist_rootgraph_merge_neighbor_range ->jconf.graph.graph_merge_neighbor_rangegraph_totalwordnum ->recog.graph_totalwordnumgraphout_cut_depth ->jconf.graph.graphout_cut_depthgraphout_limit_boundary_loop_num ->jconf.graph.graphout_limit_boundary_loop_numgraphout_search_delay ->jconf.graph.graphout_search_delaygs_statenum ->jconf.am.gs_statenumhead_margin_msec ->jconf.detect.head_margin_msechead_silname ->jconf.lm.head_silnamehmm_gs ->model.hmm_gshmm_gs_filename ->jconf.am.hmm_gs_filenamehmmfilename ->jconf.am.hmmfilenamehmminfo ->model.hmminfohypo_overflow ->jconf.search.pass2.hypo_overflowinputlist_filename ->jconf.input.inputlist_filenameiw_cache_rate ->jconf.search.pass1.iw_cache_rateiwcdmaxn ->jconf.search.pass1.iwcdmaxniwcdmethod ->jconf.search.pass1.iwcdmethodiwsp_penalty ->jconf.lm.iwsp_penaltyiwspentry ->jconf.lm.iwspentrylevel_thres ->jconf.detect.level_threslm_penalty ->jconf.lm.lm_penaltylm_penalty2 ->jconf.lm.lm_penalty2lm_penalty_trans ->jconf.lm.lm_penalty_translm_weight ->jconf.lm.lm_weightlm_weight2 ->jconf.lm.lm_weight2lmp_specified ->jconf.lm.lmp_specifiedlmp2_specified ->jconf.lm.lmp2_specifiedlooktrellis_flag ->jconf.search.pass2.looktrellis_flaglookup_range ->jconf.search.pass2.lookup_rangemapfilename ->jconf.am.mapfilenamemixnum_thres ->jconf.am.mixnum_thresmodule_mode -> (app)module_port -> (app)module_sd -> (app)multigramout_flag ->jconf.output.multigramout_flagnbest ->jconf.search.pass2.nbestnetaudio_devname ->jconf.input.netaudio_devnamengram ->model.ngramngram_filename ->jconf.lm.ngram_filenamengram_filename_lr_arpa ->jconf.lm.ngram_filename_lr_arpangram_filename_rl_arpa ->jconf.lm.ngram_filename_rl_arpaold_iwcd_flag -> USE_OLD_IWCD (define.h)old_tree_function_flag ->jconf.search.pass1.old_tree_function_flagoutput_hypo_maxnum ->jconf.output.output_hypo_maxnumpara ->jconf.analysis.parapara_default ->jconf.analysis.para_defaultpara_hmm ->jconf.analysis.para_hmmpara_htk ->jconf.analysis.para_htkparamtype_check_flag ->jconf.analysis.paramtype_check_flagpass1_score ->recog.pass1_scorepass1_wnum ->recog.pass1_wnumpass1_wseq ->recog.pass1_wseqpenalty1 ->jconf.lm.penalty1penalty2 ->jconf.lm.penalty2peseqlen ->recog.peseqlenprogout_flag ->jconf.output.progout_flagprogout_interval ->jconf.output.progout_intervalprogout_interval_frame (beam.c) ->jconf.output.progout_intervalrealtime_flag ->jconf.search.pass1.realtime_flagrecord_dirname ->jconf.output.record_dirnamerejectshortlen ->jconf.reject.rejectshortlenrest_param ->recog.rest_paramresult_output -> (app)scan_beam_thres ->jconf.search.pass2.scan_beam_thresseparate_score_flag ->jconf.output.separate_score_flagseparate_wnum ->jconf.search.pass1.separate_wnumsilence_cut ->jconf.detect.silence_cutsp_break_2_begin_word ->recog.sp_break_2_begin_wordsp_break_2_end_word ->recog.sp_break_2_end_wordsp_break_last_nword ->recog.sp_break_last_nwordsp_break_last_nword_allow_override ->recog.sp_break_last_nword_allow_overridesp_break_last_word ->recog.sp_break_last_wordsp_frame_duration ->jconf.successive.sp_frame_durationspecified_trellis_beam_width ->jconf.search.pass1.specified_trellis_beam_widthspeech ->recog.speechspeech_input ->jconf.input.speech_inputspeechlen ->recog.speechlenspmodel_name ->jconf.am.spmodel_namessbuf ->recog.ssbufsscalc ->jconf.frontend.sscalcsscalc_len ->jconf.frontend.sscalc_lensslen ->recog.sslenssload_filename ->jconf.frontend.ssload_filenamestack_size ->jconf.search.pass2.stack_sizestrip_zero_sample ->jconf.frontend.strip_zero_sampletail_margin_msec ->jconf.detect.tail_margin_msectail_silname ->jconf.lm.tail_silnameto_code ->jconf.output.to_codetrellis_beam_width ->recog.trellis_beam_widthtrellis_check_flag ->jconf.sw.trellis_check_flagtriphone_check_flag ->jconf.sw.triphone_check_flaguse_ds48to16 ->jconf.input.use_ds48to16use_zmean ->jconf.frontend.use_zmeanwchmm ->recog.wchmmwchmm_check_flag ->jconf.sw.wchmm_check_flagwinfo ->model.winfowpair_keep_nlimit ->jconf.search.pass1.wpair_keep_nlimitzero_cross_num ->jconf.detect.zero_cross_numverbose_flag -> (remain in global.h)debug2_flag -> (remain in global.h)*/ 

⌨️ 快捷键说明

复制代码Ctrl + C
搜索代码Ctrl + F
全屏模式F11
增大字号Ctrl + =
减小字号Ctrl + -
显示快捷键?