jconf.h
来自「julius version 4.12.about sound recognit」· C头文件 代码 · 共 1,202 行 · 第 1/2 页
H
1,202 行
/** * Length threshold to detect short-pause segment in frames */ int sp_frame_duration; /** * name string of pause model * */ char *pausemodelname;#ifdef SPSEGMENT_NAIST /** * Backstep margin when speech trigger detected by NAIST short-pause * detection system * */ int sp_margin; /** * Delay frame of speech trigger detection in NAIST short-pause * detection system * */ int sp_delay;#endif } successive; /** * Annotation to the output * */ struct {#ifdef CONFIDENCE_MEASURE /** * Scaling factor for confidence scoring (-cmalpha) */ LOGPROB cm_alpha;#ifdef CM_MULTIPLE_ALPHA /** * Begin value of alpha */ LOGPROB cm_alpha_bgn; /** * End value of alpha */ LOGPROB cm_alpha_end; /** * Number of test values (will be set from above values) */ int cm_alpha_num; /** * Step value of alpha */ LOGPROB cm_alpha_step;#endif#ifdef CM_SEARCH_LIMIT /** * Cut-off threshold for generated hypo. for confidence decoding (-cmthres) */ LOGPROB cm_cut_thres;#endif#ifdef CM_SEARCH_LIMIT_POPO /** * Cut-off threshold for popped hypo. for confidence decoding (-cmthres2) */ LOGPROB cm_cut_thres_pop;#endif#endif /* CONFIDENCE_MEASURE */ /** * Forced alignment: per word (-walign) */ boolean align_result_word_flag; /** * Forced alignment: per phoneme (-palign) */ boolean align_result_phoneme_flag; /** * Forced alignment: per state (-salign) */ boolean align_result_state_flag; } annotate; /** * Output configurations * */ struct { /** * Result: number of sentence to output (-output) , also see @a nbest (-n). */ int output_hypo_maxnum; /** * Result: output partial recognition result on the 1st pass (-progout) */ boolean progout_flag; /** * Result: Progressive output interval on 1st pass in msec (-proginterval) */ int progout_interval; /** * Result: INTERNAL: interval in number of frames */ int progout_interval_frame; /** * Get results for all grammars independently on 2nd pass on DFA * (-multigramout / -nomultigramout) */ boolean multigramout_flag; } output; /** * Misc. switches * */ struct { /** * Enter trellis interactive check routine after boot (-check trellis) */ boolean trellis_check_flag; /** * Enter triphone existence check routine after boot (-check triphone) */ boolean triphone_check_flag; /** * Enter lexicon structure consulting mode after boot (-check wchmm) */ boolean wchmm_check_flag; /** * should be set to TRUE at startup when this process should start * with inactive status * */ boolean start_inactive; /** * In case the 2nd pass search fails, this option specifies Julius * to use the result of the previous 1st pass as final result. * When this is TRUE, no RECOGFAIL occur. * */ boolean fallback_pass1_flag; } sw; /* pointer to next instance */ struct __jconf_search__ *next;} JCONF_SEARCH;/** * Configuration parameters (global) * */typedef struct __Jconf__ { /** * Input source information, gathered from all AM conf. */ struct { /** * Input source type. (waveform / mfc) * */ int type; /** * Input source. * */ int speech_input; /** * Input device. * */ int device; /** * id of the selected plug-in if using plugin * */ int plugin_source; /** * Sampling frequency * */ long sfreq; /** * Sampling period in 100ns units * */ long period; /** * Window size in samples, similar to WINDOWSIZE in HTK (unit is different) * */ int framesize; /** * Frame shift length in samples * */ int frameshift; /** * Use 48kHz input and perform down sampling to 16kHz (-48) */ boolean use_ds48to16; /** * List of input files for rawfile / mfcfile input (-filelist) */ char *inputlist_filename; /** * Port number for adinnet input (-adport) */ int adinnet_port;#ifdef USE_NETAUDIO /** * Host/unit name for NetAudio/DatLink input (-NA) */ char *netaudio_devname;#endif /** * Check input parameter type with header of the hmmdefs * for parameter file input. FALSE avoids the check. */ boolean paramtype_check_flag; } input; /** * Configurations for Voice activity detection * */ struct { /** * Input level threshold from 0 to 32767 (-lv) */ int level_thres; /** * Head margin in msec (-headmargin) */ int head_margin_msec; /** * Tail margin in msec (-tailmargin) */ int tail_margin_msec; /** * Zero cross number threshold per a second (-zc) */ int zero_cross_num; /** * Silence detection and cutting: 0=off, 1=on, 2=accept device default * (-cutsilence / -nocutsilence) */ int silence_cut;#ifdef GMM_VAD /** * (GMM_VAD) Backstep margin when speech trigger is detected. * */ int gmm_margin; /** * (GMM_VAD) Up trigger threshold of GMM likelihood, where GMM * likelihood is defined as \[ \max_{m \in M_v} p(x|m) - \max_{m * \in M_n} p(x|m) \] where $M_v$ is a set of voice GMM, and $M_n$ * is a set of noise GMM whose names are specified by * "-gmmreject". Julius calculate this value for each input * frame, and average it for the last gmm_margin frames, and when * the value gets higher than this value, Julius will start recognition. */ float gmm_uptrigger_thres; /** * (GMM_VAD) Down trigger threshold of GMM likelihood, where GMM * likelihood is defined as \[ \max_{m \in M_v} p(x|m) - \max_{m * \in M_n} p(x|m) \] where $M_v$ is a set of voice GMM, and $M_n$ * is a set of noise GMM whose names are specified by * "-gmmreject". Julius calculate this value for each input * frame, and average it for the last gmm_margin frames, and when * the value gets lower than this value, Julius will stop recognition. */ float gmm_downtrigger_thres;#endif } detect; /** * Pre-processing parameters before frontends * */ struct { /** * Strip off zero samples (-nostrip to unset) */ boolean strip_zero_sample; /** * Remove DC offset by zero mean (-zmean / -nozmean) */ boolean use_zmean; } preprocess; /** * Models and parameters for input rejection * */ struct { /** * GMM definition file (-gmm) */ char *gmm_filename; /** * Number of Gaussians to be computed on GMM calculation (-gmmnum) */ int gmm_gprune_num; /** * Comma-separated list of GMM model name to be rejected (-gmmreject) */ char *gmm_reject_cmn_string; /** * Length threshold to reject input (-rejectshort) */ int rejectshortlen;#ifdef POWER_REJECT /** * Rejection power threshold * */ float powerthres;#endif } reject; /** * decoding parameters to control recognition process (global) * */ struct { /** * INTERNAL: do on-the-fly decoding if TRUE (value depends on * device default and forced_realtime. */ boolean realtime_flag; /** * INTERNAL: TRUE if either of "-realtime" or "-norealtime" is * explicitly specified by user. When TRUE, the user-specified value * in forced_realtime will be applied to realtime_flag. */ boolean force_realtime_flag; /** * Force on-the-fly decoding on 1st pass with audio input and * MAP-CMN (-realtime / -norealtime) */ boolean forced_realtime; /** * TRUE if a kind of speech segmentation is enabled * */ boolean segment; } decodeopt; /** * Configurations for acoustic models (HMM, HMMList) and am-specific * parameters * */ JCONF_AM *am_root; /** * Language models (N-gram / DFA), dictionary, and related parameters. * */ JCONF_LM *lm_root; /** * Search parameters (LM/AM independent), annotation, * and output parameters * */ JCONF_SEARCH *search_root; /** * Current JCONF_AM for reading options * */ JCONF_LM *lmnow; /** * Current JCONF_AM for reading options * */ JCONF_AM *amnow; /** * Current JCONF_AM for reading options * */ JCONF_SEARCH *searchnow; /** * Config parameters for GMM computation. * (only gmmconf->analysis.* is used) * */ JCONF_AM *gmm; /** * Current option declaration mode while loading options * */ short optsection; /** * Whether option sectioning ristriction should be applied or not * */ boolean optsectioning;} Jconf;enum { JCONF_OPT_DEFAULT, JCONF_OPT_GLOBAL, JCONF_OPT_AM, JCONF_OPT_LM, JCONF_OPT_SR, SIZEOF_JCONF_OPT};#endif /* __J_JCONF_H__ *//*======================================================= An OLD variable name mapping from old global.h to common.h These data are bogus, left here only for reference=======================================================result_reorder_flag -> DELETEDadinnet_port ->jconf.input.adinnet_portalign_result_phoneme_flag ->jconf.annotate.align_result_phoneme_flagalign_result_state_flag ->jconf.annotate.align_result_state_flagalign_result_word_flag ->jconf.annotate.align_result_word_flagbackmax ->recog.backmaxbacktrellis ->recog.backtrellisccd_flag ->jconf.am.ccd_flagccd_flag_force ->jconf.am.ccd_flag_forcecm_alpha ->jconf.annotate.cm_alphacm_alpha_bgn ->jconf.annotate.cm_alpha_bgncm_alpha_end ->jconf.annotate.cm_alpha_endcm_alpha_num ->jconf.annotate.cm_alpha_numcm_alpha_step ->jconf.annotate.cm_alpha_stepcm_cut_thres ->jconf.annotate.cm_cut_threscm_cut_thres_pop ->jconf.annotate.cm_cut_thres_popcmn_loaded ->recog.cmn_loadedcmn_map_weight ->jconf.frontend.cmn_map_weightcmn_update ->jconf.frontend.cmn_updatecmnload_filename ->jconf.frontend.cmnload_filenamecmnsave_filename ->jconf.frontend.cmnsave_filenamecompute_only_1pass ->jconf.sw.compute_only_1passdfa ->model.dfadfa_filename ->jconf.lm.dfa_filenamedictfilename ->jconf.lm.dictfilenameenable_iwsp ->jconf.lm.enable_iwspenable_iwspword ->jconf.lm.enable_iwspwordenveloped_bestfirst_width ->jconf.search.pass2.enveloped_bestfirst_widthforce_realtime_flag ->jconf.search.pass1.force_realtime_flagforced_realtime ->jconf.search.pass1.forced_realtimeforcedict_flag ->jconf.lm.forcedict_flagframemaxscore ->recog.framemaxscorefrom_code ->jconf.output.from_codegmm ->model.gmmgmm_filename ->jconf.reject.gmm_filenamegmm_gprune_num ->jconf.reject.gmm_gprune_numgmm_reject_cmn_string ->jconf.reject.gmm_reject_cmn_stringgprune_method ->jconf.am.gprune_methodgramlist ->model.grammarsgramlist_root ->jconf.lm.gramlist_rootgraph_merge_neighbor_range ->jconf.graph.graph_merge_neighbor_rangegraph_totalwordnum ->recog.graph_totalwordnumgraphout_cut_depth ->jconf.graph.graphout_cut_depthgraphout_limit_boundary_loop_num ->jconf.graph.graphout_limit_boundary_loop_numgraphout_search_delay ->jconf.graph.graphout_search_delaygs_statenum ->jconf.am.gs_statenumhead_margin_msec ->jconf.detect.head_margin_msechead_silname ->jconf.lm.head_silnamehmm_gs ->model.hmm_gshmm_gs_filename ->jconf.am.hmm_gs_filenamehmmfilename ->jconf.am.hmmfilenamehmminfo ->model.hmminfohypo_overflow ->jconf.search.pass2.hypo_overflowinputlist_filename ->jconf.input.inputlist_filenameiw_cache_rate ->jconf.search.pass1.iw_cache_rateiwcdmaxn ->jconf.search.pass1.iwcdmaxniwcdmethod ->jconf.search.pass1.iwcdmethodiwsp_penalty ->jconf.lm.iwsp_penaltyiwspentry ->jconf.lm.iwspentrylevel_thres ->jconf.detect.level_threslm_penalty ->jconf.lm.lm_penaltylm_penalty2 ->jconf.lm.lm_penalty2lm_penalty_trans ->jconf.lm.lm_penalty_translm_weight ->jconf.lm.lm_weightlm_weight2 ->jconf.lm.lm_weight2lmp_specified ->jconf.lm.lmp_specifiedlmp2_specified ->jconf.lm.lmp2_specifiedlooktrellis_flag ->jconf.search.pass2.looktrellis_flaglookup_range ->jconf.search.pass2.lookup_rangemapfilename ->jconf.am.mapfilenamemixnum_thres ->jconf.am.mixnum_thresmodule_mode -> (app)module_port -> (app)module_sd -> (app)multigramout_flag ->jconf.output.multigramout_flagnbest ->jconf.search.pass2.nbestnetaudio_devname ->jconf.input.netaudio_devnamengram ->model.ngramngram_filename ->jconf.lm.ngram_filenamengram_filename_lr_arpa ->jconf.lm.ngram_filename_lr_arpangram_filename_rl_arpa ->jconf.lm.ngram_filename_rl_arpaold_iwcd_flag -> USE_OLD_IWCD (define.h)old_tree_function_flag ->jconf.search.pass1.old_tree_function_flagoutput_hypo_maxnum ->jconf.output.output_hypo_maxnumpara ->jconf.analysis.parapara_default ->jconf.analysis.para_defaultpara_hmm ->jconf.analysis.para_hmmpara_htk ->jconf.analysis.para_htkparamtype_check_flag ->jconf.analysis.paramtype_check_flagpass1_score ->recog.pass1_scorepass1_wnum ->recog.pass1_wnumpass1_wseq ->recog.pass1_wseqpenalty1 ->jconf.lm.penalty1penalty2 ->jconf.lm.penalty2peseqlen ->recog.peseqlenprogout_flag ->jconf.output.progout_flagprogout_interval ->jconf.output.progout_intervalprogout_interval_frame (beam.c) ->jconf.output.progout_intervalrealtime_flag ->jconf.search.pass1.realtime_flagrecord_dirname ->jconf.output.record_dirnamerejectshortlen ->jconf.reject.rejectshortlenrest_param ->recog.rest_paramresult_output -> (app)scan_beam_thres ->jconf.search.pass2.scan_beam_thresseparate_score_flag ->jconf.output.separate_score_flagseparate_wnum ->jconf.search.pass1.separate_wnumsilence_cut ->jconf.detect.silence_cutsp_break_2_begin_word ->recog.sp_break_2_begin_wordsp_break_2_end_word ->recog.sp_break_2_end_wordsp_break_last_nword ->recog.sp_break_last_nwordsp_break_last_nword_allow_override ->recog.sp_break_last_nword_allow_overridesp_break_last_word ->recog.sp_break_last_wordsp_frame_duration ->jconf.successive.sp_frame_durationspecified_trellis_beam_width ->jconf.search.pass1.specified_trellis_beam_widthspeech ->recog.speechspeech_input ->jconf.input.speech_inputspeechlen ->recog.speechlenspmodel_name ->jconf.am.spmodel_namessbuf ->recog.ssbufsscalc ->jconf.frontend.sscalcsscalc_len ->jconf.frontend.sscalc_lensslen ->recog.sslenssload_filename ->jconf.frontend.ssload_filenamestack_size ->jconf.search.pass2.stack_sizestrip_zero_sample ->jconf.frontend.strip_zero_sampletail_margin_msec ->jconf.detect.tail_margin_msectail_silname ->jconf.lm.tail_silnameto_code ->jconf.output.to_codetrellis_beam_width ->recog.trellis_beam_widthtrellis_check_flag ->jconf.sw.trellis_check_flagtriphone_check_flag ->jconf.sw.triphone_check_flaguse_ds48to16 ->jconf.input.use_ds48to16use_zmean ->jconf.frontend.use_zmeanwchmm ->recog.wchmmwchmm_check_flag ->jconf.sw.wchmm_check_flagwinfo ->model.winfowpair_keep_nlimit ->jconf.search.pass1.wpair_keep_nlimitzero_cross_num ->jconf.detect.zero_cross_numverbose_flag -> (remain in global.h)debug2_flag -> (remain in global.h)*/
⌨️ 快捷键说明
复制代码Ctrl + C
搜索代码Ctrl + F
全屏模式F11
增大字号Ctrl + =
减小字号Ctrl + -
显示快捷键?