首页 › 资源下载 › Java编程 › It is the Speech rec › 源码查看
livemoderecognizer.java

来自「It is the Speech recognition software. 」· Java 代码 · 共 367 行
JAVA
367 行
/* * Copyright 1999-2002 Carnegie Mellon University.   * Portions Copyright 2002 Sun Microsystems, Inc.   * Portions Copyright 2002 Mitsubishi Electric Research Laboratories. * All Rights Reserved.  Use is subject to license terms. *  * See the file "license.terms" for information on usage and * redistribution of this file, and for a DISCLAIMER OF ALL  * WARRANTIES. * */package edu.cmu.sphinx.tools.live;import java.io.File;import java.io.FileWriter;import java.io.IOException;import java.net.URL;import java.util.Iterator;import java.util.LinkedList;import java.util.List;import edu.cmu.sphinx.frontend.util.ConcatFileDataSource;import edu.cmu.sphinx.recognizer.Recognizer;import edu.cmu.sphinx.result.Result;import edu.cmu.sphinx.util.GapInsertionDetector;import edu.cmu.sphinx.util.NISTAlign;import edu.cmu.sphinx.util.ReferenceSource;import edu.cmu.sphinx.util.Timer;import edu.cmu.sphinx.util.props.Configurable;import edu.cmu.sphinx.util.props.ConfigurationManager;import edu.cmu.sphinx.util.props.PropertyException;import edu.cmu.sphinx.util.props.PropertySheet;import edu.cmu.sphinx.util.props.PropertyType;import edu.cmu.sphinx.util.props.Registry;/** * Decodes a batch file containing a list of files to decode. The files can be * either audio files or cepstral files, but defaults to audio files. */public class LiveModeRecognizer implements Configurable {    /**     * The SphinxProperty name for how many files to skip for every decode.     */    public final static String PROP_SKIP = "skip";    /**     * The default value for the property PROP_SKIP.     */    public final static int PROP_SKIP_DEFAULT = 0;    /**     * The Sphinx property that specifies the recognizer to use     */    public final static String PROP_RECOGNIZER = "recognizer";    /**     * The Sphinx property that specifies the source of the transcript     */    public final static String PROP_INPUT_SOURCE = "inputSource";    /**     * SphinxProperty specifying whether to print out the gap insertion errors.     */    public static final String PROP_SHOW_GAP_INSERTIONS = "showGapInsertions";    /**     * Default value for PROP_SHOW_GAP_INSERTIONS.     */    public static final boolean PROP_SHOW_GAP_INSERTIONS_DEFAULT = false;    /**     * SphinxProperty specifying the transcript file.     */    public final static String PROP_HYPOTHESIS_TRANSCRIPT = "hypothesisTranscript";    /**     * The default value of PROP_TRANSCRIPT.     */    public final static String PROP_HYPOTHESIS_TRANSCRIPT_DEFAULT = "hypothesis.txt";    /**     * SphinxProperty specifying the number of files to decode before alignment     * is performed.     */    public final static String PROP_ALIGN_INTERVAL = "alignInterval";    /**     * The default value of PROP_ALIGN_INTERVAL.     */    public final static int PROP_ALIGN_INTERVAL_DEFAULT = -1;    // TODO - the instrumentation in here that is looking for gap insertions    // and performing the alignment and reporting of the live summary data    // should probably be moved to a separate instrumentation package, much    // like the AccuracyTracker.    // -------------------------------    // Configuration data    // --------------------------------    private String name;    private int skip;    private Recognizer recognizer;    private ConcatFileDataSource dataSource;    private String hypothesisFile;    private boolean showGapInsertions;    // -------------------------------    // Working data    // --------------------------------    private int alignInterval;    private int numUtterances;    private FileWriter hypothesisTranscript;    private ReferenceSource referenceSource;    private GapInsertionDetector gapInsertionDetector;    private NISTAlign aligner = new NISTAlign(true, true);    /*     * (non-Javadoc)     *      * @see edu.cmu.sphinx.util.props.Configurable#register(java.lang.String,     *      edu.cmu.sphinx.util.props.Registry)     */    public void register(String name, Registry registry)            throws PropertyException {        this.name = name;        registry.register(PROP_SKIP, PropertyType.INT);        registry.register(PROP_RECOGNIZER, PropertyType.COMPONENT);        registry.register(PROP_INPUT_SOURCE, PropertyType.COMPONENT);        registry.register(PROP_SHOW_GAP_INSERTIONS, PropertyType.BOOLEAN);        registry.register(PROP_ALIGN_INTERVAL, PropertyType.INT);        registry.register(PROP_HYPOTHESIS_TRANSCRIPT, PropertyType.STRING);    }    /*     * (non-Javadoc)     *      * @see edu.cmu.sphinx.util.props.Configurable#newProperties(edu.cmu.sphinx.util.props.PropertySheet)     */    public void newProperties(PropertySheet ps) throws PropertyException {        skip = ps.getInt(PROP_SKIP, PROP_SKIP_DEFAULT);        recognizer = (Recognizer) ps.getComponent(PROP_RECOGNIZER,                Recognizer.class);        dataSource = (ConcatFileDataSource) ps.getComponent(PROP_INPUT_SOURCE,                ConcatFileDataSource.class);        showGapInsertions = ps.getBoolean(PROP_SHOW_GAP_INSERTIONS,                PROP_SHOW_GAP_INSERTIONS_DEFAULT);        hypothesisFile = ps.getString(PROP_HYPOTHESIS_TRANSCRIPT,                PROP_HYPOTHESIS_TRANSCRIPT_DEFAULT);        alignInterval = ps.getInt(PROP_ALIGN_INTERVAL,                PROP_ALIGN_INTERVAL_DEFAULT);        referenceSource = dataSource;    }    /*     * (non-Javadoc)     *      * @see edu.cmu.sphinx.util.props.Configurable#getName()     */    public String getName() {        return name;    }    /**     * Decodes the batch of audio files     */    public void decode() throws IOException {        List resultList = new LinkedList();        Result result = null;        int startReference = 0;        hypothesisTranscript = new FileWriter(hypothesisFile);        recognizer.allocate();        while ((result = recognizer.recognize()) != null) {            numUtterances++;            String resultText = result.getBestResultNoFiller();            System.out.println("\nHYP: " + resultText);            System.out.println("   Sentences: " + numUtterances);            resultList.add(resultText);            hypothesisTranscript.write(result.getTimedBestResult(false, true)                    + "\n");            hypothesisTranscript.flush();            if (alignInterval > 0 && (numUtterances % alignInterval == 0)) {                // perform alignment if the property 'alignInterval' is set                List references = referenceSource.getReferences();                List section = references.subList(startReference, references                        .size());                alignResults(resultList, section);                resultList = new LinkedList();                startReference = references.size();            }        }        hypothesisTranscript.close();        // perform alignment on remaining results        List references = referenceSource.getReferences();        List section = references.subList(startReference, references.size());        if (resultList.size() > 0 || section.size() > 0) {            alignResults(resultList, section);        }        System.out.println("# ------------- Summary Statistics -------------");        aligner.printTotalSummary();        recognizer.deallocate();        showLiveSummary();        System.out.println();    }    /**     * Shows the test statistics that relates to live mode decoding.     *      */    private void showLiveSummary() throws IOException {        int actualUtterances = referenceSource.getReferences().size();        int gapInsertions = detectGapInsertionErrors();                System.out.println            ("   Utterances:  Actual: " + actualUtterances +              "  Found: " + numUtterances);        System.out.println            ("   Gap Insertions: " + gapInsertions);    }    /**     * Detect gap insertion errors.     */    private int detectGapInsertionErrors() throws IOException {        Timer gapTimer = Timer.getTimer("GapInsertionDetector");        gapTimer.start();        GapInsertionDetector gid = new GapInsertionDetector(dataSource                .getTranscriptFile(), hypothesisFile, showGapInsertions);        int gapInsertions = gid.detect();        gapTimer.stop();        return gapInsertions;    }    /**     * Align the list of results with reference text. This method figures out     * how many words and sentences match, and the different types of errors.     *      * @param hypothesisList     *                the list of hypotheses     * @param referenceList     *                the list of references     */    private void alignResults(List hypothesisList, List referenceList) {        System.out.println();        System.out.println("Aligning results...");        System.out.println("   Utterances: Found: " + hypothesisList.size()                + "   Actual: " + referenceList.size());        String hypothesis = listToString(hypothesisList);        String reference = listToString(referenceList);        saveAlignedText(hypothesis, reference);        getAlignTimer().start();        aligner.align(reference, hypothesis);        getAlignTimer().stop();        System.out.println(" ...done aligning");        System.out.println();    }    /**     * Saves the aligned hypothesis and reference text to the aligned text     * file.     *      * @param hypothesis     *                the aligned hypothesis text     * @param reference     *                the aligned reference text     */    private void saveAlignedText(String hypothesis, String reference) {        try {            FileWriter writer = new FileWriter("align.txt");            writer.write(hypothesis);            writer.write("\n");            writer.write(reference);            writer.close();        } catch (IOException ioe) {            ioe.printStackTrace();        }    }    /**     * Converts the given list of strings into one string, putting a space     * character in between the strings.     *      * @param resultList     *                the list of strings     *      * @return a string which is a concatenation of the strings in the list,     *         separated by a space character     */    private String listToString(List resultList) {        StringBuffer sb = new StringBuffer();        for (Iterator i = resultList.iterator(); i.hasNext();) {            String result = (String) i.next();            sb.append(result + " ");        }        return sb.toString();    }    /**     * Return the timer for alignment.     */    private Timer getAlignTimer() {        return Timer.getTimer("Align");    }    /**     * Do clean up     */    public void close() throws IOException {        hypothesisTranscript.close();    }    /**     * Main method of this BatchDecoder.     *      * @param argv     *                argv[0] : config file argv[1] : a file listing     *                all the audio files to decode     */    public static void main(String[] argv) {        if (argv.length != 1) {            System.out.println("Usage: LiveModeRecognizer config-file.xml ");            System.exit(1);        }        String cmFile = argv[0];        ConfigurationManager cm;        LiveModeRecognizer lmr = null;        try {            URL url = new File(cmFile).toURI().toURL();            cm = new ConfigurationManager(url);            lmr = (LiveModeRecognizer) cm.lookup("live");        } catch (IOException ioe) {            System.err.println("I/O error during initialization: \n   " + ioe);            return;        } catch (InstantiationException e) {            System.err.println("Error during initialization: \n  " + e);            return;        } catch (PropertyException e) {            System.err.println("Error during initialization: \n  " + e);            e.printStackTrace();            return;        }        if (lmr == null) {            System.err.println("Can't find liveModeRecognizer in " + cmFile);            return;        }        try {            lmr.decode();        } catch (IOException ioe) {            System.err                    .println("I/O error during decoding: " + ioe.getMessage());        }    }}
livemoderecognizer.java - 源码说明

本页面展示了「It is the Speech recognition software. It is platform independent. To execute the source code,」中的 livemoderecognizer.java 源码文件，采用 Java 编程语言编写，共 367 行代码。您可以在线阅读完整代码内容，也可以返回资源详情页下载完整源码包进行本地学习和开发。
虫虫下载站收录了大量与independent相关的技术资源，包括源代码、技术文档、电路图等，是电子工程师和嵌入式开发者的专业学习平台。
⌨️ 快捷键说明

复制代码Ctrl + C
搜索代码Ctrl + F
全屏模式F11
增大字号Ctrl + =
减小字号Ctrl + -
显示快捷键?