📄 Microphone.java
/*
 * Copyright 1999-2004 Carnegie Mellon University.
 * Portions Copyright 2004 Sun Microsystems, Inc.
 * Portions Copyright 2004 Mitsubishi Electric Research Laboratories.
 * All Rights Reserved.  Use is subject to license terms.
 *
 * See the file "license.terms" for information on usage and
 * redistribution of this file, and for a DISCLAIMER OF ALL
 * WARRANTIES.
 */

package edu.cmu.sphinx.frontend.util;

import java.io.IOException;
import java.util.LinkedList;
import java.util.List;
import java.util.logging.Logger;
import java.util.logging.Level;

import javax.sound.sampled.AudioFormat;
import javax.sound.sampled.AudioInputStream;
import javax.sound.sampled.AudioSystem;
import javax.sound.sampled.DataLine;
import javax.sound.sampled.Line;
import javax.sound.sampled.LineUnavailableException;
import javax.sound.sampled.TargetDataLine;
import javax.sound.sampled.LineListener;
import javax.sound.sampled.LineEvent;
import javax.sound.sampled.Mixer;

import edu.cmu.sphinx.frontend.BaseDataProcessor;
import edu.cmu.sphinx.frontend.Data;
import edu.cmu.sphinx.frontend.DataEndSignal;
import edu.cmu.sphinx.frontend.DataProcessingException;
import edu.cmu.sphinx.frontend.DataStartSignal;
import edu.cmu.sphinx.frontend.DoubleData;
import edu.cmu.sphinx.util.props.PropertyException;
import edu.cmu.sphinx.util.props.PropertySheet;
import edu.cmu.sphinx.util.props.PropertyType;
import edu.cmu.sphinx.util.props.Registry;

/**
 * <p>
 * A Microphone captures audio data from the system's underlying audio input
 * systems and converts it into Data objects. When the method
 * <code>startRecording()</code> is called, a new thread is created to
 * capture audio; it stops when <code>stopRecording()</code> is called.
 * Calling <code>getData()</code> returns the captured audio data as Data
 * objects.
 * </p>
 * <p>
 * This Microphone will attempt to obtain an audio device with the format
 * specified in the configuration. If a device with that format cannot be
 * obtained, it will try to obtain a device with an audio format that has a
 * higher sample rate than the configured sample rate, while the other
 * parameters of the format (i.e., sample size, endianness, sign, and
 * channels) remain the same. If, again, no such device can be obtained, it
 * flags an error, and a call to <code>startRecording()</code> returns false.
 * </p>
 */
public class Microphone extends BaseDataProcessor {

    /** SphinxProperty for the sample rate of the data. */
    public static final String PROP_SAMPLE_RATE = "sampleRate";

    /** Default value for PROP_SAMPLE_RATE. */
    public static final int PROP_SAMPLE_RATE_DEFAULT = 16000;

    /**
     * Sphinx property that specifies whether or not the microphone will
     * release the audio device between utterances. On certain systems
     * (Linux, for one), closing and reopening the audio does not work too
     * well. The default is false for Linux systems, true for others.
     */
    public final static String PROP_CLOSE_BETWEEN_UTTERANCES =
        "closeBetweenUtterances";

    /** Default value for PROP_CLOSE_BETWEEN_UTTERANCES. */
    public final static boolean PROP_CLOSE_BETWEEN_UTTERANCES_DEFAULT = true;

    /**
     * The Sphinx property that specifies the number of milliseconds of
     * audio data to read each time from the underlying Java Sound audio
     * device.
     */
    public final static String PROP_MSEC_PER_READ = "msecPerRead";

    /** The default value of PROP_MSEC_PER_READ. */
    public final static int PROP_MSEC_PER_READ_DEFAULT = 10;

    /** SphinxProperty for the number of bits per value. */
    public static final String PROP_BITS_PER_SAMPLE = "bitsPerSample";

    /** Default value for PROP_BITS_PER_SAMPLE. */
    public static final int PROP_BITS_PER_SAMPLE_DEFAULT = 16;

    /** Property specifying the number of channels. */
    public static final String PROP_CHANNELS = "channels";

    /** Default value for PROP_CHANNELS. */
    public static final int PROP_CHANNELS_DEFAULT = 1;

    /** Property specifying the endianness of the data. */
    public static final String PROP_BIG_ENDIAN = "bigEndian";

    /** Default value for PROP_BIG_ENDIAN. */
    public static final boolean PROP_BIG_ENDIAN_DEFAULT = true;

    /** Property specifying whether the data is signed. */
    public static final String PROP_SIGNED = "signed";

    /** Default value for PROP_SIGNED. */
    public static final boolean PROP_SIGNED_DEFAULT = true;

    /**
     * The Sphinx property that specifies whether to keep the audio data of
     * an utterance around until the next utterance is recorded.
     */
    public final static String PROP_KEEP_LAST_AUDIO = "keepLastAudio";

    /** The default value of PROP_KEEP_LAST_AUDIO. */
    public final static boolean PROP_KEEP_LAST_AUDIO_DEFAULT = false;

    /**
     * The Sphinx property that specifies how to convert stereo audio to
     * mono. Currently, the possible values are "average", which averages
     * the samples from each channel, or "selectChannel", which uses audio
     * from a single channel only. If you choose "selectChannel", you should
     * also specify which channel to use with the "selectChannel" property.
     */
    public final static String PROP_STEREO_TO_MONO = "stereoToMono";

    /** The default value of PROP_STEREO_TO_MONO. */
    public final static String PROP_STEREO_TO_MONO_DEFAULT = "average";

    /** The Sphinx property that specifies the channel to use if the audio is stereo. */
    public final static String PROP_SELECT_CHANNEL = "selectChannel";

    /** The default value of PROP_SELECT_CHANNEL. */
    public final static int PROP_SELECT_CHANNEL_DEFAULT = 0;

    /**
     * The Sphinx property that specifies the mixer to use. The value can be
     * "default" (let the AudioSystem decide), "last" (select the last Mixer
     * supported by the AudioSystem, which appears to be what is often used
     * for USB headsets), or an integer value that represents the index of
     * the Mixer.Info returned by AudioSystem.getMixerInfo(). To get the
     * list of Mixer.Info objects, run the AudioTool application with a
     * command line argument of "-dumpMixers".
     *
     * @see edu.cmu.sphinx.tools.audio.AudioTool
     */
    public final static String PROP_SELECT_MIXER = "selectMixer";

    /**
     * The default value of PROP_SELECT_MIXER. This means that a specific
     * Mixer will not be used. Instead, the AudioSystem will be used to
     * choose the audio line to use.
     */
    public final static String PROP_SELECT_MIXER_DEFAULT = "default";
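
    /*
     * Configuration sketch (illustration only): these properties are
     * normally set through the Sphinx-4 XML configuration rather than in
     * code. Assuming a component named "microphone" (the name is arbitrary,
     * not part of this class), an entry might look like the following,
     * where the values shown are the defaults declared above:
     *
     *   <component name="microphone"
     *              type="edu.cmu.sphinx.frontend.util.Microphone">
     *       <property name="sampleRate" value="16000"/>
     *       <property name="bitsPerSample" value="16"/>
     *       <property name="channels" value="1"/>
     *       <property name="msecPerRead" value="10"/>
     *       <property name="selectMixer" value="default"/>
     *   </component>
     */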
    private AudioFormat finalFormat;
    private AudioInputStream audioStream = null;
    private TargetDataLine audioLine = null;
    private DataList audioList;
    private Utterance currentUtterance;
    private boolean doConversion = false;
    private int audioBufferSize = 160000;
    private volatile boolean recording = false;
    private volatile boolean utteranceEndReached = true;
    private RecordingThread recorder;

    // Configuration data
    private AudioFormat desiredFormat;
    private Logger logger;
    private boolean closeBetweenUtterances;
    private boolean keepDataReference;
    private boolean signed;
    private int frameSizeInBytes;
    private int msecPerRead;
    private int selectedChannel;
    private String selectedMixerIndex;
    private String stereoToMono;

    /*
     * (non-Javadoc)
     *
     * @see edu.cmu.sphinx.util.props.Configurable#register(java.lang.String,
     *      edu.cmu.sphinx.util.props.Registry)
     */
    public void register(String name, Registry registry)
            throws PropertyException {
        super.register(name, registry);
        registry.register(PROP_SAMPLE_RATE, PropertyType.INT);
        registry.register(PROP_CLOSE_BETWEEN_UTTERANCES, PropertyType.BOOLEAN);
        registry.register(PROP_MSEC_PER_READ, PropertyType.INT);
        registry.register(PROP_BITS_PER_SAMPLE, PropertyType.INT);
        registry.register(PROP_CHANNELS, PropertyType.INT);
        registry.register(PROP_BIG_ENDIAN, PropertyType.BOOLEAN);
        registry.register(PROP_SIGNED, PropertyType.BOOLEAN);
        registry.register(PROP_KEEP_LAST_AUDIO, PropertyType.BOOLEAN);
        registry.register(PROP_STEREO_TO_MONO, PropertyType.STRING);
        registry.register(PROP_SELECT_CHANNEL, PropertyType.INT);
        registry.register(PROP_SELECT_MIXER, PropertyType.STRING);
    }

    /*
     * (non-Javadoc)
     *
     * @see edu.cmu.sphinx.util.props.Configurable#newProperties(edu.cmu.sphinx.util.props.PropertySheet)
     */
    public void newProperties(PropertySheet ps) throws PropertyException {
        super.newProperties(ps);
        logger = ps.getLogger();

        int sampleRate = ps.getInt(PROP_SAMPLE_RATE, PROP_SAMPLE_RATE_DEFAULT);
        int sampleSizeInBits = ps.getInt(PROP_BITS_PER_SAMPLE,
                                         PROP_BITS_PER_SAMPLE_DEFAULT);
        int channels = ps.getInt(PROP_CHANNELS, PROP_CHANNELS_DEFAULT);
        boolean bigEndian = ps.getBoolean(PROP_BIG_ENDIAN,
                                          PROP_BIG_ENDIAN_DEFAULT);
        signed = ps.getBoolean(PROP_SIGNED, PROP_SIGNED_DEFAULT);

        desiredFormat = new AudioFormat((float) sampleRate, sampleSizeInBits,
                                        channels, signed, bigEndian);

        closeBetweenUtterances = ps.getBoolean(
                PROP_CLOSE_BETWEEN_UTTERANCES,
                PROP_CLOSE_BETWEEN_UTTERANCES_DEFAULT);
        msecPerRead = ps.getInt(PROP_MSEC_PER_READ, PROP_MSEC_PER_READ_DEFAULT);
        keepDataReference = ps.getBoolean(PROP_KEEP_LAST_AUDIO,
                                          PROP_KEEP_LAST_AUDIO_DEFAULT);
        stereoToMono = ps.getString(PROP_STEREO_TO_MONO,
                                    PROP_STEREO_TO_MONO_DEFAULT);
        selectedChannel = ps.getInt(PROP_SELECT_CHANNEL,
                                    PROP_SELECT_CHANNEL_DEFAULT);
        selectedMixerIndex = ps.getString(PROP_SELECT_MIXER,
                                          PROP_SELECT_MIXER_DEFAULT);
    }
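
    /*
     * Worked example: with the default property values, newProperties()
     * above builds
     *   desiredFormat = new AudioFormat(16000f, 16, 1, true, true)
     * i.e. 16 kHz, 16-bit, mono, signed, big-endian linear PCM.
     */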
    /**
     * Initializes this Microphone. Decides on the final audio format to
     * use, based on the desired format and the capabilities of the
     * underlying audio system.
     */
    public void initialize() {
        super.initialize();
        audioList = new DataList();

        DataLine.Info info =
            new DataLine.Info(TargetDataLine.class, desiredFormat);

        /* If we cannot get an audio line that matches the desired
         * characteristics, shoot for one that matches almost everything we
         * want, but has a higher sample rate.
         */
        if (!AudioSystem.isLineSupported(info)) {
            logger.info(desiredFormat + " not supported");
            AudioFormat nativeFormat =
                DataUtil.getNativeAudioFormat(desiredFormat,
                                              getSelectedMixer());
            if (nativeFormat == null) {
                logger.severe("couldn't find suitable target audio format");
                return;
            } else {
                finalFormat = nativeFormat;

                /* convert from native to the desired format if supported */
                doConversion = AudioSystem.isConversionSupported
                    (desiredFormat, nativeFormat);

                if (doConversion) {
                    logger.info("Converting from "
                                + finalFormat.getSampleRate() + "Hz to "
                                + desiredFormat.getSampleRate() + "Hz");
                } else {
                    logger.info("Using native format: Cannot convert from "
                                + finalFormat.getSampleRate() + "Hz to "
                                + desiredFormat.getSampleRate() + "Hz");
                }
            }
        } else {
            logger.info("Desired format: " + desiredFormat + " supported.");
            finalFormat = desiredFormat;
        }
    }

    /**
     * Gets the Mixer to use. Depends upon selectedMixerIndex being defined.
     *
     * @see #newProperties
     */
    private Mixer getSelectedMixer() {
        if (selectedMixerIndex.equals("default")) {
            return null;
        } else {
            Mixer.Info[] mixerInfo = AudioSystem.getMixerInfo();
            if (selectedMixerIndex.equals("last")) {
                return AudioSystem.getMixer(mixerInfo[mixerInfo.length - 1]);
            } else {
                int index = Integer.parseInt(selectedMixerIndex);
                return AudioSystem.getMixer(mixerInfo[index]);
            }
        }
    }

    /**
     * Creates the audioLine if necessary and returns it.
     */
    private TargetDataLine getAudioLine() {
        if (audioLine != null) {
            return audioLine;
        }

        /* Obtain and open the line and stream. */
        try {
            /* The finalFormat was decided in the initialize() method and is
             * based upon the capabilities of the underlying audio system.
             * The final format will have all the desired audio
             * characteristics, but may have a sample rate that is higher
             * than desired. The idea here is that we'll let the processors
             * in the front end (e.g., the FFT) handle some form of
             * downsampling for us.
             */
            logger.info("Final format: " + finalFormat);

            DataLine.Info info =
                new DataLine.Info(TargetDataLine.class, finalFormat);

            /* We either get the audio from the AudioSystem (our default
             * choice), or use a specific Mixer if the selectedMixerIndex
             * property has been set.
             */
            Mixer selectedMixer = getSelectedMixer();
            if (selectedMixer == null) {
                audioLine = (TargetDataLine) AudioSystem.getLine(info);
            } else {
                audioLine = (TargetDataLine) selectedMixer.getLine(info);
            }

            /* Add a line listener that just traces the line states. */
            audioLine.addLineListener(new LineListener() {
                public void update(LineEvent event) {
                    logger.info("line listener " + event);
                }
            });
        } catch (LineUnavailableException e) {
            logger.severe("microphone unavailable " + e.getMessage());
        }

        return audioLine;
    }

    /**
     * Opens the audio capturing device so that it will be ready for
     * capturing audio. Attempts to create a converter if the requested
     * audio format is not directly available.
     *
     * @return true if the audio capturing device is opened successfully;
     *         false otherwise
     */
    private boolean open() {
        TargetDataLine audioLine = getAudioLine();
        if (audioLine != null) {
            if (!audioLine.isOpen()) {
                logger.info("open");
                try {
                    audioLine.open(finalFormat, audioBufferSize);
                } catch (LineUnavailableException e) {
                    logger.severe("Can't open microphone " + e.getMessage());
                    return false;
                }
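
The listing above ends partway through open(); the rest of the class (startRecording(), stopRecording(), getData(), and the RecordingThread and DataList types it references) is not shown. Based only on the class javadoc, the sketch below illustrates how an application might drive this component directly. The class name MicrophoneDemo, the file config.xml, and the component name "microphone" are assumptions for illustration, and it is assumed that a DataEndSignal is delivered once recording stops; in a full Sphinx-4 system the configured front end, not application code, normally pulls data from the Microphone.

import java.net.URL;

import edu.cmu.sphinx.frontend.Data;
import edu.cmu.sphinx.frontend.DataEndSignal;
import edu.cmu.sphinx.frontend.util.Microphone;
import edu.cmu.sphinx.util.props.ConfigurationManager;

public class MicrophoneDemo {

    public static void main(String[] args) throws Exception {
        // Assumed: config.xml is on the classpath and defines a Microphone
        // component named "microphone" (see the configuration sketch above).
        URL configUrl = MicrophoneDemo.class.getResource("config.xml");
        ConfigurationManager cm = new ConfigurationManager(configUrl);
        Microphone microphone = (Microphone) cm.lookup("microphone");

        // initialize() chooses the final audio format; startRecording()
        // returns false if no suitable audio line could be obtained.
        microphone.initialize();
        if (!microphone.startRecording()) {
            System.err.println("Could not open the microphone");
            return;
        }

        // Capture for roughly three seconds, then stop recording.
        Thread.sleep(3000);
        microphone.stopRecording();

        // Drain the captured audio; the stream is assumed to end with a
        // DataEndSignal once recording has stopped.
        Data data;
        do {
            data = microphone.getData();
            System.out.println("read " + data);
        } while (!(data instanceof DataEndSignal));
    }
}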