📄 chatencoder.java

📁 编辑视频文件
💻 JAVA
字号:
/* * File:     CHATEncoder.java * Project:  MPI Linguistic Application * Date:     02 May 2007 * * Copyright (C) 2001-2007  Max Planck Institute for Psycholinguistics * * This program is free software; you can redistribute it and/or modify * it under the terms of the GNU General Public License as published by * the Free Software Foundation; either version 2 of the License, or * (at your option) any later version. * * This program is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the * GNU General Public License for more details. * * You should have received a copy of the GNU General Public License * along with this program; if not, write to the Free Software * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA *//* * Created on Oct 15, 2004 */package mpi.eudico.server.corpora.clomimpl.chat;import mpi.eudico.server.corpora.clom.Annotation;import mpi.eudico.server.corpora.clom.AnnotationDocEncoder;import mpi.eudico.server.corpora.clom.EncoderInfo;import mpi.eudico.server.corpora.clom.Tier;import mpi.eudico.server.corpora.clom.Transcription;import mpi.eudico.server.corpora.clomimpl.abstr.AlignableAnnotation;import mpi.eudico.server.corpora.clomimpl.abstr.MediaDescriptor;import mpi.eudico.server.corpora.clomimpl.abstr.TierImpl;import mpi.eudico.server.corpora.clomimpl.abstr.TranscriptionImpl;import java.io.FileOutputStream;import java.io.OutputStreamWriter;import java.util.Collections;import java.util.HashSet;import java.util.Hashtable;import java.util.Iterator;import java.util.Vector;import javax.swing.JOptionPane;/** * Encodes information from a Transcription to CHAT (UTF-8) format and stores it. * * @author hennie */public class CHATEncoder implements AnnotationDocEncoder {    private static String BEGIN_LABEL = "@Begin";    private static String END_LABEL = "@End";    private static String LANGUAGE_LABEL = "@Languages:\t";    private static String PARTICIPANTS_LABEL = "@Participants:\t";    private static String ID_LABEL = "@ID:\t";    private static String SOUND_LABEL = "%snd:";    private static String VIDEO_LABEL = "%mov:";    /** Holds value of property DOCUMENT ME! */    private final char BULLET = '\u0015';    private long lastAlignedBeginTime = 0;    private String[][] mainTierInfo;    private String[][] dependentTierInfo;    /*     * @see mpi.eudico.server.corpora.clom.AnnotationDocEncoder#encodeAndSave(mpi.eudico.server.corpora.clom.Transcription, java.util.Vector, java.lang.String)     */    public void encodeAndSave(Transcription theTranscription,        EncoderInfo encoderInfo, Vector tierOrder, String path) {        mainTierInfo = ((CHATEncoderInfo) encoderInfo).getMainTierInfo();        dependentTierInfo = ((CHATEncoderInfo) encoderInfo).getDependentTierInfo();        try {            OutputStreamWriter out = new OutputStreamWriter(new FileOutputStream(                        path), "UTF-8");            out.write("@UTF8\n");            out.write(BEGIN_LABEL + "\n");            writeHeader(theTranscription, encoderInfo, out);            writeBlocks(theTranscription, encoderInfo, out);            out.write(END_LABEL + "\n");            out.close();        } catch (Exception e) {            String txt = "Sorry: unable to export this file to CHAT. (" +                e.getMessage() + ")";            JOptionPane.showMessageDialog(null, txt, txt,                JOptionPane.ERROR_MESSAGE);        }    }    private void writeHeader(Transcription theTranscription,        EncoderInfo encoderInfo, OutputStreamWriter out) {        // @Languages        try {            String langString = LANGUAGE_LABEL;            HashSet languages = new HashSet();            Vector tiers = theTranscription.getTiers();            if (tiers != null) {                for (int i = 0; i < tiers.size(); i++) {                    languages.add(((TierImpl) tiers.elementAt(i)).getDefaultLocale()                                   .getLanguage());                }            }            int j = 0;            Iterator langIter = languages.iterator();            while (langIter.hasNext()) {                if (j > 0) {                    langString += ", ";                }                langString += (String) langIter.next();                j++;            }            if (langString != LANGUAGE_LABEL) {                out.write(langString + "\n");            }            // @Participants            String participantsString = PARTICIPANTS_LABEL;            //String[][] mainTierInfo = ((CHATEncoderInfo) encoderInfo).getMainTierInfo();            for (int i = 0; i < mainTierInfo[1].length; i++) {                if (mainTierInfo[1][i] == null) {                    continue;                }                if (i > 0) {                    participantsString += ", ";                }                participantsString += (mainTierInfo[1][i]).substring(1);                if (!mainTierInfo[2][i].equals("")) {                    participantsString += (" " + mainTierInfo[2][i]);                }                if (!mainTierInfo[3][i].equals("")) {                    participantsString += (" " + mainTierInfo[3][i]);                } else {                    participantsString += (" " + "Unidentified");                }            }            if (participantsString != PARTICIPANTS_LABEL) {                out.write(participantsString + "\n");            }            // @ID lines, one for each participant            for (int i = 0; i < mainTierInfo[4].length; i++) {                if (mainTierInfo[4][i] == null) {                    continue;                }                if (!mainTierInfo[4][i].equals("")) {                    String idString = ID_LABEL + mainTierInfo[4][i];                    out.write(idString + "\n");                } else {                    String idString = ID_LABEL + mainTierInfo[5][i] + "|" +                        mainTierInfo[1][i].substring(1) + "|||||" +                        "Unidentified" + "||";                    out.write(idString + "\n");                }            }        } catch (Exception ex) {            ex.printStackTrace();        }    }    private void writeBlocks(Transcription theTranscription,        EncoderInfo encoderInfo, OutputStreamWriter out) {        Vector rootAnnotations = new Vector();        // iterate over top tiers, over annotations        try {            Vector topTiers = ((TranscriptionImpl) theTranscription).getTopTiers();            Iterator tierIter = topTiers.iterator();            while (tierIter.hasNext()) {                TierImpl t = (TierImpl) tierIter.next();                Vector annots = t.getAnnotations();                rootAnnotations.addAll(annots);            }            Collections.sort(rootAnnotations);            Iterator annotIter = rootAnnotations.iterator();            while (annotIter.hasNext()) {                Annotation ann = (Annotation) annotIter.next();                String blockString = getBlock(theTranscription, encoderInfo, ann);                out.write(blockString);            }        } catch (Exception rex) {            rex.printStackTrace();        }    }    private String getBlock(Transcription tr, EncoderInfo encoderInfo,        Annotation ann) {        boolean exportBlock = false;        StringBuffer blockString = new StringBuffer("");        // create main tier string        // find label from mainTierInfo        String tierName = ann.getTier().getName();        for (int i = 0; i < mainTierInfo[0].length; i++) {            if (mainTierInfo[0][i] == null) {                continue;            }            if (mainTierInfo[0][i].equals(tierName)) {                //blockString += mainTierInfo[1][i] + ":\t" + ann.getValue().replaceAll("\t", "\n" + "\t") + "\n";                blockString.append(mainTierInfo[1][i] + ":\t" +                    ann.getValue().replaceAll("\t", "\n" + "\t"));                exportBlock = true;                break;            }        }        if (!exportBlock) {            return blockString.toString();        }        // HS may 2006: add the media filename and begin and end times either on the same line (special formatting)        // or at the next line following the root annotation        // take unaligned slots of root annots together. One time link line can refer to more than        // one preceding block        // HS may 2006: we could still assume there are no unaligned slots/annotations on a root tier        if (((AlignableAnnotation) ann).getBegin().isTimeAligned()) {            lastAlignedBeginTime = ((AlignableAnnotation) ann).getBegin()                                    .getTime();            if (((CHATEncoderInfo) encoderInfo).getCorrectAnnotationTimes()) {                lastAlignedBeginTime += ((CHATEncoderInfo) encoderInfo).getMediaOffset();            }        }        if (((AlignableAnnotation) ann).getEnd().isTimeAligned()) {            long endTime = ann.getEndTimeBoundary();            if (((CHATEncoderInfo) encoderInfo).getCorrectAnnotationTimes()) {                endTime += ((CHATEncoderInfo) encoderInfo).getMediaOffset();            }            String mediaFileName = "";            Vector mediaDescriptors = tr.getMediaDescriptors();            String mediaLabel = SOUND_LABEL;            if ((mediaDescriptors != null) && (mediaDescriptors.size() > 0)) {                mediaFileName = ((MediaDescriptor) mediaDescriptors.firstElement()).mediaURL;                mediaFileName = mediaFileName.substring(mediaFileName.lastIndexOf(                            "/") + 1);                if (!((CHATEncoderInfo) encoderInfo).isTimesOnSeparateLine()) {                    int index = mediaFileName.indexOf('.');                    if (index > 0) {                        mediaFileName = mediaFileName.substring(0, index);                    }                }                String mimeType = ((MediaDescriptor) mediaDescriptors.firstElement()).mimeType;                if (mimeType.startsWith("video")) {                    mediaLabel = VIDEO_LABEL;                }                if (((CHATEncoderInfo) encoderInfo).isTimesOnSeparateLine()) {                    blockString.append("\n" + BULLET + mediaLabel + "\t" +                        "\"" + mediaFileName + "\" " + lastAlignedBeginTime +                        " " + endTime + BULLET + "\n");                } else {                    blockString.append(" " + BULLET + mediaLabel + "\"" +                        mediaFileName + "\"" + "_" + lastAlignedBeginTime +                        "_" + endTime + BULLET + "\n");                }            }        }        // recursively add annotations for dependent tiers        Hashtable annotsPerTier = new Hashtable();        Vector tierOrder = new Vector();        getDependentLines(ann, tr, annotsPerTier, tierOrder);        // compose output string for dependent annotations        //String dependentString = "";        for (int i = 0; i < tierOrder.size(); i++) {            Tier t = (Tier) tierOrder.elementAt(i);            Vector annots = (Vector) annotsPerTier.get(t);            boolean exportTier = false;            if (annots != null) {                Collections.sort(annots);                // label                for (int j = 0; j < dependentTierInfo[0].length; j++) {                    if (dependentTierInfo[0][j] == null) {                        continue;                    }                    if (dependentTierInfo[0][j].equals(t.getName())) {                        blockString.append(dependentTierInfo[1][j] + ":\t");                        exportTier = true;                        break;                    }                }                // concatenate annotation values                if (exportTier) {                    for (int k = 0; k < annots.size(); k++) {                        if (k != 0) {                            blockString.append(" ");                        }                        blockString.append(((Annotation) annots.elementAt(k)).getValue()                                            .replaceAll("\t", "\n\t"));                    }                    blockString.append("\n");                }            }        }        // add time information.        // take unaligned slots of root annots together. One time link line can refer to more than        // one preceding block        /*        if (((AlignableAnnotation) ann).getBegin().isTimeAligned()) {            lastAlignedBeginTime = ((AlignableAnnotation) ann).getBegin().getTime();        }        if (((AlignableAnnotation) ann).getEnd().isTimeAligned()) {            String mediaFileName = "";            Vector mediaDescriptors = tr.getMediaDescriptors();            String mediaLabel = SOUND_LABEL;            if (mediaDescriptors != null && mediaDescriptors.size() > 0) {                mediaFileName = ((MediaDescriptor) mediaDescriptors.firstElement()).mediaURL;                mediaFileName = mediaFileName.substring(mediaFileName.lastIndexOf("/") + 1);                String mimeType = ((MediaDescriptor) mediaDescriptors.firstElement()).mimeType;                if (mimeType.startsWith("video")) {                    mediaLabel = VIDEO_LABEL;                }                blockString.append( BULLET + mediaLabel + "\t" + "\"" + mediaFileName + "\" "                                            + lastAlignedBeginTime + " "                                            + ann.getEndTimeBoundary() + BULLET + "\n");            }        }        */        return blockString.toString();    }    private void getDependentLines(Annotation ann, Transcription tr,        Hashtable annotsPerTier, Vector tierOrder) {        Vector childAnnots = ((TranscriptionImpl) tr).getChildAnnotationsOf(ann);        // collect dependent annots per tier        Vector annots = null;        Iterator childIter = childAnnots.iterator();        while (childIter.hasNext()) {            Annotation child = (Annotation) childIter.next();            annots = (Vector) annotsPerTier.get(child.getTier());            if (annots == null) {                annots = new Vector();                annotsPerTier.put(child.getTier(), annots);                tierOrder.add(child.getTier());            }            annots.add(child);            getDependentLines(child, tr, annotsPerTier, tierOrder);        }    }}
💿 文件大小 23621 K
👤 上传用户 ccuading
📂 所属分类 Java编程
🏷️ 相关标签

#编辑 #视频
⌨️ 快捷键说明

复制代码 Ctrl + C
搜索代码 Ctrl + F
全屏模式 F11
切换主题 Ctrl + Shift + D
显示快捷键 ?
增大字号 Ctrl + =
减小字号 Ctrl + -