simplereadlistener.java

来自「庖丁分词模块」· Java 代码 · 共 68 行

JAVA
68
字号
/**
 * Copyright 2007 The Apache Software Foundation
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
package net.paoding.analysis.dictionary.support.filewords;

import java.util.HashSet;
import java.util.Hashtable;
import java.util.LinkedList;
import java.util.Map;


/**
 * 
 * @author Zhiliang Wang [qieqie.wang@gmail.com]
 * 
 * @since 1.0
 * 
 */
public class SimpleReadListener implements ReadListener {
	private Map<String, LinkedList<String>> dics = new Hashtable<String, LinkedList<String>>();
	private LinkedList<String> sortedWords;
	private HashSet<String> setSortedWords;
	
	public boolean onFileBegin(String file) {
		if (!file.endsWith(".dic")){
			return false;
		}
		sortedWords = new LinkedList<String>();
		setSortedWords = new HashSet<String>();
		return true;
	}

	public void onFileEnd(String file) {
		String name = file.substring(0, file.length() - 4);
		dics.put(name, sortedWords);
		setSortedWords = null;
		sortedWords = null;
	}

	public void onWord(String word) {
		word = word.trim().toLowerCase();
		if (word.length() == 0 
				|| word.charAt(0) == '#'
				|| word.charAt(0) == '-') {
			return;
		}
		//保证不会重复
		if (setSortedWords.add(word)) {
			sortedWords.add(word);
		}
	}
	public Map<String, LinkedList<String>> getResult(){
		return dics;
	}
	
}

⌨️ 快捷键说明

复制代码Ctrl + C
搜索代码Ctrl + F
全屏模式F11
增大字号Ctrl + =
减小字号Ctrl + -
显示快捷键?