TestThaiAnalyzer.java

来自「一套java版本的搜索引擎源码」· Java 代码 · 共 71 行

JAVA
71
字号
package org.apache.lucene.analysis.th;

/**
 * Licensed to the Apache Software Foundation (ASF) under one or more
 * contributor license agreements.  See the NOTICE file distributed with
 * this work for additional information regarding copyright ownership.
 * The ASF licenses this file to You under the Apache License, Version 2.0
 * (the "License"); you may not use this file except in compliance with
 * the License.  You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

import java.io.StringReader;

import junit.framework.TestCase;

import org.apache.lucene.analysis.Analyzer;
import org.apache.lucene.analysis.Token;
import org.apache.lucene.analysis.TokenStream;

/**
 * Test case for ThaiAnalyzer, modified from TestFrenchAnalyzer
 *
 * @author    Samphan Raruenrom <samphan@osdev.co.th>
 * @version   0.1
 */
public class TestThaiAnalyzer extends TestCase {

  /**
   * Runs {@code input} through {@code a} and asserts that the resulting
   * token stream yields exactly the term texts in {@code output}, in order,
   * with no extra tokens afterwards.
   *
   * @param a      analyzer under test
   * @param input  text to tokenize
   * @param output expected term texts, in the order they must be produced
   * @throws Exception if the token stream fails while reading or closing
   */
  public void assertAnalyzesTo(Analyzer a, String input, String[] output)
      throws Exception {
    TokenStream ts = a.tokenStream("dummy", new StringReader(input));
    try {
      for (int i = 0; i < output.length; i++) {
        Token t = ts.next();
        assertNotNull("missing token at position " + i, t);
        // JUnit convention: expected value first, actual value second.
        assertEquals("term text at position " + i, output[i], t.termText());
      }
      assertNull("unexpected extra token after position " + (output.length - 1),
          ts.next());
    } finally {
      // Close the stream even when an assertion above fails.
      ts.close();
    }
  }

  /**
   * Checks ThaiAnalyzer output for empty input, pure Thai text, mixed
   * Thai/Latin text, and Thai text followed by an English sentence.
   *
   * @throws Exception if analysis fails
   */
  public void testAnalyzer() throws Exception {
    ThaiAnalyzer analyzer = new ThaiAnalyzer();

    // Empty input must produce no tokens.
    assertAnalyzesTo(analyzer, "", new String[] {});

    // Unspaced Thai text is expected to be split into individual words.
    assertAnalyzesTo(
        analyzer,
        "การที่ได้ต้องแสดงว่างานดี",
        new String[] { "การ", "ที่", "ได้", "ต้อง", "แสดง", "ว่า", "งาน", "ดี"});

    // Mixed input: "XY&Z" is expected lowercased as a single token, the
    // e-mail address is expected as a single token, and "-" is dropped.
    assertAnalyzesTo(
        analyzer,
        "บริษัทชื่อ XY&Z - คุยกับ xyz@demo.com",
        new String[] { "บริษัท", "ชื่อ", "xy&z", "คุย", "กับ", "xyz@demo.com" });

    // English stop words: "The"/"the" must not appear in the output.
    assertAnalyzesTo(
        analyzer,
        "ประโยคว่า The quick brown fox jumped over the lazy dogs",
        new String[] { "ประโยค", "ว่า", "quick", "brown", "fox", "jumped", "over", "lazy", "dogs" });
  }
}

⌨️ 快捷键说明

复制代码Ctrl + C
搜索代码Ctrl + F
全屏模式F11
增大字号Ctrl + =
减小字号Ctrl + -
显示快捷键?