📄 traintokenshapechunkertest.java
字号:
package com.aliasi.test.unit.chunk;import com.aliasi.test.unit.BaseTestCase;import com.aliasi.chunk.*;import com.aliasi.tokenizer.*;import com.aliasi.util.AbstractExternalizable;public class TrainTokenShapeChunkerTest extends BaseTestCase { public void testNulls() throws Exception { IndoEuropeanTokenizerFactory factory = new IndoEuropeanTokenizerFactory(); IndoEuropeanTokenCategorizer categorizer = new IndoEuropeanTokenCategorizer(); TrainTokenShapeChunker trainer = new TrainTokenShapeChunker(categorizer,factory); try { trainer.handle(new String[] { "foo", null, "bar" }, null, new String[] { "A", "B", "C" }); fail(); } catch (NullPointerException e) { succeed(); } try { trainer.handle(new String[] { "foo", "bar", "baz" }, null, new String[] { "A", null, "C" }); fail(); } catch (NullPointerException e) { succeed(); } } public void testOne() throws Exception { IndoEuropeanTokenizerFactory factory = new IndoEuropeanTokenizerFactory(); IndoEuropeanTokenCategorizer categorizer = new IndoEuropeanTokenCategorizer(); TrainTokenShapeChunker trainer = new TrainTokenShapeChunker(categorizer,factory); String text1 = "John J. Smith lives in Washington."; // 0123456789012345678901234567890123 // 0 1 2 3 ChunkingImpl chunking1 = new ChunkingImpl(text1); Chunk chunk11 = ChunkFactory.createChunk(0,13,"PER"); Chunk chunk12 = ChunkFactory.createChunk(23,33,"LOC"); chunking1.add(chunk11); chunking1.add(chunk12); for (int i = 0; i < 5; ++i) trainer.handle(chunking1); Chunker chunker = (Chunker) AbstractExternalizable.compile(trainer); Chunking resultChunking = chunker.chunk(text1); assertEquals(chunking1.chunkSet(),resultChunking.chunkSet()); assertEquals(chunking1.charSequence().toString(), resultChunking.charSequence().toString()); String text2 = "blah blah blah" + text1 + "blah blah."; char[] cs = text2.toCharArray(); int start = "blah blah blah".length(); Chunking resultChunking2 = chunker.chunk(cs,start,start + text1.length()); assertEquals(chunking1.chunkSet(),resultChunking2.chunkSet()); assertEquals(chunking1.charSequence().toString(), resultChunking2.charSequence().toString()); }}
⌨️ 快捷键说明
复制代码
Ctrl + C
搜索代码
Ctrl + F
全屏模式
F11
切换主题
Ctrl + Shift + D
显示快捷键
?
增大字号
Ctrl + =
减小字号
Ctrl + -