⭐ 欢迎来到虫虫下载站! | 📦 资源下载 📁 资源专辑 ℹ️ 关于我们
⭐ 虫虫下载站

📄 testsegmenttermenum.java

📁 索引aaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaa
💻 JAVA
字号:
package org.apache.lucene.index;import java.io.IOException;import junit.framework.TestCase;import org.apache.lucene.analysis.WhitespaceAnalyzer;import org.apache.lucene.document.Document;import org.apache.lucene.document.Field;import org.apache.lucene.index.IndexReader;import org.apache.lucene.index.IndexWriter;import org.apache.lucene.index.Term;import org.apache.lucene.index.TermEnum;import org.apache.lucene.store.Directory;import org.apache.lucene.store.RAMDirectory;/** * @author goller */public class TestSegmentTermEnum extends TestCase{  Directory dir = new RAMDirectory();  public void testTermEnum()  {    IndexWriter writer = null;    try {      writer  = new IndexWriter(dir, new WhitespaceAnalyzer(), true);      // add 100 documents with term : aaa      // add 100 documents with terms: aaa bbb      // Therefore, term 'aaa' has document frequency of 200 and term 'bbb' 100      for (int i = 0; i < 100; i++) {        addDoc(writer, "aaa");        addDoc(writer, "aaa bbb");      }      writer.close();    }    catch (IOException e) {      e.printStackTrace();    }    try {      // verify document frequency of terms in an unoptimized index      verifyDocFreq();      // merge segments by optimizing the index      writer = new IndexWriter(dir, new WhitespaceAnalyzer(), false);      writer.optimize();      writer.close();      // verify document frequency of terms in an optimized index      verifyDocFreq();    }    catch (IOException e2) {      e2.printStackTrace();    }  }  private void verifyDocFreq()      throws IOException  {      IndexReader reader = IndexReader.open(dir);      TermEnum termEnum = null;    // create enumeration of all terms    termEnum = reader.terms();    // go to the first term (aaa)    termEnum.next();    // assert that term is 'aaa'    assertEquals("aaa", termEnum.term().text());    assertEquals(200, termEnum.docFreq());    // go to the second term (bbb)    termEnum.next();    // assert that term is 'bbb'    assertEquals("bbb", termEnum.term().text());    assertEquals(100, termEnum.docFreq());    termEnum.close();    // create enumeration of terms after term 'aaa', including 'aaa'    termEnum = reader.terms(new Term("content", "aaa"));    // assert that term is 'aaa'    assertEquals("aaa", termEnum.term().text());    assertEquals(200, termEnum.docFreq());    // go to term 'bbb'    termEnum.next();    // assert that term is 'bbb'    assertEquals("bbb", termEnum.term().text());    assertEquals(100, termEnum.docFreq());    termEnum.close();  }  private void addDoc(IndexWriter writer, String value)  {    Document doc = new Document();    doc.add(Field.UnStored("content", value));    try {      writer.addDocument(doc);    }    catch (IOException e) {      e.printStackTrace();    }  }}

⌨️ 快捷键说明

复制代码 Ctrl + C
搜索代码 Ctrl + F
全屏模式 F11
切换主题 Ctrl + Shift + D
显示快捷键 ?
增大字号 Ctrl + =
减小字号 Ctrl + -