📄 doctest.java
字号:
package org.apache.lucene.index;/** * Copyright 2004 The Apache Software Foundation * * Licensed under the Apache License, Version 2.0 (the "License"); * you may not use this file except in compliance with the License. * You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. */import org.apache.lucene.analysis.SimpleAnalyzer;import org.apache.lucene.analysis.Analyzer;import org.apache.lucene.store.FSDirectory;import org.apache.lucene.store.Directory;import org.apache.lucene.document.Document;import org.apache.lucene.search.Similarity;import org.apache.lucene.demo.FileDocument;import java.io.File;// FIXME: OG: remove hard-coded file namesclass DocTest { public static void main(String[] args) { try { Directory directory = FSDirectory.getDirectory("test", true); directory.close(); indexDoc("one", "test.txt"); printSegment("one"); indexDoc("two", "test2.txt"); printSegment("two"); merge("one", "two", "merge"); printSegment("merge"); merge("one", "two", "merge2"); printSegment("merge2"); merge("merge", "merge2", "merge3"); printSegment("merge3"); } catch (Exception e) { System.out.println(" caught a " + e.getClass() + "\n with message: " + e.getMessage()); e.printStackTrace(); } } public static void indexDoc(String segment, String fileName) throws Exception { Directory directory = FSDirectory.getDirectory("test", false); Analyzer analyzer = new SimpleAnalyzer(); DocumentWriter writer = new DocumentWriter(directory, analyzer, Similarity.getDefault(), 1000); File file = new File(fileName); Document doc = FileDocument.Document(file); writer.addDocument(segment, doc); directory.close(); } static void merge(String seg1, String seg2, String merged) throws Exception { Directory directory = FSDirectory.getDirectory("test", false); SegmentReader r1 = new SegmentReader(new SegmentInfo(seg1, 1, directory)); SegmentReader r2 = new SegmentReader(new SegmentInfo(seg2, 1, directory)); SegmentMerger merger = new SegmentMerger(directory, merged, false); merger.add(r1); merger.add(r2); merger.merge(); merger.closeReaders(); directory.close(); } static void printSegment(String segment) throws Exception { Directory directory = FSDirectory.getDirectory("test", false); SegmentReader reader = new SegmentReader(new SegmentInfo(segment, 1, directory)); for (int i = 0; i < reader.numDocs(); i++) System.out.println(reader.document(i)); TermEnum tis = reader.terms(); while (tis.next()) { System.out.print(tis.term()); System.out.println(" DF=" + tis.docFreq()); TermPositions positions = reader.termPositions(tis.term()); try { while (positions.next()) { System.out.print(" doc=" + positions.doc()); System.out.print(" TF=" + positions.freq()); System.out.print(" pos="); System.out.print(positions.nextPosition()); for (int j = 1; j < positions.freq(); j++) System.out.print("," + positions.nextPosition()); System.out.println(""); } } finally { positions.close(); } } tis.close(); reader.close(); directory.close(); }}
⌨️ 快捷键说明
复制代码
Ctrl + C
搜索代码
Ctrl + F
全屏模式
F11
切换主题
Ctrl + Shift + D
显示快捷键
?
增大字号
Ctrl + =
减小字号
Ctrl + -