TestIndexWriter.java
package org.apache.lucene.index;

/**
 * Licensed to the Apache Software Foundation (ASF) under one or more
 * contributor license agreements.  See the NOTICE file distributed with
 * this work for additional information regarding copyright ownership.
 * The ASF licenses this file to You under the Apache License, Version 2.0
 * (the "License"); you may not use this file except in compliance with
 * the License.  You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

import java.io.IOException;
import java.io.File;
import java.util.Arrays;

import junit.framework.TestCase;

import org.apache.lucene.analysis.WhitespaceAnalyzer;
import org.apache.lucene.document.Document;
import org.apache.lucene.document.Field;
import org.apache.lucene.index.IndexReader;
import org.apache.lucene.index.IndexWriter;
import org.apache.lucene.search.IndexSearcher;
import org.apache.lucene.search.Hits;
import org.apache.lucene.search.TermQuery;
import org.apache.lucene.store.Directory;
import org.apache.lucene.store.FSDirectory;
import org.apache.lucene.store.RAMDirectory;
import org.apache.lucene.store.IndexInput;
import org.apache.lucene.store.IndexOutput;
import org.apache.lucene.store.AlreadyClosedException;
import org.apache.lucene.store.MockRAMDirectory;
import org.apache.lucene.store.LockFactory;
import org.apache.lucene.store.Lock;
import org.apache.lucene.store.SingleInstanceLockFactory;

/**
 * @author goller
 * @version $Id: TestIndexWriter.java 545696 2007-06-09 06:09:46Z buschmi $
 */
public class TestIndexWriter extends TestCase {

  public void testDocCount() throws IOException {
    Directory dir = new RAMDirectory();

    IndexWriter writer = null;
    IndexReader reader = null;
    int i;

    IndexWriter.setDefaultWriteLockTimeout(2000);
    assertEquals(2000, IndexWriter.getDefaultWriteLockTimeout());

    writer = new IndexWriter(dir, new WhitespaceAnalyzer());

    IndexWriter.setDefaultWriteLockTimeout(1000);

    // add 100 documents
    for (i = 0; i < 100; i++) {
      addDoc(writer);
    }
    assertEquals(100, writer.docCount());
    writer.close();

    // delete 40 documents
    reader = IndexReader.open(dir);
    for (i = 0; i < 40; i++) {
      reader.deleteDocument(i);
    }
    reader.close();

    // test doc count before segments are merged/index is optimized
    writer = new IndexWriter(dir, new WhitespaceAnalyzer());
    assertEquals(100, writer.docCount());
    writer.close();

    reader = IndexReader.open(dir);
    assertEquals(100, reader.maxDoc());
    assertEquals(60, reader.numDocs());
    reader.close();

    // optimize the index and check that the new doc count is correct
    writer = new IndexWriter(dir, true, new WhitespaceAnalyzer());
    writer.optimize();
    assertEquals(60, writer.docCount());
    writer.close();

    // check that the index reader gives the same numbers.
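    // (Note: maxDoc() still counts deleted documents until their segments
    // are merged away, while numDocs() excludes them -- hence 100 vs. 60
    // above; after optimize() both should drop to 60.)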
    reader = IndexReader.open(dir);
    assertEquals(60, reader.maxDoc());
    assertEquals(60, reader.numDocs());
    reader.close();

    // make sure opening a new index for create over
    // this existing one works correctly:
    writer = new IndexWriter(dir, new WhitespaceAnalyzer(), true);
    assertEquals(0, writer.docCount());
    writer.close();
  }

  private void addDoc(IndexWriter writer) throws IOException {
    Document doc = new Document();
    doc.add(new Field("content", "aaa", Field.Store.NO, Field.Index.TOKENIZED));
    writer.addDocument(doc);
  }

  private void addDocWithIndex(IndexWriter writer, int index) throws IOException {
    Document doc = new Document();
    doc.add(new Field("content", "aaa " + index, Field.Store.YES, Field.Index.TOKENIZED));
    doc.add(new Field("id", "" + index, Field.Store.YES, Field.Index.TOKENIZED));
    writer.addDocument(doc);
  }

  /*
    Test: make sure when we run out of disk space or hit
    random IOExceptions in any of the addIndexes(*) calls
    that 1) index is not corrupt (searcher can open/search
    it) and 2) transactional semantics are followed:
    either all or none of the incoming documents were in
    fact added.
  */
  public void testAddIndexOnDiskFull() throws IOException {
    int START_COUNT = 57;
    int NUM_DIR = 50;
    int END_COUNT = START_COUNT + NUM_DIR*25;

    boolean debug = false;

    // Build up a bunch of dirs that have indexes which we
    // will then merge together by calling addIndexes(*):
    Directory[] dirs = new Directory[NUM_DIR];
    long inputDiskUsage = 0;
    for(int i=0;i<NUM_DIR;i++) {
      dirs[i] = new RAMDirectory();
      IndexWriter writer = new IndexWriter(dirs[i], new WhitespaceAnalyzer(), true);
      for(int j=0;j<25;j++) {
        addDocWithIndex(writer, 25*i+j);
      }
      writer.close();
      String[] files = dirs[i].list();
      for(int j=0;j<files.length;j++) {
        inputDiskUsage += dirs[i].fileLength(files[j]);
      }
    }

    // Now, build a starting index that has START_COUNT docs.  We
    // will then try to addIndexes into a copy of this:
    RAMDirectory startDir = new RAMDirectory();
    IndexWriter writer = new IndexWriter(startDir, new WhitespaceAnalyzer(), true);
    for(int j=0;j<START_COUNT;j++) {
      addDocWithIndex(writer, j);
    }
    writer.close();

    // Make sure starting index seems to be working properly:
    Term searchTerm = new Term("content", "aaa");
    IndexReader reader = IndexReader.open(startDir);
    assertEquals("first docFreq", 57, reader.docFreq(searchTerm));

    IndexSearcher searcher = new IndexSearcher(reader);
    Hits hits = searcher.search(new TermQuery(searchTerm));
    assertEquals("first number of hits", 57, hits.length());
    searcher.close();
    reader.close();

    // Iterate with larger and larger amounts of free
    // disk space.  With little free disk space,
    // addIndexes will certainly run out of space &
    // fail.  Verify that when this happens, index is
    // not corrupt and index in fact has added no
    // documents.  Then, we increase disk space by 2000
    // bytes each iteration.  At some point there is
    // enough free disk space and addIndexes should
    // succeed and index should show all documents were
    // added.
    // String[] files = startDir.list();
    long diskUsage = startDir.sizeInBytes();

    long startDiskUsage = 0;
    String[] files = startDir.list();
    for(int i=0;i<files.length;i++) {
      startDiskUsage += startDir.fileLength(files[i]);
    }

    for(int iter=0;iter<6;iter++) {

      // Start with 100 bytes more than we are currently using:
      long diskFree = diskUsage+100;

      boolean autoCommit = iter % 2 == 0;
      int method = iter/2;

      boolean success = false;
      boolean done = false;

      String methodName;
      if (0 == method) {
        methodName = "addIndexes(Directory[])";
      } else if (1 == method) {
        methodName = "addIndexes(IndexReader[])";
      } else {
        methodName = "addIndexesNoOptimize(Directory[])";
      }

      int cycleCount = 0;

      while(!done) {

        cycleCount++;

        // Make a new dir that will enforce disk usage:
        MockRAMDirectory dir = new MockRAMDirectory(startDir);
        writer = new IndexWriter(dir, autoCommit, new WhitespaceAnalyzer(), false);
        IOException err = null;

        for(int x=0;x<2;x++) {

          // Two loops: first time, limit disk space &
          // throw random IOExceptions; second time, no
          // disk space limit:

          double rate = 0.05;
          double diskRatio = ((double) diskFree)/diskUsage;
          long thisDiskFree;

          String testName = null;

          if (0 == x) {
            thisDiskFree = diskFree;
            if (diskRatio >= 2.0) {
              rate /= 2;
            }
            if (diskRatio >= 4.0) {
              rate /= 2;
            }
            if (diskRatio >= 6.0) {
              rate = 0.0;
            }
            if (debug)
              testName = "disk full test " + methodName + " with disk full at " + diskFree + " bytes autoCommit=" + autoCommit;
          } else {
            thisDiskFree = 0;
            rate = 0.0;
            if (debug)
              testName = "disk full test " + methodName + " with unlimited disk space autoCommit=" + autoCommit;
          }

          if (debug)
            System.out.println("\ncycle: " + testName);

          dir.setMaxSizeInBytes(thisDiskFree);
          dir.setRandomIOExceptionRate(rate, diskFree);

          try {

            if (0 == method) {
              writer.addIndexes(dirs);
            } else if (1 == method) {
              IndexReader readers[] = new IndexReader[dirs.length];
              for(int i=0;i<dirs.length;i++) {
                readers[i] = IndexReader.open(dirs[i]);
              }
              try {
                writer.addIndexes(readers);
              } finally {
                for(int i=0;i<dirs.length;i++) {
                  readers[i].close();
                }
              }
            } else {
              writer.addIndexesNoOptimize(dirs);
            }

            success = true;
            if (debug) {
              System.out.println("  success!");
            }

            if (0 == x) {
              done = true;
            }

          } catch (IOException e) {
            success = false;
            err = e;
            if (debug) {
              System.out.println("  hit IOException: " + e);
              // e.printStackTrace(System.out);
            }

            if (1 == x) {
              e.printStackTrace(System.out);
              fail(methodName + " hit IOException after disk space was freed up");
            }
          }

          if (autoCommit) {

            // Whether we succeeded or failed, check that
            // all un-referenced files were in fact
            // deleted (ie, we did not create garbage).
            // Only check this when autoCommit is true:
            // when it's false, it's expected that there
            // are unreferenced files (ie they won't be
            // referenced until the "commit on close").
            // Just create a new IndexFileDeleter, have it
            // delete unreferenced files, then verify that
            // in fact no files were deleted:
            String successStr;
            if (success) {
              successStr = "success";
            } else {
              successStr = "IOException";
            }
            String message = methodName + " failed to delete unreferenced files after " + successStr + " (" + diskFree + " bytes)";
            assertNoUnreferencedFiles(dir, message);
          }

          if (debug) {
            System.out.println("  now test readers");
          }

          // Finally, verify index is not corrupt, and, if
          // we succeeded, we see all docs added, and if we
          // failed, we see either all docs or no docs added
          // (transactional semantics):
          try {
            reader = IndexReader.open(dir);
          } catch (IOException e) {
            e.printStackTrace(System.out);
            fail(testName + ": exception when creating IndexReader: " + e);
          }
          int result = reader.docFreq(searchTerm);
          if (success) {
            if (autoCommit && result != END_COUNT) {
              fail(testName + ": method did not throw exception but docFreq('aaa') is " + result + " instead of expected " + END_COUNT);
            } else if (!autoCommit && result != START_COUNT) {
              fail(testName + ": method did not throw exception but docFreq('aaa') is " + result + " instead of expected " + START_COUNT);
            }