📄 testqualityrun.java

📁 Lucene, a Java open-source search engine framework
💻 JAVA
字号:
package org.apache.lucene.benchmark.quality;/** * Licensed to the Apache Software Foundation (ASF) under one or more * contributor license agreements.  See the NOTICE file distributed with * this work for additional information regarding copyright ownership. * The ASF licenses this file to You under the Apache License, Version 2.0 * (the "License"); you may not use this file except in compliance with * the License.  You may obtain a copy of the License at * *     http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. */import java.io.BufferedReader;import java.io.File;import java.io.FileReader;import java.io.PrintWriter;import org.apache.lucene.benchmark.byTask.TestPerfTasksLogic;import org.apache.lucene.benchmark.byTask.feeds.ReutersDocMaker;import org.apache.lucene.benchmark.quality.Judge;import org.apache.lucene.benchmark.quality.QualityQuery;import org.apache.lucene.benchmark.quality.QualityQueryParser;import org.apache.lucene.benchmark.quality.QualityBenchmark;import org.apache.lucene.benchmark.quality.trec.TrecJudge;import org.apache.lucene.benchmark.quality.trec.TrecTopicsReader;import org.apache.lucene.benchmark.quality.utils.SimpleQQParser;import org.apache.lucene.benchmark.quality.utils.SubmissionReport;import org.apache.lucene.search.IndexSearcher;import org.apache.lucene.store.FSDirectory;import junit.framework.TestCase;/** * Test that quality run does its job. 
*/public class TestQualityRun extends TestCase {  private static boolean DEBUG = Boolean.getBoolean("tests.verbose");    /**   * @param arg0   */  public TestQualityRun(String name) {    super(name);  }  public void testTrecQuality() throws Exception {    // first create the complete reuters index    createReutersIndex();        File workDir = new File(System.getProperty("benchmark.work.dir","work"));    assertTrue("Bad workDir: "+workDir, workDir.exists()&& workDir.isDirectory());    int maxResults = 1000;    String docNameField = "docid";         PrintWriter logger = DEBUG ? new PrintWriter(System.out,true) : null;    // <tests src dir> for topics/qrels files - src/test/org/apache/lucene/benchmark/quality    File srcTestDir = new File(new File(new File(new File(new File(      new File(new File(workDir.getAbsoluteFile().getParentFile(),        "src"),"test"),"org"),"apache"),"lucene"),"benchmark"),"quality");        // prepare topics    File topicsFile = new File(srcTestDir, "trecTopics.txt");    assertTrue("Bad topicsFile: "+topicsFile, topicsFile.exists()&& topicsFile.isFile());    TrecTopicsReader qReader = new TrecTopicsReader();    QualityQuery qqs[] = qReader.readQueries(new BufferedReader(new FileReader(topicsFile)));        // prepare judge    File qrelsFile = new File(srcTestDir, "trecQRels.txt");    assertTrue("Bad qrelsFile: "+qrelsFile, qrelsFile.exists()&& qrelsFile.isFile());    Judge judge = new TrecJudge(new BufferedReader(new FileReader(qrelsFile)));        // validate topics & judgments match each other    judge.validateData(qqs, logger);        IndexSearcher searcher = new IndexSearcher(FSDirectory.getDirectory(new File(workDir,"index")));    QualityQueryParser qqParser = new SimpleQQParser("title","body");    QualityBenchmark qrun = new QualityBenchmark(qqs, qqParser, searcher, docNameField);        SubmissionReport submitLog = DEBUG ? 
new SubmissionReport(logger, "TestRun") : null;    qrun.setMaxResults(maxResults);    QualityStats stats[] = qrun.execute(judge, submitLog, logger);        // --------- verify by the way judgments were altered for this test:    // for some queries, depending on m = qnum % 8    // m==0: avg_precision and recall are hurt, by marking fake docs as relevant    // m==1: precision_at_n and avg_precision are hurt, by unmarking relevant docs    // m==2: all precision, precision_at_n and recall are hurt.    // m>=3: these queries remain perfect    for (int i = 0; i < stats.length; i++) {      QualityStats s = stats[i];      switch (i%8) {      case 0:        assertTrue("avg-p should be hurt: "+s.getAvp(), 1.0 > s.getAvp());        assertTrue("recall should be hurt: "+s.getRecall(), 1.0 > s.getRecall());        for (int j = 1; j <= QualityStats.MAX_POINTS; j++) {          assertEquals("p_at_"+j+" should be perfect: "+s.getPrecisionAt(j), 1.0, s.getPrecisionAt(j), 1E-9);        }        break;            case 1:        assertTrue("avg-p should be hurt", 1.0 > s.getAvp());        assertEquals("recall should be perfect: "+s.getRecall(), 1.0, s.getRecall(), 1E-9);        for (int j = 1; j <= QualityStats.MAX_POINTS; j++) {          assertTrue("p_at_"+j+" should be hurt: "+s.getPrecisionAt(j), 1.0 > s.getPrecisionAt(j));        }        break;      case 2:        assertTrue("avg-p should be hurt: "+s.getAvp(), 1.0 > s.getAvp());        assertTrue("recall should be hurt: "+s.getRecall(), 1.0 > s.getRecall());        for (int j = 1; j <= QualityStats.MAX_POINTS; j++) {          assertTrue("p_at_"+j+" should be hurt: "+s.getPrecisionAt(j), 1.0 > s.getPrecisionAt(j));        }        break;      default: {        assertEquals("avg-p should be perfect: "+s.getAvp(), 1.0, s.getAvp(), 1E-9);        assertEquals("recall should be perfect: "+s.getRecall(), 1.0, s.getRecall(), 1E-9);        for (int j = 1; j <= QualityStats.MAX_POINTS; j++) {          assertEquals("p_at_"+j+" should be 
perfect: "+s.getPrecisionAt(j), 1.0, s.getPrecisionAt(j), 1E-9);        }      }            }    }        QualityStats avg = QualityStats.average(stats);    if (logger!=null) {      avg.log("Average statistis:",1,logger,"  ");    }        assertTrue("mean avg-p should be hurt: "+avg.getAvp(), 1.0 > avg.getAvp());    assertTrue("avg recall should be hurt: "+avg.getRecall(), 1.0 > avg.getRecall());    for (int j = 1; j <= QualityStats.MAX_POINTS; j++) {      assertTrue("avg p_at_"+j+" should be hurt: "+avg.getPrecisionAt(j), 1.0 > avg.getPrecisionAt(j));    }      }  // use benchmark logic to create the full Reuters index  private void createReutersIndex() throws Exception {    // 1. alg definition    String algLines[] = {        "# ----- properties ",        "doc.maker="+ReutersDocMaker.class.getName(),        "doc.add.log.step=2500",        "doc.term.vector=false",        "doc.maker.forever=false",        "directory=FSDirectory",        "doc.stored=true",        "doc.tokenized=true",        "# ----- alg ",        "ResetSystemErase",        "CreateIndex",        "{ AddDoc } : *",        "CloseIndex",    };        // 2. execute the algorithm  (required in every "logic" test)    TestPerfTasksLogic.execBenchmark(algLines);  }}
⌨️ 快捷键说明

复制代码 Ctrl + C
搜索代码 Ctrl + F
全屏模式 F11
切换主题 Ctrl + Shift + D
显示快捷键 ?
增大字号 Ctrl + =
减小字号 Ctrl + -