📄 testpositionincrement.java

📁 Lucene: an open-source Java search engine framework
💻 JAVA
字号:
package org.apache.lucene.search;

/**
 * Licensed to the Apache Software Foundation (ASF) under one or more
 * contributor license agreements.  See the NOTICE file distributed with
 * this work for additional information regarding copyright ownership.
 * The ASF licenses this file to You under the Apache License, Version 2.0
 * (the "License"); you may not use this file except in compliance with
 * the License.  You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

import org.apache.lucene.index.Term;
import org.apache.lucene.index.IndexWriter;
import org.apache.lucene.queryParser.QueryParser;
import org.apache.lucene.search.PhraseQuery;
import org.apache.lucene.search.Hits;
import org.apache.lucene.search.IndexSearcher;
import org.apache.lucene.store.RAMDirectory;
import org.apache.lucene.analysis.Analyzer;
import org.apache.lucene.analysis.StopAnalyzer;
import org.apache.lucene.analysis.StopFilter;
import org.apache.lucene.analysis.Token;
import org.apache.lucene.analysis.TokenStream;
import org.apache.lucene.analysis.WhitespaceAnalyzer;
import org.apache.lucene.document.Document;
import org.apache.lucene.document.Field;
import java.io.Reader;
import java.io.StringReader;
import org.apache.lucene.util.LuceneTestCase;

/**
 * Term position unit test.
 *
 * <p>Checks that position increments emitted by an analyzer are honoured by
 * {@link PhraseQuery} and {@link MultiPhraseQuery}, and that the query parser
 * and {@link StopFilter} only bridge a removed stop word when both are
 * configured to propagate position increments.
 *
 * @version $Revision: 607591 $
 */
public class TestPositionIncrement extends LuceneTestCase {

  /** Name of the single field that is indexed and queried by these tests. */
  private static final String FIELD = "field";

  /**
   * Indexes one document through an analyzer that emits the fixed tokens
   * "1".."5" with position increments {1, 2, 1, 0, 1}, then verifies which
   * phrase queries match.
   *
   * <p>Relative layout implied by the increments: "2" is two positions after
   * "1", "3" directly follows "2", "4" shares the position of "3", and "5"
   * directly follows "3"/"4".
   *
   * @throws Exception if indexing, query parsing or searching fails
   */
  public void testSetPosition() throws Exception {
    // The analyzer ignores its input text and always produces the same
    // token/increment sequence, so the indexed field value is irrelevant.
    Analyzer analyzer = new Analyzer() {
      public TokenStream tokenStream(String fieldName, Reader reader) {
        return new TokenStream() {
          private final String[] TOKENS = {"1", "2", "3", "4", "5"};
          private final int[] INCREMENTS = {1, 2, 1, 0, 1};
          private int i = 0;

          public Token next() {
            if (i == TOKENS.length)
              return null;
            Token t = new Token(TOKENS[i], i, i);
            t.setPositionIncrement(INCREMENTS[i]);
            i++;
            return t;
          }
        };
      }
    };

    RAMDirectory store = new RAMDirectory();
    IndexWriter writer = new IndexWriter(store, analyzer, true);
    Document d = new Document();
    d.add(new Field(FIELD, "bogus", Field.Store.YES, Field.Index.TOKENIZED));
    writer.addDocument(d);
    writer.optimize();
    writer.close();

    IndexSearcher searcher = new IndexSearcher(store);
    try {
      // "1" and "2" are not adjacent: there is a gap of one position.
      assertHitCount(0, searcher, adjacentPhrase("1", "2"));

      // same as previous, just specify positions explicitly.
      assertHitCount(0, searcher, positionedPhrase("1", 0, "2", 1));

      // specifying correct positions should find the phrase.
      assertHitCount(1, searcher, positionedPhrase("1", 0, "2", 2));

      assertHitCount(1, searcher, adjacentPhrase("2", "3"));

      // "3" and "4" share a position, so they are not adjacent.
      assertHitCount(0, searcher, adjacentPhrase("3", "4"));

      // phrase query would find it when correct positions are specified.
      assertHitCount(1, searcher, positionedPhrase("3", 0, "4", 0));

      // phrase query should fail for a non-existing searched term
      // even if another searched term exists at the same searched position.
      assertHitCount(0, searcher, positionedPhrase("3", 0, "9", 0));

      // multi-phrase query should succeed for a non-existing searched term
      // because another searched term exists at the same searched position.
      MultiPhraseQuery mq = new MultiPhraseQuery();
      mq.add(new Term[]{new Term(FIELD, "3"), new Term(FIELD, "9")}, 0);
      assertHitCount(1, searcher, mq);

      assertHitCount(1, searcher, adjacentPhrase("2", "4"));
      assertHitCount(1, searcher, adjacentPhrase("3", "5"));
      assertHitCount(1, searcher, adjacentPhrase("4", "5"));
      assertHitCount(0, searcher, adjacentPhrase("2", "5"));

      // analyzer to introduce stopwords and increment gaps
      Analyzer stpa = new Analyzer() {
        final WhitespaceAnalyzer a = new WhitespaceAnalyzer();

        public TokenStream tokenStream(String fieldName, Reader reader) {
          TokenStream ts = a.tokenStream(fieldName, reader);
          return new StopFilter(ts, new String[]{"stop"});
        }
      };

      // should not find "1 2" because there is a gap of 1 in the index
      QueryParser qp = new QueryParser(FIELD, stpa);
      // The casts are kept on purpose: they fail the test if the parser
      // returns anything other than a PhraseQuery.
      assertHitCount(0, searcher, (PhraseQuery) qp.parse("\"1 2\""));

      // omitted stop word cannot help because stop filter swallows the increments.
      assertHitCount(0, searcher, (PhraseQuery) qp.parse("\"1 stop 2\""));

      // query parser alone won't help, because stop filter swallows the increments.
      qp.setEnablePositionIncrements(true);
      assertHitCount(0, searcher, (PhraseQuery) qp.parse("\"1 stop 2\""));

      // The StopFilter default is static state; remember it so it can be
      // restored no matter how the assertions below turn out.
      boolean dflt = StopFilter.getEnablePositionIncrementsDefault();
      try {
        // stop filter alone won't help, because query parser swallows the increments.
        qp.setEnablePositionIncrements(false);
        StopFilter.setEnablePositionIncrementsDefault(true);
        assertHitCount(0, searcher, (PhraseQuery) qp.parse("\"1 stop 2\""));

        // when both qp and stopFilter propagate increments, we should find the doc.
        qp.setEnablePositionIncrements(true);
        assertHitCount(1, searcher, (PhraseQuery) qp.parse("\"1 stop 2\""));
      } finally {
        StopFilter.setEnablePositionIncrementsDefault(dflt);
      }
    } finally {
      // Release the searcher even when an assertion fails.
      searcher.close();
    }
  }

  /**
   * Basic analyzer behavior should be to keep sequential terms in one
   * increment from one another.
   *
   * @throws Exception if the token stream cannot be read or closed
   */
  public void testIncrementingPositions() throws Exception {
    Analyzer analyzer = new WhitespaceAnalyzer();
    TokenStream ts = analyzer.tokenStream(FIELD,
                                new StringReader("one two three four five"));
    try {
      for (Token token = ts.next(); token != null; token = ts.next()) {
        // The term text is used as the failure message to identify the token.
        assertEquals(token.termText(), 1, token.getPositionIncrement());
      }
    } finally {
      ts.close();
    }
  }

  /**
   * Builds a two-term phrase query on {@link #FIELD} without explicit
   * positions, i.e. using {@link PhraseQuery#add(Term)} for both terms.
   *
   * @param first  text of the first term
   * @param second text of the second term
   * @return the new phrase query
   */
  private PhraseQuery adjacentPhrase(String first, String second) {
    PhraseQuery query = new PhraseQuery();
    query.add(new Term(FIELD, first));
    query.add(new Term(FIELD, second));
    return query;
  }

  /**
   * Builds a two-term phrase query on {@link #FIELD} with an explicit
   * position for each term.
   *
   * @param first     text of the first term
   * @param firstPos  position requested for the first term
   * @param second    text of the second term
   * @param secondPos position requested for the second term
   * @return the new phrase query
   */
  private PhraseQuery positionedPhrase(String first, int firstPos,
                                       String second, int secondPos) {
    PhraseQuery query = new PhraseQuery();
    query.add(new Term(FIELD, first), firstPos);
    query.add(new Term(FIELD, second), secondPos);
    return query;
  }

  /**
   * Runs {@code query} against {@code searcher} and asserts the number of hits.
   *
   * @param expected expected number of matching documents
   * @param searcher searcher to run the query with
   * @param query    query to execute
   * @throws Exception if the search fails
   */
  private void assertHitCount(int expected, IndexSearcher searcher, Query query)
      throws Exception {
    Hits hits = searcher.search(query);
    assertEquals(expected, hits.length());
  }
}
💿 文件大小 5390 K
👤 上传用户 rickie936
📂 所属分类 Java编程
🏷️ 相关标签

#SearchEngine #open-source #Framework #Lucene
⌨️ 快捷键说明

复制代码 Ctrl + C
搜索代码 Ctrl + F
全屏模式 F11
切换主题 Ctrl + Shift + D
显示快捷键 ?
增大字号 Ctrl + =
减小字号 Ctrl + -