📄 documentiteratorbuildervisitor.java

📁 MG4J (Managing Gigabytes for Java) is a free full-text search engine for large document collections
💻 JAVA
字号:
package it.unimi.dsi.mg4j.search;/*		  * MG4J: Managing Gigabytes for Java * * Copyright (C) 2006-2007 Sebastiano Vigna  * *  This library is free software; you can redistribute it and/or modify it *  under the terms of the GNU Lesser General Public License as published by the Free *  Software Foundation; either version 2.1 of the License, or (at your option) *  any later version. * *  This library is distributed in the hope that it will be useful, but *  WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY *  or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU Lesser General Public License *  for more details. * *  You should have received a copy of the GNU Lesser General Public License *  along with this program; if not, write to the Free Software *  Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. * */import it.unimi.dsi.fastutil.objects.Object2ReferenceMap;import it.unimi.dsi.fastutil.objects.ObjectArrayList;import it.unimi.dsi.fastutil.objects.Reference2ReferenceMap;import it.unimi.dsi.fastutil.objects.Reference2ReferenceMaps;import it.unimi.dsi.mg4j.index.Index;import it.unimi.dsi.mg4j.index.IndexIterator;import it.unimi.dsi.mg4j.index.MultiTermIndexIterator;import it.unimi.dsi.mg4j.index.TooManyTermsException;import it.unimi.dsi.mg4j.index.payload.Payload;import it.unimi.dsi.mg4j.query.nodes.AbstractQueryBuilderVisitor;import it.unimi.dsi.mg4j.query.nodes.Align;import it.unimi.dsi.mg4j.query.nodes.And;import it.unimi.dsi.mg4j.query.nodes.Consecutive;import it.unimi.dsi.mg4j.query.nodes.Difference;import it.unimi.dsi.mg4j.query.nodes.LowPass;import it.unimi.dsi.mg4j.query.nodes.MultiTerm;import it.unimi.dsi.mg4j.query.nodes.Not;import it.unimi.dsi.mg4j.query.nodes.Or;import it.unimi.dsi.mg4j.query.nodes.OrderedAnd;import it.unimi.dsi.mg4j.query.nodes.Prefix;import it.unimi.dsi.mg4j.query.nodes.QueryBuilderVisitorException;import it.unimi.dsi.mg4j.query.nodes.Range;import it.unimi.dsi.mg4j.query.nodes.Select;import it.unimi.dsi.mg4j.query.nodes.Term;import java.io.IOException;import java.lang.reflect.InvocationTargetException;import java.lang.reflect.Method;import java.util.NoSuchElementException;/** A {@link it.unimi.dsi.mg4j.query.nodes.QueryBuilderVisitor} * that builds a {@link it.unimi.dsi.mg4j.search.DocumentIterator} * resolving the queries using the objects in {@link it.unimi.dsi.mg4j.search}. *  * <p>This elementary builder visitor invokes {@link it.unimi.dsi.mg4j.index.Index#documents(CharSequence)} * to build the leaf {@linkplain it.unimi.dsi.mg4j.index.IndexIterator index iterators}. Thus, the * resulting {@link it.unimi.dsi.mg4j.search.DocumentIterator} should be carefully * {@linkplain it.unimi.dsi.mg4j.search.DocumentIterator#dispose() disposed} after usage (every * index iterator may open a file or a socket). *  * <p>{@link Prefix} and {@link MultiTerm} nodes cause the creation of a {@link MultiTermIndexIterator}, * in the first case by callying {@link it.unimi.dsi.mg4j.index.Index#documents(CharSequence,int)} and * in the second case by creating a {@link MultiTermIndexIterator} with the name and frequency equal to the * maximum frequency over all terms. Other implementations might choose differently. *  * <p>At construction time, you must provide a map from strings to indices that will be used to resolve * {@link it.unimi.dsi.mg4j.query.nodes.Select} nodes. The map may be <code>null</code>, in which case * such nodes will cause an {@link java.lang.IllegalArgumentException}.  * If a {@link it.unimi.dsi.mg4j.query.nodes.Select} * node contains an index name that does not appear in the map a {@link NoSuchElementException} * will be thrown instead. *  * <p>A production site will likely substitute this builder visitor with one that reuses  * {@linkplain it.unimi.dsi.mg4j.index.IndexReader index readers} out of a pool. *  * <p>Instances of this class may be safely reused by calling {@link #prepare()}. */public class DocumentIteratorBuilderVisitor extends AbstractQueryBuilderVisitor<DocumentIterator> {		/** A map associating a textual key to indices. */	private final Object2ReferenceMap<String, Index> indexMap;	/** A map associating an object with a <code>parse(String)</code> method to each payload-based index. */	private final Reference2ReferenceMap<Index, Object> index2Parser;	/** The default index. */	private final Index defaultIndex;	/** The number of documents (fetched from the default index). */	private final int numberOfDocuments;	/** The limit on prefix queries provided in the constructor. */	private final int limit;	/** The stack of selected indices (changed by {@link Select} nodes). */	private ObjectArrayList<Index> curr;			/** Creates a new builder visitor.	 * 	 * @param indexMap a map from index names to indices, to be used in {@link Select} nodes, or <code>null</code>	 * if the only used index is the default index.	 * @param defaultIndex the default index.	 * @param limit a limit that will be used with {@link Prefix} nodes.	 */	@SuppressWarnings("unchecked")	public DocumentIteratorBuilderVisitor( final Object2ReferenceMap<String,Index> indexMap, final Index defaultIndex, final int limit ) {		this( indexMap, Reference2ReferenceMaps.EMPTY_MAP, defaultIndex, limit );	}		/** Creates a new builder visitor with additional parsers for payload-based indices.	 * 	 * @param indexMap a map from index names to indices, to be used in {@link Select} nodes, or <code>null</code>	 * if the only used index is the default index.	 * @param defaultIndex the default index.	 * @param limit a limit that will be used with {@link Prefix} nodes.	 */	public DocumentIteratorBuilderVisitor( final Object2ReferenceMap<String,Index> indexMap, final Reference2ReferenceMap<Index,Object> index2Parser, final Index defaultIndex, final int limit ) {		this.indexMap = indexMap;		this.defaultIndex = defaultIndex;		this.index2Parser = index2Parser;		this.limit = limit;		curr = new ObjectArrayList<Index>();		curr.push( defaultIndex );		this.numberOfDocuments = defaultIndex.numberOfDocuments;	}		public DocumentIteratorBuilderVisitor copy() {		return new DocumentIteratorBuilderVisitor( indexMap, defaultIndex, limit );	}		public DocumentIteratorBuilderVisitor prepare() {		curr.size( 1 );		return this;	}	public DocumentIterator[] newArray( final int len ) { return new DocumentIterator[ len ]; }	public DocumentIterator visit( final Term node ) throws QueryBuilderVisitorException {		try {			if ( node.termNumber != -1 ) return curr.top().documents( node.termNumber );			return curr.top().documents( node.term );		}		catch ( IOException e ) {			throw new QueryBuilderVisitorException( e );		}	}		public DocumentIterator visit( final Prefix node ) throws QueryBuilderVisitorException {		try {			return curr.top().documents( node.prefix, limit );		}		catch ( IOException e ) {			throw new QueryBuilderVisitorException( e );		}		catch ( TooManyTermsException e ) {			throw new QueryBuilderVisitorException( e );		}	}	public DocumentIterator visit( Range node ) throws QueryBuilderVisitorException {		final Index index = curr.top();		if ( ! index.hasPayloads ) throw new IllegalStateException( "Index " + index + " does not have payloads" );		try {			final Object parser = index2Parser.containsKey( index ) ? index2Parser.get( index ) : index.payload;			final Method method = parser.getClass().getMethod( "parse", String.class );			final Payload left = index.payload.copy(), right = index.payload.copy();			if ( node.left != null ) left.set( method.invoke( parser, node.left.toString() ) );			if ( node.right != null ) right.set( method.invoke( parser, node.right.toString() ) );			return PayloadPredicateDocumentIterator.getInstance( index.documents( 0 ), 					index.payload.rangeFilter( node.left == null ? null : left, node.right == null ? null : right ) );		}		catch( InvocationTargetException e ) {			throw new QueryBuilderVisitorException( e.getCause() );		}		catch ( Exception e ) {			throw new QueryBuilderVisitorException( e );		}	}		public DocumentIterator visitPost( final And node, final DocumentIterator[] subNode ) throws QueryBuilderVisitorException {		try {			return AndDocumentIterator.getInstance( numberOfDocuments, subNode );		}		catch ( IOException e ) {			throw new QueryBuilderVisitorException( e );		}	}	public DocumentIterator visitPost( final Consecutive node, final DocumentIterator[] subNode ) throws QueryBuilderVisitorException {		try {			return ConsecutiveDocumentIterator.getInstance( subNode, node.gap );		}		catch ( IOException e ) {			throw new QueryBuilderVisitorException( e );		}	}	public DocumentIterator visitPost( final LowPass node, final DocumentIterator subNode ) {		return LowPassDocumentIterator.getInstance( subNode, node.k );	}	public DocumentIterator visitPost( final Not node, final DocumentIterator subNode ) throws QueryBuilderVisitorException {		try {			return NotDocumentIterator.getInstance( subNode, numberOfDocuments );		}		catch ( IOException e ) {			throw new QueryBuilderVisitorException( e );		}	}	public DocumentIterator visitPost( final Or node, final DocumentIterator[] subNode ) throws QueryBuilderVisitorException {		try {			return OrDocumentIterator.getInstance( subNode );		}		catch ( IOException e ) {			throw new QueryBuilderVisitorException( e );		}	}		public DocumentIterator visitPost( final OrderedAnd node, final DocumentIterator[] subNode ) throws QueryBuilderVisitorException {		try {			return OrderedAndDocumentIterator.getInstance( numberOfDocuments, subNode );		}		catch ( IOException e ) {			throw new QueryBuilderVisitorException( e );		}	}	public DocumentIterator visitPost( final Align node, final DocumentIterator[] subNode ) throws QueryBuilderVisitorException {		return AlignDocumentIterator.getInstance( subNode[ 0 ], subNode[ 1 ] );	}	public DocumentIterator visitPost( final Difference node, final DocumentIterator[] subNode ) {		return DifferenceDocumentIterator.getInstance( subNode[ 0 ], subNode[ 1 ], node.leftMargin, node.rightMargin );	}	public DocumentIterator visitPost( final MultiTerm node, final DocumentIterator subNode[] ) throws QueryBuilderVisitorException {		final IndexIterator[] indexIterator = new IndexIterator[ subNode.length ];		System.arraycopy( subNode, 0, indexIterator, 0, indexIterator.length );		IndexIterator result;		try {			result = MultiTermIndexIterator.getInstance( curr.top(), indexIterator );		}		catch ( IOException e ) {			throw new QueryBuilderVisitorException( e );		}		result.term( node.toString() );		return result;	}	public boolean visitPre( final Select node ) throws QueryBuilderVisitorException {		if ( indexMap == null ) throw new IllegalArgumentException( "You cannot use Select nodes without an index map" );		final Index index = indexMap.get( node.index.toString() );		if ( index == null ) throw new NoSuchElementException( "The selected index (" + node.index + ")" + " does not appear in the index map (" + indexMap + ")" ); 		curr.push( indexMap.get( node.index.toString() ) );		return true;	}	public DocumentIterator visitPost( final Select node, final DocumentIterator subNode ) {		curr.pop();		return subNode;	}}
⌨️ 快捷键说明

复制代码 Ctrl + C
搜索代码 Ctrl + F
全屏模式 F11
切换主题 Ctrl + Shift + D
显示快捷键 ?
增大字号 Ctrl + =
减小字号 Ctrl + -