All Downloads are FREE. Search and download functionalities are using the official Maven repository.

src.it.unimi.dsi.big.mg4j.query.nodes.MultiTerm Maven / Gradle / Ivy

Go to download

MG4J (Managing Gigabytes for Java) is a free full-text search engine for large document collections written in Java. The big version is a fork of the original MG4J that can handle more than 2^31 terms and documents.

The newest version!
package it.unimi.dsi.big.mg4j.query.nodes;

import it.unimi.dsi.fastutil.objects.ObjectOpenHashSet;
import it.unimi.dsi.lang.MutableString;
import it.unimi.dsi.big.mg4j.index.MultiTermIndexIterator;
import it.unimi.dsi.big.mg4j.search.DocumentIterator;

import java.util.Arrays;

/*		 
 * MG4J: Managing Gigabytes for Java (big)
 *
 * Copyright (C) 2007-2011 Sebastiano Vigna 
 *
 *  This library is free software; you can redistribute it and/or modify it
 *  under the terms of the GNU Lesser General Public License as published by the Free
 *  Software Foundation; either version 3 of the License, or (at your option)
 *  any later version.
 *
 *  This library is distributed in the hope that it will be useful, but
 *  WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
 *  or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU Lesser General Public License
 *  for more details.
 *
 *  You should have received a copy of the GNU Lesser General Public License
 *  along with this program; if not, see .
 *
 */

/** A node representing a virtual term obtained by merging the occurrences of the given (possibly weighted) terms.
 * 
 * 

This node is mainly useful when performing query expansion. The {@link QueryBuilderVisitor} * used to generate {@linkplain DocumentIterator document iterators} can decide which * policy to use for setting the frequency and the name of the virtual term. * * @author Sebastiano Vigna * @see MultiTermIndexIterator */ public class MultiTerm extends Composite { private static final long serialVersionUID = 1L; /** Creates a new multi-term node. * * @param query a vector of nodes representing distinct terms; they must be either instances * of {@link Term}, or instances of {@link Weight} containing instances of {@link Term}. * @throws IllegalArgumentException if some term appears twice in query, or if * the specification is not followed. */ public MultiTerm( final Query... query ) { super( query ); final ObjectOpenHashSet s = new ObjectOpenHashSet( query.length ); for( Query q : query ) { if ( ! ( q instanceof Term ) && ! ( ( q instanceof Weight ) && ( ((Weight)q).query instanceof Term ) ) ) throw new IllegalArgumentException(); s.add( new MutableString( q instanceof Term ? ((Term)q).term : ((Term)((Weight)q).query ).term ) ); } if ( s.size() != query.length ) throw new IllegalArgumentException( "Multiterm nodes require distinct terms" ); } public String toString() { return super.toString( "MULTITERM(", ")", ", " ); } public T accept( final QueryBuilderVisitor visitor ) throws QueryBuilderVisitorException { if ( ! visitor.visitPre( this ) ) return null; final T[] result = visitor.newArray( query.length ); for( int i = 0; i < query.length; i++ ) if ( ( result[ i ] = query[ i ].accept( visitor ) ) == null ) return null; return visitor.visitPost( this, result ); } public boolean equals( final Object o ) { if ( ! ( o instanceof MultiTerm ) ) return false; return Arrays.equals( query, ((MultiTerm)o).query ); } public int hashCode() { return Arrays.hashCode( query ) ^ getClass().hashCode(); } }





© 2015 - 2025 Weber Informatics LLC | Privacy Policy