All downloads are free. Search and download functionality uses the official Maven repository.

org.carrot2.source.SimpleSearchEngine Maven / Gradle / Ivy

There is a newer version: 4.6.0
Show newest version

/*
 * Carrot2 project.
 *
 * Copyright (C) 2002-2018, Dawid Weiss, Stanisław Osiński.
 * All rights reserved.
 *
 * Refer to the full license file "carrot2.LICENSE"
 * in the root folder of the repository checkout or at:
 * http://www.carrot2.org/carrot2.LICENSE
 */

package org.carrot2.source;

import org.carrot2.core.IDocumentSource;
import org.carrot2.core.ProcessingException;
import org.carrot2.util.ExceptionUtils;
import org.carrot2.util.attribute.Bindable;

/**
 * A base class facilitating implementation of {@link IDocumentSource}s wrapping external
 * search engines with remote / network-based interfaces. This implementation assumes that
 * all requested results can be fetched from the search engine using one request.
 * <p>
 * Subclasses supply the actual request logic in {@link #fetchSearchResponse()};
 * {@link #process()} copies the returned response into this component's output fields.
 * 
 * @see MultipageSearchEngine
 */
@Bindable
public abstract class SimpleSearchEngine extends SearchEngineBase
{
    /**
     * Requests and returns results from the underlying search engine.
     * 
     * @return the response obtained from the search engine
     * @throws Exception in case of problems with the underlying search engine
     */
    protected abstract SearchEngineResponse fetchSearchResponse() throws Exception;

    /**
     * Fetches the search response with a single call to {@link #fetchSearchResponse()}
     * and stores its results, total results count and compression flag in this
     * component.
     * 
     * @throws ProcessingException wrapping any exception raised while fetching or
     *             reading the response
     */
    @Override
    public void process() throws ProcessingException
    {
        try
        {
            final SearchEngineResponse response = fetchSearchResponse();

            // NOTE(review): documents, resultsTotal and compressed are not declared in
            // this class; presumably they are inherited from SearchEngineBase.
            documents = response.results;
            resultsTotal = response.getResultsTotal();

            // Flag the response as compressed only when the metadata entry is exactly
            // "gzip". The constant-first equals() is null-safe and, unlike the reversed
            // "gzip".contains(value) test, does not match "" or fragments such as "zip".
            final String compression = (String) response.metadata
                .get(SearchEngineResponse.COMPRESSION_KEY);
            compressed = "gzip".equals(compression);
        }
        catch (Exception e)
        {
            // Everything, including unchecked exceptions, is reported to the caller
            // as a ProcessingException.
            throw ExceptionUtils.wrapAs(ProcessingException.class, e);
        }
    }
}




© 2015 - 2024 Weber Informatics LLC | Privacy Policy