All Downloads are FREE. Search and download functionalities are using the official Maven repository.

org.apache.manifoldcf.agents.interfaces.IOutputCheckActivity Maven / Gradle / Ivy

/* $Id$ */

/**
* Licensed to the Apache Software Foundation (ASF) under one or more
* contributor license agreements. See the NOTICE file distributed with
* this work for additional information regarding copyright ownership.
* The ASF licenses this file to You under the Apache License, Version 2.0
* (the "License"); you may not use this file except in compliance with
* the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.manifoldcf.agents.interfaces;

import org.apache.manifoldcf.core.interfaces.*;
import org.apache.manifoldcf.agents.interfaces.*;

import java.io.*;
import java.util.*;

/** This interface abstracts from the activities that a transformation connector can do
when checking a document.
*/
public interface IOutputCheckActivity
{
  public static final String _rcsid = "@(#)$Id$";

  /** Detect if a document date is acceptable downstream or not.  This method is used to determine whether it makes sense to fetch a document
  * in the first place.
  *@param date is the date of the document.
  *@return true if the document with that date can be accepted by the downstream connection.
  */
  public boolean checkDateIndexable(Date date)
    throws ManifoldCFException, ServiceInterruption;

  /** Detect if a mime type is acceptable downstream or not.  This method is used to determine whether it makes sense to fetch a document
  * in the first place.
  *@param mimeType is the mime type of the document.
  *@return true if the mime type can be accepted by the downstream connection.
  */
  public boolean checkMimeTypeIndexable(String mimeType)
    throws ManifoldCFException, ServiceInterruption;

  /** Pre-determine whether a document (passed here as a File object) is acceptable downstream.  This method is
  * used to determine whether a document needs to be actually transferred.  This hook is provided mainly to support
  * search engines that only handle a small set of accepted file types.
  *@param localFile is the local file to check.
  *@return true if the file is acceptable by the downstream connection.
  */
  public boolean checkDocumentIndexable(File localFile)
    throws ManifoldCFException, ServiceInterruption;

  /** Pre-determine whether a document's length is acceptable downstream.  This method is used
  * to determine whether to fetch a document in the first place.
  *@param length is the length of the document.
  *@return true if the file is acceptable by the downstream connection.
  */
  public boolean checkLengthIndexable(long length)
    throws ManifoldCFException, ServiceInterruption;

  /** Pre-determine whether a document's URL is acceptable downstream.  This method is used
  * to help filter out documents that cannot be indexed in advance.
  *@param url is the URL of the document.
  *@return true if the file is acceptable by the downstream connection.
  */
  public boolean checkURLIndexable(String url)
    throws ManifoldCFException, ServiceInterruption;

}




© 2015 - 2025 Weber Informatics LLC | Privacy Policy