com.bigdata.relation.IRelation Maven / Gradle / Ivy

Go to download
Show more of this group Show more artifacts with this name
Show all versions of bigdata-core Show documentation
Blazegraph(TM) DB Core Platform. It contains all Blazegraph DB dependencies other than Blueprints.
There is a newer version: 2.1.4
/*

Copyright (C) SYSTAP, LLC DBA Blazegraph 2006-2016.  All rights reserved.

Contact:
     SYSTAP, LLC DBA Blazegraph
     2501 Calvert ST NW #106
     Washington, DC 20008
     licenses@blazegraph.com

This program is free software; you can redistribute it and/or modify
it under the terms of the GNU General Public License as published by
the Free Software Foundation; version 2 of the License.

This program is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
GNU General Public License for more details.

You should have received a copy of the GNU General Public License
along with this program; if not, write to the Free Software
Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA

*/
/*
 * Created on Jun 23, 2008
 */

package com.bigdata.relation;

import java.util.Iterator;
import java.util.List;
import java.util.Set;
import java.util.concurrent.ExecutorService;

import com.bigdata.bop.BOp;
import com.bigdata.bop.BOpEvaluationContext;
import com.bigdata.bop.IBindingSet;
import com.bigdata.bop.IPredicate;
import com.bigdata.bop.IVariable;
import com.bigdata.btree.IIndex;
import com.bigdata.btree.ITuple;
import com.bigdata.btree.ITupleIterator;
import com.bigdata.journal.IIndexManager;
import com.bigdata.rdf.lexicon.LexiconRelation;
import com.bigdata.rdf.spo.SPORelation;
import com.bigdata.relation.accesspath.AccessPath;
import com.bigdata.relation.accesspath.IAccessPath;
import com.bigdata.relation.accesspath.IElementFilter;
import com.bigdata.relation.locator.ILocatableResource;
import com.bigdata.service.IBigdataFederation;
import com.bigdata.striterator.IKeyOrder;

/**
 * An abstraction corresponding to a set of elements using some schema (think a
 * table containing a set of rows). Each relation is backed by one or more
 * indices and knows how to return the {@link IAccessPath} that is most
 * efficient given an {@link IPredicate} expressing a query against the
 * {@link IRelation}.
 * 
 * @author Bryan Thompson
 * @version $Id$
 * @param E
 *            The generic type for the elements in the relation.
 */
public interface IRelation extends ILocatableResource>{

    /**
     * The {@link IIndexManager} for the {@link IRelation}.
     */
    IIndexManager getIndexManager();

    /**
     * The service used to run asynchronous or parallel tasks for the
     * {@link IRelation}.
     */
    ExecutorService getExecutorService();

    /**
     * Return the class for the generic type of this relation. This information
     * is used to dynamically create arrays of that generic type.
     */
    Class getElementClass();
    
//    /**
//     * Create and return a new element. The element is constructed from the
//     * predicate given the bindings. Typically, this is used when generating an
//     * {@link ISolution} for an {@link IRule} during either a query or mutation
//     * operations. The element is NOT inserted into the relation.
//     * 
//     * @param predicate
//     *            The predicate that is the head of some {@link IRule}.
//     * @param bindingSet
//     *            A set of bindings for that {@link IRule}.
//     * 
//     * @return The new element.
//     * 
//     * @throws IllegalArgumentException
//     *             if any parameter is null.
//     * @throws IllegalStateException
//     *             if the predicate is not fully bound given those bindings.
//     */
//    E newElement(IPredicate predicate, IBindingSet bindingSet);

    /**
     * Create and return a new element. The element is constructed from the
     * ordered list of variables and constants. Variables are replaced using the
     * given the bindings. The element is NOT inserted into the relation.
     * 
     * @param args
     *            An ordered list of variables and/or constants.
     * @param bindingSet
     *            A set of bindings.
     * 
     * @return The new element.
     * 
     * @throws IllegalArgumentException
     *             if any parameter is null.
     * @throws IllegalArgumentException
     *             if any of a is neither an {@link IVariable} nor an
     *             {@link IPredicate}.
     * @throws IllegalStateException
     *             if there exists a variable which is not bound given those
     *             bindings.
     */
    E newElement(List args, IBindingSet bindingSet);

    /**
     * Return the fully qualified name of each index maintained by this
     * relation.
     * 
     * @return An immutable set of the index names for the relation.
     * 
     * @deprecated by {@link #getKeyOrders()}. However, note that some odd ball
     *             cases exist such as the free text index of the
     *             {@link LexiconRelation} and the justifications index of the
     *             {@link SPORelation}.  These are currently enumerated by
     *             {@link #getIndexNames()} but they are not enumerated by
     *             {@link #getKeyOrders()} since they are not a simple 
     *             transform of the original relation.
     */
    Set getIndexNames();

    /**
     * Return the {@link IKeyOrder} for the primary index for the relation.
     */
    IKeyOrder getPrimaryKeyOrder();

    /**
     * Return the {@link IKeyOrder}s corresponding to the registered indices for
     * this relation. [rather than getIndexNames?]
     */
    Iterator> getKeyOrders();

    /**
     * Return the {@link IKeyOrder} for the predicate corresponding to the
     * perfect access path. A perfect access path is one where the bound values
     * in the predicate form a prefix in the key space of the corresponding
     * index.
     * 
     * @param p
     *            The predicate.
     * 
     * @return The {@link IKeyOrder} for the perfect access path -or-
     *         null if there is no index which provides a perfect
     *         access path for that predicate.
     * 
     * @todo What about "best" versus "perfect"? Perfect is more a concept from
     *       RDF with covering indices. For other schemas we will often just
     *       have "best". If you only have one index then it is always "best".
     *       However, in order to use the "best" access path we must impose the
     *       constraint on the {@link IAccessPath} that it filter out any
     *       elements visited during the scan which do not satisfy the places
     *       where bound variables or constants appear in the predicate.
     *       
     *       Range count estimates will report all rows to be scanned. Exact
     *       range counts will perform the scan, applying any filters.
     */
    IKeyOrder getKeyOrder(IPredicate predicate);

    /**
     * Return the best {@link IAccessPath} for a relation given a predicate with
     * zero or more unbound variables.
     * 

     * If there is an {@link IIndex} that directly corresponds to the natural
     * order implied by the variable pattern on the predicate then the access
     * path should use that index. Otherwise you should choose the best index
     * given the constraints and make sure that the {@link IAccessPath}
     * incorporates additional filters that will allow you to filter out the
     * irrelevant {@link ITuple}s during the scan - this is very important when
     * the index is remote!
     * 

     * If there are any {@link IElementFilter}s then the access path MUST
     * incorporate those constraints such that only elements that satisfy the
     * constraints may be visited.
     * 

     * Whether the constraints arise because of the lack of a perfect index for
     * the access path or because they were explicitly specified for the
     * {@link IPredicate}, those constraints should be translated into
     * constraints imposed on the underlying {@link ITupleIterator} and sent
     * with it to be evaluated local to the data.
     * 

     * Note: Filters should be specified when the {@link IAccessPath} is
     * constructed so that they will be evaluated on the data service rather
     * than materializing the elements and then filtering then. This can be
     * accomplished by adding the filter as a constraint on the predicate when
     * specifying the access path.
     * 
     * @param predicate
     *            The constraint on the elements to be visited.
     * 
     * @return The best {@link IAccessPath} for that {@link IPredicate}.
     * 
     * @see #getAccessPath(IKeyOrder, IPredicate)
     */
    IAccessPath getAccessPath(IPredicate predicate);

    /**
     * Return the {@link IAccessPath} for an {@link IRelation} using the
     * specified {@link IKeyOrder}.
     * 
     * @param keyOrder
     *            Identifies which index to use (required).
     * @param predicate
     *            The predicate (required).
     *            
     * @return The {@link IAccessPath}.
     * 
     * @see #getAccessPath(IIndexManager, IKeyOrder, IPredicate) 
     */
    IAccessPath getAccessPath(IKeyOrder keyOrder,IPredicate predicate);

    /**
     * Return the {@link IAccessPath} for an {@link IRelation} using the
     * specified {@link IIndexManager} and {@link IKeyOrder} (core impl).
     * 

     * 
Predicate annotations

     * Together, this method and {@link AccessPath} is responsible for
     * interpreting the following {@link IPredicate}
     * {@link IPredicate#Annotations}:
     * 
     * {@link IPredicate.Annotations#ACCESS_PATH_EXPANDER}

     * 

     * 

     * Access paths and a Standalone Database

     * There is only one {@link IIndexManager} when running against a standalone
     * database. That {@link IIndexManager} is available from
     * {@link IRelation#getIndexManager()}.
     * 
     * Access Paths and Scale-Out Operators

     * 
     * Scale-out {@link BOp operators} which are
     * {@link BOpEvaluationContext#SHARDED} or
     * {@link BOpEvaluationContext#HASHED} require access to the local index
     * manager on the data service and signal this using:
     * 

     * The {@link BOpEvaluationContext#SHARDED} or
     * {@link BOpEvaluationContext#HASHED} (on a join); and

     * The {@link IPredicate.Annotations#PARTITION_ID} (for a shard-wise
     * access path).

     * 

     * In order to service a request for a local access path in scale-out, the
     * caller MUST specify the localIndexManager.
     * 
     * Scale-out {@link BOp operators} MAY use remote access paths and signal
     * this using:
     * 

     * The {@link BOpEvaluationContext#ANY} (on a join); and

     * Setting {@link IPredicate.Annotations#REMOTE_ACCESS_PATH} to
     * true.

     * 

     * When a remote access path is required, the localIndexManager is
     * ignored and {@link IRelation#getIndexManager()} is used to obtain the
     * {@link IBigdataFederation} from which the {@link IRelation} definition
     * was materialized.
     * 
     * @param localIndexManager
     *            The local index manager (optional).
     * @param keyOrder
     *            Identifies which index to use (required).
     * @param predicate
     *            The predicate (required).
     * 
     * @return The {@link IAccessPath}.
     */
    IAccessPath getAccessPath(IIndexManager localIndexManager,
            IKeyOrder keyOrder, IPredicate predicate);

//    /**
//     * This handles a request for an access path that is restricted to a
//     * specific index partition. This access path is used with the scale-out
//     * JOIN strategy, which distributes join tasks onto each index partition
//     * from which it needs to read. Those tasks constrain the predicate to only
//     * read from the index partition which is being serviced by that join task.
//     * 
//     * Note: Expanders ARE NOT applied in this code path. Expanders require a
//     * total view of the relation, which is not available during scale-out
//     * pipeline joins.
//     * 
//     * @param indexManager
//     *            This MUST be the data service local index manager so that the
//     *            returned access path will read against the local shard.
//     * @param predicate
//     *            The predicate. {@link IPredicate#getPartitionId()} MUST return
//     *            a valid index partition identifier.
//     * 
//     * @throws IllegalArgumentException
//     *             if either argument is null.
//     * @throws IllegalArgumentException
//     *             unless the {@link IIndexManager} is a local index
//     *             manager providing direct access to the specified shard.
//     * @throws IllegalArgumentException
//     *             unless the predicate identifies a specific shard using
//     *             {@link IPredicate#getPartitionId()}.
//     *             
//     * @deprecated {@link AccessPath} is handling this directly based on the
//     *             {@link IPredicate.Annotations#PARTITION_ID}.
//     */
//    IAccessPath getAccessPathForIndexPartition(IIndexManager indexManager,
//            IPredicate predicate);
    
    /**
     * The fully qualified name of the index.
     * 
     * @param keyOrder
     *            The natural index order.
     * 
     * @return The index name.
     */
    String getFQN(IKeyOrder keyOrder);

    /**
     * Return the index for associated with the specified {@link IKeyOrder} this
     * view of the relation.
     * 
     * @param keyOrder
     *            The natural index order.
     * 
     * @return The index -or- null iff the index does not exist as
     *         of the timestamp for this view of the relation.
     * 
     * @see #getIndex(String)
     */
    IIndex getIndex(IKeyOrder keyOrder);
    
}