org.modeshape.jcr.RepositoryQueryManager Maven / Gradle / Ivy
/*
* ModeShape (http://www.modeshape.org)
* See the COPYRIGHT.txt file distributed with this work for information
* regarding copyright ownership. Some portions may be licensed
* to Red Hat, Inc. under one or more contributor license agreements.
* See the AUTHORS.txt file in the distribution for a full listing of
* individual contributors.
*
* ModeShape is free software. Unless otherwise indicated, all code in ModeShape
* is licensed to you under the terms of the GNU Lesser General Public License as
* published by the Free Software Foundation; either version 2.1 of
* the License, or (at your option) any later version.
*
* ModeShape is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
* Lesser General Public License for more details.
*
* You should have received a copy of the GNU Lesser General Public
* License along with this software; if not, write to the Free
* Software Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA
* 02110-1301 USA, or see the FSF site: http://www.fsf.org.
*/
package org.modeshape.jcr;
import java.util.HashSet;
import java.util.LinkedList;
import java.util.Map;
import java.util.Properties;
import java.util.Queue;
import java.util.Set;
import java.util.concurrent.Callable;
import java.util.concurrent.ExecutorService;
import java.util.concurrent.Future;
import java.util.concurrent.locks.Lock;
import java.util.concurrent.locks.ReentrantLock;
import javax.jcr.query.InvalidQueryException;
import javax.transaction.Synchronization;
import org.hibernate.search.backend.TransactionContext;
import org.hibernate.search.engine.spi.SearchFactoryImplementor;
import org.hibernate.search.spi.SearchFactoryBuilder;
import org.modeshape.common.annotation.GuardedBy;
import org.modeshape.common.logging.Logger;
import org.modeshape.common.util.CheckArg;
import org.modeshape.jcr.JcrRepository.RunningState;
import org.modeshape.jcr.RepositoryConfiguration.QuerySystem;
import org.modeshape.jcr.api.query.qom.QueryCommand;
import org.modeshape.jcr.cache.CachedNode;
import org.modeshape.jcr.cache.ChildReference;
import org.modeshape.jcr.cache.ChildReferences;
import org.modeshape.jcr.cache.NodeCache;
import org.modeshape.jcr.cache.NodeKey;
import org.modeshape.jcr.cache.PathCache;
import org.modeshape.jcr.cache.RepositoryCache;
import org.modeshape.jcr.query.CancellableQuery;
import org.modeshape.jcr.query.QueryIndexing;
import org.modeshape.jcr.query.lucene.LuceneQueryEngine;
import org.modeshape.jcr.query.lucene.LuceneSearchConfiguration;
import org.modeshape.jcr.query.lucene.basic.BasicLuceneConfiguration;
import org.modeshape.jcr.query.optimize.Optimizer;
import org.modeshape.jcr.query.optimize.RuleBasedOptimizer;
import org.modeshape.jcr.query.plan.CanonicalPlanner;
import org.modeshape.jcr.query.plan.PlanHints;
import org.modeshape.jcr.query.plan.Planner;
import org.modeshape.jcr.query.validate.Schemata;
import org.modeshape.jcr.value.Path;
import org.modeshape.jcr.value.Path.Segment;
/**
* The query manager for the repository. Each instance lazily starts up the {@link LuceneQueryEngine}, which can be expensive.
*/
class RepositoryQueryManager {
// State of the running repository that owns this manager; read for the repository name, execution context,
// repository cache and node type manager.
private final RunningState runningState;
// Executor to which the asynchronous reindexing tasks are submitted; null when the two-argument constructor is used.
private final ExecutorService indexingExecutorService;
// Configuration handed to the search factory builder when the engine is first created; null when the two-argument
// constructor is used.
private final LuceneSearchConfiguration config;
// Held while the query engine is being created or shut down.
private final Lock engineInitLock = new ReentrantLock();
// Created on the first call to queryEngine() and reset to null by shutdown(). It is read without the lock for the
// initial null check and re-checked once the lock is held.
@GuardedBy( "engineInitLock" )
private volatile LuceneQueryEngine queryEngine;
// Logger used for the reindexing progress messages.
private final Logger logger = Logger.getLogger(getClass());
/**
 * Create a query manager that has neither an indexing executor nor a search configuration.
 *
 * @param runningState the running state of the owning repository
 * @param querySystem the query system configuration; not used by this constructor
 */
protected RepositoryQueryManager( RunningState runningState,
                                  QuerySystem querySystem ) {
    // No configuration and no executor are available through this constructor
    this.config = null;
    this.indexingExecutorService = null;
    this.runningState = runningState;
}
/**
 * Create a query manager whose search configuration is built from the supplied properties. The query engine itself is
 * not created here.
 *
 * @param runningState the running state of the owning repository; its name is used for the search configuration
 * @param querySystem the query system configuration; not used by this constructor
 * @param indexingExecutorService the executor used for asynchronous reindexing
 * @param backendProps the backend properties passed to the search configuration
 * @param indexingProps the indexing properties passed to the search configuration
 * @param indexStorageProps the index storage properties passed to the search configuration
 */
RepositoryQueryManager( RunningState runningState,
                        QuerySystem querySystem,
                        ExecutorService indexingExecutorService,
                        Properties backendProps,
                        Properties indexingProps,
                        Properties indexStorageProps ) {
    // Capture the configuration for the query engine, named after the repository ...
    this.config = new BasicLuceneConfiguration(runningState.name(), backendProps, indexingProps, indexStorageProps);
    this.indexingExecutorService = indexingExecutorService;
    this.runningState = runningState;
}
/**
 * Shut down the indexing executor (if there is one) and the query engine (if it has been created). The engine
 * reference is cleared even when the engine's own shutdown fails.
 */
void shutdown() {
    // The two-argument constructor leaves the executor null, so there may be nothing to stop
    if (indexingExecutorService != null) {
        indexingExecutorService.shutdown();
    }
    if (queryEngine == null) {
        // The engine was never started
        return;
    }
    // Acquire the lock before entering the try block, so that unlock() only runs when the lock is actually held
    engineInitLock.lock();
    try {
        // Check again now that we hold the lock ...
        if (queryEngine != null) {
            try {
                queryEngine.shutdown();
            } finally {
                queryEngine = null;
            }
        }
    } finally {
        engineInitLock.unlock();
    }
}
/**
 * Hand the supplied query to the query engine, creating the engine first if necessary.
 *
 * @param context the execution context passed to the engine
 * @param repositoryCache the repository cache passed to the engine
 * @param workspaceNames the workspace names passed to the engine
 * @param overriddenNodeCachesByWorkspaceName the overriding node caches passed to the engine
 * @param query the query command; it is cast to {@link org.modeshape.jcr.query.model.QueryCommand}
 * @param schemata the schemata passed to the engine
 * @param hints the plan hints passed to the engine
 * @param variables the variables passed to the engine
 * @return the cancellable query returned by the engine
 * @throws InvalidQueryException propagated from the query engine
 */
public CancellableQuery query( ExecutionContext context,
                               RepositoryCache repositoryCache,
                               Set workspaceNames,
                               Map overriddenNodeCachesByWorkspaceName,
                               QueryCommand query,
                               Schemata schemata,
                               PlanHints hints,
                               Map variables ) throws InvalidQueryException {
    // Obtain the engine before touching the arguments, then narrow the command to the engine's model type
    final LuceneQueryEngine engine = queryEngine();
    final org.modeshape.jcr.query.model.QueryCommand command = (org.modeshape.jcr.query.model.QueryCommand)query;
    return engine.query(context, repositoryCache, workspaceNames, overriddenNodeCachesByWorkspaceName, command, schemata,
                        hints, variables);
}
/**
 * Get the indexing interface of the query engine, creating the engine first if necessary.
 *
 * @return the query indexing object supplied by the engine
 */
public QueryIndexing getIndexes() {
    final LuceneQueryEngine engine = queryEngine();
    return engine.getQueryIndexing();
}
/**
 * Get the query engine, creating it on the first call. Creation happens while holding the engine lock, and the field is
 * re-checked once the lock is held so that only one engine is built.
 *
 * @return the query engine; never null
 */
protected final LuceneQueryEngine queryEngine() {
    // Read the volatile field once so that the value we test is the value we return
    LuceneQueryEngine engine = queryEngine;
    if (engine != null) {
        return engine;
    }
    // Acquire the lock before entering the try block, so that unlock() only runs when the lock is actually held
    engineInitLock.lock();
    try {
        engine = queryEngine;
        if (engine == null) {
            logger.debug("Hibernate Search configuration for repository '{0}': {1}", runningState.name(), config);
            boolean enableFullTextSearch = runningState.isFullTextSearchEnabled();
            Planner planner = new CanonicalPlanner();
            Optimizer optimizer = new RuleBasedOptimizer();
            SearchFactoryImplementor searchFactory = new SearchFactoryBuilder().configuration(config)
                                                                               .buildSearchFactory();
            engine = new LuceneQueryEngine(runningState.context(), runningState.name(), planner, optimizer,
                                           searchFactory, config.getVersion(), enableFullTextSearch);
            // Publish only the fully-constructed engine
            queryEngine = engine;
        }
        return engine;
    } finally {
        engineInitLock.unlock();
    }
}
/**
 * Crawl and index all of the repository content, either on the calling thread or as a task submitted to the indexing
 * executor.
 *
 * @param indexOnlyIfMissing flag which indicates whether all the nodes should be re-indexed or only nodes which are not part
 *        of the existing indexes
 * @param includeSystemContent flag which indicates whether content in the system workspace (below /jcr:system) should be
 *        re-indexed or not.
 * @param async flag which indicates whether the operation should be done synchronously or asynchronously; when true the
 *        work is submitted to the indexing executor and this method does not wait for it
 */
protected void reindexContent( final boolean indexOnlyIfMissing,
                               final boolean includeSystemContent,
                               boolean async ) {
    if (!async) {
        reindexContent(indexOnlyIfMissing, includeSystemContent);
        return;
    }
    // The returned future is not retained, so the caller gets no handle on the background work
    indexingExecutorService.submit(new Callable<Void>() {
        @SuppressWarnings( "synthetic-access" )
        @Override
        public Void call() throws Exception {
            reindexContent(indexOnlyIfMissing, includeSystemContent);
            return null;
        }
    });
}
/**
 * Crawl and index all of the repository content on the calling thread.
 *
 * @param indexOnlyIfMissing true if the keys that the indexes already contain should be skipped, or false if every node
 *        should be re-indexed
 * @param includeSystemContent true if the content of the system workspace should also be indexed
 */
private void reindexContent( boolean indexOnlyIfMissing,
                             boolean includeSystemContent ) {
    // The node type schemata changes every time a node type is (un)registered, so get the snapshot that we'll use throughout
    NodeTypeSchemata schemata = runningState.nodeTypeManager().getRepositorySchemata();
    RepositoryCache repoCache = runningState.repositoryCache();

    // If we want to index only missing nodes, we need to load what's already indexed
    Set excludedKeysFromIndexing = new HashSet();
    if (indexOnlyIfMissing) {
        excludedKeysFromIndexing.addAll(getIndexes().indexedNodes());
        if (excludedKeysFromIndexing.isEmpty()) {
            logger.info(JcrI18n.reindexMissingNoIndexesExist, runningState.name());
        } else {
            logger.debug("Only missing indexes will be re-indexed in the {0} repository. The existing nodes are indexed: {1}",
                         runningState.name(),
                         excludedKeysFromIndexing);
        }
    } else {
        logger.info(JcrI18n.reindexAll, runningState.name());
    }

    if (includeSystemContent) {
        NodeCache systemWorkspaceCache = repoCache.getWorkspaceCache(repoCache.getSystemWorkspaceName());
        CachedNode rootNode = systemWorkspaceCache.getNode(repoCache.getSystemKey());
        // Index the system content ...
        logger.debug("Starting reindex of system content in '{0}' repository.", runningState.name());
        reindexSystemContent(rootNode, Integer.MAX_VALUE, schemata, excludedKeysFromIndexing);
        logger.debug("Completed reindex of system content in '{0}' repository.", runningState.name());
    }

    // Index the non-system workspaces ...
    for (String workspaceName : repoCache.getWorkspaceNames()) {
        NodeCache workspaceCache = repoCache.getWorkspaceCache(workspaceName);
        CachedNode rootNode = workspaceCache.getNode(workspaceCache.getRootKey());
        // The message names the workspace first ({0}) and the repository second ({1}), so pass them in that order
        logger.debug("Starting reindex of workspace '{0}' content in '{1}' repository.", workspaceName, runningState.name());
        reindexContent(workspaceName, schemata, workspaceCache, rootNode, Integer.MAX_VALUE, false, excludedKeysFromIndexing);
        logger.debug("Completed reindex of workspace '{0}' content in '{1}' repository.", workspaceName, runningState.name());
    }
}
/**
 * Crawl and index the content in the named workspace, starting at the root path and with no practical depth limit
 * ({@link Integer#MAX_VALUE}).
 *
 * @param workspace the workspace
 * @throws IllegalArgumentException if the workspace is null
 */
public void reindexContent( JcrWorkspace workspace ) {
    // Fail with the documented exception rather than a NullPointerException further down
    CheckArg.isNotNull(workspace, "workspace");
    reindexContent(workspace, Path.ROOT_PATH, Integer.MAX_VALUE);
}
/**
 * Crawl and index the content starting at the supplied path in the named workspace, to the designated depth. Nothing is
 * indexed when the path cannot be resolved to a node in the workspace's session cache.
 *
 * @param workspace the workspace
 * @param path the path of the content to be indexed
 * @param depth the depth of the content to be indexed
 * @throws IllegalArgumentException if the workspace or path are null, or if the depth is less than 1
 */
public void reindexContent( JcrWorkspace workspace,
                            Path path,
                            int depth ) {
    // Fail with the documented exception rather than a NullPointerException further down
    CheckArg.isNotNull(workspace, "workspace");
    CheckArg.isNotNull(path, "path");
    CheckArg.isPositive(depth, "depth");

    JcrSession session = workspace.getSession();
    NodeCache cache = session.cache().getWorkspace();
    String workspaceName = workspace.getName();

    // Walk down from the root, one segment at a time, looking for the node ...
    CachedNode node = cache.getNode(cache.getRootKey());
    for (Segment segment : path) {
        // Look for the child by name ...
        ChildReference ref = node.getChildReferences(cache).getChild(segment);
        if (ref == null) return;
        node = cache.getNode(ref);
        // Treat a reference that no longer resolves the same way as a missing child
        if (node == null) return;
    }

    // The node type schemata changes every time a node type is (un)registered, so get the snapshot that we'll use throughout
    NodeTypeSchemata schemata = runningState.nodeTypeManager().getRepositorySchemata();

    // If the node is in the system workspace ...
    String systemWorkspaceKey = runningState.repositoryCache().getSystemWorkspaceKey();
    if (node.getKey().getWorkspaceKey().equals(systemWorkspaceKey)) {
        reindexSystemContent(node, depth, schemata, null);
    } else {
        // It's just a regular node in the workspace ...
        reindexContent(workspaceName, schemata, cache, node, depth, path.isRoot(), null);
    }
}
/**
 * Index the supplied node and then, breadth-first, the nodes below it. Nodes that are not queryable are skipped together
 * with everything below them, and nodes whose keys are in the excluded set are not written to the indexes (although their
 * children are still visited).
 *
 * @param workspaceName the name of the workspace under which the nodes are indexed
 * @param schemata the node type schemata snapshot passed to the indexes
 * @param cache the cache from which the nodes, their paths and their children are read
 * @param node the node at which to start
 * @param depth the depth limit; a value of 1 indexes only the starting node
 * @param reindexSystemContent true if the "jcr:system" child of the starting node should be indexed through
 *        {@link #reindexSystemContent(CachedNode, int, NodeTypeSchemata, Set)}, or false if children of the starting node
 *        that belong to the system workspace should be left out
 * @param keysToExclude the keys of the nodes that should not be written to the indexes; may be null or empty
 */
protected void reindexContent( final String workspaceName,
                               final NodeTypeSchemata schemata,
                               NodeCache cache,
                               CachedNode node,
                               int depth,
                               boolean reindexSystemContent,
                               Set keysToExclude ) {
    if (!node.isQueryable(cache)) {
        return;
    }
    // A null or empty set means that nothing is excluded
    final boolean excludeCertainKeys = keysToExclude != null && !keysToExclude.isEmpty();

    // Get the path for the first node (we already have it, but we need to populate the cache) ...
    final PathCache paths = new PathCache(cache);
    Path nodePath = paths.getPath(node);

    // Index the first node ...
    final QueryIndexing indexes = getIndexes();
    final TransactionContext txnCtx = NO_TRANSACTION;
    if (!excludeCertainKeys || !keysToExclude.contains(node.getKey())) {
        indexes.updateIndex(workspaceName,
                            node.getKey(),
                            nodePath,
                            node.getPrimaryType(cache),
                            node.getMixinTypes(cache),
                            node.getProperties(cache),
                            schemata,
                            txnCtx);
    }

    if (depth == 1) return;

    // Create a queue for processing the subgraph
    final Queue<NodeKey> queue = new LinkedList<NodeKey>();
    final ChildReferences childRefs = node.getChildReferences(cache);

    if (reindexSystemContent) {
        // We need to look for the system node, and index it differently ...
        ChildReference systemRef = childRefs.getChild(JcrLexicon.SYSTEM);
        NodeKey systemKey = systemRef != null ? systemRef.getKey() : null;
        for (ChildReference childRef : childRefs) {
            NodeKey childKey = childRef.getKey();
            if (childKey.equals(systemKey)) {
                // This is the "/jcr:system" node ...
                CachedNode systemNode = cache.getNode(childKey);
                reindexSystemContent(systemNode, depth - 1, schemata, keysToExclude);
            } else {
                queue.add(childKey);
            }
        }
    } else {
        // Add all children to the queue, except for anything which is in the system area ...
        final String systemWorkspaceKey = runningState.systemWorkspaceKey();
        for (ChildReference childRef : childRefs) {
            NodeKey childKey = childRef.getKey();
            if (!childKey.getWorkspaceKey().equals(systemWorkspaceKey)) {
                queue.add(childKey);
            }
        }
    }

    // Now, process the queue until empty ...
    for (NodeKey key = queue.poll(); key != null; key = queue.poll()) {
        // Look up the node; skip keys that no longer resolve and nodes that are not queryable ...
        CachedNode queued = cache.getNode(key);
        if (queued == null || !queued.isQueryable(cache)) {
            continue;
        }
        nodePath = paths.getPath(queued);
        if (!excludeCertainKeys || !keysToExclude.contains(key)) {
            // Index the node ...
            indexes.updateIndex(workspaceName,
                                queued.getKey(),
                                nodePath,
                                queued.getPrimaryType(cache),
                                queued.getMixinTypes(cache),
                                queued.getProperties(cache),
                                schemata,
                                txnCtx);
        }

        // Check the depth ...
        // NOTE(review): the limit is compared against the size of the node's own path, not against its distance from
        // the starting node -- confirm that this is intended when the starting node is not the root
        if (nodePath.size() <= depth) {
            // Add the children to the queue ...
            for (ChildReference childRef : queued.getChildReferences(cache)) {
                queue.add(childRef.getKey());
            }
        }
    }
}
/**
 * Index the supplied node, and the nodes below it down to the given depth, using the system workspace's name and cache.
 *
 * @param nodeInSystemBranch the node at which to start
 * @param depth the depth limit passed on to the crawl
 * @param schemata the node type schemata snapshot passed on to the crawl
 * @param keysToExclude the keys of the nodes that should not be written to the indexes; may be null
 */
protected void reindexSystemContent( CachedNode nodeInSystemBranch,
                                     int depth,
                                     NodeTypeSchemata schemata,
                                     Set keysToExclude ) {
    final RepositoryCache repositoryCache = runningState.repositoryCache();
    final String systemWorkspaceName = repositoryCache.getSystemWorkspaceName();
    final NodeCache systemCache = repositoryCache.getWorkspaceCache(systemWorkspaceName);
    // Ask the crawl to treat any "jcr:system" child specially
    final boolean handleSystemChild = true;
    reindexContent(systemWorkspaceName, schemata, systemCache, nodeInSystemBranch, depth, handleSystemChild, keysToExclude);
}
/**
 * Index the content of the system workspace, starting at the node identified by the repository cache's system key.
 *
 * @param async true if the work should be submitted to the indexing executor without waiting for it, or false if it
 *        should be done on the calling thread
 */
protected void reindexSystemContent( boolean async ) {
    RepositoryCache repositoryCache = runningState.repositoryCache();
    final NodeCache systemWorkspaceCache = repositoryCache.getWorkspaceCache(repositoryCache.getSystemWorkspaceName());
    final CachedNode systemRoot = systemWorkspaceCache.getNode(repositoryCache.getSystemKey());
    if (!async) {
        reindexSystemContent(systemRoot, systemWorkspaceCache);
        return;
    }
    // The returned future is not retained, so the caller gets no handle on the background work
    indexingExecutorService.submit(new Callable<Void>() {
        @Override
        public Void call() throws Exception {
            reindexSystemContent(systemRoot, systemWorkspaceCache);
            return null;
        }
    });
}
/**
 * Index the supplied system node by itself, and then index each of its children together with everything below them.
 *
 * @param systemRoot the node at the top of the system content
 * @param systemWorkspaceCache the cache from which the children of the system node are read
 */
protected final void reindexSystemContent( CachedNode systemRoot,
                                           NodeCache systemWorkspaceCache ) {
    final NodeTypeSchemata schemata = runningState.nodeTypeManager().getRepositorySchemata();

    // A depth of 1 indexes the system node alone ...
    final int onlyTheNode = 1;
    reindexSystemContent(systemRoot, onlyTheNode, schemata, null);

    // ... and then each child is crawled without a practical depth limit
    final int unlimitedDepth = Integer.MAX_VALUE;
    for (ChildReference childReference : systemRoot.getChildReferences(systemWorkspaceCache)) {
        NodeKey childKey = childReference.getKey();
        CachedNode systemNode = systemWorkspaceCache.getNode(childKey);
        reindexSystemContent(systemNode, unlimitedDepth, schemata, null);
    }
}
/**
 * Asynchronously crawl and index the content in the named workspace. The work is submitted to the indexing executor.
 *
 * @param workspace the workspace
 * @return the future for the asynchronous operation, which yields {@link Boolean#TRUE} when the reindexing completes;
 *         never null
 * @throws IllegalArgumentException if the workspace is null
 */
public Future<Boolean> reindexContentAsync( final JcrWorkspace workspace ) {
    // Validate on the calling thread, so that the documented exception reaches the caller instead of the future
    CheckArg.isNotNull(workspace, "workspace");
    return indexingExecutorService.submit(new Callable<Boolean>() {
        @Override
        public Boolean call() throws Exception {
            reindexContent(workspace);
            return Boolean.TRUE;
        }
    });
}
/**
 * Asynchronously crawl and index the content starting at the supplied path in the named workspace, to the designated depth.
 * The work is submitted to the indexing executor.
 *
 * @param workspace the workspace
 * @param path the path of the content to be indexed
 * @param depth the depth of the content to be indexed
 * @return the future for the asynchronous operation, which yields {@link Boolean#TRUE} when the reindexing completes;
 *         never null
 * @throws IllegalArgumentException if the workspace or path are null, or if the depth is less than 1
 */
public Future<Boolean> reindexContentAsync( final JcrWorkspace workspace,
                                            final Path path,
                                            final int depth ) {
    // Validate on the calling thread, so that the documented exception reaches the caller instead of the future
    CheckArg.isNotNull(workspace, "workspace");
    CheckArg.isNotNull(path, "path");
    CheckArg.isPositive(depth, "depth");
    return indexingExecutorService.submit(new Callable<Boolean>() {
        @Override
        public Boolean call() throws Exception {
            reindexContent(workspace, path, depth);
            return Boolean.TRUE;
        }
    });
}
/**
 * The transaction context passed to the indexes while reindexing. It always reports that no transaction is in progress,
 * and rejects every other operation.
 */
protected static final TransactionContext NO_TRANSACTION = new TransactionContext() {
    /** Not supported by this context. */
    @Override
    public void registerSynchronization( Synchronization synchronization ) {
        throw new UnsupportedOperationException("Should not be called since we're just reading content");
    }

    /** Not supported by this context. */
    @Override
    public Object getTransactionIdentifier() {
        throw new UnsupportedOperationException("Should not be called since we're just reading content");
    }

    /** Always false. */
    @Override
    public boolean isTransactionInProgress() {
        return false;
    }
};
}
© 2015 - 2025 Weber Informatics LLC | Privacy Policy