org.apache.jackrabbit.oak.plugins.document.rdb.RDBVersionGCSupport Maven / Gradle / Ivy
/*
* Licensed to the Apache Software Foundation (ASF) under one or more
* contributor license agreements. See the NOTICE file distributed with
* this work for additional information regarding copyright ownership.
* The ASF licenses this file to You under the Apache License, Version 2.0
* (the "License"); you may not use this file except in compliance with
* the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.jackrabbit.oak.plugins.document.rdb;
import static com.google.common.collect.Iterables.filter;
import java.util.ArrayList;
import java.util.Arrays;
import java.util.Collections;
import java.util.Iterator;
import java.util.List;
import java.util.Set;
import org.apache.jackrabbit.oak.plugins.document.Collection;
import org.apache.jackrabbit.oak.plugins.document.NodeDocument;
import org.apache.jackrabbit.oak.plugins.document.NodeDocument.SplitDocType;
import org.apache.jackrabbit.oak.plugins.document.VersionGCSupport;
import org.apache.jackrabbit.oak.plugins.document.rdb.RDBDocumentStore.QueryCondition;
import com.google.common.base.Predicate;
import com.google.common.collect.AbstractIterator;
/**
* RDB specific version of {@link VersionGCSupport} which uses an extended query
* interface to fetch required {@link NodeDocument}s.
*/
public class RDBVersionGCSupport extends VersionGCSupport {
private RDBDocumentStore store;
public RDBVersionGCSupport(RDBDocumentStore store) {
super(store);
this.store = store;
}
@Override
public Iterable getPossiblyDeletedDocs(final long lastModifiedTime) {
List conditions = new ArrayList();
conditions.add(new QueryCondition(NodeDocument.DELETED_ONCE, "=", 1));
conditions.add(new QueryCondition(NodeDocument.MODIFIED_IN_SECS, "<", NodeDocument.getModifiedInSecs(lastModifiedTime)));
return getIterator(RDBDocumentStore.EMPTY_KEY_PATTERN, conditions);
}
private Iterable getSplitDocuments() {
List conditions = Collections.emptyList();
// absent support for SDTYPE as indexed property: exclude those
// documents from the query which definitively aren't split documents
List excludeKeyPatterns = Arrays.asList("_:/%", "__:/%", "___:/%");
return getIterator(excludeKeyPatterns, conditions);
}
@Override
protected Iterable identifyGarbage(final Set gcTypes, final long oldestRevTimeStamp) {
return filter(getSplitDocuments(), new Predicate() {
@Override
public boolean apply(NodeDocument doc) {
return gcTypes.contains(doc.getSplitDocType()) && doc.hasAllRevisionLessThan(oldestRevTimeStamp);
}
});
}
private Iterable getIterator(final List excludeKeyPatterns, final List conditions) {
return new Iterable() {
@Override
public Iterator iterator() {
return new AbstractIterator() {
private static final int BATCH_SIZE = 100;
private String startId = NodeDocument.MIN_ID_VALUE;
private Iterator batch = nextBatch();
@Override
protected NodeDocument computeNext() {
// read next batch if necessary
if (!batch.hasNext()) {
batch = nextBatch();
}
NodeDocument doc;
if (batch.hasNext()) {
doc = batch.next();
// remember current id
startId = doc.getId();
} else {
doc = endOfData();
}
return doc;
}
private Iterator nextBatch() {
List result = store.query(Collection.NODES, startId, NodeDocument.MAX_ID_VALUE,
excludeKeyPatterns, conditions, BATCH_SIZE);
return result.iterator();
}
};
}
};
}
}