// org.apache.jackrabbit.oak.segment.WriterCacheManager Maven / Gradle / Ivy
/*
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing,
* software distributed under the License is distributed on an
* "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
* KIND, either express or implied. See the License for the
* specific language governing permissions and limitations
* under the License.
*/
package org.apache.jackrabbit.oak.segment;
import static com.google.common.base.Preconditions.checkNotNull;
import static com.google.common.base.Suppliers.memoize;
import static com.google.common.collect.Iterators.transform;
import static com.google.common.collect.Maps.newConcurrentMap;
import static java.lang.Integer.getInteger;
import static org.apache.jackrabbit.oak.segment.RecordCache.newRecordCache;
import java.util.Iterator;
import java.util.concurrent.ConcurrentMap;
import com.google.common.base.Function;
import com.google.common.base.Predicate;
import com.google.common.base.Supplier;
import com.google.common.cache.CacheStats;
import org.apache.jackrabbit.oak.api.jmx.CacheStatsMBean;
import org.apache.jackrabbit.oak.segment.file.PriorityCache;
import org.apache.jackrabbit.oak.stats.StatisticsProvider;
import org.jetbrains.annotations.NotNull;
import org.jetbrains.annotations.Nullable;
/**
 * Instances of this class manage the deduplication caches used by the {@link
 * SegmentWriter} to avoid writing multiple copies of the same record. The
 * caches are striped into generations with one generation per gc cycle. This
 * avoids records of old generations being reused.
 */
public abstract class WriterCacheManager {
/**
 * Default size of the string cache, used as default for OSGi config.
 * Also serves as the fallback value of {@link #DEFAULT_STRING_CACHE_SIZE}.
 */
static final int DEFAULT_STRING_CACHE_SIZE_OSGi = 15000;
/**
 * Default size of the string cache. The value is read once, at class
 * initialization, from the {@code oak.tar.stringsCacheSize} system property
 * and falls back to {@link #DEFAULT_STRING_CACHE_SIZE_OSGi} when the
 * property does not yield an integer.
 * @see #getStringCache(int)
 */
public static final int DEFAULT_STRING_CACHE_SIZE = getInteger(
"oak.tar.stringsCacheSize", DEFAULT_STRING_CACHE_SIZE_OSGi);
/**
 * Default size of the template cache, used as default for OSGi config.
 * Also serves as the fallback value of {@link #DEFAULT_TEMPLATE_CACHE_SIZE}.
 */
static final int DEFAULT_TEMPLATE_CACHE_SIZE_OSGi = 3000;
/**
 * Default size of the template cache. The value is read once, at class
 * initialization, from the {@code oak.tar.templatesCacheSize} system
 * property and falls back to {@link #DEFAULT_TEMPLATE_CACHE_SIZE_OSGi} when
 * the property does not yield an integer.
 * @see #getTemplateCache(int)
 */
public static final int DEFAULT_TEMPLATE_CACHE_SIZE = getInteger(
"oak.tar.templatesCacheSize", DEFAULT_TEMPLATE_CACHE_SIZE_OSGi);
/**
 * Default size of the node deduplication cache, used as default for OSGi
 * config. Also serves as the fallback value of
 * {@link #DEFAULT_NODE_CACHE_SIZE}. The literal equals 2^20.
 */
static final int DEFAULT_NODE_CACHE_SIZE_OSGi = 1048576;
/**
 * Default size of the node deduplication cache. The value is read once, at
 * class initialization, from the {@code oak.tar.nodeCacheSize} system
 * property and falls back to {@link #DEFAULT_NODE_CACHE_SIZE_OSGi} when the
 * property does not yield an integer.
 * @see #getNodeCache(int)
 */
public static final int DEFAULT_NODE_CACHE_SIZE = getInteger(
"oak.tar.nodeCacheSize", DEFAULT_NODE_CACHE_SIZE_OSGi);
/**
 * Get the deduplication cache for string records of a given generation.
 *
 * @param generation  the gc generation the returned cache belongs to
 * @return cache for string records of the given {@code generation}.
 */
@NotNull
public abstract Cache<String, RecordId> getStringCache(int generation);
/**
 * Get the deduplication cache for template records of a given generation.
 *
 * @param generation  the gc generation the returned cache belongs to
 * @return cache for template records of the given {@code generation}.
 */
@NotNull
public abstract Cache<Template, RecordId> getTemplateCache(int generation);
/**
 * Get the deduplication cache for node records of a given generation. The
 * cache maps the stable id of a node to the id of its record.
 *
 * @param generation  the gc generation the returned cache belongs to
 * @return cache for node records of the given {@code generation}.
 */
@NotNull
public abstract Cache<String, RecordId> getNodeCache(int generation);
/**
 * Enable access statistics for the caches of this manager. The instance
 * returned from this method delegates back to this instance and adds
 * access statistics via the passed {@code statisticsProvider}.
 *
 * @param name                suffix appended to the names under which the
 *                            access statistics are exposed
 * @param statisticsProvider  provider the access statistics are recorded to
 * @return an instance of this cache manager with access statistics enabled.
 * @throws NullPointerException if any of the arguments is {@code null}
 */
@NotNull
public WriterCacheManager withAccessTracking(
        @NotNull String name,
        @NotNull StatisticsProvider statisticsProvider) {
    // Validate in declaration order so a null name is reported first.
    String trackerName = checkNotNull(name);
    StatisticsProvider provider = checkNotNull(statisticsProvider);
    return new AccessTrackingCacheManager(trackerName, provider, this);
}
/**
 * Statistics for the string cache. This base implementation always returns
 * {@code null}; subclasses that collect statistics override it.
 * @return statistics for the string cache or {@code null} if not available.
 */
@Nullable
public CacheStatsMBean getStringCacheStats() {
return null;
}
/**
 * Statistics for the template cache. This base implementation always
 * returns {@code null}; subclasses that collect statistics override it.
 * @return statistics for the template cache or {@code null} if not available.
 */
@Nullable
public CacheStatsMBean getTemplateCacheStats() {
return null;
}
/**
 * Statistics for the node cache. This base implementation always returns
 * {@code null}; subclasses that collect statistics override it.
 * @return statistics for the node cache or {@code null} if not available.
 */
@Nullable
public CacheStatsMBean getNodeCacheStats() {
return null;
}
/**
 * Get occupancy information for the node deduplication cache indicating occupancy and
 * evictions per priority. This base implementation always returns {@code null}.
 * @return occupancy information for the node deduplication cache or {@code null}
 *         if not available.
 */
@Nullable
public String getNodeCacheOccupancyInfo() { return null; }
/**
 * This implementation of {@link WriterCacheManager} returns empty caches
 * of size 0. The same string and template cache instances are returned for
 * every generation; the node cache never stores anything.
 * @see #INSTANCE
 */
public static class Empty extends WriterCacheManager {

    /**
     * Singleton instance of {@link Empty}
     */
    public static final WriterCacheManager INSTANCE = new Empty();

    /** String cache of size 0 shared by all generations. */
    private final RecordCache<String> stringCache = newRecordCache(0);

    /** Template cache of size 0 shared by all generations. */
    private final RecordCache<Template> templateCache = newRecordCache(0);

    /** Not instantiable from outside, use {@link #INSTANCE}. */
    private Empty() {}

    /**
     * @param generation  ignored, all generations share the same cache
     * @return empty cache of size 0
     */
    @NotNull
    @Override
    public RecordCache<String> getStringCache(int generation) {
        return stringCache;
    }

    /**
     * @param generation  ignored, all generations share the same cache
     * @return empty cache of size 0
     */
    @NotNull
    @Override
    public RecordCache<Template> getTemplateCache(int generation) {
        return templateCache;
    }

    /**
     * @param generation  ignored
     * @return a {@code Cache} that is always empty: puts with a cost are
     *         silently dropped, lookups always miss and puts without a cost
     *         are not supported.
     */
    @NotNull
    @Override
    public Cache<String, RecordId> getNodeCache(int generation) {
        return new Cache<String, RecordId>() {
            @Override
            public void put(@NotNull String stableId, @NotNull RecordId recordId, byte cost) {
                // Intentionally empty: nothing is ever cached.
            }

            @Override
            public void put(@NotNull String key, @NotNull RecordId value) {
                throw new UnsupportedOperationException();
            }

            @Nullable
            @Override
            public RecordId get(@NotNull String stableId) {
                return null;
            }
        };
    }
}
/**
* This implementation of {@link WriterCacheManager} returns
* {@link RecordCache} instances for the string and template cache
* and {@link Cache} instance for the node cache.
*/
public static class Default extends WriterCacheManager {
/**
* Cache of recently stored string records, used to avoid storing duplicates
* of frequently occurring data.
*/
private final Generations> stringCaches;
/**
* Cache of recently stored template records, used to avoid storing
* duplicates of frequently occurring data.
*/
private final Generations> templateCaches;
/**
* Cache of recently stored nodes to avoid duplicating linked nodes (i.e. checkpoints)
* during compaction.
*/
private final Supplier> nodeCache;
/**
* New instance using the passed factories for creating cache instances.
* The factories will be invoked exactly once when a generation of a
* cache is requested that has not been requested before.
*
* @param stringCacheFactory factory for the string cache
* @param templateCacheFactory factory for the template cache
* @param nodeCacheFactory factory for the node cache
*/
public Default(
@NotNull Supplier> stringCacheFactory,
@NotNull Supplier> templateCacheFactory,
@NotNull Supplier> nodeCacheFactory) {
this.stringCaches = new Generations<>(stringCacheFactory);
this.templateCaches = new Generations<>(templateCacheFactory);
this.nodeCache = memoize(nodeCacheFactory);
}
/**
* New instance using the default factories {@link RecordCache#factory(int)}
* and {@link PriorityCache#factory(int)} with the sizes
* {@link #DEFAULT_STRING_CACHE_SIZE}, {@link #DEFAULT_TEMPLATE_CACHE_SIZE}
* and {@link #DEFAULT_NODE_CACHE_SIZE}.
*/
public Default() {
this(RecordCache.factory(DEFAULT_STRING_CACHE_SIZE),
RecordCache.factory(DEFAULT_TEMPLATE_CACHE_SIZE),
PriorityCache.factory(DEFAULT_NODE_CACHE_SIZE));
}
private static class Generations implements Iterable {
private final ConcurrentMap> generations = newConcurrentMap();
private final Supplier cacheFactory;
Generations(@NotNull Supplier cacheFactory) {
this.cacheFactory = checkNotNull(cacheFactory);
}
T getGeneration(final int generation) {
// Preemptive check to limit the number of wasted (Memoizing)Supplier instances
if (!generations.containsKey(generation)) {
generations.putIfAbsent(generation, memoize(cacheFactory));
}
return generations.get(generation).get();
}
@NotNull
@Override
public Iterator iterator() {
return transform(generations.values().iterator(), new Function, T>() {
@Nullable @Override
public T apply(Supplier cacheFactory) {
return cacheFactory.get();
}
});
}
void evictGenerations(@NotNull Predicate evict) {
Iterator it = generations.keySet().iterator();
while (it.hasNext()) {
if (evict.apply(it.next())) {
it.remove();
}
}
}
}
@NotNull
@Override
public Cache getStringCache(int generation) {
return stringCaches.getGeneration(generation);
}
@NotNull
@Override
public Cache getTemplateCache(int generation) {
return templateCaches.getGeneration(generation);
}
private PriorityCache nodeCache() {
return nodeCache.get();
}
@Override
@NotNull
public Cache getNodeCache(final int generation) {
return new Cache() {
@Override
public void put(@NotNull String stableId, @NotNull RecordId recordId, byte cost) {
nodeCache().put(stableId, recordId, generation, cost);
}
@Override
public void put(@NotNull String key, @NotNull RecordId value) {
throw new UnsupportedOperationException();
}
@Nullable
@Override
public RecordId get(@NotNull String stableId) {
return nodeCache().get(stableId, generation);
}
};
}
@Nullable
@Override
public CacheStatsMBean getStringCacheStats() {
return new RecordCacheStats("String deduplication cache stats",
accumulateRecordCacheStats(stringCaches),
accumulateRecordCacheSizes(stringCaches),
accumulateRecordCacheWeights(stringCaches));
}
@Nullable
@Override
public CacheStatsMBean getTemplateCacheStats() {
return new RecordCacheStats("Template deduplication cache stats",
accumulateRecordCacheStats(templateCaches),
accumulateRecordCacheSizes(templateCaches),
accumulateRecordCacheWeights(templateCaches));
}
@NotNull
private static Supplier accumulateRecordCacheStats(
final Iterable> caches) {
return new Supplier() {
@Override
public CacheStats get() {
CacheStats stats = new CacheStats(0, 0, 0, 0, 0, 0);
for (RecordCache> cache : caches) {
stats = stats.plus(cache.getStats());
}
return stats;
}
};
}
@NotNull
public static Supplier accumulateRecordCacheSizes(
final Iterable> caches) {
return new Supplier() {
@Override
public Long get() {
long size = 0;
for (RecordCache> cache : caches) {
size += cache.size();
}
return size;
}
};
}
@NotNull
public static Supplier accumulateRecordCacheWeights(
final Iterable> caches) {
return new Supplier() {
@Override
public Long get() {
long size = 0;
for (RecordCache> cache : caches) {
size += cache.estimateCurrentWeight();
}
return size;
}
};
}
@Nullable
@Override
public CacheStatsMBean getNodeCacheStats() {
return new RecordCacheStats("Node deduplication cache stats",
new Supplier() {
@Override
public CacheStats get() {
return nodeCache().getStats();
}
},
new Supplier() {
@Override
public Long get() {
return nodeCache().size();
}
},
new Supplier() {
@Override
public Long get() {
return nodeCache().estimateCurrentWeight();
}
});
}
/**
* Remove all cache generations matching the passed {@code generations} predicate.
* @param generations
*/
protected final void evictCaches(Predicate generations) {
stringCaches.evictGenerations(generations);
templateCaches.evictGenerations(generations);
nodeCache().purgeGenerations(generations);
}
}
/**
 * Wrapper wrapping all caches returned by a {@link WriterCacheManager}
 * into a {@link CacheAccessTracker}. A new tracker is created on every
 * call of one of the cache accessors.
 */
private static class AccessTrackingCacheManager extends WriterCacheManager {
    @NotNull
    private final String name;

    @NotNull
    private final StatisticsProvider statisticsProvider;

    @NotNull
    private final WriterCacheManager delegate;

    /**
     * Create a new instance. The {@code name} passed is appended to the
     * names used to expose the access statistics.
     * @param name                  name under which to expose the access statistics
     * @param statisticsProvider    statistics provider where the access statistics is recorded to
     * @param delegate              the underlying, wrapped cache manager
     *
     * @see #getStringCache(int)
     * @see #getTemplateCache(int)
     * @see #getNodeCache(int)
     */
    public AccessTrackingCacheManager(
            @NotNull String name,
            @NotNull StatisticsProvider statisticsProvider,
            @NotNull WriterCacheManager delegate) {
        this.name = name;
        this.statisticsProvider = statisticsProvider;
        this.delegate = delegate;
    }

    /**
     * @return the wrapped cache returned by the delegate's method of
     *         the same name exposing access statistics under
     *         {@code "oak.segment.string-deduplication-cache-" + name}
     */
    @NotNull
    @Override
    public Cache<String, RecordId> getStringCache(int generation) {
        return new CacheAccessTracker<>(
                "oak.segment.string-deduplication-cache-" + name,
                statisticsProvider, delegate.getStringCache(generation)
        );
    }

    /**
     * @return the wrapped cache returned by the delegate's method of
     *         the same name exposing access statistics under
     *         {@code "oak.segment.template-deduplication-cache-" + name}
     */
    @NotNull
    @Override
    public Cache<Template, RecordId> getTemplateCache(int generation) {
        return new CacheAccessTracker<>(
                "oak.segment.template-deduplication-cache-" + name,
                statisticsProvider, delegate.getTemplateCache(generation)
        );
    }

    /**
     * @return the wrapped cache returned by the delegate's method of
     *         the same name exposing access statistics under
     *         {@code "oak.segment.node-deduplication-cache-" + name}
     */
    @NotNull
    @Override
    public Cache<String, RecordId> getNodeCache(int generation) {
        return new CacheAccessTracker<>(
                "oak.segment.node-deduplication-cache-" + name,
                statisticsProvider, delegate.getNodeCache(generation)
        );
    }
}
}
// © 2015 - 2025 Weber Informatics LLC | Privacy Policy