org.lenskit.eval.traintest.ComponentCache Maven / Gradle / Ivy
Go to download
Show more of this group Show more artifacts with this name
Show all versions of lenskit-eval Show documentation
Show all versions of lenskit-eval Show documentation
Facilities for evaluating recommender algorithms.
/*
* LensKit, an open source recommender systems toolkit.
* Copyright 2010-2014 LensKit Contributors. See CONTRIBUTORS.md.
* Work on LensKit has been funded by the National Science Foundation under
* grants IIS 05-34939, 08-08692, 08-12148, and 10-17697.
*
* This program is free software; you can redistribute it and/or modify
* it under the terms of the GNU Lesser General Public License as
* published by the Free Software Foundation; either version 2.1 of the
* License, or (at your option) any later version.
*
* This program is distributed in the hope that it will be useful, but WITHOUT
* ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
* FOR A PARTICULAR PURPOSE. See the GNU General Public License for more
* details.
*
* You should have received a copy of the GNU General Public License along with
* this program; if not, write to the Free Software Foundation, Inc., 51
* Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA.
*/
package org.lenskit.eval.traintest;
import com.google.common.base.Optional;
import com.google.common.collect.Lists;
import org.grouplens.grapht.Component;
import org.grouplens.grapht.Dependency;
import org.grouplens.grapht.InjectionException;
import org.grouplens.grapht.graph.DAGEdge;
import org.grouplens.grapht.graph.DAGNode;
import org.grouplens.grapht.graph.DAGNodeBuilder;
import org.grouplens.grapht.reflect.Satisfaction;
import org.grouplens.grapht.reflect.SatisfactionVisitor;
import org.grouplens.grapht.reflect.Satisfactions;
import org.lenskit.inject.GraphtUtils;
import org.lenskit.inject.NodeInstantiator;
import org.lenskit.inject.NodeProcessor;
import org.grouplens.lenskit.util.io.*;
import org.lenskit.util.UncheckedInterruptException;
import org.lenskit.util.io.StagedWrite;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
import javax.annotation.Nonnull;
import javax.annotation.Nullable;
import javax.annotation.concurrent.ThreadSafe;
import javax.inject.Provider;
import java.io.*;
import java.lang.ref.SoftReference;
import java.nio.channels.ClosedByInterruptException;
import java.nio.file.Files;
import java.nio.file.Path;
import java.nio.file.StandardOpenOption;
import java.util.List;
import java.util.concurrent.ConcurrentHashMap;
import java.util.zip.GZIPInputStream;
import java.util.zip.GZIPOutputStream;
/**
* Shared cache for components in merged compilations. This cache implements two kinds of caching for shareable nodes:
*
* - Soft references to allow instances to be opportunistically reused between invocations
* - Optional disk-based caching to allow shareable components to be shared between all uses, even if their soft
* references might be flushed out of memory, as well as reused by subsequent evaluator invocations.
*/
@ThreadSafe
class ComponentCache implements NodeProcessor {
private static final Logger logger = LoggerFactory.getLogger(ComponentCache.class);
@Nullable
private final Path cacheDir;
@Nullable
private final ClassLoader classLoader;
private NodeInstantiator instantiator;
/**
* The set of cacheable nodes.
*/
private final ConcurrentHashMap,CacheEntry> cache;
/**
* Construct a new component cache.
*
* @param dir The cache directory (or {@code null} to disable disk-based caching).
* @param loader The class loader to be used when loading components from disk (or {@code null} if not needed).
*/
public ComponentCache(@Nullable Path dir, @Nullable ClassLoader loader) {
cacheDir = dir;
classLoader = loader;
instantiator = NodeInstantiator.create();
cache = new ConcurrentHashMap<>();
}
@Nullable
public Path getCacheDir() {
return cacheDir;
}
Object instantiate(@Nonnull DAGNode node) throws InjectionException {
DAGNode n2 = processNode(node, node);
return instantiator.instantiate(n2);
}
@Nonnull
@Override
public DAGNode processNode(@Nonnull DAGNode node,
@Nonnull DAGNode original) throws InjectionException {
// We only want to process shareable nodes.
if (!GraphtUtils.isShareable(node)) {
return node;
}
// Is the object pre-instantiated? If so, we will skip the caching logic.
Component label = node.getLabel();
Satisfaction satisfaction = label.getSatisfaction();
if (satisfaction.hasInstance()) {
return node;
}
// Make sure we have a cache entry for this node.
CacheEntry newEntry = new CacheEntry(node);
CacheEntry entry = cache.putIfAbsent(original, newEntry);
if (entry == null) {
// didn't find an entry, but inserted the new one
entry = newEntry;
}
// Now try to get the instantiated object from the cache
Object obj;
try {
obj = entry.getObject(node);
} catch (IOException e) {
throw new InjectionException("Cache I/O error", e);
}
// Build a new satisfaction and a node, with all non-transient edges.
Satisfaction instanceSat;
if (obj == null) {
instanceSat = Satisfactions.nullOfType(satisfaction.getErasedType());
} else {
instanceSat = Satisfactions.instance(obj);
}
Component newLabel = Component.create(instanceSat, label.getCachePolicy());
// build new node with replacement label
DAGNodeBuilder bld = DAGNode.newBuilder(newLabel);
// retain all non-transient edges
for (DAGEdge edge: node.getOutgoingEdges()) {
if (!GraphtUtils.edgeIsTransient(edge)) {
bld.addEdge(edge.getTail(), edge.getLabel());
}
}
return bld.build();
}
/**
* Class with the cache entry logic.
*/
private class CacheEntry {
private final String key;
// reference *inside* optional so we don't GC the optional while keeping the object
// this is null for uncached, empty for cached null
private Optional> cachedObject;
/**
* Createa a cache entry.
* @param n The node.
*/
public CacheEntry(DAGNode n) {
key = makeNodeKey(n);
}
@Nullable
private Path getCacheFile() {
if (cacheDir == null) {
return null;
} else {
return cacheDir.resolve(key + ".dat.gz");
}
}
/**
* Get the object.
* @param node The live version of the node. It must be compatible with the node used
* to create this object! That means that it should be the same node, or a
* mutation of the node.
* @return The object loaded from the cache, or from instantiating {@code node}.
* @throws IOException If there is an I/O error with the cache.
*/
public synchronized Object getObject(DAGNode node) throws IOException, InjectionException {
// check soft-reference cache
Optional
© 2015 - 2025 Weber Informatics LLC | Privacy Policy