All downloads are free. Search and download functionality uses the official Maven repository.

io.telicent.core.FMod_InitialCompaction Maven / Gradle / Ivy

Go to download

System code - plugins, extensions, entrypoints etc. - for Smart Cache Graph

There is a newer version: 0.82.9
Show newest version
package io.telicent.core;

import org.apache.commons.io.FileUtils;
import org.apache.jena.atlas.lib.Timer;
import org.apache.jena.atlas.lib.Version;
import org.apache.jena.atlas.logging.FmtLog;
import org.apache.jena.fuseki.Fuseki;
import org.apache.jena.fuseki.kafka.FKS;
import org.apache.jena.fuseki.main.FusekiServer;
import org.apache.jena.fuseki.main.sys.FusekiAutoModule;
import org.apache.jena.rdf.model.Model;
import org.apache.jena.sparql.core.DatasetGraph;
import org.apache.jena.sparql.core.DatasetGraphWrapper;
import org.apache.jena.tdb2.DatabaseMgr;
import org.apache.jena.tdb2.store.DatasetGraphSwitchable;
import org.apache.jena.tdb2.sys.TDBInternal;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;

import java.io.File;
import java.util.*;
import java.util.function.Predicate;

import static java.lang.String.format;

/**
 * Fuseki module that compacts TDB2-backed datasets once the server has started.
 * <p>
 * The dataset names handed to {@link #prepare(FusekiServer.Builder, Set, Model)} are remembered, and each time
 * {@link #serverAfterStarting(FusekiServer)} is invoked every remembered dataset that resolves to a TDB2 database is
 * compacted. The on-disk size observed after each compaction is recorded so that a later invocation can skip datasets
 * that have not grown since.
 * </p>
 */
public class FMod_InitialCompaction implements FusekiAutoModule {

    public static final Logger LOG = LoggerFactory.getLogger("io.telicent.core.FMod_InitialCompaction");

    /**
     * Name of the setting intended to disable initial compaction.
     * NOTE(review): this constant is not read anywhere in this class - presumably it is consulted by whatever
     * registers the module; confirm against the caller.
     */
    public static final String DISABLE_INITIAL_COMPACTION = "DISABLE_INITIAL_COMPACTION";

    private static final String VERSION = Version.versionForClass(FMod_InitialCompaction.class).orElse("");

    /**
     * Test used by {@link #getTDB2(DatasetGraph)} to recognise a TDB2 dataset graph
     */
    private static final Predicate<DatasetGraph> IS_TDB_2 = TDBInternal::isTDB2;

    /**
     * Names of the datasets collected during {@code prepare()}, these are the candidates for compaction
     */
    final Set<String> datasets = new HashSet<>();

    /**
     * Passed as the second argument to {@code DatabaseMgr.compact()}
     */
    final boolean DELETE_OLD = true;

    /**
     * On-disk size (as reported by {@link #findDatabaseSize(DatasetGraph)}) recorded after the most recent compaction
     * of each dataset, keyed by dataset name
     */
    final Map<String, Long> sizes = new HashMap<>();

    @Override
    public String name() {
        return "Initial Compaction";
    }

    /**
     * Logs the module name and version, and remembers the dataset names for later compaction
     *
     * @param builder     Server builder (not used here)
     * @param names       Dataset names
     * @param configModel Configuration model (not used here)
     */
    @Override
    public void prepare(FusekiServer.Builder builder, Set<String> names, Model configModel) {
        FmtLog.info(Fuseki.configLog, "%s Fuseki Module (%s)", name(), VERSION);
        this.datasets.addAll(names);
    }

    @Override
    public void serverAfterStarting(FusekiServer server) {
        // Run after starting
        compactDatabases(server);
    }

    /**
     * Compacts every remembered dataset that is backed by TDB2
     *
     * @param server Server
     */
    private void compactDatabases(FusekiServer server) {
        for (String name : datasets) {
            compactDataset(server, name);
        }
    }

    /**
     * Compacts a single named dataset, unless it cannot be found, is not TDB2, or has not grown since the size
     * recorded after its previous compaction
     *
     * @param server Server
     * @param name   Dataset name
     */
    private void compactDataset(FusekiServer server, String name) {
        Optional<DatasetGraph> optionalDatasetGraph = FKS.findDataset(server, name);
        if (optionalDatasetGraph.isEmpty()) {
            FmtLog.debug(LOG, "Compaction not required for %s as no graph", name);
            return;
        }

        DatasetGraph dsg = getTDB2(optionalDatasetGraph.get());
        if (dsg == null) {
            FmtLog.debug(LOG, "Compaction not required for %s as not TDB2", name);
            return;
        }

        // See how big the database is, and whether its size has changed
        // NB - Due to how the module is registered twice (see SmartCacheGraph) we'll get called twice, once
        //      before Kafka connectors are started, and again after they are started, this gives us two
        //      opportunities to compact stuff
        long sizeBefore = findDatabaseSize(dsg);
        Long previousSize = this.sizes.get(name);
        if (previousSize != null && sizeBefore <= previousSize) {
            FmtLog.info(LOG,
                        "[Compaction] Additional compaction not required for %s as it is already maximally compacted at %s",
                        name, humanReadableSize(sizeBefore));
            return;
        }

        FmtLog.info(LOG, "[Compaction] >>>> Start compact %s, current size is %s", name,
                    humanReadableSize(sizeBefore));
        Timer timer = new Timer();
        timer.startTimer();
        DatabaseMgr.compact(dsg, DELETE_OLD);
        long sizeAfter = findDatabaseSize(dsg);
        FmtLog.info(LOG, "[Compaction] <<<< Finish compact %s. Took %s seconds.  Compacted size is %s",
                    name, Timer.timeStr(timer.endTimer()), humanReadableSize(sizeAfter));
        // Remember the post-compaction size so a later call can tell whether the database has grown since
        this.sizes.put(name, sizeAfter);
    }

    /**
     * Finds the database size on disk (assuming it's a TDB 2 on-disk database)
     *
     * @param dsg Dataset Graph
     * @return Size on disk, or {@code -1} if not calculable, i.e. the graph is not a {@link DatasetGraphSwitchable} or
     *         its container directory does not exist
     */
    public static long findDatabaseSize(DatasetGraph dsg) {
        if (dsg instanceof DatasetGraphSwitchable switchable) {
            File dbDir = switchable.getContainerPath().toFile();
            if (dbDir.exists()) {
                return FileUtils.sizeOfDirectory(dbDir);
            }
        }
        return -1;
    }

    /**
     * Formats a database size (if known) as a human-readable size
     *
     * @param size Size, may be less than zero if unknown
     * @return Human-readable size, or {@code Unknown} for a negative size
     */
    public static String humanReadableSize(long size) {
        if (size < 0) {
            return "Unknown";
        } else {
            return FileUtils.byteCountToDisplaySize(size);
        }
    }

    /**
     * Check the given Graph and, if possible, return the underlying TDB2 instance
     * <p>
     * Wrappers are peeled off one layer at a time until either a TDB2 dataset graph is found or the current graph is
     * no longer a {@link DatasetGraphWrapper}.
     * </p>
     *
     * @param dsg Graph
     * @return TDB2 compatible DSG or null
     */
    public static DatasetGraph getTDB2(DatasetGraph dsg) {
        for (; ; ) {
            if (IS_TDB_2.test(dsg)) {
                return dsg;
            }
            if (!(dsg instanceof DatasetGraphWrapper dsgw)) {
                return null;
            }
            dsg = dsgw.getWrapped();
        }
    }
}




© 2015 - 2024 Weber Informatics LLC | Privacy Policy