All Downloads are FREE. Search and download functionalities are using the official Maven repository.

apoc.periodic.Periodic Maven / Gradle / Ivy

There is a newer version: 5.25.1
Show newest version
/*
 * Copyright (c) "Neo4j"
 * Neo4j Sweden AB [http://neo4j.com]
 *
 * This file is part of Neo4j.
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *    http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
package apoc.periodic;

import static apoc.periodic.PeriodicUtils.recordError;
import static apoc.periodic.PeriodicUtils.submitJob;
import static apoc.periodic.PeriodicUtils.submitProc;
import static apoc.periodic.PeriodicUtils.wrapTask;
import static apoc.util.Util.merge;
import static org.neo4j.graphdb.QueryExecutionType.QueryType;

import apoc.Pools;
import apoc.periodic.PeriodicUtils.JobInfo;
import apoc.util.Util;
import apoc.util.collection.Iterables;
import apoc.util.collection.Iterators;
import java.util.*;
import java.util.concurrent.*;
import java.util.concurrent.atomic.AtomicInteger;
import java.util.regex.Matcher;
import java.util.regex.Pattern;
import java.util.stream.Stream;
import org.apache.commons.lang3.tuple.Pair;
import org.neo4j.graphdb.GraphDatabaseService;
import org.neo4j.graphdb.Result;
import org.neo4j.graphdb.Transaction;
import org.neo4j.graphdb.schema.ConstraintDefinition;
import org.neo4j.graphdb.schema.IndexDefinition;
import org.neo4j.graphdb.schema.Schema;
import org.neo4j.kernel.impl.coreapi.InternalTransaction;
import org.neo4j.logging.Log;
import org.neo4j.procedure.*;

public class Periodic {

    enum Planner {
        DEFAULT,
        COST,
        IDP,
        DP
    }

    public static final Pattern PLANNER_PATTERN =
            Pattern.compile("\\bplanner\\s*=\\s*[^\\s]*", Pattern.CASE_INSENSITIVE);
    public static final Pattern RUNTIME_PATTERN = Pattern.compile("\\bruntime\\s*=", Pattern.CASE_INSENSITIVE);
    public static final Pattern CYPHER_PREFIX_PATTERN = Pattern.compile("^\\s*\\bcypher\\b", Pattern.CASE_INSENSITIVE);
    public static final String CYPHER_RUNTIME_SLOTTED = " runtime=slotted ";
    static final Pattern LIMIT_PATTERN = Pattern.compile("\\slimit\\s", Pattern.CASE_INSENSITIVE);

    @Context
    public GraphDatabaseService db;

    @Context
    public TerminationGuard terminationGuard;

    @Context
    public Log log;

    @Context
    public Pools pools;

    @Context
    public Transaction tx;

    @Admin
    @Procedure(name = "apoc.periodic.truncate", mode = Mode.SCHEMA)
    @Description(
            "Removes all entities (and optionally indexes and constraints) from the database using the `apoc.periodic.iterate` procedure.")
    public void truncate(
            @Name(
                            value = "config",
                            defaultValue = "{}",
                            description =
                                    """
            {
                dropSchema = true :: BOOLEAN,
                batchSize = 10000 :: INTEGER,
                parallel = false :: BOOLEAN,
                retries = 0 :: INTEGER,
                batchMode = "BATCH" :: STRING,
                params = {} :: MAP,
                concurrency :: INTEGER,
                failedParams = -1 :: INTEGER,
                planner = "DEFAULT" :: ["DEFAULT", "COST", "IDP", "DP"]
            }
            """)
                    Map config) {

        iterate("MATCH ()-[r]->() RETURN id(r) as id", "MATCH ()-[r]->() WHERE id(r) = id DELETE r", config);
        iterate("MATCH (n) RETURN id(n) as id", "MATCH (n) WHERE id(n) = id DELETE n", config);

        if (Util.toBoolean(config.get("dropSchema"))) {
            Schema schema = tx.schema();
            schema.getConstraints().forEach(ConstraintDefinition::drop);
            Util.getIndexes(tx).forEach(IndexDefinition::drop);
        }
    }

    @Procedure("apoc.periodic.list")
    @Description("Returns a `LIST` of all background jobs.")
    public Stream list() {
        return pools.getJobList().entrySet().stream().map((e) -> e.getKey().update(e.getValue()));
    }

    @Procedure(name = "apoc.periodic.commit", mode = Mode.WRITE)
    @Description("Runs the given statement in separate batched transactions.")
    public Stream commit(
            @Name(value = "statement", description = "The Cypher statement to run.") String statement,
            @Name(value = "params", defaultValue = "{}", description = "The parameters for the given Cypher statement.")
                    Map parameters) {
        validateQuery(statement);
        Map params = parameters == null ? Collections.emptyMap() : parameters;
        long total = 0, executions = 0, updates = 0;
        long start = System.nanoTime();

        if (!LIMIT_PATTERN.matcher(statement).find()) {
            throw new IllegalArgumentException("the statement sent to apoc.periodic.commit must contain a `limit`");
        }

        AtomicInteger batches = new AtomicInteger();
        AtomicInteger failedCommits = new AtomicInteger();
        Map commitErrors = new ConcurrentHashMap<>();
        AtomicInteger failedBatches = new AtomicInteger();
        Map batchErrors = new ConcurrentHashMap<>();
        String periodicId = UUID.randomUUID().toString();
        if (log.isDebugEnabled()) {
            log.debug("Starting periodic commit from `%s` in separate thread with id: `%s`", statement, periodicId);
        }
        do {
            Map window = Util.map("_count", updates, "_total", total);
            updates = Util.getFuture(
                    pools.getScheduledExecutorService().submit(() -> {
                        batches.incrementAndGet();
                        try {
                            return executeNumericResultStatement(statement, merge(window, params));
                        } catch (Exception e) {
                            failedBatches.incrementAndGet();
                            recordError(batchErrors, e);
                            return 0L;
                        }
                    }),
                    commitErrors,
                    failedCommits,
                    0L);
            total += updates;
            if (updates > 0) executions++;
            if (log.isDebugEnabled()) {
                log.debug("Processed in periodic commit with id %s, no %d executions", periodicId, executions);
            }
        } while (updates > 0 && !Util.transactionIsTerminated(terminationGuard));
        if (log.isDebugEnabled()) {
            log.debug("Terminated periodic commit with id %s with %d executions", periodicId, executions);
        }
        long timeTaken = TimeUnit.NANOSECONDS.toSeconds(System.nanoTime() - start);
        boolean wasTerminated = Util.transactionIsTerminated(terminationGuard);
        return Stream.of(new RundownResult(
                total,
                executions,
                timeTaken,
                batches.get(),
                failedBatches.get(),
                batchErrors,
                failedCommits.get(),
                commitErrors,
                wasTerminated));
    }

    public static class RundownResult {
        @Description("The total number of updates.")
        public final long updates;

        @Description("The total number of executions.")
        public final long executions;

        @Description("The total time taken in nanoseconds.")
        public final long runtime;

        @Description("The number of run batches.")
        public final long batches;

        @Description("The number of failed batches.")
        public final long failedBatches;

        @Description("Errors returned from the failed batches.")
        public final Map batchErrors;

        @Description("The number of failed commits.")
        public final long failedCommits;

        @Description("Errors returned from the failed commits.")
        public final Map commitErrors;

        @Description("If the job was terminated.")
        public final boolean wasTerminated;

        public RundownResult(
                long total,
                long executions,
                long timeTaken,
                long batches,
                long failedBatches,
                Map batchErrors,
                long failedCommits,
                Map commitErrors,
                boolean wasTerminated) {
            this.updates = total;
            this.executions = executions;
            this.runtime = timeTaken;
            this.batches = batches;
            this.failedBatches = failedBatches;
            this.batchErrors = batchErrors;
            this.failedCommits = failedCommits;
            this.commitErrors = commitErrors;
            this.wasTerminated = wasTerminated;
        }
    }

    private long executeNumericResultStatement(
            @Name("statement") String statement, @Name("params") Map parameters) {
        return db.executeTransactionally(statement, parameters, result -> {
            String column = Iterables.single(result.columns());
            return result.columnAs(column).stream().mapToLong(o -> (long) o).sum();
        });
    }

    @Procedure("apoc.periodic.cancel")
    @Description("Cancels the given background job.")
    public Stream cancel(@Name(value = "name", description = "The name of the job to cancel.") String name) {
        JobInfo info = new JobInfo(name);
        Future future = pools.getJobList().remove(info);
        if (future != null) {
            future.cancel(false);
            return Stream.of(info.update(future));
        }
        return Stream.empty();
    }

    @Procedure(name = "apoc.periodic.submit", mode = Mode.WRITE)
    @Description("Creates a background job which runs the given Cypher statement once.")
    public Stream submit(
            @Name(value = "name", description = "The name of the job.") String name,
            @Name(value = "statement", description = "The Cypher statement to run.") String statement,
            @Name(value = "params", defaultValue = "{}", description = "{ params = {} :: MAP }")
                    Map config) {
        validateQuery(statement);
        return submitProc(name, statement, config, db, log, pools);
    }

    @Procedure(name = "apoc.periodic.repeat", mode = Mode.WRITE)
    @Description("Runs a repeatedly called background job.\n" + "To stop this procedure, use `apoc.periodic.cancel`.")
    public Stream repeat(
            @Name(value = "name", description = "The name of the job.") String name,
            @Name(value = "statement", description = "The Cypher statement to run.") String statement,
            @Name(value = "rate", description = "The delay in seconds to wait between each job execution.") long rate,
            @Name(value = "config", defaultValue = "{}", description = "{ params = {} :: MAP }")
                    Map config) {
        validateQuery(statement);
        Map params = (Map) config.getOrDefault("params", Collections.emptyMap());
        JobInfo info = schedule(
                name,
                () -> {
                    // `resultAsString` in order to consume result
                    db.executeTransactionally(statement, params, Result::resultAsString);
                },
                0,
                rate);
        return Stream.of(info);
    }

    private void validateQuery(String statement) {
        Util.validateQuery(
                db,
                statement,
                Set.of(Mode.WRITE, Mode.READ, Mode.DEFAULT),
                QueryType.READ_ONLY,
                QueryType.WRITE,
                QueryType.READ_WRITE);
    }

    @Procedure(name = "apoc.periodic.countdown", mode = Mode.WRITE)
    @Description("Runs a repeatedly called background statement until it returns 0.")
    public Stream countdown(
            @Name(value = "name", description = "The name of the job.") String name,
            @Name(
                            value = "statement",
                            description =
                                    "The Cypher statement to run, returning a count on each run indicating the remaining iterations.")
                    String statement,
            @Name(value = "delay", description = "The delay in seconds to wait between each job execution.")
                    long delay) {
        validateQuery(statement);
        JobInfo info = submitJob(name, new Countdown(name, statement, delay, log), log, pools);
        info.delay = delay;
        return Stream.of(info);
    }

    /**
     * Call from a procedure that gets a @Context GraphDatbaseAPI db; injected and provide that db to the runnable.
     */
    public JobInfo schedule(String name, Runnable task, long delay, long repeat) {
        JobInfo info = new JobInfo(name, delay, repeat);
        Future future = pools.getJobList().remove(info);
        if (future != null && !future.isDone()) future.cancel(false);

        Runnable wrappingTask = wrapTask(name, task, log);
        ScheduledFuture newFuture = pools.getScheduledExecutorService()
                .scheduleWithFixedDelay(wrappingTask, delay, repeat, TimeUnit.SECONDS);
        pools.getJobList().put(info, newFuture);
        return info;
    }

    /**
     * Invoke cypherAction in batched transactions being fed from cypherIteration running in main thread
     * @param cypherIterate
     * @param cypherAction
     */
    @Procedure(name = "apoc.periodic.iterate", mode = Mode.WRITE)
    @Description("Runs the second statement for each item returned by the first statement.\n"
            + "This procedure returns the number of batches and the total number of processed rows.")
    public Stream iterate(
            @Name(value = "cypherIterate", description = "The first Cypher statement to be run.") String cypherIterate,
            @Name(
                            value = "cypherAction",
                            description =
                                    "The Cypher statement to run for each item returned by the initial Cypher statement.")
                    String cypherAction,
            @Name(
                            value = "config",
                            description =
                                    """
                    {
                        batchSize = 10000 :: INTEGER,
                        parallel = false :: BOOLEAN,
                        retries = 0 :: INTEGER,
                        batchMode = "BATCH" :: STRING,
                        params = {} :: MAP,
                        concurrency :: INTEGER,
                        failedParams = -1 :: INTEGER,
                        planner = "DEFAULT" :: ["DEFAULT", "COST", "IDP", "DP"]
                    }
                    """)
                    Map config) {
        validateQuery(cypherIterate);

        long batchSize = Util.toLong(config.getOrDefault("batchSize", 10000));
        if (batchSize < 1) {
            throw new IllegalArgumentException("batchSize parameter must be > 0");
        }
        int concurrency = Util.toInteger(
                config.getOrDefault("concurrency", Runtime.getRuntime().availableProcessors()));
        if (concurrency < 1) {
            throw new IllegalArgumentException("concurrency parameter must be > 0");
        }
        boolean parallel = Util.toBoolean(config.getOrDefault("parallel", false));
        long retries = Util.toLong(config.getOrDefault(
                "retries", 0)); // todo sleep/delay or push to end of batch to try again or immediate ?
        int failedParams = Util.toInteger(config.getOrDefault("failedParams", -1));

        final Map metaData;
        if (tx instanceof InternalTransaction iTx) {
            metaData = iTx.kernelTransaction().getMetaData();
        } else {
            metaData = Map.of();
        }

        BatchMode batchMode = BatchMode.fromConfig(config);
        Map params = (Map) config.getOrDefault("params", Collections.emptyMap());

        try (Result result = tx.execute(slottedRuntime(cypherIterate), params)) {
            Pair prepared =
                    PeriodicUtils.prepareInnerStatement(cypherAction, batchMode, result.columns(), "_batch");
            String innerStatement = applyPlanner(prepared.getLeft(), Planner.valueOf((String)
                    config.getOrDefault("planner", Planner.DEFAULT.name())));
            boolean iterateList = prepared.getRight();
            String periodicId = UUID.randomUUID().toString();
            if (log.isDebugEnabled()) {
                log.debug(
                        "Starting periodic iterate from `%s` operation using iteration `%s` in separate thread with id: `%s`",
                        cypherIterate, cypherAction, periodicId);
            }
            return PeriodicUtils.iterateAndExecuteBatchedInSeparateThread(
                    db,
                    terminationGuard,
                    log,
                    pools,
                    (int) batchSize,
                    parallel,
                    iterateList,
                    retries,
                    result,
                    (tx, p) -> {
                        if (tx instanceof InternalTransaction iTx) {
                            iTx.setMetaData(metaData);
                        }
                        final Result r = tx.execute(innerStatement, merge(params, p));
                        Iterators.count(r); // XXX: consume all results
                        return r.getQueryStatistics();
                    },
                    concurrency,
                    failedParams,
                    periodicId);
        }
    }

    static String slottedRuntime(String cypherIterate) {
        if (RUNTIME_PATTERN.matcher(cypherIterate).find()) {
            return cypherIterate;
        }

        return prependQueryOption(cypherIterate, CYPHER_RUNTIME_SLOTTED);
    }

    public static String applyPlanner(String query, Planner planner) {
        if (planner.equals(Planner.DEFAULT)) {
            return query;
        }
        Matcher matcher = PLANNER_PATTERN.matcher(query);
        String cypherPlanner = String.format(" planner=%s ", planner.name().toLowerCase());
        if (matcher.find()) {
            return matcher.replaceFirst(cypherPlanner);
        }
        return prependQueryOption(query, cypherPlanner);
    }

    private static String prependQueryOption(String query, String cypherOption) {
        String cypherPrefix = "cypher";
        String completePrefix = cypherPrefix + cypherOption;
        return CYPHER_PREFIX_PATTERN.matcher(query).find()
                ? query.replaceFirst("(?i)" + cypherPrefix, completePrefix)
                : completePrefix + query;
    }

    private class Countdown implements Runnable {
        private final String name;
        private final String statement;
        private final long delay;
        private final transient Log log;

        public Countdown(String name, String statement, long delay, Log log) {
            this.name = name;
            this.statement = statement;
            this.delay = delay;
            this.log = log;
        }

        @Override
        public void run() {
            if (Periodic.this.executeNumericResultStatement(statement, Collections.emptyMap()) > 0) {
                pools.getScheduledExecutorService()
                        .schedule(() -> submitJob(name, this, log, pools), delay, TimeUnit.SECONDS);
            }
        }
    }
}




© 2015 - 2025 Weber Informatics LLC | Privacy Policy