org.neo4j.kernel.impl.scheduler.ScheduledJobHandle Maven / Gradle / Ivy
/*
* Copyright (c) "Neo4j"
* Neo4j Sweden AB [https://neo4j.com]
*
* This file is part of Neo4j.
*
* Neo4j is free software: you can redistribute it and/or modify
* it under the terms of the GNU General Public License as published by
* the Free Software Foundation, either version 3 of the License, or
* (at your option) any later version.
*
* This program is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU General Public License for more details.
*
* You should have received a copy of the GNU General Public License
* along with this program. If not, see <http://www.gnu.org/licenses/>.
*/
package org.neo4j.kernel.impl.scheduler;
import java.time.Duration;
import java.time.Instant;
import java.util.Set;
import java.util.concurrent.CancellationException;
import java.util.concurrent.CopyOnWriteArrayList;
import java.util.concurrent.ExecutionException;
import java.util.concurrent.TimeUnit;
import java.util.concurrent.atomic.AtomicInteger;
import org.neo4j.internal.helpers.Exceptions;
import org.neo4j.logging.InternalLog;
import org.neo4j.scheduler.CancelListener;
import org.neo4j.scheduler.FailedJobRun;
import org.neo4j.scheduler.Group;
import org.neo4j.scheduler.JobHandle;
import org.neo4j.scheduler.JobMonitoringParams;
import org.neo4j.scheduler.JobType;
import org.neo4j.scheduler.MonitoredJobInfo;
import org.neo4j.time.SystemNanoClock;
import org.neo4j.util.concurrent.BinaryLatch;
/**
* The JobHandle implementation for jobs scheduled with the {@link TimeBasedTaskScheduler}.
*
* As the handle gets scheduled, it transitions through various states:
*
* - The handle is initially in the RUNNABLE state, which means that it is ready to be executed but isn't
* scheduled to do so yet.
* - When it gets scheduled, it transitions into the SUBMITTED state after which it transitions to EXECUTING state,
* when it starts being executed by a thread
* - A handle that is in the SUBMITTED or EXECUTING state cannot be submitted again, even if it comes due.
* - A handle that is both due and in SUBMITTED or EXECUTING state is overdue, and its execution will be delayed until it
* changes out of the SUBMITTED state.
* - If a scheduled handle successfully finishes its execution, it will transition back to the RUNNABLE state.
* - If an exception is thrown during the execution, then the handle transitions to the FAILED state in case task is not recurring,
* otherwise its rescheduled for next execution.
*
*/
final class ScheduledJobHandle implements JobHandle {
// We extend AtomicInteger to inline our state field.
// These are the possible state values:
private static final int RUNNABLE = 0;
private static final int SUBMITTED = 1;
private static final int EXECUTING = 2;
private static final int FAILED = 3;
// Access is synchronized via the PriorityBlockingQueue in TimeBasedTaskScheduler:
// - Write to this field happens before the handle is added to the queue.
// - Reads of this field happens after the handle has been read from the queue.
// - Reads of this field for the purpose of ordering the queue are either thread local,
// or happens after the relevant handles have been added to the queue.
long nextDeadlineNanos;
private final AtomicInteger state;
private final TimeBasedTaskScheduler scheduler;
private final Group group;
private final CopyOnWriteArrayList cancelListeners;
private final BinaryLatch handleRelease;
private final Runnable task;
private final JobMonitoringParams jobMonitoringParams;
private final long submittedMillis;
private final InternalLog log;
private final long reschedulingDelayNanos;
private final Set> monitoredJobs;
private final FailedJobRunsStore failedJobRunsStore;
private final long jobId;
private volatile JobHandle> latestHandle;
private volatile Throwable lastException;
ScheduledJobHandle(
TimeBasedTaskScheduler scheduler,
Group group,
Runnable task,
long nextDeadlineNanos,
long reschedulingDelayNanos,
JobMonitoringParams jobMonitoringParams,
long submittedMillis,
Set> monitoredJobs,
FailedJobRunsStore failedJobRunsStore,
SystemNanoClock clock,
long jobId,
InternalLog log) {
this.jobMonitoringParams = jobMonitoringParams;
this.submittedMillis = submittedMillis;
this.log = log;
this.state = new AtomicInteger();
this.scheduler = scheduler;
this.group = group;
this.nextDeadlineNanos = nextDeadlineNanos;
this.reschedulingDelayNanos = reschedulingDelayNanos;
this.monitoredJobs = monitoredJobs;
this.failedJobRunsStore = failedJobRunsStore;
this.jobId = jobId;
handleRelease = new BinaryLatch();
cancelListeners = new CopyOnWriteArrayList<>();
boolean isRecurring = reschedulingDelayNanos > 0;
this.task = () -> {
Instant executionStart = clock.instant();
try {
if (state.compareAndSet(SUBMITTED, EXECUTING)) {
task.run();
}
lastException = null;
} catch (Throwable e) {
lastException = e;
if (!isRecurring) {
state.set(FAILED);
}
recordFailedRun(executionStart, clock.instant(), e);
} finally {
// Use compareAndSet to avoid overriding any cancellation state.
if (state.compareAndSet(EXECUTING, RUNNABLE) && isRecurring) {
// We only reschedule if the rescheduling delay is greater than zero.
// A rescheduling delay of zero means this is a delayed task.
// If the rescheduling delay is greater than zero, then this is a recurring task.
this.nextDeadlineNanos += reschedulingDelayNanos;
scheduler.enqueueTask(this);
} else {
monitoredJobs.remove(this);
}
}
};
}
void submitIfRunnable(ThreadPoolManager pools) {
if (state.compareAndSet(RUNNABLE, SUBMITTED)) {
latestHandle = pools.getThreadPool(group).submit(JobMonitoringParams.NOT_MONITORED, task);
handleRelease.release();
}
}
@Override
public void cancel() {
monitoredJobs.remove(this);
state.set(FAILED);
var handle = latestHandle;
if (handle != null) {
handle.cancel();
}
for (CancelListener cancelListener : cancelListeners) {
cancelListener.cancelled();
}
scheduler.cancelTask(this);
// Release the handle to allow waitTermination() to observe the cancellation.
handleRelease.release();
}
@Override
public void waitTermination() throws ExecutionException, InterruptedException {
handleRelease.await();
RuntimeException runtimeException = null;
try {
var handleDelegate = this.latestHandle;
if (handleDelegate != null) {
handleDelegate.waitTermination();
}
} catch (RuntimeException t) {
runtimeException = t;
}
if (state.get() == FAILED) {
Throwable exception = this.lastException;
if (exception != null) {
var executionException = new ExecutionException(exception);
if (runtimeException != null) {
executionException.addSuppressed(runtimeException);
}
throw executionException;
} else {
throw Exceptions.chain(new CancellationException(), runtimeException);
}
}
}
@Override
public void waitTermination(long timeout, TimeUnit unit) {
throw new UnsupportedOperationException("Not supported for repeating tasks.");
}
@Override
public T get() {
throw new UnsupportedOperationException("Not supported for repeating tasks.");
}
@Override
public void registerCancelListener(CancelListener listener) {
cancelListeners.add(listener);
}
MonitoredJobInfo getMonitoringInfo() {
if (JobMonitoringParams.NOT_MONITORED == jobMonitoringParams) {
return null;
}
return new MonitoredJobInfo(
jobId,
group,
Instant.ofEpochMilli(submittedMillis),
jobMonitoringParams.getSubmitter(),
jobMonitoringParams.getTargetDatabaseName(),
jobMonitoringParams.getDescription(),
Instant.ofEpochMilli(TimeUnit.NANOSECONDS.toMillis(nextDeadlineNanos)),
reschedulingDelayNanos == 0 ? null : Duration.ofNanos(reschedulingDelayNanos),
getStatus(),
getJobType(),
jobMonitoringParams.getCurrentStateDescription());
}
private MonitoredJobInfo.State getStatus() {
var state = this.state.get();
return switch (state) {
case RUNNABLE, SUBMITTED -> MonitoredJobInfo.State.SCHEDULED;
// A job can be in failed state only for a glimpse between being marked
// as failed and being removed from monitored jobs immediately after that.
// Let's show such job as still executing as there is no point confusing
// users with this esoteric state.
case EXECUTING, FAILED -> MonitoredJobInfo.State.EXECUTING;
default -> throw new IllegalStateException("Unexpected job state: " + state);
};
}
private void recordFailedRun(Instant executionStart, Instant failureTime, Throwable t) {
log.error(
"Unhandled exception in job " + jobId + " from group " + group + " with params " + jobMonitoringParams,
t);
if (jobMonitoringParams == JobMonitoringParams.NOT_MONITORED) {
return;
}
FailedJobRun failedJobRun = new FailedJobRun(
jobId,
group,
jobMonitoringParams.getSubmitter(),
jobMonitoringParams.getTargetDatabaseName(),
jobMonitoringParams.getDescription(),
getJobType(),
Instant.ofEpochMilli(submittedMillis),
executionStart,
failureTime,
t);
failedJobRunsStore.add(failedJobRun);
}
private JobType getJobType() {
return reschedulingDelayNanos > 0 ? JobType.PERIODIC : JobType.DELAYED;
}
}
© 2015 - 2025 Weber Informatics LLC | Privacy Policy