org.apache.flink.runtime.state.SharedStateRegistry Maven / Gradle / Ivy
/*
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.flink.runtime.state;
import org.apache.flink.runtime.concurrent.Executors;
import org.apache.flink.util.Preconditions;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
import java.util.HashMap;
import java.util.Map;
import java.util.Objects;
import java.util.concurrent.Executor;
import java.util.concurrent.RejectedExecutionException;
/**
* This registry manages state that is shared across (incremental) checkpoints, and is responsible
* for deleting shared state that is no longer used in any valid checkpoint.
*
* A {@code SharedStateRegistry} will be deployed in the {@link
* org.apache.flink.runtime.checkpoint.CheckpointCoordinator} to maintain the reference count of
* {@link StreamStateHandle}s by a key that (logically) identifies them.
*/
public class SharedStateRegistry implements AutoCloseable {
private static final Logger LOG = LoggerFactory.getLogger(SharedStateRegistry.class);
/** A singleton object for the default implementation of a {@link SharedStateRegistryFactory} */
public static final SharedStateRegistryFactory DEFAULT_FACTORY = SharedStateRegistry::new;
/** All registered state objects by an artificial key */
private final Map
registeredStates;
/** This flag indicates whether or not the registry is open or if close() was called */
private boolean open;
/** Executor for async state deletion */
private final Executor asyncDisposalExecutor;
/** Default uses direct executor to delete unreferenced state */
public SharedStateRegistry() {
this(Executors.directExecutor());
}
public SharedStateRegistry(Executor asyncDisposalExecutor) {
this.registeredStates = new HashMap<>();
this.asyncDisposalExecutor = Preconditions.checkNotNull(asyncDisposalExecutor);
this.open = true;
}
/**
* Register a reference to the given shared state in the registry. This does the following: We
* check if the state handle is actually new by the registrationKey. If it is new, we register
* it with a reference count of 1. If there is already a state handle registered under the given
* key, we dispose the given "new" state handle, uptick the reference count of the previously
* existing state handle and return it as a replacement with the result.
*
* IMPORTANT: caller should check the state handle returned by the result, because the
* registry is performing de-duplication and could potentially return a handle that is supposed
* to replace the one from the registration request.
*
* @param state the shared state for which we register a reference.
* @return the result of this registration request, consisting of the state handle that is
* registered under the key by the end of the operation and its current reference count.
*/
public Result registerReference(
SharedStateRegistryKey registrationKey, StreamStateHandle state) {
Preconditions.checkNotNull(state);
StreamStateHandle scheduledStateDeletion = null;
SharedStateRegistry.SharedStateEntry entry;
synchronized (registeredStates) {
Preconditions.checkState(
open, "Attempt to register state to closed SharedStateRegistry.");
entry = registeredStates.get(registrationKey);
if (entry == null) {
// Additional check that should never fail, because only state handles that are not
// placeholders should
// ever be inserted to the registry.
Preconditions.checkState(
!isPlaceholder(state),
"Attempt to reference unknown state: " + registrationKey);
entry = new SharedStateRegistry.SharedStateEntry(state);
registeredStates.put(registrationKey, entry);
} else {
// delete if this is a real duplicate
if (!Objects.equals(state, entry.stateHandle)) {
scheduledStateDeletion = state;
LOG.trace(
"Identified duplicate state registration under key {}. New state {} was determined to "
+ "be an unnecessary copy of existing state {} and will be dropped.",
registrationKey,
state,
entry.stateHandle);
}
entry.increaseReferenceCount();
}
}
scheduleAsyncDelete(scheduledStateDeletion);
LOG.trace("Registered shared state {} under key {}.", entry, registrationKey);
return new Result(entry);
}
/**
* Releases one reference to the given shared state in the registry. This decreases the
* reference count by one. Once the count reaches zero, the shared state is deleted.
*
* @param registrationKey the shared state for which we release a reference.
* @return the result of the request, consisting of the reference count after this operation and
* the state handle, or null if the state handle was deleted through this request. Returns
* null if the registry was previously closed.
*/
public Result unregisterReference(SharedStateRegistryKey registrationKey) {
Preconditions.checkNotNull(registrationKey);
final Result result;
final StreamStateHandle scheduledStateDeletion;
SharedStateRegistry.SharedStateEntry entry;
synchronized (registeredStates) {
entry = registeredStates.get(registrationKey);
Preconditions.checkState(
entry != null,
"Cannot unregister a state that is not registered: %s",
registrationKey);
entry.decreaseReferenceCount();
// Remove the state from the registry when it's not referenced any more.
if (entry.getReferenceCount() <= 0) {
registeredStates.remove(registrationKey);
scheduledStateDeletion = entry.getStateHandle();
result = new Result(null, 0);
} else {
scheduledStateDeletion = null;
result = new Result(entry);
}
}
LOG.trace("Unregistered shared state {} under key {}.", entry, registrationKey);
scheduleAsyncDelete(scheduledStateDeletion);
return result;
}
/**
* Register given shared states in the registry.
*
* @param stateHandles The shared states to register.
*/
public void registerAll(Iterable extends CompositeStateHandle> stateHandles) {
if (stateHandles == null) {
return;
}
synchronized (registeredStates) {
for (CompositeStateHandle stateHandle : stateHandles) {
stateHandle.registerSharedStates(this);
}
}
}
@Override
public String toString() {
synchronized (registeredStates) {
return "SharedStateRegistry{" + "registeredStates=" + registeredStates + '}';
}
}
private void scheduleAsyncDelete(StreamStateHandle streamStateHandle) {
// We do the small optimization to not issue discards for placeholders, which are NOPs.
if (streamStateHandle != null && !isPlaceholder(streamStateHandle)) {
LOG.trace("Scheduled delete of state handle {}.", streamStateHandle);
AsyncDisposalRunnable asyncDisposalRunnable =
new AsyncDisposalRunnable(streamStateHandle);
try {
asyncDisposalExecutor.execute(asyncDisposalRunnable);
} catch (RejectedExecutionException ex) {
// TODO This is a temporary fix for a problem during
// ZooKeeperCompletedCheckpointStore#shutdown:
// Disposal is issued in another async thread and the shutdown proceeds to close the
// I/O Executor pool.
// This leads to RejectedExecutionException once the async deletes are triggered by
// ZK. We need to
// wait for all pending ZK deletes before closing the I/O Executor pool. We can
// simply call #run()
// because we are already in the async ZK thread that disposes the handles.
asyncDisposalRunnable.run();
}
}
}
private boolean isPlaceholder(StreamStateHandle stateHandle) {
return stateHandle instanceof PlaceholderStreamStateHandle;
}
@Override
public void close() {
synchronized (registeredStates) {
open = false;
}
}
/** An entry in the registry, tracking the handle and the corresponding reference count. */
private static class SharedStateEntry {
/** The shared state handle */
private final StreamStateHandle stateHandle;
/** The current reference count of the state handle */
private int referenceCount;
SharedStateEntry(StreamStateHandle value) {
this.stateHandle = value;
this.referenceCount = 1;
}
StreamStateHandle getStateHandle() {
return stateHandle;
}
int getReferenceCount() {
return referenceCount;
}
void increaseReferenceCount() {
++referenceCount;
}
void decreaseReferenceCount() {
--referenceCount;
}
@Override
public String toString() {
return "SharedStateEntry{"
+ "stateHandle="
+ stateHandle
+ ", referenceCount="
+ referenceCount
+ '}';
}
}
/** The result of an attempt to (un)/reference state */
public static class Result {
/** The (un)registered state handle from the request */
private final StreamStateHandle reference;
/** The reference count to the state handle after the request to (un)register */
private final int referenceCount;
private Result(SharedStateEntry sharedStateEntry) {
this.reference = sharedStateEntry.getStateHandle();
this.referenceCount = sharedStateEntry.getReferenceCount();
}
public Result(StreamStateHandle reference, int referenceCount) {
Preconditions.checkArgument(referenceCount >= 0);
this.reference = reference;
this.referenceCount = referenceCount;
}
public StreamStateHandle getReference() {
return reference;
}
public int getReferenceCount() {
return referenceCount;
}
@Override
public String toString() {
return "Result{"
+ "reference="
+ reference
+ ", referenceCount="
+ referenceCount
+ '}';
}
}
/** Encapsulates the operation the delete state handles asynchronously. */
private static final class AsyncDisposalRunnable implements Runnable {
private final StateObject toDispose;
public AsyncDisposalRunnable(StateObject toDispose) {
this.toDispose = Preconditions.checkNotNull(toDispose);
}
@Override
public void run() {
try {
toDispose.discardState();
} catch (Exception e) {
LOG.warn(
"A problem occurred during asynchronous disposal of a shared state object: {}",
toDispose,
e);
}
}
}
}