org.apache.flink.runtime.instance.SlotSharingGroupAssignment Maven / Gradle / Ivy
/*
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.flink.runtime.instance;
import java.util.ArrayList;
import java.util.Collections;
import java.util.HashSet;
import java.util.Iterator;
import java.util.LinkedHashMap;
import java.util.LinkedHashSet;
import java.util.List;
import java.util.Map;
import java.util.Set;
import org.apache.flink.api.java.tuple.Tuple2;
import org.apache.flink.runtime.clusterframework.types.ResourceID;
import org.apache.flink.runtime.jobmanager.scheduler.CoLocationConstraint;
import org.apache.flink.runtime.jobmanager.scheduler.Locality;
import org.apache.flink.runtime.taskmanager.TaskManagerLocation;
import org.apache.flink.util.AbstractID;
import org.apache.flink.runtime.executiongraph.ExecutionVertex;
import org.apache.flink.runtime.jobgraph.JobVertexID;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
/**
* The SlotSharingGroupAssignment manages a set of shared slots, which are shared between
* tasks of a {@link org.apache.flink.runtime.jobmanager.scheduler.SlotSharingGroup}.
*
* The assignments shares tasks by allowing a shared slot to hold one vertex per
* JobVertexID. For example, consider a program consisting of job vertices "source", "map",
* "reduce", and "sink". If the slot sharing group spans all four job vertices, then
* each shared slot can hold one parallel subtask of the source, the map, the reduce, and the
* sink vertex. Each shared slot holds the actual subtasks in child slots, which are (at the leaf level),
* the {@link SimpleSlot}s.
*
* An exception are the co-location-constraints, that define that the i-th subtask of one
* vertex needs to be scheduled strictly together with the i-th subtasks of of the vertices
* that share the co-location-constraint. To manage that, a co-location-constraint gets its
* own shared slot inside the shared slots of a sharing group.
*
* Consider a job set up like this:
*
* {@code
* +-------------- Slot Sharing Group --------------+
* | |
* | +-- Co Location Group --+ |
* | | | |
* | (source) ---> (head) ---> (tail) ---> (sink) |
* | | | |
* | +-----------------------+ |
* +------------------------------------------------+
* }
*
* The slot hierarchy in the slot sharing group will look like the following
*
*
* Shared(0)(root)
* |
* +-- Simple(2)(sink)
* |
* +-- Shared(1)(co-location-group)
* | |
* | +-- Simple(0)(tail)
* | +-- Simple(1)(head)
* |
* +-- Simple(0)(source)
*
*/
public class SlotSharingGroupAssignment {
private final static Logger LOG = LoggerFactory.getLogger(SlotSharingGroupAssignment.class);
/** The lock globally guards against concurrent modifications in the data structures */
private final Object lock = new Object();
/** All slots currently allocated to this sharing group */
private final Set allSlots = new LinkedHashSet();
/** The slots available per vertex type (JobVertexId), keyed by TaskManager, to make them locatable */
private final Map>> availableSlotsPerJid = new LinkedHashMap<>();
// --------------------------------------------------------------------------------------------
// Accounting
// --------------------------------------------------------------------------------------------
/**
* Gets the number of slots that are currently governed by this assignment group.
* This refers to the slots allocated from an {@link org.apache.flink.runtime.instance.Instance},
* and not the sub-slots given out as children of those shared slots.
*
* @return The number of resource slots managed by this assignment group.
*/
public int getNumberOfSlots() {
return allSlots.size();
}
/**
* Gets the number of shared slots into which the given group can place subtasks or
* nested task groups.
*
* @param groupId The ID of the group.
* @return The number of shared slots available to the given job vertex.
*/
public int getNumberOfAvailableSlotsForGroup(AbstractID groupId) {
synchronized (lock) {
Map> available = availableSlotsPerJid.get(groupId);
if (available != null) {
Set set = new HashSet();
for (List list : available.values()) {
for (SharedSlot slot : list) {
set.add(slot);
}
}
return set.size();
}
else {
// if no entry exists for a JobVertexID so far, then the vertex with that ID can
// add a subtask into each shared slot of this group. Consequently, all
// of them are available for that JobVertexID.
return allSlots.size();
}
}
}
// ------------------------------------------------------------------------
// Slot allocation
// ------------------------------------------------------------------------
public SimpleSlot addSharedSlotAndAllocateSubSlot(SharedSlot sharedSlot, Locality locality, JobVertexID groupId) {
return addSharedSlotAndAllocateSubSlot(sharedSlot, locality, groupId, null);
}
public SimpleSlot addSharedSlotAndAllocateSubSlot(
SharedSlot sharedSlot, Locality locality, CoLocationConstraint constraint)
{
return addSharedSlotAndAllocateSubSlot(sharedSlot, locality, null, constraint);
}
private SimpleSlot addSharedSlotAndAllocateSubSlot(
SharedSlot sharedSlot, Locality locality, JobVertexID groupId, CoLocationConstraint constraint) {
// sanity checks
if (!sharedSlot.isRootAndEmpty()) {
throw new IllegalArgumentException("The given slot is not an empty root slot.");
}
final ResourceID location = sharedSlot.getTaskManagerID();
synchronized (lock) {
// early out in case that the slot died (instance disappeared)
if (!sharedSlot.isAlive()) {
return null;
}
// add to the total bookkeeping
if (!allSlots.add(sharedSlot)) {
throw new IllegalArgumentException("Slot was already contained in the assignment group");
}
SimpleSlot subSlot;
AbstractID groupIdForMap;
if (constraint == null) {
// allocate us a sub slot to return
subSlot = sharedSlot.allocateSubSlot(groupId);
groupIdForMap = groupId;
}
else {
// sanity check
if (constraint.isAssignedAndAlive()) {
throw new IllegalStateException(
"Trying to add a shared slot to a co-location constraint that has a life slot.");
}
// we need a co-location slot --> a SimpleSlot nested in a SharedSlot to
// host other co-located tasks
SharedSlot constraintGroupSlot = sharedSlot.allocateSharedSlot(constraint.getGroupId());
groupIdForMap = constraint.getGroupId();
if (constraintGroupSlot != null) {
// the sub-slots in the co-location constraint slot have no own group IDs
subSlot = constraintGroupSlot.allocateSubSlot(null);
if (subSlot != null) {
// all went well, we can give the constraint its slot
constraint.setSharedSlot(constraintGroupSlot);
// NOTE: Do not lock the location constraint, because we don't yet know whether we will
// take the slot here
}
else {
// if we could not create a sub slot, release the co-location slot
// note that this does implicitly release the slot we have just added
// as well, because we release its last child slot. That is expected
// and desired.
constraintGroupSlot.releaseSlot();
}
}
else {
// this should not happen, as we are under the lock that also
// guards slot disposals. Keep the check to be on the safe side
subSlot = null;
}
}
if (subSlot != null) {
// preserve the locality information
subSlot.setLocality(locality);
// let the other groups know that this slot exists and that they
// can place a task into this slot.
boolean entryForNewJidExists = false;
for (Map.Entry>> entry : availableSlotsPerJid.entrySet()) {
// there is already an entry for this groupID
if (entry.getKey().equals(groupIdForMap)) {
entryForNewJidExists = true;
continue;
}
Map> available = entry.getValue();
putIntoMultiMap(available, location, sharedSlot);
}
// make sure an empty entry exists for this group, if no other entry exists
if (!entryForNewJidExists) {
availableSlotsPerJid.put(groupIdForMap, new LinkedHashMap>());
}
return subSlot;
}
else {
// if sharedSlot is releases, abort.
// This should be a rare case, since this method is called with a fresh slot.
return null;
}
}
// end synchronized (lock)
}
/**
* Gets a slot suitable for the given task vertex. This method will prefer slots that are local
* (with respect to {@link ExecutionVertex#getPreferredLocationsBasedOnInputs()}), but will return non local
* slots if no local slot is available. The method returns null, when this sharing group has
* no slot is available for the given JobVertexID.
*
* @param vertex The vertex to allocate a slot for.
*
* @return A slot to execute the given ExecutionVertex in, or null, if none is available.
*/
public SimpleSlot getSlotForTask(ExecutionVertex vertex) {
return getSlotForTask(vertex.getJobvertexId(), vertex.getPreferredLocationsBasedOnInputs());
}
/**
*
*/
SimpleSlot getSlotForTask(JobVertexID vertexID, Iterable locationPreferences) {
synchronized (lock) {
Tuple2 p = getSlotForTaskInternal(vertexID, locationPreferences, false);
if (p != null) {
SharedSlot ss = p.f0;
SimpleSlot slot = ss.allocateSubSlot(vertexID);
slot.setLocality(p.f1);
return slot;
}
else {
return null;
}
}
}
/**
* Gets a slot for a task that has a co-location constraint. This method tries to grab
* a slot form the location-constraint's shared slot. If that slot has not been initialized,
* then the method tries to grab another slot that is available for the location-constraint-group.
*
* In cases where the co-location constraint has not yet been initialized with a slot,
* or where that slot has been disposed in the meantime, this method tries to allocate a shared
* slot for the co-location constraint (inside on of the other available slots).
*
* If a suitable shared slot is available, this method allocates a simple slot within that
* shared slot and returns it. If no suitable shared slot could be found, this method
* returns null.
*
* @param vertex The execution vertex to find a slot for.
* @param constraint The co-location constraint for the placement of the execution vertex.
*
* @return A simple slot allocate within a suitable shared slot, or {@code null}, if no suitable
* shared slot is available.
*/
public SimpleSlot getSlotForTask(ExecutionVertex vertex, CoLocationConstraint constraint) {
return getSlotForTask(constraint, vertex.getPreferredLocationsBasedOnInputs());
}
SimpleSlot getSlotForTask(CoLocationConstraint constraint, Iterable locationPreferences) {
synchronized (lock) {
if (constraint.isAssignedAndAlive()) {
// the shared slot of the co-location group is initialized and set we allocate a sub-slot
final SharedSlot shared = constraint.getSharedSlot();
SimpleSlot subslot = shared.allocateSubSlot(null);
subslot.setLocality(Locality.LOCAL);
return subslot;
}
else if (constraint.isAssigned()) {
// we had an assignment before.
SharedSlot previous = constraint.getSharedSlot();
if (previous == null) {
throw new IllegalStateException("Bug: Found assigned co-location constraint without a slot.");
}
TaskManagerLocation location = previous.getTaskManagerLocation();
Tuple2 p = getSlotForTaskInternal(
constraint.getGroupId(), Collections.singleton(location), true);
if (p == null) {
return null;
}
else {
SharedSlot newSharedSlot = p.f0;
// allocate the co-location group slot inside the shared slot
SharedSlot constraintGroupSlot = newSharedSlot.allocateSharedSlot(constraint.getGroupId());
if (constraintGroupSlot != null) {
constraint.setSharedSlot(constraintGroupSlot);
// the sub slots in the co location constraint slot have no group that they belong to
// (other than the co-location-constraint slot)
SimpleSlot subSlot = constraintGroupSlot.allocateSubSlot(null);
subSlot.setLocality(Locality.LOCAL);
return subSlot;
}
else {
// could not allocate the co-location-constraint shared slot
return null;
}
}
}
else {
// the location constraint has not been associated with a shared slot, yet.
// grab a new slot and initialize the constraint with that one.
// preferred locations are defined by the vertex
Tuple2 p =
getSlotForTaskInternal(constraint.getGroupId(), locationPreferences, false);
if (p == null) {
// could not get a shared slot for this co-location-group
return null;
}
else {
final SharedSlot availableShared = p.f0;
final Locality l = p.f1;
// allocate the co-location group slot inside the shared slot
SharedSlot constraintGroupSlot = availableShared.allocateSharedSlot(constraint.getGroupId());
// IMPORTANT: We do not lock the location, yet, since we cannot be sure that the
// caller really sticks with the slot we picked!
constraint.setSharedSlot(constraintGroupSlot);
// the sub slots in the co location constraint slot have no group that they belong to
// (other than the co-location-constraint slot)
SimpleSlot sub = constraintGroupSlot.allocateSubSlot(null);
sub.setLocality(l);
return sub;
}
}
}
}
private Tuple2 getSlotForTaskInternal(
AbstractID groupId, Iterable preferredLocations, boolean localOnly)
{
// check if there is anything at all in this group assignment
if (allSlots.isEmpty()) {
return null;
}
// get the available slots for the group
Map> slotsForGroup = availableSlotsPerJid.get(groupId);
if (slotsForGroup == null) {
// we have a new group, so all slots are available
slotsForGroup = new LinkedHashMap<>();
availableSlotsPerJid.put(groupId, slotsForGroup);
for (SharedSlot availableSlot : allSlots) {
putIntoMultiMap(slotsForGroup, availableSlot.getTaskManagerID(), availableSlot);
}
}
else if (slotsForGroup.isEmpty()) {
// the group exists, but nothing is available for that group
return null;
}
// check whether we can schedule the task to a preferred location
boolean didNotGetPreferred = false;
if (preferredLocations != null) {
for (TaskManagerLocation location : preferredLocations) {
// set the flag that we failed a preferred location. If one will be found,
// we return early anyways and skip the flag evaluation
didNotGetPreferred = true;
SharedSlot slot = removeFromMultiMap(slotsForGroup, location.getResourceID());
if (slot != null && slot.isAlive()) {
return new Tuple2<>(slot, Locality.LOCAL);
}
}
}
// if we want only local assignments, exit now with a "not found" result
if (didNotGetPreferred && localOnly) {
return null;
}
Locality locality = didNotGetPreferred ? Locality.NON_LOCAL : Locality.UNCONSTRAINED;
// schedule the task to any available location
SharedSlot slot;
while ((slot = pollFromMultiMap(slotsForGroup)) != null) {
if (slot.isAlive()) {
return new Tuple2<>(slot, locality);
}
}
// nothing available after all, all slots were dead
return null;
}
// ------------------------------------------------------------------------
// Slot releasing
// ------------------------------------------------------------------------
/**
* Releases the simple slot from the assignment group.
*
* @param simpleSlot The SimpleSlot to be released
*/
void releaseSimpleSlot(SimpleSlot simpleSlot) {
synchronized (lock) {
// try to transition to the CANCELED state. That state marks
// that the releasing is in progress
if (simpleSlot.markCancelled()) {
// sanity checks
if (simpleSlot.isAlive()) {
throw new IllegalStateException("slot is still alive");
}
// check whether the slot is already released
if (simpleSlot.markReleased()) {
LOG.debug("Release simple slot {}.", simpleSlot);
AbstractID groupID = simpleSlot.getGroupID();
SharedSlot parent = simpleSlot.getParent();
// if we have a group ID, then our parent slot is tracked here
if (groupID != null && !allSlots.contains(parent)) {
throw new IllegalArgumentException("Slot was not associated with this SlotSharingGroup before.");
}
int parentRemaining = parent.removeDisposedChildSlot(simpleSlot);
if (parentRemaining > 0) {
// the parent shared slot is still alive. make sure we make it
// available again to the group of the just released slot
if (groupID != null) {
// if we have a group ID, then our parent becomes available
// for that group again. otherwise, the slot is part of a
// co-location group and nothing becomes immediately available
Map> slotsForJid = availableSlotsPerJid.get(groupID);
// sanity check
if (slotsForJid == null) {
throw new IllegalStateException("Trying to return a slot for group " + groupID +
" when available slots indicated that all slots were available.");
}
putIntoMultiMap(slotsForJid, parent.getTaskManagerID(), parent);
}
} else {
// the parent shared slot is now empty and can be released
parent.markCancelled();
internalDisposeEmptySharedSlot(parent);
}
}
}
}
}
/**
* Called from {@link org.apache.flink.runtime.instance.SharedSlot#releaseSlot()}.
*
* @param sharedSlot The slot to be released.
*/
void releaseSharedSlot(SharedSlot sharedSlot) {
synchronized (lock) {
if (sharedSlot.markCancelled()) {
// we are releasing this slot
if (sharedSlot.hasChildren()) {
// by simply releasing all children, we should eventually release this slot.
Set children = sharedSlot.getSubSlots();
while (children.size() > 0) {
children.iterator().next().releaseSlot();
}
}
else {
// if there are no children that trigger the release, we trigger it directly
internalDisposeEmptySharedSlot(sharedSlot);
}
}
}
}
/**
*
* NOTE: This method must be called from within a scope that holds the lock.
*/
private void internalDisposeEmptySharedSlot(SharedSlot sharedSlot) {
// sanity check
if (sharedSlot.isAlive() | !sharedSlot.getSubSlots().isEmpty()) {
throw new IllegalArgumentException();
}
final SharedSlot parent = sharedSlot.getParent();
final AbstractID groupID = sharedSlot.getGroupID();
// 1) If we do not have a parent, we are a root slot.
// 2) If we are not a root slot, we are a slot with a groupID and our parent
// becomes available for that group
if (parent == null) {
// root slot, return to the instance.
sharedSlot.getOwner().returnAllocatedSlot(sharedSlot);
// also, make sure we remove this slot from everywhere
allSlots.remove(sharedSlot);
removeSlotFromAllEntries(availableSlotsPerJid, sharedSlot);
}
else if (groupID != null) {
// we remove ourselves from our parent slot
if (sharedSlot.markReleased()) {
LOG.debug("Internally dispose empty shared slot {}.", sharedSlot);
int parentRemaining = parent.removeDisposedChildSlot(sharedSlot);
if (parentRemaining > 0) {
// the parent becomes available for the group again
Map> slotsForGroup = availableSlotsPerJid.get(groupID);
// sanity check
if (slotsForGroup == null) {
throw new IllegalStateException("Trying to return a slot for group " + groupID +
" when available slots indicated that all slots were available.");
}
putIntoMultiMap(slotsForGroup, parent.getTaskManagerID(), parent);
}
else {
// this was the last child of the parent. release the parent.
parent.markCancelled();
internalDisposeEmptySharedSlot(parent);
}
}
}
else {
throw new IllegalStateException(
"Found a shared slot that is neither a root slot, nor associated with a vertex group.");
}
}
// ------------------------------------------------------------------------
// Utilities
// ------------------------------------------------------------------------
private static void putIntoMultiMap(Map> map, ResourceID location, SharedSlot slot) {
List slotsForInstance = map.get(location);
if (slotsForInstance == null) {
slotsForInstance = new ArrayList();
map.put(location, slotsForInstance);
}
slotsForInstance.add(slot);
}
private static SharedSlot removeFromMultiMap(Map> map, ResourceID location) {
List slotsForLocation = map.get(location);
if (slotsForLocation == null) {
return null;
}
else {
SharedSlot slot = slotsForLocation.remove(slotsForLocation.size() - 1);
if (slotsForLocation.isEmpty()) {
map.remove(location);
}
return slot;
}
}
private static SharedSlot pollFromMultiMap(Map> map) {
Iterator>> iter = map.entrySet().iterator();
while (iter.hasNext()) {
List slots = iter.next().getValue();
if (slots.isEmpty()) {
iter.remove();
}
else if (slots.size() == 1) {
SharedSlot slot = slots.remove(0);
iter.remove();
return slot;
}
else {
return slots.remove(slots.size() - 1);
}
}
return null;
}
private static void removeSlotFromAllEntries(
Map>> availableSlots, SharedSlot slot)
{
final ResourceID taskManagerId = slot.getTaskManagerID();
for (Map.Entry>> entry : availableSlots.entrySet()) {
Map> map = entry.getValue();
List list = map.get(taskManagerId);
if (list != null) {
list.remove(slot);
if (list.isEmpty()) {
map.remove(taskManagerId);
}
}
}
}
}