org.apache.flink.runtime.jobgraph.JobGraph Maven / Gradle / Ivy

Show more of this group Show more artifacts with this name
Show all versions of flink-runtime_2.11 Show documentation
There is a newer version: 1.5.1
/*
 * Licensed to the Apache Software Foundation (ASF) under one
 * or more contributor license agreements.  See the NOTICE file
 * distributed with this work for additional information
 * regarding copyright ownership.  The ASF licenses this file
 * to you under the Apache License, Version 2.0 (the
 * "License"); you may not use this file except in compliance
 * with the License.  You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

package org.apache.flink.runtime.jobgraph;

import org.apache.flink.annotation.VisibleForTesting;
import org.apache.flink.api.common.ExecutionConfig;
import org.apache.flink.api.common.InvalidProgramException;
import org.apache.flink.api.common.JobID;
import org.apache.flink.api.common.cache.DistributedCache;
import org.apache.flink.configuration.Configuration;
import org.apache.flink.core.fs.Path;
import org.apache.flink.runtime.blob.PermanentBlobKey;
import org.apache.flink.runtime.jobgraph.tasks.JobCheckpointingSettings;
import org.apache.flink.runtime.resourcemanager.placementconstraint.PlacementConstraint;
import org.apache.flink.util.InstantiationUtil;
import org.apache.flink.util.SerializedValue;

import java.io.IOException;
import java.io.Serializable;
import java.net.URL;
import java.util.ArrayList;
import java.util.Collection;
import java.util.Collections;
import java.util.HashMap;
import java.util.Iterator;
import java.util.LinkedHashMap;
import java.util.LinkedHashSet;
import java.util.List;
import java.util.Map;
import java.util.Set;

import static org.apache.flink.util.Preconditions.checkNotNull;

/**
 * The JobGraph represents a Flink dataflow program, at the low level that the JobManager accepts.
 * All programs from higher level APIs are transformed into JobGraphs.
 *
 * The JobGraph is a graph of vertices and intermediate results that are connected together to
 * form a DAG. Note that iterations (feedback edges) are currently not encoded inside the JobGraph
 * but inside certain special vertices that establish the feedback channel amongst themselves.
 *
 * The JobGraph defines the job-wide configuration settings, while each vertex and intermediate result
 * define the characteristics of the concrete operation and intermediate data.
 */
public class JobGraph implements Serializable {

	private static final long serialVersionUID = 1L;

	// --- job and configuration ---

	/** List of task vertices included in this job graph. */
	private final Map taskVertices = new LinkedHashMap();

	/** Map of results produced by vertices in this job graph. */
	private final Map results = new HashMap<>();

	/** The job configuration attached to this job. */
	private final Configuration jobConfiguration = new Configuration();

	/** The configuration for scheduling. It's not visible to tasks. */
	private final Configuration schedulingConfiguration = new Configuration();

	/** ID of this job. May be set if specific job id is desired (e.g. session management) */
	private final JobID jobID;

	/** Name of this job. */
	private final String jobName;

	/** The number of seconds after which the corresponding ExecutionGraph is removed at the
	 * job manager after it has been executed. */
	private long sessionTimeout = 0;

	/** flag to enable queued scheduling */
	private boolean allowQueuedScheduling;

	/** Whether the job has non-deterministic shuffles. */
	private boolean hasNonDeterministicShuffles = false;

	/** Placement constraints of this job. */
	private List placementConstraints = new ArrayList<>();

	/** Version of this job. The version will change each time the job is updated. */
	private long jobVersion = 0L;

	// --- checkpointing ---

	/** Job specific execution config */
	private SerializedValue serializedExecutionConfig;

	/** The settings for the job checkpoints */
	private JobCheckpointingSettings snapshotSettings;

	/** Savepoint restore settings. */
	private SavepointRestoreSettings savepointRestoreSettings = SavepointRestoreSettings.none();

	// --- attached resources ---

	/** Set of JAR files required to run this job. */
	private final List userJars = new ArrayList();

	/** Set of custom files required to run this job. */
	private final Map userArtifacts = new HashMap<>();

	/** Set of blob keys identifying the JAR files required to run this job. */
	private final List userJarBlobKeys = new ArrayList<>();

	/** List of classpaths required to run this job. */
	private List classpaths = Collections.emptyList();

	// --------------------------------------------------------------------------------------------

	/**
	 * Constructs a new job graph with the given name, the given {@link ExecutionConfig},
	 * and a random job ID. The ExecutionConfig will be serialized and can't be modified afterwards.
	 *
	 * @param jobName The name of the job.
	 */
	public JobGraph(String jobName) {
		this(null, jobName);
	}

	/**
	 * Constructs a new job graph with the given job ID (or a random ID, if {@code null} is passed),
	 * the given name and the given execution configuration (see {@link ExecutionConfig}).
	 * The ExecutionConfig will be serialized and can't be modified afterwards.
	 *
	 * @param jobId The id of the job. A random ID is generated, if {@code null} is passed.
	 * @param jobName The name of the job.
	 */
	public JobGraph(JobID jobId, String jobName) {
		this.jobID = jobId == null ? new JobID() : jobId;
		this.jobName = jobName == null ? "(unnamed job)" : jobName;

		try {
			setExecutionConfig(new ExecutionConfig());
		} catch (IOException e) {
			// this should never happen, since an empty execution config is always serializable
			throw new RuntimeException("bug, empty execution config is not serializable");
		}
	}

	/**
	 * Constructs a new job graph with no name, a random job ID, the given {@link ExecutionConfig}, and
	 * the given job vertices. The ExecutionConfig will be serialized and can't be modified afterwards.
	 *
	 * @param vertices The vertices to add to the graph.
	 */
	public JobGraph(JobVertex... vertices) {
		this(null, vertices);
	}

	/**
	 * Constructs a new job graph with the given name, the given {@link ExecutionConfig}, a random job ID,
	 * and the given job vertices. The ExecutionConfig will be serialized and can't be modified afterwards.
	 *
	 * @param jobName The name of the job.
	 * @param vertices The vertices to add to the graph.
	 */
	public JobGraph(String jobName, JobVertex... vertices) {
		this(null, jobName, vertices);
	}

	/**
	 * Constructs a new job graph with the given name, the given {@link ExecutionConfig},
	 * the given jobId or a random one if null supplied, and the given job vertices.
	 * The ExecutionConfig will be serialized and can't be modified afterwards.
	 *
	 * @param jobId The id of the job. A random ID is generated, if {@code null} is passed.
	 * @param jobName The name of the job.
	 * @param vertices The vertices to add to the graph.
	 */
	public JobGraph(JobID jobId, String jobName, JobVertex... vertices) {
		this(jobId, jobName);

		for (JobVertex vertex : vertices) {
			addVertex(vertex);
		}
	}

	// --------------------------------------------------------------------------------------------

	/**
	 * Returns the ID of the job.
	 *
	 * @return the ID of the job
	 */
	public JobID getJobID() {
		return this.jobID;
	}

	/**
	 * Returns the name assigned to the job graph.
	 *
	 * @return the name assigned to the job graph
	 */
	public String getName() {
		return this.jobName;
	}

	/**
	 * Returns the configuration object for this job. Job-wide parameters should be set into that
	 * configuration object.
	 *
	 * @return The configuration object for this job.
	 */
	public Configuration getJobConfiguration() {
		return this.jobConfiguration;
	}

	/**
	 * Adds custom configuration for this job.
	 *
	 * @param configuration The custom configuration for this job.
	 */
	public void addCustomConfiguration(Configuration configuration) {
		if (configuration != null) {
			this.jobConfiguration.addAll(configuration);
		}
	}

	/**
	 * Returns the configuration object for scheduling.
	 * Parameters in this config will not be visible to tasks.
	 *
	 * @return The configuration object for scheduling.
	 */
	public Configuration getSchedulingConfiguration() {
		return this.schedulingConfiguration;
	}

	/**
	 * Returns the {@link ExecutionConfig}
	 *
	 * @return ExecutionConfig
	 */
	public SerializedValue getSerializedExecutionConfig() {
		return serializedExecutionConfig;
	}

	/**
	 * Gets the timeout after which the corresponding ExecutionGraph is removed at the
	 * job manager after it has been executed.
	 * @return a timeout as a long in seconds.
	 */
	public long getSessionTimeout() {
		return sessionTimeout;
	}

	/**
	 * Sets the timeout of the session in seconds. The timeout specifies how long a job will be kept
	 * in the job manager after it finishes.
	 * @param sessionTimeout The timeout in seconds
	 */
	public void setSessionTimeout(long sessionTimeout) {
		this.sessionTimeout = sessionTimeout;
	}

	public void setAllowQueuedScheduling(boolean allowQueuedScheduling) {
		this.allowQueuedScheduling = allowQueuedScheduling;
	}

	public boolean getAllowQueuedScheduling() {
		return allowQueuedScheduling;
	}

	public void setHasNonDeterministicShuffles(boolean hasNonDeterministicShuffles) {
		this.hasNonDeterministicShuffles = hasNonDeterministicShuffles;
	}

	public boolean hasNonDeterministicShuffles() {
		return hasNonDeterministicShuffles;
	}

	public List getPlacementConstraints() {
		return placementConstraints;
	}

	public void addPlacementConstraint(PlacementConstraint constraint) {
		this.placementConstraints.add(constraint);
	}

	public long getJobVersion() {
		return this.jobVersion;
	}

	public void setJobVersion(long newJobVersion) {
		this.jobVersion = newJobVersion;
	}

	@VisibleForTesting
	public void setScheduleMode(ScheduleMode scheduleMode) {
		this.schedulingConfiguration.setString(ScheduleMode.class.getName(), scheduleMode.toString());
	}

	/**
	 * Sets the savepoint restore settings.
	 * @param settings The savepoint restore settings.
	 */
	public void setSavepointRestoreSettings(SavepointRestoreSettings settings) {
		this.savepointRestoreSettings = checkNotNull(settings, "Savepoint restore settings");
	}

	/**
	 * Returns the configured savepoint restore setting.
	 * @return The configured savepoint restore settings.
	 */
	public SavepointRestoreSettings getSavepointRestoreSettings() {
		return savepointRestoreSettings;
	}

	/**
	 * Sets the execution config. This method eagerly serialized the ExecutionConfig for future RPC
	 * transport. Further modification of the referenced ExecutionConfig object will not affect
	 * this serialized copy.
	 *
	 * @param executionConfig The ExecutionConfig to be serialized.
	 * @throws IOException Thrown if the serialization of the ExecutionConfig fails
	 */
	public void setExecutionConfig(ExecutionConfig executionConfig) throws IOException {
		checkNotNull(executionConfig, "ExecutionConfig must not be null.");
		this.serializedExecutionConfig = new SerializedValue<>(executionConfig);
	}

	/**
	 * Adds a new task vertex to the job graph if it is not already included.
	 *
	 * @param vertex
	 *        the new task vertex to be added
	 */
	public void addVertex(JobVertex vertex) {
		final JobVertexID id = vertex.getID();
		JobVertex previous = taskVertices.put(id, vertex);

		// if we had a prior association, restore and throw an exception
		if (previous != null) {
			taskVertices.put(id, previous);
			throw new IllegalArgumentException("The JobGraph already contains a vertex with that id.");
		}
	}

	/**
	 * Adds new task vertices to the job graph.
	 *
	 * @param vertices the new task vertices to be added
	 */
	public void addVertices(Collection vertices) {
		checkNotNull(vertices);

		for (JobVertex vertex : vertices) {
			addVertex(vertex);
		}
	}

	/**
	 * Returns an Iterable to iterate all vertices registered with the job graph.
	 *
	 * @return an Iterable to iterate all vertices registered with the job graph
	 */
	public Iterable getVertices() {
		return this.taskVertices.values();
	}

	/**
	 * Returns an array of all job vertices that are registered with the job graph. The order in which the vertices
	 * appear in the list is not defined.
	 *
	 * @return an array of all job vertices that are registered with the job graph
	 */
	public JobVertex[] getVerticesAsArray() {
		return this.taskVertices.values().toArray(new JobVertex[this.taskVertices.size()]);
	}

	/**
	 * Returns the number of all vertices.
	 *
	 * @return The number of all vertices.
	 */
	public int getNumberOfVertices() {
		return this.taskVertices.size();
	}

	/**
	 * Sets the settings for asynchronous snapshots. A value of {@code null} means that
	 * snapshotting is not enabled.
	 *
	 * @param settings The snapshot settings, or null, to disable snapshotting.
	 */
	public void setSnapshotSettings(JobCheckpointingSettings settings) {
		this.snapshotSettings = settings;
	}

	/**
	 * Gets the settings for asynchronous snapshots. This method returns null, when
	 * checkpointing is not enabled.
	 *
	 * @return The snapshot settings, or null, if checkpointing is not enabled.
	 */
	public JobCheckpointingSettings getCheckpointingSettings() {
		return snapshotSettings;
	}

	/**
	 * Searches for a vertex with a matching ID and returns it.
	 *
	 * @param id
	 *        the ID of the vertex to search for
	 * @return the vertex with the matching ID or null if no vertex with such ID could be found
	 */
	public JobVertex findVertexByID(JobVertexID id) {
		return this.taskVertices.get(id);
	}

	/**
	 * Sets the classpaths required to run the job on a task manager.
	 *
	 * @param paths paths of the directories/JAR files required to run the job on a task manager
	 */
	public void setClasspaths(List paths) {
		classpaths = paths;
	}

	public List getClasspaths() {
		return classpaths;
	}

	/**
	 * Gets the maximum parallelism of all operations in this job graph.
	 *
	 * @return The maximum parallelism of this job graph
	 */
	public int getMaximumParallelism() {
		int maxParallelism = -1;
		for (JobVertex vertex : taskVertices.values()) {
			maxParallelism = Math.max(vertex.getParallelism(), maxParallelism);
		}
		return maxParallelism;
	}

	public List> getResultPartitionConsumerExecutionVertices(
		IntermediateDataSetID resultID,
		int partitionNumber) {

		IntermediateDataSet result = getResult(resultID);
		if (result == null) {
			throw new IllegalArgumentException("Cannot find the given result " + resultID + " in job graph");
		}
		if (partitionNumber >= result.getProducer().getParallelism()) {
			throw new IllegalArgumentException("Result partition index out of bounds: " + partitionNumber
				+ "/" + result.getProducer().getParallelism());
		}

		List> consumerVertices = new ArrayList<>();
		for (JobEdge edge : getResult(resultID).getConsumers()) {
			consumerVertices.add(edge.getConsumerExecutionVertices(partitionNumber));
		}
		return consumerVertices;
	}

	public JobVertexID getResultProducerID(IntermediateDataSetID resultID) {
		IntermediateDataSet result = getResult(resultID);
		if (result == null) {
			throw new IllegalArgumentException("Cannot find the given result " + resultID + " in job graph");
		}
		return result.getProducer().getID();
	}

	public Collection getResultIDs() {
		// Lazy build the result map if the result is not found, as edges may be late added
		for (JobVertex vertex : getVertices()) {
			for (IntermediateDataSet result : vertex.getProducedDataSets()) {
				results.put(result.getId(), result);
			}
		}

		return results.keySet();
	}

	public IntermediateDataSet getResult(IntermediateDataSetID resultID) {
		// Lazy build the result map if the result is not found, as edges may be late added
		if (!results.containsKey(resultID)) {
			for (JobVertex vertex : getVertices()) {
				for (IntermediateDataSet result : vertex.getProducedDataSets()) {
					results.put(result.getId(), result);
				}
			}
		}

		return results.get(resultID);
	}

	// --------------------------------------------------------------------------------------------
	//  Topological Graph Access
	// --------------------------------------------------------------------------------------------

	public List getVerticesSortedTopologicallyFromSources() throws InvalidProgramException {
		// early out on empty lists
		if (this.taskVertices.isEmpty()) {
			return Collections.emptyList();
		}

		List sorted = new ArrayList(this.taskVertices.size());
		Set remaining = new LinkedHashSet(this.taskVertices.values());

		// start by finding the vertices with no input edges
		// and the ones with disconnected inputs (that refer to some standalone data set)
		{
			Iterator iter = remaining.iterator();
			while (iter.hasNext()) {
				JobVertex vertex = iter.next();

				if (vertex.hasNoConnectedInputs()) {
					sorted.add(vertex);
					iter.remove();
				}
			}
		}

		int startNodePos = 0;

		// traverse from the nodes that were added until we found all elements
		while (!remaining.isEmpty()) {

			// first check if we have more candidates to start traversing from. if not, then the
			// graph is cyclic, which is not permitted
			if (startNodePos >= sorted.size()) {
				throw new InvalidProgramException("The job graph is cyclic.");
			}

			JobVertex current = sorted.get(startNodePos++);
			addNodesThatHaveNoNewPredecessors(current, sorted, remaining);
		}

		return sorted;
	}

	private void addNodesThatHaveNoNewPredecessors(JobVertex start, List target, Set remaining) {

		// forward traverse over all produced data sets and all their consumers
		for (IntermediateDataSet dataSet : start.getProducedDataSets()) {
			for (JobEdge edge : dataSet.getConsumers()) {

				// a vertex can be added, if it has no predecessors that are still in the 'remaining' set
				JobVertex v = edge.getTarget();
				if (!remaining.contains(v)) {
					continue;
				}

				boolean hasNewPredecessors = false;

				for (JobEdge e : v.getInputs()) {
					// skip the edge through which we came
					if (e == edge) {
						continue;
					}

					IntermediateDataSet source = e.getSource();
					if (remaining.contains(source.getProducer())) {
						hasNewPredecessors = true;
						break;
					}
				}

				if (!hasNewPredecessors) {
					target.add(v);
					remaining.remove(v);
					addNodesThatHaveNoNewPredecessors(v, target, remaining);
				}
			}
		}
	}

	// --------------------------------------------------------------------------------------------
	//  Handling of attached JAR files
	// --------------------------------------------------------------------------------------------

	/**
	 * Adds the path of a JAR file required to run the job on a task manager.
	 *
	 * @param jar
	 *        path of the JAR file required to run the job on a task manager
	 */
	public void addJar(Path jar) {
		if (jar == null) {
			throw new IllegalArgumentException();
		}

		if (!userJars.contains(jar)) {
			userJars.add(jar);
		}
	}

	/**
	 * Gets the list of assigned user jar paths.
	 *
	 * @return The list of assigned user jar paths
	 */
	public List getUserJars() {
		return userJars;
	}

	/**
	 * Adds the path of a custom file required to run the job on a task manager.
	 *
	 * @param name a name under which this artifact will be accessible through {@link DistributedCache}
	 * @param file path of a custom file required to run the job on a task manager
	 */
	public void addUserArtifact(String name, DistributedCache.DistributedCacheEntry file) {
		if (file == null) {
			throw new IllegalArgumentException();
		}

		userArtifacts.putIfAbsent(name, file);
	}

	/**
	 * Gets the list of assigned user jar paths.
	 *
	 * @return The list of assigned user jar paths
	 */
	public Map getUserArtifacts() {
		return userArtifacts;
	}

	/**
	 * Adds the BLOB referenced by the key to the JobGraph's dependencies.
	 *
	 * @param key
	 *        path of the JAR file required to run the job on a task manager
	 */
	public void addUserJarBlobKey(PermanentBlobKey key) {
		if (key == null) {
			throw new IllegalArgumentException();
		}

		if (!userJarBlobKeys.contains(key)) {
			userJarBlobKeys.add(key);
		}
	}

	/**
	 * Checks whether the JobGraph has user code JAR files attached.
	 *
	 * @return True, if the JobGraph has user code JAR files attached, false otherwise.
	 */
	public boolean hasUsercodeJarFiles() {
		return this.userJars.size() > 0;
	}

	/**
	 * Returns a set of BLOB keys referring to the JAR files required to run this job.
	 *
	 * @return set of BLOB keys referring to the JAR files required to run this job
	 */
	public List getUserJarBlobKeys() {
		return this.userJarBlobKeys;
	}

	@Override
	public String toString() {
		return "JobGraph(jobId: " + jobID + ")";
	}

	public void setUserArtifactBlobKey(String entryName, PermanentBlobKey blobKey) throws IOException {
		byte[] serializedBlobKey;
		serializedBlobKey = InstantiationUtil.serializeObject(blobKey);

		userArtifacts.computeIfPresent(entryName, (key, originalEntry) -> new DistributedCache.DistributedCacheEntry(
			originalEntry.filePath,
			originalEntry.isExecutable,
			serializedBlobKey,
			originalEntry.isZipped
		));
	}

	public void writeUserArtifactEntriesToConfiguration() {
		for (Map.Entry userArtifact : userArtifacts.entrySet()) {
			DistributedCache.writeFileInfoToConfig(
				userArtifact.getKey(),
				userArtifact.getValue(),
				jobConfiguration
			);
		}
	}
}