// org.apache.flink.runtime.jobgraph.IntermediateDataSet (Maven / Gradle / Ivy)
/*
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.flink.runtime.jobgraph;
import org.apache.flink.runtime.io.network.partition.ResultPartitionType;
import java.util.ArrayList;
import java.util.List;
import static com.google.common.base.Preconditions.checkNotNull;
/**
* An intermediate data set is the data set produced by an operator - either a
* source or any intermediate operation.
*
* Intermediate data sets may be read by other operators, materialized, or
* discarded.
*/
public class IntermediateDataSet implements java.io.Serializable {

	private static final long serialVersionUID = 1L;

	/** The identifier of this data set. */
	private final IntermediateDataSetID id;

	/** The operation that produced this data set. */
	private final JobVertex producer;

	/** The edges registered via {@link #addConsumer(JobEdge)}, in registration order. */
	private final List<JobEdge> consumers = new ArrayList<JobEdge>();

	/** The type of partition to use at runtime. */
	private final ResultPartitionType resultType;

	/**
	 * Flag indicating whether to eagerly deploy consumers.
	 *
	 * <p>If {@code true}, the consumers are deployed as soon as the
	 * runtime result is registered at the result manager of the task manager.
	 * Never set by a constructor, so it starts out as {@code false}.
	 */
	private boolean eagerlyDeployConsumers;

	// --------------------------------------------------------------------------------------------

	/**
	 * Creates a data set with a newly created {@link IntermediateDataSetID} and the
	 * {@link ResultPartitionType#PIPELINED} result type.
	 *
	 * @param producer the operation that produces this data set
	 * @throws NullPointerException if {@code producer} is {@code null}
	 */
	public IntermediateDataSet(JobVertex producer) {
		this(new IntermediateDataSetID(), producer);
	}

	/**
	 * Creates a data set with the given ID and the
	 * {@link ResultPartitionType#PIPELINED} result type.
	 *
	 * @param id the identifier of this data set
	 * @param producer the operation that produces this data set
	 * @throws NullPointerException if any argument is {@code null}
	 */
	public IntermediateDataSet(IntermediateDataSetID id, JobVertex producer) {
		this(id, ResultPartitionType.PIPELINED, producer);
	}

	/**
	 * Creates a data set with the given ID, result type and producer.
	 *
	 * @param id the identifier of this data set
	 * @param resultType the type of partition to use at runtime
	 * @param producer the operation that produces this data set
	 * @throws NullPointerException if any argument is {@code null}
	 */
	public IntermediateDataSet(IntermediateDataSetID id, ResultPartitionType resultType, JobVertex producer) {
		this.id = checkNotNull(id);
		this.producer = checkNotNull(producer);
		this.resultType = checkNotNull(resultType);
	}

	// --------------------------------------------------------------------------------------------

	/**
	 * Returns the identifier of this data set.
	 *
	 * @return the identifier, never {@code null}
	 */
	public IntermediateDataSetID getId() {
		return id;
	}

	/**
	 * Returns the operation that produced this data set.
	 *
	 * @return the producer, never {@code null}
	 */
	public JobVertex getProducer() {
		return producer;
	}

	/**
	 * Returns the edges that have been added as consumers of this data set.
	 *
	 * <p>The returned list is the internal list itself, not a copy; changes made
	 * through it are visible to this data set.
	 *
	 * @return the live list of consumer edges
	 */
	public List<JobEdge> getConsumers() {
		return this.consumers;
	}

	/**
	 * Returns the type of partition to use at runtime.
	 *
	 * @return the result partition type, never {@code null}
	 */
	public ResultPartitionType getResultType() {
		return resultType;
	}

	/**
	 * Sets the flag indicating whether to eagerly deploy consumers (default:
	 * {@code false}).
	 *
	 * @param eagerlyDeployConsumers If {@code true}, the consumers are
	 *                               deployed as soon as the runtime result is
	 *                               registered at the result manager of the
	 *                               task manager. Default is {@code false}.
	 */
	public void setEagerlyDeployConsumers(boolean eagerlyDeployConsumers) {
		this.eagerlyDeployConsumers = eagerlyDeployConsumers;
	}

	/**
	 * Returns whether consumers should be deployed eagerly (as soon as the
	 * runtime result is registered at the result manager of the task manager).
	 *
	 * @return Whether consumers should be deployed eagerly
	 */
	public boolean getEagerlyDeployConsumers() {
		return eagerlyDeployConsumers;
	}

	// --------------------------------------------------------------------------------------------

	/**
	 * Registers an edge as a consumer of this data set by appending it to the
	 * consumer list. The edge is not validated here.
	 *
	 * @param edge the edge to add
	 */
	public void addConsumer(JobEdge edge) {
		this.consumers.add(edge);
	}

	// --------------------------------------------------------------------------------------------

	@Override
	public String toString() {
		return "Intermediate Data Set (" + id + ")";
	}
}