All downloads are free. Search and download functionality uses the official Maven repository.

org.apache.wayang.flink.channels.DataSetChannel Maven / Gradle / Ivy

/*
 * Licensed to the Apache Software Foundation (ASF) under one
 * or more contributor license agreements.  See the NOTICE file
 * distributed with this work for additional information
 * regarding copyright ownership.  The ASF licenses this file
 * to you under the Apache License, Version 2.0 (the
 * "License"); you may not use this file except in compliance
 * with the License.  You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

package org.apache.wayang.flink.channels;

import org.apache.flink.api.java.DataSet;
import org.apache.wayang.core.optimizer.OptimizationContext;
import org.apache.wayang.core.plan.executionplan.Channel;
import org.apache.wayang.core.plan.wayangplan.OutputSlot;
import org.apache.wayang.core.platform.AbstractChannelInstance;
import org.apache.wayang.core.platform.ChannelDescriptor;
import org.apache.wayang.core.platform.ChannelInstance;
import org.apache.wayang.core.platform.Executor;
import org.apache.wayang.flink.execution.FlinkExecutor;

import java.util.OptionalLong;

/**
 * Describes the situation where one {@link DataSet} is operated on, producing a further {@link DataSet}.
 * 

NB: We might be more specific: Distinguish between cached/uncached and pipelined/aggregated.

*/ public class DataSetChannel extends Channel{ public static final ChannelDescriptor DESCRIPTOR = new ChannelDescriptor( DataSetChannel.class, true, false ); public static final ChannelDescriptor DESCRIPTOR_MANY = new ChannelDescriptor( DataSetChannel.class, true, false ); public DataSetChannel(ChannelDescriptor descriptor, OutputSlot outputSlot) { super(descriptor, outputSlot); assert descriptor == DESCRIPTOR || descriptor == DESCRIPTOR_MANY; // this.markForInstrumentation(); } private DataSetChannel(DataSetChannel parent) { super(parent); } @Override public Channel copy() { return new DataSetChannel(this); } @Override public Instance createInstance(Executor executor, OptimizationContext.OperatorContext producerOperatorContext, int producerOutputIndex) { return new Instance((FlinkExecutor) executor, producerOperatorContext, producerOutputIndex); } /** * {@link ChannelInstance} implementation for {@link DataSet}s. */ public class Instance extends AbstractChannelInstance { private DataSet dataSet; private long size; public Instance(FlinkExecutor executor, OptimizationContext.OperatorContext producerOperatorContext, int producerOutputIndex) { super(executor, producerOperatorContext, producerOutputIndex); } public void accept(DataSet dataSet, FlinkExecutor flinkExecutor) { this.dataSet = dataSet; } @SuppressWarnings("unchecked") public DataSet provideDataSet() { return (DataSet) this.dataSet; } @Override protected void doDispose() { this.dataSet = null; } @Override public OptionalLong getMeasuredCardinality() { return this.size == 0 ? super.getMeasuredCardinality() : OptionalLong.of(this.size); } @Override public DataSetChannel getChannel() { return DataSetChannel.this; } } }




© 2015 - 2025 Weber Informatics LLC | Privacy Policy