All Downloads are FREE. Search and download functionalities are using the official Maven repository.

org.apache.flink.streaming.runtime.tasks.OneInputStreamTask Maven / Gradle / Ivy

The newest version!
/*
 * Licensed to the Apache Software Foundation (ASF) under one
 * or more contributor license agreements.  See the NOTICE file
 * distributed with this work for additional information
 * regarding copyright ownership.  The ASF licenses this file
 * to you under the Apache License, Version 2.0 (the
 * "License"); you may not use this file except in compliance
 * with the License.  You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

package org.apache.flink.streaming.runtime.tasks;

import org.apache.flink.annotation.Internal;
import org.apache.flink.annotation.VisibleForTesting;
import org.apache.flink.api.common.typeutils.TypeSerializer;
import org.apache.flink.core.memory.ManagedMemoryUseCase;
import org.apache.flink.metrics.Counter;
import org.apache.flink.runtime.execution.Environment;
import org.apache.flink.runtime.io.network.partition.consumer.IndexedInputGate;
import org.apache.flink.runtime.metrics.MetricNames;
import org.apache.flink.streaming.api.graph.StreamConfig;
import org.apache.flink.streaming.api.operators.Input;
import org.apache.flink.streaming.api.operators.OneInputStreamOperator;
import org.apache.flink.streaming.api.operators.sort.SortingDataInput;
import org.apache.flink.streaming.api.watermark.Watermark;
import org.apache.flink.streaming.runtime.io.PushingAsyncDataInput.DataOutput;
import org.apache.flink.streaming.runtime.io.RecordProcessorUtils;
import org.apache.flink.streaming.runtime.io.StreamOneInputProcessor;
import org.apache.flink.streaming.runtime.io.StreamTaskInput;
import org.apache.flink.streaming.runtime.io.StreamTaskNetworkInput;
import org.apache.flink.streaming.runtime.io.StreamTaskNetworkInputFactory;
import org.apache.flink.streaming.runtime.io.checkpointing.CheckpointBarrierHandler;
import org.apache.flink.streaming.runtime.io.checkpointing.CheckpointedInputGate;
import org.apache.flink.streaming.runtime.io.checkpointing.InputProcessorUtil;
import org.apache.flink.streaming.runtime.metrics.WatermarkGauge;
import org.apache.flink.streaming.runtime.streamrecord.LatencyMarker;
import org.apache.flink.streaming.runtime.streamrecord.RecordAttributes;
import org.apache.flink.streaming.runtime.streamrecord.StreamRecord;
import org.apache.flink.streaming.runtime.watermarkstatus.StatusWatermarkValve;
import org.apache.flink.streaming.runtime.watermarkstatus.WatermarkStatus;
import org.apache.flink.util.function.ThrowingConsumer;

import org.apache.flink.shaded.curator5.com.google.common.collect.Iterables;

import javax.annotation.Nullable;

import java.util.Arrays;
import java.util.Collections;
import java.util.List;
import java.util.Optional;

import static org.apache.flink.streaming.api.graph.StreamConfig.requiresSorting;
import static org.apache.flink.util.Preconditions.checkNotNull;
import static org.apache.flink.util.Preconditions.checkState;

/** A {@link StreamTask} for executing a {@link OneInputStreamOperator}. */
@Internal
public class OneInputStreamTask extends StreamTask> {

    @Nullable private CheckpointBarrierHandler checkpointBarrierHandler;

    private final WatermarkGauge inputWatermarkGauge = new WatermarkGauge();

    /**
     * Constructor for initialization, possibly with initial state (recovery / savepoint / etc).
     *
     * @param env The task environment for this task.
     */
    public OneInputStreamTask(Environment env) throws Exception {
        super(env);
    }

    /**
     * Constructor for initialization, possibly with initial state (recovery / savepoint / etc).
     *
     * 

This constructor accepts a special {@link TimerService}. By default (and if null is passes * for the time provider) a {@link SystemProcessingTimeService DefaultTimerService} will be * used. * * @param env The task environment for this task. * @param timeProvider Optionally, a specific time provider to use. */ @VisibleForTesting public OneInputStreamTask(Environment env, @Nullable TimerService timeProvider) throws Exception { super(env, timeProvider); } @Override public void init() throws Exception { StreamConfig configuration = getConfiguration(); int numberOfInputs = configuration.getNumberOfNetworkInputs(); if (numberOfInputs > 0) { CheckpointedInputGate inputGate = createCheckpointedInputGate(); Counter numRecordsIn = setupNumRecordsInCounter(mainOperator); DataOutput output = createDataOutput(numRecordsIn); StreamTaskInput input = createTaskInput(inputGate); StreamConfig.InputConfig[] inputConfigs = configuration.getInputs(getUserCodeClassLoader()); StreamConfig.InputConfig inputConfig = inputConfigs[0]; if (requiresSorting(inputConfig)) { checkState( !configuration.isCheckpointingEnabled(), "Checkpointing is not allowed with sorted inputs."); input = wrapWithSorted(input); } getEnvironment() .getMetricGroup() .getIOMetricGroup() .reuseRecordsInputCounter(numRecordsIn); inputProcessor = new StreamOneInputProcessor<>(input, output, operatorChain); } mainOperator .getMetricGroup() .gauge(MetricNames.IO_CURRENT_INPUT_WATERMARK, inputWatermarkGauge); // wrap watermark gauge since registered metrics must be unique getEnvironment() .getMetricGroup() .gauge(MetricNames.IO_CURRENT_INPUT_WATERMARK, inputWatermarkGauge::getValue); } @Override protected Optional getCheckpointBarrierHandler() { return Optional.ofNullable(checkpointBarrierHandler); } private StreamTaskInput wrapWithSorted(StreamTaskInput input) { ClassLoader userCodeClassLoader = getUserCodeClassLoader(); return new SortingDataInput<>( input, configuration.getTypeSerializerIn(input.getInputIndex(), userCodeClassLoader), configuration.getStateKeySerializer(userCodeClassLoader), configuration.getStatePartitioner(input.getInputIndex(), userCodeClassLoader), getEnvironment().getMemoryManager(), getEnvironment().getIOManager(), getExecutionConfig().isObjectReuseEnabled(), configuration.getManagedMemoryFractionOperatorUseCaseOfSlot( ManagedMemoryUseCase.OPERATOR, getJobConfiguration(), getEnvironment().getTaskConfiguration(), userCodeClassLoader), getEnvironment().getTaskManagerInfo().getConfiguration(), this, getExecutionConfig()); } @SuppressWarnings("unchecked") private CheckpointedInputGate createCheckpointedInputGate() { IndexedInputGate[] inputGates = getEnvironment().getAllInputGates(); checkpointBarrierHandler = InputProcessorUtil.createCheckpointBarrierHandler( this, configuration, getCheckpointCoordinator(), getTaskNameWithSubtaskAndId(), new List[] {Arrays.asList(inputGates)}, Collections.emptyList(), mainMailboxExecutor, systemTimerService); CheckpointedInputGate[] checkpointedInputGates = InputProcessorUtil.createCheckpointedMultipleInputGate( mainMailboxExecutor, new List[] {Arrays.asList(inputGates)}, getEnvironment().getMetricGroup().getIOMetricGroup(), checkpointBarrierHandler, configuration); return Iterables.getOnlyElement(Arrays.asList(checkpointedInputGates)); } private DataOutput createDataOutput(Counter numRecordsIn) { return new StreamTaskNetworkOutput<>( operatorChain.getFinishedOnRestoreInputOrDefault(mainOperator), inputWatermarkGauge, numRecordsIn); } private StreamTaskInput createTaskInput(CheckpointedInputGate inputGate) { StatusWatermarkValve statusWatermarkValve = new StatusWatermarkValve(inputGate); TypeSerializer inSerializer = configuration.getTypeSerializerIn1(getUserCodeClassLoader()); return StreamTaskNetworkInputFactory.create( inputGate, inSerializer, getEnvironment().getIOManager(), statusWatermarkValve, 0, getEnvironment().getTaskStateManager().getInputRescalingDescriptor(), gateIndex -> configuration .getInPhysicalEdges(getUserCodeClassLoader()) .get(gateIndex) .getPartitioner(), getEnvironment().getTaskInfo(), getCanEmitBatchOfRecords()); } /** * The network data output implementation used for processing stream elements from {@link * StreamTaskNetworkInput} in one input processor. */ private static class StreamTaskNetworkOutput implements DataOutput { private final Input operator; private final WatermarkGauge watermarkGauge; private final Counter numRecordsIn; private final ThrowingConsumer, Exception> recordProcessor; private StreamTaskNetworkOutput( Input operator, WatermarkGauge watermarkGauge, Counter numRecordsIn) { this.operator = checkNotNull(operator); this.watermarkGauge = checkNotNull(watermarkGauge); this.numRecordsIn = checkNotNull(numRecordsIn); this.recordProcessor = RecordProcessorUtils.getRecordProcessor(operator); } @Override public void emitRecord(StreamRecord record) throws Exception { numRecordsIn.inc(); recordProcessor.accept(record); } @Override public void emitWatermark(Watermark watermark) throws Exception { watermarkGauge.setCurrentWatermark(watermark.getTimestamp()); operator.processWatermark(watermark); } @Override public void emitWatermarkStatus(WatermarkStatus watermarkStatus) throws Exception { operator.processWatermarkStatus(watermarkStatus); } @Override public void emitLatencyMarker(LatencyMarker latencyMarker) throws Exception { operator.processLatencyMarker(latencyMarker); } @Override public void emitRecordAttributes(RecordAttributes recordAttributes) throws Exception { operator.processRecordAttributes(recordAttributes); } } }





© 2015 - 2025 Weber Informatics LLC | Privacy Policy