com.google.cloud.dataflow.sdk.util.BatchTimerInternals Maven / Gradle / Ivy
Go to download
Show more of this group Show more artifacts with this name
Show all versions of google-cloud-dataflow-java-sdk-all Show documentation
Show all versions of google-cloud-dataflow-java-sdk-all Show documentation
Google Cloud Dataflow Java SDK provides a simple, Java-based
interface for processing virtually any size data using Google cloud
resources. This artifact includes entire Dataflow Java SDK.
/*
* Copyright (C) 2015 Google Inc.
*
* Licensed under the Apache License, Version 2.0 (the "License"); you may not
* use this file except in compliance with the License. You may obtain a copy of
* the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS, WITHOUT
* WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the
* License for the specific language governing permissions and limitations under
* the License.
*/
package com.google.cloud.dataflow.sdk.util;
import static com.google.common.base.Preconditions.checkState;
import com.google.cloud.dataflow.sdk.transforms.windowing.BoundedWindow;
import com.google.common.base.MoreObjects;
import org.joda.time.Instant;
import java.util.ArrayList;
import java.util.HashSet;
import java.util.PriorityQueue;
import java.util.Set;
import javax.annotation.Nullable;
/**
* TimerInternals that uses priority queues to manage the timers that are ready to fire.
*/
public class BatchTimerInternals implements TimerInternals {
/** Set of timers that are scheduled used for deduplicating timers. */
private Set existingTimers = new HashSet<>();
// Keep these queues separate so we can advance over them separately.
private PriorityQueue watermarkTimers = new PriorityQueue<>(11);
private PriorityQueue processingTimers = new PriorityQueue<>(11);
private Instant inputWatermarkTime;
private Instant processingTime;
private PriorityQueue queue(TimeDomain domain) {
return TimeDomain.EVENT_TIME.equals(domain) ? watermarkTimers : processingTimers;
}
public BatchTimerInternals(Instant processingTime) {
this.processingTime = processingTime;
this.inputWatermarkTime = BoundedWindow.TIMESTAMP_MIN_VALUE;
}
@Override
public void setTimer(TimerData timer) {
if (existingTimers.add(timer)) {
queue(timer.getDomain()).add(timer);
}
}
@Override
public void deleteTimer(TimerData timer) {
existingTimers.remove(timer);
queue(timer.getDomain()).remove(timer);
}
@Override
public Instant currentProcessingTime() {
return processingTime;
}
/**
* {@inheritDoc}
*
* @return {@link BoundedWindow#TIMESTAMP_MAX_VALUE}: in batch mode, upstream processing
* is already complete.
*/
@Override
@Nullable
public Instant currentSynchronizedProcessingTime() {
return BoundedWindow.TIMESTAMP_MAX_VALUE;
}
@Override
public Instant currentInputWatermarkTime() {
return inputWatermarkTime;
}
@Override
@Nullable
public Instant currentOutputWatermarkTime() {
// The output watermark is always undefined in batch mode.
return null;
}
@Override
public String toString() {
return MoreObjects.toStringHelper(getClass())
.add("watermarkTimers", watermarkTimers)
.add("processingTimers", processingTimers)
.toString();
}
public void advanceInputWatermark(ReduceFnRunner runner, Instant newInputWatermark)
throws Exception {
checkState(!newInputWatermark.isBefore(inputWatermarkTime),
"Cannot move input watermark time backwards from %s to %s", inputWatermarkTime,
newInputWatermark);
inputWatermarkTime = newInputWatermark;
advance(runner, newInputWatermark, TimeDomain.EVENT_TIME);
}
public void advanceProcessingTime(ReduceFnRunner runner, Instant newProcessingTime)
throws Exception {
checkState(!newProcessingTime.isBefore(processingTime),
"Cannot move processing time backwards from %s to %s", processingTime, newProcessingTime);
processingTime = newProcessingTime;
advance(runner, newProcessingTime, TimeDomain.PROCESSING_TIME);
}
private void advance(ReduceFnRunner runner, Instant newTime, TimeDomain domain)
throws Exception {
PriorityQueue timers = queue(domain);
boolean shouldFire = false;
while (true) {
ArrayList firedTimers = new ArrayList();
while (!timers.isEmpty() && newTime.isAfter(timers.peek().getTimestamp())) {
// Remove before firing, so that if the callback adds another identical
// timer we don't remove it.
TimerData timer = timers.remove();
existingTimers.remove(timer);
firedTimers.add(timer);
}
if (firedTimers.isEmpty()) {
break;
}
runner.onTimers(firedTimers);
}
}
}