com.spotify.scio.util.FunctionsWithWindowedValue.scala Maven / Gradle / Ivy
Go to download
Show more of this group Show more artifacts with this name
Show all versions of scio-core_2.13 Show documentation
Show all versions of scio-core_2.13 Show documentation
Scio - A Scala API for Apache Beam and Google Cloud Dataflow
/*
* Copyright 2019 Spotify AB.
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing,
* software distributed under the License is distributed on an
* "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
* KIND, either express or implied. See the License for the
* specific language governing permissions and limitations
* under the License.
*/
package com.spotify.scio.util
import com.spotify.scio.values.WindowedValue
import org.apache.beam.sdk.transforms.DoFn
import org.apache.beam.sdk.transforms.DoFn.{Element, OutputReceiver, ProcessElement, Timestamp}
import org.apache.beam.sdk.transforms.windowing.{BoundedWindow, PaneInfo}
import com.twitter.chill.ClosureCleaner
import org.joda.time.Instant
import scala.collection.compat._
/**
 * Factories for [[DoFn]]s whose user-supplied functions operate on [[WindowedValue]]s rather
 * than on bare elements.
 *
 * Every `DoFn` built here wraps the incoming element together with its timestamp, window and
 * pane into a [[WindowedValue]] before handing it to the user function. The user function is
 * passed through `ClosureCleaner.clean` once, when the `DoFn` is constructed.
 */
private[scio] object FunctionsWithWindowedValue {

  /**
   * Builds a `DoFn` that keeps only the elements for which `f` returns `true`.
   *
   * @param f
   *   predicate evaluated against the element wrapped as a [[WindowedValue]]
   * @return
   *   a `DoFn` that emits the original (unwrapped) element via `out.output` when `f` holds
   */
  def filterFn[T, U](f: WindowedValue[T] => Boolean): DoFn[T, T] =
    new NamedDoFn[T, T] {
      // The cleaned copy of `f` is what this DoFn holds on to and invokes.
      val cleaned = ClosureCleaner.clean(f)

      @ProcessElement
      private[scio] def processElement(
        @Element element: T,
        @Timestamp timestamp: Instant,
        out: OutputReceiver[T],
        pane: PaneInfo,
        window: BoundedWindow
      ): Unit =
        if (cleaned(WindowedValue(element, timestamp, window, pane))) {
          out.output(element)
        }
    }

  /**
   * Builds a `DoFn` that applies `f` to each input and emits every result it produces.
   *
   * Only the `value` and `timestamp` of each returned [[WindowedValue]] are read; each result
   * is emitted with `outputWithTimestamp`.
   *
   * @param f
   *   function from the wrapped input to zero or more wrapped outputs
   * @return
   *   a `DoFn` emitting the value of every result, stamped with that result's timestamp
   */
  def flatMapFn[T, U](f: WindowedValue[T] => TraversableOnce[WindowedValue[U]]): DoFn[T, U] =
    new NamedDoFn[T, U] {
      // The cleaned copy of `f` is what this DoFn holds on to and invokes.
      val cleaned = ClosureCleaner.clean(f)

      @ProcessElement
      private[scio] def processElement(
        @Element element: T,
        @Timestamp timestamp: Instant,
        out: OutputReceiver[U],
        pane: PaneInfo,
        window: BoundedWindow
      ): Unit = {
        val results = cleaned(WindowedValue(element, timestamp, window, pane)).iterator
        // Plain iterator loop: emit results one by one, in the order `f` produced them.
        while (results.hasNext) {
          val result = results.next()
          out.outputWithTimestamp(result.value, result.timestamp)
        }
      }
    }

  /**
   * Builds a `DoFn` that applies `f` to each input and emits the single result.
   *
   * Only the `value` and `timestamp` of the returned [[WindowedValue]] are read; the result is
   * emitted with `outputWithTimestamp`.
   *
   * @param f
   *   function from the wrapped input to one wrapped output
   * @return
   *   a `DoFn` emitting the result's value, stamped with the result's timestamp
   */
  def mapFn[T, U](f: WindowedValue[T] => WindowedValue[U]): DoFn[T, U] =
    new NamedDoFn[T, U] {
      // The cleaned copy of `f` is what this DoFn holds on to and invokes.
      val cleaned = ClosureCleaner.clean(f)

      @ProcessElement
      private[scio] def processElement(
        @Element element: T,
        @Timestamp timestamp: Instant,
        out: OutputReceiver[U],
        pane: PaneInfo,
        window: BoundedWindow
      ): Unit = {
        val input = WindowedValue(element, timestamp, window, pane)
        val result = cleaned(input)
        out.outputWithTimestamp(result.value, result.timestamp)
      }
    }
}
© 2015 - 2025 Weber Informatics LLC | Privacy Policy