com.spotify.scio.util.ParallelLimitedFn.scala Maven / Gradle / Ivy
Go to download
Show more of this group Show more artifacts with this name
Show all versions of scio-core_2.13 Show documentation
Show all versions of scio-core_2.13 Show documentation
Scio - A Scala API for Apache Beam and Google Cloud Dataflow
The newest version!
/*
* Copyright 2019 Spotify AB.
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing,
* software distributed under the License is distributed on an
* "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
* KIND, either express or implied. See the License for the
* specific language governing permissions and limitations
* under the License.
*/
package com.spotify.scio.util
import java.util.concurrent.Semaphore
import com.spotify.scio.transforms.DoFnWithResource
import com.spotify.scio.transforms.DoFnWithResource.ResourceType
import org.apache.beam.sdk.transforms.DoFn
import org.apache.beam.sdk.transforms.DoFn.ProcessElement
/**
 * Utility class to limit the number of parallel doFns.
 *
 * Every call to [[processElement]] takes one permit from a `java.util.concurrent.Semaphore`
 * created with `maxDoFns` permits, delegates to [[parallelProcessElement]], and hands the permit
 * back once the delegate returns or throws. Callers that cannot get a permit block until one is
 * released.
 *
 * @param maxDoFns
 *   Max number of doFns
 * @tparam T
 *   input element type of the underlying `DoFn`
 * @tparam U
 *   output element type of the underlying `DoFn`
 */
abstract private[scio] class ParallelLimitedFn[T, U](maxDoFns: Int)
    extends DoFnWithResource[T, U, Semaphore]
    with NamedFn {

  // NOTE(review): PER_CLASS presumably means one semaphore is shared by all instances of the
  // concrete subclass -- confirm against DoFnWithResource.
  def getResourceType: ResourceType = ResourceType.PER_CLASS

  /** Creates a fair (FIFO) semaphore holding `maxDoFns` permits. */
  def createResource: Semaphore = new Semaphore(maxDoFns, true)

  /**
   * The actual element processing logic, invoked while a permit is held.
   *
   * @param x
   *   the process context of the element being handled
   */
  def parallelProcessElement(x: DoFn[T, U]#ProcessContext): Unit

  /**
   * Entry point called for each element; runs [[parallelProcessElement]] under the semaphore.
   *
   * The `ProcessContext` is taken as an argument because it is forwarded unchanged to the
   * implementor-facing `parallelProcessElement`.
   *
   * @param x
   *   the process context of the element being handled
   */
  @ProcessElement def processElement(x: DoFn[T, U]#ProcessContext): Unit = {
    val semaphore = getResource
    // Acquire *before* entering the try block: if acquire() is interrupted no permit was
    // obtained, and releasing in `finally` would add a permit that never existed, silently
    // raising the effective limit above maxDoFns.
    semaphore.acquire()
    try {
      parallelProcessElement(x)
    } finally {
      semaphore.release()
    }
  }
}
© 2015 - 2025 Weber Informatics LLC | Privacy Policy