All Downloads are FREE. Search and download functionalities are using the official Maven repository.

eu.ostrzyciel.jelly.stream.SizeLimiter.scala Maven / Gradle / Ivy

package eu.ostrzyciel.jelly.stream

import eu.ostrzyciel.jelly.core.proto.v1.RdfStreamRow
import org.apache.pekko.NotUsed
import org.apache.pekko.stream.scaladsl.Flow

/**
 * Policy for limiting the size of stream frames in the Jelly stream producer.
 *
 * Note that the limiter is only a **limit**. When streaming grouped triples,
 * grouped quads, or graphs, the size of the stream frame may be smaller than
 * the limit, as the stream frame is always created after the group is complete.
 *
 * See also: [[EncoderFlow]], [[EncoderSource]]
 */
trait SizeLimiter:
  /**
   * Flow that limits the size of stream frames.
   *
   * The flow should group the incoming rows into Seqs that will be later used to
   * create stream frames.
   * @return Apache Pekko Flow
   */
  def flow: Flow[RdfStreamRow, Seq[RdfStreamRow], NotUsed]

/**
 * Stream frame size limiter that tries to maintain a specific byte size of stream frames.
 * 
 * NOTE: this does not guarantee that the size of the stream frames will be less or equal
 * to the target size. The frames will in general be slightly larger than the target size,
 * by as much as one stream row.
 * 
 * @param targetSize target byte size of stream frames
 */
final class ByteSizeLimiter(targetSize: Long) extends SizeLimiter:
  override def flow: Flow[RdfStreamRow, Seq[RdfStreamRow], NotUsed] =
    Flow[RdfStreamRow].groupedWeighted(targetSize)(row => row.serializedSize)

/**
 * Stream frame size limiter that maintains a maximum number of rows in stream frames.
 * @param maxRows maximum number of rows in stream frames
 */
final class StreamRowCountLimiter(maxRows: Int) extends SizeLimiter:
  override def flow: Flow[RdfStreamRow, Seq[RdfStreamRow], NotUsed] =
    Flow[RdfStreamRow].grouped(maxRows)




© 2015 - 2025 Weber Informatics LLC | Privacy Policy