All downloads are free. Search and download functionality uses the official Maven repository.

io.cequence.jinaapi.model.SegmenterSettings.scala Maven / Gradle / Ivy

package io.cequence.jinaapi.model

/**
 * Optional settings controlling segmentation: token output, chunking and head/tail truncation.
 *
 * Every field is optional and defaults to `None`. Note that `head` and `tail` are documented
 * as mutually exclusive, but this class performs no validation of that itself.
 *
 * @param returnTokens
 *   Whether the response should include the tokens together with their corresponding ids.
 * @param returnChunks
 *   Whether the input should be split into semantically meaningful segments, based on common
 *   structural cues, while coping with a wide variety of text types and edge cases.
 * @param maxChunkLength
 *   Upper bound on the number of characters per chunk. A chunk may end up shorter when the
 *   text offers a good boundary earlier. NOTE: the limit seems to be 2000 (observed, not
 *   confirmed).
 * @param head
 *   Return only the first N tokens of the content (boundary exclusive). Cannot be combined
 *   with `tail`.
 * @param tail
 *   Return only the last N tokens of the content (boundary exclusive). Cannot be combined
 *   with `head`.
 * @param tokenizer
 *   The tokenizer to use.
 */
case class SegmenterSettings(
  returnTokens: Option[Boolean] = None,
  returnChunks: Option[Boolean] = None,
  maxChunkLength: Option[Int] = None,
  head: Option[Int] = None,
  tail: Option[Int] = None,
  tokenizer: Option[String] = None
)




© 2015 - 2024 Weber Informatics LLC | Privacy Policy