
com.johnsnowlabs.nlp.annotators.sbd.pragmatic.PragmaticSymbols.scala Maven / Gradle / Ivy
package com.johnsnowlabs.nlp.annotators.sbd.pragmatic
/**
* Created by Saif Addin on 6/3/2017.
*/
/**
* Extends RuleSymbols with specific symbols used for the pragmatic approach. Right now, the only one.
*/
object PragmaticSymbols extends RuleSymbols {
/**
* ====================
* BREAKING SYMBOLS
* ====================
*/
/**
* Punctuation line breaker
* alt 200
*/
val PUNCT_INDICATOR = "╚"
/**
* Ellipsis breaker
* looks up -> "..."
* alt 203
*/
val ELLIPSIS_INDICATOR = "╦"
/**
* =====================
* NON BREAKING SYMBOLS
* =====================
*/
/**
* Non separation dots for abbreviations
* looks up -> .
* alt 198
*/
val ABBREVIATOR = "╞"
/**
* Non separation dots for numbers
* looks up -> .
* alt 199
*/
val NUM_INDICATOR = "╟"
/**
* Period container non breaker
* looks up -> .
* alt 201
*/
val MULT_PERIOD = "╔"
/**
* Special non breaking symbol
* alt 202
*/
val SPECIAL_PERIOD = "╩"
/**
* Question in quotes
* alt 209
*/
val QUESTION_IN_QUOTE = "╤" // ?
/**
* Exclamation mark in rules
* alt 210
*/
val EXCLAMATION_INDICATOR = "╥" // !
override def symbolRecovery: Map[String, String] = super.symbolRecovery ++ Map(
ABBREVIATOR -> ".",
NUM_INDICATOR -> ".",
MULT_PERIOD -> ".",
QUESTION_IN_QUOTE -> "?",
EXCLAMATION_INDICATOR -> "!",
ELLIPSIS_INDICATOR -> "..."
)
}
© 2015 - 2025 Weber Informatics LLC | Privacy Policy