parsley.errors.tokenextractors.TillNextWhitespace.scala Maven / Gradle / Ivy
/* SPDX-FileCopyrightText: © 2022 Parsley Contributors
* SPDX-License-Identifier: BSD-3-Clause
*/
package parsley.errors.tokenextractors
import scala.collection.immutable.WrappedString
import parsley.XCompat.unused
import parsley.errors.{helpers, ErrorBuilder, Token, TokenSpan}
// Turn coverage off, because the tests have their own error builder
// We might want to test this on its own though
// $COVERAGE-OFF$
/** This extractor mixin provides an implementation for
* [[parsley.errors.ErrorBuilder.unexpectedToken `ErrorBuilder.unexpectedToken`]] when mixed into
* an error builder: it will construct a token that extends to the next available whitespace
* in the remaining input. It can be configured to constrict this token to the minimum of the
* next whitespace or whatever the parser demanded (see [[MatchParserDemand `MatchParserDemand`]]).
* @since 4.0.0
* @note In the case of unprintable characters or whitespace, this extractor will favour reporting
* a more meaningful name.
*/
trait TillNextWhitespace { this: ErrorBuilder[_] =>
    /** Controls whether the reported token is trimmed so that it is no wider than the
      * smaller of the distance to the next whitespace and the amount of input the
      * parser tried to consume.
      *
      * @return `true` to trim to parser demand, `false` to always extend to the next whitespace
      * @since 4.0.0
      */
    def trimToParserDemand: Boolean

    /** @see [[parsley.errors.ErrorBuilder.unexpectedToken `ErrorBuilder.unexpectedToken`]] */
    override final def unexpectedToken(cs: Iterable[Char], amountOfInputParserWanted: Int, @unused lexicalError: Boolean): Token = {
        // Both branches delegate to the companion object; only the trimming variant
        // needs to know how much input the parser asked for.
        if (!trimToParserDemand) TillNextWhitespace.unexpectedToken(cs)
        else TillNextWhitespace.unexpectedToken(cs, amountOfInputParserWanted)
    }
}
/** Contains the functionality of `TillNextWhitespace` as a function.
* @since 4.0.0
*/
object TillNextWhitespace {
    /** The implementation of `unexpectedToken` as done by `TillNextWhitespace`, with redundant arguments removed.
      *
      * The resulting token extends up to (but not including) the next whitespace character
      * in `cs`, unless `cs` is recognised by `helpers.WhitespaceOrUnprintable`, in which case
      * a named token of width 1 is produced instead.
      *
      * This function will '''not''' trim the token to parser demand.
      *
      * @param cs the remaining input at the point of the error
      * @return the token to report as unexpected
      * @since 4.0.0
      */
    def unexpectedToken(cs: Iterable[Char]): Token = buildToken(cs)(raw => raw)

    /** The implementation of `unexpectedToken` as done by `TillNextWhitespace`, with redundant arguments removed.
      *
      * The resulting token extends up to (but not including) the next whitespace character
      * in `cs`, unless `cs` is recognised by `helpers.WhitespaceOrUnprintable`, in which case
      * a named token of width 1 is produced instead.
      *
      * This function '''will''' trim the token to parser demand: the text found before the
      * next whitespace is further cut down by `helpers.takeCodePoints` using
      * `amountOfInputParserWanted` as the limit.
      *
      * @param cs the remaining input at the point of the error
      * @param amountOfInputParserWanted the amount of input the parser tried to consume
      *                                  (presumably measured in code points, going by the
      *                                  helper's name -- confirm against `helpers.takeCodePoints`)
      * @return the token to report as unexpected
      * @since 4.0.0
      */
    def unexpectedToken(cs: Iterable[Char], amountOfInputParserWanted: Int): Token = {
        buildToken(cs)(helpers.takeCodePoints(_, amountOfInputParserWanted))
    }

    /** Shared core of both `unexpectedToken` overloads.
      *
      * @param cs the remaining input at the point of the error
      * @param trim post-processing applied to the raw text found before the next whitespace
      * @return a named token for whitespace/unprintable input, otherwise a raw token
      */
    private def buildToken(cs: Iterable[Char])(trim: String => String): Token = cs match {
        case helpers.WhitespaceOrUnprintable(name) => Token.Named(name, TokenSpan.Width(1))
        // these cases automatically handle the utf-16 surrogate pairs
        case _ => Token.Raw(trim(extractTillNextWhitespace(cs)))
    }

    // TODO: we should take the minimum of parser demand and next whitespace, this would potentially be much much cheaper
    /** Collects the characters of `cs` that precede its first whitespace character
      * (or all of `cs` when it contains no whitespace).
      */
    private def extractTillNextWhitespace(cs: Iterable[Char]): String = cs match {
        case str: WrappedString =>
            // These do not require allocation on the string
            val firstWhitespace = str.indexWhere(_.isWhitespace)
            // -1 means no whitespace was found, so the whole string is the token
            val end = if (firstWhitespace == -1) str.length else firstWhitespace
            str.slice(0, end).toString
        case _ => cs.takeWhile(!_.isWhitespace).mkString
    }
}
// $COVERAGE-ON$
© 2015 - 2025 Weber Informatics LLC | Privacy Policy