org.unlaxer.CodePointString Maven / Gradle / Ivy

Go to download
package org.unlaxer;

import java.io.UnsupportedEncodingException;
import java.lang.CharSequence;
import java.lang.Character;
import java.lang.IllegalArgumentException;
import java.lang.IndexOutOfBoundsException;
import java.lang.Object;
import java.lang.String;
import java.lang.StringBuffer;
import java.nio.charset.Charset;
import java.util.Locale;
import java.util.function.Function;
import java.util.regex.PatternSyntaxException;
import java.util.stream.IntStream;
import java.util.stream.Stream;

/**
 * CP　means CodePoint
 */
public interface CodePointString {
  
  Function stringToStringInterface();
  Function stringInterfaceToStgring();
  
  StringIndex toStringIndex(CodePointIndex codePointIndex);
  CodePointIndex toCodePointIndex(StringIndex stringIndex);

  /**
   * Returns the length of this string.
   * The length is equal to the number of Unicode
   * code units in the string.
   *
   * @return  the length of the sequence of characters represented by this
   *          object.
   */
  StringLength stringLength();
  
  CodePointLength codePointLength();
  
  String getSource();

  /**
   * Returns {@code true} if, and only if, {@link #length()} is {@code 0}.
   *
   * @return {@code true} if {@link #length()} is {@code 0}, otherwise
   * {@code false}
   *
   * @since 1.6
   */
  boolean isEmpty();

  /**
   * Returns the {@code char} value at the
   * specified index. An index ranges from {@code 0} to
   * {@code length() - 1}. The first {@code char} value of the sequence
   * is at index {@code 0}, the next at index {@code 1},
   * and so on, as for array indexing.
   *
   * If the {@code char} value specified by the index is a
   * surrogate, the surrogate
   * value is returned.
   *
   * @param      index   the index of the {@code char} value.
   * @return     the {@code char} value at the specified index of this string.
   *             The first {@code char} value is at index {@code 0}.
   * @exception  IndexOutOfBoundsException  if the {@code index}
   *             argument is negative or not less than the length of this
   *             string.
   */
  char charAt(int index);
  
  default char charAt(StringIndex index) {
    return charAt(index.value());
  }


  /**
   * Returns the character (Unicode code point) at the specified
   * index. The index refers to {@code char} values
   * (Unicode code units) and ranges from {@code 0} to
   * {@link #length()}{@code  - 1}.
   *
   * 
 If the {@code char} value specified at the given index
   * is in the high-surrogate range, the following index is less
   * than the length of this {@code String}, and the
   * {@code char} value at the following index is in the
   * low-surrogate range, then the supplementary code point
   * corresponding to this surrogate pair is returned. Otherwise,
   * the {@code char} value at the given index is returned.
   *
   * @param      index the index to the {@code char} values
   * @return     the code point value of the character at the
   *             {@code index}
   * @exception  IndexOutOfBoundsException  if the {@code index}
   *             argument is negative or not less than the length of this
   *             string.
   * @since      1.5
   */
  int  codePointAt(int index);

  default CodePoint codePointAt(CodePointIndex index) {
    return new CodePoint(codePointAt(index.value()));
  }
  /**
   * Returns the character (Unicode code point) before the specified
   * index. The index refers to {@code char} values
   * (Unicode code units) and ranges from {@code 1} to {@link
   * CharSequence#length() length}.
   *
   * 
 If the {@code char} value at {@code (index - 1)}
   * is in the low-surrogate range, {@code (index - 2)} is not
   * negative, and the {@code char} value at {@code (index -
   * 2)} is in the high-surrogate range, then the
   * supplementary code point value of the surrogate pair is
   * returned. If the {@code char} value at {@code index -
   * 1} is an unpaired low-surrogate or a high-surrogate, the
   * surrogate value is returned.
   *
   * @param     index the index following the code point that should be returned
   * @return    the Unicode code point value before the given index.
   * @exception IndexOutOfBoundsException if the {@code index}
   *            argument is less than 1 or greater than the length
   *            of this string.
   * @since     1.5
   */
  int codePointBefore(int index);
  
  default CodePoint codePointBefore(CodePointIndex index) {
    return new CodePoint(codePointBefore(index.value()));
  }

  /**
   * Returns the number of Unicode code points in the specified text
   * range of this {@code String}. The text range begins at the
   * specified {@code beginIndex} and extends to the
   * {@code char} at index {@code endIndex - 1}. Thus the
   * length (in {@code char}s) of the text range is
   * {@code endIndex-beginIndex}. Unpaired surrogates within
   * the text range count as one code point each.
   *
   * @param beginIndex the index to the first {@code char} of
   * the text range.
   * @param endIndex the index after the last {@code char} of
   * the text range.
   * @return the number of Unicode code points in the specified text
   * range
   * @exception IndexOutOfBoundsException if the
   * {@code beginIndex} is negative, or {@code endIndex}
   * is larger than the length of this {@code String}, or
   * {@code beginIndex} is larger than {@code endIndex}.
   * @since  1.5
   */
  int codePointCount(int beginIndex, int endIndex);
  
  default CodePoint codePointCount(StringIndex beginIndex, StringIndex endIndex) {
    return new CodePoint(codePointCount(beginIndex.value(), endIndex.value()));
  }

  /**
   * Returns the index within this {@code String} that is
   * offset from the given {@code index} by
   * {@code codePointOffset} code points. Unpaired surrogates
   * within the text range given by {@code index} and
   * {@code codePointOffset} count as one code point each.
   *
   * @param index the index to be offset
   * @param codePointOffset the offset in code points
   * @return the index within this {@code String}
   * @exception IndexOutOfBoundsException if {@code index}
   *   is negative or larger then the length of this
   *   {@code String}, or if {@code codePointOffset} is positive
   *   and the substring starting with {@code index} has fewer
   *   than {@code codePointOffset} code points,
   *   or if {@code codePointOffset} is negative and the substring
   *   before {@code index} has fewer than the absolute value
   *   of {@code codePointOffset} code points.
   * @since 1.5
   */
  int offsetByCodePoints(int index, int codePointOffset);
  
  default StringIndex offsetByCodePoints(StringIndex index, CodePointOffset codePointOffset) {
    return new StringIndex(offsetByCodePoints(index.value(), codePointOffset.value()));
  }

  /**
   * Copies characters from this string into the destination character
   * array.
   * 

   * The first character to be copied is at index {@code srcBegin};
   * the last character to be copied is at index {@code srcEnd-1}
   * (thus the total number of characters to be copied is
   * {@code srcEnd-srcBegin}). The characters are copied into the
   * subarray of {@code dst} starting at index {@code dstBegin}
   * and ending at index:
   * 
   *     dstBegin + (srcEnd-srcBegin) - 1
   * 
   *
   * @param      srcBegin   index of the first character in the string
   *                        to copy.
   * @param      srcEnd     index after the last character in the string
   *                        to copy.
   * @param      dst        the destination array.
   * @param      dstBegin   the start offset in the destination array.
   * @exception IndexOutOfBoundsException If any of the following
   *            is true:
   *            {@code srcBegin} is negative.
   *            
{@code srcBegin} is greater than {@code srcEnd}
   *            
{@code srcEnd} is greater than the length of this
   *                string
   *            
{@code dstBegin} is negative
   *            
{@code dstBegin+(srcEnd-srcBegin)} is larger than
   *                {@code dst.length}
   */
  void getChars(int srcBegin, int srcEnd, char dst[], int dstBegin);
  
  default void getChars(StringIndex srcBegin, StringIndex srcEnd, char dst[], StringIndex dstBegin) {
    getChars(srcBegin.value(), srcEnd.value(), dst, dstBegin.value());
  }

  /**
   * Copies characters from this string into the destination byte array. Each
   * byte receives the 8 low-order bits of the corresponding character. The
   * eight high-order bits of each character are not copied and do not
   * participate in the transfer in any way.
   *
   *  The first character to be copied is at index {@code srcBegin}; the
   * last character to be copied is at index {@code srcEnd-1}.  The total
   * number of characters to be copied is {@code srcEnd-srcBegin}. The
   * characters, converted to bytes, are copied into the subarray of {@code
   * dst} starting at index {@code dstBegin} and ending at index:
   *
   * 
   *     dstBegin + (srcEnd-srcBegin) - 1
   * 
   *
   * @deprecated  This method does not properly convert characters into
   * bytes.  As of JDK 1.1, the preferred way to do this is via the
   * {@link #getBytes()} method, which uses the platform's default charset.
   *
   * @param  srcBegin
   *         Index of the first character in the string to copy
   *
   * @param  srcEnd
   *         Index after the last character in the string to copy
   *
   * @param  dst
   *         The destination array
   *
   * @param  dstBegin
   *         The start offset in the destination array
   *
   * @throws  IndexOutOfBoundsException
   *          If any of the following is true:
   *          
   *             {@code srcBegin} is negative
   *            
 {@code srcBegin} is greater than {@code srcEnd}
   *            
 {@code srcEnd} is greater than the length of this String
   *            
 {@code dstBegin} is negative
   *            
 {@code dstBegin+(srcEnd-srcBegin)} is larger than {@code
   *                 dst.length}
   *          
   */
  void getBytes(int srcBegin, int srcEnd, byte dst[], int dstBegin);

  default void getBytes(StringIndex srcBegin, StringIndex srcEnd, byte dst[], StringIndex dstBegin) {
    getBytes(srcBegin.value(), srcEnd.value(), dst, dstBegin.value());
  }
  
  /**
   * Encodes this {@code String} into a sequence of bytes using the named
   * charset, storing the result into a new byte array.
   *
   *  The behavior of this method when this string cannot be encoded in
   * the given charset is unspecified.  The {@link
   * java.nio.charset.CharsetEncoder} class should be used when more control
   * over the encoding process is required.
   *
   * @param  charsetName
   *         The name of a supported {@linkplain java.nio.charset.Charset
   *         charset}
   *
   * @return  The resultant byte array
   *
   * @throws  UnsupportedEncodingException
   *          If the named charset is not supported
   *
   * @since  1.1
   */
  byte[] getBytes(String charsetName) throws UnsupportedEncodingException;

  /**
   * Encodes this {@code String} into a sequence of bytes using the given
   * {@linkplain java.nio.charset.Charset charset}, storing the result into a
   * new byte array.
   *
   * 
 This method always replaces malformed-input and unmappable-character
   * sequences with this charset's default replacement byte array.  The
   * {@link java.nio.charset.CharsetEncoder} class should be used when more
   * control over the encoding process is required.
   *
   * @param  charset
   *         The {@linkplain java.nio.charset.Charset} to be used to encode
   *         the {@code String}
   *
   * @return  The resultant byte array
   *
   * @since  1.6
   */
  byte[] getBytes(Charset charset);

  /**
   * Encodes this {@code String} into a sequence of bytes using the
   * platform's default charset, storing the result into a new byte array.
   *
   * 
 The behavior of this method when this string cannot be encoded in
   * the default charset is unspecified.  The {@link
   * java.nio.charset.CharsetEncoder} class should be used when more control
   * over the encoding process is required.
   *
   * @return  The resultant byte array
   *
   * @since      1.1
   */
  byte[] getBytes();

  /**
   * Compares this string to the specified object.  The result is {@code
   * true} if and only if the argument is not {@code null} and is a {@code
   * String} object that represents the same sequence of characters as this
   * object.
   *
   * 
For finer-grained String comparison, refer to
   * {@link java.text.Collator}.
   *
   * @param  anObject
   *         The object to compare this {@code String} against
   *
   * @return  {@code true} if the given object represents a {@code String}
   *          equivalent to this string, {@code false} otherwise
   *
   * @see  #compareTo(String)
   * @see  #equalsIgnoreCase(String)
   */
  boolean equals(Object anObject);

  /**
   * Compares this string to the specified {@code StringBuffer}.  The result
   * is {@code true} if and only if this {@code String} represents the same
   * sequence of characters as the specified {@code StringBuffer}. This method
   * synchronizes on the {@code StringBuffer}.
   *
   * 
For finer-grained String comparison, refer to
   * {@link java.text.Collator}.
   *
   * @param  sb
   *         The {@code StringBuffer} to compare this {@code String} against
   *
   * @return  {@code true} if this {@code String} represents the same
   *          sequence of characters as the specified {@code StringBuffer},
   *          {@code false} otherwise
   *
   * @since  1.4
   */
  boolean contentEquals(StringBuffer sb);

  /**
   * Compares this string to the specified {@code CharSequence}.  The
   * result is {@code true} if and only if this {@code String} represents the
   * same sequence of char values as the specified sequence. Note that if the
   * {@code CharSequence} is a {@code StringBuffer} then the method
   * synchronizes on it.
   *
   * 
For finer-grained String comparison, refer to
   * {@link java.text.Collator}.
   *
   * @param  cs
   *         The sequence to compare this {@code String} against
   *
   * @return  {@code true} if this {@code String} represents the same
   *          sequence of char values as the specified sequence, {@code
   *          false} otherwise
   *
   * @since  1.5
   */
  boolean contentEquals(CharSequence cs);

  /**
   * Compares this {@code String} to another {@code String}, ignoring case
   * considerations.  Two strings are considered equal ignoring case if they
   * are of the same length and corresponding characters in the two strings
   * are equal ignoring case.
   *
   * 
 Two characters {@code c1} and {@code c2} are considered the same
   * ignoring case if at least one of the following is true:
   * 

   *    The two characters are the same (as compared by the
   *        {@code ==} operator)
   *   
 Calling {@code Character.toLowerCase(Character.toUpperCase(char))}
   *        on each character produces the same result
   * 
   *
   * Note that this method does not take locale into account, and
   * will result in unsatisfactory results for certain locales.  The
   * {@link java.text.Collator} class provides locale-sensitive comparison.
   *
   * @param  anotherString
   *         The {@code String} to compare this {@code String} against
   *
   * @return  {@code true} if the argument is not {@code null} and it
   *          represents an equivalent {@code String} ignoring case; {@code
   *          false} otherwise
   *
   * @see  #equals(Object)
   */
  boolean equalsIgnoreCase(String anotherString);

  default boolean equalsIgnoreCase(CodePointString anotherString) {
    return equalsIgnoreCase(anotherString.toString());
  }

  /**
   * Compares two strings lexicographically.
   * The comparison is based on the Unicode value of each character in
   * the strings. The character sequence represented by this
   * {@code String} object is compared lexicographically to the
   * character sequence represented by the argument string. The result is
   * a negative integer if this {@code String} object
   * lexicographically precedes the argument string. The result is a
   * positive integer if this {@code String} object lexicographically
   * follows the argument string. The result is zero if the strings
   * are equal; {@code compareTo} returns {@code 0} exactly when
   * the {@link #equals(Object)} method would return {@code true}.
   * 

   * This is the definition of lexicographic ordering. If two strings are
   * different, then either they have different characters at some index
   * that is a valid index for both strings, or their lengths are different,
   * or both. If they have different characters at one or more index
   * positions, let k be the smallest such index; then the string
   * whose character at position k has the smaller value, as
   * determined by using the {@code <} operator, lexicographically precedes the
   * other string. In this case, {@code compareTo} returns the
   * difference of the two character values at position {@code k} in
   * the two string -- that is, the value:
   * 
   * this.charAt(k)-anotherString.charAt(k)
   * 
   * If there is no index position at which they differ, then the shorter
   * string lexicographically precedes the longer string. In this case,
   * {@code compareTo} returns the difference of the lengths of the
   * strings -- that is, the value:
   *    * this.length()-anotherString.length()
   * 
   *
   * For finer-grained String comparison, refer to
   * {@link java.text.Collator}.
   *
   * @param   anotherString   the {@code String} to be compared.
   * @return  the value {@code 0} if the argument string is equal to
   *          this string; a value less than {@code 0} if this string
   *          is lexicographically less than the string argument; and a
   *          value greater than {@code 0} if this string is
   *          lexicographically greater than the string argument.
   */
  int compareTo(String anotherString);
  
  default int compareTo(CodePointString  anotherString) {
    return compareTo(anotherString.toString());
  }

  /**
   * Compares two strings lexicographically, ignoring case
   * differences. This method returns an integer whose sign is that of
   * calling {@code compareTo} with normalized versions of the strings
   * where case differences have been eliminated by calling
   * {@code Character.toLowerCase(Character.toUpperCase(character))} on
   * each character.
   * 

   * Note that this method does not take locale into account,
   * and will result in an unsatisfactory ordering for certain locales.
   * The {@link java.text.Collator} class provides locale-sensitive comparison.
   *
   * @param   str   the {@code String} to be compared.
   * @return  a negative integer, zero, or a positive integer as the
   *          specified String is greater than, equal to, or less
   *          than this String, ignoring case considerations.
   * @see     java.text.Collator
   * @since   1.2
   */
  int compareToIgnoreCase(String str);
  
  default int compareToIgnoreCase(CodePointString str) {
    return compareToIgnoreCase(str.toString());
  }

  /**
   * Tests if two string regions are equal.
   * 

   * A substring of this {@code String} object is compared to a substring
   * of the argument other. The result is true if these substrings
   * represent identical character sequences. The substring of this
   * {@code String} object to be compared begins at index {@code toffset}
   * and has length {@code len}. The substring of other to be compared
   * begins at index {@code ooffset} and has length {@code len}. The
   * result is {@code false} if and only if at least one of the following
   * is true:
   * 
{@code toffset} is negative.
   * 
{@code ooffset} is negative.
   * 
{@code toffset+len} is greater than the length of this
   * {@code String} object.
   * 
{@code ooffset+len} is greater than the length of the other
   * argument.
   * 
There is some nonnegative integer k less than {@code len}
   * such that:
   * {@code this.charAt(toffset + }k{@code ) != other.charAt(ooffset + }
   * k{@code )}
   * 
   *
   * Note that this method does not take locale into account.  The
   * {@link java.text.Collator} class provides locale-sensitive comparison.
   *
   * @param   toffset   the starting offset of the subregion in this string.
   * @param   other     the string argument.
   * @param   ooffset   the starting offset of the subregion in the string
   *                    argument.
   * @param   len       the number of characters to compare.
   * @return  {@code true} if the specified subregion of this string
   *          exactly matches the specified subregion of the string argument;
   *          {@code false} otherwise.
   */
  boolean regionMatches(int toffset, String other, int ooffset, int len);
  
  default boolean regionMatches(CodePointIndex toffset, String other, CodePointIndex ooffset, Length len) {
    return regionMatches(toStringIndex(toffset).value(), other , toStringIndex(ooffset).value(), len.value());
  }
  
  default boolean regionMatches(CodePointIndex toffset, CodePointString other, CodePointIndex ooffset, Length len) {
    return regionMatches(toStringIndex(toffset).value() 
, other.getSource(), toStringIndex(ooffset).value(), len.value());
  }
  
  /**
   * Tests if two string regions are equal.
   * 

   * A substring of this {@code String} object is compared to a substring
   * of the argument {@code other}. The result is {@code true} if these
   * substrings represent character sequences that are the same, ignoring
   * case if and only if {@code ignoreCase} is true. The substring of
   * this {@code String} object to be compared begins at index
   * {@code toffset} and has length {@code len}. The substring of
   * {@code other} to be compared begins at index {@code ooffset} and
   * has length {@code len}. The result is {@code false} if and only if
   * at least one of the following is true:
   * 
{@code toffset} is negative.
   * 
{@code ooffset} is negative.
   * 
{@code toffset+len} is greater than the length of this
   * {@code String} object.
   * 
{@code ooffset+len} is greater than the length of the other
   * argument.
   * 
{@code ignoreCase} is {@code false} and there is some nonnegative
   * integer k less than {@code len} such that:
   *    * this.charAt(toffset+k) != other.charAt(ooffset+k)
   * 
   * 
{@code ignoreCase} is {@code true} and there is some nonnegative
   * integer k less than {@code len} such that:
   *    * Character.toLowerCase(Character.toUpperCase(this.charAt(toffset+k))) !=
   Character.toLowerCase(Character.toUpperCase(other.charAt(ooffset+k)))
   * 
   * 
   *
   * Note that this method does not take locale into account,
   * and will result in unsatisfactory results for certain locales when
   * {@code ignoreCase} is {@code true}.  The {@link java.text.Collator} class
   * provides locale-sensitive comparison.
   *
   * @param   ignoreCase   if {@code true}, ignore case when comparing
   *                       characters.
   * @param   toffset      the starting offset of the subregion in this
   *                       string.
   * @param   other        the string argument.
   * @param   ooffset      the starting offset of the subregion in the string
   *                       argument.
   * @param   len          the number of characters to compare.
   * @return  {@code true} if the specified subregion of this string
   *          matches the specified subregion of the string argument;
   *          {@code false} otherwise. Whether the matching is exact
   *          or case insensitive depends on the {@code ignoreCase}
   *          argument.
   */
  boolean regionMatches(boolean ignoreCase, int toffset, String other, int ooffset, int len);
  
  default boolean regionMatches(boolean ignoreCase, CodePointIndex toffset, String other, CodePointIndex ooffset, Length len) {
    return regionMatches(ignoreCase, toStringIndex(toffset).value(), other, toStringIndex(ooffset).value(), len.value());
  }
  
  default boolean regionMatches(boolean ignoreCase, CodePointIndex toffset, CodePointString other, CodePointIndex ooffset, Length len) {
    return regionMatches(ignoreCase, toStringIndex(toffset).value(), other.getSource(), toStringIndex(ooffset).value(), len.value());
  }

  /**
   * Tests if the substring of this string beginning at the
   * specified index starts with the specified prefix.
   *
   * @param   prefix    the prefix.
   * @param   toffset   where to begin looking in this string.
   * @return  {@code true} if the character sequence represented by the
   *          argument is a prefix of the substring of this object starting
   *          at index {@code toffset}; {@code false} otherwise.
   *          The result is {@code false} if {@code toffset} is
   *          negative or greater than the length of this
   *          {@code String} object; otherwise the result is the same
   *          as the result of the expression
   *          
   *          this.substring(toffset).startsWith(prefix)
   *          
   */
  boolean startsWith(String prefix, int toffset);
  
  default boolean startsWith(String prefix, CodePointIndex toffset) {
    return startsWith(prefix, toStringIndex(toffset).value());
  }
  
  default boolean startsWith(CodePointString prefix, CodePointIndex toffset) {
    return startsWith(prefix.getSource(), toStringIndex(toffset).value());
  }

  /**
   * Tests if this string starts with the specified prefix.
   *
   * @param   prefix   the prefix.
   * @return  {@code true} if the character sequence represented by the
   *          argument is a prefix of the character sequence represented by
   *          this string; {@code false} otherwise.
   *          Note also that {@code true} will be returned if the
   *          argument is an empty string or is equal to this
   *          {@code String} object as determined by the
   *          {@link #equals(Object)} method.
   * @since   1.0
   */
  boolean startsWith(String prefix);
  
  default boolean startsWith(CodePointString prefix) {
    return startsWith(prefix.getSource());
  }

  /**
   * Tests if this string ends with the specified suffix.
   *
   * @param   suffix   the suffix.
   * @return  {@code true} if the character sequence represented by the
   *          argument is a suffix of the character sequence represented by
   *          this object; {@code false} otherwise. Note that the
   *          result will be {@code true} if the argument is the
   *          empty string or is equal to this {@code String} object
   *          as determined by the {@link #equals(Object)} method.
   */
  boolean endsWith(String suffix);
  
  default boolean endsWith(CodePointString suffix) {
    return endsWith(suffix.getSource());
  }

  /**
   * Returns a hash code for this string. The hash code for a
   * {@code String} object is computed as
   *    * s[0]*31^(n-1) + s[1]*31^(n-2) + ... + s[n-1]
   * 
   * using {@code int} arithmetic, where {@code s[i]} is the
   * ith character of the string, {@code n} is the length of
   * the string, and {@code ^} indicates exponentiation.
   * (The hash value of the empty string is zero.)
   *
   * @return  a hash code value for this object.
   */
  int hashCode();

  /**
   * Returns the index within this string of the first occurrence of
   * the specified character. If a character with value
   * {@code ch} occurs in the character sequence represented by
   * this {@code String} object, then the index (in Unicode
   * code units) of the first such occurrence is returned. For
   * values of {@code ch} in the range from 0 to 0xFFFF
   * (inclusive), this is the smallest value k such that:
   *    * this.charAt(k) == ch
   * 
   * is true. For other values of {@code ch}, it is the
   * smallest value k such that:
   *    * this.codePointAt(k) == ch
   * 
   * is true. In either case, if no such character occurs in this
   * string, then {@code -1} is returned.
   *
   * @param   ch   a character (Unicode code point).
   * @return  the index of the first occurrence of the character in the
   *          character sequence represented by this object, or
   *          {@code -1} if the character does not occur.
   */
  int indexOf(int ch);
  
  default CodePointIndexWithNegativeValue indexOf(CodePoint codePoint) {
    return new CodePointIndexWithNegativeValue(
        toCodePointIndex(new StringIndex(indexOf(codePoint.value()))));
  }

  /**
   * Returns the index within this string of the first occurrence of the
   * specified character, starting the search at the specified index.
   * 
   * If a character with value {@code ch} occurs in the
   * character sequence represented by this {@code String}
   * object at an index no smaller than {@code fromIndex}, then
   * the index of the first such occurrence is returned. For values
   * of {@code ch} in the range from 0 to 0xFFFF (inclusive),
   * this is the smallest value k such that:
   * 
   * (this.charAt(k) == ch) {@code &&} (k >= fromIndex)
   * 
   * is true. For other values of {@code ch}, it is the
   * smallest value k such that:
   *    * (this.codePointAt(k) == ch) {@code &&} (k >= fromIndex)
   * 
   * is true. In either case, if no such character occurs in this
   * string at or after position {@code fromIndex}, then
   * {@code -1} is returned.
   *
   * 
   * There is no restriction on the value of {@code fromIndex}. If it
   * is negative, it has the same effect as if it were zero: this entire
   * string may be searched. If it is greater than the length of this
   * string, it has the same effect as if it were equal to the length of
   * this string: {@code -1} is returned.
   *
   * 
All indices are specified in {@code char} values
   * (Unicode code units).
   *
   * @param   ch          a character (Unicode code point).
   * @param   fromIndex   the index to start the search from.
   * @return  the index of the first occurrence of the character in the
   *          character sequence represented by this object that is greater
   *          than or equal to {@code fromIndex}, or {@code -1}
   *          if the character does not occur.
   */
  int indexOf(int ch, int fromIndex);
  
  default CodePointIndexWithNegativeValue indexOf(CodePoint codePoint, CodePointIndex fromIndex) {
    return new CodePointIndexWithNegativeValue(
        toCodePointIndex(new StringIndex(indexOf(codePoint.value(),toStringIndex(fromIndex).value()))));
  }

  /**
   * Returns the index within this string of the last occurrence of
   * the specified character. For values of {@code ch} in the
   * range from 0 to 0xFFFF (inclusive), the index (in Unicode code
   * units) returned is the largest value k such that:
   * 
   * this.charAt(k) == ch
   * 
   * is true. For other values of {@code ch}, it is the
   * largest value k such that:
   *    * this.codePointAt(k) == ch
   * 
   * is true.  In either case, if no such character occurs in this
   * string, then {@code -1} is returned.  The
   * {@code String} is searched backwards starting at the last
   * character.
   *
   * @param   ch   a character (Unicode code point).
   * @return  the index of the last occurrence of the character in the
   *          character sequence represented by this object, or
   *          {@code -1} if the character does not occur.
   */
  int lastIndexOf(int ch);
  
  default CodePointIndexWithNegativeValue lastIndexOf(CodePoint codePoint) {
    return new CodePointIndexWithNegativeValue(
        toCodePointIndex(new StringIndex(lastIndexOf(codePoint.value()))));
  }

  /**
   * Returns the index within this string of the last occurrence of
   * the specified character, searching backward starting at the
   * specified index. For values of {@code ch} in the range
   * from 0 to 0xFFFF (inclusive), the index returned is the largest
   * value k such that:
   *    * (this.charAt(k) == ch) {@code &&} (k <= fromIndex)
   * 
   * is true. For other values of {@code ch}, it is the
   * largest value k such that:
   *    * (this.codePointAt(k) == ch) {@code &&} (k <= fromIndex)
   * 
   * is true. In either case, if no such character occurs in this
   * string at or before position {@code fromIndex}, then
   * {@code -1} is returned.
   *
   * All indices are specified in {@code char} values
   * (Unicode code units).
   *
   * @param   ch          a character (Unicode code point).
   * @param   fromIndex   the index to start the search from. There is no
   *          restriction on the value of {@code fromIndex}. If it is
   *          greater than or equal to the length of this string, it has
   *          the same effect as if it were equal to one less than the
   *          length of this string: this entire string may be searched.
   *          If it is negative, it has the same effect as if it were -1:
   *          -1 is returned.
   * @return  the index of the last occurrence of the character in the
   *          character sequence represented by this object that is less
   *          than or equal to {@code fromIndex}, or {@code -1}
   *          if the character does not occur before that point.
   */
  int lastIndexOf(int ch, int fromIndex);
  
  default CodePointIndexWithNegativeValue lastIndexOf(CodePoint codePoint, CodePointIndex fromIndex) {
    return new CodePointIndexWithNegativeValue(
        toCodePointIndex(new StringIndex(lastIndexOf(codePoint.value(), toStringIndex(fromIndex).value()))));
  }

  /**
   * Returns the index within this string of the first occurrence of the
   * specified substring.
   *
   * 
The returned index is the smallest value {@code k} for which:
   * 
{@code
   * this.startsWith(str, k)
   * }
   * If no such value of {@code k} exists, then {@code -1} is returned.
   *
   * @param   str   the substring to search for.
   * @return  the index of the first occurrence of the specified substring,
   *          or {@code -1} if there is no such occurrence.
   */
  int indexOf(String str);
  
  default CodePointIndexWithNegativeValue indexOf(CodePointString str) {
    return new CodePointIndexWithNegativeValue(
        toCodePointIndex(new StringIndex(indexOf(str.getSource()))));
  }

  /**
   * Returns the index within this string of the first occurrence of the
   * specified substring, starting at the specified index.
   *
   * The returned index is the smallest value {@code k} for which:
   * 
{@code
   *     k >= Math.min(fromIndex, this.length()) &&
   *                   this.startsWith(str, k)
   * }
   * If no such value of {@code k} exists, then {@code -1} is returned.
   *
   * @param   str         the substring to search for.
   * @param   fromIndex   the index from which to start the search.
   * @return  the index of the first occurrence of the specified substring,
   *          starting at the specified index,
   *          or {@code -1} if there is no such occurrence.
   */
  int indexOf(String str, int fromIndex);
  
  default CodePointIndex indexOf(CodePointString str, CodePointIndex fromIndex) {
    return 
        toCodePointIndex(new StringIndex(indexOf(str.getSource(),
            toStringIndex(fromIndex).value())));
  }


  /**
   * Returns the index within this string of the last occurrence of the
   * specified substring.  The last occurrence of the empty string ""
   * is considered to occur at the index value {@code this.length()}.
   *
   * The returned index is the largest value {@code k} for which:
   * 
{@code
   * this.startsWith(str, k)
   * }
   * If no such value of {@code k} exists, then {@code -1} is returned.
   *
   * @param   str   the substring to search for.
   * @return  the index of the last occurrence of the specified substring,
   *          or {@code -1} if there is no such occurrence.
   */
  int lastIndexOf(String str);

  default CodePointIndex lastIndexOf(CodePointString str) {
    return 
        toCodePointIndex(new StringIndex(lastIndexOf(str.getSource())));
  }

  /**
   * Returns the index within this string of the last occurrence of the
   * specified substring, searching backward starting at the specified index.
   *
   * The returned index is the largest value {@code k} for which:
   * 
{@code
   *     k <= Math.min(fromIndex, this.length()) &&
   *                   this.startsWith(str, k)
   * }
   * If no such value of {@code k} exists, then {@code -1} is returned.
   *
   * @param   str         the substring to search for.
   * @param   fromIndex   the index to start the search from.
   * @return  the index of the last occurrence of the specified substring,
   *          searching backward from the specified index,
   *          or {@code -1} if there is no such occurrence.
   */
  int lastIndexOf(String str, int fromIndex);

  default CodePointIndex lastIndexOf(CodePointString str, CodePointIndex fromIndex) {
    return 
        toCodePointIndex(new StringIndex(lastIndexOf(str.getSource() , 
            toStringIndex(fromIndex).value())));
  }
  
  /**
   * Returns a string that is a substring of this string. The
   * substring begins with the character at the specified index and
   * extends to the end of this string. 
   * Examples:
   * 
   * "unhappy".substring(2) returns "happy"
   * "Harbison".substring(3) returns "bison"
   * "emptiness".substring(9) returns "" (an empty string)
   * 
   *
   * @param      beginIndex   the beginning index, inclusive.
   * @return     the specified substring.
   * @exception  IndexOutOfBoundsException  if
   *             {@code beginIndex} is negative or larger than the
   *             length of this {@code String} object.
   */
  String substring(int beginIndex);
  
  default CodePointString substring(CodePointIndex beginIndex) {
    return stringToStringInterface().apply(substring(toStringIndex(beginIndex).value()));
  }

  /**
   * Returns a string that is a substring of this string. The
   * substring begins at the specified {@code beginIndex} and
   * extends to the character at index {@code endIndex - 1}.
   * Thus the length of the substring is {@code endIndex-beginIndex}.
   * 
   * Examples:
   * 
   * "hamburger".substring(4, 8) returns "urge"
   * "smiles".substring(1, 5) returns "mile"
   * 
   *
   * @param      beginIndex   the beginning index, inclusive.
   * @param      endIndex     the ending index, exclusive.
   * @return     the specified substring.
   * @exception  IndexOutOfBoundsException  if the
   *             {@code beginIndex} is negative, or
   *             {@code endIndex} is larger than the length of
   *             this {@code String} object, or
   *             {@code beginIndex} is larger than
   *             {@code endIndex}.
   */
  String substring(int beginIndex, int endIndex);
  
  default CodePointString substring(CodePointIndex beginIndex, CodePointIndex endIndex) {
      return stringToStringInterface().apply(substring(
          toStringIndex(beginIndex).value(),toStringIndex(endIndex).value()));
  }

  /**
   * Returns a character sequence that is a subsequence of this sequence.
   *
   *  An invocation of this method of the form
   *
   * 
   * str.subSequence(begin, end)
   *
   * behaves in exactly the same way as the invocation
   *
   *    * str.substring(begin, end)
   *
   * @apiNote
   * This method is defined so that the {@code String} class can implement
   * the {@link CharSequence} interface.
   *
   * @param   beginIndex   the begin index, inclusive.
   * @param   endIndex     the end index, exclusive.
   * @return  the specified subsequence.
   *
   * @throws  IndexOutOfBoundsException
   *          if {@code beginIndex} or {@code endIndex} is negative,
   *          if {@code endIndex} is greater than {@code length()},
   *          or if {@code beginIndex} is greater than {@code endIndex}
   *
   * @since 1.4
   * @spec JSR-51
   */
  CharSequence subSequence(int beginIndex, int endIndex);

  /**
   * Concatenates the specified string to the end of this string.
   * 
   * If the length of the argument string is {@code 0}, then this
   * {@code String} object is returned. Otherwise, a
   * {@code String} object is returned that represents a character
   * sequence that is the concatenation of the character sequence
   * represented by this {@code String} object and the character
   * sequence represented by the argument string.

   * Examples:
   * 
   * "cares".concat("s") returns "caress"
   * "to".concat("get").concat("her") returns "together"
   * 
   *
   * @param   str   the {@code String} that is concatenated to the end
   *                of this {@code String}.
   * @return  a string that represents the concatenation of this object's
   *          characters followed by the string argument's characters.
   */
  String concat(String str);
  
  default CodePointString concat(CodePointString str) {
    return stringToStringInterface().apply(concat(str.getSource()));
  }

  /**
   * Returns a string resulting from replacing all occurrences of
   * {@code oldChar} in this string with {@code newChar}.
   * 
   * If the character {@code oldChar} does not occur in the
   * character sequence represented by this {@code String} object,
   * then a reference to this {@code String} object is returned.
   * Otherwise, a {@code String} object is returned that
   * represents a character sequence identical to the character sequence
   * represented by this {@code String} object, except that every
   * occurrence of {@code oldChar} is replaced by an occurrence
   * of {@code newChar}.
   * 

   * Examples:
   * 
   * "mesquite in your cellar".replace('e', 'o')
   *         returns "mosquito in your collar"
   * "the war of baronets".replace('r', 'y')
   *         returns "the way of bayonets"
   * "sparring with a purple porpoise".replace('p', 't')
   *         returns "starring with a turtle tortoise"
   * "JonL".replace('q', 'x') returns "JonL" (no change)
   * 
   *
   * @param   oldChar   the old character.
   * @param   newChar   the new character.
   * @return  a string derived from this string by replacing every
   *          occurrence of {@code oldChar} with {@code newChar}.
   */
  String replace(char oldChar, char newChar);
  
  default CodePointString replaceAsStringInterface(char oldChar, char newChar) {
    
    return stringToStringInterface().apply(replace(oldChar, newChar));
  }
  
  /**
   * Tells whether or not this string matches the given regular expression.
   *
   *  An invocation of this method of the form
   * str{@code .matches(}regex{@code )} yields exactly the
   * same result as the expression
   *
   * 

   * {@link java.util.regex.Pattern}.{@link java.util.regex.Pattern#matches(String,CharSequence)
   * matches(regex, str)}
   * 
   *
   * @param   regex
   *          the regular expression to which this string is to be matched
   *
   * @return  {@code true} if, and only if, this string matches the
   *          given regular expression
   *
   * @throws  PatternSyntaxException
   *          if the regular expression's syntax is invalid
   *
   * @see java.util.regex.Pattern
   *
   * @since 1.4
   * @spec JSR-51
   */
  boolean matches(String regex);

  /**
   * Returns true if and only if this string contains the specified
   * sequence of char values.
   *
   * @param s the sequence to search for
   * @return true if this string contains {@code s}, false otherwise
   * @since 1.5
   */
  boolean contains(CharSequence s);

  /**
   * Replaces the first substring of this string that matches the given regular expression with the
   * given replacement.
   *
   *  An invocation of this method of the form
   * str{@code .replaceFirst(}regex{@code ,} repl{@code )}
   * yields exactly the same result as the expression
   *
   * 

   * 
   * {@link java.util.regex.Pattern}.{@link
   * java.util.regex.Pattern#compile compile}(regex).{@link
   * java.util.regex.Pattern#matcher(java.lang.CharSequence) matcher}(str).{@link
   * java.util.regex.Matcher#replaceFirst replaceFirst}(repl)
   * 
   * 
   *
   *
   * Note that backslashes ({@code \}) and dollar signs ({@code $}) in the
   * replacement string may cause the results to be different than if it were
   * being treated as a literal replacement string; see
   * {@link java.util.regex.Matcher#replaceFirst}.
   * Use {@link java.util.regex.Matcher#quoteReplacement} to suppress the special
   * meaning of these characters, if desired.
   *
   * @param   regex
   *          the regular expression to which this string is to be matched
   * @param   replacement
   *          the string to be substituted for the first match
   *
   * @return  The resulting {@code String}
   *
   * @throws  PatternSyntaxException
   *          if the regular expression's syntax is invalid
   *
   * @see java.util.regex.Pattern
   *
   * @since 1.4
   * @spec JSR-51
   */
  String replaceFirst(String regex, String replacement);
  
  default CodePointString replaceFirst(String regex, CodePointString replacement) {
    return stringToStringInterface().apply(replaceFirst(regex, replacement.toString()));
  }


  /**
   * Replaces each substring of this string that matches the given regular expression with the
   * given replacement.
   *
   * 
 An invocation of this method of the form
   * str{@code .replaceAll(}regex{@code ,} repl{@code )}
   * yields exactly the same result as the expression
   *
   * 

   * 
   * {@link java.util.regex.Pattern}.{@link
   * java.util.regex.Pattern#compile compile}(regex).{@link
   * java.util.regex.Pattern#matcher(java.lang.CharSequence) matcher}(str).{@link
   * java.util.regex.Matcher#replaceAll replaceAll}(repl)
   * 
   * 
   *
   *
   * Note that backslashes ({@code \}) and dollar signs ({@code $}) in the
   * replacement string may cause the results to be different than if it were
   * being treated as a literal replacement string; see
   * {@link java.util.regex.Matcher#replaceAll Matcher.replaceAll}.
   * Use {@link java.util.regex.Matcher#quoteReplacement} to suppress the special
   * meaning of these characters, if desired.
   *
   * @param   regex
   *          the regular expression to which this string is to be matched
   * @param   replacement
   *          the string to be substituted for each match
   *
   * @return  The resulting {@code String}
   *
   * @throws  PatternSyntaxException
   *          if the regular expression's syntax is invalid
   *
   * @see java.util.regex.Pattern
   *
   * @since 1.4
   * @spec JSR-51
   */
  String replaceAll(String regex, String replacement);
  
  default CodePointString replaceAll(String regex, CodePointString replacement) {
    return stringToStringInterface().apply(replaceAll(regex, replacement.toString()));
  }

  /**
   * Replaces each substring of this string that matches the literal target
   * sequence with the specified literal replacement sequence. The
   * replacement proceeds from the beginning of the string to the end, for
   * example, replacing "aa" with "b" in the string "aaa" will result in
   * "ba" rather than "ab".
   *
   * @param  target The sequence of char values to be replaced
   * @param  replacement The replacement sequence of char values
   * @return  The resulting string
   * @since 1.5
   */
  String replace(CharSequence target, CharSequence replacement);
  
  default CodePointString replaceaAsStringInterface(CharSequence target, CharSequence replacement) {
    return stringToStringInterface().apply(replace(target, replacement));
  }

  /**
   * Splits this string around matches of the given
   * regular expression.
   *
   * 
 The array returned by this method contains each substring of this
   * string that is terminated by another substring that matches the given
   * expression or is terminated by the end of the string.  The substrings in
   * the array are in the order in which they occur in this string.  If the
   * expression does not match any part of the input then the resulting array
   * has just one element, namely this string.
   *
   * 
 When there is a positive-width match at the beginning of this
   * string then an empty leading substring is included at the beginning
   * of the resulting array. A zero-width match at the beginning however
   * never produces such empty leading substring.
   *
   * 
 The {@code limit} parameter controls the number of times the
   * pattern is applied and therefore affects the length of the resulting
   * array.
   * 

   *    
   *    If the limit is positive then the pattern will be applied
   *    at most limit - 1 times, the array's length will be
   *    no greater than limit, and the array's last entry will contain
   *    all input beyond the last matched delimiter.
   *
   *    
   *    If the limit is zero then the pattern will be applied as
   *    many times as possible, the array can have any length, and trailing
   *    empty strings will be discarded.
   *
   *    
   *    If the limit is negative then the pattern will be applied
   *    as many times as possible and the array can have any length.
   * 
   *
   *  The string {@code "boo:and:foo"}, for example, yields the
   * following results with these parameters:
   *
   * 

   * 
   * 
   * 
   *     
   *     
   *     
   * 
   * 
   * 
   * 
   *     
   *     
   * 
   *     
   *     
   * 
   *     
   *     
   * 
   *     
   *     
   * 
   *     
   *     
   * 
   *     
   *     
   * 
   * Split example showing regex, limit, and resultRegex Limit Result
: 2 {@code { "boo", "and:foo" }}
5 {@code { "boo", "and", "foo" }}
-2 {@code { "boo", "and", "foo" }}
o 5 {@code { "b", "", ":and:f", "", "" }}
-2 {@code { "b", "", ":and:f", "", "" }}
0 {@code { "b", "", ":and:f" }}
   *
   *  An invocation of this method of the form
   * str.{@code split(}regex{@code ,} n{@code )}
   * yields the same result as the expression
   *
   * 

   * 
   * {@link java.util.regex.Pattern}.{@link
   * java.util.regex.Pattern#compile compile}(regex).{@link
   * java.util.regex.Pattern#split(java.lang.CharSequence,int) split}(str, n)
   * 
   * 
   *
   *
   * @param  regex
   *         the delimiting regular expression
   *
   * @param  limit
   *         the result threshold, as described above
   *
   * @return  the array of strings computed by splitting this string
   *          around matches of the given regular expression
   *
   * @throws  PatternSyntaxException
   *          if the regular expression's syntax is invalid
   *
   * @see java.util.regex.Pattern
   *
   * @since 1.4
   * @spec JSR-51
   */
  String[] split(String regex, int limit);
  
  default CodePointString[] splitAsStringInterface(String regex, int limit) {
    
    String[] returning = split(regex, limit);
    
    CodePointString[] result = new CodePointString[returning.length];
    
    int i =0;
    for (String string : returning) {
      
      result[i++] = stringToStringInterface().apply(string);
    }
    return result;
  }


  /**
   * Splits this string around matches of the given regular expression.
   *
   *  This method works as if by invoking the two-argument {@link
   * #split(String, int) split} method with the given expression and a limit
   * argument of zero.  Trailing empty strings are therefore not included in
   * the resulting array.
   *
   * 
 The string {@code "boo:and:foo"}, for example, yields the following
   * results with these expressions:
   *
   * 

   * 
   * 
   * 
   *  
   *  
   * 
   * 
   * 
   * 
   *     
   * 
   *     
   * 
   * Split examples showing regex and resultRegex Result
: {@code { "boo", "and", "foo" }}
o {@code { "b", "", ":and:f" }}
   *
   *
   * @param  regex
   *         the delimiting regular expression
   *
   * @return  the array of strings computed by splitting this string
   *          around matches of the given regular expression
   *
   * @throws  PatternSyntaxException
   *          if the regular expression's syntax is invalid
   *
   * @see java.util.regex.Pattern
   *
   * @since 1.4
   * @spec JSR-51
   */
  String[] split(String regex);
  
  default CodePointString[] splitAsStringInterface(String regex) {
    
    String[] returning = split(regex);
    
    CodePointString[] result = new CodePointString[returning.length];
    
    int i =0;
    for (String string : returning) {
      
      result[i++] = stringToStringInterface().apply(string);
    }
    return result;
  }


  /**
   * Converts all of the characters in this {@code String} to lower
   * case using the rules of the given {@code Locale}.  Case mapping is based
   * on the Unicode Standard version specified by the {@link org.unlaxer.java.lang.Character Character}
   * class. Since case mappings are not always 1:1 char mappings, the resulting
   * {@code String} may be a different length than the original {@code String}.
   * 
   * Examples of lowercase  mappings are in the following table:
   * 
   * 
   * 
   * 
   *   
   *   
   *   
   *   
   * 
   * 
   * 
   * 
   *   
   *   
   *   
   *   
   * 
   * 
   *   
   *   
   *   
   *   
   * 
   * 
   *   
   *   
   *   
   *   
   * 
   * 
   *   
   *   
   *   
   *   
   * 
   * 
   * Lowercase mapping examples showing language code of locale, upper case, lower case, and descriptionLanguage Code of Locale Upper Case Lower Case Description
tr (Turkish) \u0130 \u0069 capital letter I with dot above -> small letter i
tr (Turkish) \u0049 \u0131 capital letter I -> small letter dotless i 
(all) French Fries french fries lowercased all chars in String
(all) 
   *       ΙΧΘΥΣ ιχθυσ lowercased all chars in String
   *
   * @param locale use the case transformation rules for this locale
   * @return the {@code String}, converted to lowercase.
   * @see     java.lang.String#toLowerCase()
   * @see     java.lang.String#toUpperCase()
   * @see     java.lang.String#toUpperCase(Locale)
   * @since   1.1
   */
  String toLowerCase(Locale locale);
  
  default CodePointString toLowerCaseAsStringInterface(Locale locale){
    return stringToStringInterface().apply(toLowerCase(locale));
  }

  /**
   * Converts all of the characters in this {@code String} to lower
   * case using the rules of the default locale. This is equivalent to calling
   * {@code toLowerCase(Locale.getDefault())}.
   * 
   * Note: This method is locale sensitive, and may produce unexpected
   * results if used for strings that are intended to be interpreted locale
   * independently.
   * Examples are programming language identifiers, protocol keys, and HTML
   * tags.
   * For instance, {@code "TITLE".toLowerCase()} in a Turkish locale
   * returns {@code "t\u005Cu0131tle"}, where '\u005Cu0131' is the
   * LATIN SMALL LETTER DOTLESS I character.
   * To obtain correct results for locale insensitive strings, use
   * {@code toLowerCase(Locale.ROOT)}.
   *
   * @return  the {@code String}, converted to lowercase.
   * @see     java.lang.String#toLowerCase(Locale)
   */
  String toLowerCase();
  
  default CodePointString toLowerCaseAsStringInterface(){
    return stringToStringInterface().apply(toLowerCase());
  }

  /**
   * Converts all of the characters in this {@code String} to upper
   * case using the rules of the given {@code Locale}. Case mapping is based
   * on the Unicode Standard version specified by the {@link org.unlaxer.java.lang.Character Character}
   * class. Since case mappings are not always 1:1 char mappings, the resulting
   * {@code String} may be a different length than the original {@code String}.
   * 

   * Examples of locale-sensitive and 1:M case mappings are in the following table.
   *
   * 
   * 
   * 
   * 
   *   
   *   
   *   
   *   
   * 
   * 
   * 
   * 
   *   
   *   
   *   
   *   
   * 
   * 
   *   
   *   
   *   
   *   
   * 
   * 
   *   
   *   
   *   
   *   
   * 
   * 
   *   
   *   
   *   
   *   
   * 
   * 
   * Examples of locale-sensitive and 1:M case mappings. Shows Language code of locale, lower case, upper case, and description.Language Code of Locale Lower Case Upper Case Description
tr (Turkish) \u0069 \u0130 small letter i -> capital letter I with dot above
tr (Turkish) \u0131 \u0049 small letter dotless i -> capital letter I
(all) \u00df \u0053 \u0053 small letter sharp s -> two letters: SS
(all) Fahrvergnügen FAHRVERGNÜGEN 
   * @param locale use the case transformation rules for this locale
   * @return the {@code String}, converted to uppercase.
   * @see     java.lang.String#toUpperCase()
   * @see     java.lang.String#toLowerCase()
   * @see     java.lang.String#toLowerCase(Locale)
   * @since   1.1
   */
  String toUpperCase(Locale locale);
  
  default CodePointString toUpperCaseAsStringInterface(Locale locale){
    return stringToStringInterface().apply(toUpperCase(locale));
  }

  /**
   * Converts all of the characters in this {@code String} to upper
   * case using the rules of the default locale. This method is equivalent to
   * {@code toUpperCase(Locale.getDefault())}.
   * 
   * Note: This method is locale sensitive, and may produce unexpected
   * results if used for strings that are intended to be interpreted locale
   * independently.
   * Examples are programming language identifiers, protocol keys, and HTML
   * tags.
   * For instance, {@code "title".toUpperCase()} in a Turkish locale
   * returns {@code "T\u005Cu0130TLE"}, where '\u005Cu0130' is the
   * LATIN CAPITAL LETTER I WITH DOT ABOVE character.
   * To obtain correct results for locale insensitive strings, use
   * {@code toUpperCase(Locale.ROOT)}.
   *
   * @return  the {@code String}, converted to uppercase.
   * @see     java.lang.String#toUpperCase(Locale)
   */
  String toUpperCase();
  
  default CodePointString toUpperCaseAsStringInterface(){
    return stringToStringInterface().apply(toUpperCase());
  }

  /**
   * Returns a string whose value is this string, with all leading
   * and trailing space removed, where space is defined
   * as any character whose codepoint is less than or equal to
   * {@code 'U+0020'} (the space character).
   * 

   * If this {@code String} object represents an empty character
   * sequence, or the first and last characters of character sequence
   * represented by this {@code String} object both have codes
   * that are not space (as defined above), then a
   * reference to this {@code String} object is returned.
   * 

   * Otherwise, if all characters in this string are space (as
   * defined above), then a  {@code String} object representing an
   * empty string is returned.
   * 

   * Otherwise, let k be the index of the first character in the
   * string whose code is not a space (as defined above) and let
   * m be the index of the last character in the string whose code
   * is not a space (as defined above). A {@code String}
   * object is returned, representing the substring of this string that
   * begins with the character at index k and ends with the
   * character at index m-that is, the result of
   * {@code this.substring(k, m + 1)}.
   * 

   * This method may be used to trim space (as defined above) from
   * the beginning and end of a string.
   *
   * @return  a string whose value is this string, with all leading
   *          and trailing space removed, or this string if it
   *          has no leading or trailing space.
   */
  String trim();
  
  default CodePointString trimAsStringInterface() {
    return stringToStringInterface().apply(trim());
  }

  /**
   * Returns a string whose value is this string, with all leading
   * and trailing {@link Character#isWhitespace(int) white space}
   * removed.
   * 

   * If this {@code String} object represents an empty string,
   * or if all code points in this string are
   * {@link Character#isWhitespace(int) white space}, then an empty string
   * is returned.
   * 

   * Otherwise, returns a substring of this string beginning with the first
   * code point that is not a {@link Character#isWhitespace(int) white space}
   * up to and including the last code point that is not a
   * {@link Character#isWhitespace(int) white space}.
   * 

   * This method may be used to strip
   * {@link Character#isWhitespace(int) white space} from
   * the beginning and end of a string.
   *
   * @return  a string whose value is this string, with all leading
   *          and trailing white space removed
   *
   * @see Character#isWhitespace(int)
   *
   * @since 11
   */
  String strip();
  
  default CodePointString stripAsStringInterface() {
    
    return stringToStringInterface().apply(strip());
  }

  /**
   * Returns a string whose value is this string, with all leading
   * {@link Character#isWhitespace(int) white space} removed.
   * 

   * If this {@code String} object represents an empty string,
   * or if all code points in this string are
   * {@link Character#isWhitespace(int) white space}, then an empty string
   * is returned.
   * 

   * Otherwise, returns a substring of this string beginning with the first
   * code point that is not a {@link Character#isWhitespace(int) white space}
   * up to to and including the last code point of this string.
   * 

   * This method may be used to trim
   * {@link Character#isWhitespace(int) white space} from
   * the beginning of a string.
   *
   * @return  a string whose value is this string, with all leading white
   *          space removed
   *
   * @see Character#isWhitespace(int)
   *
   * @since 11
   */
  String stripLeading();
  
  default CodePointString stripLeadingAsStringInterface() {
    return stringToStringInterface().apply((stripLeading()));
  }

  /**
   * Returns a string whose value is this string, with all trailing
   * {@link Character#isWhitespace(int) white space} removed.
   * 

   * If this {@code String} object represents an empty string,
   * or if all characters in this string are
   * {@link Character#isWhitespace(int) white space}, then an empty string
   * is returned.
   * 

   * Otherwise, returns a substring of this string beginning with the first
   * code point of this string up to and including the last code point
   * that is not a {@link Character#isWhitespace(int) white space}.
   * 

   * This method may be used to trim
   * {@link Character#isWhitespace(int) white space} from
   * the end of a string.
   *
   * @return  a string whose value is this string, with all trailing white
   *          space removed
   *
   * @see Character#isWhitespace(int)
   *
   * @since 11
   */
  String stripTrailing();
  
  default CodePointString stripTrailingAsStringInterface() {
    return stringToStringInterface().apply(stripTrailing());
  }

  /**
   * Returns {@code true} if the string is empty or contains only
   * {@link Character#isWhitespace(int) white space} codepoints,
   * otherwise {@code false}.
   *
   * @return {@code true} if the string is empty or contains only
   *         {@link Character#isWhitespace(int) white space} codepoints,
   *         otherwise {@code false}
   *
   * @see Character#isWhitespace(int)
   *
   * @since 11
   */
  boolean isBlank();

  /**
   * Returns a stream of lines extracted from this string,
   * separated by line terminators.
   * 

   * A line terminator is one of the following:
   * a line feed character {@code "\n"} (U+000A),
   * a carriage return character {@code "\r"} (U+000D),
   * or a carriage return followed immediately by a line feed
   * {@code "\r\n"} (U+000D U+000A).
   * 

   * A line is either a sequence of zero or more characters
   * followed by a line terminator, or it is a sequence of one or
   * more characters followed by the end of the string. A
   * line does not include the line terminator.
   * 

   * The stream returned by this method contains the lines from
   * this string in the order in which they occur.
   *
   * @apiNote This definition of line implies that an empty
   *          string has zero lines and that there is no empty line
   *          following a line terminator at the end of a string.
   *
   * @implNote This method provides better performance than
   *           split("\R") by supplying elements lazily and
   *           by faster search of new line terminators.
   *
   * @return  the stream of lines extracted from this string
   *
   * @since 11
   */
  Stream lines();
  
  default Stream linesAsStringInterface(){
    Function stringToStringInterface = stringToStringInterface();
    return lines().map(stringToStringInterface);
  }

  /**
   * This object (which is already a string!) is itself returned.
   *
   * @return  the string itself.
   */
  String toString();

  /**
   * Returns a stream of {@code int} zero-extending the {@code char} values
   * from this sequence.  Any char which maps to a surrogate code
   * point is passed through uninterpreted.
   *
   * @return an IntStream of char values from this sequence
   * @since 9
   */
  IntStream chars();

  /**
   * Returns a stream of code point values from this sequence.  Any surrogate
   * pairs encountered in the sequence are combined as if by {@linkplain
   * Character#toCodePoint Character.toCodePoint} and the result is passed
   * to the stream. Any other code units, including ordinary BMP characters,
   * unpaired surrogates, and undefined code units, are zero-extended to
   * {@code int} values which are then passed to the stream.
   *
   * @return an IntStream of Unicode code points from this sequence
   * @since 9
   */
  IntStream codePoints();

  /**
   * Converts this string to a new character array.
   *
   * @return  a newly allocated character array whose length is the length
   *          of this string and whose contents are initialized to contain
   *          the character sequence represented by this string.
   */
  char[] toCharArray();

  /**
   * Returns a canonical representation for the string object.
   * 

   * A pool of strings, initially empty, is maintained privately by the
   * class {@code String}.
   * 

   * When the intern method is invoked, if the pool already contains a
   * string equal to this {@code String} object as determined by
   * the {@link #equals(Object)} method, then the string from the pool is
   * returned. Otherwise, this {@code String} object is added to the
   * pool and a reference to this {@code String} object is returned.
   * 

   * It follows that for any two strings {@code s} and {@code t},
   * {@code s.intern() == t.intern()} is {@code true}
   * if and only if {@code s.equals(t)} is {@code true}.
   * 

   * All literal strings and string-valued constant expressions are
   * interned. String literals are defined in section 3.10.5 of the
   * The Java™ Language Specification.
   *
   * @return  a string that has the same contents as this string, but is
   *          guaranteed to be from a pool of unique strings.
   * @jls 3.10.5 String Literals
   */
  String intern();

  /**
   * Returns a string whose value is the concatenation of this
   * string repeated {@code count} times.
   * 
   * If this string is empty or count is zero then the empty
   * string is returned.
   *
   * @param   count number of times to repeat
   *
   * @return  A string composed of this string repeated
   *          {@code count} times or the empty string if this
   *          string is empty or count is zero
   *
   * @throws  IllegalArgumentException if the {@code count} is
   *          negative.
   *
   * @since 11
   */
  String repeat(int count);
  
  default CodePointString repeatAsStringInterface(int count) {
    
    return stringToStringInterface().apply(repeat(count));
  }
}
Regex	Limit	Result
:	2	{@code { "boo", "and:foo" }}
	5	{@code { "boo", "and", "foo" }}
	-2	{@code { "boo", "and", "foo" }}
o	5	{@code { "b", "", ":and:f", "", "" }}
	-2	{@code { "b", "", ":and:f", "", "" }}
	0	{@code { "b", "", ":and:f" }}
Language Code of Locale	Upper Case	Lower Case	Description
tr (Turkish)	\u0130	\u0069	capital letter I with dot above -> small letter i
tr (Turkish)	\u0049	\u0131	capital letter I -> small letter dotless i
(all)	French Fries	french fries	lowercased all chars in String
(all)	* ΙΧΘΥΣ	ιχθυσ	lowercased all chars in String