All Downloads are FREE. Search and download functionalities are using the official Maven repository.

org.snakeyaml.engine.v2.common.CharConstants Maven / Gradle / Ivy

The newest version!
/*
 * Copyright (c) 2018, SnakeYAML
 *
 * Licensed under the Apache License, Version 2.0 (the "License"); you may not use this file except
 * in compliance with the License. You may obtain a copy of the License at
 *
 * http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software distributed under the License
 * is distributed on an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express
 * or implied. See the License for the specific language governing permissions and limitations under
 * the License.
 */
package org.snakeyaml.engine.v2.common;

import java.util.Arrays;
import java.util.Collections;
import java.util.HashMap;
import java.util.Map;

public final class CharConstants {

  private static final String ALPHA_S =
      "abcdefghijklmnopqrstuvwxyz0123456789ABCDEFGHIJKLMNOPQRSTUVWXYZ-_";

  private static final String LINEBR_S = "\n";
  private final static String FULL_LINEBR_S = "\r" + LINEBR_S;
  private static final String NULL_OR_LINEBR_S = "\0" + FULL_LINEBR_S;
  private static final String NULL_BL_LINEBR_S = " " + NULL_OR_LINEBR_S;
  private static final String NULL_BL_T_LINEBR_S = "\t" + NULL_BL_LINEBR_S;
  private static final String NULL_BL_T_S = "\0 \t";

  // the suffix must not contain the “[”, “]”, “{”, “}” and “,” characters.
  // These characters would cause ambiguity with flow collection structures.
  // https://yaml.org/spec/1.2.2/#691-node-tags
  private static final String URI_CHARS_SUFFIX_S = ALPHA_S + "-;/?:@&=+$_.!~*'()%";

  public static final CharConstants LINEBR = new CharConstants(LINEBR_S);
  public static final CharConstants NULL_OR_LINEBR = new CharConstants(NULL_OR_LINEBR_S);
  public static final CharConstants NULL_BL_LINEBR = new CharConstants(NULL_BL_LINEBR_S);
  public static final CharConstants NULL_BL_T_LINEBR = new CharConstants(NULL_BL_T_LINEBR_S);
  public static final CharConstants NULL_BL_T = new CharConstants(NULL_BL_T_S);
  // prefix may contain ,[]
  public static final CharConstants URI_CHARS_FOR_TAG_PREFIX =
      new CharConstants(URI_CHARS_SUFFIX_S + ",[]");
  public static final CharConstants URI_CHARS_FOR_TAG_SUFFIX =
      new CharConstants(URI_CHARS_SUFFIX_S);

  public static final CharConstants ALPHA = new CharConstants(ALPHA_S);

  private static final int ASCII_SIZE = 128;
  boolean[] contains = new boolean[ASCII_SIZE];

  private CharConstants(String content) {
    Arrays.fill(contains, false);
    for (int i = 0; i < content.length(); i++) {
      int c = content.codePointAt(i);
      contains[c] = true;
    }
  }

  public boolean has(int c) {
    return (c < ASCII_SIZE) && contains[c];
  }

  public boolean hasNo(int c) {
    return !has(c);
  }

  public boolean has(int c, String additional) {
    return has(c) || additional.indexOf(c) != -1;
  }

  public boolean hasNo(int c, String additional) {
    return !has(c, additional);
  }

  /**
   * A mapping from an escaped character in the input stream to the character that they should be
   * replaced with.
   * 

* YAML defines several common and a few uncommon escape sequences. */ public static final Map ESCAPE_REPLACEMENTS; /** * A mapping from a character to a number of bytes to read-ahead for that escape sequence. These * escape sequences are used to handle unicode escaping in the following formats, where H is a * hexadecimal character: * *

   * \xHH         : escaped 8-bit Unicode character
   * \uHHHH       : escaped 16-bit Unicode character
   * \UHHHHHHHH   : escaped 32-bit Unicode character
   * 
*/ public static final Map ESCAPE_CODES; static { Map escapes = new HashMap<>(); escapes.put(Character.valueOf('0'), "\0");// ASCII null escapes.put(Character.valueOf('a'), "\u0007");// ASCII bell escapes.put(Character.valueOf('b'), "\u0008"); // ASCII backspace escapes.put(Character.valueOf('t'), "\u0009"); // ASCII horizontal tab escapes.put(Character.valueOf('n'), "\n");// ASCII newline (line feed; \n maps to 0x0A) escapes.put(Character.valueOf('v'), "\u000B");// ASCII vertical tab escapes.put(Character.valueOf('f'), "\u000C");// ASCII form-feed escapes.put(Character.valueOf('r'), "\r");// carriage-return (\r maps to 0x0D) escapes.put(Character.valueOf('e'), "\u001B");// ASCII escape character (Esc) escapes.put(Character.valueOf(' '), "\u0020");// ASCII space escapes.put(Character.valueOf('"'), "\"");// ASCII double-quote escapes.put(Character.valueOf('/'), "/");// ASCII slash, for JSON compatibility. escapes.put(Character.valueOf('\\'), "\\");// ASCII backslash escapes.put(Character.valueOf('N'), "\u0085");// Unicode next line escapes.put(Character.valueOf('_'), "\u00A0");// Unicode non-breaking-space ESCAPE_REPLACEMENTS = Collections.unmodifiableMap(escapes); Map escapeCodes = new HashMap<>(); escapeCodes.put(Character.valueOf('x'), 2);// 8-bit Unicode escapeCodes.put(Character.valueOf('u'), 4);// 16-bit Unicode // 32-bit Unicode (Supplementary characters are supported) escapeCodes.put(Character.valueOf('U'), 8); ESCAPE_CODES = Collections.unmodifiableMap(escapeCodes); } /** * Replace a single character with its string representation * * @param chRepresentation - the char to escape * @return the same string or its escaped representation */ public static String escapeChar(String chRepresentation) { for (Character s : ESCAPE_REPLACEMENTS.keySet()) { String v = ESCAPE_REPLACEMENTS.get(s); if (" ".equals(v) || "/".equals(v) || "\"".equals(v)) { continue; } if (v.equals(chRepresentation)) { return "\\" + s; // '' -> '\t' } } return chRepresentation; } }




© 2015 - 2025 Weber Informatics LLC | Privacy Policy