All downloads are FREE. The search and download functionality uses the official Maven repository.

org.yaml.snakeyaml.reader.StreamReader Maven / Gradle / Ivy

/**
 * Copyright (c) 2008, http://www.snakeyaml.org
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
package org.yaml.snakeyaml.reader;

import java.io.IOException;
import java.io.Reader;
import java.nio.charset.Charset;

import org.yaml.snakeyaml.error.Mark;
import org.yaml.snakeyaml.error.YAMLException;
import org.yaml.snakeyaml.scanner.Constant;

/**
 * Reader: checks if code points are in allowed range, adds '\0' to the end.
 *
 * <p>The input is either a complete {@link String} or a {@link Reader} that is
 * consumed in chunks. The reader keeps a sliding text buffer plus a pointer
 * into it, and tracks the absolute index, line and column of the pointer so a
 * {@link Mark} can be produced at any time.</p>
 */
public class StreamReader {
    /** Name of the source reported in marks and reader exceptions. */
    private final String name;
    /** Underlying character source; {@code null} when created from a String. */
    private final Reader stream;
    private int pointer = 0; //in characters
    /** {@code true} once no more data can be appended to {@link #buffer}. */
    private boolean eof = true;
    /** Text that has been read but not yet discarded; ends with '\0' at end of input. */
    private String buffer;
    private int index = 0; //in characters
    private int line = 0;
    private int column = 0; //in code points
    /** Scratch array for chunked reads; {@code null} when created from a String. */
    private final char[] data;

    /*
     * A chunk is at most BUFFER_SIZE - 1 characters; the spare slot holds the
     * single extra character read when a chunk ends with a high surrogate.
     */
    private static final int BUFFER_SIZE = 1025;

    /**
     * Create a reader over a complete in-memory document.
     *
     * @param stream the whole text to read; every code point must be printable
     * @throws ReaderException if the text contains a non-printable code point
     */
    public StreamReader(String stream) {
        this.name = "'string'";
        this.buffer = ""; // to set length to 0
        checkPrintable(stream);
        this.buffer = stream + "\0";
        this.stream = null;
        this.eof = true;
        this.data = null;
    }

    /**
     * Create a reader which pulls its data from the given {@link Reader} in
     * chunks. The first chunk is read immediately.
     *
     * @param reader the source of characters
     * @throws ReaderException if the first chunk contains a non-printable code point
     * @throws YAMLException if reading from the source fails
     */
    public StreamReader(Reader reader) {
        this.name = "'reader'";
        this.buffer = "";
        this.stream = reader;
        this.eof = false;
        this.data = new char[BUFFER_SIZE];
        this.update();
    }

    /**
     * Verify that every code point of the text is printable.
     *
     * @param data the text to verify
     * @throws ReaderException for the first non-printable code point; the
     *         reported position is the character offset inside {@code data}
     */
    void checkPrintable(String data) {
        final int length = data.length();
        for (int offset = 0; offset < length; ) {
            final int codePoint = data.codePointAt(offset);

            if (!isPrintable(codePoint)) {
                throw new ReaderException(name, offset, codePoint,
                                          "special characters are not allowed");
            }

            offset += Character.charCount(codePoint);
        }
    }

    /**
     * Check whether the text consists of printable code points only.
     *
     * @param data the text to check
     * @return {@code true} if every code point is printable (also for an empty text)
     */
    public static boolean isPrintable(final String data) {
        final int length = data.length();
        for (int offset = 0; offset < length; ) {
            final int codePoint = data.codePointAt(offset);

            if (!isPrintable(codePoint)) {
                return false;
            }

            offset += Character.charCount(codePoint);
        }

        return true;
    }

    /**
     * Check whether a single code point is in the allowed range: TAB, LF, CR,
     * NEL (0x85), 0x20-0x7E, 0xA0-0xD7FF, 0xE000-0xFFFD and 0x10000-0x10FFFF.
     *
     * @param c the code point to check
     * @return {@code true} if the code point is allowed
     */
    public static boolean isPrintable(final int c) {
        return (c >= 0x20 && c <= 0x7E) || c == 0x9 || c == 0xA || c == 0xD
                || c == 0x85 || (c >= 0xA0 && c <= 0xD7FF)
                || (c >= 0xE000 && c <= 0xFFFD)
                || (c >= 0x10000 && c <= 0x10FFFF);
    }

    /**
     * @return a mark describing the current position
     */
    public Mark getMark() {
        return new Mark(name, this.index, this.line, this.column, this.buffer, this.pointer);
    }

    /**
     * Move the pointer one code point forward.
     */
    public void forward() {
        forward(1);
    }

    /**
     * read the next length characters and move the pointer.
     * if the last character is high surrogate one more character will be read
     *
     * <p>Line and column are updated on the way: a line break (or a '\r' which
     * is not followed by '\n') starts a new line, every other code point
     * except 0xFEFF advances the column. Stops early when the input ends.</p>
     *
     * @param length amount of characters to move forward
     */
    public void forward(int length) {
        for (int i = 0; i < length; i++) {
            if (this.pointer == this.buffer.length()) {
                update();
            }
            if (this.pointer == this.buffer.length()) {
                break;
            }

            final int c = this.buffer.codePointAt(this.pointer);
            final int width = Character.charCount(c);
            this.pointer += width;
            this.index += width;
            if (Constant.LINEBR.has(c) || (c == '\r' && !isNextLineFeed())) {
                this.line++;
                this.column = 0;
            } else if (c != 0xFEFF) {
                this.column++;
            }
        }

        if (this.pointer == this.buffer.length()) {
            update();
        }
    }

    /**
     * Tell whether the character under the pointer is '\n'. The buffer is
     * refilled first when the pointer sits at its end, so the look-ahead never
     * indexes past the buffer (a '\r' may be the last character of a chunk).
     */
    private boolean isNextLineFeed() {
        if (this.pointer == this.buffer.length()) {
            update();
        }
        return this.pointer < this.buffer.length()
                && this.buffer.charAt(this.pointer) == '\n';
    }

    /**
     * Peek the code point under the pointer without consuming it.
     *
     * @return the current code point or -1 when no more data is available
     */
    public int peek() {
        if (this.pointer == this.buffer.length()) {
            update();
        }
        if (this.pointer == this.buffer.length()) {
            return -1;
        }

        return this.buffer.codePointAt(this.pointer);
    }

    /**
     * Peek the next index-th code point
     *
     * @param index to peek
     * @return the next index-th code point or -1 when the input ends before it
     */
    public int peek(int index) {
        int offset = 0;
        int nextIndex = 0;
        int codePoint;
        do {
            // update() drops the consumed part of the buffer and resets the
            // pointer, so pointer + offset keeps addressing the same character
            if (this.pointer + offset == this.buffer.length()) {
                update();
            }
            if (this.pointer + offset == this.buffer.length()) {
                return -1;
            }

            codePoint = this.buffer.codePointAt(this.pointer + offset);
            offset += Character.charCount(codePoint);
            nextIndex++;

        } while (nextIndex <= index);

        return codePoint;
    }

    /**
     * peek the next length code points
     *
     * @param length amount of the characters to peek
     * @return the next length code points (fewer if the input ends earlier)
     */
    public String prefix(int length) {
        final StringBuilder builder = new StringBuilder();

        int offset = 0;
        int resultLength = 0;
        while (resultLength < length) {
            if (this.pointer + offset == this.buffer.length()) {
                update();
            }
            if (this.pointer + offset == this.buffer.length()) {
                break;
            }

            int c = this.buffer.codePointAt(this.pointer + offset);
            builder.appendCodePoint(c);
            offset += Character.charCount(c);
            resultLength++;
        }

        return builder.toString();
    }

    /**
     * prefix(length) immediately followed by forward(length)
     *
     * <p>Unlike {@link #forward(int)} the line counter is not touched, so the
     * caller must only use it for text without line breaks.</p>
     *
     * @param length amount of characters to get
     * @return  the next length code points
     */
    public String prefixForward(int length) {
        final String prefix = prefix(length);
        final int consumedChars = prefix.length();
        this.pointer += consumedChars;
        this.index += consumedChars;
        // prefix never contains new line characters
        // column is counted in code points; use what was really consumed
        // because the prefix is shorter than requested when the input ends
        this.column += prefix.codePointCount(0, consumedChars);
        return prefix;
    }

    /**
     * Drop the consumed part of the buffer and append the next chunk from the
     * stream. When the stream is exhausted '\0' is appended and the reader is
     * marked as finished. Does nothing once the end has been reached.
     */
    private void update() {
        if (!this.eof) {
            this.buffer = buffer.substring(this.pointer);
            this.pointer = 0;
            try {
                boolean eofDetected = false;
                int converted = this.stream.read(data, 0, BUFFER_SIZE - 1);
                if (converted > 0) {
                    // never split a surrogate pair between two chunks
                    if (Character.isHighSurrogate(data[converted - 1])) {
                        int oneMore = this.stream.read(data, converted, 1);
                        if (oneMore != -1) {
                            converted += oneMore;
                        } else {
                            eofDetected = true;
                        }
                    }

                    /*
                     * Let's create StringBuilder manually. Anyway str1 + str2
                     * generates new StringBuilder(str1).append(str2).toString()
                     * Giving correct capacity to the constructor prevents
                     * unnecessary operations in appends.
                     */
                    StringBuilder builder  = new StringBuilder(buffer.length() + converted)
                            .append(buffer)
                            .append(data, 0, converted);
                    if (eofDetected) {
                        this.eof = true;
                        builder.append('\0');
                    }
                    this.buffer = builder.toString();
                    checkPrintable(this.buffer);
                } else {
                    this.eof = true;
                    this.buffer += "\0";
                }
            } catch (IOException ioe) {
                throw new YAMLException(ioe);
            }
        }
    }

    /**
     * @return the current column, counted in code points
     */
    public int getColumn() {
        return column;
    }

    /**
     * Get the encoding reported by the underlying stream.
     *
     * <p>NOTE(review): the stream is cast to UnicodeReader unconditionally, so
     * this fails with a ClassCastException for any other Reader and with a
     * NullPointerException when the reader was created from a String.</p>
     *
     * @return the charset named by the underlying UnicodeReader
     */
    public Charset getEncoding() {
        return Charset.forName(((UnicodeReader) this.stream).getEncoding());
    }

    /**
     * @return the absolute position of the pointer, counted in characters
     */
    public int getIndex() {
        return index;
    }

    /**
     * @return the current line, starting at 0
     */
    public int getLine() {
        return line;
    }
}




© 2015 - 2025 Weber Informatics LLC | Privacy Policy