All Downloads are FREE. Search and download functionalities are using the official Maven repository.

com.nhl.link.move.runtime.json.query.Scanner Maven / Gradle / Ivy

package com.nhl.link.move.runtime.json.query;

import java.io.IOException;
import java.io.PushbackReader;
import java.io.StringReader;
import java.util.ArrayDeque;
import java.util.Deque;

class Scanner {

    private final CountingPushbackReader reader;
    private boolean isEOF;

    private Deque returnedTokens = new ArrayDeque<>();

    Scanner(String query) {
        reader = new CountingPushbackReader(new PushbackReader(new StringReader(query)));
    }

    private static class CountingPushbackReader {

        private final PushbackReader reader;
        private int currentIndex;

        CountingPushbackReader(PushbackReader reader) {
            this.reader = reader;
        }

        int read() {
            try {
                currentIndex++;
                return reader.read();
            } catch (IOException e) {
                throw new RuntimeException("Unexpected I/O error", e);
            }
        }

        void unread(int c) {
            try {
                currentIndex--;
                reader.unread(c);
            } catch (IOException e) {
                throw new RuntimeException("Unexpected I/O error", e);
            }
        }

        int getCurrentIndex() {
            return currentIndex;
        }
    }

    boolean hasNext() {
        if (isEOF) {
            return false;
        }
        int c = reader.read();
        if (c == -1) {
            isEOF = true;
        } else {
            reader.unread(c);
        }
        return !isEOF;
    }

    Token nextToken() {

        if (returnedTokens.size() > 0) {
            return returnedTokens.removeLast();
        }

        if (isEOF) {
            throw new ParseException("No more tokens to read", reader.getCurrentIndex());
        }

        TokenBuilder builder = new TokenBuilder(reader.getCurrentIndex());
        try {
            int c;
            while ((c = reader.read()) != -1 && builder.acceptCharacter((char) c))
                ;

            if (c == -1) {
                isEOF = true;
            } else {
                reader.unread(c);
            }

            return builder.build();

        } catch (Exception e) {
            throw new ParseException(e.getMessage(), reader.getCurrentIndex(), e);
        }
    }

    void returnToken(Token token) {
        returnedTokens.addLast(token);
    }

    private static class TokenBuilder {

        private static class IdentifierBuilder {

            private StringBuilder buffer; // used to store identifier name
            private boolean isQuoted;
            private boolean isComplete;

            IdentifierBuilder(boolean isQuoted) {
                this.isQuoted = isQuoted;
            }

            boolean acceptCharacter(char c) {

                if (isComplete) {
                    return false;
                }

                // TODO: support backslash escape in quoted identifiers
                if (isQuoted && isQuote(c)) {
                    isComplete = true;
                    return true;
                } else if (!isQuoted && isReserved(c)) {
                    return false;
                } else if (Character.isWhitespace(c)) {
                    return false;
//                    throw new RuntimeException("Whitespace in unquoted identifier");
                }

                if (buffer == null) {
                    buffer = new StringBuilder();
                }
                buffer.append(c);
                return true;
            }

            String build() {

                if (buffer == null || buffer.length() == 0) {
                    throw new RuntimeException("Empty identifier");
                }
                if (isQuoted && !isComplete) {
                    throw new RuntimeException("Unmatched quote in identifier");
                }
                // TODO: Check for illegal identifiers
                return buffer.toString();
            }
        }

        private int startPosition;
        private IdentifierBuilder identifierBuilder;
        private TokenType tokenType;

        TokenBuilder(int startPosition) {
            this.startPosition = startPosition;
        }

        boolean acceptCharacter(char c) throws Exception {

            boolean accepted = doAccept(c);
            return accepted;
        }

        private boolean doAccept(char c) throws Exception {

            if (tokenType == null && Character.isWhitespace(c)) {
                startPosition++;
                return true;
            }

            if (tokenType == TokenType.CHILD_ACCESS && c == '.') {
                tokenType = TokenType.RECURSIVE_DESCENT;
                return true;
            }

            // token type is already known,
            // will not accept anymore
            if (identifierBuilder == null && tokenType != null) {
                return false;
            }

            if (identifierBuilder != null) {
                boolean accepted =  identifierBuilder.acceptCharacter(c);
                if (accepted && tokenType == TokenType.NUMERIC_VALUE && !Character.isDigit(c)) {
                    tokenType = TokenType.IDENTIFIER;
                }
                return accepted;
            }

            // prediction block -
            // if we're here, then current token's type is unknown yet
            switch (c) {
                case '$': {
                    tokenType = TokenType.ROOT_NODE_REF;
                    return true;
                }
                case '@': {
                    tokenType = TokenType.CURRENT_NODE_REF;
                    return true;
                }
                case '.': {
                    tokenType = TokenType.CHILD_ACCESS;
                    return true;
                }
                case '*': {
                    tokenType = TokenType.WILDCARD;
                    return true;
                }
                case '[': {
                    tokenType = TokenType.FILTER_START;
                    return true;
                }
                case ']': {
                    tokenType = TokenType.FILTER_END;
                    return true;
                }
                case '?': {
                    tokenType = TokenType.PREDICATE_START;
                    return true;
                }
                case '(': {
                    tokenType = TokenType.SCRIPT_START;
                    return true;
                }
                case ')': {
                    tokenType = TokenType.SCRIPT_END;
                    return true;
                }
                case ',': {
                    tokenType = TokenType.UNION;
                    return true;
                }
                case '#': {
                    tokenType = TokenType.META;
                    return true;
                }
                case '\'':
                case '\"': {
                    tokenType = TokenType.QUOTED_IDENTIFIER;
                    identifierBuilder = new IdentifierBuilder(true);
                    return true;
                }
                default: {
                    if (Character.isDigit(c)) {
                        tokenType = TokenType.NUMERIC_VALUE;
                    } else {
                        tokenType = TokenType.IDENTIFIER;
                    }
                    identifierBuilder = new IdentifierBuilder(false);
                    identifierBuilder.acceptCharacter(c);
                    return true;
                }
            }
        }

        private static boolean isQuote(char c) {
            return c == '\'' || c == '\"';
        }

        private static boolean isReserved(char c) {
            switch (c) {
                case '$':
                case '@':
                case '.':
                case '*':
                case '[':
                case ']':
                case '?':
                case '(':
                case ')':
                case ',':
                case '#':
                case '\'':
                case '\"':
                    return true;
                default:
                    return false;
            }
        }

        Token build() {

            String literal;
            if (tokenType == TokenType.IDENTIFIER || tokenType == TokenType.QUOTED_IDENTIFIER
                    || tokenType == TokenType.NUMERIC_VALUE) {

                literal = identifierBuilder.build();
            } else {
                literal = getTokenLiteral(tokenType);
            }

            return new Token(tokenType, literal, startPosition);
        }
    }

    static String getTokenLiteral(TokenType tokenType) {

        switch (tokenType) {
            case ROOT_NODE_REF: {
                return "$";
            }
            case CURRENT_NODE_REF: {
                return "@";
            }
            case CHILD_ACCESS: {
                return ".";
            }
            case RECURSIVE_DESCENT: {
                return "..";
            }
            case WILDCARD: {
                return "*";
            }
            case UNION: {
                return ",";
            }
            case META: {
                return "#";
            }
            case FILTER_START: {
                return "[";
            }
            case FILTER_END: {
                return "]";
            }
            case PREDICATE_START: {
                return "?";
            }
            case SCRIPT_START: {
                return "(";
            }
            case SCRIPT_END: {
                return ")";
            }
            case NUMERIC_VALUE: {
                return "numeric";
            }
            case IDENTIFIER: {
                return "identifier";
            }
            case QUOTED_IDENTIFIER: {
                return "\"";
            }
            default: {
                throw new RuntimeException("Unknown token type: " + tokenType.name());
            }
        }
    }
}




© 2015 - 2025 Weber Informatics LLC | Privacy Policy