All Downloads are FREE. Search and download functionalities are using the official Maven repository.

io.prestosql.sql.parser.ErrorHandler Maven / Gradle / Ivy

There is a newer version: 350
Show newest version
/*
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
package io.prestosql.sql.parser;

import com.google.common.collect.HashMultimap;
import com.google.common.collect.Multimap;
import io.airlift.log.Logger;
import org.antlr.v4.runtime.BaseErrorListener;
import org.antlr.v4.runtime.NoViableAltException;
import org.antlr.v4.runtime.Parser;
import org.antlr.v4.runtime.RecognitionException;
import org.antlr.v4.runtime.Recognizer;
import org.antlr.v4.runtime.RuleContext;
import org.antlr.v4.runtime.Token;
import org.antlr.v4.runtime.TokenStream;
import org.antlr.v4.runtime.Vocabulary;
import org.antlr.v4.runtime.atn.ATN;
import org.antlr.v4.runtime.atn.ATNState;
import org.antlr.v4.runtime.atn.NotSetTransition;
import org.antlr.v4.runtime.atn.RuleStopState;
import org.antlr.v4.runtime.atn.RuleTransition;
import org.antlr.v4.runtime.atn.Transition;
import org.antlr.v4.runtime.atn.WildcardTransition;
import org.antlr.v4.runtime.misc.IntervalSet;

import java.util.ArrayDeque;
import java.util.Comparator;
import java.util.HashMap;
import java.util.HashSet;
import java.util.Map;
import java.util.Queue;
import java.util.Set;
import java.util.stream.Collectors;

import static java.lang.String.format;
import static org.antlr.v4.runtime.atn.ATNState.BLOCK_START;
import static org.antlr.v4.runtime.atn.ATNState.RULE_START;

/**
 * ANTLR error listener that rewrites a parser syntax error into a message listing what
 * would have been accepted instead of the offending input.
 *
 * <p>On each error it simulates the parser's ATN starting from the state where the error
 * was reported, collects the labels of the transitions that could not be taken, and reports
 * the ones reached at the largest token index. The listener always finishes by throwing a
 * {@link ParsingException}; if building the improved message fails, the message supplied by
 * ANTLR is used unchanged.
 *
 * <p>Instances are created through {@link #builder()}.
 */
class ErrorHandler
        extends BaseErrorListener
{
    private static final Logger LOG = Logger.get(ErrorHandler.class);

    // rule index -> name reported in place of the tokens that can start the rule
    private final Map<Integer, String> specialRules;
    // token type -> name reported in place of the vocabulary's display name
    private final Map<Integer, String> specialTokens;
    // rule indexes that are never explored and never contribute candidates
    private final Set<Integer> ignoredRules;

    private ErrorHandler(Map<Integer, String> specialRules, Map<Integer, String> specialTokens, Set<Integer> ignoredRules)
    {
        // Copy all three collections so that later changes to the builder that produced
        // them cannot alter an already-built handler.
        this.specialRules = new HashMap<>(specialRules);
        this.specialTokens = new HashMap<>(specialTokens);
        this.ignoredRules = new HashSet<>(ignoredRules);
    }

    /**
     * Builds a "mismatched input ... Expecting: ..." message for the reported error and
     * throws it as a {@link ParsingException}.
     *
     * @param recognizer the recognizer that reported the error; it is cast to {@link Parser}
     * @param offendingSymbol the offending token; it is cast to {@link Token}
     * @param line line number passed through to the exception
     * @param charPositionInLine column passed through to the exception
     * @param message ANTLR's message, used as-is when the improved message cannot be built
     * @param e the recognition exception, or {@code null} if none was supplied
     * @throws ParsingException always
     */
    @Override
    public void syntaxError(Recognizer<?, ?> recognizer, Object offendingSymbol, int line, int charPositionInLine, String message, RecognitionException e)
    {
        try {
            Parser parser = (Parser) recognizer;

            ATN atn = parser.getATN();

            ATNState currentState;
            Token currentToken;
            RuleContext context;

            if (e != null) {
                currentState = atn.states.get(e.getOffendingState());
                currentToken = e.getOffendingToken();
                context = e.getCtx();

                if (e instanceof NoViableAltException) {
                    // start the simulation from the token where the failed prediction began
                    currentToken = ((NoViableAltException) e).getStartToken();
                }
            }
            else {
                // no exception available: fall back to the parser's current position
                currentState = atn.states.get(parser.getState());
                currentToken = parser.getCurrentToken();
                context = parser.getContext();
            }

            Analyzer analyzer = new Analyzer(atn, parser.getVocabulary(), specialRules, specialTokens, ignoredRules, parser.getTokenStream());
            Multimap<Integer, String> candidates = analyzer.process(currentState, currentToken.getTokenIndex(), context);

            // pick the candidate tokens associated with the largest token index processed
            // (i.e., the path that consumed the most input)
            String expected = candidates.asMap().entrySet().stream()
                    .max(Comparator.comparing(Map.Entry::getKey))
                    .orElseThrow(() -> new IllegalStateException("No candidate tokens found"))
                    .getValue().stream()
                    .sorted()
                    .collect(Collectors.joining(", "));

            message = format("mismatched input '%s'. Expecting: %s", ((Token) offendingSymbol).getText(), expected);
        }
        catch (Exception exception) {
            // Best effort: keep ANTLR's original message and still report the syntax error below.
            LOG.error(exception, "Unexpected failure when handling parsing error. This is likely a bug in the implementation");
        }

        throw new ParsingException(message, e, line, charPositionInLine);
    }

    /**
     * One configuration of the simulation: an ATN state, the index of the next input token
     * to look at, and the stack of rule invocations that led to the state.
     */
    private static class ParsingState
    {
        public final ATNState state;
        public final int tokenIndex;
        private final CallerContext caller;

        public ParsingState(ATNState state, int tokenIndex, CallerContext caller)
        {
            this.state = state;
            this.tokenIndex = tokenIndex;
            this.caller = caller;
        }
    }

    /**
     * Linked-list entry of the simulated rule invocation stack. {@code followState} is the
     * state to continue from once the invoked rule ends; {@code parent} is the enclosing
     * invocation, or {@code null} at the bottom of the stack.
     */
    private static class CallerContext
    {
        public final ATNState followState;
        public final CallerContext parent;

        public CallerContext(CallerContext parent, ATNState followState)
        {
            this.parent = parent;
            this.followState = followState;
        }
    }

    /**
     * Walks the ATN against the token stream and records, per token index, the names of
     * the tokens or special rules that could not be matched there.
     */
    private static class Analyzer
    {
        private final ATN atn;
        private final Vocabulary vocabulary;
        private final Map<Integer, String> specialRules;
        private final Map<Integer, String> specialTokens;
        private final Set<Integer> ignoredRules;
        private final TokenStream stream;

        public Analyzer(
                ATN atn,
                Vocabulary vocabulary,
                Map<Integer, String> specialRules,
                Map<Integer, String> specialTokens,
                Set<Integer> ignoredRules,
                TokenStream stream)
        {
            this.stream = stream;
            this.atn = atn;
            this.vocabulary = vocabulary;
            this.specialRules = specialRules;
            this.specialTokens = specialTokens;
            this.ignoredRules = ignoredRules;
        }

        /**
         * Runs the simulation from {@code currentState} at {@code tokenIndex}, with the
         * invocation stack rebuilt from {@code context}.
         *
         * @return candidate names keyed by the token index at which they were expected
         */
        public Multimap<Integer, String> process(ATNState currentState, int tokenIndex, RuleContext context)
        {
            return process(new ParsingState(currentState, tokenIndex, makeCallStack(context)));
        }

        private Multimap<Integer, String> process(ParsingState start)
        {
            Multimap<Integer, String> candidates = HashMultimap.create();

            // Simulates the ATN by consuming input tokens and walking transitions.
            // The ATN can be in multiple states (similar to an NFA)
            Queue<ParsingState> activeStates = new ArrayDeque<>();
            activeStates.add(start);

            while (!activeStates.isEmpty()) {
                ParsingState current = activeStates.poll();

                ATNState state = current.state;
                int tokenIndex = current.tokenIndex;
                CallerContext caller = current.caller;

                if (state.getStateType() == BLOCK_START || state.getStateType() == RULE_START) {
                    int rule = state.ruleIndex;

                    if (specialRules.containsKey(rule)) {
                        // report the rule under its configured name instead of descending into it
                        candidates.put(tokenIndex, specialRules.get(rule));
                        continue;
                    }
                    else if (ignoredRules.contains(rule)) {
                        continue;
                    }
                }

                if (state instanceof RuleStopState) {
                    if (caller != null) {
                        // continue from the target state of the rule transition in the parent rule
                        activeStates.add(new ParsingState(caller.followState, tokenIndex, caller.parent));
                    }
                    else {
                        // we've reached the end of the top-level rule, so the only candidate left is EOF at this point
                        candidates.putAll(tokenIndex, getTokenNames(IntervalSet.of(Token.EOF)));
                    }
                    continue;
                }

                for (int i = 0; i < state.getNumberOfTransitions(); i++) {
                    Transition transition = state.transition(i);

                    if (transition instanceof RuleTransition) {
                        // enter the invoked rule, remembering where to resume afterwards
                        activeStates.add(new ParsingState(transition.target, tokenIndex, new CallerContext(caller, ((RuleTransition) transition).followState)));
                    }
                    else if (transition.isEpsilon()) {
                        activeStates.add(new ParsingState(transition.target, tokenIndex, caller));
                    }
                    else if (transition instanceof WildcardTransition) {
                        throw new UnsupportedOperationException("not yet implemented: wildcard transition");
                    }
                    else {
                        IntervalSet labels = transition.label();

                        if (transition instanceof NotSetTransition) {
                            // a "not" set matches every user token type except the listed ones
                            labels = labels.complement(IntervalSet.of(Token.MIN_USER_TOKEN_TYPE, atn.maxTokenType));
                        }

                        int currentToken = stream.get(tokenIndex).getType();
                        if (labels.contains(currentToken)) {
                            // the input matches: consume the token and keep going
                            activeStates.add(new ParsingState(transition.target, tokenIndex + 1, caller));
                        }
                        else {
                            // the input does not match: these labels are what was expected here
                            candidates.putAll(tokenIndex, getTokenNames(labels));
                        }
                    }
                }
            }

            return candidates;
        }

        /**
         * Maps token types to the names shown in the error message: {@code <EOF>} for
         * end of input, the configured special name when one exists, otherwise the
         * vocabulary's display name.
         */
        private Set<String> getTokenNames(IntervalSet tokens)
        {
            return tokens.toSet().stream()
                    .map(token -> {
                        if (token == Token.EOF) {
                            return "<EOF>";
                        }
                        return specialTokens.getOrDefault(token, vocabulary.getDisplayName(token));
                    })
                    .collect(Collectors.toSet());
        }

        /**
         * Converts the parser's rule context chain into a {@link CallerContext} chain.
         * Returns {@code null} when {@code context} is {@code null} or its invoking state is -1.
         */
        private CallerContext makeCallStack(RuleContext context)
        {
            if (context == null || context.invokingState == -1) {
                return null;
            }

            CallerContext parent = makeCallStack(context.parent);

            // the first transition of the invoking state is cast to the rule transition that entered this context
            ATNState followState = ((RuleTransition) atn.states.get(context.invokingState).transition(0)).followState;
            return new CallerContext(parent, followState);
        }
    }

    /**
     * Returns a new, empty {@link Builder}.
     */
    public static Builder builder()
    {
        return new Builder();
    }

    /**
     * Collects the rule and token customizations for an {@link ErrorHandler}.
     */
    public static class Builder
    {
        private final Map<Integer, String> specialRules = new HashMap<>();
        private final Map<Integer, String> specialTokens = new HashMap<>();
        private final Set<Integer> ignoredRules = new HashSet<>();

        /**
         * Reports the rule with index {@code ruleId} as {@code name} instead of exploring it.
         */
        public Builder specialRule(int ruleId, String name)
        {
            specialRules.put(ruleId, name);
            return this;
        }

        /**
         * Reports the token type {@code tokenId} as {@code name} instead of its display name.
         */
        public Builder specialToken(int tokenId, String name)
        {
            specialTokens.put(tokenId, name);
            return this;
        }

        /**
         * Excludes the rule with index {@code ruleId} from the analysis.
         */
        public Builder ignoredRule(int ruleId)
        {
            ignoredRules.add(ruleId);
            return this;
        }

        /**
         * Creates a handler from the settings collected so far.
         */
        public ErrorHandler build()
        {
            return new ErrorHandler(specialRules, specialTokens, ignoredRules);
        }
    }
}




© 2015 - 2025 Weber Informatics LLC | Privacy Policy