All Downloads are FREE. Search and download functionalities are using the official Maven repository.

org.eclipse.jetty.util.RFC9110QuotedStringTokenizer Maven / Gradle / Ivy

There is a newer version: 2.0.31
Show newest version
//
// ========================================================================
// Copyright (c) 1995 Mort Bay Consulting Pty Ltd and others.
//
// This program and the accompanying materials are made available under the
// terms of the Eclipse Public License v. 2.0 which is available at
// https://www.eclipse.org/legal/epl-2.0, or the Apache License, Version 2.0
// which is available at https://www.apache.org/licenses/LICENSE-2.0.
//
// SPDX-License-Identifier: EPL-2.0 OR Apache-2.0
// ========================================================================
//

package org.eclipse.jetty.util;

import java.io.IOException;
import java.util.Iterator;
import java.util.NoSuchElementException;
import java.util.Objects;

/**
 * An implementation of {@link QuotedStringTokenizer} with partial handling of
 * RFC9110 quoted-strings.
 * The deviation from the RFC is that characters are not enforced to be
 * {@code qdtext = HTAB / SP / %x21 / %x23-5B / %x5D-7E / obs-text} and it is expected
 * that the caller will enforce any character restrictions.
 */
public class RFC9110QuotedStringTokenizer implements QuotedStringTokenizer
{
    private final String _delim;
    private final boolean _optionalWhiteSpace;
    private final boolean _returnDelimiters;
    private final boolean _returnQuotes;
    private final boolean _embeddedQuotes;
    private final boolean _escapeOnlyQuote;

    RFC9110QuotedStringTokenizer(String delim,
                                 boolean optionalWhiteSpace,
                                 boolean returnDelimiters,
                                 boolean returnQuotes,
                                 boolean embeddedQuotes,
                                 boolean escapeOnlyQuote)
    {
        _delim = Objects.requireNonNull(delim);
        _optionalWhiteSpace = optionalWhiteSpace;
        _returnDelimiters = returnDelimiters;
        _returnQuotes = returnQuotes;
        _embeddedQuotes = embeddedQuotes;
        _escapeOnlyQuote = escapeOnlyQuote;

        if (_delim.indexOf('"') >= 0)
            throw new IllegalArgumentException("Can't use quote as delimiters: " + _delim);
        if (_optionalWhiteSpace && _delim.indexOf(' ') >= 0)
            throw new IllegalArgumentException("Can't delimit with space with optional white space");
    }

    protected boolean isOptionalWhiteSpace(char c)
    {
        return Character.isWhitespace(c);
    }

    @Override
    public Iterator tokenize(String string)
    {
        Objects.requireNonNull(string);

        return new Iterator<>()
        {
            private enum State
            {
                START,
                TOKEN,
                QUOTE,
                END,
            }

            private final StringBuilder _token = new StringBuilder();
            State _state = State.START;
            private boolean _hasToken;
            private int _ows = -1;
            private int _i = 0;

            @Override
            public boolean hasNext()
            {
                if (_hasToken)
                    return true;

                boolean escape = false;
                while (_i < string.length())
                {
                    char c = string.charAt(_i++);

                    switch (_state)
                    {
                        case START ->
                        {
                            if (_delim.indexOf(c) >= 0)
                            {
                                if (_returnDelimiters)
                                {
                                    _token.append(c);
                                    return _hasToken = true;
                                }
                            }
                            else if (c == '"')
                            {
                                if (_returnQuotes)
                                    _token.append(c);
                                _ows = -1;
                                _state = State.QUOTE;
                            }
                            else if (!_optionalWhiteSpace || !isOptionalWhiteSpace(c))
                            {
                                _token.append(c);
                                _hasToken = true;
                                _ows = -1;
                                _state = State.TOKEN;
                            }
                        }
                        case TOKEN ->
                        {
                            _hasToken = true;
                            if (_delim.indexOf(c) >= 0)
                            {
                                if (_returnDelimiters)
                                    _i--;
                                _state = State.START;
                                if (_ows >= 0)
                                    _token.setLength(_ows);
                                return _hasToken;
                            }
                            else if (_embeddedQuotes && c == '"')
                            {
                                if (_returnQuotes)
                                    _token.append(c);
                                _ows = -1;
                                _state = State.QUOTE;
                            }
                            else if (_optionalWhiteSpace && isOptionalWhiteSpace(c))
                            {
                                if (_ows < 0)
                                    _ows = _token.length();
                                _token.append(c);
                            }
                            else
                            {
                                _ows = -1;
                                _token.append(c);
                            }
                        }
                        case QUOTE ->
                        {
                            _hasToken = true;
                            if (escape)
                            {
                                escape = false;
                                _token.append(c);
                            }
                            else if (c == '\"')
                            {
                                if (_returnQuotes)
                                    _token.append(c);
                                if (_embeddedQuotes)
                                {
                                    _ows = -1;
                                    _state = State.TOKEN;
                                }
                                else
                                {
                                    _state = State.END;
                                    return _hasToken;
                                }
                            }
                            else if (c == '\\')
                            {
                                if (_escapeOnlyQuote && (_i >= string.length() || string.charAt(_i) != '"'))
                                    _token.append(c);
                                else
                                {
                                    if (_returnQuotes)
                                        _token.append(c);
                                    escape = true;
                                }
                            }
                            else
                            {
                                _token.append(c);
                            }
                        }
                        case END ->
                        {
                            if (_delim.indexOf(c) >= 0)
                            {
                                _state = State.START;
                                if (_returnDelimiters)
                                {
                                    _token.append(c);
                                    return _hasToken = true;
                                }
                            }
                            else if (!_optionalWhiteSpace || !isOptionalWhiteSpace(c))
                                throw new IllegalArgumentException("characters after end quote");
                        }
                        default -> throw new IllegalStateException();
                    }
                }

                if (_state == State.QUOTE)
                    throw new IllegalArgumentException("unterminated quote");

                if (_ows >= 0 && _hasToken)
                    _token.setLength(_ows);

                return _hasToken;
            }

            @Override
            public String next()
            {
                if (!hasNext())
                    throw new NoSuchElementException();
                String t = _token.toString();
                _token.setLength(0);
                _hasToken = false;
                return t;
            }
        };
    }

    @Override
    public void quote(Appendable buffer, String input)
    {
        if (input == null)
            return;

        try
        {
            buffer.append('"');
            for (int i = 0; i < input.length(); ++i)
            {
                char c = input.charAt(i);
                if (c == '"' || c == '\\')
                    buffer.append('\\').append(c);
                else
                    buffer.append(c);
            }
            buffer.append('"');
        }
        catch (IOException x)
        {
            throw new RuntimeException(x);
        }
    }

    @Override
    public String quoteIfNeeded(String s)
    {
        return quoteIfNeededImpl(null, s);
    }

    @Override
    public void quoteIfNeeded(StringBuilder buf, String str)
    {
        quoteIfNeededImpl(buf, str);
    }

    @Override
    public boolean needsQuoting(char c)
    {
        return c == '\\' || c == '"' || _optionalWhiteSpace && Character.isWhitespace(c) || _delim.indexOf(c) >= 0;
    }

    private String quoteIfNeededImpl(StringBuilder buf, String str)
    {
        if (str == null)
            return null;
        if (str.length() == 0)
        {
            if (buf == null)
                return "\"\"";

            buf.append("\"\"");
            return null;
        }

        for (int i = 0; i < str.length(); i++)
        {
            char c = str.charAt(i);
            if (needsQuoting(c))
            {
                if (buf == null)
                    return quote(str);
                quote(buf, str);
                return null;
            }
        }

        // no special delimiters used, no quote needed.
        if (buf == null)
            return str;
        buf.append(str);
        return null;
    }

    @Override
    public String unquote(String s)
    {
        if (s == null)
            return null;
        if (s.length() < 2)
            return s;

        char first = s.charAt(0);
        char last = s.charAt(s.length() - 1);
        if (first != '"' || last != '"')
            return s;

        StringBuilder b = new StringBuilder(s.length() - 2);
        boolean escape = false;
        for (int i = 1; i < s.length() - 1; i++)
        {
            char c = s.charAt(i);

            if (escape)
            {
                escape = false;
                b.append(c);
            }
            else if (c == '\\')
            {
                escape = true;
            }
            else
            {
                b.append(c);
            }
        }

        return b.toString();
    }

    @Override
    public String toString()
    {
        StringBuilder out = new StringBuilder();
        out.append(getClass().getSimpleName()).append('@').append(Long.toHexString(hashCode()))
            .append("{'").append(_delim).append('\'');

        if (_optionalWhiteSpace)
            out.append(",optionalWhiteSpace");
        if (_returnDelimiters)
            out.append(",returnDelimiters");
        if (_returnQuotes)
            out.append(",returnQuotes");
        if (_embeddedQuotes)
            out.append(",embeddedQuotes");
        if (_escapeOnlyQuote)
            out.append(",escapeOnlyQuote");
        out.append('}');
        return out.toString();
    }
}




© 2015 - 2025 Weber Informatics LLC | Privacy Policy