All Downloads are FREE. Search and download functionalities are using the official Maven repository.

com.yahoo.vespa.model.application.validation.TokenizeAndDeQuote Maven / Gradle / Ivy

There is a newer version: 8.409.18
Show newest version
// Copyright Vespa.ai. Licensed under the terms of the Apache 2.0 license. See LICENSE in the project root.
package com.yahoo.vespa.model.application.validation;

import java.util.ArrayList;
import java.util.List;

/**
 * Splits a string into tokens on a configurable set of delimiter characters,
 * while removing quotes from any quoted text and resolving backslash escapes.
 *
 * <p>Rules applied while scanning the input left to right:
 * <ul>
 *   <li>A backslash followed by another character appends that character verbatim,
 *       both inside and outside quoted sections. A backslash that is the very last
 *       character of the input is not treated as an escape.</li>
 *   <li>Outside a quoted section, any delimiter character ends the current token.
 *       Consecutive delimiters therefore produce empty tokens.</li>
 *   <li>Outside a quoted section, any quote character opens a quoted section, which is
 *       closed by the next unescaped occurrence of the same quote character. The
 *       quote characters themselves are not part of the token.</li>
 *   <li>Inside a quoted section, delimiters and other quote characters are ordinary text.</li>
 *   <li>A quoted section that is never closed simply runs to the end of the input.</li>
 *   <li>The text remaining after the last delimiter is only added as a token if it is
 *       non-empty, so a trailing delimiter does not produce a trailing empty token.</li>
 * </ul>
 *
 * @author baldersheim
 */
public class TokenizeAndDeQuote {
    private static final char ESCAPE = '\\';
    private final String delims;
    private final String quotes;

    /**
     * Creates a tokenizer.
     *
     * @param delims the characters that separate tokens; each character is a delimiter on its own
     * @param quotes the characters that may open (and then close) a quoted section
     */
    public TokenizeAndDeQuote(String delims, String quotes) {
        this.delims = delims;
        this.quotes = quotes;
    }

    /**
     * Tokenizes the given string according to the rules described on this class.
     *
     * @param string the text to split
     * @return the tokens in order of appearance, with quotes and escape characters removed;
     *         empty if the input yields no tokens
     */
    public List<String> tokenize(String string) {
        StringBuilder current = new StringBuilder();
        List<String> tokens = new ArrayList<>();
        char quote = 0; // The quote character that opened the current quoted section, 0 when outside quotes

        for (int i = 0; i < string.length(); i++) {
            char c = string.charAt(i);

            if ((c == ESCAPE) && (i + 1 < string.length())) {
                // Escaped, append next char and skip past it
                current.append(string.charAt(++i));
            } else if ((quote == 0) && (delims.indexOf(c) >= 0)) {
                // Delimiter found outside quoted section, add token (possibly empty) and start next
                tokens.add(current.toString());
                current.setLength(0);
            } else if ((quote == 0) && (quotes.indexOf(c) >= 0)) {
                // Start of quote, remember which character must close it
                quote = c;
            } else if (quote == c) {
                // End of quote
                quote = 0;
            } else {
                current.append(c);
            }
        }

        if ( ! current.isEmpty()) {
            // And then the last token if any
            tokens.add(current.toString());
        }

        return tokens;
    }
}




© 2015 - 2024 Weber Informatics LLC | Privacy Policy