All Downloads are FREE. Search and download functionalities are using the official Maven repository.

ch.randelshofer.fastdoubleparser.bte.ByteTrie Maven / Gradle / Ivy

The newest version!
/*
 * @(#)ByteTrie.java
 * Copyright © 2024 Werner Randelshofer, Switzerland. MIT License.
 */
package ch.randelshofer.fastdoubleparser.bte;

import java.nio.charset.StandardCharsets;
import java.util.HashSet;
import java.util.LinkedHashSet;
import java.util.Set;

/**
 * Interface for a data retrieval tree (trie) of bytes.
 */
public interface ByteTrie {


    /**
     * Searches for the longest matching string in the trie
     * that matches the provided string.
     *
     * @param str a string in the form of a byte array
     * @return the length of the longest matching string, or 0 if no string matches
     */
    default int match(byte[] str) {
        return match(str, 0, str.length);
    }


    /**
     * Searches for the longest matching string in the trie
     * that matches the provided string.
     *
     * @param str        a string
     * @param startIndex start index (inclusive)
     * @param endIndex   end index (exclusive)
     * @return the length of the longest matching string, or 0 if no string matches
     */
    int match(byte[] str, int startIndex, int endIndex);

    /**
     * Creates a new {@link ByteTrie} from the provided set.
     *
     * @param set        a set of strings
     * @param ignoreCase whether the {@link ByteTrie} shall ignore the
     *                   case of the characters
     * @return a new {@link ByteTrie} instance
     */
    static ByteTrie copyOf(Set set, boolean ignoreCase) {
        switch (set.size()) {
            case 0:
                return new ByteTrieOfNone();
            case 1:
                String str = set.iterator().next();
                if (ignoreCase) {
                    switch (str.length()) {
                        case 0:
                            return new ByteTrieOfNone();
                        case 1:
                            LinkedHashSet newSet = new LinkedHashSet<>();
                            newSet.add(str.toLowerCase());
                            newSet.add(str.toUpperCase());
                            if (newSet.size() == 1) {
                                if (newSet.iterator().next().getBytes(StandardCharsets.UTF_8).length == 1) {
                                    return new ByteTrieOfOneSingleByte(newSet);
                                }
                                return new ByteTrieOfOne(newSet);
                            }
                            return new ByteTrieOfFew(newSet);
                        default:
                            return new ByteTrieOfFewIgnoreCase(set);
                    }
                }
                if (set.iterator().next().getBytes(StandardCharsets.UTF_8).length == 1) {
                    return new ByteTrieOfOneSingleByte(set);
                }
                return new ByteTrieOfOne(set);
            default:
                if (ignoreCase) {
                    return new ByteTrieOfFewIgnoreCase(set);
                }
                return new ByteTrieOfFew(set);
        }
    }

    /**
     * Creates a new {@link ByteTrie} from the provided set.
     *
     * @param set a set of characters
     * @param ignoreCase whether the {@link ByteTrie} shall ignore the
     *                   case of the characters
     * @return a new {@link ByteTrie} instance
     */
    static ByteTrie copyOfChars(Set set, boolean ignoreCase) {
        Set strSet = new HashSet<>(set.size() * 2);
        if (ignoreCase) {
            for (char ch : set) {
                String string = new String(new char[]{ch});
                strSet.add(string.toLowerCase());
                strSet.add(string.toUpperCase());

            }
            return copyOf(strSet, false);
        }

        for (char ch : set) {
            strSet.add(new String(new char[]{ch}));

        }
        return copyOf(strSet, ignoreCase);
    }
}




© 2015 - 2025 Weber Informatics LLC | Privacy Policy