All Downloads are FREE. Search and download functionalities are using the official Maven repository.

com.github.netty.protocol.mysql.MysqlCharacterSet Maven / Gradle / Ivy

The newest version!
/*
 * Copyright 2016 The Netty Project
 *
 * The Netty Project licenses this file to you under the Apache License,
 * version 2.0 (the "License"); you may not use this file except in compliance
 * with the License. You may obtain a copy of the License at:
 *
 *   http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS, WITHOUT
 * WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the
 * License for the specific language governing permissions and limitations
 * under the License.
 */

package com.github.netty.protocol.mysql;

import com.github.netty.core.util.LoggerFactoryX;
import com.github.netty.core.util.LoggerX;
import io.netty.util.collection.IntObjectHashMap;
import io.netty.util.collection.IntObjectMap;

import java.nio.charset.Charset;
import java.nio.charset.StandardCharsets;
import java.util.Arrays;
import java.util.Collections;
import java.util.HashMap;
import java.util.List;
import java.util.Map;
import java.util.stream.Collectors;

/**
 * MySQL collations known to this codec.
 *
 * <p>Each constant is named after a MySQL collation and carries three values: the MySQL
 * character set name it belongs to, the name of the Java charset used to encode/decode data
 * in that collation, and the numeric collation id.
 *
 * <p>Java charsets are resolved once during class initialization. A collation whose mapped
 * Java charset is not available on the running platform is reported with a warning and
 * {@link #getCharset()} returns UTF-8 for it.
 */
public enum MysqlCharacterSet {
    // A NO_CHARSET_INFO constant (id -1, "UTF-8") is currently disabled. It was meant to indicate
    // that the server sent no field-level character set information, so the driver should use
    // the connection-level character encoding instead.
    big5_chinese_ci("big5", "Big5", 1),
    latin2_czech_cs("latin2", "ISO8859_2", 2),
    dec8_swedish_ci("dec8", "Cp1252", 3),
    cp850_general_ci("cp850", "Cp850", 4),
    latin1_german1_ci("latin1", "Cp1252", 5),
    hp8_english_ci("hp8", "Cp1252", 6),
    koi8r_general_ci("koi8r", "KOI8_R", 7),
    latin1_swedish_ci("latin1", "Cp1252", 8),
    latin2_general_ci("latin2", "ISO8859_2", 9),
    swe7_swedish_ci("swe7", "Cp1252", 10),
    ascii_general_ci("ascii", "US-ASCII", 11),
    ujis_japanese_ci("ujis", "EUC_JP", 12),
    sjis_japanese_ci("sjis", "SJIS", 13),
    cp1251_bulgarian_ci("cp1251", "Cp1251", 14),
    latin1_danish_ci("latin1", "Cp1252", 15),
    hebrew_general_ci("hebrew", "ISO8859_8", 16),
    tis620_thai_ci("tis620", "TIS620", 18),
    euckr_korean_ci("euckr", "EUC_KR", 19),
    latin7_estonian_cs("latin7", "ISO-8859-13", 20),
    latin2_hungarian_ci("latin2", "ISO8859_2", 21),
    koi8u_general_ci("koi8u", "KOI8_R", 22),
    cp1251_ukrainian_ci("cp1251", "Cp1251", 23),
    gb2312_chinese_ci("gb2312", "EUC_CN", 24),
    greek_general_ci("greek", "ISO8859_7", 25),
    cp1250_general_ci("cp1250", "Cp1250", 26),
    latin2_croatian_ci("latin2", "ISO8859_2", 27),
    gbk_chinese_ci("gbk", "GBK", 28),
    cp1257_lithuanian_ci("cp1257", "Cp1257", 29),
    latin5_turkish_ci("latin5", "ISO8859_9", 30),
    latin1_german2_ci("latin1", "Cp1252", 31),
    armscii8_general_ci("armscii8", "Cp1252", 32),
    utf8_general_ci("utf8", "UTF-8", 33),
    cp1250_czech_cs("cp1250", "Cp1250", 34),
    ucs2_general_ci("ucs2", "UnicodeBig", 35),
    cp866_general_ci("cp866", "Cp866", 36),
    keybcs2_general_ci("keybcs2", "Cp852", 37),
    macce_general_ci("macce", "MacCentralEurope", 38),
    macroman_general_ci("macroman", "MacRoman", 39),
    cp852_general_ci("cp852", "Cp852", 40),
    latin7_general_ci("latin7", "ISO-8859-13", 41),
    latin7_general_cs("latin7", "ISO-8859-13", 42),
    macce_bin("macce", "MacCentralEurope", 43),
    cp1250_croatian_ci("cp1250", "Cp1250", 44),
    utf8mb4_general_ci("utf8mb4", "UTF-8", 45),
    utf8mb4_bin("utf8mb4", "UTF-8", 46),
    latin1_bin("latin1", "Cp1252", 47),
    latin1_general_ci("latin1", "Cp1252", 48),
    latin1_general_cs("latin1", "Cp1252", 49),
    cp1251_bin("cp1251", "Cp1251", 50),
    cp1251_general_ci("cp1251", "Cp1251", 51),
    cp1251_general_cs("cp1251", "Cp1251", 52),
    macroman_bin("macroman", "MacRoman", 53),
    utf16_general_ci("utf16", "UTF-16", 54),
    utf16_bin("utf16", "UTF-16", 55),
    utf16le_general_ci("utf16le", "UTF-16LE", 56),
    cp1256_general_ci("cp1256", "Cp1256", 57),
    cp1257_bin("cp1257", "Cp1257", 58),
    cp1257_general_ci("cp1257", "Cp1257", 59),
    utf32_general_ci("utf32", "UTF-32", 60),
    utf32_bin("utf32", "UTF-32", 61),
    utf16le_bin("utf16le", "UTF-16LE", 62),
    binary("binary", "ISO8859_1", 63),
    armscii8_bin("armscii8", "Cp1252", 64),
    ascii_bin("ascii", "US-ASCII", 65),
    cp1250_bin("cp1250", "Cp1250", 66),
    cp1256_bin("cp1256", "Cp1256", 67),
    cp866_bin("cp866", "Cp866", 68),
    dec8_bin("dec8", "Cp1252", 69),
    greek_bin("greek", "ISO8859_7", 70),
    hebrew_bin("hebrew", "ISO8859_8", 71),
    hp8_bin("hp8", "Cp1252", 72),
    keybcs2_bin("keybcs2", "Cp852", 73),
    koi8r_bin("koi8r", "KOI8_R", 74),
    koi8u_bin("koi8u", "KOI8_R", 75),
    latin2_bin("latin2", "ISO8859_2", 77),
    latin5_bin("latin5", "ISO8859_9", 78),
    latin7_bin("latin7", "ISO-8859-13", 79),
    cp850_bin("cp850", "Cp850", 80),
    cp852_bin("cp852", "Cp852", 81),
    swe7_bin("swe7", "Cp1252", 82),
    utf8_bin("utf8", "UTF-8", 83),
    big5_bin("big5", "Big5", 84),
    euckr_bin("euckr", "EUC_KR", 85),
    gb2312_bin("gb2312", "EUC_CN", 86),
    gbk_bin("gbk", "GBK", 87),
    sjis_bin("sjis", "SJIS", 88),
    tis620_bin("tis620", "TIS620", 89),
    ucs2_bin("ucs2", "UnicodeBig", 90),
    ujis_bin("ujis", "EUC_JP", 91),
    geostd8_general_ci("geostd8", "Cp1252", 92),
    geostd8_bin("geostd8", "Cp1252", 93),
    latin1_spanish_ci("latin1", "Cp1252", 94),
    cp932_japanese_ci("cp932", "Cp932", 95),
    cp932_bin("cp932", "Cp932", 96),
    eucjpms_japanese_ci("eucjpms", "EUC_JP_Solaris", 97),
    eucjpms_bin("eucjpms", "EUC_JP_Solaris", 98),
    cp1250_polish_ci("cp1250", "Cp1250", 99),
    utf16_unicode_ci("utf16", "UTF-16", 101),
    utf16_icelandic_ci("utf16", "UTF-16", 102),
    utf16_latvian_ci("utf16", "UTF-16", 103),
    utf16_romanian_ci("utf16", "UTF-16", 104),
    utf16_slovenian_ci("utf16", "UTF-16", 105),
    utf16_polish_ci("utf16", "UTF-16", 106),
    utf16_estonian_ci("utf16", "UTF-16", 107),
    utf16_spanish_ci("utf16", "UTF-16", 108),
    utf16_swedish_ci("utf16", "UTF-16", 109),
    utf16_turkish_ci("utf16", "UTF-16", 110),
    utf16_czech_ci("utf16", "UTF-16", 111),
    utf16_danish_ci("utf16", "UTF-16", 112),
    utf16_lithuanian_ci("utf16", "UTF-16", 113),
    utf16_slovak_ci("utf16", "UTF-16", 114),
    utf16_spanish2_ci("utf16", "UTF-16", 115),
    utf16_roman_ci("utf16", "UTF-16", 116),
    utf16_persian_ci("utf16", "UTF-16", 117),
    utf16_esperanto_ci("utf16", "UTF-16", 118),
    utf16_hungarian_ci("utf16", "UTF-16", 119),
    utf16_sinhala_ci("utf16", "UTF-16", 120),
    utf16_german2_ci("utf16", "UTF-16", 121),
    utf16_croatian_ci("utf16", "UTF-16", 122),
    utf16_unicode_520_ci("utf16", "UTF-16", 123),
    utf16_vietnamese_ci("utf16", "UTF-16", 124),
    ucs2_unicode_ci("ucs2", "UnicodeBig", 128),
    ucs2_icelandic_ci("ucs2", "UnicodeBig", 129),
    ucs2_latvian_ci("ucs2", "UnicodeBig", 130),
    ucs2_romanian_ci("ucs2", "UnicodeBig", 131),
    ucs2_slovenian_ci("ucs2", "UnicodeBig", 132),
    ucs2_polish_ci("ucs2", "UnicodeBig", 133),
    ucs2_estonian_ci("ucs2", "UnicodeBig", 134),
    ucs2_spanish_ci("ucs2", "UnicodeBig", 135),
    ucs2_swedish_ci("ucs2", "UnicodeBig", 136),
    ucs2_turkish_ci("ucs2", "UnicodeBig", 137),
    ucs2_czech_ci("ucs2", "UnicodeBig", 138),
    ucs2_danish_ci("ucs2", "UnicodeBig", 139),
    ucs2_lithuanian_ci("ucs2", "UnicodeBig", 140),
    ucs2_slovak_ci("ucs2", "UnicodeBig", 141),
    ucs2_spanish2_ci("ucs2", "UnicodeBig", 142),
    ucs2_roman_ci("ucs2", "UnicodeBig", 143),
    ucs2_persian_ci("ucs2", "UnicodeBig", 144),
    ucs2_esperanto_ci("ucs2", "UnicodeBig", 145),
    ucs2_hungarian_ci("ucs2", "UnicodeBig", 146),
    ucs2_sinhala_ci("ucs2", "UnicodeBig", 147),
    ucs2_german2_ci("ucs2", "UnicodeBig", 148),
    ucs2_croatian_ci("ucs2", "UnicodeBig", 149),
    ucs2_unicode_520_ci("ucs2", "UnicodeBig", 150),
    ucs2_vietnamese_ci("ucs2", "UnicodeBig", 151),
    ucs2_general_mysql500_ci("ucs2", "UnicodeBig", 159),
    utf32_unicode_ci("utf32", "UTF-32", 160),
    utf32_icelandic_ci("utf32", "UTF-32", 161),
    utf32_latvian_ci("utf32", "UTF-32", 162),
    utf32_romanian_ci("utf32", "UTF-32", 163),
    utf32_slovenian_ci("utf32", "UTF-32", 164),
    utf32_polish_ci("utf32", "UTF-32", 165),
    utf32_estonian_ci("utf32", "UTF-32", 166),
    utf32_spanish_ci("utf32", "UTF-32", 167),
    utf32_swedish_ci("utf32", "UTF-32", 168),
    utf32_turkish_ci("utf32", "UTF-32", 169),
    utf32_czech_ci("utf32", "UTF-32", 170),
    utf32_danish_ci("utf32", "UTF-32", 171),
    utf32_lithuanian_ci("utf32", "UTF-32", 172),
    utf32_slovak_ci("utf32", "UTF-32", 173),
    utf32_spanish2_ci("utf32", "UTF-32", 174),
    utf32_roman_ci("utf32", "UTF-32", 175),
    utf32_persian_ci("utf32", "UTF-32", 176),
    utf32_esperanto_ci("utf32", "UTF-32", 177),
    utf32_hungarian_ci("utf32", "UTF-32", 178),
    utf32_sinhala_ci("utf32", "UTF-32", 179),
    utf32_german2_ci("utf32", "UTF-32", 180),
    utf32_croatian_ci("utf32", "UTF-32", 181),
    utf32_unicode_520_ci("utf32", "UTF-32", 182),
    utf32_vietnamese_ci("utf32", "UTF-32", 183),
    utf8_unicode_ci("utf8", "UTF-8", 192),
    utf8_icelandic_ci("utf8", "UTF-8", 193),
    utf8_latvian_ci("utf8", "UTF-8", 194),
    utf8_romanian_ci("utf8", "UTF-8", 195),
    utf8_slovenian_ci("utf8", "UTF-8", 196),
    utf8_polish_ci("utf8", "UTF-8", 197),
    utf8_estonian_ci("utf8", "UTF-8", 198),
    utf8_spanish_ci("utf8", "UTF-8", 199),
    utf8_swedish_ci("utf8", "UTF-8", 200),
    utf8_turkish_ci("utf8", "UTF-8", 201),
    utf8_czech_ci("utf8", "UTF-8", 202),
    utf8_danish_ci("utf8", "UTF-8", 203),
    utf8_lithuanian_ci("utf8", "UTF-8", 204),
    utf8_slovak_ci("utf8", "UTF-8", 205),
    utf8_spanish2_ci("utf8", "UTF-8", 206),
    utf8_roman_ci("utf8", "UTF-8", 207),
    utf8_persian_ci("utf8", "UTF-8", 208),
    utf8_esperanto_ci("utf8", "UTF-8", 209),
    utf8_hungarian_ci("utf8", "UTF-8", 210),
    utf8_sinhala_ci("utf8", "UTF-8", 211),
    utf8_german2_ci("utf8", "UTF-8", 212),
    utf8_croatian_ci("utf8", "UTF-8", 213),
    utf8_unicode_520_ci("utf8", "UTF-8", 214),
    utf8_vietnamese_ci("utf8", "UTF-8", 215),
    utf8_general_mysql500_ci("utf8", "UTF-8", 223),
    utf8mb4_unicode_ci("utf8mb4", "UTF-8", 224),
    utf8mb4_icelandic_ci("utf8mb4", "UTF-8", 225),
    utf8mb4_latvian_ci("utf8mb4", "UTF-8", 226),
    utf8mb4_romanian_ci("utf8mb4", "UTF-8", 227),
    utf8mb4_slovenian_ci("utf8mb4", "UTF-8", 228),
    utf8mb4_polish_ci("utf8mb4", "UTF-8", 229),
    utf8mb4_estonian_ci("utf8mb4", "UTF-8", 230),
    utf8mb4_spanish_ci("utf8mb4", "UTF-8", 231),
    utf8mb4_swedish_ci("utf8mb4", "UTF-8", 232),
    utf8mb4_turkish_ci("utf8mb4", "UTF-8", 233),
    utf8mb4_czech_ci("utf8mb4", "UTF-8", 234),
    utf8mb4_danish_ci("utf8mb4", "UTF-8", 235),
    utf8mb4_lithuanian_ci("utf8mb4", "UTF-8", 236),
    utf8mb4_slovak_ci("utf8mb4", "UTF-8", 237),
    utf8mb4_spanish2_ci("utf8mb4", "UTF-8", 238),
    utf8mb4_roman_ci("utf8mb4", "UTF-8", 239),
    utf8mb4_persian_ci("utf8mb4", "UTF-8", 240),
    utf8mb4_esperanto_ci("utf8mb4", "UTF-8", 241),
    utf8mb4_hungarian_ci("utf8mb4", "UTF-8", 242),
    utf8mb4_sinhala_ci("utf8mb4", "UTF-8", 243),
    utf8mb4_german2_ci("utf8mb4", "UTF-8", 244),
    utf8mb4_croatian_ci("utf8mb4", "UTF-8", 245),
    utf8mb4_unicode_520_ci("utf8mb4", "UTF-8", 246),
    utf8mb4_vietnamese_ci("utf8mb4", "UTF-8", 247),
    gb18030_chinese_ci("gb18030", "GB18030", 248),
    gb18030_bin("gb18030", "GB18030", 249),
    gb18030_unicode_520_ci("gb18030", "GB18030", 250),
    utf8mb4_0900_ai_ci("utf8mb4", "UTF-8", 255);

    /** Collation returned by {@link #findById(int)} when the id is not known. */
    public static final MysqlCharacterSet DEFAULT = utf8mb4_general_ci;

    /** Names of all collations declared in this enum, in declaration order (unmodifiable). */
    public static final List<String> SUPPORTED_COLLATION_NAMES = Collections.unmodifiableList(
            Arrays.stream(values()).map(Enum::name).collect(Collectors.toList()));

    /** Distinct MySQL character set names covered by the declared collations (unmodifiable). */
    public static final List<String> SUPPORTED_CHARSET_NAMES = Collections.unmodifiableList(
            Arrays.stream(values()).map(MysqlCharacterSet::getMysqlCharsetName).distinct().collect(Collectors.toList()));

    private static final LoggerX LOGGER = LoggerFactoryX.getLogger(MysqlCharacterSet.class);

    /** MySQL character set name -> name of its default collation. */
    private static final Map<String, String> charsetToDefaultCollationMapping = new HashMap<>();

    /** Collation id -> resolved Java charset; ids whose charset is unavailable are absent. */
    private static final IntObjectMap<Charset> idToJavaCharsetMapping = new IntObjectHashMap<>();

    /** Collation id -> enum constant, so lookups by id do not have to scan {@code values()}. */
    private static final IntObjectMap<MysqlCharacterSet> idToCollationMapping = new IntObjectHashMap<>();

    static {
        charsetToDefaultCollationMapping.put("big5", "big5_chinese_ci");
        charsetToDefaultCollationMapping.put("dec8", "dec8_swedish_ci");
        charsetToDefaultCollationMapping.put("cp850", "cp850_general_ci");
        charsetToDefaultCollationMapping.put("hp8", "hp8_english_ci");
        charsetToDefaultCollationMapping.put("koi8r", "koi8r_general_ci");
        charsetToDefaultCollationMapping.put("latin1", "latin1_swedish_ci");
        charsetToDefaultCollationMapping.put("latin2", "latin2_general_ci");
        charsetToDefaultCollationMapping.put("swe7", "swe7_swedish_ci");
        charsetToDefaultCollationMapping.put("ascii", "ascii_general_ci");
        charsetToDefaultCollationMapping.put("ujis", "ujis_japanese_ci");
        charsetToDefaultCollationMapping.put("sjis", "sjis_japanese_ci");
        charsetToDefaultCollationMapping.put("hebrew", "hebrew_general_ci");
        charsetToDefaultCollationMapping.put("tis620", "tis620_thai_ci");
        charsetToDefaultCollationMapping.put("euckr", "euckr_korean_ci");
        charsetToDefaultCollationMapping.put("koi8u", "koi8u_general_ci");
        charsetToDefaultCollationMapping.put("gb2312", "gb2312_chinese_ci");
        charsetToDefaultCollationMapping.put("greek", "greek_general_ci");
        charsetToDefaultCollationMapping.put("cp1250", "cp1250_general_ci");
        charsetToDefaultCollationMapping.put("gbk", "gbk_chinese_ci");
        charsetToDefaultCollationMapping.put("latin5", "latin5_turkish_ci");
        charsetToDefaultCollationMapping.put("armscii8", "armscii8_general_ci");
        charsetToDefaultCollationMapping.put("utf8", "utf8_general_ci");
        charsetToDefaultCollationMapping.put("ucs2", "ucs2_general_ci");
        charsetToDefaultCollationMapping.put("cp866", "cp866_general_ci");
        charsetToDefaultCollationMapping.put("keybcs2", "keybcs2_general_ci");
        charsetToDefaultCollationMapping.put("macce", "macce_general_ci");
        charsetToDefaultCollationMapping.put("macroman", "macroman_general_ci");
        charsetToDefaultCollationMapping.put("cp852", "cp852_general_ci");
        charsetToDefaultCollationMapping.put("latin7", "latin7_general_ci");
        charsetToDefaultCollationMapping.put("utf8mb4", "utf8mb4_general_ci");
        charsetToDefaultCollationMapping.put("cp1251", "cp1251_general_ci");
        charsetToDefaultCollationMapping.put("utf16", "utf16_general_ci");
        charsetToDefaultCollationMapping.put("utf16le", "utf16le_general_ci");
        charsetToDefaultCollationMapping.put("cp1256", "cp1256_general_ci");
        charsetToDefaultCollationMapping.put("cp1257", "cp1257_general_ci");
        charsetToDefaultCollationMapping.put("utf32", "utf32_general_ci");
        charsetToDefaultCollationMapping.put("binary", "binary");
        charsetToDefaultCollationMapping.put("geostd8", "geostd8_general_ci");
        charsetToDefaultCollationMapping.put("cp932", "cp932_japanese_ci");
        charsetToDefaultCollationMapping.put("eucjpms", "eucjpms_japanese_ci");
        charsetToDefaultCollationMapping.put("gb18030", "gb18030_chinese_ci");

        for (MysqlCharacterSet collation : MysqlCharacterSet.values()) {
            // Keep the first constant declared for an id, matching a front-to-back scan of values().
            if (!idToCollationMapping.containsKey(collation.id)) {
                idToCollationMapping.put(collation.id, collation);
            }
            try {
                Charset charset = Charset.forName(collation.mappedJavaCharsetName);
                idToJavaCharsetMapping.put(collation.id, charset);
            } catch (IllegalArgumentException e) {
                // Charset.forName reports illegal or unsupported names with IllegalArgumentException
                // subclasses. Leave the id unmapped so getCharset() falls back to UTF-8.
                LOGGER.warn(String.format("Java charset: [%s] is not supported by this platform, data with collation[%s] will be decoded in UTF-8 instead.", collation.mappedJavaCharsetName, collation.name()));
            }
        }
    }

    private final String mysqlCharsetName;
    private final String mappedJavaCharsetName;
    private final int id;

    /**
     * @param mysqlCharsetName      name of the MySQL character set this collation belongs to
     * @param mappedJavaCharsetName name of the Java charset used for this collation
     * @param id                    numeric id of the collation
     */
    MysqlCharacterSet(String mysqlCharsetName, String mappedJavaCharsetName, int id) {
        this.mysqlCharsetName = mysqlCharsetName;
        this.mappedJavaCharsetName = mappedJavaCharsetName;
        this.id = id;
    }

    /**
     * Looks up a collation by its numeric id.
     *
     * @param id collation id
     * @return the matching collation, or {@link #DEFAULT} if the id is unknown
     */
    public static MysqlCharacterSet findById(int id) {
        return findById(id, DEFAULT);
    }

    /**
     * Looks up a collation by its numeric id, with a caller-supplied fallback.
     *
     * @param id           collation id
     * @param characterSet value to return when no collation has the given id (may be {@code null})
     * @return the matching collation, or {@code characterSet} if the id is unknown
     */
    public static MysqlCharacterSet findById(int id, MysqlCharacterSet characterSet) {
        MysqlCharacterSet found = idToCollationMapping.get(id);
        return found != null ? found : characterSet;
    }

    /**
     * Returns the name of the default collation of a MySQL character set.
     *
     * @param charset MySQL character set name, e.g. {@code "utf8mb4"}
     * @return name of the default collation for that character set
     * @throws IllegalArgumentException if the character set name is not known
     */
    public static String getDefaultCollationFromCharsetName(String charset) {
        String defaultCollationName = charsetToDefaultCollationMapping.get(charset);
        if (defaultCollationName == null) {
            throw new IllegalArgumentException("Unknown charset name: [" + charset + "]");
        }
        return defaultCollationName;
    }

    /**
     * Returns the Java charset used for data in this collation.
     *
     * @return the charset resolved at class initialization, or UTF-8 when the mapped Java
     *         charset is not supported by this platform
     */
    public Charset getCharset() {
        Charset charset = idToJavaCharsetMapping.get(id);
        return charset != null ? charset : StandardCharsets.UTF_8;
    }

    /**
     * @return numeric id of this collation
     */
    public int getId() {
        return id;
    }

    /**
     * @return name of the MySQL character set this collation belongs to
     */
    public String getMysqlCharsetName() {
        return mysqlCharsetName;
    }

    /**
     * @return name of the Java charset mapped to this collation
     */
    public String getMappedJavaCharsetName() {
        return mappedJavaCharsetName;
    }
}




© 2015 - 2024 Weber Informatics LLC | Privacy Policy