org.lealone.plugins.mysql.server.util.CharsetUtil Maven / Gradle / Ivy
/*
* Copyright 1999-2012 Alibaba Group.
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.lealone.plugins.mysql.server.util;
import java.util.HashMap;
import java.util.Map;
/**
* @author xianmao.hexm 2010-8-3 下午06:12:53
*/
public final class CharsetUtil {
private static final String[] INDEX_TO_CHARSET = new String[99];
private static final String[] INDEX_TO_DB_CHARSET = new String[99];
private static final Map CHARSET_TO_INDEX = new HashMap<>();
private static final Map DB_CHARSET_TO_INDEX = new HashMap<>();
// public static final String UTF8_MB4 = "utf8mb4";
// public static final String UTF8 = "utf8";
static {
// index --> charset
// http://dev.mysql.com/doc/internals/en/character-set.html#packet-Protocol::CharacterSet
// SELECT id, collation_name FROM information_schema.collations ORDER BY id;
INDEX_TO_CHARSET[1] = "big5";
INDEX_TO_CHARSET[2] = "czech";
INDEX_TO_CHARSET[3] = "dec8";
INDEX_TO_CHARSET[4] = "dos";
INDEX_TO_CHARSET[5] = "german1";
INDEX_TO_CHARSET[6] = "hp8";
INDEX_TO_CHARSET[7] = "koi8_ru";
INDEX_TO_CHARSET[8] = "latin1";
INDEX_TO_CHARSET[9] = "latin2";
INDEX_TO_CHARSET[10] = "swe7";
INDEX_TO_CHARSET[11] = "usa7";
INDEX_TO_CHARSET[12] = "ujis";
INDEX_TO_CHARSET[13] = "sjis";
INDEX_TO_CHARSET[14] = "cp1251";
INDEX_TO_CHARSET[15] = "danish";
INDEX_TO_CHARSET[16] = "hebrew";
INDEX_TO_CHARSET[18] = "tis620";
INDEX_TO_CHARSET[19] = "euc_kr";
INDEX_TO_CHARSET[20] = "estonia";
INDEX_TO_CHARSET[21] = "hungarian";
INDEX_TO_CHARSET[22] = "koi8_ukr";
INDEX_TO_CHARSET[23] = "win1251ukr";
INDEX_TO_CHARSET[24] = "gb2312";
INDEX_TO_CHARSET[25] = "greek";
INDEX_TO_CHARSET[26] = "win1250";
INDEX_TO_CHARSET[27] = "croat";
INDEX_TO_CHARSET[28] = "gbk";
INDEX_TO_CHARSET[29] = "cp1257";
INDEX_TO_CHARSET[30] = "latin5";
INDEX_TO_CHARSET[31] = "latin1_de";
INDEX_TO_CHARSET[32] = "armscii8";
INDEX_TO_CHARSET[33] = "utf8";
INDEX_TO_CHARSET[34] = "win1250ch";
INDEX_TO_CHARSET[35] = "ucs2";
INDEX_TO_CHARSET[36] = "cp866";
INDEX_TO_CHARSET[37] = "keybcs2";
INDEX_TO_CHARSET[38] = "macce";
INDEX_TO_CHARSET[39] = "macroman";
INDEX_TO_CHARSET[40] = "pclatin2";
INDEX_TO_CHARSET[41] = "latvian";
INDEX_TO_CHARSET[42] = "latvian1";
INDEX_TO_CHARSET[43] = "maccebin";
INDEX_TO_CHARSET[44] = "macceciai";
INDEX_TO_CHARSET[45] = "utf8";
INDEX_TO_CHARSET[46] = "utf8";
INDEX_TO_CHARSET[47] = "latin1bin";
INDEX_TO_CHARSET[48] = "latin1cias";
INDEX_TO_CHARSET[49] = "latin1csas";
INDEX_TO_CHARSET[50] = "cp1251bin";
INDEX_TO_CHARSET[51] = "cp1251cias";
INDEX_TO_CHARSET[52] = "cp1251csas";
INDEX_TO_CHARSET[53] = "macromanbin";
INDEX_TO_CHARSET[54] = "macromancias";
INDEX_TO_CHARSET[55] = "macromanciai";
INDEX_TO_CHARSET[56] = "macromancsas";
INDEX_TO_CHARSET[57] = "cp1256";
INDEX_TO_CHARSET[63] = "binary";
INDEX_TO_CHARSET[64] = "armscii";
INDEX_TO_CHARSET[65] = "ascii";
INDEX_TO_CHARSET[66] = "cp1250";
INDEX_TO_CHARSET[67] = "cp1256";
INDEX_TO_CHARSET[68] = "cp866";
INDEX_TO_CHARSET[69] = "dec8";
INDEX_TO_CHARSET[70] = "greek";
INDEX_TO_CHARSET[71] = "hebrew";
INDEX_TO_CHARSET[72] = "hp8";
INDEX_TO_CHARSET[73] = "keybcs2";
INDEX_TO_CHARSET[74] = "koi8r";
INDEX_TO_CHARSET[75] = "koi8ukr";
INDEX_TO_CHARSET[77] = "latin2";
INDEX_TO_CHARSET[78] = "latin5";
INDEX_TO_CHARSET[79] = "latin7";
INDEX_TO_CHARSET[80] = "cp850";
INDEX_TO_CHARSET[81] = "cp852";
INDEX_TO_CHARSET[82] = "swe7";
INDEX_TO_CHARSET[83] = "utf8";
INDEX_TO_CHARSET[84] = "big5";
INDEX_TO_CHARSET[85] = "euckr";
INDEX_TO_CHARSET[86] = "gb2312";
INDEX_TO_CHARSET[87] = "gbk";
INDEX_TO_CHARSET[88] = "sjis";
INDEX_TO_CHARSET[89] = "tis620";
INDEX_TO_CHARSET[90] = "ucs2";
INDEX_TO_CHARSET[91] = "ujis";
INDEX_TO_CHARSET[92] = "geostd8";
INDEX_TO_CHARSET[93] = "geostd8";
INDEX_TO_CHARSET[94] = "latin1";
INDEX_TO_CHARSET[95] = "cp932";
INDEX_TO_CHARSET[96] = "cp932";
INDEX_TO_CHARSET[97] = "eucjpms";
INDEX_TO_CHARSET[98] = "eucjpms";
INDEX_TO_DB_CHARSET[1] = "big5";
INDEX_TO_DB_CHARSET[2] = "czech";
INDEX_TO_DB_CHARSET[3] = "dec8";
INDEX_TO_DB_CHARSET[4] = "dos";
INDEX_TO_DB_CHARSET[5] = "german1";
INDEX_TO_DB_CHARSET[6] = "hp8";
INDEX_TO_DB_CHARSET[7] = "koi8_ru";
INDEX_TO_DB_CHARSET[8] = "latin1";
INDEX_TO_DB_CHARSET[9] = "latin2";
INDEX_TO_DB_CHARSET[10] = "swe7";
INDEX_TO_DB_CHARSET[11] = "usa7";
INDEX_TO_DB_CHARSET[12] = "ujis";
INDEX_TO_DB_CHARSET[13] = "sjis";
INDEX_TO_DB_CHARSET[14] = "cp1251";
INDEX_TO_DB_CHARSET[15] = "danish";
INDEX_TO_DB_CHARSET[16] = "hebrew";
INDEX_TO_DB_CHARSET[18] = "tis620";
INDEX_TO_DB_CHARSET[19] = "euc_kr";
INDEX_TO_DB_CHARSET[20] = "estonia";
INDEX_TO_DB_CHARSET[21] = "hungarian";
INDEX_TO_DB_CHARSET[22] = "koi8_ukr";
INDEX_TO_DB_CHARSET[23] = "win1251ukr";
INDEX_TO_DB_CHARSET[24] = "gb2312";
INDEX_TO_DB_CHARSET[25] = "greek";
INDEX_TO_DB_CHARSET[26] = "win1250";
INDEX_TO_DB_CHARSET[27] = "croat";
INDEX_TO_DB_CHARSET[28] = "gbk";
INDEX_TO_DB_CHARSET[29] = "cp1257";
INDEX_TO_DB_CHARSET[30] = "latin5";
INDEX_TO_DB_CHARSET[31] = "latin1_de";
INDEX_TO_DB_CHARSET[32] = "armscii8";
INDEX_TO_DB_CHARSET[33] = "utf8";
INDEX_TO_DB_CHARSET[34] = "win1250ch";
INDEX_TO_DB_CHARSET[35] = "ucs2";
INDEX_TO_DB_CHARSET[36] = "cp866";
INDEX_TO_DB_CHARSET[37] = "keybcs2";
INDEX_TO_DB_CHARSET[38] = "macce";
INDEX_TO_DB_CHARSET[39] = "macroman";
INDEX_TO_DB_CHARSET[40] = "pclatin2";
INDEX_TO_DB_CHARSET[41] = "latvian";
INDEX_TO_DB_CHARSET[42] = "latvian1";
INDEX_TO_DB_CHARSET[43] = "maccebin";
INDEX_TO_DB_CHARSET[44] = "macceciai";
INDEX_TO_DB_CHARSET[45] = "utf8mb4";
INDEX_TO_DB_CHARSET[46] = "";
INDEX_TO_DB_CHARSET[47] = "latin1bin";
INDEX_TO_DB_CHARSET[48] = "latin1cias";
INDEX_TO_DB_CHARSET[49] = "latin1csas";
INDEX_TO_DB_CHARSET[50] = "cp1251bin";
INDEX_TO_DB_CHARSET[51] = "cp1251cias";
INDEX_TO_DB_CHARSET[52] = "cp1251csas";
INDEX_TO_DB_CHARSET[53] = "macromanbin";
INDEX_TO_DB_CHARSET[54] = "macromancias";
INDEX_TO_DB_CHARSET[55] = "macromanciai";
INDEX_TO_DB_CHARSET[56] = "macromancsas";
INDEX_TO_DB_CHARSET[57] = "cp1256";
INDEX_TO_DB_CHARSET[63] = "binary";
INDEX_TO_DB_CHARSET[64] = "armscii";
INDEX_TO_DB_CHARSET[65] = "ascii";
INDEX_TO_DB_CHARSET[66] = "cp1250";
INDEX_TO_DB_CHARSET[67] = "cp1256";
INDEX_TO_DB_CHARSET[68] = "cp866";
INDEX_TO_DB_CHARSET[69] = "dec8";
INDEX_TO_DB_CHARSET[70] = "greek";
INDEX_TO_DB_CHARSET[71] = "hebrew";
INDEX_TO_DB_CHARSET[72] = "hp8";
INDEX_TO_DB_CHARSET[73] = "keybcs2";
INDEX_TO_DB_CHARSET[74] = "koi8r";
INDEX_TO_DB_CHARSET[75] = "koi8ukr";
INDEX_TO_DB_CHARSET[77] = "latin2";
INDEX_TO_DB_CHARSET[78] = "latin5";
INDEX_TO_DB_CHARSET[79] = "latin7";
INDEX_TO_DB_CHARSET[80] = "cp850";
INDEX_TO_DB_CHARSET[81] = "cp852";
INDEX_TO_DB_CHARSET[82] = "swe7";
INDEX_TO_DB_CHARSET[83] = "utf8";
INDEX_TO_DB_CHARSET[84] = "big5";
INDEX_TO_DB_CHARSET[85] = "euckr";
INDEX_TO_DB_CHARSET[86] = "gb2312";
INDEX_TO_DB_CHARSET[87] = "gbk";
INDEX_TO_DB_CHARSET[88] = "sjis";
INDEX_TO_DB_CHARSET[89] = "tis620";
INDEX_TO_DB_CHARSET[90] = "ucs2";
INDEX_TO_DB_CHARSET[91] = "ujis";
INDEX_TO_DB_CHARSET[92] = "geostd8";
INDEX_TO_DB_CHARSET[93] = "geostd8";
INDEX_TO_DB_CHARSET[94] = "latin1";
INDEX_TO_DB_CHARSET[95] = "cp932";
INDEX_TO_DB_CHARSET[96] = "cp932";
INDEX_TO_DB_CHARSET[97] = "eucjpms";
INDEX_TO_DB_CHARSET[98] = "eucjpms";
// charset --> index
for (int i = 0; i < INDEX_TO_CHARSET.length; i++) {
String charset = INDEX_TO_CHARSET[i];
if (charset != null && CHARSET_TO_INDEX.get(charset) == null) {
CHARSET_TO_INDEX.put(charset, i);
}
charset = INDEX_TO_DB_CHARSET[i];
if (charset != null && DB_CHARSET_TO_INDEX.get(charset) == null) {
DB_CHARSET_TO_INDEX.put(charset, i);
}
}
CHARSET_TO_INDEX.put("iso-8859-1", 14);
CHARSET_TO_INDEX.put("iso_8859_1", 14);
CHARSET_TO_INDEX.put("utf-8", 33);
DB_CHARSET_TO_INDEX.put("iso-8859-1", 14);
DB_CHARSET_TO_INDEX.put("iso_8859_1", 14);
DB_CHARSET_TO_INDEX.put("utf-8", 33);
}
public static String getCharset(int index) {
if (index < 0 || index > 98) {
index = 83;
}
return INDEX_TO_CHARSET[index];
}
public static int getIndex(String charset) {
if (charset == null || charset.length() == 0) {
return 0;
} else {
Integer i = CHARSET_TO_INDEX.get(charset.toLowerCase());
return (i == null) ? 0 : i.intValue();
}
}
public static String getDbCharset(int index) {
if (index < 0 || index > 98) {
index = 83;
}
return INDEX_TO_DB_CHARSET[index];
}
public static int getDBIndex(String charset) {
if (charset == null || charset.length() == 0) {
return 0;
} else {
Integer i = DB_CHARSET_TO_INDEX.get(charset.toLowerCase());
return (i == null) ? 0 : i.intValue();
}
}
}
© 2015 - 2024 Weber Informatics LLC | Privacy Policy