Source code: com/mysql/jdbc/CharsetMapping.java
1 /*
2 Copyright (C) 2002-2004 MySQL AB
3
4 This program is free software; you can redistribute it and/or modify
5 it under the terms of version 2 of the GNU General Public License as
6 published by the Free Software Foundation.
7
8
9 There are special exceptions to the terms and conditions of the GPL
10 as it is applied to this software. View the full text of the
11 exception in file EXCEPTIONS-CONNECTOR-J in the directory of this
12 software distribution.
13
14 This program is distributed in the hope that it will be useful,
15 but WITHOUT ANY WARRANTY; without even the implied warranty of
16 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
17 GNU General Public License for more details.
18
19 You should have received a copy of the GNU General Public License
20 along with this program; if not, write to the Free Software
21 Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
22
23 */
24 package com.mysql.jdbc;
25
26 import java.util.Collections;
27 import java.util.HashMap;
28 import java.util.Iterator;
29 import java.util.Map;
30 import java.util.Set;
31
32
/**
 * Mapping between MySQL charset names and Java charset names.
 *
 * <p>The tables are compiled into the class rather than read from a
 * .properties file, because under most appservers a properties file
 * complicates configuration: the security policy has to be changed by the
 * user to allow the driver to read it.
 *
 * <p>All maps are built once in the static initializer and are wrapped with
 * {@link Collections#unmodifiableMap(Map)}. Keys and values are
 * {@link String}s.
 *
 * @author Mark Matthews
 */
public class CharsetMapping {
    //~ Static fields/initializers ---------------------------------------------

    /**
     * Mapping of Java charset names to MySQL charset names.
     *
     * <p>Several MySQL names share one Java name; for those the MySQL name
     * returned here is fixed explicitly (see
     * {@link #buildJavaToMysqlMap(Map)}) instead of depending on hash
     * iteration order.
     */
    public static final Map JAVA_TO_MYSQL_CHARSET_MAP;

    /**
     * Mapping of upper-case Java charset names to MySQL charset names.
     * Contains every key of {@link #JAVA_TO_MYSQL_CHARSET_MAP} upper-cased,
     * plus a few upper-case aliases such as "ASCII" and "LATIN5".
     */
    public static final Map JAVA_UC_TO_MYSQL_CHARSET_MAP;

    /**
     * Mapping of MySQL charset names to Java charset names.
     */
    public static final Map MYSQL_TO_JAVA_CHARSET_MAP;

    /**
     * Map/List of multibyte character sets (using MySQL names). Every entry
     * maps a MySQL charset name to itself, so the map can be used as a set.
     */
    public static final Map MULTIBYTE_CHARSETS;

    /**
     * Map of MySQL-4.1 charset indexes to Java encoding names. Slots for
     * which no Java encoding is registered are <code>null</code>.
     */
    public static final String[] INDEX_TO_CHARSET;

    static {
        Map mysqlToJava = Collections.unmodifiableMap(buildMysqlToJavaMap());
        Map javaToMysql = Collections.unmodifiableMap(
                buildJavaToMysqlMap(mysqlToJava));

        MYSQL_TO_JAVA_CHARSET_MAP = mysqlToJava;
        JAVA_TO_MYSQL_CHARSET_MAP = javaToMysql;
        JAVA_UC_TO_MYSQL_CHARSET_MAP = Collections.unmodifiableMap(
                buildUpperCaseJavaToMysqlMap(javaToMysql));
        MULTIBYTE_CHARSETS = Collections.unmodifiableMap(
                buildMultibyteCharsets());
        INDEX_TO_CHARSET = buildIndexToCharset(mysqlToJava);
    }

    //~ Methods ----------------------------------------------------------------

    /**
     * Builds the MySQL-name to Java-name table.
     *
     * @return a new, modifiable map of MySQL charset name to Java charset name
     */
    private static Map buildMysqlToJavaMap() {
        Map map = new HashMap();

        map.put("usa7", "US-ASCII");
        map.put("ascii", "US-ASCII");
        map.put("big5", "Big5");
        map.put("gbk", "GBK");
        map.put("sjis", "SJIS");
        map.put("gb2312", "EUC_CN");
        map.put("ujis", "EUC_JP");
        map.put("euc_kr", "EUC_KR");
        // "euckr" is the name the index table and the upper-case aliases
        // use; it was previously missing here, so lookups returned null.
        map.put("euckr", "EUC_KR");
        map.put("latin1", "ISO8859_1");
        map.put("latin1_de", "ISO8859_1");
        map.put("german1", "ISO8859_1");
        map.put("danish", "ISO8859_1");
        map.put("latin2", "ISO8859_2");
        map.put("czech", "ISO8859_2");
        map.put("hungarian", "ISO8859_2");
        map.put("croat", "ISO8859_2");
        map.put("greek", "ISO8859_7");
        // latin7 is ISO 8859-13 (Baltic), not ISO 8859-7 (Greek). The old
        // ISO8859_7 value also made the ISO8859_13 <-> latin7 reverse
        // mapping unreachable.
        map.put("latin7", "ISO8859_13");
        map.put("hebrew", "ISO8859_8");
        map.put("latin5", "ISO8859_9");
        map.put("latvian", "ISO8859_13");
        map.put("latvian1", "ISO8859_13");
        map.put("estonia", "ISO8859_13");
        map.put("dos", "Cp437");
        // The mixed-case keys are kept for existing callers; the lower-case
        // keys are the ones the index table looks up.
        map.put("Cp850", "Cp850");
        map.put("cp850", "Cp850");
        map.put("Cp852", "Cp852");
        map.put("cp852", "Cp852");
        map.put("cp866", "Cp866");
        map.put("koi8_ru", "KOI8_R");
        map.put("koi8r", "KOI8_R");
        map.put("tis620", "TIS620");
        map.put("Cp1250", "Cp1250");
        map.put("cp1250", "Cp1250");
        map.put("win1250", "Cp1250");
        map.put("win1250ch", "Cp1250");
        map.put("win1251", "Cp1251");
        map.put("cp1251", "Cp1251");
        map.put("cp1256", "Cp1256");
        map.put("win1251ukr", "Cp1251");
        map.put("cp1257", "Cp1257");
        map.put("macroman", "MacRoman");
        map.put("macce", "MacCentralEurope");
        map.put("utf8", "UTF-8");
        map.put("ucs2", "UnicodeBig");
        map.put("binary", "US-ASCII"); // closest match

        return map;
    }

    /**
     * Builds the Java-name to MySQL-name table by inverting
     * <code>mysqlToJava</code>.
     *
     * <p>Java encoding names overlap with several MySQL character sets, so
     * a plain inversion would let the hash iteration order pick the winner.
     * Every Java name that has more than one MySQL name is therefore pinned
     * explicitly after the inversion.
     *
     * @param mysqlToJava map of MySQL charset name to Java charset name
     * @return a new, modifiable map of Java charset name to MySQL charset name
     */
    private static Map buildJavaToMysqlMap(Map mysqlToJava) {
        Map reverse = new HashMap();

        Iterator entries = mysqlToJava.entrySet().iterator();

        while (entries.hasNext()) {
            Map.Entry entry = (Map.Entry) entries.next();

            reverse.put(entry.getValue(), entry.getKey());
        }

        //
        // Use 'closest' encodings here. Any Java name that is the value of
        // more than one MySQL name MUST be listed, otherwise its entry
        // depends on iteration order.
        //
        reverse.put("ISO8859_1", "latin1");
        reverse.put("ISO8859_2", "latin2");
        reverse.put("ISO8859_13", "latin7");
        reverse.put("US-ASCII", "ascii");
        reverse.put("KOI8_R", "koi8r");
        reverse.put("Cp1251", "cp1251");

        // These names had a single candidate before the lower-case aliases
        // were added; keep returning the same value as before.
        reverse.put("Cp850", "Cp850");
        reverse.put("Cp852", "Cp852");
        reverse.put("Cp1250", "Cp1250");
        reverse.put("EUC_KR", "euc_kr");

        return reverse;
    }

    /**
     * Builds the upper-cased variant of the Java-name to MySQL-name table
     * and adds the upper-case special-case aliases.
     *
     * @param javaToMysql map of Java charset name to MySQL charset name
     * @return a new, modifiable map keyed by upper-case Java charset name
     */
    private static Map buildUpperCaseJavaToMysqlMap(Map javaToMysql) {
        Map upper = new HashMap(javaToMysql.size());

        Iterator entries = javaToMysql.entrySet().iterator();

        while (entries.hasNext()) {
            Map.Entry entry = (Map.Entry) entries.next();
            String javaName = (String) entry.getKey();

            upper.put(javaName.toUpperCase(), entry.getValue());
        }

        upper.put("ASCII", "ascii"); // special case
        upper.put("LATIN5", "latin5");
        upper.put("LATIN7", "latin7");
        upper.put("HEBREW", "hebrew");
        upper.put("GREEK", "greek");
        upper.put("EUCKR", "euckr");
        upper.put("GB2312", "gb2312");
        upper.put("LATIN2", "latin2");

        return upper;
    }

    /**
     * Builds the table of character sets that we can't convert ourselves.
     * Each MySQL charset name is mapped to itself.
     *
     * @return a new, modifiable map of multibyte MySQL charset names
     */
    private static Map buildMultibyteCharsets() {
        String[] names = {
            "big5", "euc_kr", "euckr", "gb2312", "gbk", "sjis", "ujis",
            "utf8", "ucs2"
        };

        Map multibyte = new HashMap();

        for (int i = 0; i < names.length; i++) {
            multibyte.put(names[i], names[i]);
        }

        return multibyte;
    }

    /**
     * Looks up the Java encoding registered for a MySQL charset name.
     *
     * @param mysqlToJava map of MySQL charset name to Java charset name
     * @param mysqlName MySQL charset name to resolve
     * @return the Java encoding name, or <code>null</code> if none is
     *         registered
     */
    private static String javaName(Map mysqlToJava, String mysqlName) {
        return (String) mysqlToJava.get(mysqlName);
    }

    /**
     * Builds the charset-index to Java-encoding table.
     *
     * <p>Character sets without a registered Java encoding (for example
     * dec8, hp8, swe7, armscii8, keybcs2, geostd8) are still looked up by
     * name and resolve to <code>null</code>; indexes that are not assigned
     * at all (0, 17, 58-62, 76) also stay <code>null</code>.
     *
     * @param m map of MySQL charset name to Java charset name
     * @return a new array of length 95 indexed by charset index
     */
    private static String[] buildIndexToCharset(Map m) {
        String[] table = new String[95];

        table[1] = javaName(m, "big5");
        table[2] = javaName(m, "czech");
        table[3] = javaName(m, "dec8");
        table[4] = javaName(m, "dos");
        table[5] = javaName(m, "german1");
        table[6] = javaName(m, "hp8");
        table[7] = javaName(m, "koi8_ru");
        table[8] = javaName(m, "latin1");
        table[9] = javaName(m, "latin2");
        table[10] = javaName(m, "swe7");
        table[11] = javaName(m, "usa7");
        table[12] = javaName(m, "ujis");
        table[13] = javaName(m, "sjis");
        table[14] = javaName(m, "cp1251");
        table[15] = javaName(m, "danish");
        table[16] = javaName(m, "hebrew");
        table[18] = javaName(m, "tis620");
        table[19] = javaName(m, "euc_kr");
        table[20] = javaName(m, "estonia");
        table[21] = javaName(m, "hungarian");
        table[22] = javaName(m, "koi8_ukr");
        table[23] = javaName(m, "win1251ukr");
        table[24] = javaName(m, "gb2312");
        table[25] = javaName(m, "greek");
        table[26] = javaName(m, "win1250");
        table[27] = javaName(m, "croat");
        table[28] = javaName(m, "gbk");
        table[29] = javaName(m, "cp1257");
        table[30] = javaName(m, "latin5");
        table[31] = javaName(m, "latin1_de");
        table[32] = javaName(m, "armscii8");
        table[33] = javaName(m, "utf8");
        table[34] = javaName(m, "win1250ch");
        table[35] = javaName(m, "ucs2");
        table[36] = javaName(m, "cp866");
        table[37] = javaName(m, "keybcs2");
        table[38] = javaName(m, "macce");
        table[39] = javaName(m, "macroman");
        table[40] = javaName(m, "pclatin2");
        table[41] = javaName(m, "latvian");
        table[42] = javaName(m, "latvian1");

        //
        // Indexes 43-56 were looked up as "maccebin", "latin1cias",
        // "cp1251csas" and so on. Those names are not keys of the charset
        // map, so every one of these slots was null. They read as
        // binary / case / accent variants of a base character set, and a
        // variant does not change the byte encoding, so the base name is
        // resolved instead.
        // NOTE(review): confirm these index assignments against the
        // server's collation table.
        //
        table[43] = javaName(m, "macce"); // maccebin
        table[44] = javaName(m, "macce"); // macceciai
        table[45] = javaName(m, "macce"); // maccecias
        table[46] = javaName(m, "macce"); // maccecsas
        table[47] = javaName(m, "latin1"); // latin1bin
        table[48] = javaName(m, "latin1"); // latin1cias
        table[49] = javaName(m, "latin1"); // latin1csas
        table[50] = javaName(m, "cp1251"); // cp1251bin
        table[51] = javaName(m, "cp1251"); // cp1251cias
        table[52] = javaName(m, "cp1251"); // cp1251csas
        table[53] = javaName(m, "macroman"); // macromanbin
        table[54] = javaName(m, "macroman"); // macromancias
        table[55] = javaName(m, "macroman"); // macromanciai
        table[56] = javaName(m, "macroman"); // macromancsas

        table[57] = javaName(m, "cp1256");
        table[63] = javaName(m, "binary");
        table[64] = javaName(m, "armscii");
        table[65] = javaName(m, "ascii");
        table[66] = javaName(m, "cp1250");
        table[67] = javaName(m, "cp1256");
        table[68] = javaName(m, "cp866");
        table[69] = javaName(m, "dec8");
        table[70] = javaName(m, "greek");
        table[71] = javaName(m, "hebrew");
        table[72] = javaName(m, "hp8");
        table[73] = javaName(m, "keybcs2");
        table[74] = javaName(m, "koi8r");
        table[75] = javaName(m, "koi8ukr");
        table[77] = javaName(m, "latin2");
        table[78] = javaName(m, "latin5");
        table[79] = javaName(m, "latin7");
        table[80] = javaName(m, "cp850");
        table[81] = javaName(m, "cp852");
        table[82] = javaName(m, "swe7");
        table[83] = javaName(m, "utf8");
        table[84] = javaName(m, "big5");
        table[85] = javaName(m, "euckr");
        table[86] = javaName(m, "gb2312");
        table[87] = javaName(m, "gbk");
        table[88] = javaName(m, "sjis");
        table[89] = javaName(m, "tis620");
        table[90] = javaName(m, "ucs2");
        table[91] = javaName(m, "ujis");
        table[92] = javaName(m, "geostd8");
        table[93] = javaName(m, "geostd8");
        table[94] = javaName(m, "latin1");

        return table;
    }
}