Docjar: A Java Source and Document Engine    com.*    java.*    javax.*    org.*    all    new    plug-in

Quick Search    Search Deep

Source code: com/mysql/jdbc/CharsetMapping.java


1   /*
2    Copyright (C) 2002-2004 MySQL AB
3   
4    This program is free software; you can redistribute it and/or modify
5    it under the terms of version 2 of the GNU General Public License as
6    published by the Free Software Foundation.
7    
8   
9    There are special exceptions to the terms and conditions of the GPL 
10   as it is applied to this software. View the full text of the 
11   exception exception in file EXCEPTIONS-CONNECTOR-J in the directory of this 
12   software distribution.
13  
14   This program is distributed in the hope that it will be useful,
15   but WITHOUT ANY WARRANTY; without even the implied warranty of
16   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
17   GNU General Public License for more details.
18  
19   You should have received a copy of the GNU General Public License
20   along with this program; if not, write to the Free Software
21   Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA
22  
23   */
24  package com.mysql.jdbc;
25  
26  import java.util.Collections;
27  import java.util.HashMap;
28  import java.util.Iterator;
29  import java.util.Map;
30  import java.util.Set;
31  
32  
/**
 * Mapping between MySQL charset names
 * and Java charset names.
 *
 * I've investigated placing these in a .properties file,
 * but unfortunately under most appservers this complicates
 * configuration because the security policy needs to be changed
 * by the user to allow the driver to read them :(
 *
 * All tables are built once, in the static initializer, and the maps are
 * published as unmodifiable views. Lookups for names that have no entry
 * return <code>null</code>.
 *
 * @author Mark Matthews
 */
public class CharsetMapping {
    //~ Static fields/initializers ---------------------------------------------

    /**
     * Mapping of Java charset names to MySQL charset names
     */
    public static final Map JAVA_TO_MYSQL_CHARSET_MAP;

    /**
     * Mapping of upper-case Java charset names to MySQL charset names
     */
    public static final Map JAVA_UC_TO_MYSQL_CHARSET_MAP;

    /**
     * Mapping of MySQL charset names to Java charset names
     */
    public static final Map MYSQL_TO_JAVA_CHARSET_MAP;

    /**
     * Map/List of multibyte character sets (using MySQL names)
     */
    public static final Map MULTIBYTE_CHARSETS;

    /**
     * Map of MySQL-4.1 charset indexes to Java encoding names.
     * Slots whose MySQL charset has no entry in
     * {@link #MYSQL_TO_JAVA_CHARSET_MAP}, and slots that are never
     * assigned, hold <code>null</code>.
     */
    public static final String[] INDEX_TO_CHARSET;

    static {
        //
        // MySQL name -> Java name. Keys are lower-case because every
        // lookup in this class uses the lower-case MySQL spelling.
        //
        HashMap tempMap = new HashMap();

        tempMap.put("usa7", "US-ASCII");
        tempMap.put("ascii", "US-ASCII");
        tempMap.put("big5", "Big5");
        tempMap.put("gbk", "GBK");
        tempMap.put("sjis", "SJIS");
        tempMap.put("gb2312", "EUC_CN");
        tempMap.put("ujis", "EUC_JP");
        tempMap.put("euc_kr", "EUC_KR");
        tempMap.put("euckr", "EUC_KR"); // spelling used by the index table and the upper-case map
        tempMap.put("latin1", "ISO8859_1");
        tempMap.put("latin1_de", "ISO8859_1");
        tempMap.put("german1", "ISO8859_1");
        tempMap.put("danish", "ISO8859_1");
        tempMap.put("latin2", "ISO8859_2");
        tempMap.put("czech", "ISO8859_2");
        tempMap.put("hungarian", "ISO8859_2");
        tempMap.put("croat", "ISO8859_2");
        tempMap.put("greek", "ISO8859_7");
        tempMap.put("latin7", "ISO8859_13"); // latin7 is the Baltic set, not Greek
        tempMap.put("hebrew", "ISO8859_8");
        tempMap.put("latin5", "ISO8859_9");
        tempMap.put("latvian", "ISO8859_13");
        tempMap.put("latvian1", "ISO8859_13");
        tempMap.put("estonia", "ISO8859_13");
        tempMap.put("dos", "Cp437");
        tempMap.put("cp850", "Cp850");
        tempMap.put("cp852", "Cp852");
        tempMap.put("cp866", "Cp866");
        tempMap.put("koi8_ru", "KOI8_R");
        tempMap.put("koi8r", "KOI8_R");
        tempMap.put("tis620", "TIS620");
        tempMap.put("cp1250", "Cp1250");
        tempMap.put("win1250", "Cp1250");
        tempMap.put("win1251", "Cp1251");
        tempMap.put("cp1251", "Cp1251");
        tempMap.put("cp1256", "Cp1256");
        tempMap.put("win1251ukr", "Cp1251");
        tempMap.put("cp1257", "Cp1257");
        tempMap.put("macroman", "MacRoman");
        tempMap.put("macce", "MacCentralEurope");
        tempMap.put("utf8", "UTF-8");
        tempMap.put("ucs2", "UnicodeBig");
        tempMap.put("binary", "US-ASCII"); // closest match

        MYSQL_TO_JAVA_CHARSET_MAP = Collections.unmodifiableMap(tempMap);

        //
        // Use 'closest' encodings here...as Java encoding names
        // overlap with some MySQL character sets. A Java name listed
        // below is only ever mapped back to the MySQL name given here.
        //
        HashMap preferredMysqlNames = new HashMap();

        preferredMysqlNames.put("ISO8859_1", "latin1");
        preferredMysqlNames.put("ISO8859_2", "latin2");
        preferredMysqlNames.put("ISO8859_13", "latin7");
        preferredMysqlNames.put("Cp1250", "cp1250");
        preferredMysqlNames.put("EUC_KR", "euc_kr");

        HashMap javaToMysqlMap = new HashMap();

        Iterator entries = MYSQL_TO_JAVA_CHARSET_MAP.entrySet().iterator();

        while (entries.hasNext()) {
            Map.Entry entry = (Map.Entry) entries.next();
            Object mysqlEncodingName = entry.getKey();
            Object javaEncodingName = entry.getValue();
            Object preferredName = preferredMysqlNames.get(javaEncodingName);

            // NOTE(review): Java names shared by several MySQL names and
            // not listed above (e.g. US-ASCII, KOI8_R, Cp1251) keep
            // whichever MySQL name is visited last, which depends on the
            // HashMap's iteration order.
            if (preferredName == null || preferredName.equals(mysqlEncodingName)) {
                javaToMysqlMap.put(javaEncodingName, mysqlEncodingName);
            }
        }

        JAVA_TO_MYSQL_CHARSET_MAP = Collections.unmodifiableMap(javaToMysqlMap);

        HashMap ucMap = new HashMap(JAVA_TO_MYSQL_CHARSET_MAP.size());

        Iterator javaNamesKeys = JAVA_TO_MYSQL_CHARSET_MAP.keySet().iterator();

        while (javaNamesKeys.hasNext()) {
            String key = (String) javaNamesKeys.next();

            // Upper-case with a fixed locale: the default-locale form
            // would turn 'i' into a dotted capital I under e.g. a Turkish
            // locale, so "Big5" would never be found as "BIG5".
            ucMap.put(key.toUpperCase(java.util.Locale.ENGLISH),
                JAVA_TO_MYSQL_CHARSET_MAP.get(key));
        }

        ucMap.put("ASCII", "ascii"); // special case
        ucMap.put("LATIN5", "latin5");
        ucMap.put("LATIN7", "latin7");
        ucMap.put("HEBREW", "hebrew");
        ucMap.put("GREEK", "greek");
        ucMap.put("EUCKR", "euckr");
        ucMap.put("GB2312", "gb2312");
        ucMap.put("LATIN2", "latin2");

        JAVA_UC_TO_MYSQL_CHARSET_MAP = Collections.unmodifiableMap(ucMap);

        //
        // Character sets that we can't convert
        // ourselves.
        //
        HashMap tempMapMulti = new HashMap();

        tempMapMulti.put("big5", "big5");
        tempMapMulti.put("euc_kr", "euc_kr");
        tempMapMulti.put("euckr", "euckr");
        tempMapMulti.put("gb2312", "gb2312");
        tempMapMulti.put("gbk", "gbk");
        tempMapMulti.put("sjis", "sjis");
        tempMapMulti.put("ujis", "ujis");
        tempMapMulti.put("utf8", "utf8");
        tempMapMulti.put("ucs2", "UnicodeBig");

        MULTIBYTE_CHARSETS = Collections.unmodifiableMap(tempMapMulti);

        //
        // Charset index -> Java encoding name. Names that are not keys of
        // MYSQL_TO_JAVA_CHARSET_MAP (dec8, hp8, swe7, ...) leave a null slot.
        //
        INDEX_TO_CHARSET = new String[95];

        INDEX_TO_CHARSET[1]  = (String) MYSQL_TO_JAVA_CHARSET_MAP.get("big5");
        INDEX_TO_CHARSET[2]  = (String) MYSQL_TO_JAVA_CHARSET_MAP.get("czech");
        INDEX_TO_CHARSET[3]  = (String) MYSQL_TO_JAVA_CHARSET_MAP.get("dec8");
        INDEX_TO_CHARSET[4]  = (String) MYSQL_TO_JAVA_CHARSET_MAP.get("dos");
        INDEX_TO_CHARSET[5]  = (String) MYSQL_TO_JAVA_CHARSET_MAP.get("german1");
        INDEX_TO_CHARSET[6]  = (String) MYSQL_TO_JAVA_CHARSET_MAP.get("hp8");
        INDEX_TO_CHARSET[7]  = (String) MYSQL_TO_JAVA_CHARSET_MAP.get("koi8_ru");
        INDEX_TO_CHARSET[8]  = (String) MYSQL_TO_JAVA_CHARSET_MAP.get("latin1");
        INDEX_TO_CHARSET[9]  = (String) MYSQL_TO_JAVA_CHARSET_MAP.get("latin2");
        INDEX_TO_CHARSET[10] = (String) MYSQL_TO_JAVA_CHARSET_MAP.get("swe7");
        INDEX_TO_CHARSET[11] = (String) MYSQL_TO_JAVA_CHARSET_MAP.get("usa7");
        INDEX_TO_CHARSET[12] = (String) MYSQL_TO_JAVA_CHARSET_MAP.get("ujis");
        INDEX_TO_CHARSET[13] = (String) MYSQL_TO_JAVA_CHARSET_MAP.get("sjis");
        INDEX_TO_CHARSET[14] = (String) MYSQL_TO_JAVA_CHARSET_MAP.get("cp1251");
        INDEX_TO_CHARSET[15] = (String) MYSQL_TO_JAVA_CHARSET_MAP.get("danish");
        INDEX_TO_CHARSET[16] = (String) MYSQL_TO_JAVA_CHARSET_MAP.get("hebrew");
        INDEX_TO_CHARSET[18] = (String) MYSQL_TO_JAVA_CHARSET_MAP.get("tis620");
        INDEX_TO_CHARSET[19] = (String) MYSQL_TO_JAVA_CHARSET_MAP.get("euc_kr");
        INDEX_TO_CHARSET[20] = (String) MYSQL_TO_JAVA_CHARSET_MAP.get("estonia");
        INDEX_TO_CHARSET[21] = (String) MYSQL_TO_JAVA_CHARSET_MAP.get("hungarian");
        INDEX_TO_CHARSET[22] = (String) MYSQL_TO_JAVA_CHARSET_MAP.get("koi8_ukr");
        INDEX_TO_CHARSET[23] = (String) MYSQL_TO_JAVA_CHARSET_MAP.get("win1251ukr");
        INDEX_TO_CHARSET[24] = (String) MYSQL_TO_JAVA_CHARSET_MAP.get("gb2312");
        INDEX_TO_CHARSET[25] = (String) MYSQL_TO_JAVA_CHARSET_MAP.get("greek");
        INDEX_TO_CHARSET[26] = (String) MYSQL_TO_JAVA_CHARSET_MAP.get("win1250");
        INDEX_TO_CHARSET[27] = (String) MYSQL_TO_JAVA_CHARSET_MAP.get("croat");
        INDEX_TO_CHARSET[28] = (String) MYSQL_TO_JAVA_CHARSET_MAP.get("gbk");
        INDEX_TO_CHARSET[29] = (String) MYSQL_TO_JAVA_CHARSET_MAP.get("cp1257");
        INDEX_TO_CHARSET[30] = (String) MYSQL_TO_JAVA_CHARSET_MAP.get("latin5");
        INDEX_TO_CHARSET[31] = (String) MYSQL_TO_JAVA_CHARSET_MAP.get("latin1_de");
        INDEX_TO_CHARSET[32] = (String) MYSQL_TO_JAVA_CHARSET_MAP.get("armscii8");
        INDEX_TO_CHARSET[33] = (String) MYSQL_TO_JAVA_CHARSET_MAP.get("utf8");
        INDEX_TO_CHARSET[34] = (String) MYSQL_TO_JAVA_CHARSET_MAP.get("win1250ch");
        INDEX_TO_CHARSET[35] = (String) MYSQL_TO_JAVA_CHARSET_MAP.get("ucs2");
        INDEX_TO_CHARSET[36] = (String) MYSQL_TO_JAVA_CHARSET_MAP.get("cp866");
        INDEX_TO_CHARSET[37] = (String) MYSQL_TO_JAVA_CHARSET_MAP.get("keybcs2");
        INDEX_TO_CHARSET[38] = (String) MYSQL_TO_JAVA_CHARSET_MAP.get("macce");
        INDEX_TO_CHARSET[39] = (String) MYSQL_TO_JAVA_CHARSET_MAP.get("macroman");
        INDEX_TO_CHARSET[40] = (String) MYSQL_TO_JAVA_CHARSET_MAP.get("pclatin2");
        INDEX_TO_CHARSET[41] = (String) MYSQL_TO_JAVA_CHARSET_MAP.get("latvian");
        INDEX_TO_CHARSET[42] = (String) MYSQL_TO_JAVA_CHARSET_MAP.get("latvian1");
        INDEX_TO_CHARSET[43] = (String) MYSQL_TO_JAVA_CHARSET_MAP.get("maccebin");
        INDEX_TO_CHARSET[44] = (String) MYSQL_TO_JAVA_CHARSET_MAP.get("macceciai");
        INDEX_TO_CHARSET[45] = (String) MYSQL_TO_JAVA_CHARSET_MAP.get("maccecias");
        INDEX_TO_CHARSET[46] = (String) MYSQL_TO_JAVA_CHARSET_MAP.get("maccecsas");
        INDEX_TO_CHARSET[47] = (String) MYSQL_TO_JAVA_CHARSET_MAP.get("latin1bin");
        INDEX_TO_CHARSET[48] = (String) MYSQL_TO_JAVA_CHARSET_MAP.get("latin1cias");
        INDEX_TO_CHARSET[49] = (String) MYSQL_TO_JAVA_CHARSET_MAP.get("latin1csas");
        INDEX_TO_CHARSET[50] = (String) MYSQL_TO_JAVA_CHARSET_MAP.get("cp1251bin");
        INDEX_TO_CHARSET[51] = (String) MYSQL_TO_JAVA_CHARSET_MAP.get("cp1251cias");
        INDEX_TO_CHARSET[52] = (String) MYSQL_TO_JAVA_CHARSET_MAP.get("cp1251csas");
        INDEX_TO_CHARSET[53] = (String) MYSQL_TO_JAVA_CHARSET_MAP.get("macromanbin");
        INDEX_TO_CHARSET[54] = (String) MYSQL_TO_JAVA_CHARSET_MAP.get("macromancias");
        INDEX_TO_CHARSET[55] = (String) MYSQL_TO_JAVA_CHARSET_MAP.get("macromanciai");
        INDEX_TO_CHARSET[56] = (String) MYSQL_TO_JAVA_CHARSET_MAP.get("macromancsas");
        INDEX_TO_CHARSET[57] = (String) MYSQL_TO_JAVA_CHARSET_MAP.get("cp1256");
        INDEX_TO_CHARSET[63] = (String) MYSQL_TO_JAVA_CHARSET_MAP.get("binary");
        INDEX_TO_CHARSET[64] = (String) MYSQL_TO_JAVA_CHARSET_MAP.get("armscii");
        INDEX_TO_CHARSET[65] = (String) MYSQL_TO_JAVA_CHARSET_MAP.get("ascii");
        INDEX_TO_CHARSET[66] = (String) MYSQL_TO_JAVA_CHARSET_MAP.get("cp1250");
        INDEX_TO_CHARSET[67] = (String) MYSQL_TO_JAVA_CHARSET_MAP.get("cp1256");
        INDEX_TO_CHARSET[68] = (String) MYSQL_TO_JAVA_CHARSET_MAP.get("cp866");
        INDEX_TO_CHARSET[69] = (String) MYSQL_TO_JAVA_CHARSET_MAP.get("dec8");
        INDEX_TO_CHARSET[70] = (String) MYSQL_TO_JAVA_CHARSET_MAP.get("greek");
        INDEX_TO_CHARSET[71] = (String) MYSQL_TO_JAVA_CHARSET_MAP.get("hebrew");
        INDEX_TO_CHARSET[72] = (String) MYSQL_TO_JAVA_CHARSET_MAP.get("hp8");
        INDEX_TO_CHARSET[73] = (String) MYSQL_TO_JAVA_CHARSET_MAP.get("keybcs2");
        INDEX_TO_CHARSET[74] = (String) MYSQL_TO_JAVA_CHARSET_MAP.get("koi8r");
        INDEX_TO_CHARSET[75] = (String) MYSQL_TO_JAVA_CHARSET_MAP.get("koi8ukr");
        INDEX_TO_CHARSET[77] = (String) MYSQL_TO_JAVA_CHARSET_MAP.get("latin2");
        INDEX_TO_CHARSET[78] = (String) MYSQL_TO_JAVA_CHARSET_MAP.get("latin5");
        INDEX_TO_CHARSET[79] = (String) MYSQL_TO_JAVA_CHARSET_MAP.get("latin7");
        INDEX_TO_CHARSET[80] = (String) MYSQL_TO_JAVA_CHARSET_MAP.get("cp850");
        INDEX_TO_CHARSET[81] = (String) MYSQL_TO_JAVA_CHARSET_MAP.get("cp852");
        INDEX_TO_CHARSET[82] = (String) MYSQL_TO_JAVA_CHARSET_MAP.get("swe7");
        INDEX_TO_CHARSET[83] = (String) MYSQL_TO_JAVA_CHARSET_MAP.get("utf8");
        INDEX_TO_CHARSET[84] = (String) MYSQL_TO_JAVA_CHARSET_MAP.get("big5");
        INDEX_TO_CHARSET[85] = (String) MYSQL_TO_JAVA_CHARSET_MAP.get("euckr");
        INDEX_TO_CHARSET[86] = (String) MYSQL_TO_JAVA_CHARSET_MAP.get("gb2312");
        INDEX_TO_CHARSET[87] = (String) MYSQL_TO_JAVA_CHARSET_MAP.get("gbk");
        INDEX_TO_CHARSET[88] = (String) MYSQL_TO_JAVA_CHARSET_MAP.get("sjis");
        INDEX_TO_CHARSET[89] = (String) MYSQL_TO_JAVA_CHARSET_MAP.get("tis620");
        INDEX_TO_CHARSET[90] = (String) MYSQL_TO_JAVA_CHARSET_MAP.get("ucs2");
        INDEX_TO_CHARSET[91] = (String) MYSQL_TO_JAVA_CHARSET_MAP.get("ujis");
        INDEX_TO_CHARSET[92] = (String) MYSQL_TO_JAVA_CHARSET_MAP.get("geostd8");
        INDEX_TO_CHARSET[93] = (String) MYSQL_TO_JAVA_CHARSET_MAP.get("geostd8");
        INDEX_TO_CHARSET[94] = (String) MYSQL_TO_JAVA_CHARSET_MAP.get("latin1");
    }
}