1 /* 2 * Copyright (C) 2007 Esmertec AG. 3 * Copyright (C) 2007 The Android Open Source Project 4 * 5 * Licensed under the Apache License, Version 2.0 (the "License"); 6 * you may not use this file except in compliance with the License. 7 * You may obtain a copy of the License at 8 * 9 * http://www.apache.org/licenses/LICENSE-2.0 10 * 11 * Unless required by applicable law or agreed to in writing, software 12 * distributed under the License is distributed on an "AS IS" BASIS, 13 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 14 * See the License for the specific language governing permissions and 15 * limitations under the License. 16 */ 17 18 package com.android.messaging.mmslib.pdu; 19 20 import android.support.v4.util.SimpleArrayMap; 21 import android.util.SparseArray; 22 23 import java.io.UnsupportedEncodingException; 24 25 public class CharacterSets { 26 /** 27 * IANA assigned MIB enum numbers. 28 * 29 * From wap-230-wsp-20010705-a.pdf 30 * Any-charset = <Octet 128> 31 * Equivalent to the special RFC2616 charset value "*" 32 * 33 * Link to all the charsets: http://www.iana.org/assignments/character-sets/character-sets.xhtml 34 * Use Charset.availableCharsets() to see if a potential charset is supported in java: 35 * private void dumpCharsets() { 36 * logvv("dumpCharsets"); 37 * SortedMap<String, Charset> charsets = Charset.availableCharsets(); 38 * for (Entry<String, Charset> entry : charsets.entrySet()) { 39 * String key = entry.getKey(); 40 * Charset value = entry.getValue(); 41 * logvv("charset key: " + key + " value: " + value); 42 * } 43 * } 44 * 45 * As of March 21, 2014, here is the list from dumpCharsets: 46 * Adobe-Standard-Encoding value: java.nio.charset.CharsetICU[Adobe-Standard-Encoding] 47 * Big5 value: java.nio.charset.CharsetICU[Big5] 48 * Big5-HKSCS value: java.nio.charset.CharsetICU[Big5-HKSCS] 49 * BOCU-1 value: java.nio.charset.CharsetICU[BOCU-1] 50 * CESU-8 value: java.nio.charset.CharsetICU[CESU-8] 51 * cp1363 value: java.nio.charset.CharsetICU[cp1363] 52 * cp851 value: java.nio.charset.CharsetICU[cp851] 53 * cp864 value: java.nio.charset.CharsetICU[cp864] 54 * EUC-JP value: java.nio.charset.CharsetICU[EUC-JP] 55 * EUC-KR value: java.nio.charset.CharsetICU[EUC-KR] 56 * GB18030 value: java.nio.charset.CharsetICU[GB18030] 57 * GBK value: java.nio.charset.CharsetICU[GBK] 58 * hp-roman8 value: java.nio.charset.CharsetICU[hp-roman8] 59 * HZ-GB-2312 value: java.nio.charset.CharsetICU[HZ-GB-2312] 60 * IBM-Thai value: java.nio.charset.CharsetICU[IBM-Thai] 61 * IBM00858 value: java.nio.charset.CharsetICU[IBM00858] 62 * IBM01140 value: java.nio.charset.CharsetICU[IBM01140] 63 * IBM01141 value: java.nio.charset.CharsetICU[IBM01141] 64 * IBM01142 value: java.nio.charset.CharsetICU[IBM01142] 65 * IBM01143 value: java.nio.charset.CharsetICU[IBM01143] 66 * IBM01144 value: java.nio.charset.CharsetICU[IBM01144] 67 * IBM01145 value: java.nio.charset.CharsetICU[IBM01145] 68 * IBM01146 value: java.nio.charset.CharsetICU[IBM01146] 69 * IBM01147 value: java.nio.charset.CharsetICU[IBM01147] 70 * IBM01148 value: java.nio.charset.CharsetICU[IBM01148] 71 * IBM01149 value: java.nio.charset.CharsetICU[IBM01149] 72 * IBM037 value: java.nio.charset.CharsetICU[IBM037] 73 * IBM1026 value: java.nio.charset.CharsetICU[IBM1026] 74 * IBM1047 value: java.nio.charset.CharsetICU[IBM1047] 75 * IBM273 value: java.nio.charset.CharsetICU[IBM273] 76 * IBM277 value: java.nio.charset.CharsetICU[IBM277] 77 * IBM278 value: java.nio.charset.CharsetICU[IBM278] 78 * IBM280 value: java.nio.charset.CharsetICU[IBM280] 79 * IBM284 value: java.nio.charset.CharsetICU[IBM284] 80 * IBM285 value: java.nio.charset.CharsetICU[IBM285] 81 * IBM290 value: java.nio.charset.CharsetICU[IBM290] 82 * IBM297 value: java.nio.charset.CharsetICU[IBM297] 83 * IBM420 value: java.nio.charset.CharsetICU[IBM420] 84 * IBM424 value: java.nio.charset.CharsetICU[IBM424] 85 * IBM437 value: java.nio.charset.CharsetICU[IBM437] 86 * IBM500 value: java.nio.charset.CharsetICU[IBM500] 87 * IBM775 value: java.nio.charset.CharsetICU[IBM775] 88 * IBM850 value: java.nio.charset.CharsetICU[IBM850] 89 * IBM852 value: java.nio.charset.CharsetICU[IBM852] 90 * IBM855 value: java.nio.charset.CharsetICU[IBM855] 91 * IBM857 value: java.nio.charset.CharsetICU[IBM857] 92 * IBM860 value: java.nio.charset.CharsetICU[IBM860] 93 * IBM861 value: java.nio.charset.CharsetICU[IBM861] 94 * IBM862 value: java.nio.charset.CharsetICU[IBM862] 95 * IBM863 value: java.nio.charset.CharsetICU[IBM863] 96 * IBM865 value: java.nio.charset.CharsetICU[IBM865] 97 * IBM866 value: java.nio.charset.CharsetICU[IBM866] 98 * IBM868 value: java.nio.charset.CharsetICU[IBM868] 99 * IBM869 value: java.nio.charset.CharsetICU[IBM869] 100 * IBM870 value: java.nio.charset.CharsetICU[IBM870] 101 * IBM871 value: java.nio.charset.CharsetICU[IBM871] 102 * IBM918 value: java.nio.charset.CharsetICU[IBM918] 103 * ISO-2022-CN value: java.nio.charset.CharsetICU[ISO-2022-CN] 104 * ISO-2022-CN-EXT value: java.nio.charset.CharsetICU[ISO-2022-CN-EXT] 105 * ISO-2022-JP value: java.nio.charset.CharsetICU[ISO-2022-JP] 106 * ISO-2022-JP-1 value: java.nio.charset.CharsetICU[ISO-2022-JP-1] 107 * ISO-2022-JP-2 value: java.nio.charset.CharsetICU[ISO-2022-JP-2] 108 * ISO-2022-KR value: java.nio.charset.CharsetICU[ISO-2022-KR] 109 * ISO-8859-1 value: java.nio.charset.CharsetICU[ISO-8859-1] 110 * ISO-8859-10 value: java.nio.charset.CharsetICU[ISO-8859-10] 111 * ISO-8859-13 value: java.nio.charset.CharsetICU[ISO-8859-13] 112 * ISO-8859-14 value: java.nio.charset.CharsetICU[ISO-8859-14] 113 * ISO-8859-15 value: java.nio.charset.CharsetICU[ISO-8859-15] 114 * ISO-8859-2 value: java.nio.charset.CharsetICU[ISO-8859-2] 115 * ISO-8859-3 value: java.nio.charset.CharsetICU[ISO-8859-3] 116 * ISO-8859-4 value: java.nio.charset.CharsetICU[ISO-8859-4] 117 * ISO-8859-5 value: java.nio.charset.CharsetICU[ISO-8859-5] 118 * ISO-8859-6 value: java.nio.charset.CharsetICU[ISO-8859-6] 119 * ISO-8859-7 value: java.nio.charset.CharsetICU[ISO-8859-7] 120 * ISO-8859-8 value: java.nio.charset.CharsetICU[ISO-8859-8] 121 * ISO-8859-9 value: java.nio.charset.CharsetICU[ISO-8859-9] 122 * KOI8-R value: java.nio.charset.CharsetICU[KOI8-R] 123 * KOI8-U value: java.nio.charset.CharsetICU[KOI8-U] 124 * macintosh value: java.nio.charset.CharsetICU[macintosh] 125 * SCSU value: java.nio.charset.CharsetICU[SCSU] 126 * Shift_JIS value: java.nio.charset.CharsetICU[Shift_JIS] 127 * TIS-620 value: java.nio.charset.CharsetICU[TIS-620] 128 * US-ASCII value: java.nio.charset.CharsetICU[US-ASCII] 129 * UTF-16 value: java.nio.charset.CharsetICU[UTF-16] 130 * UTF-16BE value: java.nio.charset.CharsetICU[UTF-16BE] 131 * UTF-16LE value: java.nio.charset.CharsetICU[UTF-16LE] 132 * UTF-32 value: java.nio.charset.CharsetICU[UTF-32] 133 * UTF-32BE value: java.nio.charset.CharsetICU[UTF-32BE] 134 * UTF-32LE value: java.nio.charset.CharsetICU[UTF-32LE] 135 * UTF-7 value: java.nio.charset.CharsetICU[UTF-7] 136 * UTF-8 value: java.nio.charset.CharsetICU[UTF-8] 137 * windows-1250 value: java.nio.charset.CharsetICU[windows-1250] 138 * windows-1251 value: java.nio.charset.CharsetICU[windows-1251] 139 * windows-1252 value: java.nio.charset.CharsetICU[windows-1252] 140 * windows-1253 value: java.nio.charset.CharsetICU[windows-1253] 141 * windows-1254 value: java.nio.charset.CharsetICU[windows-1254] 142 * windows-1255 value: java.nio.charset.CharsetICU[windows-1255] 143 * windows-1256 value: java.nio.charset.CharsetICU[windows-1256] 144 * windows-1257 value: java.nio.charset.CharsetICU[windows-1257] 145 * windows-1258 value: java.nio.charset.CharsetICU[windows-1258] 146 * x-compound-text value: java.nio.charset.CharsetICU[x-compound-text] 147 * x-ebcdic-xml-us value: java.nio.charset.CharsetICU[x-ebcdic-xml-us] 148 * x-gsm-03.38-2000 value: java.nio.charset.CharsetICU[x-gsm-03.38-2000] 149 * x-ibm-1047-s390 value: java.nio.charset.CharsetICU[x-ibm-1047-s390] 150 * x-ibm-1125_P100-1997 value: java.nio.charset.CharsetICU[x-ibm-1125_P100-1997] 151 * x-ibm-1129_P100-1997 value: java.nio.charset.CharsetICU[x-ibm-1129_P100-1997] 152 * x-ibm-1130_P100-1997 value: java.nio.charset.CharsetICU[x-ibm-1130_P100-1997] 153 * x-ibm-1131_P100-1997 value: java.nio.charset.CharsetICU[x-ibm-1131_P100-1997] 154 * x-ibm-1132_P100-1998 value: java.nio.charset.CharsetICU[x-ibm-1132_P100-1998] 155 * x-ibm-1133_P100-1997 value: java.nio.charset.CharsetICU[x-ibm-1133_P100-1997] 156 * x-ibm-1137_P100-1999 value: java.nio.charset.CharsetICU[x-ibm-1137_P100-1999] 157 * x-ibm-1140-s390 value: java.nio.charset.CharsetICU[x-ibm-1140-s390] 158 * x-ibm-1141-s390 value: java.nio.charset.CharsetICU[x-ibm-1141-s390] 159 * x-ibm-1142-s390 value: java.nio.charset.CharsetICU[x-ibm-1142-s390] 160 * x-ibm-1143-s390 value: java.nio.charset.CharsetICU[x-ibm-1143-s390] 161 * x-ibm-1144-s390 value: java.nio.charset.CharsetICU[x-ibm-1144-s390] 162 * x-ibm-1145-s390 value: java.nio.charset.CharsetICU[x-ibm-1145-s390] 163 * x-ibm-1146-s390 value: java.nio.charset.CharsetICU[x-ibm-1146-s390] 164 * x-ibm-1147-s390 value: java.nio.charset.CharsetICU[x-ibm-1147-s390] 165 * x-ibm-1148-s390 value: java.nio.charset.CharsetICU[x-ibm-1148-s390] 166 * x-ibm-1149-s390 value: java.nio.charset.CharsetICU[x-ibm-1149-s390] 167 * x-ibm-1153-s390 value: java.nio.charset.CharsetICU[x-ibm-1153-s390] 168 * x-ibm-1154_P100-1999 value: java.nio.charset.CharsetICU[x-ibm-1154_P100-1999] 169 * x-ibm-1155_P100-1999 value: java.nio.charset.CharsetICU[x-ibm-1155_P100-1999] 170 * x-ibm-1156_P100-1999 value: java.nio.charset.CharsetICU[x-ibm-1156_P100-1999] 171 * x-ibm-1157_P100-1999 value: java.nio.charset.CharsetICU[x-ibm-1157_P100-1999] 172 * x-ibm-1158_P100-1999 value: java.nio.charset.CharsetICU[x-ibm-1158_P100-1999] 173 * x-ibm-1160_P100-1999 value: java.nio.charset.CharsetICU[x-ibm-1160_P100-1999] 174 * x-ibm-1162_P100-1999 value: java.nio.charset.CharsetICU[x-ibm-1162_P100-1999] 175 * x-ibm-1164_P100-1999 value: java.nio.charset.CharsetICU[x-ibm-1164_P100-1999] 176 * x-ibm-1250_P100-1995 value: java.nio.charset.CharsetICU[x-ibm-1250_P100-1995] 177 * x-ibm-1251_P100-1995 value: java.nio.charset.CharsetICU[x-ibm-1251_P100-1995] 178 * x-ibm-1252_P100-2000 value: java.nio.charset.CharsetICU[x-ibm-1252_P100-2000] 179 * x-ibm-1253_P100-1995 value: java.nio.charset.CharsetICU[x-ibm-1253_P100-1995] 180 * x-ibm-1254_P100-1995 value: java.nio.charset.CharsetICU[x-ibm-1254_P100-1995] 181 * x-ibm-1255_P100-1995 value: java.nio.charset.CharsetICU[x-ibm-1255_P100-1995] 182 * x-ibm-1256_P110-1997 value: java.nio.charset.CharsetICU[x-ibm-1256_P110-1997] 183 * x-ibm-1257_P100-1995 value: java.nio.charset.CharsetICU[x-ibm-1257_P100-1995] 184 * x-ibm-1258_P100-1997 value: java.nio.charset.CharsetICU[x-ibm-1258_P100-1997] 185 * x-ibm-12712-s390 value: java.nio.charset.CharsetICU[x-ibm-12712-s390] 186 * x-ibm-12712_P100-1998 value: java.nio.charset.CharsetICU[x-ibm-12712_P100-1998] 187 * x-ibm-1373_P100-2002 value: java.nio.charset.CharsetICU[x-ibm-1373_P100-2002] 188 * x-ibm-1383_P110-1999 value: java.nio.charset.CharsetICU[x-ibm-1383_P110-1999] 189 * x-ibm-1386_P100-2001 value: java.nio.charset.CharsetICU[x-ibm-1386_P100-2001] 190 * x-ibm-16684_P110-2003 value: java.nio.charset.CharsetICU[x-ibm-16684_P110-2003] 191 * x-ibm-16804-s390 value: java.nio.charset.CharsetICU[x-ibm-16804-s390] 192 * x-ibm-16804_X110-1999 value: java.nio.charset.CharsetICU[x-ibm-16804_X110-1999] 193 * x-ibm-25546 value: java.nio.charset.CharsetICU[x-ibm-25546] 194 * x-ibm-33722_P12A_P12A-2009_U2 value: 195 * java.nio.charset.CharsetICU[x-ibm-33722_P12A_P12A-2009_U2] 196 * x-ibm-37-s390 value: java.nio.charset.CharsetICU[x-ibm-37-s390] 197 * x-ibm-4517_P100-2005 value: java.nio.charset.CharsetICU[x-ibm-4517_P100-2005] 198 * x-ibm-4899_P100-1998 value: java.nio.charset.CharsetICU[x-ibm-4899_P100-1998] 199 * x-ibm-4909_P100-1999 value: java.nio.charset.CharsetICU[x-ibm-4909_P100-1999] 200 * x-ibm-4971_P100-1999 value: java.nio.charset.CharsetICU[x-ibm-4971_P100-1999] 201 * x-ibm-5123_P100-1999 value: java.nio.charset.CharsetICU[x-ibm-5123_P100-1999] 202 * x-ibm-5351_P100-1998 value: java.nio.charset.CharsetICU[x-ibm-5351_P100-1998] 203 * x-ibm-5352_P100-1998 value: java.nio.charset.CharsetICU[x-ibm-5352_P100-1998] 204 * x-ibm-5353_P100-1998 value: java.nio.charset.CharsetICU[x-ibm-5353_P100-1998] 205 * x-ibm-5478_P100-1995 value: java.nio.charset.CharsetICU[x-ibm-5478_P100-1995] 206 * x-ibm-803_P100-1999 value: java.nio.charset.CharsetICU[x-ibm-803_P100-1999] 207 * x-ibm-813_P100-1995 value: java.nio.charset.CharsetICU[x-ibm-813_P100-1995] 208 * x-ibm-8482_P100-1999 value: java.nio.charset.CharsetICU[x-ibm-8482_P100-1999] 209 * x-ibm-901_P100-1999 value: java.nio.charset.CharsetICU[x-ibm-901_P100-1999] 210 * x-ibm-902_P100-1999 value: java.nio.charset.CharsetICU[x-ibm-902_P100-1999] 211 * x-ibm-9067_X100-2005 value: java.nio.charset.CharsetICU[x-ibm-9067_X100-2005] 212 * x-ibm-916_P100-1995 value: java.nio.charset.CharsetICU[x-ibm-916_P100-1995] 213 * x-IBM1006 value: java.nio.charset.CharsetICU[x-IBM1006] 214 * x-IBM1025 value: java.nio.charset.CharsetICU[x-IBM1025] 215 * x-IBM1097 value: java.nio.charset.CharsetICU[x-IBM1097] 216 * x-IBM1098 value: java.nio.charset.CharsetICU[x-IBM1098] 217 * x-IBM1112 value: java.nio.charset.CharsetICU[x-IBM1112] 218 * x-IBM1122 value: java.nio.charset.CharsetICU[x-IBM1122] 219 * x-IBM1123 value: java.nio.charset.CharsetICU[x-IBM1123] 220 * x-IBM1124 value: java.nio.charset.CharsetICU[x-IBM1124] 221 * x-IBM1153 value: java.nio.charset.CharsetICU[x-IBM1153] 222 * x-IBM1363 value: java.nio.charset.CharsetICU[x-IBM1363] 223 * x-IBM1364 value: java.nio.charset.CharsetICU[x-IBM1364] 224 * x-IBM1371 value: java.nio.charset.CharsetICU[x-IBM1371] 225 * x-IBM1388 value: java.nio.charset.CharsetICU[x-IBM1388] 226 * x-IBM1390 value: java.nio.charset.CharsetICU[x-IBM1390] 227 * x-IBM1399 value: java.nio.charset.CharsetICU[x-IBM1399] 228 * x-IBM33722 value: java.nio.charset.CharsetICU[x-IBM33722] 229 * x-IBM720 value: java.nio.charset.CharsetICU[x-IBM720] 230 * x-IBM737 value: java.nio.charset.CharsetICU[x-IBM737] 231 * x-IBM856 value: java.nio.charset.CharsetICU[x-IBM856] 232 * x-IBM867 value: java.nio.charset.CharsetICU[x-IBM867] 233 * x-IBM875 value: java.nio.charset.CharsetICU[x-IBM875] 234 * x-IBM922 value: java.nio.charset.CharsetICU[x-IBM922] 235 * x-IBM930 value: java.nio.charset.CharsetICU[x-IBM930] 236 * x-IBM933 value: java.nio.charset.CharsetICU[x-IBM933] 237 * x-IBM935 value: java.nio.charset.CharsetICU[x-IBM935] 238 * x-IBM937 value: java.nio.charset.CharsetICU[x-IBM937] 239 * x-IBM939 value: java.nio.charset.CharsetICU[x-IBM939] 240 * x-IBM942 value: java.nio.charset.CharsetICU[x-IBM942] 241 * x-IBM943 value: java.nio.charset.CharsetICU[x-IBM943] 242 * x-IBM949 value: java.nio.charset.CharsetICU[x-IBM949] 243 * x-IBM949C value: java.nio.charset.CharsetICU[x-IBM949C] 244 * x-IBM950 value: java.nio.charset.CharsetICU[x-IBM950] 245 * x-IBM954 value: java.nio.charset.CharsetICU[x-IBM954] 246 * x-IBM964 value: java.nio.charset.CharsetICU[x-IBM964] 247 * x-IBM970 value: java.nio.charset.CharsetICU[x-IBM970] 248 * x-IBM971 value: java.nio.charset.CharsetICU[x-IBM971] 249 * x-IMAP-mailbox-name value: java.nio.charset.CharsetICU[x-IMAP-mailbox-name] 250 * x-iscii-be value: java.nio.charset.CharsetICU[x-iscii-be] 251 * x-iscii-gu value: java.nio.charset.CharsetICU[x-iscii-gu] 252 * x-iscii-ka value: java.nio.charset.CharsetICU[x-iscii-ka] 253 * x-iscii-ma value: java.nio.charset.CharsetICU[x-iscii-ma] 254 * x-iscii-or value: java.nio.charset.CharsetICU[x-iscii-or] 255 * x-iscii-pa value: java.nio.charset.CharsetICU[x-iscii-pa] 256 * x-iscii-ta value: java.nio.charset.CharsetICU[x-iscii-ta] 257 * x-iscii-te value: java.nio.charset.CharsetICU[x-iscii-te] 258 * x-ISCII91 value: java.nio.charset.CharsetICU[x-ISCII91] 259 * x-ISO-2022-CN-CNS value: java.nio.charset.CharsetICU[x-ISO-2022-CN-CNS] 260 * x-iso-8859-11 value: java.nio.charset.CharsetICU[x-iso-8859-11] 261 * x-JavaUnicode value: java.nio.charset.CharsetICU[x-JavaUnicode] 262 * x-JavaUnicode2 value: java.nio.charset.CharsetICU[x-JavaUnicode2] 263 * x-JIS7 value: java.nio.charset.CharsetICU[x-JIS7] 264 * x-JIS8 value: java.nio.charset.CharsetICU[x-JIS8] 265 * x-LMBCS-1 value: java.nio.charset.CharsetICU[x-LMBCS-1] 266 * x-mac-centraleurroman value: java.nio.charset.CharsetICU[x-mac-centraleurroman] 267 * x-mac-cyrillic value: java.nio.charset.CharsetICU[x-mac-cyrillic] 268 * x-mac-greek value: java.nio.charset.CharsetICU[x-mac-greek] 269 * x-mac-turkish value: java.nio.charset.CharsetICU[x-mac-turkish] 270 * x-MS950-HKSCS value: java.nio.charset.CharsetICU[x-MS950-HKSCS] 271 * x-UnicodeBig value: java.nio.charset.CharsetICU[x-UnicodeBig] 272 * x-UTF-16LE-BOM value: java.nio.charset.CharsetICU[x-UTF-16LE-BOM] 273 * x-UTF16_OppositeEndian value: java.nio.charset.CharsetICU[x-UTF16_OppositeEndian] 274 * x-UTF16_PlatformEndian value: java.nio.charset.CharsetICU[x-UTF16_PlatformEndian] 275 * x-UTF32_OppositeEndian value: java.nio.charset.CharsetICU[x-UTF32_OppositeEndian] 276 * x-UTF32_PlatformEndian value: java.nio.charset.CharsetICU[x-UTF32_PlatformEndian] 277 * 278 */ 279 public static final int ANY_CHARSET = 0x00; 280 public static final int US_ASCII = 0x03; 281 public static final int ISO_8859_1 = 0x04; 282 public static final int ISO_8859_2 = 0x05; 283 public static final int ISO_8859_3 = 0x06; 284 public static final int ISO_8859_4 = 0x07; 285 public static final int ISO_8859_5 = 0x08; 286 public static final int ISO_8859_6 = 0x09; 287 public static final int ISO_8859_7 = 0x0A; 288 public static final int ISO_8859_8 = 0x0B; 289 public static final int ISO_8859_9 = 0x0C; 290 public static final int SHIFT_JIS = 0x11; 291 public static final int EUC_JP = 0x12; 292 public static final int EUC_KR = 0x26; 293 public static final int ISO_2022_JP = 0x27; 294 public static final int ISO_2022_JP_2 = 0x28; 295 public static final int UTF_8 = 0x6A; 296 public static final int GBK = 0x71; 297 public static final int GB18030 = 0x72; 298 public static final int GB2312 = 0x07E9; 299 public static final int BIG5 = 0x07EA; 300 public static final int UCS2 = 0x03E8; 301 public static final int UTF_16 = 0x03F7; 302 public static final int HZ_GB_2312 = 0x0825; 303 304 /** 305 * If the encoding of given data is unsupported, use UTF_8 to decode it. 306 */ 307 public static final int DEFAULT_CHARSET = UTF_8; 308 309 /** 310 * Array of MIB enum numbers. 311 */ 312 private static final int[] MIBENUM_NUMBERS = { 313 ANY_CHARSET, 314 US_ASCII, 315 ISO_8859_1, 316 ISO_8859_2, 317 ISO_8859_3, 318 ISO_8859_4, 319 ISO_8859_5, 320 ISO_8859_6, 321 ISO_8859_7, 322 ISO_8859_8, 323 ISO_8859_9, 324 SHIFT_JIS, 325 EUC_JP, 326 EUC_KR, 327 ISO_2022_JP, 328 ISO_2022_JP_2, 329 UTF_8, 330 GBK, 331 GB18030, 332 GB2312, 333 BIG5, 334 UCS2, 335 UTF_16, 336 HZ_GB_2312, 337 }; 338 339 /** 340 * The Well-known-charset Mime name. 341 */ 342 public static final String MIMENAME_ANY_CHARSET = "*"; 343 public static final String MIMENAME_US_ASCII = "us-ascii"; 344 public static final String MIMENAME_ISO_8859_1 = "iso-8859-1"; 345 public static final String MIMENAME_ISO_8859_2 = "iso-8859-2"; 346 public static final String MIMENAME_ISO_8859_3 = "iso-8859-3"; 347 public static final String MIMENAME_ISO_8859_4 = "iso-8859-4"; 348 public static final String MIMENAME_ISO_8859_5 = "iso-8859-5"; 349 public static final String MIMENAME_ISO_8859_6 = "iso-8859-6"; 350 public static final String MIMENAME_ISO_8859_7 = "iso-8859-7"; 351 public static final String MIMENAME_ISO_8859_8 = "iso-8859-8"; 352 public static final String MIMENAME_ISO_8859_9 = "iso-8859-9"; 353 public static final String MIMENAME_SHIFT_JIS = "shift_JIS"; 354 public static final String MIMENAME_EUC_JP = "euc-jp"; 355 public static final String MIMENAME_EUC_KR = "euc-kr"; 356 public static final String MIMENAME_ISO_2022_JP = "iso-2022-jp"; 357 public static final String MIMENAME_ISO_2022_JP_2 = "iso-2022-jp-2"; 358 public static final String MIMENAME_UTF_8 = "utf-8"; 359 public static final String MIMENAME_GBK = "gbk"; 360 public static final String MIMENAME_GB18030 = "gb18030"; 361 public static final String MIMENAME_GB2312 = "gb2312"; 362 public static final String MIMENAME_BIG5 = "big5"; 363 public static final String MIMENAME_UCS2 = "iso-10646-ucs-2"; 364 public static final String MIMENAME_UTF_16 = "utf-16"; 365 public static final String MIMENAME_HZ_GB_2312 = "hz-gb-2312"; 366 367 public static final String DEFAULT_CHARSET_NAME = MIMENAME_UTF_8; 368 369 /** 370 * Array of the names of character sets. 371 */ 372 private static final String[] MIME_NAMES = { 373 MIMENAME_ANY_CHARSET, 374 MIMENAME_US_ASCII, 375 MIMENAME_ISO_8859_1, 376 MIMENAME_ISO_8859_2, 377 MIMENAME_ISO_8859_3, 378 MIMENAME_ISO_8859_4, 379 MIMENAME_ISO_8859_5, 380 MIMENAME_ISO_8859_6, 381 MIMENAME_ISO_8859_7, 382 MIMENAME_ISO_8859_8, 383 MIMENAME_ISO_8859_9, 384 MIMENAME_SHIFT_JIS, 385 MIMENAME_EUC_JP, 386 MIMENAME_EUC_KR, 387 MIMENAME_ISO_2022_JP, 388 MIMENAME_ISO_2022_JP_2, 389 MIMENAME_UTF_8, 390 MIMENAME_GBK, 391 MIMENAME_GB18030, 392 MIMENAME_GB2312, 393 MIMENAME_BIG5, 394 MIMENAME_UCS2, 395 MIMENAME_UTF_16, 396 MIMENAME_HZ_GB_2312, 397 }; 398 399 private static final SparseArray<String> MIBENUM_TO_NAME_MAP; 400 401 private static final SimpleArrayMap<String, Integer> NAME_TO_MIBENUM_MAP; 402 403 static { 404 // Create the HashMaps. 405 MIBENUM_TO_NAME_MAP = new SparseArray<String>(); 406 NAME_TO_MIBENUM_MAP = new SimpleArrayMap<String, Integer>(); assert(MIBENUM_NUMBERS.length == MIME_NAMES.length)407 assert (MIBENUM_NUMBERS.length == MIME_NAMES.length); 408 final int count = MIBENUM_NUMBERS.length - 1; 409 for (int i = 0; i <= count; i++) { MIBENUM_TO_NAME_MAP.put(MIBENUM_NUMBERS[i], MIME_NAMES[i])410 MIBENUM_TO_NAME_MAP.put(MIBENUM_NUMBERS[i], MIME_NAMES[i]); NAME_TO_MIBENUM_MAP.put(MIME_NAMES[i], MIBENUM_NUMBERS[i])411 NAME_TO_MIBENUM_MAP.put(MIME_NAMES[i], MIBENUM_NUMBERS[i]); 412 } 413 } 414 CharacterSets()415 private CharacterSets() { 416 } // Non-instantiatable 417 418 /** 419 * Map an MIBEnum number to the name of the charset which this number 420 * is assigned to by IANA. 421 * 422 * @param mibEnumValue An IANA assigned MIBEnum number. 423 * @return The name string of the charset. 424 */ getMimeName(final int mibEnumValue)425 public static String getMimeName(final int mibEnumValue) 426 throws UnsupportedEncodingException { 427 final String name = MIBENUM_TO_NAME_MAP.get(mibEnumValue); 428 if (name == null) { 429 throw new UnsupportedEncodingException(); 430 } 431 return name; 432 } 433 434 /** 435 * Map a well-known charset name to its assigned MIBEnum number. 436 * 437 * @param mimeName The charset name. 438 * @return The MIBEnum number assigned by IANA for this charset. 439 */ getMibEnumValue(final String mimeName)440 public static int getMibEnumValue(final String mimeName) 441 throws UnsupportedEncodingException { 442 if (null == mimeName) { 443 return -1; 444 } 445 446 final Integer mibEnumValue = NAME_TO_MIBENUM_MAP.get(mimeName); 447 if (mibEnumValue == null) { 448 throw new UnsupportedEncodingException(); 449 } 450 return mibEnumValue; 451 } 452 } 453