blob: a3894d6d2d3434fd92464eaa00873549ae7a5b97 [file] [log] [blame]
/*
* Copyright (C) 2007 Esmertec AG.
* Copyright (C) 2007 The Android Open Source Project
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package com.google.android.mms.pdu;
import android.compat.annotation.UnsupportedAppUsage;
import java.io.UnsupportedEncodingException;
import java.util.HashMap;
public class CharacterSets {
/**
* IANA assigned MIB enum numbers.
*
* From wap-230-wsp-20010705-a.pdf
* Any-charset = <Octet 128>
* Equivalent to the special RFC2616 charset value "*"
*/
public static final int ANY_CHARSET = 0x00;
public static final int US_ASCII = 0x03;
public static final int ISO_8859_1 = 0x04;
public static final int ISO_8859_2 = 0x05;
public static final int ISO_8859_3 = 0x06;
public static final int ISO_8859_4 = 0x07;
public static final int ISO_8859_5 = 0x08;
public static final int ISO_8859_6 = 0x09;
public static final int ISO_8859_7 = 0x0A;
public static final int ISO_8859_8 = 0x0B;
public static final int ISO_8859_9 = 0x0C;
public static final int SHIFT_JIS = 0x11;
public static final int UTF_8 = 0x6A;
public static final int BIG5 = 0x07EA;
public static final int UCS2 = 0x03E8;
public static final int UTF_16 = 0x03F7;
/**
* Extend charsets.
*
* From http://www.iana.org/assignments/character-sets/
*/
public static final int BIG5_HKSCS = 0x0835; //2101
public static final int BOCU_1 = 0x03FC; //1020
public static final int CESU_8 = 0x03F8; //1016
public static final int CP864 = 0x0803; //2051
public static final int EUC_JP = 0x12; //18
public static final int EUC_KR = 0x26; //38
public static final int GB18030 = 0x72; //114
public static final int GBK = 0x71; //113
public static final int HZ_GB_2312 = 0x0825; //2085
public static final int GB_2312 = 0x07E9; //2025
public static final int ISO_2022_CN = 0x68; //104
public static final int ISO_2022_CN_EXT = 0x69; //105
public static final int ISO_2022_JP = 0x27; //39
public static final int ISO_2022_KR = 0x25; //37
public static final int ISO_8859_10 = 0x0D; //13
public static final int ISO_8859_13 = 0x6D; //109
public static final int ISO_8859_14 = 0x6E; //110
public static final int ISO_8859_15 = 0x6F; //111
public static final int ISO_8859_16 = 0x70; //112
public static final int KOI8_R = 0x0824; //2084
public static final int KOI8_U = 0x0828; //2088
public static final int MACINTOSH = 0x07EB; //2027
public static final int SCSU = 0x03F3; //1011
public static final int TIS_620 = 0x08D3; //2259
public static final int UTF_16BE = 0x03F5; //1013
public static final int UTF_16LE = 0x03F6; //1014
public static final int UTF_32 = 0x03F9; //1017
public static final int UTF_32BE = 0x03FA; //1018
public static final int UTF_32LE = 0x03FB; //1019
public static final int UTF_7 = 0x03F4; //1012
public static final int WINDOWS_1250 = 0x08CA; //2250
public static final int WINDOWS_1251 = 0x08CB; //2251
public static final int WINDOWS_1252 = 0x08CC; //2252
public static final int WINDOWS_1253 = 0x08CD; //2253
public static final int WINDOWS_1254 = 0x08CE; //2254
public static final int WINDOWS_1255 = 0x08CF; //2255
public static final int WINDOWS_1256 = 0x08D0; //2256
public static final int WINDOWS_1257 = 0x08D1; //2257
public static final int WINDOWS_1258 = 0x08D2; //2258
/**
* If the encoding of given data is unsupported, use UTF_8 to decode it.
*/
public static final int DEFAULT_CHARSET = UTF_8;
/**
* Array of MIB enum numbers.
*/
private static final int[] MIBENUM_NUMBERS = {
ANY_CHARSET,
US_ASCII,
ISO_8859_1,
ISO_8859_2,
ISO_8859_3,
ISO_8859_4,
ISO_8859_5,
ISO_8859_6,
ISO_8859_7,
ISO_8859_8,
ISO_8859_9,
SHIFT_JIS,
UTF_8,
BIG5,
UCS2,
UTF_16,
BIG5_HKSCS,
BOCU_1,
CESU_8,
CP864,
EUC_JP,
EUC_KR,
GB18030,
GBK,
HZ_GB_2312,
GB_2312,
ISO_2022_CN,
ISO_2022_CN_EXT,
ISO_2022_JP,
ISO_2022_KR,
ISO_8859_10,
ISO_8859_13,
ISO_8859_14,
ISO_8859_15,
ISO_8859_16,
KOI8_R,
KOI8_U,
MACINTOSH,
SCSU,
TIS_620,
UTF_16BE,
UTF_16LE,
UTF_32,
UTF_32BE,
UTF_32LE,
UTF_7,
WINDOWS_1250,
WINDOWS_1251,
WINDOWS_1252,
WINDOWS_1253,
WINDOWS_1254,
WINDOWS_1255,
WINDOWS_1256,
WINDOWS_1257,
WINDOWS_1258,
};
/**
* The Well-known-charset Mime name.
*/
public static final String MIMENAME_ANY_CHARSET = "*";
public static final String MIMENAME_US_ASCII = "us-ascii";
public static final String MIMENAME_ISO_8859_1 = "iso-8859-1";
public static final String MIMENAME_ISO_8859_2 = "iso-8859-2";
public static final String MIMENAME_ISO_8859_3 = "iso-8859-3";
public static final String MIMENAME_ISO_8859_4 = "iso-8859-4";
public static final String MIMENAME_ISO_8859_5 = "iso-8859-5";
public static final String MIMENAME_ISO_8859_6 = "iso-8859-6";
public static final String MIMENAME_ISO_8859_7 = "iso-8859-7";
public static final String MIMENAME_ISO_8859_8 = "iso-8859-8";
public static final String MIMENAME_ISO_8859_9 = "iso-8859-9";
public static final String MIMENAME_SHIFT_JIS = "shift_JIS";
public static final String MIMENAME_UTF_8 = "utf-8";
public static final String MIMENAME_BIG5 = "big5";
public static final String MIMENAME_UCS2 = "iso-10646-ucs-2";
public static final String MIMENAME_UTF_16 = "utf-16";
/**
* Extend charsets.
*
* From http://www.iana.org/assignments/character-sets/
*/
public static final String MIMENAME_BIG5_HKSCS = "Big5-HKSCS";
public static final String MIMENAME_BOCU_1 = "BOCU-1";
public static final String MIMENAME_CESU_8 = "CESU-8";
public static final String MIMENAME_CP864 = "cp864";
public static final String MIMENAME_EUC_JP = "EUC-JP";
public static final String MIMENAME_EUC_KR = "EUC-KR";
public static final String MIMENAME_GB18030 = "GB18030";
public static final String MIMENAME_GBK = "GBK";
public static final String MIMENAME_HZ_GB_2312 = "HZ-GB-2312";
public static final String MIMENAME_GB_2312 = "GB2312";
public static final String MIMENAME_ISO_2022_CN = "ISO-2022-CN";
public static final String MIMENAME_ISO_2022_CN_EXT = "ISO-2022-CN-EXT";
public static final String MIMENAME_ISO_2022_JP = "ISO-2022-JP";
public static final String MIMENAME_ISO_2022_KR = "ISO-2022-KR";
public static final String MIMENAME_ISO_8859_10 = "ISO-8859-10";
public static final String MIMENAME_ISO_8859_13 = "ISO-8859-13";
public static final String MIMENAME_ISO_8859_14 = "ISO-8859-14";
public static final String MIMENAME_ISO_8859_15 = "ISO-8859-15";
public static final String MIMENAME_ISO_8859_16 = "ISO-8859-16";
public static final String MIMENAME_KOI8_R = "KOI8-R";
public static final String MIMENAME_KOI8_U = "KOI8-U";
public static final String MIMENAME_MACINTOSH = "macintosh";
public static final String MIMENAME_SCSU = "SCSU";
public static final String MIMENAME_TIS_620 = "TIS-620";
public static final String MIMENAME_UTF_16BE = "UTF-16BE";
public static final String MIMENAME_UTF_16LE = "UTF-16LE";
public static final String MIMENAME_UTF_32 = "UTF-32";
public static final String MIMENAME_UTF_32BE = "UTF-32BE";
public static final String MIMENAME_UTF_32LE = "UTF-32LE";
public static final String MIMENAME_UTF_7 = "UTF-7";
public static final String MIMENAME_WINDOWS_1250 = "windows-1250";
public static final String MIMENAME_WINDOWS_1251 = "windows-1251";
public static final String MIMENAME_WINDOWS_1252 = "windows-1252";
public static final String MIMENAME_WINDOWS_1253 = "windows-1253";
public static final String MIMENAME_WINDOWS_1254 = "windows-1254";
public static final String MIMENAME_WINDOWS_1255 = "windows-1255";
public static final String MIMENAME_WINDOWS_1256 = "windows-1256";
public static final String MIMENAME_WINDOWS_1257 = "windows-1257";
public static final String MIMENAME_WINDOWS_1258 = "windows-1258";
public static final String DEFAULT_CHARSET_NAME = MIMENAME_UTF_8;
/**
* Array of the names of character sets.
*/
private static final String[] MIME_NAMES = {
MIMENAME_ANY_CHARSET,
MIMENAME_US_ASCII,
MIMENAME_ISO_8859_1,
MIMENAME_ISO_8859_2,
MIMENAME_ISO_8859_3,
MIMENAME_ISO_8859_4,
MIMENAME_ISO_8859_5,
MIMENAME_ISO_8859_6,
MIMENAME_ISO_8859_7,
MIMENAME_ISO_8859_8,
MIMENAME_ISO_8859_9,
MIMENAME_SHIFT_JIS,
MIMENAME_UTF_8,
MIMENAME_BIG5,
MIMENAME_UCS2,
MIMENAME_UTF_16,
MIMENAME_BIG5_HKSCS,
MIMENAME_BOCU_1,
MIMENAME_CESU_8,
MIMENAME_CP864,
MIMENAME_EUC_JP,
MIMENAME_EUC_KR,
MIMENAME_GB18030,
MIMENAME_GBK,
MIMENAME_HZ_GB_2312,
MIMENAME_GB_2312,
MIMENAME_ISO_2022_CN,
MIMENAME_ISO_2022_CN_EXT,
MIMENAME_ISO_2022_JP,
MIMENAME_ISO_2022_KR,
MIMENAME_ISO_8859_10,
MIMENAME_ISO_8859_13,
MIMENAME_ISO_8859_14,
MIMENAME_ISO_8859_15,
MIMENAME_ISO_8859_16,
MIMENAME_KOI8_R,
MIMENAME_KOI8_U,
MIMENAME_MACINTOSH,
MIMENAME_SCSU,
MIMENAME_TIS_620,
MIMENAME_UTF_16BE,
MIMENAME_UTF_16LE,
MIMENAME_UTF_32,
MIMENAME_UTF_32BE,
MIMENAME_UTF_32LE,
MIMENAME_UTF_7,
MIMENAME_WINDOWS_1250,
MIMENAME_WINDOWS_1251,
MIMENAME_WINDOWS_1252,
MIMENAME_WINDOWS_1253,
MIMENAME_WINDOWS_1254,
MIMENAME_WINDOWS_1255,
MIMENAME_WINDOWS_1256,
MIMENAME_WINDOWS_1257,
MIMENAME_WINDOWS_1258,
};
private static final HashMap<Integer, String> MIBENUM_TO_NAME_MAP;
private static final HashMap<String, Integer> NAME_TO_MIBENUM_MAP;
static {
// Create the HashMaps.
MIBENUM_TO_NAME_MAP = new HashMap<Integer, String>();
NAME_TO_MIBENUM_MAP = new HashMap<String, Integer>();
assert(MIBENUM_NUMBERS.length == MIME_NAMES.length);
int count = MIBENUM_NUMBERS.length - 1;
for(int i = 0; i <= count; i++) {
MIBENUM_TO_NAME_MAP.put(MIBENUM_NUMBERS[i], MIME_NAMES[i]);
NAME_TO_MIBENUM_MAP.put(MIME_NAMES[i], MIBENUM_NUMBERS[i]);
}
}
private CharacterSets() {} // Non-instantiatable
/**
* Map an MIBEnum number to the name of the charset which this number
* is assigned to by IANA.
*
* @param mibEnumValue An IANA assigned MIBEnum number.
* @return The name string of the charset.
* @throws UnsupportedEncodingException
*/
@UnsupportedAppUsage
public static String getMimeName(int mibEnumValue)
throws UnsupportedEncodingException {
String name = MIBENUM_TO_NAME_MAP.get(mibEnumValue);
if (name == null) {
throw new UnsupportedEncodingException();
}
return name;
}
/**
* Map a well-known charset name to its assigned MIBEnum number.
*
* @param mimeName The charset name.
* @return The MIBEnum number assigned by IANA for this charset.
* @throws UnsupportedEncodingException
*/
@UnsupportedAppUsage
public static int getMibEnumValue(String mimeName)
throws UnsupportedEncodingException {
if(null == mimeName) {
return -1;
}
Integer mibEnumValue = NAME_TO_MIBENUM_MAP.get(mimeName);
if (mibEnumValue == null) {
throw new UnsupportedEncodingException();
}
return mibEnumValue;
}
}