ICU-307 eliminate unneeded entries due to lenient matching, keeping IANA/MIME names; retry with MINIMAL changes

X-SVN-Rev: 1973
This commit is contained in:
Alan Liu 2000-07-20 16:04:19 +00:00
parent 24c2b9c0e6
commit 3d820108d3
2 changed files with 164 additions and 164 deletions

View File

@ -40,13 +40,13 @@
# be changed - or else code and/or file names must also be changed.
# Algorithmic
UTF8 utf-8 utf8 ibm-1208 utf_8 ibm1208 cp1208
UTF8 UTF-8 ibm-1208 cp1208
UTF16_BigEndian utf-16be
UTF16_LittleEndian utf-16le
UTF16_PlatformEndian iso-10646-ucs-2 csUnicode utf16 utf-16 ibm-1200 ibm1200 cp1200 ucs-2
UTF16_PlatformEndian iso-10646-ucs-2 csUnicode UTF-16 ibm-1200 cp1200 ucs-2
UTF16_OppositeEndian
LATIN_1 iso-8859-1 iso_8859-1 ibm-819 ibm819 cp819 latin1 latin-1 8859-1 csisolatin1 iso-ir-100 iso_8859-1:1978 cp367 iso-8859-1:1987 l1 iso_8859_1 ansi_x3.110-1983 iso8859-1 #!!!!! There's whole lot of names for this
ISO_2022 iso-2022 2022 cp2022 iso2022 iso_2022
LATIN_1 ISO-8859-1 ibm-819 cp819 latin1 8859-1 csisolatin1 iso-ir-100 cp367 ISO_8859-1:1987 l1 ansi_x3.110-1983 #!!!!! There's whole lot of names for this
ISO_2022 ISO-2022 2022 cp2022
LMBCS-1 lmbcs
LMBCS-2
LMBCS-3
@ -62,71 +62,71 @@ LMBCS-19
# Table-based
ibm-367 usascii ascii ascii-7 us-ascii usascii ansi_x3.4-1968 ansi_x3.4-1986 iso_646.irv:1991 iso646-us us csASCII 646
ibm-367 ascii ascii-7 US-ASCII ansi_x3.4-1968 ansi_x3.4-1986 iso_646.irv:1991 iso646-us us csASCII 646
# Special mapping for S/390 new line characters
ebcdic-xml-us
# Interchange codepages
ibm-912 iso-8859-2 iso_8859-2 iso8859-2 ibm912 cp912 latin2 8859-2 csisolatin2 iso-ir-101 iso_8859-2:1987 l2 # Central Europe
ibm-913 iso-8859-3 iso_8859-3 iso8859-3 latin3 cp913 ibm913 8859-3 csisolatin3 iso-ir-109 iso_8859-3:1988 l3 # Maltese Esperanto
ibm-914 iso-8859-4 iso_8859-4 iso8859-4 latin4 cp914 ibm914 8859-4 csisolatin4 iso-ir-110 iso_8859-4:1988 l4 # Baltic
ibm-915 iso-8859-5 iso_8859-5 iso8859-5 cyrillic cp915 ibm915 8859-5 csisolatincyrillic iso-ir-144 iso_8859-5:1988 # Cyrillic
ibm-1089 iso-8859-6 iso_8859-6 iso8859-6 arabic cp1089 ibm1089 8859-6 csisolatinarabic iso-ir-127 iso_8859-6:1987 ecma-114 asmo-708 # Arabic
ibm-4909 cp813 iso-8859-7 iso_8859-7 iso8859-7 cp813 greek greek8 elot_928 ecma-118 8859-7 csisolatingreek iso-ir-126 iso_8859-7:1987 # ISO Greek (w/ euro update)
ibm-912 ISO-8859-2 cp912 latin2 8859-2 csisolatin2 iso-ir-101 iso_8859-2:1987 l2 # Central Europe
ibm-913 ISO-8859-3 latin3 cp913 8859-3 csisolatin3 iso-ir-109 iso_8859-3:1988 l3 # Maltese Esperanto
ibm-914 ISO-8859-4 latin4 cp914 8859-4 csisolatin4 iso-ir-110 iso_8859-4:1988 l4 # Baltic
ibm-915 ISO-8859-5 cyrillic cp915 8859-5 csisolatincyrillic iso-ir-144 iso_8859-5:1988 # Cyrillic
ibm-1089 ISO-8859-6 arabic cp1089 8859-6 csisolatinarabic iso-ir-127 iso_8859-6:1987 ecma-114 asmo-708 # Arabic
ibm-4909 cp813 ISO-8859-7 greek greek8 elot_928 ecma-118 8859-7 csisolatingreek iso-ir-126 iso_8859-7:1987 # ISO Greek (w/ euro update)
ibm-813 # same as 4909 (w/o euro update)
ibm-916 iso-8859-8 iso_8859-8 iso8859-8 hebrew cp916 ibm916 8859-8 csisolatinhebrew iso-ir-138 iso_8859-8:1988 # hebrew iso-8859-8i - typo?
ibm-920 iso-8859-9 iso_8859-9 iso8859-9 ECMA-128 latin5 cp920 ibm920 8859-9 csisolatin5 iso-ir-148 l5 # Turkish
ibm-923 iso-8859-15 iso_8859-15 iso8859-15 latin9 cp923 ibm923 8859-15 latin0 csisolatin0 csisolatin9 # Latin 9
ibm-916 ISO-8859-8 hebrew cp916 8859-8 csisolatinhebrew iso-ir-138 iso_8859-8:1988 # hebrew iso-8859-8i - typo?
ibm-920 ISO-8859-9 ECMA-128 latin5 cp920 8859-9 csisolatin5 iso-ir-148 l5 # Turkish
ibm-923 ISO-8859-15 latin9 cp923 8859-15 latin0 csisolatin0 csisolatin9 # Latin 9
ibm-1252 windows-1252 cp1252 ibm-1004 cp1004 # Windows Latin 1 We don't have an ibm-5348, so this is a best possible match
ibm-943 shift_jis csWindows31J sjis shiftjis shift-jis ibm943 cp943 cp932 ms_kanji csshiftjis windows-31j x-sjis # japanese. Unicode name is \u30b7\u30d5\u30c8\u7b26\u53f7\u5316\u8868\u73fe Iana says that Windows-31J is an extension to csshiftjis ibm-932 removed
ibm-949 KS_C_5601-1987 iso-ir-149 KS_C_5601-1989 csKSC56011987 ibm949 ksc-5601 ksc_5601 johab ks_x_1001:1992 # KSC-5601-1992, korean
ibm-1370 Big5 csBig5 big-5 x-big5 cp950 # Taiwan Big-5 (w/ euro update)
ibm-943 Shift_JIS csWindows31J sjis cp943 cp932 ms_kanji csshiftjis windows-31j x-sjis # japanese. Unicode name is \u30b7\u30d5\u30c8\u7b26\u53f7\u5316\u8868\u73fe Iana says that Windows-31J is an extension to csshiftjis ibm-932 removed
ibm-949 KS_C_5601-1987 iso-ir-149 KS_C_5601-1989 csKSC56011987 KSC_5601 johab ks_x_1001:1992 # KSC-5601-1992, korean
ibm-1370 Big5 csBig5 x-big5 cp950 # Taiwan Big-5 (w/ euro update)
ibm-950 # Taiwan Big-5
ibm-1386 gb_2312-80 iso-ir-58 csISO58GB231280 gb2312-80 gbk chinese gb ibm1386 gb2312 gb2312-1980 cp936 zh_cn # Chinese GBK removed
ibm-954 euc-jp eucJP ibm-eucJP eucjis extended_unix_code_packed_format_for_japanese cseuckdfmtjapanese x-euc-jp x-eucjp # Japan EUC
ibm-970 euc-kr euckr ibm-eucKR csEUCKR # Korean EUC
#ibm-964 euc-tw euctw ibm-eucTW cns11643 # Taiwan EUC
ibm-1386 GB_2312-80 iso-ir-58 csISO58GB231280 gbk chinese gb gb2312 gb2312-1980 cp936 zh_cn # Chinese GBK removed
ibm-954 EUC-JP ibm-eucJP eucjis extended_unix_code_packed_format_for_japanese cseuckdfmtjapanese X-EUC-JP # Japan EUC
ibm-970 EUC-KR ibm-eucKR csEUCKR # Korean EUC
#ibm-964 EUC-TW ibm-eucTW cns11643 # Taiwan EUC
#ibm-1361 cp949 ksc korean # Korean KSC
ibm-1383 euc-cn euccn ibm-eucCN # China EUC
ibm-1383 EUC-CN ibm-eucCN # China EUC
#ibm-1162 tis-620 cp874 windows-874 ms874 # Thai (w/ euro support) #what is the connection between this and the one below!!!
ibm-874 ibm-1161 #same as 1162 (w/o euro update) ***This is commented out in Helena's
lmb-excp # special exceptions list for LMBCS algorithm
# Platform codepages
ibm-437 ibm437 cp437 csPC8CodePage437 437 # PC US
ibm-437 cp437 csPC8CodePage437 437 # PC US
# HSYS:
ibm-850 IBM850 cp850 850 csPC850Multilingual # PC latin1
ibm-851 IBM851 cp851 851 csPC851 # PC DOS Greek (no euro)
ibm-858 ibm858 cp858 # PC latin1 with Euro cp850 removed
ibm-850 cp850 850 csPC850Multilingual # PC latin1
ibm-851 cp851 851 csPC851 # PC DOS Greek (no euro)
ibm-858 cp858 # PC latin1 with Euro cp850 removed
ibm-9044 852 csPCp852 cp852 # PC latin2 (w/ euro update) #where should the names go here or below - inconsistency!!!
ibm-852 # PC latin2 (w/o euro update)
ibm-872 855 csIBM855 cp855 # PC cyrillic (w/ euro update) #where should the names go here or below - inconsistency!!!
ibm-855 # PC cyrillic (w/o euro update)
ibm-856 ibm856 cp856 # PC Hebrew (old)
ibm-856 cp856 # PC Hebrew (old)
ibm-9049 857 csIBM857 cp857 # PC Latin 5 (Turkish) (w/ euro update) #where should the names go here or below - inconsistency!!!
ibm-857 # PC Latin 5 (w/o euro update)
ibm-859 ibm859 cp859 # PC Latin 9 (w/ euro update)
ibm-860 ibm860 cp860 860 csIBM860 # PC Portugal
ibm-861 ibm861 cp861 861 cp-is csIBM861 # PC Iceland
ibm-867 ibm867 cp867 862 cp862 cspc862latinhebrew # PC Hebrew (w/ euro update) #where should the names go here or below - inconsistency!!!
ibm-862 IBM862 # PC Hebrew (w/o euro update)
ibm-863 ibm863 cp863 863 csIBM863 # PC Canadian French
ibm-859 cp859 # PC Latin 9 (w/ euro update)
ibm-860 cp860 860 csIBM860 # PC Portugal
ibm-861 cp861 861 cp-is csIBM861 # PC Iceland
ibm-867 cp867 862 cp862 cspc862latinhebrew # PC Hebrew (w/ euro update) #where should the names go here or below - inconsistency!!!
ibm-862 # PC Hebrew (w/o euro update)
ibm-863 cp863 863 csIBM863 # PC Canadian French
ibm-17248 cp864 csIBM864 # PC Arabic (w/ euro update) #where should the names go here or below - inconsistency!!!
ibm-864 # PC Arabic (w/o euro update)
ibm-865 ibm865 cp865 865 csIBM865 # PC Nordic
ibm-865 cp865 865 csIBM865 # PC Nordic
ibm-808 cp866 866 csIBM866 # PC Russian (w/ euro update) #where should the names go here or below - inconsistency!!! put IBM866 cp866 866 csIBM866 down
ibm-866 IBM866 # PC Russian (w/o euro update) added IBM866 cp866 866 csIBM866
ibm-868 ibm868 cp868 cp-ar csIBM868 # PC Urdu
ibm-866 # PC Russian (w/o euro update) added IBM866 cp866 866 csIBM866
ibm-868 cp868 cp-ar csIBM868 # PC Urdu
ibm-9061 869 cp-gr csIBM869 cp869 # PC Greek (w/ euro update)
ibm-869 # PC Greek (w/o euro update)
ibm-878 koi8-r ibm878 cp878 koi8 cskoi8r # Russian internet
ibm-878 koi8-r cp878 koi8 cskoi8r # Russian internet
ibm-901 cp921 # PC Baltic (w/ euro update) moved cp921 down
ibm-921 # PC Baltic (w/o euro update) from above
ibm-902 cp922 # PC Estonian (w/ euro update) moved cp922 down
ibm-922 # PC Estonian (w/o euro update) from above
ibm-942 shift_jis78 sjis78 ibm-932 ibm932 # Old s_jis ibm-932 added!
ibm-942 shift_jis78 sjis78 ibm-932 # Old s_jis ibm-932 added!
ibm-1038 Adobe-Symbol-Encoding csHPPSMath symbol
ibm-5346 windows-1250 cp1250 # Windows Latin2 (w/ euro update)
ibm-5347 windows-1251 cp1251 # Windows Cyrillic (w/ euro update)
@ -170,25 +170,25 @@ ibm-21427 cp947 # PC DBCS Big-5 (w/ euro update)
# EBCDIC codepages according to the CDRA
# without Euro
ibm-37 IBM037 ibm-037 cpibm37 ebcdic-cp-ca ebcdic-cp-wt ebcdic-cp-nl csIBM037 cp37 ebcdic-cp-us cp037 # EBCDIC US
ibm-273 IBM273 csIBM273 ebcdic-de cp273 cpibm273 # EBCDIC Germany, Austria...
ibm-277 IBM277 EBCDIC-CP-DK EBCDIC-CP-NO csIBM277 ebcdic-dk cp277 cpibm277 # EBCDIC Denmark...
ibm-278 IBM278 ebcdic-cp-fi ebcdic-cp-se csIBM278 ebcdic-sv cp278 cpibm278 # EBCDIC Sweden
ibm-280 IBM280 ebcdic-cp-it csIBM280 cp280 cpibm280 # EBCDIC Italy
ibm-284 IBM284 ebcdic-cp-es csIBM284 cp284 cpibm284 # EBCDIC Spain
ibm-285 IBM285 ebcdic-cp-gb csIBM285 ebcdic-gb cp285 cpibm285 # EBCDIC UK Ireland
ibm-290 IBM290 EBCDIC-JP-kana csIBM290 cp290 # host SBCS (Katakana)
ibm-297 IBM297 ebcdic-cp-fr csIBM297 cp297 cpibm297 # EBCDIC France
ibm-420 IBM420 ebcdic-cp-ar1 csIBM420 ibm-420 cp420
ibm-424 IBM424 ebcdic-cp-he csIBM424 cp424 ibm-424
ibm-500 IBM500 cpibm500 csIBM500 cp500 ebcdic-cp-be ebcdic-cp-ch # EBCDIC International Latin1
ibm-37 ibm-037 cpibm37 ebcdic-cp-ca ebcdic-cp-wt ebcdic-cp-nl csIBM037 cp37 ebcdic-cp-us cp037 # EBCDIC US
ibm-273 csIBM273 ebcdic-de cp273 cpibm273 # EBCDIC Germany, Austria...
ibm-277 EBCDIC-CP-DK EBCDIC-CP-NO csIBM277 ebcdic-dk cp277 cpibm277 # EBCDIC Denmark...
ibm-278 ebcdic-cp-fi ebcdic-cp-se csIBM278 ebcdic-sv cp278 cpibm278 # EBCDIC Sweden
ibm-280 ebcdic-cp-it csIBM280 cp280 cpibm280 # EBCDIC Italy
ibm-284 ebcdic-cp-es csIBM284 cp284 cpibm284 # EBCDIC Spain
ibm-285 ebcdic-cp-gb csIBM285 ebcdic-gb cp285 cpibm285 # EBCDIC UK Ireland
ibm-290 EBCDIC-JP-kana csIBM290 cp290 # host SBCS (Katakana)
ibm-297 ebcdic-cp-fr csIBM297 cp297 cpibm297 # EBCDIC France
ibm-420 ebcdic-cp-ar1 csIBM420 cp420
ibm-424 ebcdic-cp-he csIBM424 cp424
ibm-500 cpibm500 csIBM500 cp500 ebcdic-cp-be ebcdic-cp-ch # EBCDIC International Latin1
ibm-803 cp803 # Old EBCDIC Hebrew
ibm-834 cp834 # Korean DBCS Host
ibm-835 cp835 # DBCS T-Ch Host
ibm-871 IBM871 ebcdic-cp-is csIBM871 cpibm871 cp871 # EBCDIC Iceland
ibm-871 ebcdic-cp-is csIBM871 cpibm871 cp871 # EBCDIC Iceland
ibm-930 cp930 cpibm930 # Japan EBCDIC MIXED
ibm-933 ibm933 cp933 cpibm933 # Korea EBCDIC MIXED
ibm-935 ibm935 cp935 cpibm935 # China EBCDIC MIXED
ibm-933 cp933 cpibm933 # Korea EBCDIC MIXED
ibm-935 cp935 cpibm935 # China EBCDIC MIXED
ibm-937 cp937 cpibm937 # Taiwan EBCDIC MIXED
ibm-939 cp939 # Host MBCS (Latin-Kanji)
#ibm-1046 # PC Arabic without EURO
@ -197,17 +197,17 @@ ibm-1390 cpibm1390 # Japan EBCDIC MIXED
ibm-1371 cpibm1371 # Taiwan EBCDIC MIXED
ibm-1047 cpibm1047 # EBCDIC Open systems Latin1
ibm-1123 cpibm1123 # Cyrillic Ukraine EBCDIC
ibm-1140 cpibm1140 ibm1140 # EBCDIC US...
ibm-1141 cpibm1141 ibm1141 # EBCDIC Germany, Austria...
ibm-1142 cpibm1142 ibm1142 # EBCDIC Denmark...
ibm-1143 cpibm1143 ibm1143 # EBCDIC Sweden
ibm-1144 cpibm1144 ibm1144 # EBCDIC Italy
ibm-1145 cpibm1145 ibm1145 # EBCDIC Spain
ibm-1146 cpibm1146 ibm1146 # EBCDIC UK Ireland
ibm-1147 cpibm1147 ibm1147 # EBCDIC France
ibm-1148 cpibm1148 ibm1148 # EBCDIC International Latin1
ibm-1149 cpibm1149 ibm1149 ebcdic-is # EBCDIC Iceland
ibm-1153 cpibm1153 ibm1153 # EBCDIC latin 2
ibm-1140 cpibm1140 # EBCDIC US...
ibm-1141 cpibm1141 # EBCDIC Germany, Austria...
ibm-1142 cpibm1142 # EBCDIC Denmark...
ibm-1143 cpibm1143 # EBCDIC Sweden
ibm-1144 cpibm1144 # EBCDIC Italy
ibm-1145 cpibm1145 # EBCDIC Spain
ibm-1146 cpibm1146 # EBCDIC UK Ireland
ibm-1147 cpibm1147 # EBCDIC France
ibm-1148 cpibm1148 # EBCDIC International Latin1
ibm-1149 cpibm1149 ebcdic-is # EBCDIC Iceland
ibm-1153 cpibm1153 # EBCDIC latin 2
ibm-1154 cp1025 cpibm1154 # EBCDIC Cyrillic Multilingual
ibm-1155 IBM1026 csIBM1026 cp1026 cpibm1155 # EBCDIC Turkey
ibm-1156 cp1112 cpibm1156 # EBCDIC Baltic Multilingual
@ -225,9 +225,9 @@ ibm-4899 cpibm4899 # Old EBCDIC Hebrew
ibm-4971 cp875 cpibm4971 # EBCDIC Greek
ibm-9027 # DBCS T-Ch Host
ibm-5123 cp1027 # Host Roman Jis
ibm-12712 cpibm12712 ibm12712 ebcdic-he # EBCDIC Hebrew (new sheqel, control characters update)
ibm-12712 cpibm12712 ebcdic-he # EBCDIC Hebrew (new sheqel, control characters update)
ibm-16684 cp300 # Jis + Roman Jis Host
ibm-16804 cpibm16804 ibm16804 ebcdic-ar # EBCDIC Arabic
ibm-16804 cpibm16804 ebcdic-ar # EBCDIC Arabic
# unsupported IANA names
# ebcdic-us
@ -240,20 +240,20 @@ ibm-16804 cpibm16804 ibm16804 ebcdic-ar # EBCDIC Arabic
# EBCDIC codepages for S/390, with LF and NL codes swapped
# without Euro
ibm-37-s390 ibm037-s390 # EBCDIC US
ibm-1047-s390 ibm1047-s390 # EBCDIC for S/390 Open Edition
# with Euro
ibm-1140-s390 ibm1140-s390 # EBCDIC US
ibm-1142-s390 ibm1142-s390 # EBCDIC Denmark
ibm-1143-s390 ibm1143-s390 # EBCDIC Sweden
ibm-1144-s390 ibm1144-s390 # EBCDIC Italy
ibm-1145-s390 ibm1145-s390 # EBCDIC Spain
ibm-1146-s390 ibm1146-s390 # EBCDIC UK Ireland
ibm-1147-s390 ibm1147-s390 # EBCDIC France
ibm-1148-s390 ibm1148-s390 # EBCDIC International Latin1
ibm-1149-s390 ibm1149-s390 # EBCDIC Iceland
ibm-1153-s390 ibm1153-s390 # EBCDIC latin 2
ibm-12712-s390 ibm12712-s390 # EBCDIC Hebrew
ibm-16804-s390 ibm16804-s390 # EBCDIC Arabic
ibm-37-s390 ibm037-s390 # EBCDIC US
ibm-1047-s390 # EBCDIC for S/390 Open Edition
# with Euro
ibm-1140-s390 # EBCDIC US
ibm-1142-s390 # EBCDIC Denmark
ibm-1143-s390 # EBCDIC Sweden
ibm-1144-s390 # EBCDIC Italy
ibm-1145-s390 # EBCDIC Spain
ibm-1146-s390 # EBCDIC UK Ireland
ibm-1147-s390 # EBCDIC France
ibm-1148-s390 # EBCDIC International Latin1
ibm-1149-s390 # EBCDIC Iceland
ibm-1153-s390 # EBCDIC latin 2
ibm-12712-s390 # EBCDIC Hebrew
ibm-16804-s390 # EBCDIC Arabic

View File

@ -40,13 +40,13 @@
# be changed - or else code and/or file names must also be changed.
# Algorithmic
UTF8 utf-8 utf8 ibm-1208 utf_8 ibm1208 cp1208
UTF8 UTF-8 ibm-1208 cp1208
UTF16_BigEndian utf-16be
UTF16_LittleEndian utf-16le
UTF16_PlatformEndian iso-10646-ucs-2 csUnicode utf16 utf-16 ibm-1200 ibm1200 cp1200 ucs-2
UTF16_PlatformEndian iso-10646-ucs-2 csUnicode UTF-16 ibm-1200 cp1200 ucs-2
UTF16_OppositeEndian
LATIN_1 iso-8859-1 iso_8859-1 ibm-819 ibm819 cp819 latin1 latin-1 8859-1 csisolatin1 iso-ir-100 iso_8859-1:1978 cp367 iso-8859-1:1987 l1 iso_8859_1 ansi_x3.110-1983 iso8859-1 #!!!!! There's whole lot of names for this
ISO_2022 iso-2022 2022 cp2022 iso2022 iso_2022
LATIN_1 ISO-8859-1 ibm-819 cp819 latin1 8859-1 csisolatin1 iso-ir-100 cp367 ISO_8859-1:1987 l1 ansi_x3.110-1983 #!!!!! There's whole lot of names for this
ISO_2022 ISO-2022 2022 cp2022
LMBCS-1 lmbcs
LMBCS-2
LMBCS-3
@ -62,71 +62,71 @@ LMBCS-19
# Table-based
ibm-367 usascii ascii ascii-7 us-ascii usascii ansi_x3.4-1968 ansi_x3.4-1986 iso_646.irv:1991 iso646-us us csASCII 646
ibm-367 ascii ascii-7 US-ASCII ansi_x3.4-1968 ansi_x3.4-1986 iso_646.irv:1991 iso646-us us csASCII 646
# Special mapping for S/390 new line characters
ebcdic-xml-us
# Interchange codepages
ibm-912 iso-8859-2 iso_8859-2 iso8859-2 ibm912 cp912 latin2 8859-2 csisolatin2 iso-ir-101 iso_8859-2:1987 l2 # Central Europe
ibm-913 iso-8859-3 iso_8859-3 iso8859-3 latin3 cp913 ibm913 8859-3 csisolatin3 iso-ir-109 iso_8859-3:1988 l3 # Maltese Esperanto
ibm-914 iso-8859-4 iso_8859-4 iso8859-4 latin4 cp914 ibm914 8859-4 csisolatin4 iso-ir-110 iso_8859-4:1988 l4 # Baltic
ibm-915 iso-8859-5 iso_8859-5 iso8859-5 cyrillic cp915 ibm915 8859-5 csisolatincyrillic iso-ir-144 iso_8859-5:1988 # Cyrillic
ibm-1089 iso-8859-6 iso_8859-6 iso8859-6 arabic cp1089 ibm1089 8859-6 csisolatinarabic iso-ir-127 iso_8859-6:1987 ecma-114 asmo-708 # Arabic
ibm-4909 cp813 iso-8859-7 iso_8859-7 iso8859-7 cp813 greek greek8 elot_928 ecma-118 8859-7 csisolatingreek iso-ir-126 iso_8859-7:1987 # ISO Greek (w/ euro update)
ibm-912 ISO-8859-2 cp912 latin2 8859-2 csisolatin2 iso-ir-101 iso_8859-2:1987 l2 # Central Europe
ibm-913 ISO-8859-3 latin3 cp913 8859-3 csisolatin3 iso-ir-109 iso_8859-3:1988 l3 # Maltese Esperanto
ibm-914 ISO-8859-4 latin4 cp914 8859-4 csisolatin4 iso-ir-110 iso_8859-4:1988 l4 # Baltic
ibm-915 ISO-8859-5 cyrillic cp915 8859-5 csisolatincyrillic iso-ir-144 iso_8859-5:1988 # Cyrillic
ibm-1089 ISO-8859-6 arabic cp1089 8859-6 csisolatinarabic iso-ir-127 iso_8859-6:1987 ecma-114 asmo-708 # Arabic
ibm-4909 cp813 ISO-8859-7 greek greek8 elot_928 ecma-118 8859-7 csisolatingreek iso-ir-126 iso_8859-7:1987 # ISO Greek (w/ euro update)
ibm-813 # same as 4909 (w/o euro update)
ibm-916 iso-8859-8 iso_8859-8 iso8859-8 hebrew cp916 ibm916 8859-8 csisolatinhebrew iso-ir-138 iso_8859-8:1988 # hebrew iso-8859-8i - typo?
ibm-920 iso-8859-9 iso_8859-9 iso8859-9 ECMA-128 latin5 cp920 ibm920 8859-9 csisolatin5 iso-ir-148 l5 # Turkish
ibm-923 iso-8859-15 iso_8859-15 iso8859-15 latin9 cp923 ibm923 8859-15 latin0 csisolatin0 csisolatin9 # Latin 9
ibm-916 ISO-8859-8 hebrew cp916 8859-8 csisolatinhebrew iso-ir-138 iso_8859-8:1988 # hebrew iso-8859-8i - typo?
ibm-920 ISO-8859-9 ECMA-128 latin5 cp920 8859-9 csisolatin5 iso-ir-148 l5 # Turkish
ibm-923 ISO-8859-15 latin9 cp923 8859-15 latin0 csisolatin0 csisolatin9 # Latin 9
ibm-1252 windows-1252 cp1252 ibm-1004 cp1004 # Windows Latin 1 We don't have an ibm-5348, so this is a best possible match
ibm-943 shift_jis csWindows31J sjis shiftjis shift-jis ibm943 cp943 cp932 ms_kanji csshiftjis windows-31j x-sjis # japanese. Unicode name is \u30b7\u30d5\u30c8\u7b26\u53f7\u5316\u8868\u73fe Iana says that Windows-31J is an extension to csshiftjis ibm-932 removed
ibm-949 KS_C_5601-1987 iso-ir-149 KS_C_5601-1989 csKSC56011987 ibm949 ksc-5601 ksc_5601 johab ks_x_1001:1992 # KSC-5601-1992, korean
ibm-1370 Big5 csBig5 big-5 x-big5 cp950 # Taiwan Big-5 (w/ euro update)
ibm-943 Shift_JIS csWindows31J sjis cp943 cp932 ms_kanji csshiftjis windows-31j x-sjis # japanese. Unicode name is \u30b7\u30d5\u30c8\u7b26\u53f7\u5316\u8868\u73fe Iana says that Windows-31J is an extension to csshiftjis ibm-932 removed
ibm-949 KS_C_5601-1987 iso-ir-149 KS_C_5601-1989 csKSC56011987 KSC_5601 johab ks_x_1001:1992 # KSC-5601-1992, korean
ibm-1370 Big5 csBig5 x-big5 cp950 # Taiwan Big-5 (w/ euro update)
ibm-950 # Taiwan Big-5
ibm-1386 gb_2312-80 iso-ir-58 csISO58GB231280 gb2312-80 gbk chinese gb ibm1386 gb2312 gb2312-1980 cp936 zh_cn # Chinese GBK removed
ibm-954 euc-jp eucJP ibm-eucJP eucjis extended_unix_code_packed_format_for_japanese cseuckdfmtjapanese x-euc-jp x-eucjp # Japan EUC
ibm-970 euc-kr euckr ibm-eucKR csEUCKR # Korean EUC
#ibm-964 euc-tw euctw ibm-eucTW cns11643 # Taiwan EUC
ibm-1386 GB_2312-80 iso-ir-58 csISO58GB231280 gbk chinese gb gb2312 gb2312-1980 cp936 zh_cn # Chinese GBK removed
ibm-954 EUC-JP ibm-eucJP eucjis extended_unix_code_packed_format_for_japanese cseuckdfmtjapanese X-EUC-JP # Japan EUC
ibm-970 EUC-KR ibm-eucKR csEUCKR # Korean EUC
#ibm-964 EUC-TW ibm-eucTW cns11643 # Taiwan EUC
#ibm-1361 cp949 ksc korean # Korean KSC
ibm-1383 euc-cn euccn ibm-eucCN # China EUC
ibm-1383 EUC-CN ibm-eucCN # China EUC
#ibm-1162 tis-620 cp874 windows-874 ms874 # Thai (w/ euro support) #what is the connection between this and the one below!!!
ibm-874 ibm-1161 #same as 1162 (w/o euro update) ***This is commented out in Helena's
lmb-excp # special exceptions list for LMBCS algorithm
# Platform codepages
ibm-437 ibm437 cp437 csPC8CodePage437 437 # PC US
ibm-437 cp437 csPC8CodePage437 437 # PC US
# HSYS:
ibm-850 IBM850 cp850 850 csPC850Multilingual # PC latin1
ibm-851 IBM851 cp851 851 csPC851 # PC DOS Greek (no euro)
ibm-858 ibm858 cp858 # PC latin1 with Euro cp850 removed
ibm-850 cp850 850 csPC850Multilingual # PC latin1
ibm-851 cp851 851 csPC851 # PC DOS Greek (no euro)
ibm-858 cp858 # PC latin1 with Euro cp850 removed
ibm-9044 852 csPCp852 cp852 # PC latin2 (w/ euro update) #where should the names go here or below - inconsistency!!!
ibm-852 # PC latin2 (w/o euro update)
ibm-872 855 csIBM855 cp855 # PC cyrillic (w/ euro update) #where should the names go here or below - inconsistency!!!
ibm-855 # PC cyrillic (w/o euro update)
ibm-856 ibm856 cp856 # PC Hebrew (old)
ibm-856 cp856 # PC Hebrew (old)
ibm-9049 857 csIBM857 cp857 # PC Latin 5 (Turkish) (w/ euro update) #where should the names go here or below - inconsistency!!!
ibm-857 # PC Latin 5 (w/o euro update)
ibm-859 ibm859 cp859 # PC Latin 9 (w/ euro update)
ibm-860 ibm860 cp860 860 csIBM860 # PC Portugal
ibm-861 ibm861 cp861 861 cp-is csIBM861 # PC Iceland
ibm-867 ibm867 cp867 862 cp862 cspc862latinhebrew # PC Hebrew (w/ euro update) #where should the names go here or below - inconsistency!!!
ibm-862 IBM862 # PC Hebrew (w/o euro update)
ibm-863 ibm863 cp863 863 csIBM863 # PC Canadian French
ibm-859 cp859 # PC Latin 9 (w/ euro update)
ibm-860 cp860 860 csIBM860 # PC Portugal
ibm-861 cp861 861 cp-is csIBM861 # PC Iceland
ibm-867 cp867 862 cp862 cspc862latinhebrew # PC Hebrew (w/ euro update) #where should the names go here or below - inconsistency!!!
ibm-862 # PC Hebrew (w/o euro update)
ibm-863 cp863 863 csIBM863 # PC Canadian French
ibm-17248 cp864 csIBM864 # PC Arabic (w/ euro update) #where should the names go here or below - inconsistency!!!
ibm-864 # PC Arabic (w/o euro update)
ibm-865 ibm865 cp865 865 csIBM865 # PC Nordic
ibm-865 cp865 865 csIBM865 # PC Nordic
ibm-808 cp866 866 csIBM866 # PC Russian (w/ euro update) #where should the names go here or below - inconsistency!!! put IBM866 cp866 866 csIBM866 down
ibm-866 IBM866 # PC Russian (w/o euro update) added IBM866 cp866 866 csIBM866
ibm-868 ibm868 cp868 cp-ar csIBM868 # PC Urdu
ibm-866 # PC Russian (w/o euro update) added IBM866 cp866 866 csIBM866
ibm-868 cp868 cp-ar csIBM868 # PC Urdu
ibm-9061 869 cp-gr csIBM869 cp869 # PC Greek (w/ euro update)
ibm-869 # PC Greek (w/o euro update)
ibm-878 koi8-r ibm878 cp878 koi8 cskoi8r # Russian internet
ibm-878 koi8-r cp878 koi8 cskoi8r # Russian internet
ibm-901 cp921 # PC Baltic (w/ euro update) moved cp921 down
ibm-921 # PC Baltic (w/o euro update) from above
ibm-902 cp922 # PC Estonian (w/ euro update) moved cp922 down
ibm-922 # PC Estonian (w/o euro update) from above
ibm-942 shift_jis78 sjis78 ibm-932 ibm932 # Old s_jis ibm-932 added!
ibm-942 shift_jis78 sjis78 ibm-932 # Old s_jis ibm-932 added!
ibm-1038 Adobe-Symbol-Encoding csHPPSMath symbol
ibm-5346 windows-1250 cp1250 # Windows Latin2 (w/ euro update)
ibm-5347 windows-1251 cp1251 # Windows Cyrillic (w/ euro update)
@ -170,25 +170,25 @@ ibm-21427 cp947 # PC DBCS Big-5 (w/ euro update)
# EBCDIC codepages according to the CDRA
# without Euro
ibm-37 IBM037 ibm-037 cpibm37 ebcdic-cp-ca ebcdic-cp-wt ebcdic-cp-nl csIBM037 cp37 ebcdic-cp-us cp037 # EBCDIC US
ibm-273 IBM273 csIBM273 ebcdic-de cp273 cpibm273 # EBCDIC Germany, Austria...
ibm-277 IBM277 EBCDIC-CP-DK EBCDIC-CP-NO csIBM277 ebcdic-dk cp277 cpibm277 # EBCDIC Denmark...
ibm-278 IBM278 ebcdic-cp-fi ebcdic-cp-se csIBM278 ebcdic-sv cp278 cpibm278 # EBCDIC Sweden
ibm-280 IBM280 ebcdic-cp-it csIBM280 cp280 cpibm280 # EBCDIC Italy
ibm-284 IBM284 ebcdic-cp-es csIBM284 cp284 cpibm284 # EBCDIC Spain
ibm-285 IBM285 ebcdic-cp-gb csIBM285 ebcdic-gb cp285 cpibm285 # EBCDIC UK Ireland
ibm-290 IBM290 EBCDIC-JP-kana csIBM290 cp290 # host SBCS (Katakana)
ibm-297 IBM297 ebcdic-cp-fr csIBM297 cp297 cpibm297 # EBCDIC France
ibm-420 IBM420 ebcdic-cp-ar1 csIBM420 ibm-420 cp420
ibm-424 IBM424 ebcdic-cp-he csIBM424 cp424 ibm-424
ibm-500 IBM500 cpibm500 csIBM500 cp500 ebcdic-cp-be ebcdic-cp-ch # EBCDIC International Latin1
ibm-37 ibm-037 cpibm37 ebcdic-cp-ca ebcdic-cp-wt ebcdic-cp-nl csIBM037 cp37 ebcdic-cp-us cp037 # EBCDIC US
ibm-273 csIBM273 ebcdic-de cp273 cpibm273 # EBCDIC Germany, Austria...
ibm-277 EBCDIC-CP-DK EBCDIC-CP-NO csIBM277 ebcdic-dk cp277 cpibm277 # EBCDIC Denmark...
ibm-278 ebcdic-cp-fi ebcdic-cp-se csIBM278 ebcdic-sv cp278 cpibm278 # EBCDIC Sweden
ibm-280 ebcdic-cp-it csIBM280 cp280 cpibm280 # EBCDIC Italy
ibm-284 ebcdic-cp-es csIBM284 cp284 cpibm284 # EBCDIC Spain
ibm-285 ebcdic-cp-gb csIBM285 ebcdic-gb cp285 cpibm285 # EBCDIC UK Ireland
ibm-290 EBCDIC-JP-kana csIBM290 cp290 # host SBCS (Katakana)
ibm-297 ebcdic-cp-fr csIBM297 cp297 cpibm297 # EBCDIC France
ibm-420 ebcdic-cp-ar1 csIBM420 cp420
ibm-424 ebcdic-cp-he csIBM424 cp424
ibm-500 cpibm500 csIBM500 cp500 ebcdic-cp-be ebcdic-cp-ch # EBCDIC International Latin1
ibm-803 cp803 # Old EBCDIC Hebrew
ibm-834 cp834 # Korean DBCS Host
ibm-835 cp835 # DBCS T-Ch Host
ibm-871 IBM871 ebcdic-cp-is csIBM871 cpibm871 cp871 # EBCDIC Iceland
ibm-871 ebcdic-cp-is csIBM871 cpibm871 cp871 # EBCDIC Iceland
ibm-930 cp930 cpibm930 # Japan EBCDIC MIXED
ibm-933 ibm933 cp933 cpibm933 # Korea EBCDIC MIXED
ibm-935 ibm935 cp935 cpibm935 # China EBCDIC MIXED
ibm-933 cp933 cpibm933 # Korea EBCDIC MIXED
ibm-935 cp935 cpibm935 # China EBCDIC MIXED
ibm-937 cp937 cpibm937 # Taiwan EBCDIC MIXED
ibm-939 cp939 # Host MBCS (Latin-Kanji)
#ibm-1046 # PC Arabic without EURO
@ -197,17 +197,17 @@ ibm-1390 cpibm1390 # Japan EBCDIC MIXED
ibm-1371 cpibm1371 # Taiwan EBCDIC MIXED
ibm-1047 cpibm1047 # EBCDIC Open systems Latin1
ibm-1123 cpibm1123 # Cyrillic Ukraine EBCDIC
ibm-1140 cpibm1140 ibm1140 # EBCDIC US...
ibm-1141 cpibm1141 ibm1141 # EBCDIC Germany, Austria...
ibm-1142 cpibm1142 ibm1142 # EBCDIC Denmark...
ibm-1143 cpibm1143 ibm1143 # EBCDIC Sweden
ibm-1144 cpibm1144 ibm1144 # EBCDIC Italy
ibm-1145 cpibm1145 ibm1145 # EBCDIC Spain
ibm-1146 cpibm1146 ibm1146 # EBCDIC UK Ireland
ibm-1147 cpibm1147 ibm1147 # EBCDIC France
ibm-1148 cpibm1148 ibm1148 # EBCDIC International Latin1
ibm-1149 cpibm1149 ibm1149 ebcdic-is # EBCDIC Iceland
ibm-1153 cpibm1153 ibm1153 # EBCDIC latin 2
ibm-1140 cpibm1140 # EBCDIC US...
ibm-1141 cpibm1141 # EBCDIC Germany, Austria...
ibm-1142 cpibm1142 # EBCDIC Denmark...
ibm-1143 cpibm1143 # EBCDIC Sweden
ibm-1144 cpibm1144 # EBCDIC Italy
ibm-1145 cpibm1145 # EBCDIC Spain
ibm-1146 cpibm1146 # EBCDIC UK Ireland
ibm-1147 cpibm1147 # EBCDIC France
ibm-1148 cpibm1148 # EBCDIC International Latin1
ibm-1149 cpibm1149 ebcdic-is # EBCDIC Iceland
ibm-1153 cpibm1153 # EBCDIC latin 2
ibm-1154 cp1025 cpibm1154 # EBCDIC Cyrillic Multilingual
ibm-1155 IBM1026 csIBM1026 cp1026 cpibm1155 # EBCDIC Turkey
ibm-1156 cp1112 cpibm1156 # EBCDIC Baltic Multilingual
@ -225,9 +225,9 @@ ibm-4899 cpibm4899 # Old EBCDIC Hebrew
ibm-4971 cp875 cpibm4971 # EBCDIC Greek
ibm-9027 # DBCS T-Ch Host
ibm-5123 cp1027 # Host Roman Jis
ibm-12712 cpibm12712 ibm12712 ebcdic-he # EBCDIC Hebrew (new sheqel, control characters update)
ibm-12712 cpibm12712 ebcdic-he # EBCDIC Hebrew (new sheqel, control characters update)
ibm-16684 cp300 # Jis + Roman Jis Host
ibm-16804 cpibm16804 ibm16804 ebcdic-ar # EBCDIC Arabic
ibm-16804 cpibm16804 ebcdic-ar # EBCDIC Arabic
# unsupported IANA names
# ebcdic-us
@ -240,20 +240,20 @@ ibm-16804 cpibm16804 ibm16804 ebcdic-ar # EBCDIC Arabic
# EBCDIC codepages for S/390, with LF and NL codes swapped
# without Euro
ibm-37-s390 ibm037-s390 # EBCDIC US
ibm-1047-s390 ibm1047-s390 # EBCDIC for S/390 Open Edition
# with Euro
ibm-1140-s390 ibm1140-s390 # EBCDIC US
ibm-1142-s390 ibm1142-s390 # EBCDIC Denmark
ibm-1143-s390 ibm1143-s390 # EBCDIC Sweden
ibm-1144-s390 ibm1144-s390 # EBCDIC Italy
ibm-1145-s390 ibm1145-s390 # EBCDIC Spain
ibm-1146-s390 ibm1146-s390 # EBCDIC UK Ireland
ibm-1147-s390 ibm1147-s390 # EBCDIC France
ibm-1148-s390 ibm1148-s390 # EBCDIC International Latin1
ibm-1149-s390 ibm1149-s390 # EBCDIC Iceland
ibm-1153-s390 ibm1153-s390 # EBCDIC latin 2
ibm-12712-s390 ibm12712-s390 # EBCDIC Hebrew
ibm-16804-s390 ibm16804-s390 # EBCDIC Arabic
ibm-37-s390 ibm037-s390 # EBCDIC US
ibm-1047-s390 # EBCDIC for S/390 Open Edition
# with Euro
ibm-1140-s390 # EBCDIC US
ibm-1142-s390 # EBCDIC Denmark
ibm-1143-s390 # EBCDIC Sweden
ibm-1144-s390 # EBCDIC Italy
ibm-1145-s390 # EBCDIC Spain
ibm-1146-s390 # EBCDIC UK Ireland
ibm-1147-s390 # EBCDIC France
ibm-1148-s390 # EBCDIC International Latin1
ibm-1149-s390 # EBCDIC Iceland
ibm-1153-s390 # EBCDIC latin 2
ibm-12712-s390 # EBCDIC Hebrew
ibm-16804-s390 # EBCDIC Arabic