ICU-3346 add ibm-971
X-SVN-Rev: 13657
This commit is contained in:
parent
2e6b59aa7d
commit
21f41ac624
@ -538,7 +538,7 @@ ibm-949_P11A-1999 { UTR22* }
|
||||
# The following aliases try to mirror the poor state of alias recognition
|
||||
# on these platforms.
|
||||
#
|
||||
# ibm-970 is a almost a subset of ibm-1363.
|
||||
# ibm-970 is almost a subset of ibm-1363.
|
||||
# Java, Solaris and AIX use euc-kr to also mean ksc5601.
|
||||
ibm-970_P110-1995 { UTR22* }
|
||||
ibm-970 { IBM* }
|
||||
@ -547,6 +547,10 @@ ibm-970_P110-1995 { UTR22* }
|
||||
ibm-eucKR { JAVA }
|
||||
csEUCKR { IANA WINDOWS } # x-euc-kr is also a MIME name
|
||||
ibm-970_VPUA
|
||||
|
||||
# ibm-971 is almost the set of DBCS mappings of ibm-970
|
||||
ibm-971_P100-1995 ibm-971 { IBM* } ibm-971_VPUA
|
||||
|
||||
# Java, Solaris and AIX use euc-kr to also mean ksc5601, and _sometimes_ for Windows too.
|
||||
# ibm-1363 is almost a superset of ibm-970.
|
||||
ibm-1363_P11B-1998 { UTR22* }
|
||||
|
@ -164,8 +164,6 @@ CHARMAP
|
||||
<U008B> \x8B |0
|
||||
<U008C> \x8C |0
|
||||
<U008D> \x8D |0
|
||||
<U008E> \x1A |2
|
||||
<U008F> \x1A |2
|
||||
<U0090> \x90 |0
|
||||
<U0091> \x91 |0
|
||||
<U0092> \x92 |0
|
||||
@ -182,102 +180,35 @@ CHARMAP
|
||||
<U009D> \x9D |0
|
||||
<U009E> \x9E |0
|
||||
<U009F> \x9F |0
|
||||
<U00A0> \x1A |2
|
||||
<U00A1> \xA2\xAE |0
|
||||
<U00A2> \x1A |2
|
||||
<U00A3> \x1A |2
|
||||
<U00A4> \xA2\xB4 |0
|
||||
<U00A5> \x1A |2
|
||||
<U00A6> \x1A |2
|
||||
<U00A7> \xA1\xD7 |0
|
||||
<U00A8> \xA1\xA7 |0
|
||||
<U00A9> \x1A |2
|
||||
<U00AA> \xA8\xA3 |0
|
||||
<U00AB> \x1A |2
|
||||
<U00AC> \x1A |2
|
||||
<U00AD> \xA1\xA9 |1
|
||||
<U00AE> \x1A |2
|
||||
<U00AF> \x1A |2
|
||||
<U00B0> \xA1\xC6 |0
|
||||
<U00B1> \xA1\xBE |0
|
||||
<U00B2> \xA9\xF7 |0
|
||||
<U00B3> \xA9\xF8 |0
|
||||
<U00B4> \xA2\xA5 |0
|
||||
<U00B5> \x1A |2
|
||||
<U00B6> \xA2\xD2 |0
|
||||
<U00B7> \xA1\xA4 |1
|
||||
<U00B8> \xA2\xAC |0
|
||||
<U00B9> \xA9\xF6 |0
|
||||
<U00BA> \xA8\xAC |0
|
||||
<U00BB> \x1A |2
|
||||
<U00BC> \xA8\xF9 |0
|
||||
<U00BD> \xA8\xF6 |0
|
||||
<U00BE> \xA8\xFA |0
|
||||
<U00BF> \xA2\xAF |0
|
||||
<U00C0> \x1A |2
|
||||
<U00C1> \x1A |2
|
||||
<U00C2> \x1A |2
|
||||
<U00C3> \x1A |2
|
||||
<U00C4> \x1A |2
|
||||
<U00C5> \x1A |2
|
||||
<U00C6> \xA8\xA1 |0
|
||||
<U00C7> \x1A |2
|
||||
<U00C8> \x1A |2
|
||||
<U00C9> \x1A |2
|
||||
<U00CA> \x1A |2
|
||||
<U00CB> \x1A |2
|
||||
<U00CC> \x1A |2
|
||||
<U00CD> \x1A |2
|
||||
<U00CE> \x1A |2
|
||||
<U00CF> \x1A |2
|
||||
<U00D0> \xA8\xA2 |0
|
||||
<U00D1> \x1A |2
|
||||
<U00D2> \x1A |2
|
||||
<U00D3> \x1A |2
|
||||
<U00D4> \x1A |2
|
||||
<U00D5> \x1A |2
|
||||
<U00D6> \x1A |2
|
||||
<U00D7> \xA1\xBF |0
|
||||
<U00D8> \xA8\xAA |0
|
||||
<U00D9> \x1A |2
|
||||
<U00DA> \x1A |2
|
||||
<U00DB> \x1A |2
|
||||
<U00DC> \x1A |2
|
||||
<U00DD> \x1A |2
|
||||
<U00DE> \xA8\xAD |0
|
||||
<U00DF> \xA9\xAC |0
|
||||
<U00E0> \x1A |2
|
||||
<U00E1> \x1A |2
|
||||
<U00E2> \x1A |2
|
||||
<U00E3> \x1A |2
|
||||
<U00E4> \x1A |2
|
||||
<U00E5> \x1A |2
|
||||
<U00E6> \xA9\xA1 |0
|
||||
<U00E7> \x1A |2
|
||||
<U00E8> \x1A |2
|
||||
<U00E9> \x1A |2
|
||||
<U00EA> \x1A |2
|
||||
<U00EB> \x1A |2
|
||||
<U00EC> \x1A |2
|
||||
<U00ED> \x1A |2
|
||||
<U00EE> \x1A |2
|
||||
<U00EF> \x1A |2
|
||||
<U00F0> \xA9\xA3 |0
|
||||
<U00F1> \x1A |2
|
||||
<U00F2> \x1A |2
|
||||
<U00F3> \x1A |2
|
||||
<U00F4> \x1A |2
|
||||
<U00F5> \x1A |2
|
||||
<U00F6> \x1A |2
|
||||
<U00F7> \xA1\xC0 |0
|
||||
<U00F8> \xA9\xAA |0
|
||||
<U00F9> \x1A |2
|
||||
<U00FA> \x1A |2
|
||||
<U00FB> \x1A |2
|
||||
<U00FC> \x1A |2
|
||||
<U00FD> \x1A |2
|
||||
<U00FE> \xA9\xAD |0
|
||||
<U00FF> \x1A |2
|
||||
<U0111> \xA9\xA2 |0
|
||||
<U0126> \xA8\xA4 |0
|
||||
<U0127> \xA9\xA4 |0
|
||||
@ -420,7 +351,6 @@ CHARMAP
|
||||
<U0451> \xAC\xD7 |0
|
||||
<U2010> \xA1\xA9 |0
|
||||
<U2014> \xA1\xAA |0
|
||||
<U2015> \xA1\xAA |1
|
||||
<U2018> \xA1\xAE |0
|
||||
<U2019> \xA1\xAF |0
|
||||
<U201C> \xA1\xB0 |0
|
||||
@ -433,7 +363,6 @@ CHARMAP
|
||||
<U2032> \xA1\xC7 |0
|
||||
<U2033> \xA1\xC8 |0
|
||||
<U203B> \xA1\xD8 |0
|
||||
<U203E> \x1A |2
|
||||
<U2074> \xA9\xF9 |0
|
||||
<U207F> \xA9\xFA |0
|
||||
<U2081> \xA9\xFB |0
|
||||
@ -509,7 +438,6 @@ CHARMAP
|
||||
<U222E> \xA2\xB1 |0
|
||||
<U2234> \xA1\xC5 |0
|
||||
<U2235> \xA1\xF1 |0
|
||||
<U223C> \xA1\xAD |1
|
||||
<U223D> \xA1\xEF |0
|
||||
<U2252> \xA1\xD6 |0
|
||||
<U2260> \xA1\xC1 |0
|
||||
@ -522,7 +450,6 @@ CHARMAP
|
||||
<U2283> \xA1\xF9 |0
|
||||
<U2286> \xA1\xF6 |0
|
||||
<U2287> \xA1\xF7 |0
|
||||
<U2299> \xA2\xC1 |1
|
||||
<U22A5> \xA1\xD1 |0
|
||||
<U2312> \xA1\xD2 |0
|
||||
<U2460> \xA8\xE7 |0
|
||||
@ -8660,6 +8587,88 @@ CHARMAP
|
||||
<UFF5B> \xA3\xFB |0
|
||||
<UFF5C> \xA3\xFC |0
|
||||
<UFF5D> \xA3\xFD |0
|
||||
<UFFE0> \xA1\xCB |0
|
||||
<UFFE1> \xA1\xCC |0
|
||||
<UFFE2> \xA1\xFE |0
|
||||
<UFFE3> \xA3\xFE |0
|
||||
<UFFE5> \xA1\xCD |0
|
||||
<UFFE6> \xA3\xDC |0
|
||||
END CHARMAP
|
||||
|
||||
CHARMAP
|
||||
<U008E> \x1A |2
|
||||
<U008F> \x1A |2
|
||||
<U00A0> \x1A |2
|
||||
<U00A2> \x1A |2
|
||||
<U00A3> \x1A |2
|
||||
<U00A5> \x1A |2
|
||||
<U00A6> \x1A |2
|
||||
<U00A9> \x1A |2
|
||||
<U00AB> \x1A |2
|
||||
<U00AC> \x1A |2
|
||||
<U00AD> \xA1\xA9 |1
|
||||
<U00AE> \x1A |2
|
||||
<U00AF> \x1A |2
|
||||
<U00B5> \x1A |2
|
||||
<U00B7> \xA1\xA4 |1
|
||||
<U00BB> \x1A |2
|
||||
<U00C0> \x1A |2
|
||||
<U00C1> \x1A |2
|
||||
<U00C2> \x1A |2
|
||||
<U00C3> \x1A |2
|
||||
<U00C4> \x1A |2
|
||||
<U00C5> \x1A |2
|
||||
<U00C7> \x1A |2
|
||||
<U00C8> \x1A |2
|
||||
<U00C9> \x1A |2
|
||||
<U00CA> \x1A |2
|
||||
<U00CB> \x1A |2
|
||||
<U00CC> \x1A |2
|
||||
<U00CD> \x1A |2
|
||||
<U00CE> \x1A |2
|
||||
<U00CF> \x1A |2
|
||||
<U00D1> \x1A |2
|
||||
<U00D2> \x1A |2
|
||||
<U00D3> \x1A |2
|
||||
<U00D4> \x1A |2
|
||||
<U00D5> \x1A |2
|
||||
<U00D6> \x1A |2
|
||||
<U00D9> \x1A |2
|
||||
<U00DA> \x1A |2
|
||||
<U00DB> \x1A |2
|
||||
<U00DC> \x1A |2
|
||||
<U00DD> \x1A |2
|
||||
<U00E0> \x1A |2
|
||||
<U00E1> \x1A |2
|
||||
<U00E2> \x1A |2
|
||||
<U00E3> \x1A |2
|
||||
<U00E4> \x1A |2
|
||||
<U00E5> \x1A |2
|
||||
<U00E7> \x1A |2
|
||||
<U00E8> \x1A |2
|
||||
<U00E9> \x1A |2
|
||||
<U00EA> \x1A |2
|
||||
<U00EB> \x1A |2
|
||||
<U00EC> \x1A |2
|
||||
<U00ED> \x1A |2
|
||||
<U00EE> \x1A |2
|
||||
<U00EF> \x1A |2
|
||||
<U00F1> \x1A |2
|
||||
<U00F2> \x1A |2
|
||||
<U00F3> \x1A |2
|
||||
<U00F4> \x1A |2
|
||||
<U00F5> \x1A |2
|
||||
<U00F6> \x1A |2
|
||||
<U00F9> \x1A |2
|
||||
<U00FA> \x1A |2
|
||||
<U00FB> \x1A |2
|
||||
<U00FC> \x1A |2
|
||||
<U00FD> \x1A |2
|
||||
<U00FF> \x1A |2
|
||||
<U2015> \xA1\xAA |1
|
||||
<U203E> \x1A |2
|
||||
<U223C> \xA1\xAD |1
|
||||
<U2299> \xA2\xC1 |1
|
||||
<UFF5E> \xA2\xA6 |1
|
||||
<UFFA0> \x1A |2
|
||||
<UFFA1> \x1A |2
|
||||
@ -8713,10 +8722,4 @@ CHARMAP
|
||||
<UFFDA> \x1A |2
|
||||
<UFFDB> \x1A |2
|
||||
<UFFDC> \x1A |2
|
||||
<UFFE0> \xA1\xCB |0
|
||||
<UFFE1> \xA1\xCC |0
|
||||
<UFFE2> \xA1\xFE |0
|
||||
<UFFE3> \xA3\xFE |0
|
||||
<UFFE5> \xA1\xCD |0
|
||||
<UFFE6> \xA3\xDC |0
|
||||
END CHARMAP
|
||||
|
8438
icu4c/source/data/mappings/ibm-971_P100-1995.ucm
Normal file
8438
icu4c/source/data/mappings/ibm-971_P100-1995.ucm
Normal file
File diff suppressed because it is too large
Load Diff
@ -83,6 +83,7 @@ ibm-943_P130-1999.ucm\
|
||||
ibm-949_P110-1999.ucm\
|
||||
ibm-950_P110-1999.ucm\
|
||||
ibm-964_P110-1999.ucm\
|
||||
ibm-971_P100-1995.ucm\
|
||||
ibm-1363_P110-1997.ucm\
|
||||
ibm-1381_P110-1999.ucm\
|
||||
ibm-33722_P120-1999.ucm\
|
||||
|
39
icu4c/source/test/testdata/conversion.txt
vendored
39
icu4c/source/test/testdata/conversion.txt
vendored
@ -44,6 +44,22 @@ conversion {
|
||||
Headers { "charset", "bytes", "unicode", "offsets", "flush", "fallbacks", "errorCode", "callback", "invalidChars" }
|
||||
Cases {
|
||||
// DBCS-only extensions
|
||||
{
|
||||
"ibm-970",
|
||||
:bin{ 617eece9b2eb },
|
||||
"\x61\x7e\u4e00\ub000",
|
||||
:intvector{ 0, 1, 2, 4 },
|
||||
:int{1}, :int{1}, "", "?", :bin{""}
|
||||
}
|
||||
|
||||
{
|
||||
"ibm-971",
|
||||
:bin{ 617eece9b2eb },
|
||||
"\ufffd\u4e00\ub000",
|
||||
:intvector{ 0, 2, 4 },
|
||||
:int{1}, :int{1}, "", "?", :bin{""}
|
||||
}
|
||||
|
||||
{
|
||||
"ibm-16684",
|
||||
:bin{ 430e4395ecc1404042e1 },
|
||||
@ -162,6 +178,22 @@ conversion {
|
||||
Headers { "charset", "unicode", "bytes", "offsets", "flush", "fallbacks", "errorCode", "callback", "invalidUChars" }
|
||||
Cases {
|
||||
// DBCS-only extensions
|
||||
{
|
||||
"ibm-970",
|
||||
"\x61\uffa1\u2015\ub000",
|
||||
:bin{ 611aa1aab2eb },
|
||||
:intvector{ 0, 1, 2, 2, 3, 3 },
|
||||
:int{1}, :int{1}, "", "?", ""
|
||||
}
|
||||
|
||||
{
|
||||
"ibm-971",
|
||||
"\x61\uffa1\u2015\ub000",
|
||||
:bin{ affeaffeaffeb2eb },
|
||||
:intvector{ 0, 0, 1, 1, 2, 2, 3, 3 },
|
||||
:int{1}, :int{1}, "", "?", ""
|
||||
}
|
||||
|
||||
{
|
||||
"ibm-1390,swaplfnl",
|
||||
"\uff63\u30C8\u30C8\u309A\u3000\x41\u20ac\x0a",
|
||||
@ -339,6 +371,13 @@ conversion {
|
||||
Headers { "charset", "map", "mapnot", "which" }
|
||||
Cases {
|
||||
// DBCS-only
|
||||
{
|
||||
"ibm-971",
|
||||
"[\xa1\xa4\uac01\ub000]",
|
||||
"[\x00-\x9f\u2015]",
|
||||
:int{0}
|
||||
}
|
||||
|
||||
{
|
||||
"ibm-16684",
|
||||
"[\xa0\xa1\xa4\xa6-\xab\xad-\u017f\u0254\u309b-\u30ff\u4e00-\u4e05\U00023d00\U000243bc\U0002a6b2"
|
||||
|
Loading…
Reference in New Issue
Block a user