mirror of
https://sourceware.org/git/glibc.git
synced 2024-11-21 20:40:05 +00:00
Bug 25819: Update to Unicode 13.0.0
Unicode 13.0.0 Support: Character encoding, character type info, and transliteration tables are all updated to Unicode 13.0.0, using the generator scripts contributed by Mike FABIAN (Red Hat). Total added characters in newly generated CHARMAP: 5930. Total added characters in newly generated WIDTH: 5536.
This commit is contained in:
parent
0798b8ecc8
commit
8645f62469
6
NEWS
6
NEWS
@ -9,7 +9,11 @@ Version 2.32
|
||||
|
||||
Major new features:
|
||||
|
||||
* New locale added: ckb_IQ (Kurdish/Sorani spoken in Iraq)
|
||||
* Unicode 12.1.0 Support: Character encoding, character type info, and
|
||||
transliteration tables are all updated to Unicode 12.1.0, using
|
||||
generator scripts contributed by Mike FABIAN (Red Hat).
|
||||
|
||||
* New locale added: ckb_IQ (Kurdish/Sorani spoken in Iraq)
|
||||
|
||||
* The GNU C Library now loads audit modules listed in the DT_AUDIT and
|
||||
DT_DEPAUDIT dynamic section entries of the main executable.
|
||||
|
File diff suppressed because it is too large
Load Diff
File diff suppressed because it is too large
Load Diff
File diff suppressed because it is too large
Load Diff
@ -9,7 +9,7 @@ comment_char %
|
||||
% otherwise be governed by that license.
|
||||
|
||||
% Transliterations of encircled characters.
|
||||
% Generated automatically from UnicodeData.txt by gen_translit_circle.py on 2019-05-08 for Unicode 12.1.0.
|
||||
% Generated automatically from UnicodeData.txt by gen_translit_circle.py on 2020-04-14 for Unicode 13.0.0.
|
||||
|
||||
LC_CTYPE
|
||||
|
||||
|
@ -9,7 +9,7 @@ comment_char %
|
||||
% otherwise be governed by that license.
|
||||
|
||||
% Transliterations of CJK compatibility characters.
|
||||
% Generated automatically from UnicodeData.txt by gen_translit_cjk_compat.py on 2019-05-08 for Unicode 12.1.0.
|
||||
% Generated automatically from UnicodeData.txt by gen_translit_cjk_compat.py on 2020-04-14 for Unicode 13.0.0.
|
||||
|
||||
LC_CTYPE
|
||||
|
||||
|
@ -10,7 +10,7 @@ comment_char %
|
||||
|
||||
% Transliterations that remove all combining characters (accents,
|
||||
% pronunciation marks, etc.).
|
||||
% Generated automatically from UnicodeData.txt by gen_translit_combining.py on 2019-05-08 for Unicode 12.1.0.
|
||||
% Generated automatically from UnicodeData.txt by gen_translit_combining.py on 2020-04-14 for Unicode 13.0.0.
|
||||
|
||||
LC_CTYPE
|
||||
|
||||
@ -564,6 +564,10 @@ translit_start
|
||||
<U1ABD> ""
|
||||
% COMBINING PARENTHESES OVERLAY
|
||||
<U1ABE> ""
|
||||
% COMBINING LATIN SMALL LETTER W BELOW
|
||||
<U1ABF> ""
|
||||
% COMBINING LATIN SMALL LETTER TURNED W BELOW
|
||||
<U1AC0> ""
|
||||
% COMBINING DOTTED GRAVE ACCENT
|
||||
<U1DC0> ""
|
||||
% COMBINING DOTTED ACUTE ACCENT
|
||||
@ -810,6 +814,10 @@ translit_start
|
||||
<U00010D26> ""
|
||||
% HANIFI ROHINGYA SIGN TASSI
|
||||
<U00010D27> ""
|
||||
% YEZIDI COMBINING HAMZA MARK
|
||||
<U00010EAB> ""
|
||||
% YEZIDI COMBINING MADDA MARK
|
||||
<U00010EAC> ""
|
||||
% SOGDIAN COMBINING DOT BELOW
|
||||
<U00010F46> ""
|
||||
% SOGDIAN COMBINING TWO DOTS BELOW
|
||||
@ -902,6 +910,36 @@ translit_start
|
||||
<U00011839> ""
|
||||
% DOGRA SIGN NUKTA
|
||||
<U0001183A> ""
|
||||
% DIVES AKURU VOWEL SIGN AA
|
||||
<U00011930> ""
|
||||
% DIVES AKURU VOWEL SIGN I
|
||||
<U00011931> ""
|
||||
% DIVES AKURU VOWEL SIGN II
|
||||
<U00011932> ""
|
||||
% DIVES AKURU VOWEL SIGN U
|
||||
<U00011933> ""
|
||||
% DIVES AKURU VOWEL SIGN UU
|
||||
<U00011934> ""
|
||||
% DIVES AKURU VOWEL SIGN E
|
||||
<U00011935> ""
|
||||
% DIVES AKURU VOWEL SIGN AI
|
||||
<U00011937> ""
|
||||
% DIVES AKURU VOWEL SIGN O
|
||||
<U00011938> ""
|
||||
% DIVES AKURU SIGN ANUSVARA
|
||||
<U0001193B> ""
|
||||
% DIVES AKURU SIGN CANDRABINDU
|
||||
<U0001193C> ""
|
||||
% DIVES AKURU SIGN HALANTA
|
||||
<U0001193D> ""
|
||||
% DIVES AKURU VIRAMA
|
||||
<U0001193E> ""
|
||||
% DIVES AKURU MEDIAL YA
|
||||
<U00011940> ""
|
||||
% DIVES AKURU MEDIAL RA
|
||||
<U00011942> ""
|
||||
% DIVES AKURU SIGN NUKTA
|
||||
<U00011943> ""
|
||||
% NANDINAGARI VOWEL SIGN AA
|
||||
<U000119D1> ""
|
||||
% NANDINAGARI VOWEL SIGN I
|
||||
@ -1200,6 +1238,12 @@ translit_start
|
||||
<U00011EF5> ""
|
||||
% MAKASAR VOWEL SIGN O
|
||||
<U00011EF6> ""
|
||||
% KHITAN SMALL SCRIPT FILLER
|
||||
<U00016FE4> ""
|
||||
% VIETNAMESE ALTERNATE READING MARK CA
|
||||
<U00016FF0> ""
|
||||
% VIETNAMESE ALTERNATE READING MARK NHAY
|
||||
<U00016FF1> ""
|
||||
% COMBINING GREEK MUSICAL TRISEME
|
||||
<U0001D242> ""
|
||||
% COMBINING GREEK MUSICAL TETRASEME
|
||||
|
@ -9,7 +9,7 @@ comment_char %
|
||||
% otherwise be governed by that license.
|
||||
|
||||
% Transliterations of compatibility characters and ligatures.
|
||||
% Generated automatically from UnicodeData.txt by gen_translit_compat.py on 2019-05-08 for Unicode 12.1.0.
|
||||
% Generated automatically from UnicodeData.txt by gen_translit_compat.py on 2020-04-14 for Unicode 13.0.0.
|
||||
|
||||
LC_CTYPE
|
||||
|
||||
@ -1691,6 +1691,8 @@ translit_start
|
||||
<UAB5E> "<U026B>"
|
||||
% MODIFIER LETTER SMALL U WITH LEFT HOOK
|
||||
<UAB5F> "<UAB52>"
|
||||
% MODIFIER LETTER SMALL TURNED W
|
||||
<UAB69> "<U028D>"
|
||||
% LATIN SMALL LIGATURE FF
|
||||
<UFB00> "<U0066><U0066>"
|
||||
% LATIN SMALL LIGATURE FI
|
||||
|
@ -9,7 +9,7 @@ comment_char %
|
||||
% otherwise be governed by that license.
|
||||
|
||||
% Transliterations of font equivalents.
|
||||
% Generated automatically from UnicodeData.txt by gen_translit_font.py on 2019-05-08 for Unicode 12.1.0.
|
||||
% Generated automatically from UnicodeData.txt by gen_translit_font.py on 2020-04-14 for Unicode 13.0.0.
|
||||
|
||||
LC_CTYPE
|
||||
|
||||
@ -1199,6 +1199,16 @@ translit_start
|
||||
<U0001EEB9> <U0636> % ARABIC MATHEMATICAL DOUBLE-STRUCK DAD
|
||||
<U0001EEBA> <U0638> % ARABIC MATHEMATICAL DOUBLE-STRUCK ZAH
|
||||
<U0001EEBB> <U063A> % ARABIC MATHEMATICAL DOUBLE-STRUCK GHAIN
|
||||
<U0001FBF0> <U0030> % SEGMENTED DIGIT ZERO
|
||||
<U0001FBF1> <U0031> % SEGMENTED DIGIT ONE
|
||||
<U0001FBF2> <U0032> % SEGMENTED DIGIT TWO
|
||||
<U0001FBF3> <U0033> % SEGMENTED DIGIT THREE
|
||||
<U0001FBF4> <U0034> % SEGMENTED DIGIT FOUR
|
||||
<U0001FBF5> <U0035> % SEGMENTED DIGIT FIVE
|
||||
<U0001FBF6> <U0036> % SEGMENTED DIGIT SIX
|
||||
<U0001FBF7> <U0037> % SEGMENTED DIGIT SEVEN
|
||||
<U0001FBF8> <U0038> % SEGMENTED DIGIT EIGHT
|
||||
<U0001FBF9> <U0039> % SEGMENTED DIGIT NINE
|
||||
|
||||
translit_end
|
||||
|
||||
|
@ -9,7 +9,7 @@ comment_char %
|
||||
% otherwise be governed by that license.
|
||||
|
||||
% Transliterations of fractions.
|
||||
% Generated automatically from UnicodeData.txt by gen_translit_fraction.py on 2019-05-08 for Unicode 12.1.0.
|
||||
% Generated automatically from UnicodeData.txt by gen_translit_fraction.py on 2020-04-14 for Unicode 13.0.0.
|
||||
% The replacements have been surrounded with spaces, because fractions are
|
||||
% often preceded by a decimal number and followed by a unit or a math symbol.
|
||||
|
||||
|
File diff suppressed because it is too large
Load Diff
@ -1,6 +1,6 @@
|
||||
# EastAsianWidth-12.1.0.txt
|
||||
# Date: 2019-03-31, 22:01:58 GMT [KW, LI]
|
||||
# © 2019 Unicode®, Inc.
|
||||
# EastAsianWidth-13.0.0.txt
|
||||
# Date: 2020-01-21, 18:14:00 GMT [KW, LI]
|
||||
# © 2020 Unicode®, Inc.
|
||||
# Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries.
|
||||
# For terms of use, see http://www.unicode.org/terms_of_use.html
|
||||
#
|
||||
@ -9,7 +9,7 @@
|
||||
#
|
||||
# East_Asian_Width Property
|
||||
#
|
||||
# This file is an informative contributory data file in the
|
||||
# This file is a normative contributory data file in the
|
||||
# Unicode Character Database.
|
||||
#
|
||||
# The format is two fields separated by a semicolon.
|
||||
@ -332,7 +332,7 @@
|
||||
085E;N # Po MANDAIC PUNCTUATION
|
||||
0860..086A;N # Lo [11] SYRIAC LETTER MALAYALAM NGA..SYRIAC LETTER MALAYALAM SSA
|
||||
08A0..08B4;N # Lo [21] ARABIC LETTER BEH WITH SMALL V BELOW..ARABIC LETTER KAF WITH DOT BELOW
|
||||
08B6..08BD;N # Lo [8] ARABIC LETTER BEH WITH SMALL MEEM ABOVE..ARABIC LETTER AFRICAN NOON
|
||||
08B6..08C7;N # Lo [18] ARABIC LETTER BEH WITH SMALL MEEM ABOVE..ARABIC LETTER LAM WITH SMALL ARABIC LETTER TAH ABOVE
|
||||
08D3..08E1;N # Mn [15] ARABIC SMALL LOW WAW..ARABIC SMALL HIGH SIGN SAFHA
|
||||
08E2;N # Cf ARABIC DISPUTED END OF AYAH
|
||||
08E3..08FF;N # Mn [29] ARABIC TURNED DAMMA BELOW..ARABIC MARK SIDEWAYS NOON GHUNNA
|
||||
@ -450,7 +450,7 @@
|
||||
0B47..0B48;N # Mc [2] ORIYA VOWEL SIGN E..ORIYA VOWEL SIGN AI
|
||||
0B4B..0B4C;N # Mc [2] ORIYA VOWEL SIGN O..ORIYA VOWEL SIGN AU
|
||||
0B4D;N # Mn ORIYA SIGN VIRAMA
|
||||
0B56;N # Mn ORIYA AI LENGTH MARK
|
||||
0B55..0B56;N # Mn [2] ORIYA SIGN OVERLINE..ORIYA AI LENGTH MARK
|
||||
0B57;N # Mc ORIYA AU LENGTH MARK
|
||||
0B5C..0B5D;N # Lo [2] ORIYA LETTER RRA..ORIYA LETTER RHA
|
||||
0B5F..0B61;N # Lo [3] ORIYA LETTER YYA..ORIYA LETTER VOCALIC LL
|
||||
@ -529,7 +529,7 @@
|
||||
0CF1..0CF2;N # Lo [2] KANNADA SIGN JIHVAMULIYA..KANNADA SIGN UPADHMANIYA
|
||||
0D00..0D01;N # Mn [2] MALAYALAM SIGN COMBINING ANUSVARA ABOVE..MALAYALAM SIGN CANDRABINDU
|
||||
0D02..0D03;N # Mc [2] MALAYALAM SIGN ANUSVARA..MALAYALAM SIGN VISARGA
|
||||
0D05..0D0C;N # Lo [8] MALAYALAM LETTER A..MALAYALAM LETTER VOCALIC L
|
||||
0D04..0D0C;N # Lo [9] MALAYALAM LETTER VEDIC ANUSVARA..MALAYALAM LETTER VOCALIC L
|
||||
0D0E..0D10;N # Lo [3] MALAYALAM LETTER E..MALAYALAM LETTER AI
|
||||
0D12..0D3A;N # Lo [41] MALAYALAM LETTER O..MALAYALAM LETTER TTTA
|
||||
0D3B..0D3C;N # Mn [2] MALAYALAM SIGN VERTICAL BAR VIRAMA..MALAYALAM SIGN CIRCULAR VIRAMA
|
||||
@ -550,6 +550,7 @@
|
||||
0D70..0D78;N # No [9] MALAYALAM NUMBER TEN..MALAYALAM FRACTION THREE SIXTEENTHS
|
||||
0D79;N # So MALAYALAM DATE MARK
|
||||
0D7A..0D7F;N # Lo [6] MALAYALAM LETTER CHILLU NN..MALAYALAM LETTER CHILLU K
|
||||
0D81;N # Mn SINHALA SIGN CANDRABINDU
|
||||
0D82..0D83;N # Mc [2] SINHALA SIGN ANUSVARAYA..SINHALA SIGN VISARGAYA
|
||||
0D85..0D96;N # Lo [18] SINHALA LETTER AYANNA..SINHALA LETTER AUYANNA
|
||||
0D9A..0DB1;N # Lo [24] SINHALA LETTER ALPAPRAANA KAYANNA..SINHALA LETTER DANTAJA NAYANNA
|
||||
@ -795,6 +796,7 @@
|
||||
1AA8..1AAD;N # Po [6] TAI THAM SIGN KAAN..TAI THAM SIGN CAANG
|
||||
1AB0..1ABD;N # Mn [14] COMBINING DOUBLED CIRCUMFLEX ACCENT..COMBINING PARENTHESES BELOW
|
||||
1ABE;N # Me COMBINING PARENTHESES OVERLAY
|
||||
1ABF..1AC0;N # Mn [2] COMBINING LATIN SMALL LETTER W BELOW..COMBINING LATIN SMALL LETTER TURNED W BELOW
|
||||
1B00..1B03;N # Mn [4] BALINESE SIGN ULU RICEM..BALINESE SIGN SURANG
|
||||
1B04;N # Mc BALINESE SIGN BISAH
|
||||
1B05..1B33;N # Lo [47] BALINESE LETTER AKARA..BALINESE LETTER HA
|
||||
@ -1335,7 +1337,7 @@
|
||||
2B56..2B59;A # So [4] HEAVY OVAL WITH OVAL INSIDE..HEAVY CIRCLED SALTIRE
|
||||
2B5A..2B73;N # So [26] SLANTED NORTH ARROW WITH HOOKED HEAD..DOWNWARDS TRIANGLE-HEADED ARROW TO BAR
|
||||
2B76..2B95;N # So [32] NORTH WEST TRIANGLE-HEADED ARROW TO BAR..RIGHTWARDS BLACK ARROW
|
||||
2B98..2BFF;N # So [104] THREE-D TOP-LIGHTED LEFTWARDS EQUILATERAL ARROWHEAD..HELLSCHREIBER PAUSE SYMBOL
|
||||
2B97..2BFF;N # So [105] SYMBOL FOR TYPE A ELECTRONICS..HELLSCHREIBER PAUSE SYMBOL
|
||||
2C00..2C2E;N # Lu [47] GLAGOLITIC CAPITAL LETTER AZU..GLAGOLITIC CAPITAL LETTER LATINATE MYSLITE
|
||||
2C30..2C5E;N # Ll [47] GLAGOLITIC SMALL LETTER AZU..GLAGOLITIC SMALL LETTER LATINATE MYSLITE
|
||||
2C60..2C7B;N # L& [28] LATIN CAPITAL LETTER L WITH DOUBLE BAR..LATIN LETTER SMALL CAPITAL TURNED E
|
||||
@ -1404,6 +1406,8 @@
|
||||
2E41;N # Po REVERSED COMMA
|
||||
2E42;N # Ps DOUBLE LOW-REVERSED-9 QUOTATION MARK
|
||||
2E43..2E4F;N # Po [13] DASH WITH LEFT UPTURN..CORNISH VERSE DIVIDER
|
||||
2E50..2E51;N # So [2] CROSS PATTY WITH RIGHT CROSSBAR..CROSS PATTY WITH LEFT CROSSBAR
|
||||
2E52;N # Po TIRONIAN SIGN CAPITAL ET
|
||||
2E80..2E99;W # So [26] CJK RADICAL REPEAT..CJK RADICAL RAP
|
||||
2E9B..2EF3;W # So [89] CJK RADICAL CHOKE..CJK RADICAL C-SIMPLIFIED TURTLE
|
||||
2F00..2FD5;W # So [214] KANGXI RADICAL ONE..KANGXI RADICAL FLUTE
|
||||
@ -1464,7 +1468,7 @@
|
||||
3190..3191;W # So [2] IDEOGRAPHIC ANNOTATION LINKING MARK..IDEOGRAPHIC ANNOTATION REVERSE MARK
|
||||
3192..3195;W # No [4] IDEOGRAPHIC ANNOTATION ONE MARK..IDEOGRAPHIC ANNOTATION FOUR MARK
|
||||
3196..319F;W # So [10] IDEOGRAPHIC ANNOTATION TOP MARK..IDEOGRAPHIC ANNOTATION MAN MARK
|
||||
31A0..31BA;W # Lo [27] BOPOMOFO LETTER BU..BOPOMOFO LETTER ZY
|
||||
31A0..31BF;W # Lo [32] BOPOMOFO LETTER BU..BOPOMOFO LETTER AH
|
||||
31C0..31E3;W # So [36] CJK STROKE T..CJK STROKE Q
|
||||
31F0..31FF;W # Lo [16] KATAKANA LETTER SMALL KU..KATAKANA LETTER SMALL RO
|
||||
3200..321E;W # So [31] PARENTHESIZED HANGUL KIYEOK..PARENTHESIZED KOREAN CHARACTER O HU
|
||||
@ -1479,11 +1483,10 @@
|
||||
32B1..32BF;W # No [15] CIRCLED NUMBER THIRTY SIX..CIRCLED NUMBER FIFTY
|
||||
32C0..32FF;W # So [64] IDEOGRAPHIC TELEGRAPH SYMBOL FOR JANUARY..SQUARE ERA NAME REIWA
|
||||
3300..33FF;W # So [256] SQUARE APAATO..SQUARE GAL
|
||||
3400..4DB5;W # Lo [6582] CJK UNIFIED IDEOGRAPH-3400..CJK UNIFIED IDEOGRAPH-4DB5
|
||||
4DB6..4DBF;W # Cn [10] <reserved-4DB6>..<reserved-4DBF>
|
||||
3400..4DBF;W # Lo [6592] CJK UNIFIED IDEOGRAPH-3400..CJK UNIFIED IDEOGRAPH-4DBF
|
||||
4DC0..4DFF;N # So [64] HEXAGRAM FOR THE CREATIVE HEAVEN..HEXAGRAM FOR BEFORE COMPLETION
|
||||
4E00..9FEF;W # Lo [20976] CJK UNIFIED IDEOGRAPH-4E00..CJK UNIFIED IDEOGRAPH-9FEF
|
||||
9FF0..9FFF;W # Cn [16] <reserved-9FF0>..<reserved-9FFF>
|
||||
4E00..9FFC;W # Lo [20989] CJK UNIFIED IDEOGRAPH-4E00..CJK UNIFIED IDEOGRAPH-9FFC
|
||||
9FFD..9FFF;W # Cn [3] <reserved-9FFD>..<reserved-9FFF>
|
||||
A000..A014;W # Lo [21] YI SYLLABLE IT..YI SYLLABLE E
|
||||
A015;W # Lm YI SYLLABLE WU
|
||||
A016..A48C;W # Lo [1143] YI SYLLABLE BIT..YI SYLLABLE YYR
|
||||
@ -1523,7 +1526,8 @@ A789..A78A;N # Sk [2] MODIFIER LETTER COLON..MODIFIER LETTER SHORT EQUAL
|
||||
A78B..A78E;N # L& [4] LATIN CAPITAL LETTER SALTILLO..LATIN SMALL LETTER L WITH RETROFLEX HOOK AND BELT
|
||||
A78F;N # Lo LATIN LETTER SINOLOGICAL DOT
|
||||
A790..A7BF;N # L& [48] LATIN CAPITAL LETTER N WITH DESCENDER..LATIN SMALL LETTER GLOTTAL U
|
||||
A7C2..A7C6;N # L& [5] LATIN CAPITAL LETTER ANGLICANA W..LATIN CAPITAL LETTER Z WITH PALATAL HOOK
|
||||
A7C2..A7CA;N # L& [9] LATIN CAPITAL LETTER ANGLICANA W..LATIN SMALL LETTER S WITH SHORT STROKE OVERLAY
|
||||
A7F5..A7F6;N # L& [2] LATIN CAPITAL LETTER REVERSED HALF H..LATIN SMALL LETTER REVERSED HALF H
|
||||
A7F7;N # Lo LATIN EPIGRAPHIC LETTER SIDEWAYS I
|
||||
A7F8..A7F9;N # Lm [2] MODIFIER LETTER CAPITAL H WITH STROKE..MODIFIER LETTER SMALL LIGATURE OE
|
||||
A7FA;N # Ll LATIN LETTER SMALL CAPITAL TURNED M
|
||||
@ -1539,6 +1543,7 @@ A823..A824;N # Mc [2] SYLOTI NAGRI VOWEL SIGN A..SYLOTI NAGRI VOWEL SIGN
|
||||
A825..A826;N # Mn [2] SYLOTI NAGRI VOWEL SIGN U..SYLOTI NAGRI VOWEL SIGN E
|
||||
A827;N # Mc SYLOTI NAGRI VOWEL SIGN OO
|
||||
A828..A82B;N # So [4] SYLOTI NAGRI POETRY MARK-1..SYLOTI NAGRI POETRY MARK-4
|
||||
A82C;N # Mn SYLOTI NAGRI SIGN ALTERNATE HASANTA
|
||||
A830..A835;N # No [6] NORTH INDIC FRACTION ONE QUARTER..NORTH INDIC FRACTION THREE SIXTEENTHS
|
||||
A836..A837;N # So [2] NORTH INDIC QUARTER MARK..NORTH INDIC PLACEHOLDER MARK
|
||||
A838;N # Sc NORTH INDIC RUPEE MARK
|
||||
@ -1639,7 +1644,9 @@ AB28..AB2E;N # Lo [7] ETHIOPIC SYLLABLE BBA..ETHIOPIC SYLLABLE BBO
|
||||
AB30..AB5A;N # Ll [43] LATIN SMALL LETTER BARRED ALPHA..LATIN SMALL LETTER Y WITH SHORT RIGHT LEG
|
||||
AB5B;N # Sk MODIFIER BREVE WITH INVERTED BREVE
|
||||
AB5C..AB5F;N # Lm [4] MODIFIER LETTER SMALL HENG..MODIFIER LETTER SMALL U WITH LEFT HOOK
|
||||
AB60..AB67;N # Ll [8] LATIN SMALL LETTER SAKHA YAT..LATIN SMALL LETTER TS DIGRAPH WITH RETROFLEX HOOK
|
||||
AB60..AB68;N # Ll [9] LATIN SMALL LETTER SAKHA YAT..LATIN SMALL LETTER TURNED R WITH MIDDLE TILDE
|
||||
AB69;N # Lm MODIFIER LETTER SMALL TURNED W
|
||||
AB6A..AB6B;N # Sk [2] MODIFIER LETTER LEFT TACK..MODIFIER LETTER RIGHT TACK
|
||||
AB70..ABBF;N # Ll [80] CHEROKEE SMALL LETTER A..CHEROKEE SMALL LETTER YA
|
||||
ABC0..ABE2;N # Lo [35] MEETEI MAYEK LETTER KOK..MEETEI MAYEK LETTER I LONSUM
|
||||
ABE3..ABE4;N # Mc [2] MEETEI MAYEK VOWEL SIGN ONAP..MEETEI MAYEK VOWEL SIGN INAP
|
||||
@ -1800,7 +1807,7 @@ FFFD;A # So REPLACEMENT CHARACTER
|
||||
10179..10189;N # So [17] GREEK YEAR SIGN..GREEK TRYBLION BASE SIGN
|
||||
1018A..1018B;N # No [2] GREEK ZERO SIGN..GREEK ONE QUARTER SIGN
|
||||
1018C..1018E;N # So [3] GREEK SINUSOID SIGN..NOMISMA SIGN
|
||||
10190..1019B;N # So [12] ROMAN SEXTANS SIGN..ROMAN CENTURIAL SIGN
|
||||
10190..1019C;N # So [13] ROMAN SEXTANS SIGN..ASCIA SYMBOL
|
||||
101A0;N # So GREEK SYMBOL TAU RHO
|
||||
101D0..101FC;N # So [45] PHAISTOS DISC SIGN PEDESTRIAN..PHAISTOS DISC SIGN WAVY BAND
|
||||
101FD;N # Mn PHAISTOS DISC SIGN COMBINING OBLIQUE STROKE
|
||||
@ -1902,6 +1909,10 @@ FFFD;A # So REPLACEMENT CHARACTER
|
||||
10D24..10D27;N # Mn [4] HANIFI ROHINGYA SIGN HARBAHAY..HANIFI ROHINGYA SIGN TASSI
|
||||
10D30..10D39;N # Nd [10] HANIFI ROHINGYA DIGIT ZERO..HANIFI ROHINGYA DIGIT NINE
|
||||
10E60..10E7E;N # No [31] RUMI DIGIT ONE..RUMI FRACTION TWO THIRDS
|
||||
10E80..10EA9;N # Lo [42] YEZIDI LETTER ELIF..YEZIDI LETTER ET
|
||||
10EAB..10EAC;N # Mn [2] YEZIDI COMBINING HAMZA MARK..YEZIDI COMBINING MADDA MARK
|
||||
10EAD;N # Pd YEZIDI HYPHENATION MARK
|
||||
10EB0..10EB1;N # Lo [2] YEZIDI LETTER LAM WITH DOT ABOVE..YEZIDI LETTER YOT WITH CIRCUMFLEX ABOVE
|
||||
10F00..10F1C;N # Lo [29] OLD SOGDIAN LETTER ALEPH..OLD SOGDIAN LETTER FINAL TAW WITH VERTICAL TAIL
|
||||
10F1D..10F26;N # No [10] OLD SOGDIAN NUMBER ONE..OLD SOGDIAN FRACTION ONE HALF
|
||||
10F27;N # Lo OLD SOGDIAN LIGATURE AYIN-DALETH
|
||||
@ -1909,6 +1920,8 @@ FFFD;A # So REPLACEMENT CHARACTER
|
||||
10F46..10F50;N # Mn [11] SOGDIAN COMBINING DOT BELOW..SOGDIAN COMBINING STROKE BELOW
|
||||
10F51..10F54;N # No [4] SOGDIAN NUMBER ONE..SOGDIAN NUMBER ONE HUNDRED
|
||||
10F55..10F59;N # Po [5] SOGDIAN PUNCTUATION TWO VERTICAL BARS..SOGDIAN PUNCTUATION HALF CIRCLE WITH DOT
|
||||
10FB0..10FC4;N # Lo [21] CHORASMIAN LETTER ALEPH..CHORASMIAN LETTER TAW
|
||||
10FC5..10FCB;N # No [7] CHORASMIAN NUMBER ONE..CHORASMIAN NUMBER ONE HUNDRED
|
||||
10FE0..10FF6;N # Lo [23] ELYMAIC LETTER ALEPH..ELYMAIC LIGATURE ZAYIN-YODH
|
||||
11000;N # Mc BRAHMI SIGN CANDRABINDU
|
||||
11001;N # Mn BRAHMI SIGN ANUSVARA
|
||||
@ -1941,6 +1954,7 @@ FFFD;A # So REPLACEMENT CHARACTER
|
||||
11140..11143;N # Po [4] CHAKMA SECTION MARK..CHAKMA QUESTION MARK
|
||||
11144;N # Lo CHAKMA LETTER LHAA
|
||||
11145..11146;N # Mc [2] CHAKMA VOWEL SIGN AA..CHAKMA VOWEL SIGN EI
|
||||
11147;N # Lo CHAKMA LETTER VAA
|
||||
11150..11172;N # Lo [35] MAHAJANI LETTER A..MAHAJANI LETTER RRA
|
||||
11173;N # Mn MAHAJANI SIGN NUKTA
|
||||
11174..11175;N # Po [2] MAHAJANI ABBREVIATION SIGN..MAHAJANI SECTION MARK
|
||||
@ -1955,6 +1969,8 @@ FFFD;A # So REPLACEMENT CHARACTER
|
||||
111C5..111C8;N # Po [4] SHARADA DANDA..SHARADA SEPARATOR
|
||||
111C9..111CC;N # Mn [4] SHARADA SANDHI MARK..SHARADA EXTRA SHORT VOWEL MARK
|
||||
111CD;N # Po SHARADA SUTRA MARK
|
||||
111CE;N # Mc SHARADA VOWEL SIGN PRISHTHAMATRA E
|
||||
111CF;N # Mn SHARADA SIGN INVERTED CANDRABINDU
|
||||
111D0..111D9;N # Nd [10] SHARADA DIGIT ZERO..SHARADA DIGIT NINE
|
||||
111DA;N # Lo SHARADA EKAM
|
||||
111DB;N # Po SHARADA SIGN SIDDHAM
|
||||
@ -2013,10 +2029,10 @@ FFFD;A # So REPLACEMENT CHARACTER
|
||||
11447..1144A;N # Lo [4] NEWA SIGN AVAGRAHA..NEWA SIDDHI
|
||||
1144B..1144F;N # Po [5] NEWA DANDA..NEWA ABBREVIATION SIGN
|
||||
11450..11459;N # Nd [10] NEWA DIGIT ZERO..NEWA DIGIT NINE
|
||||
1145B;N # Po NEWA PLACEHOLDER MARK
|
||||
1145A..1145B;N # Po [2] NEWA DOUBLE COMMA..NEWA PLACEHOLDER MARK
|
||||
1145D;N # Po NEWA INSERTION SIGN
|
||||
1145E;N # Mn NEWA SANDHI MARK
|
||||
1145F;N # Lo NEWA LETTER VEDIC ANUSVARA
|
||||
1145F..11461;N # Lo [3] NEWA LETTER VEDIC ANUSVARA..NEWA SIGN UPADHMANIYA
|
||||
11480..114AF;N # Lo [48] TIRHUTA ANJI..TIRHUTA LETTER HA
|
||||
114B0..114B2;N # Mc [3] TIRHUTA VOWEL SIGN AA..TIRHUTA VOWEL SIGN II
|
||||
114B3..114B8;N # Mn [6] TIRHUTA VOWEL SIGN U..TIRHUTA VOWEL SIGN VOCALIC LL
|
||||
@ -2081,6 +2097,23 @@ FFFD;A # So REPLACEMENT CHARACTER
|
||||
118E0..118E9;N # Nd [10] WARANG CITI DIGIT ZERO..WARANG CITI DIGIT NINE
|
||||
118EA..118F2;N # No [9] WARANG CITI NUMBER TEN..WARANG CITI NUMBER NINETY
|
||||
118FF;N # Lo WARANG CITI OM
|
||||
11900..11906;N # Lo [7] DIVES AKURU LETTER A..DIVES AKURU LETTER E
|
||||
11909;N # Lo DIVES AKURU LETTER O
|
||||
1190C..11913;N # Lo [8] DIVES AKURU LETTER KA..DIVES AKURU LETTER JA
|
||||
11915..11916;N # Lo [2] DIVES AKURU LETTER NYA..DIVES AKURU LETTER TTA
|
||||
11918..1192F;N # Lo [24] DIVES AKURU LETTER DDA..DIVES AKURU LETTER ZA
|
||||
11930..11935;N # Mc [6] DIVES AKURU VOWEL SIGN AA..DIVES AKURU VOWEL SIGN E
|
||||
11937..11938;N # Mc [2] DIVES AKURU VOWEL SIGN AI..DIVES AKURU VOWEL SIGN O
|
||||
1193B..1193C;N # Mn [2] DIVES AKURU SIGN ANUSVARA..DIVES AKURU SIGN CANDRABINDU
|
||||
1193D;N # Mc DIVES AKURU SIGN HALANTA
|
||||
1193E;N # Mn DIVES AKURU VIRAMA
|
||||
1193F;N # Lo DIVES AKURU PREFIXED NASAL SIGN
|
||||
11940;N # Mc DIVES AKURU MEDIAL YA
|
||||
11941;N # Lo DIVES AKURU INITIAL RA
|
||||
11942;N # Mc DIVES AKURU MEDIAL RA
|
||||
11943;N # Mn DIVES AKURU SIGN NUKTA
|
||||
11944..11946;N # Po [3] DIVES AKURU DOUBLE DANDA..DIVES AKURU END OF TEXT MARK
|
||||
11950..11959;N # Nd [10] DIVES AKURU DIGIT ZERO..DIVES AKURU DIGIT NINE
|
||||
119A0..119A7;N # Lo [8] NANDINAGARI LETTER A..NANDINAGARI LETTER VOCALIC RR
|
||||
119AA..119D0;N # Lo [39] NANDINAGARI LETTER E..NANDINAGARI LETTER RRA
|
||||
119D1..119D3;N # Mc [3] NANDINAGARI VOWEL SIGN AA..NANDINAGARI VOWEL SIGN II
|
||||
@ -2158,6 +2191,7 @@ FFFD;A # So REPLACEMENT CHARACTER
|
||||
11EF3..11EF4;N # Mn [2] MAKASAR VOWEL SIGN I..MAKASAR VOWEL SIGN U
|
||||
11EF5..11EF6;N # Mc [2] MAKASAR VOWEL SIGN E..MAKASAR VOWEL SIGN O
|
||||
11EF7..11EF8;N # Po [2] MAKASAR PASSIMBANG..MAKASAR END OF SECTION
|
||||
11FB0;N # Lo LISU LETTER YHA
|
||||
11FC0..11FD4;N # No [21] TAMIL FRACTION ONE THREE-HUNDRED-AND-TWENTIETH..TAMIL FRACTION DOWNSCALING FACTOR KIIZH
|
||||
11FD5..11FDC;N # So [8] TAMIL SIGN NEL..TAMIL SIGN MUKKURUNI
|
||||
11FDD..11FE0;N # Sc [4] TAMIL SIGN KAACU..TAMIL SIGN VARAAKAN
|
||||
@ -2200,8 +2234,12 @@ FFFD;A # So REPLACEMENT CHARACTER
|
||||
16FE0..16FE1;W # Lm [2] TANGUT ITERATION MARK..NUSHU ITERATION MARK
|
||||
16FE2;W # Po OLD CHINESE HOOK MARK
|
||||
16FE3;W # Lm OLD CHINESE ITERATION MARK
|
||||
16FE4;W # Mn KHITAN SMALL SCRIPT FILLER
|
||||
16FF0..16FF1;W # Mc [2] VIETNAMESE ALTERNATE READING MARK CA..VIETNAMESE ALTERNATE READING MARK NHAY
|
||||
17000..187F7;W # Lo [6136] TANGUT IDEOGRAPH-17000..TANGUT IDEOGRAPH-187F7
|
||||
18800..18AF2;W # Lo [755] TANGUT COMPONENT-001..TANGUT COMPONENT-755
|
||||
18800..18AFF;W # Lo [768] TANGUT COMPONENT-001..TANGUT COMPONENT-768
|
||||
18B00..18CD5;W # Lo [470] KHITAN SMALL SCRIPT CHARACTER-18B00..KHITAN SMALL SCRIPT CHARACTER-18CD5
|
||||
18D00..18D08;W # Lo [9] TANGUT IDEOGRAPH-18D00..TANGUT IDEOGRAPH-18D08
|
||||
1B000..1B0FF;W # Lo [256] KATAKANA LETTER ARCHAIC E..HENTAIGANA LETTER RE-2
|
||||
1B100..1B11E;W # Lo [31] HENTAIGANA LETTER RE-3..HENTAIGANA LETTER N-MU-MO-2
|
||||
1B150..1B152;W # Lo [3] HIRAGANA LETTER SMALL WI..HIRAGANA LETTER SMALL WO
|
||||
@ -2364,15 +2402,17 @@ FFFD;A # So REPLACEMENT CHARACTER
|
||||
1F0D1..1F0F5;N # So [37] PLAYING CARD ACE OF CLUBS..PLAYING CARD TRUMP-21
|
||||
1F100..1F10A;A # No [11] DIGIT ZERO FULL STOP..DIGIT NINE COMMA
|
||||
1F10B..1F10C;N # No [2] DINGBAT CIRCLED SANS-SERIF DIGIT ZERO..DINGBAT NEGATIVE CIRCLED SANS-SERIF DIGIT ZERO
|
||||
1F10D..1F10F;N # So [3] CIRCLED ZERO WITH SLASH..CIRCLED DOLLAR SIGN WITH OVERLAID BACKSLASH
|
||||
1F110..1F12D;A # So [30] PARENTHESIZED LATIN CAPITAL LETTER A..CIRCLED CD
|
||||
1F12E..1F12F;N # So [2] CIRCLED WZ..COPYLEFT SYMBOL
|
||||
1F130..1F169;A # So [58] SQUARED LATIN CAPITAL LETTER A..NEGATIVE CIRCLED LATIN CAPITAL LETTER Z
|
||||
1F16A..1F16C;N # So [3] RAISED MC SIGN..RAISED MR SIGN
|
||||
1F16A..1F16F;N # So [6] RAISED MC SIGN..CIRCLED HUMAN FIGURE
|
||||
1F170..1F18D;A # So [30] NEGATIVE SQUARED LATIN CAPITAL LETTER A..NEGATIVE SQUARED SA
|
||||
1F18E;W # So NEGATIVE SQUARED AB
|
||||
1F18F..1F190;A # So [2] NEGATIVE SQUARED WC..SQUARE DJ
|
||||
1F191..1F19A;W # So [10] SQUARED CL..SQUARED VS
|
||||
1F19B..1F1AC;A # So [18] SQUARED THREE D..SQUARED VOD
|
||||
1F1AD;N # So MASK WORK SYMBOL
|
||||
1F1E6..1F1FF;N # So [26] REGIONAL INDICATOR SYMBOL LETTER A..REGIONAL INDICATOR SYMBOL LETTER Z
|
||||
1F200..1F202;W # So [3] SQUARE HIRAGANA HOKA..SQUARED KATAKANA SA
|
||||
1F210..1F23B;W # So [44] SQUARED CJK UNIFIED IDEOGRAPH-624B..SQUARED CJK UNIFIED IDEOGRAPH-914D
|
||||
@ -2424,11 +2464,11 @@ FFFD;A # So REPLACEMENT CHARACTER
|
||||
1F6CD..1F6CF;N # So [3] SHOPPING BAGS..BED
|
||||
1F6D0..1F6D2;W # So [3] PLACE OF WORSHIP..SHOPPING TROLLEY
|
||||
1F6D3..1F6D4;N # So [2] STUPA..PAGODA
|
||||
1F6D5;W # So HINDU TEMPLE
|
||||
1F6D5..1F6D7;W # So [3] HINDU TEMPLE..ELEVATOR
|
||||
1F6E0..1F6EA;N # So [11] HAMMER AND WRENCH..NORTHEAST-POINTING AIRPLANE
|
||||
1F6EB..1F6EC;W # So [2] AIRPLANE DEPARTURE..AIRPLANE ARRIVING
|
||||
1F6F0..1F6F3;N # So [4] SATELLITE..PASSENGER SHIP
|
||||
1F6F4..1F6FA;W # So [7] SCOOTER..AUTO RICKSHAW
|
||||
1F6F4..1F6FC;W # So [9] SCOOTER..ROLLER SKATE
|
||||
1F700..1F773;N # So [116] ALCHEMICAL SYMBOL FOR QUINTESSENCE..ALCHEMICAL SYMBOL FOR HALF OUNCE
|
||||
1F780..1F7D8;N # So [89] BLACK LEFT-POINTING ISOSCELES RIGHT TRIANGLE..NEGATIVE CIRCLED SQUARE
|
||||
1F7E0..1F7EB;W # So [12] LARGE ORANGE CIRCLE..LARGE BROWN SQUARE
|
||||
@ -2437,21 +2477,29 @@ FFFD;A # So REPLACEMENT CHARACTER
|
||||
1F850..1F859;N # So [10] LEFTWARDS SANS-SERIF ARROW..UP DOWN SANS-SERIF ARROW
|
||||
1F860..1F887;N # So [40] WIDE-HEADED LEFTWARDS LIGHT BARB ARROW..WIDE-HEADED SOUTH WEST VERY HEAVY BARB ARROW
|
||||
1F890..1F8AD;N # So [30] LEFTWARDS TRIANGLE ARROWHEAD..WHITE ARROW SHAFT WIDTH TWO THIRDS
|
||||
1F8B0..1F8B1;N # So [2] ARROW POINTING UPWARDS THEN NORTH WEST..ARROW POINTING RIGHTWARDS THEN CURVING SOUTH WEST
|
||||
1F900..1F90B;N # So [12] CIRCLED CROSS FORMEE WITH FOUR DOTS..DOWNWARD FACING NOTCHED HOOK WITH DOT
|
||||
1F90D..1F971;W # So [101] WHITE HEART..YAWNING FACE
|
||||
1F973..1F976;W # So [4] FACE WITH PARTY HORN AND PARTY HAT..FREEZING FACE
|
||||
1F97A..1F9A2;W # So [41] FACE WITH PLEADING EYES..SWAN
|
||||
1F9A5..1F9AA;W # So [6] SLOTH..OYSTER
|
||||
1F9AE..1F9CA;W # So [29] GUIDE DOG..ICE CUBE
|
||||
1F90C..1F93A;W # So [47] PINCHED FINGERS..FENCER
|
||||
1F93B;N # So MODERN PENTATHLON
|
||||
1F93C..1F945;W # So [10] WRESTLERS..GOAL NET
|
||||
1F946;N # So RIFLE
|
||||
1F947..1F978;W # So [50] FIRST PLACE MEDAL..DISGUISED FACE
|
||||
1F97A..1F9CB;W # So [82] FACE WITH PLEADING EYES..BUBBLE TEA
|
||||
1F9CD..1F9FF;W # So [51] STANDING PERSON..NAZAR AMULET
|
||||
1FA00..1FA53;N # So [84] NEUTRAL CHESS KING..BLACK CHESS KNIGHT-BISHOP
|
||||
1FA60..1FA6D;N # So [14] XIANGQI RED GENERAL..XIANGQI BLACK SOLDIER
|
||||
1FA70..1FA73;W # So [4] BALLET SHOES..SHORTS
|
||||
1FA70..1FA74;W # So [5] BALLET SHOES..THONG SANDAL
|
||||
1FA78..1FA7A;W # So [3] DROP OF BLOOD..STETHOSCOPE
|
||||
1FA80..1FA82;W # So [3] YO-YO..PARACHUTE
|
||||
1FA90..1FA95;W # So [6] RINGED PLANET..BANJO
|
||||
20000..2A6D6;W # Lo [42711] CJK UNIFIED IDEOGRAPH-20000..CJK UNIFIED IDEOGRAPH-2A6D6
|
||||
2A6D7..2A6FF;W # Cn [41] <reserved-2A6D7>..<reserved-2A6FF>
|
||||
1FA80..1FA86;W # So [7] YO-YO..NESTING DOLLS
|
||||
1FA90..1FAA8;W # So [25] RINGED PLANET..ROCK
|
||||
1FAB0..1FAB6;W # So [7] FLY..FEATHER
|
||||
1FAC0..1FAC2;W # So [3] ANATOMICAL HEART..PEOPLE HUGGING
|
||||
1FAD0..1FAD6;W # So [7] BLUEBERRIES..TEAPOT
|
||||
1FB00..1FB92;N # So [147] BLOCK SEXTANT-1..UPPER HALF INVERSE MEDIUM SHADE AND LOWER HALF BLOCK
|
||||
1FB94..1FBCA;N # So [55] LEFT HALF INVERSE MEDIUM SHADE AND RIGHT HALF BLOCK..WHITE UP-POINTING CHEVRON
|
||||
1FBF0..1FBF9;N # Nd [10] SEGMENTED DIGIT ZERO..SEGMENTED DIGIT NINE
|
||||
20000..2A6DD;W # Lo [42718] CJK UNIFIED IDEOGRAPH-20000..CJK UNIFIED IDEOGRAPH-2A6DD
|
||||
2A6DE..2A6FF;W # Cn [34] <reserved-2A6DE>..<reserved-2A6FF>
|
||||
2A700..2B734;W # Lo [4149] CJK UNIFIED IDEOGRAPH-2A700..CJK UNIFIED IDEOGRAPH-2B734
|
||||
2B735..2B73F;W # Cn [11] <reserved-2B735>..<reserved-2B73F>
|
||||
2B740..2B81D;W # Lo [222] CJK UNIFIED IDEOGRAPH-2B740..CJK UNIFIED IDEOGRAPH-2B81D
|
||||
@ -2463,7 +2511,8 @@ FFFD;A # So REPLACEMENT CHARACTER
|
||||
2F800..2FA1D;W # Lo [542] CJK COMPATIBILITY IDEOGRAPH-2F800..CJK COMPATIBILITY IDEOGRAPH-2FA1D
|
||||
2FA1E..2FA1F;W # Cn [2] <reserved-2FA1E>..<reserved-2FA1F>
|
||||
2FA20..2FFFD;W # Cn [1502] <reserved-2FA20>..<reserved-2FFFD>
|
||||
30000..3FFFD;W # Cn [65534] <reserved-30000>..<reserved-3FFFD>
|
||||
30000..3134A;W # Lo [4939] CJK UNIFIED IDEOGRAPH-30000..CJK UNIFIED IDEOGRAPH-3134A
|
||||
3134B..3FFFD;W # Cn [60595] <reserved-3134B>..<reserved-3FFFD>
|
||||
E0001;N # Cf LANGUAGE TAG
|
||||
E0020..E007F;N # Cf [96] TAG SPACE..CANCEL TAG
|
||||
E0100..E01EF;A # Mn [240] VARIATION SELECTOR-17..VARIATION SELECTOR-256
|
||||
|
@ -35,7 +35,7 @@
|
||||
# files for making modifications.
|
||||
|
||||
|
||||
UNICODE_VERSION = 12.1.0
|
||||
UNICODE_VERSION = 13.0.0
|
||||
|
||||
PYTHON3 = python3
|
||||
WGET = wget
|
||||
|
@ -1,5 +1,5 @@
|
||||
# PropList-12.1.0.txt
|
||||
# Date: 2019-03-10, 10:53:16 GMT
|
||||
# PropList-13.0.0.txt
|
||||
# Date: 2019-11-27, 03:13:28 GMT
|
||||
# © 2019 Unicode®, Inc.
|
||||
# Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries.
|
||||
# For terms of use, see http://www.unicode.org/terms_of_use.html
|
||||
@ -61,8 +61,9 @@ FE31..FE32 ; Dash # Pd [2] PRESENTATION FORM FOR VERTICAL EM DASH..PRESENTA
|
||||
FE58 ; Dash # Pd SMALL EM DASH
|
||||
FE63 ; Dash # Pd SMALL HYPHEN-MINUS
|
||||
FF0D ; Dash # Pd FULLWIDTH HYPHEN-MINUS
|
||||
10EAD ; Dash # Pd YEZIDI HYPHENATION MARK
|
||||
|
||||
# Total code points: 28
|
||||
# Total code points: 29
|
||||
|
||||
# ================================================
|
||||
|
||||
@ -197,11 +198,13 @@ FF64 ; Terminal_Punctuation # Po HALFWIDTH IDEOGRAPHIC COMMA
|
||||
11238..1123C ; Terminal_Punctuation # Po [5] KHOJKI DANDA..KHOJKI DOUBLE SECTION MARK
|
||||
112A9 ; Terminal_Punctuation # Po MULTANI SECTION MARK
|
||||
1144B..1144D ; Terminal_Punctuation # Po [3] NEWA DANDA..NEWA COMMA
|
||||
1145B ; Terminal_Punctuation # Po NEWA PLACEHOLDER MARK
|
||||
1145A..1145B ; Terminal_Punctuation # Po [2] NEWA DOUBLE COMMA..NEWA PLACEHOLDER MARK
|
||||
115C2..115C5 ; Terminal_Punctuation # Po [4] SIDDHAM DANDA..SIDDHAM SEPARATOR BAR
|
||||
115C9..115D7 ; Terminal_Punctuation # Po [15] SIDDHAM END OF TEXT MARK..SIDDHAM SECTION MARK WITH CIRCLES AND FOUR ENCLOSURES
|
||||
11641..11642 ; Terminal_Punctuation # Po [2] MODI DANDA..MODI DOUBLE DANDA
|
||||
1173C..1173E ; Terminal_Punctuation # Po [3] AHOM SIGN SMALL SECTION..AHOM SIGN RULAI
|
||||
11944 ; Terminal_Punctuation # Po DIVES AKURU DOUBLE DANDA
|
||||
11946 ; Terminal_Punctuation # Po DIVES AKURU END OF TEXT MARK
|
||||
11A42..11A43 ; Terminal_Punctuation # Po [2] ZANABAZAR SQUARE MARK SHAD..ZANABAZAR SQUARE MARK DOUBLE SHAD
|
||||
11A9B..11A9C ; Terminal_Punctuation # Po [2] SOYOMBO MARK SHAD..SOYOMBO MARK DOUBLE SHAD
|
||||
11AA1..11AA2 ; Terminal_Punctuation # Po [2] SOYOMBO TERMINAL MARK-1..SOYOMBO TERMINAL MARK-2
|
||||
@ -217,7 +220,7 @@ FF64 ; Terminal_Punctuation # Po HALFWIDTH IDEOGRAPHIC COMMA
|
||||
1BC9F ; Terminal_Punctuation # Po DUPLOYAN PUNCTUATION CHINOOK FULL STOP
|
||||
1DA87..1DA8A ; Terminal_Punctuation # Po [4] SIGNWRITING COMMA..SIGNWRITING COLON
|
||||
|
||||
# Total code points: 264
|
||||
# Total code points: 267
|
||||
|
||||
# ================================================
|
||||
|
||||
@ -525,6 +528,7 @@ FF41..FF46 ; Hex_Digit # L& [6] FULLWIDTH LATIN SMALL LETTER A..FULLWIDTH L
|
||||
0D4A..0D4C ; Other_Alphabetic # Mc [3] MALAYALAM VOWEL SIGN O..MALAYALAM VOWEL SIGN AU
|
||||
0D57 ; Other_Alphabetic # Mc MALAYALAM AU LENGTH MARK
|
||||
0D62..0D63 ; Other_Alphabetic # Mn [2] MALAYALAM VOWEL SIGN VOCALIC L..MALAYALAM VOWEL SIGN VOCALIC LL
|
||||
0D81 ; Other_Alphabetic # Mn SINHALA SIGN CANDRABINDU
|
||||
0D82..0D83 ; Other_Alphabetic # Mc [2] SINHALA SIGN ANUSVARAYA..SINHALA SIGN VISARGAYA
|
||||
0DCF..0DD1 ; Other_Alphabetic # Mc [3] SINHALA VOWEL SIGN AELA-PILLA..SINHALA VOWEL SIGN DIGA AEDA-PILLA
|
||||
0DD2..0DD4 ; Other_Alphabetic # Mn [3] SINHALA VOWEL SIGN KETTI IS-PILLA..SINHALA VOWEL SIGN KETTI PAA-PILLA
|
||||
@ -595,6 +599,7 @@ FF41..FF46 ; Hex_Digit # L& [6] FULLWIDTH LATIN SMALL LETTER A..FULLWIDTH L
|
||||
1A65..1A6C ; Other_Alphabetic # Mn [8] TAI THAM VOWEL SIGN I..TAI THAM VOWEL SIGN OA BELOW
|
||||
1A6D..1A72 ; Other_Alphabetic # Mc [6] TAI THAM VOWEL SIGN OY..TAI THAM VOWEL SIGN THAM AI
|
||||
1A73..1A74 ; Other_Alphabetic # Mn [2] TAI THAM VOWEL SIGN OA ABOVE..TAI THAM SIGN MAI KANG
|
||||
1ABF..1AC0 ; Other_Alphabetic # Mn [2] COMBINING LATIN SMALL LETTER W BELOW..COMBINING LATIN SMALL LETTER TURNED W BELOW
|
||||
1B00..1B03 ; Other_Alphabetic # Mn [4] BALINESE SIGN ULU RICEM..BALINESE SIGN SURANG
|
||||
1B04 ; Other_Alphabetic # Mc BALINESE SIGN BISAH
|
||||
1B35 ; Other_Alphabetic # Mc BALINESE VOWEL SIGN TEDUNG
|
||||
@ -676,6 +681,7 @@ FB1E ; Other_Alphabetic # Mn HEBREW POINT JUDEO-SPANISH VARIKA
|
||||
10A05..10A06 ; Other_Alphabetic # Mn [2] KHAROSHTHI VOWEL SIGN E..KHAROSHTHI VOWEL SIGN O
|
||||
10A0C..10A0F ; Other_Alphabetic # Mn [4] KHAROSHTHI VOWEL LENGTH MARK..KHAROSHTHI SIGN VISARGA
|
||||
10D24..10D27 ; Other_Alphabetic # Mn [4] HANIFI ROHINGYA SIGN HARBAHAY..HANIFI ROHINGYA SIGN TASSI
|
||||
10EAB..10EAC ; Other_Alphabetic # Mn [2] YEZIDI COMBINING HAMZA MARK..YEZIDI COMBINING MADDA MARK
|
||||
11000 ; Other_Alphabetic # Mc BRAHMI SIGN CANDRABINDU
|
||||
11001 ; Other_Alphabetic # Mn BRAHMI SIGN ANUSVARA
|
||||
11002 ; Other_Alphabetic # Mc BRAHMI SIGN VISARGA
|
||||
@ -694,6 +700,8 @@ FB1E ; Other_Alphabetic # Mn HEBREW POINT JUDEO-SPANISH VARIKA
|
||||
111B3..111B5 ; Other_Alphabetic # Mc [3] SHARADA VOWEL SIGN AA..SHARADA VOWEL SIGN II
|
||||
111B6..111BE ; Other_Alphabetic # Mn [9] SHARADA VOWEL SIGN U..SHARADA VOWEL SIGN O
|
||||
111BF ; Other_Alphabetic # Mc SHARADA VOWEL SIGN AU
|
||||
111CE ; Other_Alphabetic # Mc SHARADA VOWEL SIGN PRISHTHAMATRA E
|
||||
111CF ; Other_Alphabetic # Mn SHARADA SIGN INVERTED CANDRABINDU
|
||||
1122C..1122E ; Other_Alphabetic # Mc [3] KHOJKI VOWEL SIGN AA..KHOJKI VOWEL SIGN II
|
||||
1122F..11231 ; Other_Alphabetic # Mn [3] KHOJKI VOWEL SIGN U..KHOJKI VOWEL SIGN AI
|
||||
11232..11233 ; Other_Alphabetic # Mc [2] KHOJKI VOWEL SIGN O..KHOJKI VOWEL SIGN AU
|
||||
@ -749,6 +757,11 @@ FB1E ; Other_Alphabetic # Mn HEBREW POINT JUDEO-SPANISH VARIKA
|
||||
1182C..1182E ; Other_Alphabetic # Mc [3] DOGRA VOWEL SIGN AA..DOGRA VOWEL SIGN II
|
||||
1182F..11837 ; Other_Alphabetic # Mn [9] DOGRA VOWEL SIGN U..DOGRA SIGN ANUSVARA
|
||||
11838 ; Other_Alphabetic # Mc DOGRA SIGN VISARGA
|
||||
11930..11935 ; Other_Alphabetic # Mc [6] DIVES AKURU VOWEL SIGN AA..DIVES AKURU VOWEL SIGN E
|
||||
11937..11938 ; Other_Alphabetic # Mc [2] DIVES AKURU VOWEL SIGN AI..DIVES AKURU VOWEL SIGN O
|
||||
1193B..1193C ; Other_Alphabetic # Mn [2] DIVES AKURU SIGN ANUSVARA..DIVES AKURU SIGN CANDRABINDU
|
||||
11940 ; Other_Alphabetic # Mc DIVES AKURU MEDIAL YA
|
||||
11942 ; Other_Alphabetic # Mc DIVES AKURU MEDIAL RA
|
||||
119D1..119D3 ; Other_Alphabetic # Mc [3] NANDINAGARI VOWEL SIGN AA..NANDINAGARI VOWEL SIGN II
|
||||
119D4..119D7 ; Other_Alphabetic # Mn [4] NANDINAGARI VOWEL SIGN U..NANDINAGARI VOWEL SIGN VOCALIC RR
|
||||
119DA..119DB ; Other_Alphabetic # Mn [2] NANDINAGARI VOWEL SIGN E..NANDINAGARI VOWEL SIGN AI
|
||||
@ -790,6 +803,7 @@ FB1E ; Other_Alphabetic # Mn HEBREW POINT JUDEO-SPANISH VARIKA
|
||||
16F4F ; Other_Alphabetic # Mn MIAO SIGN CONSONANT MODIFIER BAR
|
||||
16F51..16F87 ; Other_Alphabetic # Mc [55] MIAO SIGN ASPIRATION..MIAO VOWEL SIGN UI
|
||||
16F8F..16F92 ; Other_Alphabetic # Mn [4] MIAO TONE RIGHT..MIAO TONE BELOW
|
||||
16FF0..16FF1 ; Other_Alphabetic # Mc [2] VIETNAMESE ALTERNATE READING MARK CA..VIETNAMESE ALTERNATE READING MARK NHAY
|
||||
1BC9E ; Other_Alphabetic # Mn DUPLOYAN DOUBLE MARK
|
||||
1E000..1E006 ; Other_Alphabetic # Mn [7] COMBINING GLAGOLITIC LETTER AZU..COMBINING GLAGOLITIC LETTER ZHIVETE
|
||||
1E008..1E018 ; Other_Alphabetic # Mn [17] COMBINING GLAGOLITIC LETTER ZEMLJA..COMBINING GLAGOLITIC LETTER HERU
|
||||
@ -801,7 +815,7 @@ FB1E ; Other_Alphabetic # Mn HEBREW POINT JUDEO-SPANISH VARIKA
|
||||
1F150..1F169 ; Other_Alphabetic # So [26] NEGATIVE CIRCLED LATIN CAPITAL LETTER A..NEGATIVE CIRCLED LATIN CAPITAL LETTER Z
|
||||
1F170..1F189 ; Other_Alphabetic # So [26] NEGATIVE SQUARED LATIN CAPITAL LETTER A..NEGATIVE SQUARED LATIN CAPITAL LETTER Z
|
||||
|
||||
# Total code points: 1377
|
||||
# Total code points: 1398
|
||||
|
||||
# ================================================
|
||||
|
||||
@ -809,21 +823,24 @@ FB1E ; Other_Alphabetic # Mn HEBREW POINT JUDEO-SPANISH VARIKA
|
||||
3007 ; Ideographic # Nl IDEOGRAPHIC NUMBER ZERO
|
||||
3021..3029 ; Ideographic # Nl [9] HANGZHOU NUMERAL ONE..HANGZHOU NUMERAL NINE
|
||||
3038..303A ; Ideographic # Nl [3] HANGZHOU NUMERAL TEN..HANGZHOU NUMERAL THIRTY
|
||||
3400..4DB5 ; Ideographic # Lo [6582] CJK UNIFIED IDEOGRAPH-3400..CJK UNIFIED IDEOGRAPH-4DB5
|
||||
4E00..9FEF ; Ideographic # Lo [20976] CJK UNIFIED IDEOGRAPH-4E00..CJK UNIFIED IDEOGRAPH-9FEF
|
||||
3400..4DBF ; Ideographic # Lo [6592] CJK UNIFIED IDEOGRAPH-3400..CJK UNIFIED IDEOGRAPH-4DBF
|
||||
4E00..9FFC ; Ideographic # Lo [20989] CJK UNIFIED IDEOGRAPH-4E00..CJK UNIFIED IDEOGRAPH-9FFC
|
||||
F900..FA6D ; Ideographic # Lo [366] CJK COMPATIBILITY IDEOGRAPH-F900..CJK COMPATIBILITY IDEOGRAPH-FA6D
|
||||
FA70..FAD9 ; Ideographic # Lo [106] CJK COMPATIBILITY IDEOGRAPH-FA70..CJK COMPATIBILITY IDEOGRAPH-FAD9
|
||||
16FE4 ; Ideographic # Mn KHITAN SMALL SCRIPT FILLER
|
||||
17000..187F7 ; Ideographic # Lo [6136] TANGUT IDEOGRAPH-17000..TANGUT IDEOGRAPH-187F7
|
||||
18800..18AF2 ; Ideographic # Lo [755] TANGUT COMPONENT-001..TANGUT COMPONENT-755
|
||||
18800..18CD5 ; Ideographic # Lo [1238] TANGUT COMPONENT-001..KHITAN SMALL SCRIPT CHARACTER-18CD5
|
||||
18D00..18D08 ; Ideographic # Lo [9] TANGUT IDEOGRAPH-18D00..TANGUT IDEOGRAPH-18D08
|
||||
1B170..1B2FB ; Ideographic # Lo [396] NUSHU CHARACTER-1B170..NUSHU CHARACTER-1B2FB
|
||||
20000..2A6D6 ; Ideographic # Lo [42711] CJK UNIFIED IDEOGRAPH-20000..CJK UNIFIED IDEOGRAPH-2A6D6
|
||||
20000..2A6DD ; Ideographic # Lo [42718] CJK UNIFIED IDEOGRAPH-20000..CJK UNIFIED IDEOGRAPH-2A6DD
|
||||
2A700..2B734 ; Ideographic # Lo [4149] CJK UNIFIED IDEOGRAPH-2A700..CJK UNIFIED IDEOGRAPH-2B734
|
||||
2B740..2B81D ; Ideographic # Lo [222] CJK UNIFIED IDEOGRAPH-2B740..CJK UNIFIED IDEOGRAPH-2B81D
|
||||
2B820..2CEA1 ; Ideographic # Lo [5762] CJK UNIFIED IDEOGRAPH-2B820..CJK UNIFIED IDEOGRAPH-2CEA1
|
||||
2CEB0..2EBE0 ; Ideographic # Lo [7473] CJK UNIFIED IDEOGRAPH-2CEB0..CJK UNIFIED IDEOGRAPH-2EBE0
|
||||
2F800..2FA1D ; Ideographic # Lo [542] CJK COMPATIBILITY IDEOGRAPH-2F800..CJK COMPATIBILITY IDEOGRAPH-2FA1D
|
||||
30000..3134A ; Ideographic # Lo [4939] CJK UNIFIED IDEOGRAPH-30000..CJK UNIFIED IDEOGRAPH-3134A
|
||||
|
||||
# Total code points: 96190
|
||||
# Total code points: 101652
|
||||
|
||||
# ================================================
|
||||
|
||||
@ -882,6 +899,7 @@ FA70..FAD9 ; Ideographic # Lo [106] CJK COMPATIBILITY IDEOGRAPH-FA70..CJK COM
|
||||
0AFD..0AFF ; Diacritic # Mn [3] GUJARATI SIGN THREE-DOT NUKTA ABOVE..GUJARATI SIGN TWO-CIRCLE NUKTA ABOVE
|
||||
0B3C ; Diacritic # Mn ORIYA SIGN NUKTA
|
||||
0B4D ; Diacritic # Mn ORIYA SIGN VIRAMA
|
||||
0B55 ; Diacritic # Mn ORIYA SIGN OVERLINE
|
||||
0BCD ; Diacritic # Mn TAMIL SIGN VIRAMA
|
||||
0C4D ; Diacritic # Mn TELUGU SIGN VIRAMA
|
||||
0CBC ; Diacritic # Mn KANNADA SIGN NUKTA
|
||||
@ -978,6 +996,8 @@ AAC2 ; Diacritic # Lo TAI VIET TONE MAI SONG
|
||||
AAF6 ; Diacritic # Mn MEETEI MAYEK VIRAMA
|
||||
AB5B ; Diacritic # Sk MODIFIER BREVE WITH INVERTED BREVE
|
||||
AB5C..AB5F ; Diacritic # Lm [4] MODIFIER LETTER SMALL HENG..MODIFIER LETTER SMALL U WITH LEFT HOOK
|
||||
AB69 ; Diacritic # Lm MODIFIER LETTER SMALL TURNED W
|
||||
AB6A..AB6B ; Diacritic # Sk [2] MODIFIER LETTER LEFT TACK..MODIFIER LETTER RIGHT TACK
|
||||
ABEC ; Diacritic # Mc MEETEI MAYEK LUM IYEK
|
||||
ABED ; Diacritic # Mn MEETEI MAYEK APUN IYEK
|
||||
FB1E ; Diacritic # Mn HEBREW POINT JUDEO-SPANISH VARIKA
|
||||
@ -1013,6 +1033,9 @@ FFE3 ; Diacritic # Sk FULLWIDTH MACRON
|
||||
116B7 ; Diacritic # Mn TAKRI SIGN NUKTA
|
||||
1172B ; Diacritic # Mn AHOM SIGN KILLER
|
||||
11839..1183A ; Diacritic # Mn [2] DOGRA SIGN VIRAMA..DOGRA SIGN NUKTA
|
||||
1193D ; Diacritic # Mc DIVES AKURU SIGN HALANTA
|
||||
1193E ; Diacritic # Mn DIVES AKURU VIRAMA
|
||||
11943 ; Diacritic # Mn DIVES AKURU SIGN NUKTA
|
||||
119E0 ; Diacritic # Mn NANDINAGARI SIGN VIRAMA
|
||||
11A34 ; Diacritic # Mn ZANABAZAR SQUARE SIGN VIRAMA
|
||||
11A47 ; Diacritic # Mn ZANABAZAR SQUARE SUBJOINER
|
||||
@ -1025,6 +1048,7 @@ FFE3 ; Diacritic # Sk FULLWIDTH MACRON
|
||||
16B30..16B36 ; Diacritic # Mn [7] PAHAWH HMONG MARK CIM TUB..PAHAWH HMONG MARK CIM TAUM
|
||||
16F8F..16F92 ; Diacritic # Mn [4] MIAO TONE RIGHT..MIAO TONE BELOW
|
||||
16F93..16F9F ; Diacritic # Lm [13] MIAO LETTER TONE-2..MIAO LETTER REFORMED TONE-8
|
||||
16FF0..16FF1 ; Diacritic # Mc [2] VIETNAMESE ALTERNATE READING MARK CA..VIETNAMESE ALTERNATE READING MARK NHAY
|
||||
1D167..1D169 ; Diacritic # Mn [3] MUSICAL SYMBOL COMBINING TREMOLO-1..MUSICAL SYMBOL COMBINING TREMOLO-3
|
||||
1D16D..1D172 ; Diacritic # Mc [6] MUSICAL SYMBOL COMBINING AUGMENTATION DOT..MUSICAL SYMBOL COMBINING FLAG-5
|
||||
1D17B..1D182 ; Diacritic # Mn [8] MUSICAL SYMBOL COMBINING ACCENT..MUSICAL SYMBOL COMBINING LOURE
|
||||
@ -1036,7 +1060,7 @@ FFE3 ; Diacritic # Sk FULLWIDTH MACRON
|
||||
1E944..1E946 ; Diacritic # Mn [3] ADLAM ALIF LENGTHENER..ADLAM GEMINATION MARK
|
||||
1E948..1E94A ; Diacritic # Mn [3] ADLAM CONSONANT MODIFIER..ADLAM NUKTA
|
||||
|
||||
# Total code points: 873
|
||||
# Total code points: 882
|
||||
|
||||
# ================================================
|
||||
|
||||
@ -1044,6 +1068,7 @@ FFE3 ; Diacritic # Sk FULLWIDTH MACRON
|
||||
02D0..02D1 ; Extender # Lm [2] MODIFIER LETTER TRIANGULAR COLON..MODIFIER LETTER HALF TRIANGULAR COLON
|
||||
0640 ; Extender # Lm ARABIC TATWEEL
|
||||
07FA ; Extender # Lm NKO LAJANYALAN
|
||||
0B55 ; Extender # Mn ORIYA SIGN OVERLINE
|
||||
0E46 ; Extender # Lm THAI CHARACTER MAIYAMOK
|
||||
0EC6 ; Extender # Lm LAO KO LA
|
||||
180A ; Extender # Po MONGOLIAN NIRUGU
|
||||
@ -1072,7 +1097,7 @@ FF70 ; Extender # Lm HALFWIDTH KATAKANA-HIRAGANA PROLONGED SOUND
|
||||
1E13C..1E13D ; Extender # Lm [2] NYIAKENG PUACHUE HMONG SIGN XW XW..NYIAKENG PUACHUE HMONG SYLLABLE LENGTHENER
|
||||
1E944..1E946 ; Extender # Mn [3] ADLAM ALIF LENGTHENER..ADLAM GEMINATION MARK
|
||||
|
||||
# Total code points: 47
|
||||
# Total code points: 48
|
||||
|
||||
# ================================================
|
||||
|
||||
@ -1155,11 +1180,12 @@ FF9E..FF9F ; Other_Grapheme_Extend # Lm [2] HALFWIDTH KATAKANA VOICED SOUND
|
||||
114B0 ; Other_Grapheme_Extend # Mc TIRHUTA VOWEL SIGN AA
|
||||
114BD ; Other_Grapheme_Extend # Mc TIRHUTA VOWEL SIGN SHORT O
|
||||
115AF ; Other_Grapheme_Extend # Mc SIDDHAM VOWEL SIGN AA
|
||||
11930 ; Other_Grapheme_Extend # Mc DIVES AKURU VOWEL SIGN AA
|
||||
1D165 ; Other_Grapheme_Extend # Mc MUSICAL SYMBOL COMBINING STEM
|
||||
1D16E..1D172 ; Other_Grapheme_Extend # Mc [5] MUSICAL SYMBOL COMBINING FLAG-1..MUSICAL SYMBOL COMBINING FLAG-5
|
||||
E0020..E007F ; Other_Grapheme_Extend # Cf [96] TAG SPACE..CANCEL TAG
|
||||
|
||||
# Total code points: 126
|
||||
# Total code points: 127
|
||||
|
||||
# ================================================
|
||||
|
||||
@ -1184,8 +1210,8 @@ E0020..E007F ; Other_Grapheme_Extend # Cf [96] TAG SPACE..CANCEL TAG
|
||||
|
||||
# ================================================
|
||||
|
||||
3400..4DB5 ; Unified_Ideograph # Lo [6582] CJK UNIFIED IDEOGRAPH-3400..CJK UNIFIED IDEOGRAPH-4DB5
|
||||
4E00..9FEF ; Unified_Ideograph # Lo [20976] CJK UNIFIED IDEOGRAPH-4E00..CJK UNIFIED IDEOGRAPH-9FEF
|
||||
3400..4DBF ; Unified_Ideograph # Lo [6592] CJK UNIFIED IDEOGRAPH-3400..CJK UNIFIED IDEOGRAPH-4DBF
|
||||
4E00..9FFC ; Unified_Ideograph # Lo [20989] CJK UNIFIED IDEOGRAPH-4E00..CJK UNIFIED IDEOGRAPH-9FFC
|
||||
FA0E..FA0F ; Unified_Ideograph # Lo [2] CJK COMPATIBILITY IDEOGRAPH-FA0E..CJK COMPATIBILITY IDEOGRAPH-FA0F
|
||||
FA11 ; Unified_Ideograph # Lo CJK COMPATIBILITY IDEOGRAPH-FA11
|
||||
FA13..FA14 ; Unified_Ideograph # Lo [2] CJK COMPATIBILITY IDEOGRAPH-FA13..CJK COMPATIBILITY IDEOGRAPH-FA14
|
||||
@ -1193,13 +1219,14 @@ FA1F ; Unified_Ideograph # Lo CJK COMPATIBILITY IDEOGRAPH-FA1F
|
||||
FA21 ; Unified_Ideograph # Lo CJK COMPATIBILITY IDEOGRAPH-FA21
|
||||
FA23..FA24 ; Unified_Ideograph # Lo [2] CJK COMPATIBILITY IDEOGRAPH-FA23..CJK COMPATIBILITY IDEOGRAPH-FA24
|
||||
FA27..FA29 ; Unified_Ideograph # Lo [3] CJK COMPATIBILITY IDEOGRAPH-FA27..CJK COMPATIBILITY IDEOGRAPH-FA29
|
||||
20000..2A6D6 ; Unified_Ideograph # Lo [42711] CJK UNIFIED IDEOGRAPH-20000..CJK UNIFIED IDEOGRAPH-2A6D6
|
||||
20000..2A6DD ; Unified_Ideograph # Lo [42718] CJK UNIFIED IDEOGRAPH-20000..CJK UNIFIED IDEOGRAPH-2A6DD
|
||||
2A700..2B734 ; Unified_Ideograph # Lo [4149] CJK UNIFIED IDEOGRAPH-2A700..CJK UNIFIED IDEOGRAPH-2B734
|
||||
2B740..2B81D ; Unified_Ideograph # Lo [222] CJK UNIFIED IDEOGRAPH-2B740..CJK UNIFIED IDEOGRAPH-2B81D
|
||||
2B820..2CEA1 ; Unified_Ideograph # Lo [5762] CJK UNIFIED IDEOGRAPH-2B820..CJK UNIFIED IDEOGRAPH-2CEA1
|
||||
2CEB0..2EBE0 ; Unified_Ideograph # Lo [7473] CJK UNIFIED IDEOGRAPH-2CEB0..CJK UNIFIED IDEOGRAPH-2EBE0
|
||||
30000..3134A ; Unified_Ideograph # Lo [4939] CJK UNIFIED IDEOGRAPH-30000..CJK UNIFIED IDEOGRAPH-3134A
|
||||
|
||||
# Total code points: 87887
|
||||
# Total code points: 92856
|
||||
|
||||
# ================================================
|
||||
|
||||
@ -1362,6 +1389,8 @@ FF61 ; Sentence_Terminal # Po HALFWIDTH IDEOGRAPHIC FULL STOP
|
||||
115C9..115D7 ; Sentence_Terminal # Po [15] SIDDHAM END OF TEXT MARK..SIDDHAM SECTION MARK WITH CIRCLES AND FOUR ENCLOSURES
|
||||
11641..11642 ; Sentence_Terminal # Po [2] MODI DANDA..MODI DOUBLE DANDA
|
||||
1173C..1173E ; Sentence_Terminal # Po [3] AHOM SIGN SMALL SECTION..AHOM SIGN RULAI
|
||||
11944 ; Sentence_Terminal # Po DIVES AKURU DOUBLE DANDA
|
||||
11946 ; Sentence_Terminal # Po DIVES AKURU END OF TEXT MARK
|
||||
11A42..11A43 ; Sentence_Terminal # Po [2] ZANABAZAR SQUARE MARK SHAD..ZANABAZAR SQUARE MARK DOUBLE SHAD
|
||||
11A9B..11A9C ; Sentence_Terminal # Po [2] SOYOMBO MARK SHAD..SOYOMBO MARK DOUBLE SHAD
|
||||
11C41..11C42 ; Sentence_Terminal # Po [2] BHAIKSUKI DANDA..BHAIKSUKI DOUBLE DANDA
|
||||
@ -1374,7 +1403,7 @@ FF61 ; Sentence_Terminal # Po HALFWIDTH IDEOGRAPHIC FULL STOP
|
||||
1BC9F ; Sentence_Terminal # Po DUPLOYAN PUNCTUATION CHINOOK FULL STOP
|
||||
1DA88 ; Sentence_Terminal # Po SIGNWRITING FULL STOP
|
||||
|
||||
# Total code points: 141
|
||||
# Total code points: 143
|
||||
|
||||
# ================================================
|
||||
|
||||
@ -1574,8 +1603,8 @@ E0100..E01EF ; Variation_Selector # Mn [240] VARIATION SELECTOR-17..VARIATION S
|
||||
2B4D..2B73 ; Pattern_Syntax # So [39] DOWNWARDS TRIANGLE-HEADED ZIGZAG ARROW..DOWNWARDS TRIANGLE-HEADED ARROW TO BAR
|
||||
2B74..2B75 ; Pattern_Syntax # Cn [2] <reserved-2B74>..<reserved-2B75>
|
||||
2B76..2B95 ; Pattern_Syntax # So [32] NORTH WEST TRIANGLE-HEADED ARROW TO BAR..RIGHTWARDS BLACK ARROW
|
||||
2B96..2B97 ; Pattern_Syntax # Cn [2] <reserved-2B96>..<reserved-2B97>
|
||||
2B98..2BFF ; Pattern_Syntax # So [104] THREE-D TOP-LIGHTED LEFTWARDS EQUILATERAL ARROWHEAD..HELLSCHREIBER PAUSE SYMBOL
|
||||
2B96 ; Pattern_Syntax # Cn <reserved-2B96>
|
||||
2B97..2BFF ; Pattern_Syntax # So [105] SYMBOL FOR TYPE A ELECTRONICS..HELLSCHREIBER PAUSE SYMBOL
|
||||
2E00..2E01 ; Pattern_Syntax # Po [2] RIGHT ANGLE SUBSTITUTION MARKER..RIGHT ANGLE DOTTED SUBSTITUTION MARKER
|
||||
2E02 ; Pattern_Syntax # Pi LEFT SUBSTITUTION BRACKET
|
||||
2E03 ; Pattern_Syntax # Pf RIGHT SUBSTITUTION BRACKET
|
||||
@ -1614,7 +1643,9 @@ E0100..E01EF ; Variation_Selector # Mn [240] VARIATION SELECTOR-17..VARIATION S
|
||||
2E41 ; Pattern_Syntax # Po REVERSED COMMA
|
||||
2E42 ; Pattern_Syntax # Ps DOUBLE LOW-REVERSED-9 QUOTATION MARK
|
||||
2E43..2E4F ; Pattern_Syntax # Po [13] DASH WITH LEFT UPTURN..CORNISH VERSE DIVIDER
|
||||
2E50..2E7F ; Pattern_Syntax # Cn [48] <reserved-2E50>..<reserved-2E7F>
|
||||
2E50..2E51 ; Pattern_Syntax # So [2] CROSS PATTY WITH RIGHT CROSSBAR..CROSS PATTY WITH LEFT CROSSBAR
|
||||
2E52 ; Pattern_Syntax # Po TIRONIAN SIGN CAPITAL ET
|
||||
2E53..2E7F ; Pattern_Syntax # Cn [45] <reserved-2E53>..<reserved-2E7F>
|
||||
3001..3003 ; Pattern_Syntax # Po [3] IDEOGRAPHIC COMMA..DITTO MARK
|
||||
3008 ; Pattern_Syntax # Ps LEFT ANGLE BRACKET
|
||||
3009 ; Pattern_Syntax # Pe RIGHT ANGLE BRACKET
|
||||
|
File diff suppressed because it is too large
Load Diff
Loading…
Reference in New Issue
Block a user