summaryrefslogtreecommitdiffstats
path: root/util/unicode/data/LineBreak.txt
diff options
context:
space:
mode:
Diffstat (limited to 'util/unicode/data/LineBreak.txt')
-rw-r--r--util/unicode/data/LineBreak.txt285
1 files changed, 198 insertions, 87 deletions
diff --git a/util/unicode/data/LineBreak.txt b/util/unicode/data/LineBreak.txt
index d80210bde3..9728582ab1 100644
--- a/util/unicode/data/LineBreak.txt
+++ b/util/unicode/data/LineBreak.txt
@@ -1,6 +1,6 @@
-# LineBreak-10.0.0.txt
-# Date: 2017-03-08, 02:00:00 GMT [KW, LI]
-# © 2017 Unicode®, Inc.
+# LineBreak-12.1.0.txt
+# Date: 2019-03-31, 22:04:15 GMT [KW, LI]
+# © 2019 Unicode®, Inc.
# Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries.
# For terms of use, see http://www.unicode.org/terms_of_use.html
#
@@ -124,7 +124,7 @@
00D7;AI # Sm MULTIPLICATION SIGN
00D8..00F6;AL # L& [31] LATIN CAPITAL LETTER O WITH STROKE..LATIN SMALL LETTER O WITH DIAERESIS
00F7;AI # Sm DIVISION SIGN
-00F8..00FF;AL # L& [8] LATIN SMALL LETTER O WITH STROKE..LATIN SMALL LETTER Y WITH DIAERESIS
+00F8..00FF;AL # Ll [8] LATIN SMALL LETTER O WITH STROKE..LATIN SMALL LETTER Y WITH DIAERESIS
0100..017F;AL # L& [128] LATIN CAPITAL LETTER A WITH MACRON..LATIN SMALL LETTER LONG S
0180..01BA;AL # L& [59] LATIN SMALL LETTER B WITH STROKE..LATIN SMALL LETTER EZH WITH TAIL
01BB;AL # Lo LATIN LETTER TWO WITH STROKE
@@ -188,7 +188,7 @@
0531..0556;AL # Lu [38] ARMENIAN CAPITAL LETTER AYB..ARMENIAN CAPITAL LETTER FEH
0559;AL # Lm ARMENIAN MODIFIER LETTER LEFT HALF RING
055A..055F;AL # Po [6] ARMENIAN APOSTROPHE..ARMENIAN ABBREVIATION MARK
-0561..0587;AL # Ll [39] ARMENIAN SMALL LETTER AYB..ARMENIAN SMALL LIGATURE ECH YIWN
+0560..0588;AL # Ll [41] ARMENIAN SMALL LETTER TURNED AYB..ARMENIAN SMALL LETTER YI WITH STROKE
0589;IS # Po ARMENIAN FULL STOP
058A;BA # Pd ARMENIAN HYPHEN
058D..058E;AL # So [2] RIGHT-FACING ARMENIAN ETERNITY SIGN..LEFT-FACING ARMENIAN ETERNITY SIGN
@@ -203,7 +203,7 @@
05C6;EX # Po HEBREW PUNCTUATION NUN HAFUKHA
05C7;CM # Mn HEBREW POINT QAMATS QATAN
05D0..05EA;HL # Lo [27] HEBREW LETTER ALEF..HEBREW LETTER TAV
-05F0..05F2;HL # Lo [3] HEBREW LIGATURE YIDDISH DOUBLE VAV..HEBREW LIGATURE YIDDISH DOUBLE YOD
+05EF..05F2;HL # Lo [4] HEBREW YOD TRIANGLE..HEBREW LIGATURE YIDDISH DOUBLE YOD
05F3..05F4;AL # Po [2] HEBREW PUNCTUATION GERESH..HEBREW PUNCTUATION GERSHAYIM
0600..0605;AL # Cf [6] ARABIC NUMBER SIGN..ARABIC NUMBER MARK ABOVE
0606..0608;AL # Sm [3] ARABIC-INDIC CUBE ROOT..ARABIC RAY
@@ -261,6 +261,8 @@
07F8;IS # Po NKO COMMA
07F9;EX # Po NKO EXCLAMATION MARK
07FA;AL # Lm NKO LAJANYALAN
+07FD;CM # Mn NKO DANTAYALAN
+07FE..07FF;PR # Sc [2] NKO DOROME SIGN..NKO TAMAN SIGN
0800..0815;AL # Lo [22] SAMARITAN LETTER ALAF..SAMARITAN LETTER TAAF
0816..0819;CM # Mn [4] SAMARITAN MARK IN..SAMARITAN MARK DAGESH
081A;AL # Lm SAMARITAN MODIFIER LETTER EPENTHETIC YUT
@@ -276,7 +278,7 @@
0860..086A;AL # Lo [11] SYRIAC LETTER MALAYALAM NGA..SYRIAC LETTER MALAYALAM SSA
08A0..08B4;AL # Lo [21] ARABIC LETTER BEH WITH SMALL V BELOW..ARABIC LETTER KAF WITH DOT BELOW
08B6..08BD;AL # Lo [8] ARABIC LETTER BEH WITH SMALL MEEM ABOVE..ARABIC LETTER AFRICAN NOON
-08D4..08E1;CM # Mn [14] ARABIC SMALL HIGH WORD AR-RUB..ARABIC SMALL HIGH SIGN SAFHA
+08D3..08E1;CM # Mn [15] ARABIC SMALL LOW WAW..ARABIC SMALL HIGH SIGN SAFHA
08E2;AL # Cf ARABIC DISPUTED END OF AYAH
08E3..08FF;CM # Mn [29] ARABIC TURNED DAMMA BELOW..ARABIC MARK SIDEWAYS NOON GHUNNA
0900..0902;CM # Mn [3] DEVANAGARI SIGN INVERTED CANDRABINDU..DEVANAGARI SIGN ANUSVARA
@@ -330,6 +332,7 @@
09FB;PR # Sc BENGALI GANDA MARK
09FC;AL # Lo BENGALI LETTER VEDIC ANUSVARA
09FD;AL # Po BENGALI ABBREVIATION SIGN
+09FE;CM # Mn BENGALI SANDHI MARK
0A01..0A02;CM # Mn [2] GURMUKHI SIGN ADAK BINDI..GURMUKHI SIGN BINDI
0A03;CM # Mc GURMUKHI SIGN VISARGA
0A05..0A0A;AL # Lo [6] GURMUKHI LETTER A..GURMUKHI LETTER UU
@@ -351,6 +354,7 @@
0A70..0A71;CM # Mn [2] GURMUKHI TIPPI..GURMUKHI ADDAK
0A72..0A74;AL # Lo [3] GURMUKHI IRI..GURMUKHI EK ONKAR
0A75;CM # Mn GURMUKHI SIGN YAKASH
+0A76;AL # Po GURMUKHI ABBREVIATION SIGN
0A81..0A82;CM # Mn [2] GUJARATI SIGN CANDRABINDU..GUJARATI SIGN ANUSVARA
0A83;CM # Mc GUJARATI SIGN VISARGA
0A85..0A8D;AL # Lo [9] GUJARATI LETTER A..GUJARATI VOWEL CANDRA E
@@ -427,6 +431,7 @@
0BFA;AL # So TAMIL NUMBER SIGN
0C00;CM # Mn TELUGU SIGN COMBINING CANDRABINDU ABOVE
0C01..0C03;CM # Mc [3] TELUGU SIGN CANDRABINDU..TELUGU SIGN VISARGA
+0C04;CM # Mn TELUGU SIGN COMBINING ANUSVARA ABOVE
0C05..0C0C;AL # Lo [8] TELUGU LETTER A..TELUGU LETTER VOCALIC L
0C0E..0C10;AL # Lo [3] TELUGU LETTER E..TELUGU LETTER AI
0C12..0C28;AL # Lo [23] TELUGU LETTER O..TELUGU LETTER NA
@@ -441,11 +446,13 @@
0C60..0C61;AL # Lo [2] TELUGU LETTER VOCALIC RR..TELUGU LETTER VOCALIC LL
0C62..0C63;CM # Mn [2] TELUGU VOWEL SIGN VOCALIC L..TELUGU VOWEL SIGN VOCALIC LL
0C66..0C6F;NU # Nd [10] TELUGU DIGIT ZERO..TELUGU DIGIT NINE
+0C77;BB # Po TELUGU SIGN SIDDHAM
0C78..0C7E;AL # No [7] TELUGU FRACTION DIGIT ZERO FOR ODD POWERS OF FOUR..TELUGU FRACTION DIGIT THREE FOR EVEN POWERS OF FOUR
0C7F;AL # So TELUGU SIGN TUUMU
0C80;AL # Lo KANNADA SIGN SPACING CANDRABINDU
0C81;CM # Mn KANNADA SIGN CANDRABINDU
0C82..0C83;CM # Mc [2] KANNADA SIGN ANUSVARA..KANNADA SIGN VISARGA
+0C84;BB # Po KANNADA SIGN SIDDHAM
0C85..0C8C;AL # Lo [8] KANNADA LETTER A..KANNADA LETTER VOCALIC L
0C8E..0C90;AL # Lo [3] KANNADA LETTER E..KANNADA LETTER AI
0C92..0CA8;AL # Lo [23] KANNADA LETTER O..KANNADA LETTER NA
@@ -516,20 +523,13 @@
0E5A..0E5B;BA # Po [2] THAI CHARACTER ANGKHANKHU..THAI CHARACTER KHOMUT
0E81..0E82;SA # Lo [2] LAO LETTER KO..LAO LETTER KHO SUNG
0E84;SA # Lo LAO LETTER KHO TAM
-0E87..0E88;SA # Lo [2] LAO LETTER NGO..LAO LETTER CO
-0E8A;SA # Lo LAO LETTER SO TAM
-0E8D;SA # Lo LAO LETTER NYO
-0E94..0E97;SA # Lo [4] LAO LETTER DO..LAO LETTER THO TAM
-0E99..0E9F;SA # Lo [7] LAO LETTER NO..LAO LETTER FO SUNG
-0EA1..0EA3;SA # Lo [3] LAO LETTER MO..LAO LETTER LO LING
+0E86..0E8A;SA # Lo [5] LAO LETTER PALI GHA..LAO LETTER SO TAM
+0E8C..0EA3;SA # Lo [24] LAO LETTER PALI JHA..LAO LETTER LO LING
0EA5;SA # Lo LAO LETTER LO LOOT
-0EA7;SA # Lo LAO LETTER WO
-0EAA..0EAB;SA # Lo [2] LAO LETTER SO SUNG..LAO LETTER HO SUNG
-0EAD..0EB0;SA # Lo [4] LAO LETTER O..LAO VOWEL SIGN A
+0EA7..0EB0;SA # Lo [10] LAO LETTER WO..LAO VOWEL SIGN A
0EB1;SA # Mn LAO VOWEL SIGN MAI KAN
0EB2..0EB3;SA # Lo [2] LAO VOWEL SIGN AA..LAO VOWEL SIGN AM
-0EB4..0EB9;SA # Mn [6] LAO VOWEL SIGN I..LAO VOWEL SIGN UU
-0EBB..0EBC;SA # Mn [2] LAO VOWEL SIGN MAI KON..LAO SEMIVOWEL SIGN LO
+0EB4..0EBC;SA # Mn [9] LAO VOWEL SIGN I..LAO SEMIVOWEL SIGN LO
0EBD;SA # Lo LAO SEMIVOWEL SIGN NYO
0EC0..0EC4;SA # Lo [5] LAO VOWEL SIGN E..LAO VOWEL SIGN AI
0EC6;SA # Lm LAO KO LA
@@ -625,10 +625,10 @@
10A0..10C5;AL # Lu [38] GEORGIAN CAPITAL LETTER AN..GEORGIAN CAPITAL LETTER HOE
10C7;AL # Lu GEORGIAN CAPITAL LETTER YN
10CD;AL # Lu GEORGIAN CAPITAL LETTER AEN
-10D0..10FA;AL # Lo [43] GEORGIAN LETTER AN..GEORGIAN LETTER AIN
+10D0..10FA;AL # Ll [43] GEORGIAN LETTER AN..GEORGIAN LETTER AIN
10FB;AL # Po GEORGIAN PARAGRAPH SEPARATOR
10FC;AL # Lm MODIFIER LETTER GEORGIAN NAR
-10FD..10FF;AL # Lo [3] GEORGIAN LETTER AEN..GEORGIAN LETTER LABIAL SIGN
+10FD..10FF;AL # Ll [3] GEORGIAN LETTER AEN..GEORGIAN LETTER LABIAL SIGN
1100..115F;JL # Lo [96] HANGUL CHOSEONG KIYEOK..HANGUL CHOSEONG FILLER
1160..11A7;JV # Lo [72] HANGUL JUNGSEONG FILLER..HANGUL JUNGSEONG O-YAE
11A8..11FF;JT # Lo [88] HANGUL JONGSEONG KIYEOK..HANGUL JONGSEONG SSANGNIEUN
@@ -659,7 +659,8 @@
13F8..13FD;AL # Ll [6] CHEROKEE SMALL LETTER YE..CHEROKEE SMALL LETTER MV
1400;BA # Pd CANADIAN SYLLABICS HYPHEN
1401..166C;AL # Lo [620] CANADIAN SYLLABICS E..CANADIAN SYLLABICS CARRIER TTSA
-166D..166E;AL # Po [2] CANADIAN SYLLABICS CHI SIGN..CANADIAN SYLLABICS FULL STOP
+166D;AL # So CANADIAN SYLLABICS CHI SIGN
+166E;AL # Po CANADIAN SYLLABICS FULL STOP
166F..167F;AL # Lo [17] CANADIAN SYLLABICS QAI..CANADIAN SYLLABICS BLACKFOOT W
1680;BA # Zs OGHAM SPACE MARK
1681..169A;AL # Lo [26] OGHAM LETTER BEITH..OGHAM LETTER PEITH
@@ -711,7 +712,7 @@
1810..1819;NU # Nd [10] MONGOLIAN DIGIT ZERO..MONGOLIAN DIGIT NINE
1820..1842;AL # Lo [35] MONGOLIAN LETTER A..MONGOLIAN LETTER CHI
1843;AL # Lm MONGOLIAN LETTER TODO LONG VOWEL SIGN
-1844..1877;AL # Lo [52] MONGOLIAN LETTER TODO E..MONGOLIAN LETTER MANCHU ZHA
+1844..1878;AL # Lo [53] MONGOLIAN LETTER TODO E..MONGOLIAN LETTER CHA WITH TWO DOTS
1880..1884;AL # Lo [5] MONGOLIAN LETTER ALI GALI ANUSVARA ONE..MONGOLIAN LETTER ALI GALI INVERTED UBADAMA
1885..1886;CM # Mn [2] MONGOLIAN LETTER ALI GALI BALUDA..MONGOLIAN LETTER ALI GALI THREE BALUDA
1887..18A8;AL # Lo [34] MONGOLIAN LETTER ALI GALI A..MONGOLIAN LETTER MANCHU ALI GALI BHA
@@ -817,6 +818,8 @@
1C78..1C7D;AL # Lm [6] OL CHIKI MU TTUDDAG..OL CHIKI AHAD
1C7E..1C7F;BA # Po [2] OL CHIKI PUNCTUATION MUCAAD..OL CHIKI PUNCTUATION DOUBLE MUCAAD
1C80..1C88;AL # Ll [9] CYRILLIC SMALL LETTER ROUNDED VE..CYRILLIC SMALL LETTER UNBLENDED UK
+1C90..1CBA;AL # Lu [43] GEORGIAN MTAVRULI CAPITAL LETTER AN..GEORGIAN MTAVRULI CAPITAL LETTER AIN
+1CBD..1CBF;AL # Lu [3] GEORGIAN MTAVRULI CAPITAL LETTER AEN..GEORGIAN MTAVRULI CAPITAL LETTER LABIAL SIGN
1CC0..1CC7;AL # Po [8] SUNDANESE PUNCTUATION BINDU SURYA..SUNDANESE PUNCTUATION BINDU BA SATANGA
1CD0..1CD2;CM # Mn [3] VEDIC TONE KARSHANA..VEDIC TONE PRENKHA
1CD3;AL # Po VEDIC SIGN NIHSHVASA
@@ -825,12 +828,12 @@
1CE2..1CE8;CM # Mn [7] VEDIC SIGN VISARGA SVARITA..VEDIC SIGN VISARGA ANUDATTA WITH TAIL
1CE9..1CEC;AL # Lo [4] VEDIC SIGN ANUSVARA ANTARGOMUKHA..VEDIC SIGN ANUSVARA VAMAGOMUKHA WITH TAIL
1CED;CM # Mn VEDIC SIGN TIRYAK
-1CEE..1CF1;AL # Lo [4] VEDIC SIGN HEXIFORM LONG ANUSVARA..VEDIC SIGN ANUSVARA UBHAYATO MUKHA
-1CF2..1CF3;CM # Mc [2] VEDIC SIGN ARDHAVISARGA..VEDIC SIGN ROTATED ARDHAVISARGA
+1CEE..1CF3;AL # Lo [6] VEDIC SIGN HEXIFORM LONG ANUSVARA..VEDIC SIGN ROTATED ARDHAVISARGA
1CF4;CM # Mn VEDIC TONE CANDRA ABOVE
1CF5..1CF6;AL # Lo [2] VEDIC SIGN JIHVAMULIYA..VEDIC SIGN UPADHMANIYA
1CF7;CM # Mc VEDIC SIGN ATIKRAMA
1CF8..1CF9;CM # Mn [2] VEDIC TONE RING ABOVE..VEDIC TONE DOUBLE RING ABOVE
+1CFA;AL # Lo VEDIC SIGN DOUBLE ANUSVARA ANTARGOMUKHA
1D00..1D2B;AL # Ll [44] LATIN LETTER SMALL CAPITAL A..CYRILLIC LETTER SMALL CAPITAL EL
1D2C..1D6A;AL # Lm [63] MODIFIER LETTER CAPITAL A..GREEK SUBSCRIPT SMALL LETTER CHI
1D6B..1D77;AL # Ll [13] LATIN SMALL LETTER UE..LATIN SMALL LETTER TURNED G
@@ -1300,10 +1303,7 @@
2B55..2B59;AI # So [5] HEAVY LARGE CIRCLE..HEAVY CIRCLED SALTIRE
2B5A..2B73;AL # So [26] SLANTED NORTH ARROW WITH HOOKED HEAD..DOWNWARDS TRIANGLE-HEADED ARROW TO BAR
2B76..2B95;AL # So [32] NORTH WEST TRIANGLE-HEADED ARROW TO BAR..RIGHTWARDS BLACK ARROW
-2B98..2BB9;AL # So [34] THREE-D TOP-LIGHTED LEFTWARDS EQUILATERAL ARROWHEAD..UP ARROWHEAD IN A RECTANGLE BOX
-2BBD..2BC8;AL # So [12] BALLOT BOX WITH LIGHT X..BLACK MEDIUM RIGHT-POINTING TRIANGLE CENTRED
-2BCA..2BD2;AL # So [9] TOP HALF BLACK CIRCLE..GROUP MARK
-2BEC..2BEF;AL # So [4] LEFTWARDS TWO-HEADED ARROW WITH TRIANGLE ARROWHEADS..DOWNWARDS TWO-HEADED ARROW WITH TRIANGLE ARROWHEADS
+2B98..2BFF;AL # So [104] THREE-D TOP-LIGHTED LEFTWARDS EQUILATERAL ARROWHEAD..HELLSCHREIBER PAUSE SYMBOL
2C00..2C2E;AL # Lu [47] GLAGOLITIC CAPITAL LETTER AZU..GLAGOLITIC CAPITAL LETTER LATINATE MYSLITE
2C30..2C5E;AL # Ll [47] GLAGOLITIC SMALL LETTER AZU..GLAGOLITIC SMALL LETTER LATINATE MYSLITE
2C60..2C7B;AL # L& [28] LATIN CAPITAL LETTER L WITH DOUBLE BAR..LATIN LETTER SMALL CAPITAL TURNED E
@@ -1380,7 +1380,11 @@
2E40;BA # Pd DOUBLE HYPHEN
2E41;BA # Po REVERSED COMMA
2E42;OP # Ps DOUBLE LOW-REVERSED-9 QUOTATION MARK
-2E43..2E49;BA # Po [7] DASH WITH LEFT UPTURN..DOUBLE STACKED COMMA
+2E43..2E4A;BA # Po [8] DASH WITH LEFT UPTURN..DOTTED SOLIDUS
+2E4B;AL # Po TRIPLE DAGGER
+2E4C;BA # Po MEDIEVAL COMMA
+2E4D;AL # Po PARAGRAPHUS MARK
+2E4E..2E4F;BA # Po [2] PUNCTUS ELEVATUS MARK..CORNISH VERSE DIVIDER
2E80..2E99;ID # So [26] CJK RADICAL REPEAT..CJK RADICAL RAP
2E9B..2EF3;ID # So [89] CJK RADICAL CHOKE..CJK RADICAL C-SIMPLIFIED TURTLE
2F00..2FD5;ID # So [214] KANGXI RADICAL ONE..KANGXI RADICAL FLUTE
@@ -1479,7 +1483,7 @@
30FC;CJ # Lm KATAKANA-HIRAGANA PROLONGED SOUND MARK
30FD..30FE;NS # Lm [2] KATAKANA ITERATION MARK..KATAKANA VOICED ITERATION MARK
30FF;ID # Lo KATAKANA DIGRAPH KOTO
-3105..312E;ID # Lo [42] BOPOMOFO LETTER B..BOPOMOFO LETTER O WITH DOT ABOVE
+3105..312F;ID # Lo [43] BOPOMOFO LETTER B..BOPOMOFO LETTER NN
3131..318E;ID # Lo [94] HANGUL LETTER KIYEOK..HANGUL LETTER ARAEAE
3190..3191;ID # So [2] IDEOGRAPHIC ANNOTATION LINKING MARK..IDEOGRAPHIC ANNOTATION REVERSE MARK
3192..3195;ID # No [4] IDEOGRAPHIC ANNOTATION ONE MARK..IDEOGRAPHIC ANNOTATION FOUR MARK
@@ -1497,13 +1501,13 @@
3280..3289;ID # No [10] CIRCLED IDEOGRAPH ONE..CIRCLED IDEOGRAPH TEN
328A..32B0;ID # So [39] CIRCLED IDEOGRAPH MOON..CIRCLED IDEOGRAPH NIGHT
32B1..32BF;ID # No [15] CIRCLED NUMBER THIRTY SIX..CIRCLED NUMBER FIFTY
-32C0..32FE;ID # So [63] IDEOGRAPHIC TELEGRAPH SYMBOL FOR JANUARY..CIRCLED KATAKANA WO
+32C0..32FF;ID # So [64] IDEOGRAPHIC TELEGRAPH SYMBOL FOR JANUARY..SQUARE ERA NAME REIWA
3300..33FF;ID # So [256] SQUARE APAATO..SQUARE GAL
3400..4DB5;ID # Lo [6582] CJK UNIFIED IDEOGRAPH-3400..CJK UNIFIED IDEOGRAPH-4DB5
4DB6..4DBF;ID # Cn [10] <reserved-4DB6>..<reserved-4DBF>
4DC0..4DFF;AL # So [64] HEXAGRAM FOR THE CREATIVE HEAVEN..HEXAGRAM FOR BEFORE COMPLETION
-4E00..9FEA;ID # Lo [20971] CJK UNIFIED IDEOGRAPH-4E00..CJK UNIFIED IDEOGRAPH-9FEA
-9FEB..9FFF;ID # Cn [21] <reserved-9FEB>..<reserved-9FFF>
+4E00..9FEF;ID # Lo [20976] CJK UNIFIED IDEOGRAPH-4E00..CJK UNIFIED IDEOGRAPH-9FEF
+9FF0..9FFF;ID # Cn [16] <reserved-9FF0>..<reserved-9FFF>
A000..A014;ID # Lo [21] YI SYLLABLE IT..YI SYLLABLE E
A015;NS # Lm YI SYLLABLE WU
A016..A48C;ID # Lo [1143] YI SYLLABLE BIT..YI SYLLABLE YYR
@@ -1545,8 +1549,8 @@ A788;AL # Lm MODIFIER LETTER LOW CIRCUMFLEX ACCENT
A789..A78A;AL # Sk [2] MODIFIER LETTER COLON..MODIFIER LETTER SHORT EQUALS SIGN
A78B..A78E;AL # L& [4] LATIN CAPITAL LETTER SALTILLO..LATIN SMALL LETTER L WITH RETROFLEX HOOK AND BELT
A78F;AL # Lo LATIN LETTER SINOLOGICAL DOT
-A790..A7AE;AL # L& [31] LATIN CAPITAL LETTER N WITH DESCENDER..LATIN CAPITAL LETTER SMALL CAPITAL I
-A7B0..A7B7;AL # L& [8] LATIN CAPITAL LETTER TURNED K..LATIN SMALL LETTER OMEGA
+A790..A7BF;AL # L& [48] LATIN CAPITAL LETTER N WITH DESCENDER..LATIN SMALL LETTER GLOTTAL U
+A7C2..A7C6;AL # L& [5] LATIN CAPITAL LETTER ANGLICANA W..LATIN CAPITAL LETTER Z WITH PALATAL HOOK
A7F7;AL # Lo LATIN EPIGRAPHIC LETTER SIDEWAYS I
A7F8..A7F9;AL # Lm [2] MODIFIER LETTER CAPITAL H WITH STROKE..MODIFIER LETTER SMALL LIGATURE OE
A7FA;AL # Ll LATIN LETTER SMALL CAPITAL TURNED M
@@ -1580,7 +1584,8 @@ A8F2..A8F7;AL # Lo [6] DEVANAGARI SIGN SPACING CANDRABINDU..DEVANAGARI S
A8F8..A8FA;AL # Po [3] DEVANAGARI SIGN PUSHPIKA..DEVANAGARI CARET
A8FB;AL # Lo DEVANAGARI HEADSTROKE
A8FC;BB # Po DEVANAGARI SIGN SIDDHAM
-A8FD;AL # Lo DEVANAGARI JAIN OM
+A8FD..A8FE;AL # Lo [2] DEVANAGARI JAIN OM..DEVANAGARI LETTER AY
+A8FF;CM # Mn DEVANAGARI VOWEL SIGN AY
A900..A909;NU # Nd [10] KAYAH LI DIGIT ZERO..KAYAH LI DIGIT NINE
A90A..A925;AL # Lo [28] KAYAH LI LETTER KA..KAYAH LI LETTER OO
A926..A92D;CM # Mn [8] KAYAH LI VOWEL UE..KAYAH LI TONE CALYA PLOPHU
@@ -1597,8 +1602,8 @@ A9B3;CM # Mn JAVANESE SIGN CECAK TELU
A9B4..A9B5;CM # Mc [2] JAVANESE VOWEL SIGN TARUNG..JAVANESE VOWEL SIGN TOLONG
A9B6..A9B9;CM # Mn [4] JAVANESE VOWEL SIGN WULU..JAVANESE VOWEL SIGN SUKU MENDUT
A9BA..A9BB;CM # Mc [2] JAVANESE VOWEL SIGN TALING..JAVANESE VOWEL SIGN DIRGA MURE
-A9BC;CM # Mn JAVANESE VOWEL SIGN PEPET
-A9BD..A9C0;CM # Mc [4] JAVANESE CONSONANT SIGN KERET..JAVANESE PANGKON
+A9BC..A9BD;CM # Mn [2] JAVANESE VOWEL SIGN PEPET..JAVANESE CONSONANT SIGN KERET
+A9BE..A9C0;CM # Mc [3] JAVANESE CONSONANT SIGN PENGKAL..JAVANESE PANGKON
A9C1..A9C6;AL # Po [6] JAVANESE LEFT RERENGGAN..JAVANESE PADA WINDU
A9C7..A9C9;BA # Po [3] JAVANESE PADA PANGKAT..JAVANESE PADA LUNGSI
A9CA..A9CD;AL # Po [4] JAVANESE PADA ADEG..JAVANESE TURNED PADA PISELEH
@@ -1665,7 +1670,7 @@ AB28..AB2E;AL # Lo [7] ETHIOPIC SYLLABLE BBA..ETHIOPIC SYLLABLE BBO
AB30..AB5A;AL # Ll [43] LATIN SMALL LETTER BARRED ALPHA..LATIN SMALL LETTER Y WITH SHORT RIGHT LEG
AB5B;AL # Sk MODIFIER BREVE WITH INVERTED BREVE
AB5C..AB5F;AL # Lm [4] MODIFIER LETTER SMALL HENG..MODIFIER LETTER SMALL U WITH LEFT HOOK
-AB60..AB65;AL # Ll [6] LATIN SMALL LETTER SAKHA YAT..GREEK LETTER SMALL CAPITAL OMEGA
+AB60..AB67;AL # Ll [8] LATIN SMALL LETTER SAKHA YAT..LATIN SMALL LETTER TS DIGRAPH WITH RETROFLEX HOOK
AB70..ABBF;AL # Ll [80] CHEROKEE SMALL LETTER A..CHEROKEE SMALL LETTER YA
ABC0..ABE2;AL # Lo [35] MEETEI MAYEK LETTER KOK..MEETEI MAYEK LETTER I LONSUM
ABE3..ABE4;CM # Mc [2] MEETEI MAYEK VOWEL SIGN ONAP..MEETEI MAYEK VOWEL SIGN INAP
@@ -2706,10 +2711,10 @@ FFFD;AI # So REPLACEMENT CHARACTER
10A0C..10A0F;CM # Mn [4] KHAROSHTHI VOWEL LENGTH MARK..KHAROSHTHI SIGN VISARGA
10A10..10A13;AL # Lo [4] KHAROSHTHI LETTER KA..KHAROSHTHI LETTER GHA
10A15..10A17;AL # Lo [3] KHAROSHTHI LETTER CA..KHAROSHTHI LETTER JA
-10A19..10A33;AL # Lo [27] KHAROSHTHI LETTER NYA..KHAROSHTHI LETTER TTTHA
+10A19..10A35;AL # Lo [29] KHAROSHTHI LETTER NYA..KHAROSHTHI LETTER VHA
10A38..10A3A;CM # Mn [3] KHAROSHTHI SIGN BAR ABOVE..KHAROSHTHI SIGN DOT BELOW
10A3F;CM # Mn KHAROSHTHI VIRAMA
-10A40..10A47;AL # No [8] KHAROSHTHI DIGIT ONE..KHAROSHTHI NUMBER ONE THOUSAND
+10A40..10A48;AL # No [9] KHAROSHTHI DIGIT ONE..KHAROSHTHI FRACTION ONE HALF
10A50..10A57;BA # Po [8] KHAROSHTHI PUNCTUATION DOT..KHAROSHTHI PUNCTUATION DOUBLE DANDA
10A58;AL # Po KHAROSHTHI PUNCTUATION LINES
10A60..10A7C;AL # Lo [29] OLD SOUTH ARABIAN LETTER HE..OLD SOUTH ARABIAN LETTER THETH
@@ -2737,7 +2742,18 @@ FFFD;AI # So REPLACEMENT CHARACTER
10C80..10CB2;AL # Lu [51] OLD HUNGARIAN CAPITAL LETTER A..OLD HUNGARIAN CAPITAL LETTER US
10CC0..10CF2;AL # Ll [51] OLD HUNGARIAN SMALL LETTER A..OLD HUNGARIAN SMALL LETTER US
10CFA..10CFF;AL # No [6] OLD HUNGARIAN NUMBER ONE..OLD HUNGARIAN NUMBER ONE THOUSAND
+10D00..10D23;AL # Lo [36] HANIFI ROHINGYA LETTER A..HANIFI ROHINGYA MARK NA KHONNA
+10D24..10D27;CM # Mn [4] HANIFI ROHINGYA SIGN HARBAHAY..HANIFI ROHINGYA SIGN TASSI
+10D30..10D39;NU # Nd [10] HANIFI ROHINGYA DIGIT ZERO..HANIFI ROHINGYA DIGIT NINE
10E60..10E7E;AL # No [31] RUMI DIGIT ONE..RUMI FRACTION TWO THIRDS
+10F00..10F1C;AL # Lo [29] OLD SOGDIAN LETTER ALEPH..OLD SOGDIAN LETTER FINAL TAW WITH VERTICAL TAIL
+10F1D..10F26;AL # No [10] OLD SOGDIAN NUMBER ONE..OLD SOGDIAN FRACTION ONE HALF
+10F27;AL # Lo OLD SOGDIAN LIGATURE AYIN-DALETH
+10F30..10F45;AL # Lo [22] SOGDIAN LETTER ALEPH..SOGDIAN INDEPENDENT SHIN
+10F46..10F50;CM # Mn [11] SOGDIAN COMBINING DOT BELOW..SOGDIAN COMBINING STROKE BELOW
+10F51..10F54;AL # No [4] SOGDIAN NUMBER ONE..SOGDIAN NUMBER ONE HUNDRED
+10F55..10F59;AL # Po [5] SOGDIAN PUNCTUATION TWO VERTICAL BARS..SOGDIAN PUNCTUATION HALF CIRCLE WITH DOT
+10FE0..10FF6;AL # Lo [23] ELYMAIC LETTER ALEPH..ELYMAIC LIGATURE ZAYIN-YODH
11000;CM # Mc BRAHMI SIGN CANDRABINDU
11001;CM # Mn BRAHMI SIGN ANUSVARA
11002;CM # Mc BRAHMI SIGN VISARGA
@@ -2758,6 +2774,7 @@ FFFD;AI # So REPLACEMENT CHARACTER
110BB..110BC;AL # Po [2] KAITHI ABBREVIATION SIGN..KAITHI ENUMERATION SIGN
110BD;AL # Cf KAITHI NUMBER SIGN
110BE..110C1;BA # Po [4] KAITHI SECTION MARK..KAITHI DOUBLE DANDA
+110CD;AL # Cf KAITHI NUMBER SIGN ABOVE
110D0..110E8;AL # Lo [25] SORA SOMPENG LETTER SAH..SORA SOMPENG LETTER MAE
110F0..110F9;NU # Nd [10] SORA SOMPENG DIGIT ZERO..SORA SOMPENG DIGIT NINE
11100..11102;CM # Mn [3] CHAKMA SIGN CANDRABINDU..CHAKMA SIGN VISARGA
@@ -2767,6 +2784,8 @@ FFFD;AI # So REPLACEMENT CHARACTER
1112D..11134;CM # Mn [8] CHAKMA VOWEL SIGN AI..CHAKMA MAAYYAA
11136..1113F;NU # Nd [10] CHAKMA DIGIT ZERO..CHAKMA DIGIT NINE
11140..11143;BA # Po [4] CHAKMA SECTION MARK..CHAKMA QUESTION MARK
+11144;AL # Lo CHAKMA LETTER LHAA
+11145..11146;CM # Mc [2] CHAKMA VOWEL SIGN AA..CHAKMA VOWEL SIGN EI
11150..11172;AL # Lo [35] MAHAJANI LETTER A..MAHAJANI LETTER RRA
11173;CM # Mn MAHAJANI SIGN NUKTA
11174;AL # Po MAHAJANI ABBREVIATION SIGN
@@ -2782,8 +2801,7 @@ FFFD;AI # So REPLACEMENT CHARACTER
111C5..111C6;BA # Po [2] SHARADA DANDA..SHARADA DOUBLE DANDA
111C7;AL # Po SHARADA ABBREVIATION SIGN
111C8;BA # Po SHARADA SEPARATOR
-111C9;AL # Po SHARADA SANDHI MARK
-111CA..111CC;CM # Mn [3] SHARADA SIGN NUKTA..SHARADA EXTRA SHORT VOWEL MARK
+111C9..111CC;CM # Mn [4] SHARADA SANDHI MARK..SHARADA EXTRA SHORT VOWEL MARK
111CD;AL # Po SHARADA SUTRA MARK
111D0..111D9;NU # Nd [10] SHARADA DIGIT ZERO..SHARADA DIGIT NINE
111DA;AL # Lo SHARADA EKAM
@@ -2823,7 +2841,7 @@ FFFD;AI # So REPLACEMENT CHARACTER
1132A..11330;AL # Lo [7] GRANTHA LETTER PA..GRANTHA LETTER RA
11332..11333;AL # Lo [2] GRANTHA LETTER LA..GRANTHA LETTER LLA
11335..11339;AL # Lo [5] GRANTHA LETTER VA..GRANTHA LETTER HA
-1133C;CM # Mn GRANTHA SIGN NUKTA
+1133B..1133C;CM # Mn [2] COMBINING BINDU BELOW..GRANTHA SIGN NUKTA
1133D;AL # Lo GRANTHA SIGN AVAGRAHA
1133E..1133F;CM # Mc [2] GRANTHA VOWEL SIGN AA..GRANTHA VOWEL SIGN I
11340;CM # Mn GRANTHA VOWEL SIGN II
@@ -2849,6 +2867,8 @@ FFFD;AI # So REPLACEMENT CHARACTER
11450..11459;NU # Nd [10] NEWA DIGIT ZERO..NEWA DIGIT NINE
1145B;BA # Po NEWA PLACEHOLDER MARK
1145D;AL # Po NEWA INSERTION SIGN
+1145E;CM # Mn NEWA SANDHI MARK
+1145F;AL # Lo NEWA LETTER VEDIC ANUSVARA
11480..114AF;AL # Lo [48] TIRHUTA ANJI..TIRHUTA LETTER HA
114B0..114B2;CM # Mc [3] TIRHUTA VOWEL SIGN AA..TIRHUTA VOWEL SIGN II
114B3..114B8;CM # Mn [6] TIRHUTA VOWEL SIGN U..TIRHUTA VOWEL SIGN VOCALIC LL
@@ -2896,8 +2916,9 @@ FFFD;AI # So REPLACEMENT CHARACTER
116B0..116B5;CM # Mn [6] TAKRI VOWEL SIGN U..TAKRI VOWEL SIGN AU
116B6;CM # Mc TAKRI SIGN VIRAMA
116B7;CM # Mn TAKRI SIGN NUKTA
+116B8;AL # Lo TAKRI LETTER ARCHAIC KHA
116C0..116C9;NU # Nd [10] TAKRI DIGIT ZERO..TAKRI DIGIT NINE
-11700..11719;SA # Lo [26] AHOM LETTER KA..AHOM LETTER JHA
+11700..1171A;SA # Lo [27] AHOM LETTER KA..AHOM LETTER ALTERNATE BA
1171D..1171F;SA # Mn [3] AHOM CONSONANT SIGN MEDIAL LA..AHOM CONSONANT SIGN MEDIAL LIGATING RA
11720..11721;SA # Mc [2] AHOM VOWEL SIGN A..AHOM VOWEL SIGN AA
11722..11725;SA # Mn [4] AHOM VOWEL SIGN I..AHOM VOWEL SIGN UU
@@ -2907,14 +2928,29 @@ FFFD;AI # So REPLACEMENT CHARACTER
1173A..1173B;SA # No [2] AHOM NUMBER TEN..AHOM NUMBER TWENTY
1173C..1173E;BA # Po [3] AHOM SIGN SMALL SECTION..AHOM SIGN RULAI
1173F;SA # So AHOM SYMBOL VI
+11800..1182B;AL # Lo [44] DOGRA LETTER A..DOGRA LETTER RRA
+1182C..1182E;CM # Mc [3] DOGRA VOWEL SIGN AA..DOGRA VOWEL SIGN II
+1182F..11837;CM # Mn [9] DOGRA VOWEL SIGN U..DOGRA SIGN ANUSVARA
+11838;CM # Mc DOGRA SIGN VISARGA
+11839..1183A;CM # Mn [2] DOGRA SIGN VIRAMA..DOGRA SIGN NUKTA
+1183B;AL # Po DOGRA ABBREVIATION SIGN
118A0..118DF;AL # L& [64] WARANG CITI CAPITAL LETTER NGAA..WARANG CITI SMALL LETTER VIYO
118E0..118E9;NU # Nd [10] WARANG CITI DIGIT ZERO..WARANG CITI DIGIT NINE
118EA..118F2;AL # No [9] WARANG CITI NUMBER TEN..WARANG CITI NUMBER NINETY
118FF;AL # Lo WARANG CITI OM
+119A0..119A7;AL # Lo [8] NANDINAGARI LETTER A..NANDINAGARI LETTER VOCALIC RR
+119AA..119D0;AL # Lo [39] NANDINAGARI LETTER E..NANDINAGARI LETTER RRA
+119D1..119D3;CM # Mc [3] NANDINAGARI VOWEL SIGN AA..NANDINAGARI VOWEL SIGN II
+119D4..119D7;CM # Mn [4] NANDINAGARI VOWEL SIGN U..NANDINAGARI VOWEL SIGN VOCALIC RR
+119DA..119DB;CM # Mn [2] NANDINAGARI VOWEL SIGN E..NANDINAGARI VOWEL SIGN AI
+119DC..119DF;CM # Mc [4] NANDINAGARI VOWEL SIGN O..NANDINAGARI SIGN VISARGA
+119E0;CM # Mn NANDINAGARI SIGN VIRAMA
+119E1;AL # Lo NANDINAGARI SIGN AVAGRAHA
+119E2;BB # Po NANDINAGARI SIGN SIDDHAM
+119E3;AL # Lo NANDINAGARI HEADSTROKE
+119E4;CM # Mc NANDINAGARI VOWEL SIGN PRISHTHAMATRA E
11A00;AL # Lo ZANABAZAR SQUARE LETTER A
-11A01..11A06;CM # Mn [6] ZANABAZAR SQUARE VOWEL SIGN I..ZANABAZAR SQUARE VOWEL SIGN O
-11A07..11A08;CM # Mc [2] ZANABAZAR SQUARE VOWEL SIGN AI..ZANABAZAR SQUARE VOWEL SIGN AU
-11A09..11A0A;CM # Mn [2] ZANABAZAR SQUARE VOWEL SIGN REVERSED I..ZANABAZAR SQUARE VOWEL LENGTH MARK
+11A01..11A0A;CM # Mn [10] ZANABAZAR SQUARE VOWEL SIGN I..ZANABAZAR SQUARE VOWEL LENGTH MARK
11A0B..11A32;AL # Lo [40] ZANABAZAR SQUARE LETTER KA..ZANABAZAR SQUARE LETTER KSSA
11A33..11A38;CM # Mn [6] ZANABAZAR SQUARE FINAL CONSONANT MARK..ZANABAZAR SQUARE SIGN ANUSVARA
11A39;CM # Mc ZANABAZAR SQUARE SIGN VISARGA
@@ -2930,12 +2966,12 @@ FFFD;AI # So REPLACEMENT CHARACTER
11A51..11A56;CM # Mn [6] SOYOMBO VOWEL SIGN I..SOYOMBO VOWEL SIGN OE
11A57..11A58;CM # Mc [2] SOYOMBO VOWEL SIGN AI..SOYOMBO VOWEL SIGN AU
11A59..11A5B;CM # Mn [3] SOYOMBO VOWEL SIGN VOCALIC R..SOYOMBO VOWEL LENGTH MARK
-11A5C..11A83;AL # Lo [40] SOYOMBO LETTER KA..SOYOMBO LETTER KSSA
-11A86..11A89;AL # Lo [4] SOYOMBO CLUSTER-INITIAL LETTER RA..SOYOMBO CLUSTER-INITIAL LETTER SA
+11A5C..11A89;AL # Lo [46] SOYOMBO LETTER KA..SOYOMBO CLUSTER-INITIAL LETTER SA
11A8A..11A96;CM # Mn [13] SOYOMBO FINAL CONSONANT SIGN G..SOYOMBO SIGN ANUSVARA
11A97;CM # Mc SOYOMBO SIGN VISARGA
11A98..11A99;CM # Mn [2] SOYOMBO GEMINATION MARK..SOYOMBO SUBJOINER
11A9A..11A9C;BA # Po [3] SOYOMBO MARK TSHEG..SOYOMBO MARK DOUBLE SHAD
+11A9D;AL # Lo SOYOMBO MARK PLUTA
11A9E..11AA0;BB # Po [3] SOYOMBO HEAD MARK WITH MOON AND SUN AND TRIPLE FLAME..SOYOMBO HEAD MARK WITH MOON AND SUN
11AA1..11AA2;BA # Po [2] SOYOMBO TERMINAL MARK-1..SOYOMBO TERMINAL MARK-2
11AC0..11AF8;AL # Lo [57] PAU CIN HAU LETTER PA..PAU CIN HAU GLOTTAL STOP FINAL
@@ -2970,6 +3006,26 @@ FFFD;AI # So REPLACEMENT CHARACTER
11D46;AL # Lo MASARAM GONDI REPHA
11D47;CM # Mn MASARAM GONDI RA-KARA
11D50..11D59;NU # Nd [10] MASARAM GONDI DIGIT ZERO..MASARAM GONDI DIGIT NINE
+11D60..11D65;AL # Lo [6] GUNJALA GONDI LETTER A..GUNJALA GONDI LETTER UU
+11D67..11D68;AL # Lo [2] GUNJALA GONDI LETTER EE..GUNJALA GONDI LETTER AI
+11D6A..11D89;AL # Lo [32] GUNJALA GONDI LETTER OO..GUNJALA GONDI LETTER SA
+11D8A..11D8E;CM # Mc [5] GUNJALA GONDI VOWEL SIGN AA..GUNJALA GONDI VOWEL SIGN UU
+11D90..11D91;CM # Mn [2] GUNJALA GONDI VOWEL SIGN EE..GUNJALA GONDI VOWEL SIGN AI
+11D93..11D94;CM # Mc [2] GUNJALA GONDI VOWEL SIGN OO..GUNJALA GONDI VOWEL SIGN AU
+11D95;CM # Mn GUNJALA GONDI SIGN ANUSVARA
+11D96;CM # Mc GUNJALA GONDI SIGN VISARGA
+11D97;CM # Mn GUNJALA GONDI VIRAMA
+11D98;AL # Lo GUNJALA GONDI OM
+11DA0..11DA9;NU # Nd [10] GUNJALA GONDI DIGIT ZERO..GUNJALA GONDI DIGIT NINE
+11EE0..11EF2;AL # Lo [19] MAKASAR LETTER KA..MAKASAR ANGKA
+11EF3..11EF4;CM # Mn [2] MAKASAR VOWEL SIGN I..MAKASAR VOWEL SIGN U
+11EF5..11EF6;CM # Mc [2] MAKASAR VOWEL SIGN E..MAKASAR VOWEL SIGN O
+11EF7..11EF8;AL # Po [2] MAKASAR PASSIMBANG..MAKASAR END OF SECTION
+11FC0..11FD4;AL # No [21] TAMIL FRACTION ONE THREE-HUNDRED-AND-TWENTIETH..TAMIL FRACTION DOWNSCALING FACTOR KIIZH
+11FD5..11FDC;AL # So [8] TAMIL SIGN NEL..TAMIL SIGN MUKKURUNI
+11FDD..11FE0;PO # Sc [4] TAMIL SIGN KAACU..TAMIL SIGN VARAAKAN
+11FE1..11FF1;AL # So [17] TAMIL SIGN PAARAM..TAMIL SIGN VAKAIYARAA
+11FFF;BA # Po TAMIL PUNCTUATION END OF TEXT
12000..12399;AL # Lo [922] CUNEIFORM SIGN A..CUNEIFORM SIGN U U
12400..1246E;AL # Nl [111] CUNEIFORM NUMERIC SIGN TWO ASH..CUNEIFORM NUMERIC SIGN NINE U VARIANT FORM
12470..12474;BA # Po [5] CUNEIFORM PUNCTUATION SIGN OLD ASSYRIAN WORD DIVIDER..CUNEIFORM PUNCTUATION SIGN DIAGONAL QUADCOLON
@@ -2988,6 +3044,9 @@ FFFD;AI # So REPLACEMENT CHARACTER
13379;OP # Lo EGYPTIAN HIEROGLYPH V011A
1337A..1337B;CL # Lo [2] EGYPTIAN HIEROGLYPH V011B..EGYPTIAN HIEROGLYPH V011C
1337C..1342E;AL # Lo [179] EGYPTIAN HIEROGLYPH V012..EGYPTIAN HIEROGLYPH AA032
+13430..13436;GL # Cf [7] EGYPTIAN HIEROGLYPH VERTICAL JOINER..EGYPTIAN HIEROGLYPH OVERLAY MIDDLE
+13437;OP # Cf EGYPTIAN HIEROGLYPH BEGIN SEGMENT
+13438;CL # Cf EGYPTIAN HIEROGLYPH END SEGMENT
14400..145CD;AL # Lo [462] ANATOLIAN HIEROGLYPH A001..ANATOLIAN HIEROGLYPH A409
145CE;OP # Lo ANATOLIAN HIEROGLYPH A410 BEGIN LOGOGRAM MARK
145CF;CL # Lo ANATOLIAN HIEROGLYPH A410A END LOGOGRAM MARK
@@ -3011,16 +3070,25 @@ FFFD;AI # So REPLACEMENT CHARACTER
16B5B..16B61;AL # No [7] PAHAWH HMONG NUMBER TENS..PAHAWH HMONG NUMBER TRILLIONS
16B63..16B77;AL # Lo [21] PAHAWH HMONG SIGN VOS LUB..PAHAWH HMONG SIGN CIM NRES TOS
16B7D..16B8F;AL # Lo [19] PAHAWH HMONG CLAN SIGN TSHEEJ..PAHAWH HMONG CLAN SIGN VWJ
-16F00..16F44;AL # Lo [69] MIAO LETTER PA..MIAO LETTER HHA
+16E40..16E7F;AL # L& [64] MEDEFAIDRIN CAPITAL LETTER M..MEDEFAIDRIN SMALL LETTER Y
+16E80..16E96;AL # No [23] MEDEFAIDRIN DIGIT ZERO..MEDEFAIDRIN DIGIT THREE ALTERNATE FORM
+16E97..16E98;BA # Po [2] MEDEFAIDRIN COMMA..MEDEFAIDRIN FULL STOP
+16E99..16E9A;AL # Po [2] MEDEFAIDRIN SYMBOL AIVA..MEDEFAIDRIN EXCLAMATION OH
+16F00..16F4A;AL # Lo [75] MIAO LETTER PA..MIAO LETTER RTE
+16F4F;CM # Mn MIAO SIGN CONSONANT MODIFIER BAR
16F50;AL # Lo MIAO LETTER NASALIZATION
-16F51..16F7E;CM # Mc [46] MIAO SIGN ASPIRATION..MIAO VOWEL SIGN NG
+16F51..16F87;CM # Mc [55] MIAO SIGN ASPIRATION..MIAO VOWEL SIGN UI
16F8F..16F92;CM # Mn [4] MIAO TONE RIGHT..MIAO TONE BELOW
16F93..16F9F;AL # Lm [13] MIAO LETTER TONE-2..MIAO LETTER REFORMED TONE-8
16FE0..16FE1;NS # Lm [2] TANGUT ITERATION MARK..NUSHU ITERATION MARK
-17000..187EC;ID # Lo [6125] TANGUT IDEOGRAPH-17000..TANGUT IDEOGRAPH-187EC
+16FE2;NS # Po OLD CHINESE HOOK MARK
+16FE3;NS # Lm OLD CHINESE ITERATION MARK
+17000..187F7;ID # Lo [6136] TANGUT IDEOGRAPH-17000..TANGUT IDEOGRAPH-187F7
18800..18AF2;ID # Lo [755] TANGUT COMPONENT-001..TANGUT COMPONENT-755
1B000..1B0FF;ID # Lo [256] KATAKANA LETTER ARCHAIC E..HENTAIGANA LETTER RE-2
1B100..1B11E;ID # Lo [31] HENTAIGANA LETTER RE-3..HENTAIGANA LETTER N-MU-MO-2
+1B150..1B152;CJ # Lo [3] HIRAGANA LETTER SMALL WI..HIRAGANA LETTER SMALL WO
+1B164..1B167;CJ # Lo [4] KATAKANA LETTER SMALL WI..KATAKANA LETTER SMALL N
1B170..1B2FB;ID # Lo [396] NUSHU CHARACTER-1B170..NUSHU CHARACTER-1B2FB
1BC00..1BC6A;AL # Lo [107] DUPLOYAN LETTER H..DUPLOYAN LETTER VOCALIC M
1BC70..1BC7C;AL # Lo [13] DUPLOYAN AFFIX LEFT HORIZONTAL SECANT..DUPLOYAN AFFIX ATTACHED TANGENT HOOK
@@ -3047,8 +3115,9 @@ FFFD;AI # So REPLACEMENT CHARACTER
1D200..1D241;AL # So [66] GREEK VOCAL NOTATION SYMBOL-1..GREEK INSTRUMENTAL NOTATION SYMBOL-54
1D242..1D244;CM # Mn [3] COMBINING GREEK MUSICAL TRISEME..COMBINING GREEK MUSICAL PENTASEME
1D245;AL # So GREEK MUSICAL LEIMMA
+1D2E0..1D2F3;AL # No [20] MAYAN NUMERAL ZERO..MAYAN NUMERAL NINETEEN
1D300..1D356;AL # So [87] MONOGRAM FOR EARTH..TETRAGRAM FOR FOSTERING
-1D360..1D371;AL # No [18] COUNTING ROD UNIT DIGIT ONE..COUNTING ROD TENS DIGIT NINE
+1D360..1D378;AL # No [25] COUNTING ROD UNIT DIGIT ONE..TALLY MARK FIVE
1D400..1D454;AL # L& [85] MATHEMATICAL BOLD CAPITAL A..MATHEMATICAL ITALIC SMALL G
1D456..1D49C;AL # L& [71] MATHEMATICAL ITALIC SMALL I..MATHEMATICAL SCRIPT CAPITAL A
1D49E..1D49F;AL # Lu [2] MATHEMATICAL SCRIPT CAPITAL C..MATHEMATICAL SCRIPT CAPITAL D
@@ -3108,13 +3177,32 @@ FFFD;AI # So REPLACEMENT CHARACTER
1E01B..1E021;CM # Mn [7] COMBINING GLAGOLITIC LETTER SHTA..COMBINING GLAGOLITIC LETTER YATI
1E023..1E024;CM # Mn [2] COMBINING GLAGOLITIC LETTER YU..COMBINING GLAGOLITIC LETTER SMALL YUS
1E026..1E02A;CM # Mn [5] COMBINING GLAGOLITIC LETTER YO..COMBINING GLAGOLITIC LETTER FITA
+1E100..1E12C;AL # Lo [45] NYIAKENG PUACHUE HMONG LETTER MA..NYIAKENG PUACHUE HMONG LETTER W
+1E130..1E136;CM # Mn [7] NYIAKENG PUACHUE HMONG TONE-B..NYIAKENG PUACHUE HMONG TONE-D
+1E137..1E13D;AL # Lm [7] NYIAKENG PUACHUE HMONG SIGN FOR PERSON..NYIAKENG PUACHUE HMONG SYLLABLE LENGTHENER
+1E140..1E149;NU # Nd [10] NYIAKENG PUACHUE HMONG DIGIT ZERO..NYIAKENG PUACHUE HMONG DIGIT NINE
+1E14E;AL # Lo NYIAKENG PUACHUE HMONG LOGOGRAM NYAJ
+1E14F;AL # So NYIAKENG PUACHUE HMONG CIRCLED CA
+1E2C0..1E2EB;AL # Lo [44] WANCHO LETTER AA..WANCHO LETTER YIH
+1E2EC..1E2EF;CM # Mn [4] WANCHO TONE TUP..WANCHO TONE KOINI
+1E2F0..1E2F9;NU # Nd [10] WANCHO DIGIT ZERO..WANCHO DIGIT NINE
+1E2FF;PR # Sc WANCHO NGUN SIGN
1E800..1E8C4;AL # Lo [197] MENDE KIKAKUI SYLLABLE M001 KI..MENDE KIKAKUI SYLLABLE M060 NYON
1E8C7..1E8CF;AL # No [9] MENDE KIKAKUI DIGIT ONE..MENDE KIKAKUI DIGIT NINE
1E8D0..1E8D6;CM # Mn [7] MENDE KIKAKUI COMBINING NUMBER TEENS..MENDE KIKAKUI COMBINING NUMBER MILLIONS
1E900..1E943;AL # L& [68] ADLAM CAPITAL LETTER ALIF..ADLAM SMALL LETTER SHA
1E944..1E94A;CM # Mn [7] ADLAM ALIF LENGTHENER..ADLAM NUKTA
+1E94B;AL # Lm ADLAM NASALIZATION MARK
1E950..1E959;NU # Nd [10] ADLAM DIGIT ZERO..ADLAM DIGIT NINE
1E95E..1E95F;OP # Po [2] ADLAM INITIAL EXCLAMATION MARK..ADLAM INITIAL QUESTION MARK
+1EC71..1ECAB;AL # No [59] INDIC SIYAQ NUMBER ONE..INDIC SIYAQ NUMBER PREFIXED NINE
+1ECAC;PO # So INDIC SIYAQ PLACEHOLDER
+1ECAD..1ECAF;AL # No [3] INDIC SIYAQ FRACTION ONE QUARTER..INDIC SIYAQ FRACTION THREE QUARTERS
+1ECB0;PO # Sc INDIC SIYAQ RUPEE MARK
+1ECB1..1ECB4;AL # No [4] INDIC SIYAQ NUMBER ALTERNATE ONE..INDIC SIYAQ ALTERNATE LAKH MARK
+1ED01..1ED2D;AL # No [45] OTTOMAN SIYAQ NUMBER ONE..OTTOMAN SIYAQ NUMBER NINETY THOUSAND
+1ED2E;AL # So OTTOMAN SIYAQ MARRATAN
+1ED2F..1ED3D;AL # No [15] OTTOMAN SIYAQ ALTERNATE NUMBER TWO..OTTOMAN SIYAQ FRACTION ONE SIXTH
1EE00..1EE03;AL # Lo [4] ARABIC MATHEMATICAL ALEF..ARABIC MATHEMATICAL DAL
1EE05..1EE1F;AL # Lo [27] ARABIC MATHEMATICAL WAW..ARABIC MATHEMATICAL DOTLESS QAF
1EE21..1EE22;AL # Lo [2] ARABIC MATHEMATICAL INITIAL BEH..ARABIC MATHEMATICAL INITIAL JEEM
@@ -3164,11 +3252,10 @@ FFFD;AI # So REPLACEMENT CHARACTER
1F100..1F10C;AI # No [13] DIGIT ZERO FULL STOP..DINGBAT NEGATIVE CIRCLED SANS-SERIF DIGIT ZERO
1F10D..1F10F;ID # Cn [3] <reserved-1F10D>..<reserved-1F10F>
1F110..1F12D;AI # So [30] PARENTHESIZED LATIN CAPITAL LETTER A..CIRCLED CD
-1F12E;AL # So CIRCLED WZ
-1F12F;ID # Cn <reserved-1F12F>
+1F12E..1F12F;AL # So [2] CIRCLED WZ..COPYLEFT SYMBOL
1F130..1F169;AI # So [58] SQUARED LATIN CAPITAL LETTER A..NEGATIVE CIRCLED LATIN CAPITAL LETTER Z
-1F16A..1F16B;AL # So [2] RAISED MC SIGN..RAISED MD SIGN
-1F16C..1F16F;ID # Cn [4] <reserved-1F16C>..<reserved-1F16F>
+1F16A..1F16C;AL # So [3] RAISED MC SIGN..RAISED MR SIGN
+1F16D..1F16F;ID # Cn [3] <reserved-1F16D>..<reserved-1F16F>
1F170..1F1AC;AI # So [61] NEGATIVE SQUARED LATIN CAPITAL LETTER A..SQUARED VOD
1F1AD..1F1E5;ID # Cn [57] <reserved-1F1AD>..<reserved-1F1E5>
1F1E6..1F1FF;RI # So [26] REGIONAL INDICATOR SYMBOL LETTER A..REGIONAL INDICATOR SYMBOL LETTER Z
@@ -3203,18 +3290,18 @@ FFFD;AI # So REPLACEMENT CHARACTER
1F444..1F445;ID # So [2] MOUTH..TONGUE
1F446..1F450;EB # So [11] WHITE UP POINTING BACKHAND INDEX..OPEN HANDS SIGN
1F451..1F465;ID # So [21] CROWN..BUSTS IN SILHOUETTE
-1F466..1F469;EB # So [4] BOY..WOMAN
-1F46A..1F46D;ID # So [4] FAMILY..TWO WOMEN HOLDING HANDS
-1F46E;EB # So POLICE OFFICER
-1F46F;ID # So WOMAN WITH BUNNY EARS
-1F470..1F478;EB # So [9] BRIDE WITH VEIL..PRINCESS
+1F466..1F478;EB # So [19] BOY..PRINCESS
1F479..1F47B;ID # So [3] JAPANESE OGRE..GHOST
1F47C;EB # So BABY ANGEL
1F47D..1F480;ID # So [4] EXTRATERRESTRIAL ALIEN..SKULL
1F481..1F483;EB # So [3] INFORMATION DESK PERSON..DANCER
1F484;ID # So LIPSTICK
1F485..1F487;EB # So [3] NAIL POLISH..HAIRCUT
-1F488..1F49F;ID # So [24] BARBER POLE..HEART DECORATION
+1F488..1F48E;ID # So [7] BARBER POLE..GEM STONE
+1F48F;EB # So KISS
+1F490;ID # So BOUQUET
+1F491;EB # So COUPLE WITH HEART
+1F492..1F49F;ID # So [14] WEDDING..HEART DECORATION
1F4A0;AL # So DIAMOND SHAPE WITH A DOT INSIDE
1F4A1;ID # So ELECTRIC LIGHT BULB
1F4A2;AL # So ANGER SYMBOL
@@ -3261,16 +3348,19 @@ FFFD;AI # So REPLACEMENT CHARACTER
1F6C0;EB # So BATH
1F6C1..1F6CB;ID # So [11] BATHTUB..COUCH AND LAMP
1F6CC;EB # So SLEEPING ACCOMMODATION
-1F6CD..1F6D4;ID # So [8] SHOPPING BAGS..PAGODA
-1F6D5..1F6DF;ID # Cn [11] <reserved-1F6D5>..<reserved-1F6DF>
+1F6CD..1F6D5;ID # So [9] SHOPPING BAGS..HINDU TEMPLE
+1F6D6..1F6DF;ID # Cn [10] <reserved-1F6D6>..<reserved-1F6DF>
1F6E0..1F6EC;ID # So [13] HAMMER AND WRENCH..AIRPLANE ARRIVING
1F6ED..1F6EF;ID # Cn [3] <reserved-1F6ED>..<reserved-1F6EF>
-1F6F0..1F6F8;ID # So [9] SATELLITE..FLYING SAUCER
-1F6F9..1F6FF;ID # Cn [7] <reserved-1F6F9>..<reserved-1F6FF>
+1F6F0..1F6FA;ID # So [11] SATELLITE..AUTO RICKSHAW
+1F6FB..1F6FF;ID # Cn [5] <reserved-1F6FB>..<reserved-1F6FF>
1F700..1F773;AL # So [116] ALCHEMICAL SYMBOL FOR QUINTESSENCE..ALCHEMICAL SYMBOL FOR HALF OUNCE
1F774..1F77F;ID # Cn [12] <reserved-1F774>..<reserved-1F77F>
1F780..1F7D4;AL # So [85] BLACK LEFT-POINTING ISOSCELES RIGHT TRIANGLE..HEAVY TWELVE POINTED PINWHEEL STAR
-1F7D5..1F7FF;ID # Cn [43] <reserved-1F7D5>..<reserved-1F7FF>
+1F7D5..1F7D8;ID # So [4] CIRCLED TRIANGLE..NEGATIVE CIRCLED SQUARE
+1F7D9..1F7DF;ID # Cn [7] <reserved-1F7D9>..<reserved-1F7DF>
+1F7E0..1F7EB;ID # So [12] LARGE ORANGE CIRCLE..LARGE BROWN SQUARE
+1F7EC..1F7FF;ID # Cn [20] <reserved-1F7EC>..<reserved-1F7FF>
1F800..1F80B;AL # So [12] LEFTWARDS ARROW WITH SMALL TRIANGLE ARROWHEAD..DOWNWARDS ARROW WITH LARGE TRIANGLE ARROWHEAD
1F80C..1F80F;ID # Cn [4] <reserved-1F80C>..<reserved-1F80F>
1F810..1F847;AL # So [56] LEFTWARDS ARROW WITH SMALL EQUILATERAL ARROWHEAD..DOWNWARDS HEAVY ARROW
@@ -3282,30 +3372,50 @@ FFFD;AI # So REPLACEMENT CHARACTER
1F890..1F8AD;AL # So [30] LEFTWARDS TRIANGLE ARROWHEAD..WHITE ARROW SHAFT WIDTH TWO THIRDS
1F8AE..1F8FF;ID # Cn [82] <reserved-1F8AE>..<reserved-1F8FF>
1F900..1F90B;AL # So [12] CIRCLED CROSS FORMEE WITH FOUR DOTS..DOWNWARD FACING NOTCHED HOOK WITH DOT
-1F90C..1F90F;ID # Cn [4] <reserved-1F90C>..<reserved-1F90F>
+1F90C;ID # Cn <reserved-1F90C>
+1F90D..1F90E;ID # So [2] WHITE HEART..BROWN HEART
+1F90F;EB # So PINCHING HAND
1F910..1F917;ID # So [8] ZIPPER-MOUTH FACE..HUGGING FACE
-1F918..1F91C;EB # So [5] SIGN OF THE HORNS..RIGHT-FACING FIST
-1F91D;ID # So HANDSHAKE
-1F91E..1F91F;EB # So [2] HAND WITH INDEX AND MIDDLE FINGERS CROSSED..I LOVE YOU HAND SIGN
+1F918..1F91F;EB # So [8] SIGN OF THE HORNS..I LOVE YOU HAND SIGN
1F920..1F925;ID # So [6] FACE WITH COWBOY HAT..LYING FACE
1F926;EB # So FACE PALM
1F927..1F92F;ID # So [9] SNEEZING FACE..SHOCKED FACE WITH EXPLODING HEAD
1F930..1F939;EB # So [10] PREGNANT WOMAN..JUGGLING
-1F93A..1F93C;ID # So [3] FENCER..WRESTLERS
-1F93D..1F93E;EB # So [2] WATER POLO..HANDBALL
-1F93F;ID # Cn <reserved-1F93F>
-1F940..1F94C;ID # So [13] WILTED FLOWER..CURLING STONE
-1F94D..1F94F;ID # Cn [3] <reserved-1F94D>..<reserved-1F94F>
-1F950..1F96B;ID # So [28] CROISSANT..CANNED FOOD
-1F96C..1F97F;ID # Cn [20] <reserved-1F96C>..<reserved-1F97F>
-1F980..1F997;ID # So [24] CRAB..CRICKET
-1F998..1F9BF;ID # Cn [40] <reserved-1F998>..<reserved-1F9BF>
-1F9C0;ID # So CHEESE WEDGE
-1F9C1..1F9CF;ID # Cn [15] <reserved-1F9C1>..<reserved-1F9CF>
+1F93A..1F93B;ID # So [2] FENCER..MODERN PENTATHLON
+1F93C..1F93E;EB # So [3] WRESTLERS..HANDBALL
+1F93F..1F971;ID # So [51] DIVING MASK..YAWNING FACE
+1F972;ID # Cn <reserved-1F972>
+1F973..1F976;ID # So [4] FACE WITH PARTY HORN AND PARTY HAT..FREEZING FACE
+1F977..1F979;ID # Cn [3] <reserved-1F977>..<reserved-1F979>
+1F97A..1F9A2;ID # So [41] FACE WITH PLEADING EYES..SWAN
+1F9A3..1F9A4;ID # Cn [2] <reserved-1F9A3>..<reserved-1F9A4>
+1F9A5..1F9AA;ID # So [6] SLOTH..OYSTER
+1F9AB..1F9AD;ID # Cn [3] <reserved-1F9AB>..<reserved-1F9AD>
+1F9AE..1F9B4;ID # So [7] GUIDE DOG..BONE
+1F9B5..1F9B6;EB # So [2] LEG..FOOT
+1F9B7;ID # So TOOTH
+1F9B8..1F9B9;EB # So [2] SUPERHERO..SUPERVILLAIN
+1F9BA;ID # So SAFETY VEST
+1F9BB;EB # So EAR WITH HEARING AID
+1F9BC..1F9CA;ID # So [15] MOTORIZED WHEELCHAIR..ICE CUBE
+1F9CB..1F9CC;ID # Cn [2] <reserved-1F9CB>..<reserved-1F9CC>
+1F9CD..1F9CF;EB # So [3] STANDING PERSON..DEAF PERSON
1F9D0;ID # So FACE WITH MONOCLE
1F9D1..1F9DD;EB # So [13] ADULT..ELF
-1F9DE..1F9E6;ID # So [9] GENIE..SOCKS
-1F9E7..1FFFD;ID # Cn [1559] <reserved-1F9E7>..<reserved-1FFFD>
+1F9DE..1F9FF;ID # So [34] GENIE..NAZAR AMULET
+1FA00..1FA53;AL # So [84] NEUTRAL CHESS KING..BLACK CHESS KNIGHT-BISHOP
+1FA54..1FA5F;ID # Cn [12] <reserved-1FA54>..<reserved-1FA5F>
+1FA60..1FA6D;ID # So [14] XIANGQI RED GENERAL..XIANGQI BLACK SOLDIER
+1FA6E..1FA6F;ID # Cn [2] <reserved-1FA6E>..<reserved-1FA6F>
+1FA70..1FA73;ID # So [4] BALLET SHOES..SHORTS
+1FA74..1FA77;ID # Cn [4] <reserved-1FA74>..<reserved-1FA77>
+1FA78..1FA7A;ID # So [3] DROP OF BLOOD..STETHOSCOPE
+1FA7B..1FA7F;ID # Cn [5] <reserved-1FA7B>..<reserved-1FA7F>
+1FA80..1FA82;ID # So [3] YO-YO..PARACHUTE
+1FA83..1FA8F;ID # Cn [13] <reserved-1FA83>..<reserved-1FA8F>
+1FA90..1FA95;ID # So [6] RINGED PLANET..BANJO
+1FA96..1FAFF;ID # Cn [106] <reserved-1FA96>..<reserved-1FAFF>
+1FB00..1FFFD;ID # Cn [1278] <reserved-1FB00>..<reserved-1FFFD>
20000..2A6D6;ID # Lo [42711] CJK UNIFIED IDEOGRAPH-20000..CJK UNIFIED IDEOGRAPH-2A6D6
2A6D7..2A6FF;ID # Cn [41] <reserved-2A6D7>..<reserved-2A6FF>
2A700..2B734;ID # Lo [4149] CJK UNIFIED IDEOGRAPH-2A700..CJK UNIFIED IDEOGRAPH-2B734
@@ -3317,7 +3427,8 @@ FFFD;AI # So REPLACEMENT CHARACTER
2CEB0..2EBE0;ID # Lo [7473] CJK UNIFIED IDEOGRAPH-2CEB0..CJK UNIFIED IDEOGRAPH-2EBE0
2EBE1..2F7FF;ID # Cn [3103] <reserved-2EBE1>..<reserved-2F7FF>
2F800..2FA1D;ID # Lo [542] CJK COMPATIBILITY IDEOGRAPH-2F800..CJK COMPATIBILITY IDEOGRAPH-2FA1D
-2FA1E..2FFFD;ID # Cn [1504] <reserved-2FA1E>..<reserved-2FFFD>
+2FA1E..2FA1F;ID # Cn [2] <reserved-2FA1E>..<reserved-2FA1F>
+2FA20..2FFFD;ID # Cn [1502] <reserved-2FA20>..<reserved-2FFFD>
30000..3FFFD;ID # Cn [65534] <reserved-30000>..<reserved-3FFFD>
E0001;CM # Cf LANGUAGE TAG
E0020..E007F;CM # Cf [96] TAG SPACE..CANCEL TAG