diff options
Diffstat (limited to 'util/unicode/data/DerivedNormalizationProps.txt')
-rw-r--r-- | util/unicode/data/DerivedNormalizationProps.txt | 110 |
1 files changed, 97 insertions, 13 deletions
diff --git a/util/unicode/data/DerivedNormalizationProps.txt b/util/unicode/data/DerivedNormalizationProps.txt index 6492493da3..941c310b96 100644 --- a/util/unicode/data/DerivedNormalizationProps.txt +++ b/util/unicode/data/DerivedNormalizationProps.txt @@ -1,10 +1,11 @@ -# DerivedNormalizationProps-8.0.0.txt -# Date: 2015-02-13, 13:30:23 GMT [MD] +# DerivedNormalizationProps-10.0.0.txt +# Date: 2017-02-14, 04:26:07 GMT +# © 2017 Unicode®, Inc. +# Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. +# For terms of use, see http://www.unicode.org/terms_of_use.html # # Unicode Character Database -# Copyright (c) 1991-2015 Unicode, Inc. -# For terms of use, see http://www.unicode.org/terms_of_use.html -# For documentation, see http://www.unicode.org/reports/tr44/ +# For documentation, see http://www.unicode.org/reports/tr44/ # ================================================ @@ -1679,12 +1680,12 @@ FFED..FFEE ; NFKD_QC; N # So [2] HALFWIDTH BLACK SQUARE..HALFWIDTH WHITE CI 1F16A..1F16B ; NFKD_QC; N # So [2] RAISED MC SIGN..RAISED MD SIGN 1F190 ; NFKD_QC; N # So SQUARE DJ 1F200..1F202 ; NFKD_QC; N # So [3] SQUARE HIRAGANA HOKA..SQUARED KATAKANA SA -1F210..1F23A ; NFKD_QC; N # So [43] SQUARED CJK UNIFIED IDEOGRAPH-624B..SQUARED CJK UNIFIED IDEOGRAPH-55B6 +1F210..1F23B ; NFKD_QC; N # So [44] SQUARED CJK UNIFIED IDEOGRAPH-624B..SQUARED CJK UNIFIED IDEOGRAPH-914D 1F240..1F248 ; NFKD_QC; N # So [9] TORTOISE SHELL BRACKETED CJK UNIFIED IDEOGRAPH-672C..TORTOISE SHELL BRACKETED CJK UNIFIED IDEOGRAPH-6557 1F250..1F251 ; NFKD_QC; N # So [2] CIRCLED IDEOGRAPH ADVANTAGE..CIRCLED IDEOGRAPH ACCEPT 2F800..2FA1D ; NFKD_QC; N # Lo [542] CJK COMPATIBILITY IDEOGRAPH-2F800..CJK COMPATIBILITY IDEOGRAPH-2FA1D -# Total code points: 16893 +# Total code points: 16894 # ================================================ @@ -2082,12 +2083,12 @@ FFED..FFEE ; NFKC_QC; N # So [2] HALFWIDTH BLACK SQUARE..HALFWIDTH WHITE CI 1F16A..1F16B ; NFKC_QC; N # So [2] RAISED MC SIGN..RAISED MD SIGN 1F190 ; NFKC_QC; N # So SQUARE DJ 1F200..1F202 ; NFKC_QC; N # So [3] SQUARE HIRAGANA HOKA..SQUARED KATAKANA SA -1F210..1F23A ; NFKC_QC; N # So [43] SQUARED CJK UNIFIED IDEOGRAPH-624B..SQUARED CJK UNIFIED IDEOGRAPH-55B6 +1F210..1F23B ; NFKC_QC; N # So [44] SQUARED CJK UNIFIED IDEOGRAPH-624B..SQUARED CJK UNIFIED IDEOGRAPH-914D 1F240..1F248 ; NFKC_QC; N # So [9] TORTOISE SHELL BRACKETED CJK UNIFIED IDEOGRAPH-672C..TORTOISE SHELL BRACKETED CJK UNIFIED IDEOGRAPH-6557 1F250..1F251 ; NFKC_QC; N # So [2] CIRCLED IDEOGRAPH ADVANTAGE..CIRCLED IDEOGRAPH ACCEPT 2F800..2FA1D ; NFKC_QC; N # Lo [542] CJK COMPATIBILITY IDEOGRAPH-2F800..CJK COMPATIBILITY IDEOGRAPH-2FA1D -# Total code points: 4793 +# Total code points: 4794 # ================================================ @@ -3513,6 +3514,14 @@ FFE3 ; Expands_On_NFKC # Sk FULLWIDTH MACRON 17B4..17B5 ; NFKC_CF; # Mn [2] KHMER VOWEL INHERENT AQ..KHMER VOWEL INHERENT AA 180B..180D ; NFKC_CF; # Mn [3] MONGOLIAN FREE VARIATION SELECTOR ONE..MONGOLIAN FREE VARIATION SELECTOR THREE 180E ; NFKC_CF; # Cf MONGOLIAN VOWEL SEPARATOR +1C80 ; NFKC_CF; 0432 # L& CYRILLIC SMALL LETTER ROUNDED VE +1C81 ; NFKC_CF; 0434 # L& CYRILLIC SMALL LETTER LONG-LEGGED DE +1C82 ; NFKC_CF; 043E # L& CYRILLIC SMALL LETTER NARROW O +1C83 ; NFKC_CF; 0441 # L& CYRILLIC SMALL LETTER WIDE ES +1C84..1C85 ; NFKC_CF; 0442 # L& [2] CYRILLIC SMALL LETTER TALL TE..CYRILLIC SMALL LETTER THREE-LEGGED TE +1C86 ; NFKC_CF; 044A # L& CYRILLIC SMALL LETTER TALL HARD SIGN +1C87 ; NFKC_CF; 0463 # L& CYRILLIC SMALL LETTER TALL YAT +1C88 ; NFKC_CF; A64B # L& CYRILLIC SMALL LETTER UNBLENDED UK 1D2C ; NFKC_CF; 0061 # Lm MODIFIER LETTER CAPITAL A 1D2D ; NFKC_CF; 00E6 # Lm MODIFIER LETTER CAPITAL AE 1D2E ; NFKC_CF; 0062 # Lm MODIFIER LETTER CAPITAL B @@ -5263,6 +5272,7 @@ A7AA ; NFKC_CF; 0266 # L& LATIN CAPITAL LETTER H WITH H A7AB ; NFKC_CF; 025C # L& LATIN CAPITAL LETTER REVERSED OPEN E A7AC ; NFKC_CF; 0261 # L& LATIN CAPITAL LETTER SCRIPT G A7AD ; NFKC_CF; 026C # L& LATIN CAPITAL LETTER L WITH BELT +A7AE ; NFKC_CF; 026A # L& LATIN CAPITAL LETTER SMALL CAPITAL I A7B0 ; NFKC_CF; 029E # L& LATIN CAPITAL LETTER TURNED K A7B1 ; NFKC_CF; 0287 # L& LATIN CAPITAL LETTER TURNED T A7B2 ; NFKC_CF; 029D # L& LATIN CAPITAL LETTER J WITH CROSSED-TAIL @@ -6731,6 +6741,42 @@ FFF0..FFF8 ; NFKC_CF; # Cn [9] <reserved-FFF0>..<reserved-FF 10425 ; NFKC_CF; 1044D # L& DESERET CAPITAL LETTER ENG 10426 ; NFKC_CF; 1044E # L& DESERET CAPITAL LETTER OI 10427 ; NFKC_CF; 1044F # L& DESERET CAPITAL LETTER EW +104B0 ; NFKC_CF; 104D8 # L& OSAGE CAPITAL LETTER A +104B1 ; NFKC_CF; 104D9 # L& OSAGE CAPITAL LETTER AI +104B2 ; NFKC_CF; 104DA # L& OSAGE CAPITAL LETTER AIN +104B3 ; NFKC_CF; 104DB # L& OSAGE CAPITAL LETTER AH +104B4 ; NFKC_CF; 104DC # L& OSAGE CAPITAL LETTER BRA +104B5 ; NFKC_CF; 104DD # L& OSAGE CAPITAL LETTER CHA +104B6 ; NFKC_CF; 104DE # L& OSAGE CAPITAL LETTER EHCHA +104B7 ; NFKC_CF; 104DF # L& OSAGE CAPITAL LETTER E +104B8 ; NFKC_CF; 104E0 # L& OSAGE CAPITAL LETTER EIN +104B9 ; NFKC_CF; 104E1 # L& OSAGE CAPITAL LETTER HA +104BA ; NFKC_CF; 104E2 # L& OSAGE CAPITAL LETTER HYA +104BB ; NFKC_CF; 104E3 # L& OSAGE CAPITAL LETTER I +104BC ; NFKC_CF; 104E4 # L& OSAGE CAPITAL LETTER KA +104BD ; NFKC_CF; 104E5 # L& OSAGE CAPITAL LETTER EHKA +104BE ; NFKC_CF; 104E6 # L& OSAGE CAPITAL LETTER KYA +104BF ; NFKC_CF; 104E7 # L& OSAGE CAPITAL LETTER LA +104C0 ; NFKC_CF; 104E8 # L& OSAGE CAPITAL LETTER MA +104C1 ; NFKC_CF; 104E9 # L& OSAGE CAPITAL LETTER NA +104C2 ; NFKC_CF; 104EA # L& OSAGE CAPITAL LETTER O +104C3 ; NFKC_CF; 104EB # L& OSAGE CAPITAL LETTER OIN +104C4 ; NFKC_CF; 104EC # L& OSAGE CAPITAL LETTER PA +104C5 ; NFKC_CF; 104ED # L& OSAGE CAPITAL LETTER EHPA +104C6 ; NFKC_CF; 104EE # L& OSAGE CAPITAL LETTER SA +104C7 ; NFKC_CF; 104EF # L& OSAGE CAPITAL LETTER SHA +104C8 ; NFKC_CF; 104F0 # L& OSAGE CAPITAL LETTER TA +104C9 ; NFKC_CF; 104F1 # L& OSAGE CAPITAL LETTER EHTA +104CA ; NFKC_CF; 104F2 # L& OSAGE CAPITAL LETTER TSA +104CB ; NFKC_CF; 104F3 # L& OSAGE CAPITAL LETTER EHTSA +104CC ; NFKC_CF; 104F4 # L& OSAGE CAPITAL LETTER TSHA +104CD ; NFKC_CF; 104F5 # L& OSAGE CAPITAL LETTER DHA +104CE ; NFKC_CF; 104F6 # L& OSAGE CAPITAL LETTER U +104CF ; NFKC_CF; 104F7 # L& OSAGE CAPITAL LETTER WA +104D0 ; NFKC_CF; 104F8 # L& OSAGE CAPITAL LETTER KHA +104D1 ; NFKC_CF; 104F9 # L& OSAGE CAPITAL LETTER GHA +104D2 ; NFKC_CF; 104FA # L& OSAGE CAPITAL LETTER ZA +104D3 ; NFKC_CF; 104FB # L& OSAGE CAPITAL LETTER ZHA 10C80 ; NFKC_CF; 10CC0 # L& OLD HUNGARIAN CAPITAL LETTER A 10C81 ; NFKC_CF; 10CC1 # L& OLD HUNGARIAN CAPITAL LETTER AA 10C82 ; NFKC_CF; 10CC2 # L& OLD HUNGARIAN CAPITAL LETTER EB @@ -7819,6 +7865,40 @@ FFF0..FFF8 ; NFKC_CF; # Cn [9] <reserved-FFF0>..<reserved-FF 1D7FD ; NFKC_CF; 0037 # Nd MATHEMATICAL MONOSPACE DIGIT SEVEN 1D7FE ; NFKC_CF; 0038 # Nd MATHEMATICAL MONOSPACE DIGIT EIGHT 1D7FF ; NFKC_CF; 0039 # Nd MATHEMATICAL MONOSPACE DIGIT NINE +1E900 ; NFKC_CF; 1E922 # L& ADLAM CAPITAL LETTER ALIF +1E901 ; NFKC_CF; 1E923 # L& ADLAM CAPITAL LETTER DAALI +1E902 ; NFKC_CF; 1E924 # L& ADLAM CAPITAL LETTER LAAM +1E903 ; NFKC_CF; 1E925 # L& ADLAM CAPITAL LETTER MIIM +1E904 ; NFKC_CF; 1E926 # L& ADLAM CAPITAL LETTER BA +1E905 ; NFKC_CF; 1E927 # L& ADLAM CAPITAL LETTER SINNYIIYHE +1E906 ; NFKC_CF; 1E928 # L& ADLAM CAPITAL LETTER PE +1E907 ; NFKC_CF; 1E929 # L& ADLAM CAPITAL LETTER BHE +1E908 ; NFKC_CF; 1E92A # L& ADLAM CAPITAL LETTER RA +1E909 ; NFKC_CF; 1E92B # L& ADLAM CAPITAL LETTER E +1E90A ; NFKC_CF; 1E92C # L& ADLAM CAPITAL LETTER FA +1E90B ; NFKC_CF; 1E92D # L& ADLAM CAPITAL LETTER I +1E90C ; NFKC_CF; 1E92E # L& ADLAM CAPITAL LETTER O +1E90D ; NFKC_CF; 1E92F # L& ADLAM CAPITAL LETTER DHA +1E90E ; NFKC_CF; 1E930 # L& ADLAM CAPITAL LETTER YHE +1E90F ; NFKC_CF; 1E931 # L& ADLAM CAPITAL LETTER WAW +1E910 ; NFKC_CF; 1E932 # L& ADLAM CAPITAL LETTER NUN +1E911 ; NFKC_CF; 1E933 # L& ADLAM CAPITAL LETTER KAF +1E912 ; NFKC_CF; 1E934 # L& ADLAM CAPITAL LETTER YA +1E913 ; NFKC_CF; 1E935 # L& ADLAM CAPITAL LETTER U +1E914 ; NFKC_CF; 1E936 # L& ADLAM CAPITAL LETTER JIIM +1E915 ; NFKC_CF; 1E937 # L& ADLAM CAPITAL LETTER CHI +1E916 ; NFKC_CF; 1E938 # L& ADLAM CAPITAL LETTER HA +1E917 ; NFKC_CF; 1E939 # L& ADLAM CAPITAL LETTER QAAF +1E918 ; NFKC_CF; 1E93A # L& ADLAM CAPITAL LETTER GA +1E919 ; NFKC_CF; 1E93B # L& ADLAM CAPITAL LETTER NYA +1E91A ; NFKC_CF; 1E93C # L& ADLAM CAPITAL LETTER TU +1E91B ; NFKC_CF; 1E93D # L& ADLAM CAPITAL LETTER NHA +1E91C ; NFKC_CF; 1E93E # L& ADLAM CAPITAL LETTER VA +1E91D ; NFKC_CF; 1E93F # L& ADLAM CAPITAL LETTER KHA +1E91E ; NFKC_CF; 1E940 # L& ADLAM CAPITAL LETTER GBE +1E91F ; NFKC_CF; 1E941 # L& ADLAM CAPITAL LETTER ZAL +1E920 ; NFKC_CF; 1E942 # L& ADLAM CAPITAL LETTER KPO +1E921 ; NFKC_CF; 1E943 # L& ADLAM CAPITAL LETTER SHA 1EE00 ; NFKC_CF; 0627 # Lo ARABIC MATHEMATICAL ALEF 1EE01 ; NFKC_CF; 0628 # Lo ARABIC MATHEMATICAL BEH 1EE02 ; NFKC_CF; 062C # Lo ARABIC MATHEMATICAL JEEM @@ -8083,6 +8163,7 @@ FFF0..FFF8 ; NFKC_CF; # Cn [9] <reserved-FFF0>..<reserved-FF 1F238 ; NFKC_CF; 7533 # So SQUARED CJK UNIFIED IDEOGRAPH-7533 1F239 ; NFKC_CF; 5272 # So SQUARED CJK UNIFIED IDEOGRAPH-5272 1F23A ; NFKC_CF; 55B6 # So SQUARED CJK UNIFIED IDEOGRAPH-55B6 +1F23B ; NFKC_CF; 914D # So SQUARED CJK UNIFIED IDEOGRAPH-914D 1F240 ; NFKC_CF; 3014 672C 3015 # So TORTOISE SHELL BRACKETED CJK UNIFIED IDEOGRAPH-672C 1F241 ; NFKC_CF; 3014 4E09 3015 # So TORTOISE SHELL BRACKETED CJK UNIFIED IDEOGRAPH-4E09 1F242 ; NFKC_CF; 3014 4E8C 3015 # So TORTOISE SHELL BRACKETED CJK UNIFIED IDEOGRAPH-4E8C @@ -8634,7 +8715,7 @@ E0080..E00FF ; NFKC_CF; # Cn [128] <reserved-E0080>..<reserved-E E0100..E01EF ; NFKC_CF; # Mn [240] VARIATION SELECTOR-17..VARIATION SELECTOR-256 E01F0..E0FFF ; NFKC_CF; # Cn [3600] <reserved-E01F0>..<reserved-E0FFF> -# Total code points: 10146 +# Total code points: 10227 # ================================================ @@ -8972,6 +9053,7 @@ E01F0..E0FFF ; NFKC_CF; # Cn [3600] <reserved-E01F0>..<reserved- 17B4..17B5 ; Changes_When_NFKC_Casefolded # Mn [2] KHMER VOWEL INHERENT AQ..KHMER VOWEL INHERENT AA 180B..180D ; Changes_When_NFKC_Casefolded # Mn [3] MONGOLIAN FREE VARIATION SELECTOR ONE..MONGOLIAN FREE VARIATION SELECTOR THREE 180E ; Changes_When_NFKC_Casefolded # Cf MONGOLIAN VOWEL SEPARATOR +1C80..1C88 ; Changes_When_NFKC_Casefolded # L& [9] CYRILLIC SMALL LETTER ROUNDED VE..CYRILLIC SMALL LETTER UNBLENDED UK 1D2C..1D2E ; Changes_When_NFKC_Casefolded # Lm [3] MODIFIER LETTER CAPITAL A..MODIFIER LETTER CAPITAL B 1D30..1D3A ; Changes_When_NFKC_Casefolded # Lm [11] MODIFIER LETTER CAPITAL D..MODIFIER LETTER CAPITAL N 1D3C..1D4D ; Changes_When_NFKC_Casefolded # Lm [18] MODIFIER LETTER CAPITAL O..MODIFIER LETTER SMALL G @@ -9389,7 +9471,7 @@ A7A2 ; Changes_When_NFKC_Casefolded # L& LATIN CAPITAL LETTER K W A7A4 ; Changes_When_NFKC_Casefolded # L& LATIN CAPITAL LETTER N WITH OBLIQUE STROKE A7A6 ; Changes_When_NFKC_Casefolded # L& LATIN CAPITAL LETTER R WITH OBLIQUE STROKE A7A8 ; Changes_When_NFKC_Casefolded # L& LATIN CAPITAL LETTER S WITH OBLIQUE STROKE -A7AA..A7AD ; Changes_When_NFKC_Casefolded # L& [4] LATIN CAPITAL LETTER H WITH HOOK..LATIN CAPITAL LETTER L WITH BELT +A7AA..A7AE ; Changes_When_NFKC_Casefolded # L& [5] LATIN CAPITAL LETTER H WITH HOOK..LATIN CAPITAL LETTER SMALL CAPITAL I A7B0..A7B4 ; Changes_When_NFKC_Casefolded # L& [5] LATIN CAPITAL LETTER TURNED K..LATIN CAPITAL LETTER BETA A7B6 ; Changes_When_NFKC_Casefolded # L& LATIN CAPITAL LETTER OMEGA A7F8..A7F9 ; Changes_When_NFKC_Casefolded # Lm [2] MODIFIER LETTER CAPITAL H WITH STROKE..MODIFIER LETTER SMALL LIGATURE OE @@ -9519,6 +9601,7 @@ FFE9..FFEC ; Changes_When_NFKC_Casefolded # Sm [4] HALFWIDTH LEFTWARDS ARRO FFED..FFEE ; Changes_When_NFKC_Casefolded # So [2] HALFWIDTH BLACK SQUARE..HALFWIDTH WHITE CIRCLE FFF0..FFF8 ; Changes_When_NFKC_Casefolded # Cn [9] <reserved-FFF0>..<reserved-FFF8> 10400..10427 ; Changes_When_NFKC_Casefolded # L& [40] DESERET CAPITAL LETTER LONG I..DESERET CAPITAL LETTER EW +104B0..104D3 ; Changes_When_NFKC_Casefolded # L& [36] OSAGE CAPITAL LETTER A..OSAGE CAPITAL LETTER ZHA 10C80..10CB2 ; Changes_When_NFKC_Casefolded # L& [51] OLD HUNGARIAN CAPITAL LETTER A..OLD HUNGARIAN CAPITAL LETTER US 118A0..118BF ; Changes_When_NFKC_Casefolded # L& [32] WARANG CITI CAPITAL LETTER NGAA..WARANG CITI CAPITAL LETTER VIYO 1BCA0..1BCA3 ; Changes_When_NFKC_Casefolded # Cf [4] SHORTHAND FORMAT LETTER OVERLAP..SHORTHAND FORMAT UP STEP @@ -9566,6 +9649,7 @@ FFF0..FFF8 ; Changes_When_NFKC_Casefolded # Cn [9] <reserved-FFF0>..<reserv 1D7C3 ; Changes_When_NFKC_Casefolded # Sm MATHEMATICAL SANS-SERIF BOLD ITALIC PARTIAL DIFFERENTIAL 1D7C4..1D7CB ; Changes_When_NFKC_Casefolded # L& [8] MATHEMATICAL SANS-SERIF BOLD ITALIC EPSILON SYMBOL..MATHEMATICAL BOLD SMALL DIGAMMA 1D7CE..1D7FF ; Changes_When_NFKC_Casefolded # Nd [50] MATHEMATICAL BOLD DIGIT ZERO..MATHEMATICAL MONOSPACE DIGIT NINE +1E900..1E921 ; Changes_When_NFKC_Casefolded # L& [34] ADLAM CAPITAL LETTER ALIF..ADLAM CAPITAL LETTER SHA 1EE00..1EE03 ; Changes_When_NFKC_Casefolded # Lo [4] ARABIC MATHEMATICAL ALEF..ARABIC MATHEMATICAL DAL 1EE05..1EE1F ; Changes_When_NFKC_Casefolded # Lo [27] ARABIC MATHEMATICAL WAW..ARABIC MATHEMATICAL DOTLESS QAF 1EE21..1EE22 ; Changes_When_NFKC_Casefolded # Lo [2] ARABIC MATHEMATICAL INITIAL BEH..ARABIC MATHEMATICAL INITIAL JEEM @@ -9605,7 +9689,7 @@ FFF0..FFF8 ; Changes_When_NFKC_Casefolded # Cn [9] <reserved-FFF0>..<reserv 1F16A..1F16B ; Changes_When_NFKC_Casefolded # So [2] RAISED MC SIGN..RAISED MD SIGN 1F190 ; Changes_When_NFKC_Casefolded # So SQUARE DJ 1F200..1F202 ; Changes_When_NFKC_Casefolded # So [3] SQUARE HIRAGANA HOKA..SQUARED KATAKANA SA -1F210..1F23A ; Changes_When_NFKC_Casefolded # So [43] SQUARED CJK UNIFIED IDEOGRAPH-624B..SQUARED CJK UNIFIED IDEOGRAPH-55B6 +1F210..1F23B ; Changes_When_NFKC_Casefolded # So [44] SQUARED CJK UNIFIED IDEOGRAPH-624B..SQUARED CJK UNIFIED IDEOGRAPH-914D 1F240..1F248 ; Changes_When_NFKC_Casefolded # So [9] TORTOISE SHELL BRACKETED CJK UNIFIED IDEOGRAPH-672C..TORTOISE SHELL BRACKETED CJK UNIFIED IDEOGRAPH-6557 1F250..1F251 ; Changes_When_NFKC_Casefolded # So [2] CIRCLED IDEOGRAPH ADVANTAGE..CIRCLED IDEOGRAPH ACCEPT 2F800..2FA1D ; Changes_When_NFKC_Casefolded # Lo [542] CJK COMPATIBILITY IDEOGRAPH-2F800..CJK COMPATIBILITY IDEOGRAPH-2FA1D @@ -9617,6 +9701,6 @@ E0080..E00FF ; Changes_When_NFKC_Casefolded # Cn [128] <reserved-E0080>..<reser E0100..E01EF ; Changes_When_NFKC_Casefolded # Mn [240] VARIATION SELECTOR-17..VARIATION SELECTOR-256 E01F0..E0FFF ; Changes_When_NFKC_Casefolded # Cn [3600] <reserved-E01F0>..<reserved-E0FFF> -# Total code points: 10146 +# Total code points: 10227 # EOF |