diff --git a/unicodetools/data/ucd/dev/BidiBrackets.txt b/unicodetools/data/ucd/dev/BidiBrackets.txt index fefad0a65..8f382aea8 100644 --- a/unicodetools/data/ucd/dev/BidiBrackets.txt +++ b/unicodetools/data/ucd/dev/BidiBrackets.txt @@ -155,6 +155,8 @@ 2E5A; 2E59; c # TOP HALF RIGHT PARENTHESIS 2E5B; 2E5C; o # BOTTOM HALF LEFT PARENTHESIS 2E5C; 2E5B; c # BOTTOM HALF RIGHT PARENTHESIS +2E62; 2E63; o # LEFT PARENTHESIS WITH MIDDLE RING +2E63; 2E62; c # RIGHT PARENTHESIS WITH MIDDLE RING 3008; 3009; o # LEFT ANGLE BRACKET 3009; 3008; c # RIGHT ANGLE BRACKET 300A; 300B; o # LEFT DOUBLE ANGLE BRACKET diff --git a/unicodetools/data/ucd/dev/BidiMirroring.txt b/unicodetools/data/ucd/dev/BidiMirroring.txt index 8752077e0..a4eaaf50a 100644 --- a/unicodetools/data/ucd/dev/BidiMirroring.txt +++ b/unicodetools/data/ucd/dev/BidiMirroring.txt @@ -463,6 +463,8 @@ 2E5A; 2E59 # TOP HALF RIGHT PARENTHESIS 2E5B; 2E5C # BOTTOM HALF LEFT PARENTHESIS 2E5C; 2E5B # BOTTOM HALF RIGHT PARENTHESIS +2E62; 2E63 # LEFT PARENTHESIS WITH MIDDLE RING +2E63; 2E62 # RIGHT PARENTHESIS WITH MIDDLE RING 3008; 3009 # LEFT ANGLE BRACKET 3009; 3008 # RIGHT ANGLE BRACKET 300A; 300B # LEFT DOUBLE ANGLE BRACKET diff --git a/unicodetools/data/ucd/dev/CaseFolding.txt b/unicodetools/data/ucd/dev/CaseFolding.txt index ec92b75e1..9c5b71711 100644 --- a/unicodetools/data/ucd/dev/CaseFolding.txt +++ b/unicodetools/data/ucd/dev/CaseFolding.txt @@ -1,5 +1,5 @@ # CaseFolding-17.0.0.txt -# Date: 2025-01-27, 18:09:07 GMT +# Date: 2025-02-11, 13:47:46 GMT # © 2025 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. # For terms of use and license, see https://www.unicode.org/terms_of_use.html @@ -1251,6 +1251,7 @@ A7D6; C; A7D7; # LATIN CAPITAL LETTER MIDDLE SCOTS S A7D8; C; A7D9; # LATIN CAPITAL LETTER SIGMOID S A7DA; C; A7DB; # LATIN CAPITAL LETTER LAMBDA A7DC; C; 019B; # LATIN CAPITAL LETTER LAMBDA WITH STROKE +A7DD; C; 0277; # LATIN CAPITAL LETTER CLOSED OMEGA A7F5; C; A7F6; # LATIN CAPITAL LETTER REVERSED HALF H AB70; C; 13A0; # CHEROKEE SMALL LETTER A AB71; C; 13A1; # CHEROKEE SMALL LETTER E @@ -1644,6 +1645,17 @@ FF3A; C; FF5A; # FULLWIDTH LATIN CAPITAL LETTER Z 16EB6; C; 16ED1; # BERIA ERFE CAPITAL LETTER UI 16EB7; C; 16ED2; # BERIA ERFE CAPITAL LETTER WASSE 16EB8; C; 16ED3; # BERIA ERFE CAPITAL LETTER AY +1DF68; C; 1DF69; # LATIN CAPITAL LETTER PHONOTYPIC A WITH SWASH +1DF6A; C; 1DF6B; # LATIN CAPITAL LETTER PHONOTYPIC ROUNDTOP A +1DF6C; C; 1DF6D; # LATIN CAPITAL LETTER REVERSED SCRUPLE +1DF6E; C; 1DF6F; # LATIN CAPITAL LETTER PHONOTYPIC DIPHTHONG AI +1DF72; C; 1DF73; # LATIN CAPITAL LETTER O WITH CURL +1DF74; C; 1DF75; # LATIN CAPITAL LETTER CLOSED OMEGA WITH LONG STEM +1DF76; C; 1DF77; # LATIN CAPITAL LETTER TURNED CLOSED OMEGA +1DF78; C; 1DF79; # LATIN CAPITAL LETTER PHONOTYPIC TH +1DF7A; C; 1DF7B; # LATIN CAPITAL LETTER U WITH HOOK TAIL +1DF7C; C; 1DF7D; # LATIN CAPITAL LETTER U WITH NOTCH AT BOTTOM +1DF7E; C; 1DF7F; # LATIN CAPITAL LETTER REVERSED ENLARGED SMALL U 1E900; C; 1E922; # ADLAM CAPITAL LETTER ALIF 1E901; C; 1E923; # ADLAM CAPITAL LETTER DAALI 1E902; C; 1E924; # ADLAM CAPITAL LETTER LAAM diff --git a/unicodetools/data/ucd/dev/DerivedAge.txt b/unicodetools/data/ucd/dev/DerivedAge.txt index 18d53a3f0..ff9908e03 100644 --- a/unicodetools/data/ucd/dev/DerivedAge.txt +++ b/unicodetools/data/ucd/dev/DerivedAge.txt @@ -1,5 +1,5 @@ # DerivedAge-17.0.0.txt -# Date: 2025-01-27, 18:09:08 GMT +# Date: 2025-02-11, 13:47:47 GMT # © 2025 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. # For terms of use and license, see https://www.unicode.org/terms_of_use.html @@ -2073,9 +2073,11 @@ A7DA..A7DC ; 16.0 # [3] LATIN CAPITAL LETTER LAMBDA..LATIN CAPITAL LETTER L 1ACF..1ADD ; 17.0 # [15] COMBINING DOUBLE CARON..COMBINING DOT-AND-RING BELOW 1AE0..1AEB ; 17.0 # [12] COMBINING LEFT TACK ABOVE..COMBINING DOUBLE RIGHTWARDS ARROW ABOVE 2B96 ; 17.0 # EQUALS SIGN WITH INFINITY ABOVE +2E60..2E63 ; 17.0 # [4] WIGGLY EXCLAMATION MARK..RIGHT PARENTHESIS WITH MIDDLE RING A7CE..A7CF ; 17.0 # [2] LATIN CAPITAL LETTER PHARYNGEAL VOICED FRICATIVE..LATIN SMALL LETTER PHARYNGEAL VOICED FRICATIVE A7D2 ; 17.0 # LATIN CAPITAL LETTER DOUBLE THORN A7D4 ; 17.0 # LATIN CAPITAL LETTER DOUBLE WYNN +A7DD ; 17.0 # LATIN CAPITAL LETTER CLOSED OMEGA A7F1 ; 17.0 # MODIFIER LETTER CAPITAL S FBC3..FBD2 ; 17.0 # [16] ARABIC LIGATURE JALLA WA-ALAA..ARABIC LIGATURE ALAYHI AR-RAHMAH FD90..FD91 ; 17.0 # [2] ARABIC LIGATURE RAHMATU ALLAAHI ALAYH..ARABIC LIGATURE RAHMATU ALLAAHI ALAYHAA @@ -2098,6 +2100,7 @@ FDC8..FDCE ; 17.0 # [7] ARABIC LIGATURE RAHIMAHU ALLAAH TAAALAA..ARABIC LIG 1CCFA..1CCFC ; 17.0 # [3] SNAKE SYMBOL..NOSE SYMBOL 1CEBA..1CED0 ; 17.0 # [23] FRAGILE SYMBOL..LEUKOTHEA 1CEE0..1CEF0 ; 17.0 # [17] GEOMANTIC FIGURE POPULUS..MEDIUM SMALL WHITE CIRCLE WITH HORIZONTAL BAR +1DF68..1DF81 ; 17.0 # [26] LATIN CAPITAL LETTER PHONOTYPIC A WITH SWASH..LATIN CAPITAL LETTER E WITH BENT TOPBAR 1E6C0..1E6DE ; 17.0 # [31] TAI YO LETTER LOW KO..TAI YO LETTER HIGH KVO 1E6E0..1E6F5 ; 17.0 # [22] TAI YO LETTER AA..TAI YO SIGN OM 1E6FE..1E6FF ; 17.0 # [2] TAI YO SYMBOL MUEANG..TAI YO XAM LAI @@ -2116,6 +2119,6 @@ FDC8..FDCE ; 17.0 # [7] ARABIC LIGATURE RAHIMAHU ALLAAH TAAALAA..ARABIC LIG 2B73A..2B73E ; 17.0 # [5] CJK UNIFIED IDEOGRAPH-2B73A..CJK UNIFIED IDEOGRAPH-2B73E 323B0..33479 ; 17.0 # [4298] CJK UNIFIED IDEOGRAPH-323B0..CJK UNIFIED IDEOGRAPH-33479 -# Total code points: 4836 +# Total code points: 4867 # EOF diff --git a/unicodetools/data/ucd/dev/DerivedCoreProperties.txt b/unicodetools/data/ucd/dev/DerivedCoreProperties.txt index 44b253f44..cb39cda32 100644 --- a/unicodetools/data/ucd/dev/DerivedCoreProperties.txt +++ b/unicodetools/data/ucd/dev/DerivedCoreProperties.txt @@ -1,5 +1,5 @@ # DerivedCoreProperties-17.0.0.txt -# Date: 2025-01-27, 18:09:11 GMT +# Date: 2025-02-14, 01:57:20 GMT # © 2025 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. # For terms of use and license, see https://www.unicode.org/terms_of_use.html @@ -836,7 +836,7 @@ A771..A787 ; Alphabetic # L& [23] LATIN SMALL LETTER DUM..LATIN SMALL LETTER A788 ; Alphabetic # Lm MODIFIER LETTER LOW CIRCUMFLEX ACCENT A78B..A78E ; Alphabetic # L& [4] LATIN CAPITAL LETTER SALTILLO..LATIN SMALL LETTER L WITH RETROFLEX HOOK AND BELT A78F ; Alphabetic # Lo LATIN LETTER SINOLOGICAL DOT -A790..A7DC ; Alphabetic # L& [77] LATIN CAPITAL LETTER N WITH DESCENDER..LATIN CAPITAL LETTER LAMBDA WITH STROKE +A790..A7DD ; Alphabetic # L& [78] LATIN CAPITAL LETTER N WITH DESCENDER..LATIN CAPITAL LETTER CLOSED OMEGA A7F1..A7F4 ; Alphabetic # Lm [4] MODIFIER LETTER CAPITAL S..MODIFIER LETTER CAPITAL Q A7F5..A7F6 ; Alphabetic # L& [2] LATIN CAPITAL LETTER REVERSED HALF H..LATIN SMALL LETTER REVERSED HALF H A7F7 ; Alphabetic # Lo LATIN EPIGRAPHIC LETTER SIDEWAYS I @@ -1390,6 +1390,8 @@ FFDA..FFDC ; Alphabetic # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANG 1DF0A ; Alphabetic # Lo LATIN LETTER RETROFLEX CLICK WITH RETROFLEX HOOK 1DF0B..1DF1E ; Alphabetic # L& [20] LATIN SMALL LETTER ESH WITH DOUBLE BAR..LATIN SMALL LETTER S WITH CURL 1DF25..1DF2A ; Alphabetic # L& [6] LATIN SMALL LETTER D WITH MID-HEIGHT LEFT HOOK..LATIN SMALL LETTER T WITH MID-HEIGHT LEFT HOOK +1DF68..1DF7F ; Alphabetic # L& [24] LATIN CAPITAL LETTER PHONOTYPIC A WITH SWASH..LATIN SMALL LETTER REVERSED U +1DF80..1DF81 ; Alphabetic # Lo [2] LATIN CAPITAL LETTER A WITH TOPBAR..LATIN CAPITAL LETTER E WITH BENT TOPBAR 1E000..1E006 ; Alphabetic # Mn [7] COMBINING GLAGOLITIC LETTER AZU..COMBINING GLAGOLITIC LETTER ZHIVETE 1E008..1E018 ; Alphabetic # Mn [17] COMBINING GLAGOLITIC LETTER ZEMLJA..COMBINING GLAGOLITIC LETTER HERU 1E01B..1E021 ; Alphabetic # Mn [7] COMBINING GLAGOLITIC LETTER SHTA..COMBINING GLAGOLITIC LETTER YATI @@ -1471,7 +1473,7 @@ FFDA..FFDC ; Alphabetic # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANG 30000..3134A ; Alphabetic # Lo [4939] CJK UNIFIED IDEOGRAPH-30000..CJK UNIFIED IDEOGRAPH-3134A 31350..33479 ; Alphabetic # Lo [8490] CJK UNIFIED IDEOGRAPH-31350..CJK UNIFIED IDEOGRAPH-33479 -# Total code points: 147441 +# Total code points: 147468 # ================================================ @@ -2168,10 +2170,21 @@ FF41..FF5A ; Lowercase # L& [26] FULLWIDTH LATIN SMALL LETTER A..FULLWIDTH L 1DF00..1DF09 ; Lowercase # L& [10] LATIN SMALL LETTER FENG DIGRAPH WITH TRILL..LATIN SMALL LETTER T WITH HOOK AND RETROFLEX HOOK 1DF0B..1DF1E ; Lowercase # L& [20] LATIN SMALL LETTER ESH WITH DOUBLE BAR..LATIN SMALL LETTER S WITH CURL 1DF25..1DF2A ; Lowercase # L& [6] LATIN SMALL LETTER D WITH MID-HEIGHT LEFT HOOK..LATIN SMALL LETTER T WITH MID-HEIGHT LEFT HOOK +1DF69 ; Lowercase # L& LATIN SMALL LETTER PHONOTYPIC A WITH SWASH +1DF6B ; Lowercase # L& LATIN SMALL LETTER PHONOTYPIC ROUNDTOP A +1DF6D ; Lowercase # L& LATIN SMALL LETTER REVERSED SCRUPLE +1DF6F..1DF71 ; Lowercase # L& [3] LATIN SMALL LETTER PHONOTYPIC DIPHTHONG AI..LATIN SMALL LETTER STRETCHED I +1DF73 ; Lowercase # L& LATIN SMALL LETTER O WITH CURL +1DF75 ; Lowercase # L& LATIN SMALL LETTER CLOSED OMEGA WITH LONG STEM +1DF77 ; Lowercase # L& LATIN SMALL LETTER TURNED CLOSED OMEGA +1DF79 ; Lowercase # L& LATIN SMALL LETTER PHONOTYPIC TH +1DF7B ; Lowercase # L& LATIN SMALL LETTER U WITH HOOK TAIL +1DF7D ; Lowercase # L& LATIN SMALL LETTER U WITH NOTCH AT BOTTOM +1DF7F ; Lowercase # L& LATIN SMALL LETTER REVERSED U 1E030..1E06D ; Lowercase # Lm [62] MODIFIER LETTER CYRILLIC SMALL A..MODIFIER LETTER CYRILLIC SMALL STRAIGHT U WITH STROKE 1E922..1E943 ; Lowercase # L& [34] ADLAM SMALL LETTER ALIF..ADLAM SMALL LETTER SHA -# Total code points: 2595 +# Total code points: 2608 # ================================================ @@ -2789,7 +2802,7 @@ A7D4 ; Uppercase # L& LATIN CAPITAL LETTER DOUBLE WYNN A7D6 ; Uppercase # L& LATIN CAPITAL LETTER MIDDLE SCOTS S A7D8 ; Uppercase # L& LATIN CAPITAL LETTER SIGMOID S A7DA ; Uppercase # L& LATIN CAPITAL LETTER LAMBDA -A7DC ; Uppercase # L& LATIN CAPITAL LETTER LAMBDA WITH STROKE +A7DC..A7DD ; Uppercase # L& [2] LATIN CAPITAL LETTER LAMBDA WITH STROKE..LATIN CAPITAL LETTER CLOSED OMEGA A7F5 ; Uppercase # L& LATIN CAPITAL LETTER REVERSED HALF H FF21..FF3A ; Uppercase # L& [26] FULLWIDTH LATIN CAPITAL LETTER A..FULLWIDTH LATIN CAPITAL LETTER Z 10400..10427 ; Uppercase # L& [40] DESERET CAPITAL LETTER LONG I..DESERET CAPITAL LETTER EW @@ -2834,12 +2847,23 @@ FF21..FF3A ; Uppercase # L& [26] FULLWIDTH LATIN CAPITAL LETTER A..FULLWIDTH 1D756..1D76E ; Uppercase # L& [25] MATHEMATICAL SANS-SERIF BOLD CAPITAL ALPHA..MATHEMATICAL SANS-SERIF BOLD CAPITAL OMEGA 1D790..1D7A8 ; Uppercase # L& [25] MATHEMATICAL SANS-SERIF BOLD ITALIC CAPITAL ALPHA..MATHEMATICAL SANS-SERIF BOLD ITALIC CAPITAL OMEGA 1D7CA ; Uppercase # L& MATHEMATICAL BOLD CAPITAL DIGAMMA +1DF68 ; Uppercase # L& LATIN CAPITAL LETTER PHONOTYPIC A WITH SWASH +1DF6A ; Uppercase # L& LATIN CAPITAL LETTER PHONOTYPIC ROUNDTOP A +1DF6C ; Uppercase # L& LATIN CAPITAL LETTER REVERSED SCRUPLE +1DF6E ; Uppercase # L& LATIN CAPITAL LETTER PHONOTYPIC DIPHTHONG AI +1DF72 ; Uppercase # L& LATIN CAPITAL LETTER O WITH CURL +1DF74 ; Uppercase # L& LATIN CAPITAL LETTER CLOSED OMEGA WITH LONG STEM +1DF76 ; Uppercase # L& LATIN CAPITAL LETTER TURNED CLOSED OMEGA +1DF78 ; Uppercase # L& LATIN CAPITAL LETTER PHONOTYPIC TH +1DF7A ; Uppercase # L& LATIN CAPITAL LETTER U WITH HOOK TAIL +1DF7C ; Uppercase # L& LATIN CAPITAL LETTER U WITH NOTCH AT BOTTOM +1DF7E ; Uppercase # L& LATIN CAPITAL LETTER REVERSED ENLARGED SMALL U 1E900..1E921 ; Uppercase # L& [34] ADLAM CAPITAL LETTER ALIF..ADLAM CAPITAL LETTER SHA 1F130..1F149 ; Uppercase # So [26] SQUARED LATIN CAPITAL LETTER A..SQUARED LATIN CAPITAL LETTER Z 1F150..1F169 ; Uppercase # So [26] NEGATIVE CIRCLED LATIN CAPITAL LETTER A..NEGATIVE CIRCLED LATIN CAPITAL LETTER Z 1F170..1F189 ; Uppercase # So [26] NEGATIVE SQUARED LATIN CAPITAL LETTER A..NEGATIVE SQUARED LATIN CAPITAL LETTER Z -# Total code points: 2006 +# Total code points: 2018 # ================================================ @@ -2947,7 +2971,7 @@ A722..A76F ; Cased # L& [78] LATIN CAPITAL LETTER EGYPTOLOGICAL ALEF..LATIN A770 ; Cased # Lm MODIFIER LETTER US A771..A787 ; Cased # L& [23] LATIN SMALL LETTER DUM..LATIN SMALL LETTER INSULAR T A78B..A78E ; Cased # L& [4] LATIN CAPITAL LETTER SALTILLO..LATIN SMALL LETTER L WITH RETROFLEX HOOK AND BELT -A790..A7DC ; Cased # L& [77] LATIN CAPITAL LETTER N WITH DESCENDER..LATIN CAPITAL LETTER LAMBDA WITH STROKE +A790..A7DD ; Cased # L& [78] LATIN CAPITAL LETTER N WITH DESCENDER..LATIN CAPITAL LETTER CLOSED OMEGA A7F1..A7F4 ; Cased # Lm [4] MODIFIER LETTER CAPITAL S..MODIFIER LETTER CAPITAL Q A7F5..A7F6 ; Cased # L& [2] LATIN CAPITAL LETTER REVERSED HALF H..LATIN SMALL LETTER REVERSED HALF H A7F8..A7F9 ; Cased # Lm [2] MODIFIER LETTER CAPITAL H WITH STROKE..MODIFIER LETTER SMALL LIGATURE OE @@ -3017,13 +3041,14 @@ FF41..FF5A ; Cased # L& [26] FULLWIDTH LATIN SMALL LETTER A..FULLWIDTH LATIN 1DF00..1DF09 ; Cased # L& [10] LATIN SMALL LETTER FENG DIGRAPH WITH TRILL..LATIN SMALL LETTER T WITH HOOK AND RETROFLEX HOOK 1DF0B..1DF1E ; Cased # L& [20] LATIN SMALL LETTER ESH WITH DOUBLE BAR..LATIN SMALL LETTER S WITH CURL 1DF25..1DF2A ; Cased # L& [6] LATIN SMALL LETTER D WITH MID-HEIGHT LEFT HOOK..LATIN SMALL LETTER T WITH MID-HEIGHT LEFT HOOK +1DF68..1DF7F ; Cased # L& [24] LATIN CAPITAL LETTER PHONOTYPIC A WITH SWASH..LATIN SMALL LETTER REVERSED U 1E030..1E06D ; Cased # Lm [62] MODIFIER LETTER CYRILLIC SMALL A..MODIFIER LETTER CYRILLIC SMALL STRAIGHT U WITH STROKE 1E900..1E943 ; Cased # L& [68] ADLAM CAPITAL LETTER ALIF..ADLAM SMALL LETTER SHA 1F130..1F149 ; Cased # So [26] SQUARED LATIN CAPITAL LETTER A..SQUARED LATIN CAPITAL LETTER Z 1F150..1F169 ; Cased # So [26] NEGATIVE CIRCLED LATIN CAPITAL LETTER A..NEGATIVE CIRCLED LATIN CAPITAL LETTER Z 1F170..1F189 ; Cased # So [26] NEGATIVE SQUARED LATIN CAPITAL LETTER A..NEGATIVE SQUARED LATIN CAPITAL LETTER Z -# Total code points: 4632 +# Total code points: 4657 # ================================================ @@ -4166,7 +4191,7 @@ A7D4 ; Changes_When_Lowercased # L& LATIN CAPITAL LETTER DOUBLE W A7D6 ; Changes_When_Lowercased # L& LATIN CAPITAL LETTER MIDDLE SCOTS S A7D8 ; Changes_When_Lowercased # L& LATIN CAPITAL LETTER SIGMOID S A7DA ; Changes_When_Lowercased # L& LATIN CAPITAL LETTER LAMBDA -A7DC ; Changes_When_Lowercased # L& LATIN CAPITAL LETTER LAMBDA WITH STROKE +A7DC..A7DD ; Changes_When_Lowercased # L& [2] LATIN CAPITAL LETTER LAMBDA WITH STROKE..LATIN CAPITAL LETTER CLOSED OMEGA A7F5 ; Changes_When_Lowercased # L& LATIN CAPITAL LETTER REVERSED HALF H FF21..FF3A ; Changes_When_Lowercased # L& [26] FULLWIDTH LATIN CAPITAL LETTER A..FULLWIDTH LATIN CAPITAL LETTER Z 10400..10427 ; Changes_When_Lowercased # L& [40] DESERET CAPITAL LETTER LONG I..DESERET CAPITAL LETTER EW @@ -4180,9 +4205,20 @@ FF21..FF3A ; Changes_When_Lowercased # L& [26] FULLWIDTH LATIN CAPITAL LETTE 118A0..118BF ; Changes_When_Lowercased # L& [32] WARANG CITI CAPITAL LETTER NGAA..WARANG CITI CAPITAL LETTER VIYO 16E40..16E5F ; Changes_When_Lowercased # L& [32] MEDEFAIDRIN CAPITAL LETTER M..MEDEFAIDRIN CAPITAL LETTER Y 16EA0..16EB8 ; Changes_When_Lowercased # L& [25] BERIA ERFE CAPITAL LETTER ARKAB..BERIA ERFE CAPITAL LETTER AY +1DF68 ; Changes_When_Lowercased # L& LATIN CAPITAL LETTER PHONOTYPIC A WITH SWASH +1DF6A ; Changes_When_Lowercased # L& LATIN CAPITAL LETTER PHONOTYPIC ROUNDTOP A +1DF6C ; Changes_When_Lowercased # L& LATIN CAPITAL LETTER REVERSED SCRUPLE +1DF6E ; Changes_When_Lowercased # L& LATIN CAPITAL LETTER PHONOTYPIC DIPHTHONG AI +1DF72 ; Changes_When_Lowercased # L& LATIN CAPITAL LETTER O WITH CURL +1DF74 ; Changes_When_Lowercased # L& LATIN CAPITAL LETTER CLOSED OMEGA WITH LONG STEM +1DF76 ; Changes_When_Lowercased # L& LATIN CAPITAL LETTER TURNED CLOSED OMEGA +1DF78 ; Changes_When_Lowercased # L& LATIN CAPITAL LETTER PHONOTYPIC TH +1DF7A ; Changes_When_Lowercased # L& LATIN CAPITAL LETTER U WITH HOOK TAIL +1DF7C ; Changes_When_Lowercased # L& LATIN CAPITAL LETTER U WITH NOTCH AT BOTTOM +1DF7E ; Changes_When_Lowercased # L& LATIN CAPITAL LETTER REVERSED ENLARGED SMALL U 1E900..1E921 ; Changes_When_Lowercased # L& [34] ADLAM CAPITAL LETTER ALIF..ADLAM CAPITAL LETTER SHA -# Total code points: 1488 +# Total code points: 1500 # ================================================ @@ -4344,6 +4380,7 @@ FF21..FF3A ; Changes_When_Lowercased # L& [26] FULLWIDTH LATIN CAPITAL LETTE 026F ; Changes_When_Uppercased # L& LATIN SMALL LETTER TURNED M 0271..0272 ; Changes_When_Uppercased # L& [2] LATIN SMALL LETTER M WITH HOOK..LATIN SMALL LETTER N WITH LEFT HOOK 0275 ; Changes_When_Uppercased # L& LATIN SMALL LETTER BARRED O +0277 ; Changes_When_Uppercased # L& LATIN SMALL LETTER CLOSED OMEGA 027D ; Changes_When_Uppercased # L& LATIN SMALL LETTER R WITH TAIL 0280 ; Changes_When_Uppercased # L& LATIN LETTER SMALL CAPITAL R 0282..0283 ; Changes_When_Uppercased # L& [2] LATIN SMALL LETTER S WITH HOOK..LATIN SMALL LETTER ESH @@ -4824,9 +4861,20 @@ FF41..FF5A ; Changes_When_Uppercased # L& [26] FULLWIDTH LATIN SMALL LETTER 118C0..118DF ; Changes_When_Uppercased # L& [32] WARANG CITI SMALL LETTER NGAA..WARANG CITI SMALL LETTER VIYO 16E60..16E7F ; Changes_When_Uppercased # L& [32] MEDEFAIDRIN SMALL LETTER M..MEDEFAIDRIN SMALL LETTER Y 16EBB..16ED3 ; Changes_When_Uppercased # L& [25] BERIA ERFE SMALL LETTER ARKAB..BERIA ERFE SMALL LETTER AY +1DF69 ; Changes_When_Uppercased # L& LATIN SMALL LETTER PHONOTYPIC A WITH SWASH +1DF6B ; Changes_When_Uppercased # L& LATIN SMALL LETTER PHONOTYPIC ROUNDTOP A +1DF6D ; Changes_When_Uppercased # L& LATIN SMALL LETTER REVERSED SCRUPLE +1DF6F ; Changes_When_Uppercased # L& LATIN SMALL LETTER PHONOTYPIC DIPHTHONG AI +1DF73 ; Changes_When_Uppercased # L& LATIN SMALL LETTER O WITH CURL +1DF75 ; Changes_When_Uppercased # L& LATIN SMALL LETTER CLOSED OMEGA WITH LONG STEM +1DF77 ; Changes_When_Uppercased # L& LATIN SMALL LETTER TURNED CLOSED OMEGA +1DF79 ; Changes_When_Uppercased # L& LATIN SMALL LETTER PHONOTYPIC TH +1DF7B ; Changes_When_Uppercased # L& LATIN SMALL LETTER U WITH HOOK TAIL +1DF7D ; Changes_When_Uppercased # L& LATIN SMALL LETTER U WITH NOTCH AT BOTTOM +1DF7F ; Changes_When_Uppercased # L& LATIN SMALL LETTER REVERSED U 1E922..1E943 ; Changes_When_Uppercased # L& [34] ADLAM SMALL LETTER ALIF..ADLAM SMALL LETTER SHA -# Total code points: 1580 +# Total code points: 1592 # ================================================ @@ -4989,6 +5037,7 @@ FF41..FF5A ; Changes_When_Uppercased # L& [26] FULLWIDTH LATIN SMALL LETTER 026F ; Changes_When_Titlecased # L& LATIN SMALL LETTER TURNED M 0271..0272 ; Changes_When_Titlecased # L& [2] LATIN SMALL LETTER M WITH HOOK..LATIN SMALL LETTER N WITH LEFT HOOK 0275 ; Changes_When_Titlecased # L& LATIN SMALL LETTER BARRED O +0277 ; Changes_When_Titlecased # L& LATIN SMALL LETTER CLOSED OMEGA 027D ; Changes_When_Titlecased # L& LATIN SMALL LETTER R WITH TAIL 0280 ; Changes_When_Titlecased # L& LATIN LETTER SMALL CAPITAL R 0282..0283 ; Changes_When_Titlecased # L& [2] LATIN SMALL LETTER S WITH HOOK..LATIN SMALL LETTER ESH @@ -5467,9 +5516,20 @@ FF41..FF5A ; Changes_When_Titlecased # L& [26] FULLWIDTH LATIN SMALL LETTER 118C0..118DF ; Changes_When_Titlecased # L& [32] WARANG CITI SMALL LETTER NGAA..WARANG CITI SMALL LETTER VIYO 16E60..16E7F ; Changes_When_Titlecased # L& [32] MEDEFAIDRIN SMALL LETTER M..MEDEFAIDRIN SMALL LETTER Y 16EBB..16ED3 ; Changes_When_Titlecased # L& [25] BERIA ERFE SMALL LETTER ARKAB..BERIA ERFE SMALL LETTER AY +1DF69 ; Changes_When_Titlecased # L& LATIN SMALL LETTER PHONOTYPIC A WITH SWASH +1DF6B ; Changes_When_Titlecased # L& LATIN SMALL LETTER PHONOTYPIC ROUNDTOP A +1DF6D ; Changes_When_Titlecased # L& LATIN SMALL LETTER REVERSED SCRUPLE +1DF6F ; Changes_When_Titlecased # L& LATIN SMALL LETTER PHONOTYPIC DIPHTHONG AI +1DF73 ; Changes_When_Titlecased # L& LATIN SMALL LETTER O WITH CURL +1DF75 ; Changes_When_Titlecased # L& LATIN SMALL LETTER CLOSED OMEGA WITH LONG STEM +1DF77 ; Changes_When_Titlecased # L& LATIN SMALL LETTER TURNED CLOSED OMEGA +1DF79 ; Changes_When_Titlecased # L& LATIN SMALL LETTER PHONOTYPIC TH +1DF7B ; Changes_When_Titlecased # L& LATIN SMALL LETTER U WITH HOOK TAIL +1DF7D ; Changes_When_Titlecased # L& LATIN SMALL LETTER U WITH NOTCH AT BOTTOM +1DF7F ; Changes_When_Titlecased # L& LATIN SMALL LETTER REVERSED U 1E922..1E943 ; Changes_When_Titlecased # L& [34] ADLAM SMALL LETTER ALIF..ADLAM SMALL LETTER SHA -# Total code points: 1507 +# Total code points: 1519 # ================================================ @@ -6090,7 +6150,7 @@ A7D4 ; Changes_When_Casefolded # L& LATIN CAPITAL LETTER DOUBLE W A7D6 ; Changes_When_Casefolded # L& LATIN CAPITAL LETTER MIDDLE SCOTS S A7D8 ; Changes_When_Casefolded # L& LATIN CAPITAL LETTER SIGMOID S A7DA ; Changes_When_Casefolded # L& LATIN CAPITAL LETTER LAMBDA -A7DC ; Changes_When_Casefolded # L& LATIN CAPITAL LETTER LAMBDA WITH STROKE +A7DC..A7DD ; Changes_When_Casefolded # L& [2] LATIN CAPITAL LETTER LAMBDA WITH STROKE..LATIN CAPITAL LETTER CLOSED OMEGA A7F5 ; Changes_When_Casefolded # L& LATIN CAPITAL LETTER REVERSED HALF H AB70..ABBF ; Changes_When_Casefolded # L& [80] CHEROKEE SMALL LETTER A..CHEROKEE SMALL LETTER YA FB00..FB06 ; Changes_When_Casefolded # L& [7] LATIN SMALL LIGATURE FF..LATIN SMALL LIGATURE ST @@ -6107,9 +6167,20 @@ FF21..FF3A ; Changes_When_Casefolded # L& [26] FULLWIDTH LATIN CAPITAL LETTE 118A0..118BF ; Changes_When_Casefolded # L& [32] WARANG CITI CAPITAL LETTER NGAA..WARANG CITI CAPITAL LETTER VIYO 16E40..16E5F ; Changes_When_Casefolded # L& [32] MEDEFAIDRIN CAPITAL LETTER M..MEDEFAIDRIN CAPITAL LETTER Y 16EA0..16EB8 ; Changes_When_Casefolded # L& [25] BERIA ERFE CAPITAL LETTER ARKAB..BERIA ERFE CAPITAL LETTER AY +1DF68 ; Changes_When_Casefolded # L& LATIN CAPITAL LETTER PHONOTYPIC A WITH SWASH +1DF6A ; Changes_When_Casefolded # L& LATIN CAPITAL LETTER PHONOTYPIC ROUNDTOP A +1DF6C ; Changes_When_Casefolded # L& LATIN CAPITAL LETTER REVERSED SCRUPLE +1DF6E ; Changes_When_Casefolded # L& LATIN CAPITAL LETTER PHONOTYPIC DIPHTHONG AI +1DF72 ; Changes_When_Casefolded # L& LATIN CAPITAL LETTER O WITH CURL +1DF74 ; Changes_When_Casefolded # L& LATIN CAPITAL LETTER CLOSED OMEGA WITH LONG STEM +1DF76 ; Changes_When_Casefolded # L& LATIN CAPITAL LETTER TURNED CLOSED OMEGA +1DF78 ; Changes_When_Casefolded # L& LATIN CAPITAL LETTER PHONOTYPIC TH +1DF7A ; Changes_When_Casefolded # L& LATIN CAPITAL LETTER U WITH HOOK TAIL +1DF7C ; Changes_When_Casefolded # L& LATIN CAPITAL LETTER U WITH NOTCH AT BOTTOM +1DF7E ; Changes_When_Casefolded # L& LATIN CAPITAL LETTER REVERSED ENLARGED SMALL U 1E900..1E921 ; Changes_When_Casefolded # L& [34] ADLAM CAPITAL LETTER ALIF..ADLAM CAPITAL LETTER SHA -# Total code points: 1561 +# Total code points: 1573 # ================================================ @@ -6141,6 +6212,7 @@ FF21..FF3A ; Changes_When_Casefolded # L& [26] FULLWIDTH LATIN CAPITAL LETTE 026F ; Changes_When_Casemapped # L& LATIN SMALL LETTER TURNED M 0271..0272 ; Changes_When_Casemapped # L& [2] LATIN SMALL LETTER M WITH HOOK..LATIN SMALL LETTER N WITH LEFT HOOK 0275 ; Changes_When_Casemapped # L& LATIN SMALL LETTER BARRED O +0277 ; Changes_When_Casemapped # L& LATIN SMALL LETTER CLOSED OMEGA 027D ; Changes_When_Casemapped # L& LATIN SMALL LETTER R WITH TAIL 0280 ; Changes_When_Casemapped # L& LATIN LETTER SMALL CAPITAL R 0282..0283 ; Changes_When_Casemapped # L& [2] LATIN SMALL LETTER S WITH HOOK..LATIN SMALL LETTER ESH @@ -6221,7 +6293,7 @@ A779..A787 ; Changes_When_Casemapped # L& [15] LATIN CAPITAL LETTER INSULAR A78B..A78D ; Changes_When_Casemapped # L& [3] LATIN CAPITAL LETTER SALTILLO..LATIN CAPITAL LETTER TURNED H A790..A794 ; Changes_When_Casemapped # L& [5] LATIN CAPITAL LETTER N WITH DESCENDER..LATIN SMALL LETTER C WITH PALATAL HOOK A796..A7AE ; Changes_When_Casemapped # L& [25] LATIN CAPITAL LETTER B WITH FLOURISH..LATIN CAPITAL LETTER SMALL CAPITAL I -A7B0..A7DC ; Changes_When_Casemapped # L& [45] LATIN CAPITAL LETTER TURNED K..LATIN CAPITAL LETTER LAMBDA WITH STROKE +A7B0..A7DD ; Changes_When_Casemapped # L& [46] LATIN CAPITAL LETTER TURNED K..LATIN CAPITAL LETTER CLOSED OMEGA A7F5..A7F6 ; Changes_When_Casemapped # L& [2] LATIN CAPITAL LETTER REVERSED HALF H..LATIN SMALL LETTER REVERSED HALF H AB53 ; Changes_When_Casemapped # L& LATIN SMALL LETTER CHI AB70..ABBF ; Changes_When_Casemapped # L& [80] CHEROKEE SMALL LETTER A..CHEROKEE SMALL LETTER YA @@ -6248,9 +6320,11 @@ FF41..FF5A ; Changes_When_Casemapped # L& [26] FULLWIDTH LATIN SMALL LETTER 16E40..16E7F ; Changes_When_Casemapped # L& [64] MEDEFAIDRIN CAPITAL LETTER M..MEDEFAIDRIN SMALL LETTER Y 16EA0..16EB8 ; Changes_When_Casemapped # L& [25] BERIA ERFE CAPITAL LETTER ARKAB..BERIA ERFE CAPITAL LETTER AY 16EBB..16ED3 ; Changes_When_Casemapped # L& [25] BERIA ERFE SMALL LETTER ARKAB..BERIA ERFE SMALL LETTER AY +1DF68..1DF6F ; Changes_When_Casemapped # L& [8] LATIN CAPITAL LETTER PHONOTYPIC A WITH SWASH..LATIN SMALL LETTER PHONOTYPIC DIPHTHONG AI +1DF72..1DF7F ; Changes_When_Casemapped # L& [14] LATIN CAPITAL LETTER O WITH CURL..LATIN SMALL LETTER REVERSED U 1E900..1E943 ; Changes_When_Casemapped # L& [68] ADLAM CAPITAL LETTER ALIF..ADLAM SMALL LETTER SHA -# Total code points: 3037 +# Total code points: 3061 # ================================================ @@ -6627,7 +6701,7 @@ A771..A787 ; ID_Start # L& [23] LATIN SMALL LETTER DUM..LATIN SMALL LETTER I A788 ; ID_Start # Lm MODIFIER LETTER LOW CIRCUMFLEX ACCENT A78B..A78E ; ID_Start # L& [4] LATIN CAPITAL LETTER SALTILLO..LATIN SMALL LETTER L WITH RETROFLEX HOOK AND BELT A78F ; ID_Start # Lo LATIN LETTER SINOLOGICAL DOT -A790..A7DC ; ID_Start # L& [77] LATIN CAPITAL LETTER N WITH DESCENDER..LATIN CAPITAL LETTER LAMBDA WITH STROKE +A790..A7DD ; ID_Start # L& [78] LATIN CAPITAL LETTER N WITH DESCENDER..LATIN CAPITAL LETTER CLOSED OMEGA A7F1..A7F4 ; ID_Start # Lm [4] MODIFIER LETTER CAPITAL S..MODIFIER LETTER CAPITAL Q A7F5..A7F6 ; ID_Start # L& [2] LATIN CAPITAL LETTER REVERSED HALF H..LATIN SMALL LETTER REVERSED HALF H A7F7 ; ID_Start # Lo LATIN EPIGRAPHIC LETTER SIDEWAYS I @@ -6977,6 +7051,8 @@ FFDA..FFDC ; ID_Start # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGUL 1DF0A ; ID_Start # Lo LATIN LETTER RETROFLEX CLICK WITH RETROFLEX HOOK 1DF0B..1DF1E ; ID_Start # L& [20] LATIN SMALL LETTER ESH WITH DOUBLE BAR..LATIN SMALL LETTER S WITH CURL 1DF25..1DF2A ; ID_Start # L& [6] LATIN SMALL LETTER D WITH MID-HEIGHT LEFT HOOK..LATIN SMALL LETTER T WITH MID-HEIGHT LEFT HOOK +1DF68..1DF7F ; ID_Start # L& [24] LATIN CAPITAL LETTER PHONOTYPIC A WITH SWASH..LATIN SMALL LETTER REVERSED U +1DF80..1DF81 ; ID_Start # Lo [2] LATIN CAPITAL LETTER A WITH TOPBAR..LATIN CAPITAL LETTER E WITH BENT TOPBAR 1E030..1E06D ; ID_Start # Lm [62] MODIFIER LETTER CYRILLIC SMALL A..MODIFIER LETTER CYRILLIC SMALL STRAIGHT U WITH STROKE 1E100..1E12C ; ID_Start # Lo [45] NYIAKENG PUACHUE HMONG LETTER MA..NYIAKENG PUACHUE HMONG LETTER W 1E137..1E13D ; ID_Start # Lm [7] NYIAKENG PUACHUE HMONG SIGN FOR PERSON..NYIAKENG PUACHUE HMONG SYLLABLE LENGTHENER @@ -7044,7 +7120,7 @@ FFDA..FFDC ; ID_Start # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGUL 30000..3134A ; ID_Start # Lo [4939] CJK UNIFIED IDEOGRAPH-30000..CJK UNIFIED IDEOGRAPH-3134A 31350..33479 ; ID_Start # Lo [8490] CJK UNIFIED IDEOGRAPH-31350..CJK UNIFIED IDEOGRAPH-33479 -# Total code points: 145935 +# Total code points: 145962 # ================================================ @@ -7730,7 +7806,7 @@ A771..A787 ; ID_Continue # L& [23] LATIN SMALL LETTER DUM..LATIN SMALL LETTE A788 ; ID_Continue # Lm MODIFIER LETTER LOW CIRCUMFLEX ACCENT A78B..A78E ; ID_Continue # L& [4] LATIN CAPITAL LETTER SALTILLO..LATIN SMALL LETTER L WITH RETROFLEX HOOK AND BELT A78F ; ID_Continue # Lo LATIN LETTER SINOLOGICAL DOT -A790..A7DC ; ID_Continue # L& [77] LATIN CAPITAL LETTER N WITH DESCENDER..LATIN CAPITAL LETTER LAMBDA WITH STROKE +A790..A7DD ; ID_Continue # L& [78] LATIN CAPITAL LETTER N WITH DESCENDER..LATIN CAPITAL LETTER CLOSED OMEGA A7F1..A7F4 ; ID_Continue # Lm [4] MODIFIER LETTER CAPITAL S..MODIFIER LETTER CAPITAL Q A7F5..A7F6 ; ID_Continue # L& [2] LATIN CAPITAL LETTER REVERSED HALF H..LATIN SMALL LETTER REVERSED HALF H A7F7 ; ID_Continue # Lo LATIN EPIGRAPHIC LETTER SIDEWAYS I @@ -8393,6 +8469,8 @@ FFDA..FFDC ; ID_Continue # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HAN 1DF0A ; ID_Continue # Lo LATIN LETTER RETROFLEX CLICK WITH RETROFLEX HOOK 1DF0B..1DF1E ; ID_Continue # L& [20] LATIN SMALL LETTER ESH WITH DOUBLE BAR..LATIN SMALL LETTER S WITH CURL 1DF25..1DF2A ; ID_Continue # L& [6] LATIN SMALL LETTER D WITH MID-HEIGHT LEFT HOOK..LATIN SMALL LETTER T WITH MID-HEIGHT LEFT HOOK +1DF68..1DF7F ; ID_Continue # L& [24] LATIN CAPITAL LETTER PHONOTYPIC A WITH SWASH..LATIN SMALL LETTER REVERSED U +1DF80..1DF81 ; ID_Continue # Lo [2] LATIN CAPITAL LETTER A WITH TOPBAR..LATIN CAPITAL LETTER E WITH BENT TOPBAR 1E000..1E006 ; ID_Continue # Mn [7] COMBINING GLAGOLITIC LETTER AZU..COMBINING GLAGOLITIC LETTER ZHIVETE 1E008..1E018 ; ID_Continue # Mn [17] COMBINING GLAGOLITIC LETTER ZEMLJA..COMBINING GLAGOLITIC LETTER HERU 1E01B..1E021 ; ID_Continue # Mn [7] COMBINING GLAGOLITIC LETTER SHTA..COMBINING GLAGOLITIC LETTER YATI @@ -8484,7 +8562,7 @@ FFDA..FFDC ; ID_Continue # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HAN 31350..33479 ; ID_Continue # Lo [8490] CJK UNIFIED IDEOGRAPH-31350..CJK UNIFIED IDEOGRAPH-33479 E0100..E01EF ; ID_Continue # Mn [240] VARIATION SELECTOR-17..VARIATION SELECTOR-256 -# Total code points: 149273 +# Total code points: 149300 # ================================================ @@ -8857,7 +8935,7 @@ A771..A787 ; XID_Start # L& [23] LATIN SMALL LETTER DUM..LATIN SMALL LETTER A788 ; XID_Start # Lm MODIFIER LETTER LOW CIRCUMFLEX ACCENT A78B..A78E ; XID_Start # L& [4] LATIN CAPITAL LETTER SALTILLO..LATIN SMALL LETTER L WITH RETROFLEX HOOK AND BELT A78F ; XID_Start # Lo LATIN LETTER SINOLOGICAL DOT -A790..A7DC ; XID_Start # L& [77] LATIN CAPITAL LETTER N WITH DESCENDER..LATIN CAPITAL LETTER LAMBDA WITH STROKE +A790..A7DD ; XID_Start # L& [78] LATIN CAPITAL LETTER N WITH DESCENDER..LATIN CAPITAL LETTER CLOSED OMEGA A7F1..A7F4 ; XID_Start # Lm [4] MODIFIER LETTER CAPITAL S..MODIFIER LETTER CAPITAL Q A7F5..A7F6 ; XID_Start # L& [2] LATIN CAPITAL LETTER REVERSED HALF H..LATIN SMALL LETTER REVERSED HALF H A7F7 ; XID_Start # Lo LATIN EPIGRAPHIC LETTER SIDEWAYS I @@ -9212,6 +9290,8 @@ FFDA..FFDC ; XID_Start # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGU 1DF0A ; XID_Start # Lo LATIN LETTER RETROFLEX CLICK WITH RETROFLEX HOOK 1DF0B..1DF1E ; XID_Start # L& [20] LATIN SMALL LETTER ESH WITH DOUBLE BAR..LATIN SMALL LETTER S WITH CURL 1DF25..1DF2A ; XID_Start # L& [6] LATIN SMALL LETTER D WITH MID-HEIGHT LEFT HOOK..LATIN SMALL LETTER T WITH MID-HEIGHT LEFT HOOK +1DF68..1DF7F ; XID_Start # L& [24] LATIN CAPITAL LETTER PHONOTYPIC A WITH SWASH..LATIN SMALL LETTER REVERSED U +1DF80..1DF81 ; XID_Start # Lo [2] LATIN CAPITAL LETTER A WITH TOPBAR..LATIN CAPITAL LETTER E WITH BENT TOPBAR 1E030..1E06D ; XID_Start # Lm [62] MODIFIER LETTER CYRILLIC SMALL A..MODIFIER LETTER CYRILLIC SMALL STRAIGHT U WITH STROKE 1E100..1E12C ; XID_Start # Lo [45] NYIAKENG PUACHUE HMONG LETTER MA..NYIAKENG PUACHUE HMONG LETTER W 1E137..1E13D ; XID_Start # Lm [7] NYIAKENG PUACHUE HMONG SIGN FOR PERSON..NYIAKENG PUACHUE HMONG SYLLABLE LENGTHENER @@ -9279,7 +9359,7 @@ FFDA..FFDC ; XID_Start # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGU 30000..3134A ; XID_Start # Lo [4939] CJK UNIFIED IDEOGRAPH-30000..CJK UNIFIED IDEOGRAPH-3134A 31350..33479 ; XID_Start # Lo [8490] CJK UNIFIED IDEOGRAPH-31350..CJK UNIFIED IDEOGRAPH-33479 -# Total code points: 145912 +# Total code points: 145939 # ================================================ @@ -9960,7 +10040,7 @@ A771..A787 ; XID_Continue # L& [23] LATIN SMALL LETTER DUM..LATIN SMALL LETT A788 ; XID_Continue # Lm MODIFIER LETTER LOW CIRCUMFLEX ACCENT A78B..A78E ; XID_Continue # L& [4] LATIN CAPITAL LETTER SALTILLO..LATIN SMALL LETTER L WITH RETROFLEX HOOK AND BELT A78F ; XID_Continue # Lo LATIN LETTER SINOLOGICAL DOT -A790..A7DC ; XID_Continue # L& [77] LATIN CAPITAL LETTER N WITH DESCENDER..LATIN CAPITAL LETTER LAMBDA WITH STROKE +A790..A7DD ; XID_Continue # L& [78] LATIN CAPITAL LETTER N WITH DESCENDER..LATIN CAPITAL LETTER CLOSED OMEGA A7F1..A7F4 ; XID_Continue # Lm [4] MODIFIER LETTER CAPITAL S..MODIFIER LETTER CAPITAL Q A7F5..A7F6 ; XID_Continue # L& [2] LATIN CAPITAL LETTER REVERSED HALF H..LATIN SMALL LETTER REVERSED HALF H A7F7 ; XID_Continue # Lo LATIN EPIGRAPHIC LETTER SIDEWAYS I @@ -10629,6 +10709,8 @@ FFDA..FFDC ; XID_Continue # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HA 1DF0A ; XID_Continue # Lo LATIN LETTER RETROFLEX CLICK WITH RETROFLEX HOOK 1DF0B..1DF1E ; XID_Continue # L& [20] LATIN SMALL LETTER ESH WITH DOUBLE BAR..LATIN SMALL LETTER S WITH CURL 1DF25..1DF2A ; XID_Continue # L& [6] LATIN SMALL LETTER D WITH MID-HEIGHT LEFT HOOK..LATIN SMALL LETTER T WITH MID-HEIGHT LEFT HOOK +1DF68..1DF7F ; XID_Continue # L& [24] LATIN CAPITAL LETTER PHONOTYPIC A WITH SWASH..LATIN SMALL LETTER REVERSED U +1DF80..1DF81 ; XID_Continue # Lo [2] LATIN CAPITAL LETTER A WITH TOPBAR..LATIN CAPITAL LETTER E WITH BENT TOPBAR 1E000..1E006 ; XID_Continue # Mn [7] COMBINING GLAGOLITIC LETTER AZU..COMBINING GLAGOLITIC LETTER ZHIVETE 1E008..1E018 ; XID_Continue # Mn [17] COMBINING GLAGOLITIC LETTER ZEMLJA..COMBINING GLAGOLITIC LETTER HERU 1E01B..1E021 ; XID_Continue # Mn [7] COMBINING GLAGOLITIC LETTER SHTA..COMBINING GLAGOLITIC LETTER YATI @@ -10720,7 +10802,7 @@ FFDA..FFDC ; XID_Continue # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HA 31350..33479 ; XID_Continue # Lo [8490] CJK UNIFIED IDEOGRAPH-31350..CJK UNIFIED IDEOGRAPH-33479 E0100..E01EF ; XID_Continue # Mn [240] VARIATION SELECTOR-17..VARIATION SELECTOR-256 -# Total code points: 149254 +# Total code points: 149281 # ================================================ @@ -12044,6 +12126,9 @@ E0100..E01EF ; Grapheme_Extend # Mn [240] VARIATION SELECTOR-17..VARIATION SELE 2E5B ; Grapheme_Base # Ps BOTTOM HALF LEFT PARENTHESIS 2E5C ; Grapheme_Base # Pe BOTTOM HALF RIGHT PARENTHESIS 2E5D ; Grapheme_Base # Pd OBLIQUE HYPHEN +2E60..2E61 ; Grapheme_Base # Po [2] WIGGLY EXCLAMATION MARK..INVERTED WIGGLY EXCLAMATION MARK +2E62 ; Grapheme_Base # Ps LEFT PARENTHESIS WITH MIDDLE RING +2E63 ; Grapheme_Base # Pe RIGHT PARENTHESIS WITH MIDDLE RING 2E80..2E99 ; Grapheme_Base # So [26] CJK RADICAL REPEAT..CJK RADICAL RAP 2E9B..2EF3 ; Grapheme_Base # So [89] CJK RADICAL CHOKE..CJK RADICAL C-SIMPLIFIED TURTLE 2F00..2FD5 ; Grapheme_Base # So [214] KANGXI RADICAL ONE..KANGXI RADICAL FLUTE @@ -12150,7 +12235,7 @@ A788 ; Grapheme_Base # Lm MODIFIER LETTER LOW CIRCUMFLEX ACCENT A789..A78A ; Grapheme_Base # Sk [2] MODIFIER LETTER COLON..MODIFIER LETTER SHORT EQUALS SIGN A78B..A78E ; Grapheme_Base # L& [4] LATIN CAPITAL LETTER SALTILLO..LATIN SMALL LETTER L WITH RETROFLEX HOOK AND BELT A78F ; Grapheme_Base # Lo LATIN LETTER SINOLOGICAL DOT -A790..A7DC ; Grapheme_Base # L& [77] LATIN CAPITAL LETTER N WITH DESCENDER..LATIN CAPITAL LETTER LAMBDA WITH STROKE +A790..A7DD ; Grapheme_Base # L& [78] LATIN CAPITAL LETTER N WITH DESCENDER..LATIN CAPITAL LETTER CLOSED OMEGA A7F1..A7F4 ; Grapheme_Base # Lm [4] MODIFIER LETTER CAPITAL S..MODIFIER LETTER CAPITAL Q A7F5..A7F6 ; Grapheme_Base # L& [2] LATIN CAPITAL LETTER REVERSED HALF H..LATIN SMALL LETTER REVERSED HALF H A7F7 ; Grapheme_Base # Lo LATIN EPIGRAPHIC LETTER SIDEWAYS I @@ -12888,6 +12973,8 @@ FFFC..FFFD ; Grapheme_Base # So [2] OBJECT REPLACEMENT CHARACTER..REPLACEME 1DF0A ; Grapheme_Base # Lo LATIN LETTER RETROFLEX CLICK WITH RETROFLEX HOOK 1DF0B..1DF1E ; Grapheme_Base # L& [20] LATIN SMALL LETTER ESH WITH DOUBLE BAR..LATIN SMALL LETTER S WITH CURL 1DF25..1DF2A ; Grapheme_Base # L& [6] LATIN SMALL LETTER D WITH MID-HEIGHT LEFT HOOK..LATIN SMALL LETTER T WITH MID-HEIGHT LEFT HOOK +1DF68..1DF7F ; Grapheme_Base # L& [24] LATIN CAPITAL LETTER PHONOTYPIC A WITH SWASH..LATIN SMALL LETTER REVERSED U +1DF80..1DF81 ; Grapheme_Base # Lo [2] LATIN CAPITAL LETTER A WITH TOPBAR..LATIN CAPITAL LETTER E WITH BENT TOPBAR 1E030..1E06D ; Grapheme_Base # Lm [62] MODIFIER LETTER CYRILLIC SMALL A..MODIFIER LETTER CYRILLIC SMALL STRAIGHT U WITH STROKE 1E100..1E12C ; Grapheme_Base # Lo [45] NYIAKENG PUACHUE HMONG LETTER MA..NYIAKENG PUACHUE HMONG LETTER W 1E137..1E13D ; Grapheme_Base # Lm [7] NYIAKENG PUACHUE HMONG SIGN FOR PERSON..NYIAKENG PUACHUE HMONG SYLLABLE LENGTHENER @@ -13016,7 +13103,7 @@ FFFC..FFFD ; Grapheme_Base # So [2] OBJECT REPLACEMENT CHARACTER..REPLACEME 30000..3134A ; Grapheme_Base # Lo [4939] CJK UNIFIED IDEOGRAPH-30000..CJK UNIFIED IDEOGRAPH-3134A 31350..33479 ; Grapheme_Base # Lo [8490] CJK UNIFIED IDEOGRAPH-31350..CJK UNIFIED IDEOGRAPH-33479 -# Total code points: 157523 +# Total code points: 157554 # ================================================ diff --git a/unicodetools/data/ucd/dev/DerivedNormalizationProps.txt b/unicodetools/data/ucd/dev/DerivedNormalizationProps.txt index 448ba69d6..04edf881a 100644 --- a/unicodetools/data/ucd/dev/DerivedNormalizationProps.txt +++ b/unicodetools/data/ucd/dev/DerivedNormalizationProps.txt @@ -1,5 +1,5 @@ # DerivedNormalizationProps-17.0.0.txt -# Date: 2025-01-27, 18:09:14 GMT +# Date: 2025-02-11, 13:48:10 GMT # © 2025 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. # For terms of use and license, see https://www.unicode.org/terms_of_use.html @@ -5457,6 +5457,7 @@ A7D6 ; NFKC_CF; A7D7 # L& LATIN CAPITAL LETTER MIDDLE S A7D8 ; NFKC_CF; A7D9 # L& LATIN CAPITAL LETTER SIGMOID S A7DA ; NFKC_CF; A7DB # L& LATIN CAPITAL LETTER LAMBDA A7DC ; NFKC_CF; 019B # L& LATIN CAPITAL LETTER LAMBDA WITH STROKE +A7DD ; NFKC_CF; 0277 # L& LATIN CAPITAL LETTER CLOSED OMEGA A7F1 ; NFKC_CF; 0073 # Lm MODIFIER LETTER CAPITAL S A7F2 ; NFKC_CF; 0063 # Lm MODIFIER LETTER CAPITAL C A7F3 ; NFKC_CF; 0066 # Lm MODIFIER LETTER CAPITAL F @@ -8255,6 +8256,17 @@ FFF0..FFF8 ; NFKC_CF; # Cn [9] ...... -# Total code points: 10583 +# Total code points: 10595 # ================================================ @@ -11620,6 +11632,7 @@ A7D6 ; NFKC_SCF; A7D7 # L& LATIN CAPITAL LETTER MIDDLE A7D8 ; NFKC_SCF; A7D9 # L& LATIN CAPITAL LETTER SIGMOID S A7DA ; NFKC_SCF; A7DB # L& LATIN CAPITAL LETTER LAMBDA A7DC ; NFKC_SCF; 019B # L& LATIN CAPITAL LETTER LAMBDA WITH STROKE +A7DD ; NFKC_SCF; 0277 # L& LATIN CAPITAL LETTER CLOSED OMEGA A7F1 ; NFKC_SCF; 0073 # Lm MODIFIER LETTER CAPITAL S A7F2 ; NFKC_SCF; 0063 # Lm MODIFIER LETTER CAPITAL C A7F3 ; NFKC_SCF; 0066 # Lm MODIFIER LETTER CAPITAL F @@ -14418,6 +14431,17 @@ FFF0..FFF8 ; NFKC_SCF; # Cn [9] ...... -# Total code points: 10545 +# Total code points: 10557 # ================================================ @@ -16118,7 +16142,7 @@ A7D4 ; Changes_When_NFKC_Casefolded # L& LATIN CAPITAL LETTER DOU A7D6 ; Changes_When_NFKC_Casefolded # L& LATIN CAPITAL LETTER MIDDLE SCOTS S A7D8 ; Changes_When_NFKC_Casefolded # L& LATIN CAPITAL LETTER SIGMOID S A7DA ; Changes_When_NFKC_Casefolded # L& LATIN CAPITAL LETTER LAMBDA -A7DC ; Changes_When_NFKC_Casefolded # L& LATIN CAPITAL LETTER LAMBDA WITH STROKE +A7DC..A7DD ; Changes_When_NFKC_Casefolded # L& [2] LATIN CAPITAL LETTER LAMBDA WITH STROKE..LATIN CAPITAL LETTER CLOSED OMEGA A7F1..A7F4 ; Changes_When_NFKC_Casefolded # Lm [4] MODIFIER LETTER CAPITAL S..MODIFIER LETTER CAPITAL Q A7F5 ; Changes_When_NFKC_Casefolded # L& LATIN CAPITAL LETTER REVERSED HALF H A7F8..A7F9 ; Changes_When_NFKC_Casefolded # Lm [2] MODIFIER LETTER CAPITAL H WITH STROKE..MODIFIER LETTER SMALL LIGATURE OE @@ -16309,6 +16333,17 @@ FFF0..FFF8 ; Changes_When_NFKC_Casefolded # Cn [9] ...... -# Total code points: 10583 +# Total code points: 10595 # EOF diff --git a/unicodetools/data/ucd/dev/EastAsianWidth.txt b/unicodetools/data/ucd/dev/EastAsianWidth.txt index a5c270b19..51528cc29 100644 --- a/unicodetools/data/ucd/dev/EastAsianWidth.txt +++ b/unicodetools/data/ucd/dev/EastAsianWidth.txt @@ -1,5 +1,5 @@ # EastAsianWidth-17.0.0.txt -# Date: 2025-01-27, 18:09:15 GMT +# Date: 2025-02-14, 01:57:25 GMT # © 2025 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. # For terms of use and license, see https://www.unicode.org/terms_of_use.html @@ -1432,6 +1432,9 @@ 2E5B ; N # Ps BOTTOM HALF LEFT PARENTHESIS 2E5C ; N # Pe BOTTOM HALF RIGHT PARENTHESIS 2E5D ; N # Pd OBLIQUE HYPHEN +2E60..2E61 ; N # Po [2] WIGGLY EXCLAMATION MARK..INVERTED WIGGLY EXCLAMATION MARK +2E62 ; N # Ps LEFT PARENTHESIS WITH MIDDLE RING +2E63 ; N # Pe RIGHT PARENTHESIS WITH MIDDLE RING 2E80..2E99 ; W # So [26] CJK RADICAL REPEAT..CJK RADICAL RAP 2E9B..2EF3 ; W # So [89] CJK RADICAL CHOKE..CJK RADICAL C-SIMPLIFIED TURTLE 2F00..2FD5 ; W # So [214] KANGXI RADICAL ONE..KANGXI RADICAL FLUTE @@ -1549,7 +1552,7 @@ A788 ; N # Lm MODIFIER LETTER LOW CIRCUMFLEX ACCENT A789..A78A ; N # Sk [2] MODIFIER LETTER COLON..MODIFIER LETTER SHORT EQUALS SIGN A78B..A78E ; N # L& [4] LATIN CAPITAL LETTER SALTILLO..LATIN SMALL LETTER L WITH RETROFLEX HOOK AND BELT A78F ; N # Lo LATIN LETTER SINOLOGICAL DOT -A790..A7DC ; N # L& [77] LATIN CAPITAL LETTER N WITH DESCENDER..LATIN CAPITAL LETTER LAMBDA WITH STROKE +A790..A7DD ; N # L& [78] LATIN CAPITAL LETTER N WITH DESCENDER..LATIN CAPITAL LETTER CLOSED OMEGA A7F1..A7F4 ; N # Lm [4] MODIFIER LETTER CAPITAL S..MODIFIER LETTER CAPITAL Q A7F5..A7F6 ; N # L& [2] LATIN CAPITAL LETTER REVERSED HALF H..LATIN SMALL LETTER REVERSED HALF H A7F7 ; N # Lo LATIN EPIGRAPHIC LETTER SIDEWAYS I @@ -2498,6 +2501,8 @@ FFFD ; A # So REPLACEMENT CHARACTER 1DF0A ; N # Lo LATIN LETTER RETROFLEX CLICK WITH RETROFLEX HOOK 1DF0B..1DF1E ; N # Ll [20] LATIN SMALL LETTER ESH WITH DOUBLE BAR..LATIN SMALL LETTER S WITH CURL 1DF25..1DF2A ; N # Ll [6] LATIN SMALL LETTER D WITH MID-HEIGHT LEFT HOOK..LATIN SMALL LETTER T WITH MID-HEIGHT LEFT HOOK +1DF68..1DF7F ; N # L& [24] LATIN CAPITAL LETTER PHONOTYPIC A WITH SWASH..LATIN SMALL LETTER REVERSED U +1DF80..1DF81 ; N # Lo [2] LATIN CAPITAL LETTER A WITH TOPBAR..LATIN CAPITAL LETTER E WITH BENT TOPBAR 1E000..1E006 ; N # Mn [7] COMBINING GLAGOLITIC LETTER AZU..COMBINING GLAGOLITIC LETTER ZHIVETE 1E008..1E018 ; N # Mn [17] COMBINING GLAGOLITIC LETTER ZEMLJA..COMBINING GLAGOLITIC LETTER HERU 1E01B..1E021 ; N # Mn [7] COMBINING GLAGOLITIC LETTER SHTA..COMBINING GLAGOLITIC LETTER YATI diff --git a/unicodetools/data/ucd/dev/LineBreak.txt b/unicodetools/data/ucd/dev/LineBreak.txt index e122f19e6..05f5c0c3c 100644 --- a/unicodetools/data/ucd/dev/LineBreak.txt +++ b/unicodetools/data/ucd/dev/LineBreak.txt @@ -1,5 +1,5 @@ # LineBreak-17.0.0.txt -# Date: 2025-01-27, 18:09:16 GMT +# Date: 2025-02-14, 01:57:28 GMT # © 2025 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. # For terms of use and license, see https://www.unicode.org/terms_of_use.html @@ -1413,6 +1413,9 @@ 2E5B ; OP # Ps BOTTOM HALF LEFT PARENTHESIS 2E5C ; CP # Pe BOTTOM HALF RIGHT PARENTHESIS 2E5D ; BA # Pd OBLIQUE HYPHEN +2E60..2E61 ; EX # Po [2] WIGGLY EXCLAMATION MARK..INVERTED WIGGLY EXCLAMATION MARK +2E62 ; OP # Ps LEFT PARENTHESIS WITH MIDDLE RING +2E63 ; CL # Pe RIGHT PARENTHESIS WITH MIDDLE RING 2E80..2E99 ; ID # So [26] CJK RADICAL REPEAT..CJK RADICAL RAP 2E9B..2EF3 ; ID # So [89] CJK RADICAL CHOKE..CJK RADICAL C-SIMPLIFIED TURTLE 2F00..2FD5 ; ID # So [214] KANGXI RADICAL ONE..KANGXI RADICAL FLUTE @@ -1576,7 +1579,7 @@ A788 ; AL # Lm MODIFIER LETTER LOW CIRCUMFLEX ACCENT A789..A78A ; AL # Sk [2] MODIFIER LETTER COLON..MODIFIER LETTER SHORT EQUALS SIGN A78B..A78E ; AL # L& [4] LATIN CAPITAL LETTER SALTILLO..LATIN SMALL LETTER L WITH RETROFLEX HOOK AND BELT A78F ; AL # Lo LATIN LETTER SINOLOGICAL DOT -A790..A7DC ; AL # L& [77] LATIN CAPITAL LETTER N WITH DESCENDER..LATIN CAPITAL LETTER LAMBDA WITH STROKE +A790..A7DD ; AL # L& [78] LATIN CAPITAL LETTER N WITH DESCENDER..LATIN CAPITAL LETTER CLOSED OMEGA A7F1..A7F4 ; AL # Lm [4] MODIFIER LETTER CAPITAL S..MODIFIER LETTER CAPITAL Q A7F5..A7F6 ; AL # L& [2] LATIN CAPITAL LETTER REVERSED HALF H..LATIN SMALL LETTER REVERSED HALF H A7F7 ; AL # Lo LATIN EPIGRAPHIC LETTER SIDEWAYS I @@ -3409,6 +3412,8 @@ FFFD ; AI # So REPLACEMENT CHARACTER 1DF0A ; AL # Lo LATIN LETTER RETROFLEX CLICK WITH RETROFLEX HOOK 1DF0B..1DF1E ; AL # Ll [20] LATIN SMALL LETTER ESH WITH DOUBLE BAR..LATIN SMALL LETTER S WITH CURL 1DF25..1DF2A ; AL # Ll [6] LATIN SMALL LETTER D WITH MID-HEIGHT LEFT HOOK..LATIN SMALL LETTER T WITH MID-HEIGHT LEFT HOOK +1DF68..1DF7F ; AL # L& [24] LATIN CAPITAL LETTER PHONOTYPIC A WITH SWASH..LATIN SMALL LETTER REVERSED U +1DF80..1DF81 ; AL # Lo [2] LATIN CAPITAL LETTER A WITH TOPBAR..LATIN CAPITAL LETTER E WITH BENT TOPBAR 1E000..1E006 ; CM # Mn [7] COMBINING GLAGOLITIC LETTER AZU..COMBINING GLAGOLITIC LETTER ZHIVETE 1E008..1E018 ; CM # Mn [17] COMBINING GLAGOLITIC LETTER ZEMLJA..COMBINING GLAGOLITIC LETTER HERU 1E01B..1E021 ; CM # Mn [7] COMBINING GLAGOLITIC LETTER SHTA..COMBINING GLAGOLITIC LETTER YATI diff --git a/unicodetools/data/ucd/dev/PropList.txt b/unicodetools/data/ucd/dev/PropList.txt index 37e888db9..5fc45a3c0 100644 --- a/unicodetools/data/ucd/dev/PropList.txt +++ b/unicodetools/data/ucd/dev/PropList.txt @@ -1,5 +1,5 @@ # PropList-17.0.0.txt -# Date: 2025-01-27, 18:09:27 GMT +# Date: 2025-02-11, 16:14:30 GMT # © 2025 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. # For terms of use and license, see https://www.unicode.org/terms_of_use.html @@ -167,6 +167,7 @@ FF63 ; Quotation_Mark # Pe HALFWIDTH RIGHT CORNER BRACKET 2E4C ; Terminal_Punctuation # Po MEDIEVAL COMMA 2E4E..2E4F ; Terminal_Punctuation # Po [2] PUNCTUS ELEVATUS MARK..CORNISH VERSE DIVIDER 2E53..2E54 ; Terminal_Punctuation # Po [2] MEDIEVAL EXCLAMATION MARK..MEDIEVAL QUESTION MARK +2E60..2E61 ; Terminal_Punctuation # Po [2] WIGGLY EXCLAMATION MARK..INVERTED WIGGLY EXCLAMATION MARK 3001..3002 ; Terminal_Punctuation # Po [2] IDEOGRAPHIC COMMA..IDEOGRAPHIC FULL STOP A4FE..A4FF ; Terminal_Punctuation # Po [2] LISU PUNCTUATION COMMA..LISU PUNCTUATION FULL STOP A60D..A60F ; Terminal_Punctuation # Po [3] VAI COMMA..VAI QUESTION MARK @@ -234,7 +235,7 @@ FF64 ; Terminal_Punctuation # Po HALFWIDTH IDEOGRAPHIC COMMA 1BC9F ; Terminal_Punctuation # Po DUPLOYAN PUNCTUATION CHINOOK FULL STOP 1DA87..1DA8A ; Terminal_Punctuation # Po [4] SIGNWRITING COMMA..SIGNWRITING COLON -# Total code points: 291 +# Total code points: 293 # ================================================ @@ -1576,6 +1577,7 @@ FF65 ; Other_ID_Continue # Po HALFWIDTH KATAKANA MIDDLE DOT 2E2E ; Sentence_Terminal # Po REVERSED QUESTION MARK 2E3C ; Sentence_Terminal # Po STENOGRAPHIC FULL STOP 2E53..2E54 ; Sentence_Terminal # Po [2] MEDIEVAL EXCLAMATION MARK..MEDIEVAL QUESTION MARK +2E60..2E61 ; Sentence_Terminal # Po [2] WIGGLY EXCLAMATION MARK..INVERTED WIGGLY EXCLAMATION MARK 3002 ; Sentence_Terminal # Po IDEOGRAPHIC FULL STOP A4FF ; Sentence_Terminal # Po LISU PUNCTUATION FULL STOP A60E..A60F ; Sentence_Terminal # Po [2] VAI FULL STOP..VAI QUESTION MARK @@ -1630,7 +1632,7 @@ FF61 ; Sentence_Terminal # Po HALFWIDTH IDEOGRAPHIC FULL STOP 1BC9F ; Sentence_Terminal # Po DUPLOYAN PUNCTUATION CHINOOK FULL STOP 1DA88 ; Sentence_Terminal # Po SIGNWRITING FULL STOP -# Total code points: 170 +# Total code points: 172 # ================================================ @@ -1880,7 +1882,11 @@ E0100..E01EF ; Variation_Selector # Mn [240] VARIATION SELECTOR-17..VARIATION S 2E5B ; Pattern_Syntax # Ps BOTTOM HALF LEFT PARENTHESIS 2E5C ; Pattern_Syntax # Pe BOTTOM HALF RIGHT PARENTHESIS 2E5D ; Pattern_Syntax # Pd OBLIQUE HYPHEN -2E5E..2E7F ; Pattern_Syntax # Cn [34] .. +2E5E..2E5F ; Pattern_Syntax # Cn [2] .. +2E60..2E61 ; Pattern_Syntax # Po [2] WIGGLY EXCLAMATION MARK..INVERTED WIGGLY EXCLAMATION MARK +2E62 ; Pattern_Syntax # Ps LEFT PARENTHESIS WITH MIDDLE RING +2E63 ; Pattern_Syntax # Pe RIGHT PARENTHESIS WITH MIDDLE RING +2E64..2E7F ; Pattern_Syntax # Cn [28] .. 3001..3003 ; Pattern_Syntax # Po [3] IDEOGRAPHIC COMMA..DITTO MARK 3008 ; Pattern_Syntax # Ps LEFT ANGLE BRACKET 3009 ; Pattern_Syntax # Pe RIGHT ANGLE BRACKET diff --git a/unicodetools/data/ucd/dev/Scripts.txt b/unicodetools/data/ucd/dev/Scripts.txt index 139c00537..fb970da29 100644 --- a/unicodetools/data/ucd/dev/Scripts.txt +++ b/unicodetools/data/ucd/dev/Scripts.txt @@ -1,5 +1,5 @@ # Scripts-17.0.0.txt -# Date: 2025-01-27, 18:09:39 GMT +# Date: 2025-02-14, 01:57:56 GMT # © 2025 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. # For terms of use and license, see https://www.unicode.org/terms_of_use.html @@ -356,6 +356,9 @@ 2E5B ; Common # Ps BOTTOM HALF LEFT PARENTHESIS 2E5C ; Common # Pe BOTTOM HALF RIGHT PARENTHESIS 2E5D ; Common # Pd OBLIQUE HYPHEN +2E60..2E61 ; Common # Po [2] WIGGLY EXCLAMATION MARK..INVERTED WIGGLY EXCLAMATION MARK +2E62 ; Common # Ps LEFT PARENTHESIS WITH MIDDLE RING +2E63 ; Common # Pe RIGHT PARENTHESIS WITH MIDDLE RING 2FF0..2FFF ; Common # So [16] IDEOGRAPHIC DESCRIPTION CHARACTER LEFT TO RIGHT..IDEOGRAPHIC DESCRIPTION CHARACTER ROTATION 3000 ; Common # Zs IDEOGRAPHIC SPACE 3001..3003 ; Common # Po [3] IDEOGRAPHIC COMMA..DITTO MARK @@ -638,7 +641,7 @@ FFFC..FFFD ; Common # So [2] OBJECT REPLACEMENT CHARACTER..REPLACEMENT CHAR E0001 ; Common # Cf LANGUAGE TAG E0020..E007F ; Common # Cf [96] TAG SPACE..CANCEL TAG -# Total code points: 9123 +# Total code points: 9127 # ================================================ @@ -681,7 +684,7 @@ A770 ; Latin # Lm MODIFIER LETTER US A771..A787 ; Latin # L& [23] LATIN SMALL LETTER DUM..LATIN SMALL LETTER INSULAR T A78B..A78E ; Latin # L& [4] LATIN CAPITAL LETTER SALTILLO..LATIN SMALL LETTER L WITH RETROFLEX HOOK AND BELT A78F ; Latin # Lo LATIN LETTER SINOLOGICAL DOT -A790..A7DC ; Latin # L& [77] LATIN CAPITAL LETTER N WITH DESCENDER..LATIN CAPITAL LETTER LAMBDA WITH STROKE +A790..A7DD ; Latin # L& [78] LATIN CAPITAL LETTER N WITH DESCENDER..LATIN CAPITAL LETTER CLOSED OMEGA A7F1..A7F4 ; Latin # Lm [4] MODIFIER LETTER CAPITAL S..MODIFIER LETTER CAPITAL Q A7F5..A7F6 ; Latin # L& [2] LATIN CAPITAL LETTER REVERSED HALF H..LATIN SMALL LETTER REVERSED HALF H A7F7 ; Latin # Lo LATIN EPIGRAPHIC LETTER SIDEWAYS I @@ -703,8 +706,10 @@ FF41..FF5A ; Latin # L& [26] FULLWIDTH LATIN SMALL LETTER A..FULLWIDTH LATIN 1DF0A ; Latin # Lo LATIN LETTER RETROFLEX CLICK WITH RETROFLEX HOOK 1DF0B..1DF1E ; Latin # L& [20] LATIN SMALL LETTER ESH WITH DOUBLE BAR..LATIN SMALL LETTER S WITH CURL 1DF25..1DF2A ; Latin # L& [6] LATIN SMALL LETTER D WITH MID-HEIGHT LEFT HOOK..LATIN SMALL LETTER T WITH MID-HEIGHT LEFT HOOK +1DF68..1DF7F ; Latin # L& [24] LATIN CAPITAL LETTER PHONOTYPIC A WITH SWASH..LATIN SMALL LETTER REVERSED U +1DF80..1DF81 ; Latin # Lo [2] LATIN CAPITAL LETTER A WITH TOPBAR..LATIN CAPITAL LETTER E WITH BENT TOPBAR -# Total code points: 1492 +# Total code points: 1519 # ================================================ diff --git a/unicodetools/data/ucd/dev/UnicodeData.txt b/unicodetools/data/ucd/dev/UnicodeData.txt index 908382199..68ab252f8 100644 --- a/unicodetools/data/ucd/dev/UnicodeData.txt +++ b/unicodetools/data/ucd/dev/UnicodeData.txt @@ -629,7 +629,7 @@ 0274;LATIN LETTER SMALL CAPITAL N;Ll;0;L;;;;;N;;;;; 0275;LATIN SMALL LETTER BARRED O;Ll;0;L;;;;;N;;;019F;;019F 0276;LATIN LETTER SMALL CAPITAL OE;Ll;0;L;;;;;N;LATIN LETTER SMALL CAPITAL O E;;;; -0277;LATIN SMALL LETTER CLOSED OMEGA;Ll;0;L;;;;;N;;;;; +0277;LATIN SMALL LETTER CLOSED OMEGA;Ll;0;L;;;;;N;;;A7DD;;A7DD 0278;LATIN SMALL LETTER PHI;Ll;0;L;;;;;N;;;;; 0279;LATIN SMALL LETTER TURNED R;Ll;0;L;;;;;N;;;;; 027A;LATIN SMALL LETTER TURNED R WITH LONG LEG;Ll;0;L;;;;;N;;;;; @@ -10933,6 +10933,10 @@ 2E5B;BOTTOM HALF LEFT PARENTHESIS;Ps;0;ON;;;;;Y;;;;; 2E5C;BOTTOM HALF RIGHT PARENTHESIS;Pe;0;ON;;;;;Y;;;;; 2E5D;OBLIQUE HYPHEN;Pd;0;ON;;;;;N;;;;; +2E60;WIGGLY EXCLAMATION MARK;Po;0;ON;;;;;N;;;;; +2E61;INVERTED WIGGLY EXCLAMATION MARK;Po;0;ON;;;;;N;;;;; +2E62;LEFT PARENTHESIS WITH MIDDLE RING;Ps;0;ON;;;;;Y;;;;; +2E63;RIGHT PARENTHESIS WITH MIDDLE RING;Pe;0;ON;;;;;Y;;;;; 2E80;CJK RADICAL REPEAT;So;0;ON;;;;;N;;;;; 2E81;CJK RADICAL CLIFF;So;0;ON;;;;;N;;;;; 2E82;CJK RADICAL SECOND ONE;So;0;ON;;;;;N;;;;; @@ -14323,6 +14327,7 @@ A7D9;LATIN SMALL LETTER SIGMOID S;Ll;0;L;;;;;N;;;A7D8;;A7D8 A7DA;LATIN CAPITAL LETTER LAMBDA;Lu;0;L;;;;;N;;;;A7DB; A7DB;LATIN SMALL LETTER LAMBDA;Ll;0;L;;;;;N;;;A7DA;;A7DA A7DC;LATIN CAPITAL LETTER LAMBDA WITH STROKE;Lu;0;L;;;;;N;;;;019B; +A7DD;LATIN CAPITAL LETTER CLOSED OMEGA;Lu;0;L;;;;;N;;;;0277; A7F1;MODIFIER LETTER CAPITAL S;Lm;0;L; 0053;;;;N;;;;; A7F2;MODIFIER LETTER CAPITAL C;Lm;0;L; 0043;;;;N;;;;; A7F3;MODIFIER LETTER CAPITAL F;Lm;0;L; 0046;;;;N;;;;; @@ -36078,6 +36083,32 @@ FFFD;REPLACEMENT CHARACTER;So;0;ON;;;;;N;;;;; 1DF28;LATIN SMALL LETTER R WITH MID-HEIGHT LEFT HOOK;Ll;0;L;;;;;N;;;;; 1DF29;LATIN SMALL LETTER S WITH MID-HEIGHT LEFT HOOK;Ll;0;L;;;;;N;;;;; 1DF2A;LATIN SMALL LETTER T WITH MID-HEIGHT LEFT HOOK;Ll;0;L;;;;;N;;;;; +1DF68;LATIN CAPITAL LETTER PHONOTYPIC A WITH SWASH;Lu;0;L;;;;;N;;;;1DF69; +1DF69;LATIN SMALL LETTER PHONOTYPIC A WITH SWASH;Ll;0;L;;;;;N;;;1DF68;;1DF68 +1DF6A;LATIN CAPITAL LETTER PHONOTYPIC ROUNDTOP A;Lu;0;L;;;;;N;;;;1DF6B; +1DF6B;LATIN SMALL LETTER PHONOTYPIC ROUNDTOP A;Ll;0;L;;;;;N;;;1DF6A;;1DF6A +1DF6C;LATIN CAPITAL LETTER REVERSED SCRUPLE;Lu;0;L;;;;;N;;;;1DF6D; +1DF6D;LATIN SMALL LETTER REVERSED SCRUPLE;Ll;0;L;;;;;N;;;1DF6C;;1DF6C +1DF6E;LATIN CAPITAL LETTER PHONOTYPIC DIPHTHONG AI;Lu;0;L;;;;;N;;;;1DF6F; +1DF6F;LATIN SMALL LETTER PHONOTYPIC DIPHTHONG AI;Ll;0;L;;;;;N;;;1DF6E;;1DF6E +1DF70;LATIN SMALL LETTER I WITH PIGTAIL AT BOTTOM;Ll;0;L;;;;;N;;;;; +1DF71;LATIN SMALL LETTER STRETCHED I;Ll;0;L;;;;;N;;;;; +1DF72;LATIN CAPITAL LETTER O WITH CURL;Lu;0;L;;;;;N;;;;1DF73; +1DF73;LATIN SMALL LETTER O WITH CURL;Ll;0;L;;;;;N;;;1DF72;;1DF72 +1DF74;LATIN CAPITAL LETTER CLOSED OMEGA WITH LONG STEM;Lu;0;L;;;;;N;;;;1DF75; +1DF75;LATIN SMALL LETTER CLOSED OMEGA WITH LONG STEM;Ll;0;L;;;;;N;;;1DF74;;1DF74 +1DF76;LATIN CAPITAL LETTER TURNED CLOSED OMEGA;Lu;0;L;;;;;N;;;;1DF77; +1DF77;LATIN SMALL LETTER TURNED CLOSED OMEGA;Ll;0;L;;;;;N;;;1DF76;;1DF76 +1DF78;LATIN CAPITAL LETTER PHONOTYPIC TH;Lu;0;L;;;;;N;;;;1DF79; +1DF79;LATIN SMALL LETTER PHONOTYPIC TH;Ll;0;L;;;;;N;;;1DF78;;1DF78 +1DF7A;LATIN CAPITAL LETTER U WITH HOOK TAIL;Lu;0;L;;;;;N;;;;1DF7B; +1DF7B;LATIN SMALL LETTER U WITH HOOK TAIL;Ll;0;L;;;;;N;;;1DF7A;;1DF7A +1DF7C;LATIN CAPITAL LETTER U WITH NOTCH AT BOTTOM;Lu;0;L;;;;;N;;;;1DF7D; +1DF7D;LATIN SMALL LETTER U WITH NOTCH AT BOTTOM;Ll;0;L;;;;;N;;;1DF7C;;1DF7C +1DF7E;LATIN CAPITAL LETTER REVERSED ENLARGED SMALL U;Lu;0;L;;;;;N;;;;1DF7F; +1DF7F;LATIN SMALL LETTER REVERSED U;Ll;0;L;;;;;N;;;1DF7E;;1DF7E +1DF80;LATIN CAPITAL LETTER A WITH TOPBAR;Lo;0;L;;;;;N;;;;; +1DF81;LATIN CAPITAL LETTER E WITH BENT TOPBAR;Lo;0;L;;;;;N;;;;; 1E000;COMBINING GLAGOLITIC LETTER AZU;Mn;230;NSM;;;;;N;;;;; 1E001;COMBINING GLAGOLITIC LETTER BUKY;Mn;230;NSM;;;;;N;;;;; 1E002;COMBINING GLAGOLITIC LETTER VEDE;Mn;230;NSM;;;;;N;;;;; diff --git a/unicodetools/data/ucd/dev/VerticalOrientation.txt b/unicodetools/data/ucd/dev/VerticalOrientation.txt index 71770a13d..62ac93d95 100644 --- a/unicodetools/data/ucd/dev/VerticalOrientation.txt +++ b/unicodetools/data/ucd/dev/VerticalOrientation.txt @@ -1,5 +1,5 @@ # VerticalOrientation-17.0.0.txt -# Date: 2025-01-29 +# Date: 2025-02-14, 01:57:58 GMT # © 2025 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. # For terms of use and license, see https://www.unicode.org/terms_of_use.html @@ -1183,6 +1183,9 @@ 2E5B ; R # Ps BOTTOM HALF LEFT PARENTHESIS 2E5C ; R # Pe BOTTOM HALF RIGHT PARENTHESIS 2E5D ; R # Pd OBLIQUE HYPHEN +2E60..2E61 ; R # Po [2] WIGGLY EXCLAMATION MARK..INVERTED WIGGLY EXCLAMATION MARK +2E62 ; R # Ps LEFT PARENTHESIS WITH MIDDLE RING +2E63 ; R # Pe RIGHT PARENTHESIS WITH MIDDLE RING 2E80..2E99 ; U # So [26] CJK RADICAL REPEAT..CJK RADICAL RAP 2E9A ; U # Cn 2E9B..2EF3 ; U # So [89] CJK RADICAL CHOKE..CJK RADICAL C-SIMPLIFIED TURTLE @@ -1365,7 +1368,7 @@ A788 ; R # Lm MODIFIER LETTER LOW CIRCUMFLEX ACCENT A789..A78A ; R # Sk [2] MODIFIER LETTER COLON..MODIFIER LETTER SHORT EQUALS SIGN A78B..A78E ; R # L& [4] LATIN CAPITAL LETTER SALTILLO..LATIN SMALL LETTER L WITH RETROFLEX HOOK AND BELT A78F ; R # Lo LATIN LETTER SINOLOGICAL DOT -A790..A7DC ; R # L& [77] LATIN CAPITAL LETTER N WITH DESCENDER..LATIN CAPITAL LETTER LAMBDA WITH STROKE +A790..A7DD ; R # L& [78] LATIN CAPITAL LETTER N WITH DESCENDER..LATIN CAPITAL LETTER CLOSED OMEGA A7F1..A7F4 ; R # Lm [4] MODIFIER LETTER CAPITAL S..MODIFIER LETTER CAPITAL Q A7F5..A7F6 ; R # L& [2] LATIN CAPITAL LETTER REVERSED HALF H..LATIN SMALL LETTER REVERSED HALF H A7F7 ; R # Lo LATIN EPIGRAPHIC LETTER SIDEWAYS I @@ -2360,6 +2363,8 @@ FFFC..FFFD ; U # So [2] OBJECT REPLACEMENT CHARACTER..REPLACEMENT CHARA 1DF0A ; R # Lo LATIN LETTER RETROFLEX CLICK WITH RETROFLEX HOOK 1DF0B..1DF1E ; R # Ll [20] LATIN SMALL LETTER ESH WITH DOUBLE BAR..LATIN SMALL LETTER S WITH CURL 1DF25..1DF2A ; R # Ll [6] LATIN SMALL LETTER D WITH MID-HEIGHT LEFT HOOK..LATIN SMALL LETTER T WITH MID-HEIGHT LEFT HOOK +1DF68..1DF7F ; R # L& [24] LATIN CAPITAL LETTER PHONOTYPIC A WITH SWASH..LATIN SMALL LETTER REVERSED U +1DF80..1DF81 ; R # Lo [2] LATIN CAPITAL LETTER A WITH TOPBAR..LATIN CAPITAL LETTER E WITH BENT TOPBAR 1E000..1E006 ; R # Mn [7] COMBINING GLAGOLITIC LETTER AZU..COMBINING GLAGOLITIC LETTER ZHIVETE 1E008..1E018 ; R # Mn [17] COMBINING GLAGOLITIC LETTER ZEMLJA..COMBINING GLAGOLITIC LETTER HERU 1E01B..1E021 ; R # Mn [7] COMBINING GLAGOLITIC LETTER SHTA..COMBINING GLAGOLITIC LETTER YATI diff --git a/unicodetools/data/ucd/dev/auxiliary/SentenceBreakProperty.txt b/unicodetools/data/ucd/dev/auxiliary/SentenceBreakProperty.txt index 0e5dc2e11..ae3af118d 100644 --- a/unicodetools/data/ucd/dev/auxiliary/SentenceBreakProperty.txt +++ b/unicodetools/data/ucd/dev/auxiliary/SentenceBreakProperty.txt @@ -1,5 +1,5 @@ # SentenceBreakProperty-17.0.0.txt -# Date: 2025-01-27, 18:09:39 GMT +# Date: 2025-02-14, 01:57:56 GMT # © 2025 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. # For terms of use and license, see https://www.unicode.org/terms_of_use.html @@ -1332,10 +1332,21 @@ FF41..FF5A ; Lower # L& [26] FULLWIDTH LATIN SMALL LETTER A..FULLWIDTH LATIN 1DF00..1DF09 ; Lower # L& [10] LATIN SMALL LETTER FENG DIGRAPH WITH TRILL..LATIN SMALL LETTER T WITH HOOK AND RETROFLEX HOOK 1DF0B..1DF1E ; Lower # L& [20] LATIN SMALL LETTER ESH WITH DOUBLE BAR..LATIN SMALL LETTER S WITH CURL 1DF25..1DF2A ; Lower # L& [6] LATIN SMALL LETTER D WITH MID-HEIGHT LEFT HOOK..LATIN SMALL LETTER T WITH MID-HEIGHT LEFT HOOK +1DF69 ; Lower # L& LATIN SMALL LETTER PHONOTYPIC A WITH SWASH +1DF6B ; Lower # L& LATIN SMALL LETTER PHONOTYPIC ROUNDTOP A +1DF6D ; Lower # L& LATIN SMALL LETTER REVERSED SCRUPLE +1DF6F..1DF71 ; Lower # L& [3] LATIN SMALL LETTER PHONOTYPIC DIPHTHONG AI..LATIN SMALL LETTER STRETCHED I +1DF73 ; Lower # L& LATIN SMALL LETTER O WITH CURL +1DF75 ; Lower # L& LATIN SMALL LETTER CLOSED OMEGA WITH LONG STEM +1DF77 ; Lower # L& LATIN SMALL LETTER TURNED CLOSED OMEGA +1DF79 ; Lower # L& LATIN SMALL LETTER PHONOTYPIC TH +1DF7B ; Lower # L& LATIN SMALL LETTER U WITH HOOK TAIL +1DF7D ; Lower # L& LATIN SMALL LETTER U WITH NOTCH AT BOTTOM +1DF7F ; Lower # L& LATIN SMALL LETTER REVERSED U 1E030..1E06D ; Lower # Lm [62] MODIFIER LETTER CYRILLIC SMALL A..MODIFIER LETTER CYRILLIC SMALL STRAIGHT U WITH STROKE 1E922..1E943 ; Lower # L& [34] ADLAM SMALL LETTER ALIF..ADLAM SMALL LETTER SHA -# Total code points: 2548 +# Total code points: 2561 # ================================================ @@ -1951,7 +1962,7 @@ A7D4 ; Upper # L& LATIN CAPITAL LETTER DOUBLE WYNN A7D6 ; Upper # L& LATIN CAPITAL LETTER MIDDLE SCOTS S A7D8 ; Upper # L& LATIN CAPITAL LETTER SIGMOID S A7DA ; Upper # L& LATIN CAPITAL LETTER LAMBDA -A7DC ; Upper # L& LATIN CAPITAL LETTER LAMBDA WITH STROKE +A7DC..A7DD ; Upper # L& [2] LATIN CAPITAL LETTER LAMBDA WITH STROKE..LATIN CAPITAL LETTER CLOSED OMEGA A7F5 ; Upper # L& LATIN CAPITAL LETTER REVERSED HALF H FF21..FF3A ; Upper # L& [26] FULLWIDTH LATIN CAPITAL LETTER A..FULLWIDTH LATIN CAPITAL LETTER Z 10400..10427 ; Upper # L& [40] DESERET CAPITAL LETTER LONG I..DESERET CAPITAL LETTER EW @@ -1996,12 +2007,23 @@ FF21..FF3A ; Upper # L& [26] FULLWIDTH LATIN CAPITAL LETTER A..FULLWIDTH LAT 1D756..1D76E ; Upper # L& [25] MATHEMATICAL SANS-SERIF BOLD CAPITAL ALPHA..MATHEMATICAL SANS-SERIF BOLD CAPITAL OMEGA 1D790..1D7A8 ; Upper # L& [25] MATHEMATICAL SANS-SERIF BOLD ITALIC CAPITAL ALPHA..MATHEMATICAL SANS-SERIF BOLD ITALIC CAPITAL OMEGA 1D7CA ; Upper # L& MATHEMATICAL BOLD CAPITAL DIGAMMA +1DF68 ; Upper # L& LATIN CAPITAL LETTER PHONOTYPIC A WITH SWASH +1DF6A ; Upper # L& LATIN CAPITAL LETTER PHONOTYPIC ROUNDTOP A +1DF6C ; Upper # L& LATIN CAPITAL LETTER REVERSED SCRUPLE +1DF6E ; Upper # L& LATIN CAPITAL LETTER PHONOTYPIC DIPHTHONG AI +1DF72 ; Upper # L& LATIN CAPITAL LETTER O WITH CURL +1DF74 ; Upper # L& LATIN CAPITAL LETTER CLOSED OMEGA WITH LONG STEM +1DF76 ; Upper # L& LATIN CAPITAL LETTER TURNED CLOSED OMEGA +1DF78 ; Upper # L& LATIN CAPITAL LETTER PHONOTYPIC TH +1DF7A ; Upper # L& LATIN CAPITAL LETTER U WITH HOOK TAIL +1DF7C ; Upper # L& LATIN CAPITAL LETTER U WITH NOTCH AT BOTTOM +1DF7E ; Upper # L& LATIN CAPITAL LETTER REVERSED ENLARGED SMALL U 1E900..1E921 ; Upper # L& [34] ADLAM CAPITAL LETTER ALIF..ADLAM CAPITAL LETTER SHA 1F130..1F149 ; Upper # So [26] SQUARED LATIN CAPITAL LETTER A..SQUARED LATIN CAPITAL LETTER Z 1F150..1F169 ; Upper # So [26] NEGATIVE CIRCLED LATIN CAPITAL LETTER A..NEGATIVE CIRCLED LATIN CAPITAL LETTER Z 1F170..1F189 ; Upper # So [26] NEGATIVE SQUARED LATIN CAPITAL LETTER A..NEGATIVE SQUARED LATIN CAPITAL LETTER Z -# Total code points: 1991 +# Total code points: 2003 # ================================================ @@ -2557,6 +2579,7 @@ FFDA..FFDC ; OLetter # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGUL 1BC80..1BC88 ; OLetter # Lo [9] DUPLOYAN AFFIX HIGH ACUTE..DUPLOYAN AFFIX HIGH VERTICAL 1BC90..1BC99 ; OLetter # Lo [10] DUPLOYAN AFFIX LOW ACUTE..DUPLOYAN AFFIX LOW ARROW 1DF0A ; OLetter # Lo LATIN LETTER RETROFLEX CLICK WITH RETROFLEX HOOK +1DF80..1DF81 ; OLetter # Lo [2] LATIN CAPITAL LETTER A WITH TOPBAR..LATIN CAPITAL LETTER E WITH BENT TOPBAR 1E100..1E12C ; OLetter # Lo [45] NYIAKENG PUACHUE HMONG LETTER MA..NYIAKENG PUACHUE HMONG LETTER W 1E137..1E13D ; OLetter # Lm [7] NYIAKENG PUACHUE HMONG SIGN FOR PERSON..NYIAKENG PUACHUE HMONG SYLLABLE LENGTHENER 1E14E ; OLetter # Lo NYIAKENG PUACHUE HMONG LOGOGRAM NYAJ @@ -2622,7 +2645,7 @@ FFDA..FFDC ; OLetter # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGUL 30000..3134A ; OLetter # Lo [4939] CJK UNIFIED IDEOGRAPH-30000..CJK UNIFIED IDEOGRAPH-3134A 31350..33479 ; OLetter # Lo [8490] CJK UNIFIED IDEOGRAPH-31350..CJK UNIFIED IDEOGRAPH-33479 -# Total code points: 141520 +# Total code points: 141522 # ================================================ @@ -2754,6 +2777,7 @@ FF0E ; ATerm # Po FULLWIDTH FULL STOP 2E2E ; STerm # Po REVERSED QUESTION MARK 2E3C ; STerm # Po STENOGRAPHIC FULL STOP 2E53..2E54 ; STerm # Po [2] MEDIEVAL EXCLAMATION MARK..MEDIEVAL QUESTION MARK +2E60..2E61 ; STerm # Po [2] WIGGLY EXCLAMATION MARK..INVERTED WIGGLY EXCLAMATION MARK 3002 ; STerm # Po IDEOGRAPHIC FULL STOP A4FF ; STerm # Po LISU PUNCTUATION FULL STOP A60E..A60F ; STerm # Po [2] VAI FULL STOP..VAI QUESTION MARK @@ -2806,7 +2830,7 @@ FF61 ; STerm # Po HALFWIDTH IDEOGRAPHIC FULL STOP 1BC9F ; STerm # Po DUPLOYAN PUNCTUATION CHINOOK FULL STOP 1DA88 ; STerm # Po SIGNWRITING FULL STOP -# Total code points: 166 +# Total code points: 168 # ================================================ @@ -2934,6 +2958,8 @@ FF61 ; STerm # Po HALFWIDTH IDEOGRAPHIC FULL STOP 2E5A ; Close # Pe TOP HALF RIGHT PARENTHESIS 2E5B ; Close # Ps BOTTOM HALF LEFT PARENTHESIS 2E5C ; Close # Pe BOTTOM HALF RIGHT PARENTHESIS +2E62 ; Close # Ps LEFT PARENTHESIS WITH MIDDLE RING +2E63 ; Close # Pe RIGHT PARENTHESIS WITH MIDDLE RING 3008 ; Close # Ps LEFT ANGLE BRACKET 3009 ; Close # Pe RIGHT ANGLE BRACKET 300A ; Close # Ps LEFT DOUBLE ANGLE BRACKET @@ -2994,7 +3020,7 @@ FF62 ; Close # Ps HALFWIDTH LEFT CORNER BRACKET FF63 ; Close # Pe HALFWIDTH RIGHT CORNER BRACKET 1F676..1F678 ; Close # So [3] SANS-SERIF HEAVY DOUBLE TURNED COMMA QUOTATION MARK ORNAMENT..SANS-SERIF HEAVY LOW DOUBLE COMMA QUOTATION MARK ORNAMENT -# Total code points: 195 +# Total code points: 197 # ================================================ diff --git a/unicodetools/data/ucd/dev/auxiliary/WordBreakProperty.txt b/unicodetools/data/ucd/dev/auxiliary/WordBreakProperty.txt index e5a5b9937..ad3584eab 100644 --- a/unicodetools/data/ucd/dev/auxiliary/WordBreakProperty.txt +++ b/unicodetools/data/ucd/dev/auxiliary/WordBreakProperty.txt @@ -1,5 +1,5 @@ # WordBreakProperty-17.0.0.txt -# Date: 2025-01-27, 18:09:43 GMT +# Date: 2025-02-14, 01:57:58 GMT # © 2025 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. # For terms of use and license, see https://www.unicode.org/terms_of_use.html @@ -1016,7 +1016,7 @@ A788 ; ALetter # Lm MODIFIER LETTER LOW CIRCUMFLEX ACCENT A789..A78A ; ALetter # Sk [2] MODIFIER LETTER COLON..MODIFIER LETTER SHORT EQUALS SIGN A78B..A78E ; ALetter # L& [4] LATIN CAPITAL LETTER SALTILLO..LATIN SMALL LETTER L WITH RETROFLEX HOOK AND BELT A78F ; ALetter # Lo LATIN LETTER SINOLOGICAL DOT -A790..A7DC ; ALetter # L& [77] LATIN CAPITAL LETTER N WITH DESCENDER..LATIN CAPITAL LETTER LAMBDA WITH STROKE +A790..A7DD ; ALetter # L& [78] LATIN CAPITAL LETTER N WITH DESCENDER..LATIN CAPITAL LETTER CLOSED OMEGA A7F1..A7F4 ; ALetter # Lm [4] MODIFIER LETTER CAPITAL S..MODIFIER LETTER CAPITAL Q A7F5..A7F6 ; ALetter # L& [2] LATIN CAPITAL LETTER REVERSED HALF H..LATIN SMALL LETTER REVERSED HALF H A7F7 ; ALetter # Lo LATIN EPIGRAPHIC LETTER SIDEWAYS I @@ -1322,6 +1322,8 @@ FFDA..FFDC ; ALetter # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGUL 1DF0A ; ALetter # Lo LATIN LETTER RETROFLEX CLICK WITH RETROFLEX HOOK 1DF0B..1DF1E ; ALetter # L& [20] LATIN SMALL LETTER ESH WITH DOUBLE BAR..LATIN SMALL LETTER S WITH CURL 1DF25..1DF2A ; ALetter # L& [6] LATIN SMALL LETTER D WITH MID-HEIGHT LEFT HOOK..LATIN SMALL LETTER T WITH MID-HEIGHT LEFT HOOK +1DF68..1DF7F ; ALetter # L& [24] LATIN CAPITAL LETTER PHONOTYPIC A WITH SWASH..LATIN SMALL LETTER REVERSED U +1DF80..1DF81 ; ALetter # Lo [2] LATIN CAPITAL LETTER A WITH TOPBAR..LATIN CAPITAL LETTER E WITH BENT TOPBAR 1E030..1E06D ; ALetter # Lm [62] MODIFIER LETTER CYRILLIC SMALL A..MODIFIER LETTER CYRILLIC SMALL STRAIGHT U WITH STROKE 1E100..1E12C ; ALetter # Lo [45] NYIAKENG PUACHUE HMONG LETTER MA..NYIAKENG PUACHUE HMONG LETTER W 1E137..1E13D ; ALetter # Lm [7] NYIAKENG PUACHUE HMONG SIGN FOR PERSON..NYIAKENG PUACHUE HMONG SYLLABLE LENGTHENER @@ -1383,7 +1385,7 @@ FFDA..FFDC ; ALetter # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGUL 1F150..1F169 ; ALetter # So [26] NEGATIVE CIRCLED LATIN CAPITAL LETTER A..NEGATIVE CIRCLED LATIN CAPITAL LETTER Z 1F170..1F189 ; ALetter # So [26] NEGATIVE SQUARED LATIN CAPITAL LETTER A..NEGATIVE SQUARED LATIN CAPITAL LETTER Z -# Total code points: 34004 +# Total code points: 34031 # ================================================ diff --git a/unicodetools/data/ucd/dev/extracted/DerivedBidiClass.txt b/unicodetools/data/ucd/dev/extracted/DerivedBidiClass.txt index a4dc4250a..a24abfbec 100644 --- a/unicodetools/data/ucd/dev/extracted/DerivedBidiClass.txt +++ b/unicodetools/data/ucd/dev/extracted/DerivedBidiClass.txt @@ -1,5 +1,5 @@ # DerivedBidiClass-17.0.0.txt -# Date: 2025-01-27, 18:09:10 GMT +# Date: 2025-02-14, 01:57:18 GMT # © 2025 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. # For terms of use and license, see https://www.unicode.org/terms_of_use.html @@ -664,7 +664,7 @@ A771..A787 ; L # L& [23] LATIN SMALL LETTER DUM..LATIN SMALL LETTER INSULAR A789..A78A ; L # Sk [2] MODIFIER LETTER COLON..MODIFIER LETTER SHORT EQUALS SIGN A78B..A78E ; L # L& [4] LATIN CAPITAL LETTER SALTILLO..LATIN SMALL LETTER L WITH RETROFLEX HOOK AND BELT A78F ; L # Lo LATIN LETTER SINOLOGICAL DOT -A790..A7DC ; L # L& [77] LATIN CAPITAL LETTER N WITH DESCENDER..LATIN CAPITAL LETTER LAMBDA WITH STROKE +A790..A7DD ; L # L& [78] LATIN CAPITAL LETTER N WITH DESCENDER..LATIN CAPITAL LETTER CLOSED OMEGA A7F1..A7F4 ; L # Lm [4] MODIFIER LETTER CAPITAL S..MODIFIER LETTER CAPITAL Q A7F5..A7F6 ; L # L& [2] LATIN CAPITAL LETTER REVERSED HALF H..LATIN SMALL LETTER REVERSED HALF H A7F7 ; L # Lo LATIN EPIGRAPHIC LETTER SIDEWAYS I @@ -1188,6 +1188,8 @@ FFDA..FFDC ; L # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGUL LETTER 1DF0A ; L # Lo LATIN LETTER RETROFLEX CLICK WITH RETROFLEX HOOK 1DF0B..1DF1E ; L # L& [20] LATIN SMALL LETTER ESH WITH DOUBLE BAR..LATIN SMALL LETTER S WITH CURL 1DF25..1DF2A ; L # L& [6] LATIN SMALL LETTER D WITH MID-HEIGHT LEFT HOOK..LATIN SMALL LETTER T WITH MID-HEIGHT LEFT HOOK +1DF68..1DF7F ; L # L& [24] LATIN CAPITAL LETTER PHONOTYPIC A WITH SWASH..LATIN SMALL LETTER REVERSED U +1DF80..1DF81 ; L # Lo [2] LATIN CAPITAL LETTER A WITH TOPBAR..LATIN CAPITAL LETTER E WITH BENT TOPBAR 1E030..1E06D ; L # Lm [62] MODIFIER LETTER CYRILLIC SMALL A..MODIFIER LETTER CYRILLIC SMALL STRAIGHT U WITH STROKE 1E100..1E12C ; L # Lo [45] NYIAKENG PUACHUE HMONG LETTER MA..NYIAKENG PUACHUE HMONG LETTER W 1E137..1E13D ; L # Lm [7] NYIAKENG PUACHUE HMONG SIGN FOR PERSON..NYIAKENG PUACHUE HMONG SYLLABLE LENGTHENER @@ -1234,8 +1236,8 @@ FFDA..FFDC ; L # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGUL LETTER F0000..FFFFD ; L # Co [65534] .. 100000..10FFFD; L # Co [65534] .. -# The above property value applies to 810584 code points not listed here. -# Total code points: 1095402 +# The above property value applies to 810553 code points not listed here. +# Total code points: 1095398 # ================================================ @@ -1806,6 +1808,9 @@ FF1A ; CS # Po FULLWIDTH COLON 2E5B ; ON # Ps BOTTOM HALF LEFT PARENTHESIS 2E5C ; ON # Pe BOTTOM HALF RIGHT PARENTHESIS 2E5D ; ON # Pd OBLIQUE HYPHEN +2E60..2E61 ; ON # Po [2] WIGGLY EXCLAMATION MARK..INVERTED WIGGLY EXCLAMATION MARK +2E62 ; ON # Ps LEFT PARENTHESIS WITH MIDDLE RING +2E63 ; ON # Pe RIGHT PARENTHESIS WITH MIDDLE RING 2E80..2E99 ; ON # So [26] CJK RADICAL REPEAT..CJK RADICAL RAP 2E9B..2EF3 ; ON # So [89] CJK RADICAL CHOKE..CJK RADICAL C-SIMPLIFIED TURTLE 2F00..2FD5 ; ON # So [214] KANGXI RADICAL ONE..KANGXI RADICAL FLUTE @@ -2027,7 +2032,7 @@ FFFC..FFFD ; ON # So [2] OBJECT REPLACEMENT CHARACTER..REPLACEMENT CHARACTE 1FB94..1FBEF ; ON # So [92] LEFT HALF INVERSE MEDIUM SHADE AND RIGHT HALF BLOCK..TOP LEFT JUSTIFIED LOWER RIGHT QUARTER BLACK CIRCLE 1FBFA ; ON # So ALARM BELL SYMBOL -# Total code points: 6855 +# Total code points: 6859 # ================================================ diff --git a/unicodetools/data/ucd/dev/extracted/DerivedBinaryProperties.txt b/unicodetools/data/ucd/dev/extracted/DerivedBinaryProperties.txt index fa328ca5f..af9281035 100644 --- a/unicodetools/data/ucd/dev/extracted/DerivedBinaryProperties.txt +++ b/unicodetools/data/ucd/dev/extracted/DerivedBinaryProperties.txt @@ -1,5 +1,5 @@ # DerivedBinaryProperties-17.0.0.txt -# Date: 2025-01-27, 18:09:10 GMT +# Date: 2025-02-11, 13:48:06 GMT # © 2025 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. # For terms of use and license, see https://www.unicode.org/terms_of_use.html @@ -193,6 +193,8 @@ 2E5A ; Bidi_Mirrored # Pe TOP HALF RIGHT PARENTHESIS 2E5B ; Bidi_Mirrored # Ps BOTTOM HALF LEFT PARENTHESIS 2E5C ; Bidi_Mirrored # Pe BOTTOM HALF RIGHT PARENTHESIS +2E62 ; Bidi_Mirrored # Ps LEFT PARENTHESIS WITH MIDDLE RING +2E63 ; Bidi_Mirrored # Pe RIGHT PARENTHESIS WITH MIDDLE RING 3008 ; Bidi_Mirrored # Ps LEFT ANGLE BRACKET 3009 ; Bidi_Mirrored # Pe RIGHT ANGLE BRACKET 300A ; Bidi_Mirrored # Ps LEFT DOUBLE ANGLE BRACKET @@ -236,6 +238,6 @@ FF63 ; Bidi_Mirrored # Pe HALFWIDTH RIGHT CORNER BRACKET 1D789 ; Bidi_Mirrored # Sm MATHEMATICAL SANS-SERIF BOLD PARTIAL DIFFERENTIAL 1D7C3 ; Bidi_Mirrored # Sm MATHEMATICAL SANS-SERIF BOLD ITALIC PARTIAL DIFFERENTIAL -# Total code points: 554 +# Total code points: 556 # EOF diff --git a/unicodetools/data/ucd/dev/extracted/DerivedCombiningClass.txt b/unicodetools/data/ucd/dev/extracted/DerivedCombiningClass.txt index 3a10fc1e4..394a92100 100644 --- a/unicodetools/data/ucd/dev/extracted/DerivedCombiningClass.txt +++ b/unicodetools/data/ucd/dev/extracted/DerivedCombiningClass.txt @@ -1,5 +1,5 @@ # DerivedCombiningClass-17.0.0.txt -# Date: 2025-01-27, 18:09:10 GMT +# Date: 2025-02-14, 01:57:19 GMT # © 2025 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. # For terms of use and license, see https://www.unicode.org/terms_of_use.html @@ -986,6 +986,9 @@ 2E5B ; 0 # Ps BOTTOM HALF LEFT PARENTHESIS 2E5C ; 0 # Pe BOTTOM HALF RIGHT PARENTHESIS 2E5D ; 0 # Pd OBLIQUE HYPHEN +2E60..2E61 ; 0 # Po [2] WIGGLY EXCLAMATION MARK..INVERTED WIGGLY EXCLAMATION MARK +2E62 ; 0 # Ps LEFT PARENTHESIS WITH MIDDLE RING +2E63 ; 0 # Pe RIGHT PARENTHESIS WITH MIDDLE RING 2E80..2E99 ; 0 # So [26] CJK RADICAL REPEAT..CJK RADICAL RAP 2E9B..2EF3 ; 0 # So [89] CJK RADICAL CHOKE..CJK RADICAL C-SIMPLIFIED TURTLE 2F00..2FD5 ; 0 # So [214] KANGXI RADICAL ONE..KANGXI RADICAL FLUTE @@ -1093,7 +1096,7 @@ A788 ; 0 # Lm MODIFIER LETTER LOW CIRCUMFLEX ACCENT A789..A78A ; 0 # Sk [2] MODIFIER LETTER COLON..MODIFIER LETTER SHORT EQUALS SIGN A78B..A78E ; 0 # L& [4] LATIN CAPITAL LETTER SALTILLO..LATIN SMALL LETTER L WITH RETROFLEX HOOK AND BELT A78F ; 0 # Lo LATIN LETTER SINOLOGICAL DOT -A790..A7DC ; 0 # L& [77] LATIN CAPITAL LETTER N WITH DESCENDER..LATIN CAPITAL LETTER LAMBDA WITH STROKE +A790..A7DD ; 0 # L& [78] LATIN CAPITAL LETTER N WITH DESCENDER..LATIN CAPITAL LETTER CLOSED OMEGA A7F1..A7F4 ; 0 # Lm [4] MODIFIER LETTER CAPITAL S..MODIFIER LETTER CAPITAL Q A7F5..A7F6 ; 0 # L& [2] LATIN CAPITAL LETTER REVERSED HALF H..LATIN SMALL LETTER REVERSED HALF H A7F7 ; 0 # Lo LATIN EPIGRAPHIC LETTER SIDEWAYS I @@ -1962,6 +1965,8 @@ FFFC..FFFD ; 0 # So [2] OBJECT REPLACEMENT CHARACTER..REPLACEMENT CHARACTER 1DF0A ; 0 # Lo LATIN LETTER RETROFLEX CLICK WITH RETROFLEX HOOK 1DF0B..1DF1E ; 0 # L& [20] LATIN SMALL LETTER ESH WITH DOUBLE BAR..LATIN SMALL LETTER S WITH CURL 1DF25..1DF2A ; 0 # L& [6] LATIN SMALL LETTER D WITH MID-HEIGHT LEFT HOOK..LATIN SMALL LETTER T WITH MID-HEIGHT LEFT HOOK +1DF68..1DF7F ; 0 # L& [24] LATIN CAPITAL LETTER PHONOTYPIC A WITH SWASH..LATIN SMALL LETTER REVERSED U +1DF80..1DF81 ; 0 # Lo [2] LATIN CAPITAL LETTER A WITH TOPBAR..LATIN CAPITAL LETTER E WITH BENT TOPBAR 1E030..1E06D ; 0 # Lm [62] MODIFIER LETTER CYRILLIC SMALL A..MODIFIER LETTER CYRILLIC SMALL STRAIGHT U WITH STROKE 1E100..1E12C ; 0 # Lo [45] NYIAKENG PUACHUE HMONG LETTER MA..NYIAKENG PUACHUE HMONG LETTER W 1E137..1E13D ; 0 # Lm [7] NYIAKENG PUACHUE HMONG SIGN FOR PERSON..NYIAKENG PUACHUE HMONG SYLLABLE LENGTHENER @@ -2095,7 +2100,7 @@ E0100..E01EF ; 0 # Mn [240] VARIATION SELECTOR-17..VARIATION SELECTOR-256 F0000..FFFFD ; 0 # Co [65534] .. 100000..10FFFD; 0 # Co [65534] .. -# The above property value applies to 816745 code points not listed here. +# The above property value applies to 816714 code points not listed here. # Total code points: 1113143 # ================================================ diff --git a/unicodetools/data/ucd/dev/extracted/DerivedEastAsianWidth.txt b/unicodetools/data/ucd/dev/extracted/DerivedEastAsianWidth.txt index c3d0bb02a..29385bbc3 100644 --- a/unicodetools/data/ucd/dev/extracted/DerivedEastAsianWidth.txt +++ b/unicodetools/data/ucd/dev/extracted/DerivedEastAsianWidth.txt @@ -1,5 +1,5 @@ # DerivedEastAsianWidth-17.0.0.txt -# Date: 2025-01-27, 18:09:12 GMT +# Date: 2025-02-14, 01:57:22 GMT # © 2025 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. # For terms of use and license, see https://www.unicode.org/terms_of_use.html @@ -1149,6 +1149,9 @@ 2E5B ; N # Ps BOTTOM HALF LEFT PARENTHESIS 2E5C ; N # Pe BOTTOM HALF RIGHT PARENTHESIS 2E5D ; N # Pd OBLIQUE HYPHEN +2E60..2E61 ; N # Po [2] WIGGLY EXCLAMATION MARK..INVERTED WIGGLY EXCLAMATION MARK +2E62 ; N # Ps LEFT PARENTHESIS WITH MIDDLE RING +2E63 ; N # Pe RIGHT PARENTHESIS WITH MIDDLE RING 303F ; N # So IDEOGRAPHIC HALF FILL SPACE A4D0..A4F7 ; N # Lo [40] LISU LETTER BA..LISU LETTER OE A4F8..A4FD ; N # Lm [6] LISU LETTER TONE MYA TI..LISU LETTER TONE MYA JEU @@ -1184,7 +1187,7 @@ A788 ; N # Lm MODIFIER LETTER LOW CIRCUMFLEX ACCENT A789..A78A ; N # Sk [2] MODIFIER LETTER COLON..MODIFIER LETTER SHORT EQUALS SIGN A78B..A78E ; N # L& [4] LATIN CAPITAL LETTER SALTILLO..LATIN SMALL LETTER L WITH RETROFLEX HOOK AND BELT A78F ; N # Lo LATIN LETTER SINOLOGICAL DOT -A790..A7DC ; N # L& [77] LATIN CAPITAL LETTER N WITH DESCENDER..LATIN CAPITAL LETTER LAMBDA WITH STROKE +A790..A7DD ; N # L& [78] LATIN CAPITAL LETTER N WITH DESCENDER..LATIN CAPITAL LETTER CLOSED OMEGA A7F1..A7F4 ; N # Lm [4] MODIFIER LETTER CAPITAL S..MODIFIER LETTER CAPITAL Q A7F5..A7F6 ; N # L& [2] LATIN CAPITAL LETTER REVERSED HALF H..LATIN SMALL LETTER REVERSED HALF H A7F7 ; N # Lo LATIN EPIGRAPHIC LETTER SIDEWAYS I @@ -1994,6 +1997,8 @@ FFFC ; N # So OBJECT REPLACEMENT CHARACTER 1DF0A ; N # Lo LATIN LETTER RETROFLEX CLICK WITH RETROFLEX HOOK 1DF0B..1DF1E ; N # L& [20] LATIN SMALL LETTER ESH WITH DOUBLE BAR..LATIN SMALL LETTER S WITH CURL 1DF25..1DF2A ; N # L& [6] LATIN SMALL LETTER D WITH MID-HEIGHT LEFT HOOK..LATIN SMALL LETTER T WITH MID-HEIGHT LEFT HOOK +1DF68..1DF7F ; N # L& [24] LATIN CAPITAL LETTER PHONOTYPIC A WITH SWASH..LATIN SMALL LETTER REVERSED U +1DF80..1DF81 ; N # Lo [2] LATIN CAPITAL LETTER A WITH TOPBAR..LATIN CAPITAL LETTER E WITH BENT TOPBAR 1E000..1E006 ; N # Mn [7] COMBINING GLAGOLITIC LETTER AZU..COMBINING GLAGOLITIC LETTER ZHIVETE 1E008..1E018 ; N # Mn [17] COMBINING GLAGOLITIC LETTER ZEMLJA..COMBINING GLAGOLITIC LETTER HERU 1E01B..1E021 ; N # Mn [7] COMBINING GLAGOLITIC LETTER SHTA..COMBINING GLAGOLITIC LETTER YATI @@ -2144,7 +2149,7 @@ FFFC ; N # So OBJECT REPLACEMENT CHARACTER E0001 ; N # Cf LANGUAGE TAG E0020..E007F ; N # Cf [96] TAG SPACE..CANCEL TAG -# The above property value applies to 760566 code points not listed here. +# The above property value applies to 760535 code points not listed here. # Total code points: 792267 # ================================================ diff --git a/unicodetools/data/ucd/dev/extracted/DerivedGeneralCategory.txt b/unicodetools/data/ucd/dev/extracted/DerivedGeneralCategory.txt index 22b9a85f6..43c72a3a7 100644 --- a/unicodetools/data/ucd/dev/extracted/DerivedGeneralCategory.txt +++ b/unicodetools/data/ucd/dev/extracted/DerivedGeneralCategory.txt @@ -1,5 +1,5 @@ # DerivedGeneralCategory-17.0.0.txt -# Date: 2025-01-27, 18:09:13 GMT +# Date: 2025-02-14, 01:57:22 GMT # © 2025 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. # For terms of use and license, see https://www.unicode.org/terms_of_use.html @@ -278,7 +278,8 @@ 2DCF ; Cn # 2DD7 ; Cn # 2DDF ; Cn # -2E5E..2E7F ; Cn # [34] .. +2E5E..2E5F ; Cn # [2] .. +2E64..2E7F ; Cn # [28] .. 2E9A ; Cn # 2EF4..2EFF ; Cn # [12] .. 2FD6..2FEF ; Cn # [26] .. @@ -293,7 +294,7 @@ A48D..A48F ; Cn # [3] .. A4C7..A4CF ; Cn # [9] .. A62C..A63F ; Cn # [20] .. A6F8..A6FF ; Cn # [8] .. -A7DD..A7F0 ; Cn # [20] .. +A7DE..A7F0 ; Cn # [19] .. A82D..A82F ; Cn # [3] .. A83A..A83F ; Cn # [6] .. A878..A87F ; Cn # [8] .. @@ -636,7 +637,8 @@ FFFE..FFFF ; Cn # [2] .. 1DAA0 ; Cn # 1DAB0..1DEFF ; Cn # [1104] .. 1DF1F..1DF24 ; Cn # [6] .. -1DF2B..1DFFF ; Cn # [213] .. +1DF2B..1DF67 ; Cn # [61] .. +1DF82..1DFFF ; Cn # [126] .. 1E007 ; Cn # 1E019..1E01A ; Cn # [2] .. 1E022 ; Cn # @@ -754,7 +756,7 @@ E01F0..EFFFF ; Cn # [65040] .. FFFFE..FFFFF ; Cn # [2] .. 10FFFE..10FFFF; Cn # [2] .. -# Total code points: 814697 +# Total code points: 814666 # ================================================ @@ -1369,7 +1371,7 @@ A7D4 ; Lu # LATIN CAPITAL LETTER DOUBLE WYNN A7D6 ; Lu # LATIN CAPITAL LETTER MIDDLE SCOTS S A7D8 ; Lu # LATIN CAPITAL LETTER SIGMOID S A7DA ; Lu # LATIN CAPITAL LETTER LAMBDA -A7DC ; Lu # LATIN CAPITAL LETTER LAMBDA WITH STROKE +A7DC..A7DD ; Lu # [2] LATIN CAPITAL LETTER LAMBDA WITH STROKE..LATIN CAPITAL LETTER CLOSED OMEGA A7F5 ; Lu # LATIN CAPITAL LETTER REVERSED HALF H FF21..FF3A ; Lu # [26] FULLWIDTH LATIN CAPITAL LETTER A..FULLWIDTH LATIN CAPITAL LETTER Z 10400..10427 ; Lu # [40] DESERET CAPITAL LETTER LONG I..DESERET CAPITAL LETTER EW @@ -1414,9 +1416,20 @@ FF21..FF3A ; Lu # [26] FULLWIDTH LATIN CAPITAL LETTER A..FULLWIDTH LATIN CAP 1D756..1D76E ; Lu # [25] MATHEMATICAL SANS-SERIF BOLD CAPITAL ALPHA..MATHEMATICAL SANS-SERIF BOLD CAPITAL OMEGA 1D790..1D7A8 ; Lu # [25] MATHEMATICAL SANS-SERIF BOLD ITALIC CAPITAL ALPHA..MATHEMATICAL SANS-SERIF BOLD ITALIC CAPITAL OMEGA 1D7CA ; Lu # MATHEMATICAL BOLD CAPITAL DIGAMMA +1DF68 ; Lu # LATIN CAPITAL LETTER PHONOTYPIC A WITH SWASH +1DF6A ; Lu # LATIN CAPITAL LETTER PHONOTYPIC ROUNDTOP A +1DF6C ; Lu # LATIN CAPITAL LETTER REVERSED SCRUPLE +1DF6E ; Lu # LATIN CAPITAL LETTER PHONOTYPIC DIPHTHONG AI +1DF72 ; Lu # LATIN CAPITAL LETTER O WITH CURL +1DF74 ; Lu # LATIN CAPITAL LETTER CLOSED OMEGA WITH LONG STEM +1DF76 ; Lu # LATIN CAPITAL LETTER TURNED CLOSED OMEGA +1DF78 ; Lu # LATIN CAPITAL LETTER PHONOTYPIC TH +1DF7A ; Lu # LATIN CAPITAL LETTER U WITH HOOK TAIL +1DF7C ; Lu # LATIN CAPITAL LETTER U WITH NOTCH AT BOTTOM +1DF7E ; Lu # LATIN CAPITAL LETTER REVERSED ENLARGED SMALL U 1E900..1E921 ; Lu # [34] ADLAM CAPITAL LETTER ALIF..ADLAM CAPITAL LETTER SHA -# Total code points: 1886 +# Total code points: 1898 # ================================================ @@ -2085,9 +2098,20 @@ FF41..FF5A ; Ll # [26] FULLWIDTH LATIN SMALL LETTER A..FULLWIDTH LATIN SMALL 1DF00..1DF09 ; Ll # [10] LATIN SMALL LETTER FENG DIGRAPH WITH TRILL..LATIN SMALL LETTER T WITH HOOK AND RETROFLEX HOOK 1DF0B..1DF1E ; Ll # [20] LATIN SMALL LETTER ESH WITH DOUBLE BAR..LATIN SMALL LETTER S WITH CURL 1DF25..1DF2A ; Ll # [6] LATIN SMALL LETTER D WITH MID-HEIGHT LEFT HOOK..LATIN SMALL LETTER T WITH MID-HEIGHT LEFT HOOK +1DF69 ; Ll # LATIN SMALL LETTER PHONOTYPIC A WITH SWASH +1DF6B ; Ll # LATIN SMALL LETTER PHONOTYPIC ROUNDTOP A +1DF6D ; Ll # LATIN SMALL LETTER REVERSED SCRUPLE +1DF6F..1DF71 ; Ll # [3] LATIN SMALL LETTER PHONOTYPIC DIPHTHONG AI..LATIN SMALL LETTER STRETCHED I +1DF73 ; Ll # LATIN SMALL LETTER O WITH CURL +1DF75 ; Ll # LATIN SMALL LETTER CLOSED OMEGA WITH LONG STEM +1DF77 ; Ll # LATIN SMALL LETTER TURNED CLOSED OMEGA +1DF79 ; Ll # LATIN SMALL LETTER PHONOTYPIC TH +1DF7B ; Ll # LATIN SMALL LETTER U WITH HOOK TAIL +1DF7D ; Ll # LATIN SMALL LETTER U WITH NOTCH AT BOTTOM +1DF7F ; Ll # LATIN SMALL LETTER REVERSED U 1E922..1E943 ; Ll # [34] ADLAM SMALL LETTER ALIF..ADLAM SMALL LETTER SHA -# Total code points: 2283 +# Total code points: 2296 # ================================================ @@ -2677,6 +2701,7 @@ FFDA..FFDC ; Lo # [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGUL LETTER I 1BC80..1BC88 ; Lo # [9] DUPLOYAN AFFIX HIGH ACUTE..DUPLOYAN AFFIX HIGH VERTICAL 1BC90..1BC99 ; Lo # [10] DUPLOYAN AFFIX LOW ACUTE..DUPLOYAN AFFIX LOW ARROW 1DF0A ; Lo # LATIN LETTER RETROFLEX CLICK WITH RETROFLEX HOOK +1DF80..1DF81 ; Lo # [2] LATIN CAPITAL LETTER A WITH TOPBAR..LATIN CAPITAL LETTER E WITH BENT TOPBAR 1E100..1E12C ; Lo # [45] NYIAKENG PUACHUE HMONG LETTER MA..NYIAKENG PUACHUE HMONG LETTER W 1E14E ; Lo # NYIAKENG PUACHUE HMONG LOGOGRAM NYAJ 1E290..1E2AD ; Lo # [30] TOTO LETTER PA..TOTO LETTER A @@ -2738,7 +2763,7 @@ FFDA..FFDC ; Lo # [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGUL LETTER I 30000..3134A ; Lo # [4939] CJK UNIFIED IDEOGRAPH-30000..CJK UNIFIED IDEOGRAPH-3134A 31350..33479 ; Lo # [8490] CJK UNIFIED IDEOGRAPH-31350..CJK UNIFIED IDEOGRAPH-33479 -# Total code points: 141081 +# Total code points: 141083 # ================================================ @@ -3671,6 +3696,7 @@ FF0D ; Pd # FULLWIDTH HYPHEN-MINUS 2E57 ; Ps # LEFT SQUARE BRACKET WITH DOUBLE STROKE 2E59 ; Ps # TOP HALF LEFT PARENTHESIS 2E5B ; Ps # BOTTOM HALF LEFT PARENTHESIS +2E62 ; Ps # LEFT PARENTHESIS WITH MIDDLE RING 3008 ; Ps # LEFT ANGLE BRACKET 300A ; Ps # LEFT DOUBLE ANGLE BRACKET 300C ; Ps # LEFT CORNER BRACKET @@ -3701,7 +3727,7 @@ FF5B ; Ps # FULLWIDTH LEFT CURLY BRACKET FF5F ; Ps # FULLWIDTH LEFT WHITE PARENTHESIS FF62 ; Ps # HALFWIDTH LEFT CORNER BRACKET -# Total code points: 79 +# Total code points: 80 # ================================================ @@ -3754,6 +3780,7 @@ FF62 ; Ps # HALFWIDTH LEFT CORNER BRACKET 2E58 ; Pe # RIGHT SQUARE BRACKET WITH DOUBLE STROKE 2E5A ; Pe # TOP HALF RIGHT PARENTHESIS 2E5C ; Pe # BOTTOM HALF RIGHT PARENTHESIS +2E63 ; Pe # RIGHT PARENTHESIS WITH MIDDLE RING 3009 ; Pe # RIGHT ANGLE BRACKET 300B ; Pe # RIGHT DOUBLE ANGLE BRACKET 300D ; Pe # RIGHT CORNER BRACKET @@ -3784,7 +3811,7 @@ FF5D ; Pe # FULLWIDTH RIGHT CURLY BRACKET FF60 ; Pe # FULLWIDTH RIGHT WHITE PARENTHESIS FF63 ; Pe # HALFWIDTH RIGHT CORNER BRACKET -# Total code points: 77 +# Total code points: 78 # ================================================ @@ -3894,6 +3921,7 @@ FF3F ; Pc # FULLWIDTH LOW LINE 2E41 ; Po # REVERSED COMMA 2E43..2E4F ; Po # [13] DASH WITH LEFT UPTURN..CORNISH VERSE DIVIDER 2E52..2E54 ; Po # [3] TIRONIAN SIGN CAPITAL ET..MEDIEVAL QUESTION MARK +2E60..2E61 ; Po # [2] WIGGLY EXCLAMATION MARK..INVERTED WIGGLY EXCLAMATION MARK 3001..3003 ; Po # [3] IDEOGRAPHIC COMMA..DITTO MARK 303D ; Po # PART ALTERNATION MARK 30FB ; Po # KATAKANA MIDDLE DOT @@ -3998,7 +4026,7 @@ FF64..FF65 ; Po # [2] HALFWIDTH IDEOGRAPHIC COMMA..HALFWIDTH KATAKANA MIDDL 1E5FF ; Po # OL ONAL ABBREVIATION SIGN 1E95E..1E95F ; Po # [2] ADLAM INITIAL EXCLAMATION MARK..ADLAM INITIAL QUESTION MARK -# Total code points: 641 +# Total code points: 643 # ================================================ diff --git a/unicodetools/data/ucd/dev/extracted/DerivedLineBreak.txt b/unicodetools/data/ucd/dev/extracted/DerivedLineBreak.txt index 03b4c0a9b..48e416c5f 100644 --- a/unicodetools/data/ucd/dev/extracted/DerivedLineBreak.txt +++ b/unicodetools/data/ucd/dev/extracted/DerivedLineBreak.txt @@ -1,5 +1,5 @@ # DerivedLineBreak-17.0.0.txt -# Date: 2025-01-27, 18:09:13 GMT +# Date: 2025-02-14, 01:57:23 GMT # © 2025 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. # For terms of use and license, see https://www.unicode.org/terms_of_use.html @@ -70,8 +70,8 @@ E000..F8FF ; XX # Co [6400] .. F0000..FFFFD ; XX # Co [65534] .. 100000..10FFFD; XX # Co [65534] .. -# The above property value applies to 757136 code points not listed here. -# Total code points: 894604 +# The above property value applies to 757105 code points not listed here. +# Total code points: 894573 # ================================================ @@ -130,6 +130,7 @@ F0000..FFFFD ; XX # Co [65534] .. 2E57 ; OP # Ps LEFT SQUARE BRACKET WITH DOUBLE STROKE 2E59 ; OP # Ps TOP HALF LEFT PARENTHESIS 2E5B ; OP # Ps BOTTOM HALF LEFT PARENTHESIS +2E62 ; OP # Ps LEFT PARENTHESIS WITH MIDDLE RING 3008 ; OP # Ps LEFT ANGLE BRACKET 300A ; OP # Ps LEFT DOUBLE ANGLE BRACKET 300C ; OP # Ps LEFT CORNER BRACKET @@ -170,7 +171,7 @@ FF62 ; OP # Ps HALFWIDTH LEFT CORNER BRACKET 145CE ; OP # Lo ANATOLIAN HIEROGLYPH A410 BEGIN LOGOGRAM MARK 1E95E..1E95F ; OP # Po [2] ADLAM INITIAL EXCLAMATION MARK..ADLAM INITIAL QUESTION MARK -# Total code points: 95 +# Total code points: 96 # ================================================ @@ -217,6 +218,7 @@ FF62 ; OP # Ps HALFWIDTH LEFT CORNER BRACKET 2E25 ; CL # Pe BOTTOM RIGHT HALF BRACKET 2E27 ; CL # Pe RIGHT SIDEWAYS U BRACKET 2E29 ; CL # Pe RIGHT DOUBLE PARENTHESIS +2E63 ; CL # Pe RIGHT PARENTHESIS WITH MIDDLE RING 3001..3002 ; CL # Po [2] IDEOGRAPHIC COMMA..IDEOGRAPHIC FULL STOP 3009 ; CL # Pe RIGHT ANGLE BRACKET 300B ; CL # Pe RIGHT DOUBLE ANGLE BRACKET @@ -264,7 +266,7 @@ FF64 ; CL # Po HALFWIDTH IDEOGRAPHIC COMMA 1343F ; CL # Cf EGYPTIAN HIEROGLYPH END WALLED ENCLOSURE 145CF ; CL # Lo ANATOLIAN HIEROGLYPH A410A END LOGOGRAM MARK -# Total code points: 94 +# Total code points: 95 # ================================================ @@ -384,6 +386,7 @@ FF9E..FF9F ; NS # Lm [2] HALFWIDTH KATAKANA VOICED SOUND MARK..HALFWIDTH KA 2CFE ; EX # Po COPTIC FULL STOP 2E2E ; EX # Po REVERSED QUESTION MARK 2E53..2E54 ; EX # Po [2] MEDIEVAL EXCLAMATION MARK..MEDIEVAL QUESTION MARK +2E60..2E61 ; EX # Po [2] WIGGLY EXCLAMATION MARK..INVERTED WIGGLY EXCLAMATION MARK A60E ; EX # Po VAI FULL STOP A876..A877 ; EX # Po [2] PHAGS-PA MARK SHAD..PHAGS-PA MARK DOUBLE SHAD FE15..FE16 ; EX # Po [2] PRESENTATION FORM FOR VERTICAL EXCLAMATION MARK..PRESENTATION FORM FOR VERTICAL QUESTION MARK @@ -393,7 +396,7 @@ FF1F ; EX # Po FULLWIDTH QUESTION MARK 115C4..115C5 ; EX # Po [2] SIDDHAM SEPARATOR DOT..SIDDHAM SEPARATOR BAR 11C71 ; EX # Po MARCHEN MARK SHAD -# Total code points: 40 +# Total code points: 42 # ================================================ @@ -1145,7 +1148,7 @@ A788 ; AL # Lm MODIFIER LETTER LOW CIRCUMFLEX ACCENT A789..A78A ; AL # Sk [2] MODIFIER LETTER COLON..MODIFIER LETTER SHORT EQUALS SIGN A78B..A78E ; AL # L& [4] LATIN CAPITAL LETTER SALTILLO..LATIN SMALL LETTER L WITH RETROFLEX HOOK AND BELT A78F ; AL # Lo LATIN LETTER SINOLOGICAL DOT -A790..A7DC ; AL # L& [77] LATIN CAPITAL LETTER N WITH DESCENDER..LATIN CAPITAL LETTER LAMBDA WITH STROKE +A790..A7DD ; AL # L& [78] LATIN CAPITAL LETTER N WITH DESCENDER..LATIN CAPITAL LETTER CLOSED OMEGA A7F1..A7F4 ; AL # Lm [4] MODIFIER LETTER CAPITAL S..MODIFIER LETTER CAPITAL Q A7F5..A7F6 ; AL # L& [2] LATIN CAPITAL LETTER REVERSED HALF H..LATIN SMALL LETTER REVERSED HALF H A7F7 ; AL # Lo LATIN EPIGRAPHIC LETTER SIDEWAYS I @@ -1539,6 +1542,8 @@ FFED..FFEE ; AL # So [2] HALFWIDTH BLACK SQUARE..HALFWIDTH WHITE CIRCLE 1DF0A ; AL # Lo LATIN LETTER RETROFLEX CLICK WITH RETROFLEX HOOK 1DF0B..1DF1E ; AL # L& [20] LATIN SMALL LETTER ESH WITH DOUBLE BAR..LATIN SMALL LETTER S WITH CURL 1DF25..1DF2A ; AL # L& [6] LATIN SMALL LETTER D WITH MID-HEIGHT LEFT HOOK..LATIN SMALL LETTER T WITH MID-HEIGHT LEFT HOOK +1DF68..1DF7F ; AL # L& [24] LATIN CAPITAL LETTER PHONOTYPIC A WITH SWASH..LATIN SMALL LETTER REVERSED U +1DF80..1DF81 ; AL # Lo [2] LATIN CAPITAL LETTER A WITH TOPBAR..LATIN CAPITAL LETTER E WITH BENT TOPBAR 1E030..1E06D ; AL # Lm [62] MODIFIER LETTER CYRILLIC SMALL A..MODIFIER LETTER CYRILLIC SMALL STRAIGHT U WITH STROKE 1E100..1E12C ; AL # Lo [45] NYIAKENG PUACHUE HMONG LETTER MA..NYIAKENG PUACHUE HMONG LETTER W 1E137..1E13D ; AL # Lm [7] NYIAKENG PUACHUE HMONG SIGN FOR PERSON..NYIAKENG PUACHUE HMONG SYLLABLE LENGTHENER @@ -1642,7 +1647,7 @@ FFED..FFEE ; AL # So [2] HALFWIDTH BLACK SQUARE..HALFWIDTH WHITE CIRCLE 1FB94..1FBEF ; AL # So [92] LEFT HALF INVERSE MEDIUM SHADE AND RIGHT HALF BLOCK..TOP LEFT JUSTIFIED LOWER RIGHT QUARTER BLACK CIRCLE 1FBFA ; AL # So ALARM BELL SYMBOL -# Total code points: 26987 +# Total code points: 27014 # ================================================ diff --git a/unicodetools/data/ucd/dev/extracted/DerivedName.txt b/unicodetools/data/ucd/dev/extracted/DerivedName.txt index 5876213a1..bbd0fa053 100644 --- a/unicodetools/data/ucd/dev/extracted/DerivedName.txt +++ b/unicodetools/data/ucd/dev/extracted/DerivedName.txt @@ -1,5 +1,5 @@ # DerivedName-17.0.0.txt -# Date: 2025-01-27, 18:09:14 GMT +# Date: 2025-02-11, 13:48:10 GMT # © 2025 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. # For terms of use and license, see https://www.unicode.org/terms_of_use.html @@ -10908,6 +10908,10 @@ 2E5B ; BOTTOM HALF LEFT PARENTHESIS 2E5C ; BOTTOM HALF RIGHT PARENTHESIS 2E5D ; OBLIQUE HYPHEN +2E60 ; WIGGLY EXCLAMATION MARK +2E61 ; INVERTED WIGGLY EXCLAMATION MARK +2E62 ; LEFT PARENTHESIS WITH MIDDLE RING +2E63 ; RIGHT PARENTHESIS WITH MIDDLE RING 2E80 ; CJK RADICAL REPEAT 2E81 ; CJK RADICAL CLIFF 2E82 ; CJK RADICAL SECOND ONE @@ -14296,6 +14300,7 @@ A7D9 ; LATIN SMALL LETTER SIGMOID S A7DA ; LATIN CAPITAL LETTER LAMBDA A7DB ; LATIN SMALL LETTER LAMBDA A7DC ; LATIN CAPITAL LETTER LAMBDA WITH STROKE +A7DD ; LATIN CAPITAL LETTER CLOSED OMEGA A7F1 ; MODIFIER LETTER CAPITAL S A7F2 ; MODIFIER LETTER CAPITAL C A7F3 ; MODIFIER LETTER CAPITAL F @@ -41883,6 +41888,32 @@ FFFD ; REPLACEMENT CHARACTER 1DF28 ; LATIN SMALL LETTER R WITH MID-HEIGHT LEFT HOOK 1DF29 ; LATIN SMALL LETTER S WITH MID-HEIGHT LEFT HOOK 1DF2A ; LATIN SMALL LETTER T WITH MID-HEIGHT LEFT HOOK +1DF68 ; LATIN CAPITAL LETTER PHONOTYPIC A WITH SWASH +1DF69 ; LATIN SMALL LETTER PHONOTYPIC A WITH SWASH +1DF6A ; LATIN CAPITAL LETTER PHONOTYPIC ROUNDTOP A +1DF6B ; LATIN SMALL LETTER PHONOTYPIC ROUNDTOP A +1DF6C ; LATIN CAPITAL LETTER REVERSED SCRUPLE +1DF6D ; LATIN SMALL LETTER REVERSED SCRUPLE +1DF6E ; LATIN CAPITAL LETTER PHONOTYPIC DIPHTHONG AI +1DF6F ; LATIN SMALL LETTER PHONOTYPIC DIPHTHONG AI +1DF70 ; LATIN SMALL LETTER I WITH PIGTAIL AT BOTTOM +1DF71 ; LATIN SMALL LETTER STRETCHED I +1DF72 ; LATIN CAPITAL LETTER O WITH CURL +1DF73 ; LATIN SMALL LETTER O WITH CURL +1DF74 ; LATIN CAPITAL LETTER CLOSED OMEGA WITH LONG STEM +1DF75 ; LATIN SMALL LETTER CLOSED OMEGA WITH LONG STEM +1DF76 ; LATIN CAPITAL LETTER TURNED CLOSED OMEGA +1DF77 ; LATIN SMALL LETTER TURNED CLOSED OMEGA +1DF78 ; LATIN CAPITAL LETTER PHONOTYPIC TH +1DF79 ; LATIN SMALL LETTER PHONOTYPIC TH +1DF7A ; LATIN CAPITAL LETTER U WITH HOOK TAIL +1DF7B ; LATIN SMALL LETTER U WITH HOOK TAIL +1DF7C ; LATIN CAPITAL LETTER U WITH NOTCH AT BOTTOM +1DF7D ; LATIN SMALL LETTER U WITH NOTCH AT BOTTOM +1DF7E ; LATIN CAPITAL LETTER REVERSED ENLARGED SMALL U +1DF7F ; LATIN SMALL LETTER REVERSED U +1DF80 ; LATIN CAPITAL LETTER A WITH TOPBAR +1DF81 ; LATIN CAPITAL LETTER E WITH BENT TOPBAR 1E000 ; COMBINING GLAGOLITIC LETTER AZU 1E001 ; COMBINING GLAGOLITIC LETTER BUKY 1E002 ; COMBINING GLAGOLITIC LETTER VEDE @@ -45870,6 +45901,6 @@ E01ED ; VARIATION SELECTOR-254 E01EE ; VARIATION SELECTOR-255 E01EF ; VARIATION SELECTOR-256 -# Total code points: 159834 +# Total code points: 159865 # EOF diff --git a/unicodetools/src/main/resources/org/unicode/text/UCD/AdditionComparisons/179.txt b/unicodetools/src/main/resources/org/unicode/text/UCD/AdditionComparisons/179.txt new file mode 100644 index 000000000..333b8749a --- /dev/null +++ b/unicodetools/src/main/resources/org/unicode/text/UCD/AdditionComparisons/179.txt @@ -0,0 +1,77 @@ +# Latin (and Punctuation): English Phonotypic Alphabet +# https://github.com/unicode-org/utc-release-management/issues/179 + +# Names always differ. +# Age always differs since these tests are comparing additions to pre-existing characters. +Ignoring Name Age: + +# Ignore the security and IDNA properties, as these are not yet included for provisionally assigned characters. +Ignoring Confusable_MA Identifier_Status Identifier_Type Idn_Status Idn_Mapping Idn_2008: + +Propertywise [ + \x{2E60} \N{WIGGLY EXCLAMATION MARK} + \x{2E61} \N{INVERTED WIGGLY EXCLAMATION MARK} + \x{2E2E} ⸮ \N{REVERSED QUESTION MARK} +] AreAlike + +Propertywise [\x{2E60} \N{WIGGLY EXCLAMATION MARK} + \x{2E61} \N{INVERTED WIGGLY EXCLAMATION MARK}] +CorrespondTo [\x{0021} ! \N{EXCLAMATION MARK}] + UpTo: East_Asian_Width (Neutral vs Narrow), + Block (Supplemental_Punctuation vs Basic_Latin) + +Propertywise [\x{2E62} \N{LEFT PARENTHESIS WITH MIDDLE RING}] + : [\x{2E63} \N{RIGHT PARENTHESIS WITH MIDDLE RING}] +CorrespondTo [\x{2E28} ⸨ \N{LEFT DOUBLE PARENTHESIS}] + : [\x{2E29} ⸩ \N{RIGHT DOUBLE PARENTHESIS}] + +Ignoring Unicode_1_Name: +Propertywise [\x{A7DD} \N{LATIN CAPITAL LETTER CLOSED OMEGA}] + : [\x{0277} ɷ \N{LATIN SMALL LETTER CLOSED OMEGA}] +CorrespondTo [\x{A7AD} Ɬ \N{LATIN CAPITAL LETTER L WITH BELT}] + : [\x{026C} ɬ \N{LATIN SMALL LETTER L WITH BELT}] +end Ignoring; + +Propertywise [\x{1DF68} \N{LATIN CAPITAL LETTER PHONOTYPIC A WITH SWASH} + \x{1DF6A} \N{LATIN CAPITAL LETTER PHONOTYPIC ROUNDTOP A} + \x{1DF6C} \N{LATIN CAPITAL LETTER REVERSED SCRUPLE} + \x{1DF6E} \N{LATIN CAPITAL LETTER PHONOTYPIC DIPHTHONG AI} + \x{1DF72} \N{LATIN CAPITAL LETTER O WITH CURL} + \x{1DF74} \N{LATIN CAPITAL LETTER CLOSED OMEGA WITH LONG STEM} + \x{1DF76} \N{LATIN CAPITAL LETTER TURNED CLOSED OMEGA} + \x{1DF78} \N{LATIN CAPITAL LETTER PHONOTYPIC TH} + \x{1DF7A} \N{LATIN CAPITAL LETTER U WITH HOOK TAIL} + \x{1DF7C} \N{LATIN CAPITAL LETTER U WITH NOTCH AT BOTTOM} + \x{1DF7E} \N{LATIN CAPITAL LETTER REVERSED ENLARGED SMALL U}] + : [\x{1DF69} \N{LATIN SMALL LETTER PHONOTYPIC A WITH SWASH} + \x{1DF6B} \N{LATIN SMALL LETTER PHONOTYPIC ROUNDTOP A} + \x{1DF6D} \N{LATIN SMALL LETTER REVERSED SCRUPLE} + \x{1DF6F} \N{LATIN SMALL LETTER PHONOTYPIC DIPHTHONG AI} + \x{1DF73} \N{LATIN SMALL LETTER O WITH CURL} + \x{1DF75} \N{LATIN SMALL LETTER CLOSED OMEGA WITH LONG STEM} + \x{1DF77} \N{LATIN SMALL LETTER TURNED CLOSED OMEGA} + \x{1DF79} \N{LATIN SMALL LETTER PHONOTYPIC TH} + \x{1DF7B} \N{LATIN SMALL LETTER U WITH HOOK TAIL} + \x{1DF7D} \N{LATIN SMALL LETTER U WITH NOTCH AT BOTTOM} + \x{1DF7F} \N{LATIN SMALL LETTER REVERSED U}] +CorrespondTo [\x{A79A} Ꞛ \N{LATIN CAPITAL LETTER VOLAPUK AE}] + : [\x{A79B} ꞛ \N{LATIN SMALL LETTER VOLAPUK AE}] + UpTo: Block (Latin_Extended_G vs Latin_Extended_D) + +Propertywise [ + \x{1DF70} \N{LATIN SMALL LETTER I WITH PIGTAIL AT BOTTOM} + \x{1DF71} \N{LATIN SMALL LETTER STRETCHED I} + \x{1DF03} 𝼃 \N{LATIN SMALL LETTER REVERSED K} +] AreAlike + +Ignoring Block: +Propertywise [ + \x{1DF80} \N{LATIN CAPITAL LETTER A WITH TOPBAR} + \x{1DF81} \N{LATIN CAPITAL LETTER E WITH BENT TOPBAR} + \x{A7FB} ꟻ \N{LATIN EPIGRAPHIC LETTER REVERSED F} +] AreAlike +end Ignoring; + +end Ignoring; + +end Ignoring; \ No newline at end of file