Skip to content

Commit 647947f

Browse files
LaurenzValerque
authored and committed
[USE] Update the data files
1 parent bd68568 commit 647947f

7 files changed

+485
-547
lines changed

scripts/ms-use/IndicPositionalCategory-Additional.txt

+5-4
Original file line number | Diff line number | Diff line change
@@ -49,7 +49,7 @@ A9BE ; Right # Mc JAVANESE CONSONANT SIGN PENGKAL # Reduced from
4949
AA35   ; Top # Mn       CHAM CONSONANT SIGN
5050
1112A..1112B ; Top # Mn [2] CHAKMA VOWEL SIGN U..CHAKMA VOWEL SIGN UU # see USE issue #25
5151
11131..11132 ; Top # Mn [2] CHAKMA O MARK..CHAKMA AU MARK # see USE issue #25
52-
1E4EC..1E4EF ; Top # Mn [4] NAG MUNDARI SIGN MUHOR..NAG MUNDARI SIGN SUTUH # 1E4EE is below, but made to for ccc
52+
1E4EC..1E4EF ; Top # Mn [4] NAG MUNDARI SIGN MUHOR..NAG MUNDARI SIGN SUTUH # 1E4EE is below, but made Top for ccc
5353

5454
# ================================================
5555

@@ -77,11 +77,12 @@ AA35   ; Top # Mn       CHAM CONSONANT SIGN
7777
10F83 ; Bottom # Mn OLD UYGHUR COMBINING DOT BELOW
7878
10F84 ; Bottom # Mn OLD UYGHUR COMBINING TWO DOTS ABOVE # Overridden, ccc controls order
7979
10F85 ; Bottom # Mn OLD UYGHUR COMBINING TWO DOTS BELOW
80+
113CF ; Bottom # Mc TULU-TIGALARI SIGN LOOPED VIRAMA # Issue #17
8081
16F4F ; Bottom # Mn MIAO SIGN CONSONANT MODIFIER BAR
8182
16F51..16F87 ; Bottom # Mc [55] MIAO SIGN ASPIRATION..MIAO VOWEL SIGN UI
8283
16F8F..16F92 ; Bottom # Mn [4] MIAO TONE RIGHT..MIAO TONE BELOW
83-
1E5EE ; Bottom # Mn OL ONAL SIGN MU # Not really below, but need to override to fit into Universal model
84-
1E5EF ; Bottom # Mn OL ONAL SIGN IKIR
84+
1E5EE ; Bottom # Mn OL ONAL SIGN MU # Not really below, but need to override to fit into Universal model
85+
1E5EF ; Bottom # Mn OL ONAL SIGN IKIR
8586

8687
# ================================================
8788

@@ -94,7 +95,7 @@ AA35   ; Top # Mn       CHAM CONSONANT SIGN
9495
07EB..07F3 ; Top # Mn [9] NKO COMBINING SHORT HIGH TONE..NKO COMBINING DOUBLE DOT ABOVE
9596
07FD ; Top # Mn NKO DANTAYALAN # Not really top, but assigned here to allow ccc to control mark order
9697
1885..1886 ; Top # Mn [2] MONGOLIAN LETTER ALI GALI BALUDA..MONGOLIAN LETTER ALI GALI THREE BALUDA
97-
1B6C ; Top # Mn BALINESE MUSICAL SYMBOL COMBINING ENDEP
98+
1B6C ; Top # Mn BALINESE MUSICAL SYMBOL COMBINING ENDEP
9899
1CF8..1CF9 ; Top # Mn [2] VEDIC TONE RING ABOVE..VEDIC TONE DOUBLE RING ABOVE
99100
10D24..10D27 ; Top # Mn [4] HANIFI ROHINGYA SIGN HARBAHAY..HANIFI ROHINGYA SIGN TASSI
100101
10EAB..10EAC ; Top # Mn [2] YEZIDI COMBINING HAMZA MARK..YEZIDI COMBINING MADDA MARK

scripts/ms-use/IndicSyllabicCategory-Additional.txt

+4-5
Original file line number | Diff line number | Diff line change
@@ -13,7 +13,7 @@
1313
# OVERRIDES TO ASSIGNED VALUES
1414
# ================================================
1515

16-
# Indic_Syllabic_Category=Bindu
16+
# Indic_Syllabic_Category=Bindu
1717
193A ; Bindu # Mn LIMBU SIGN KEMPHRENG
1818
AA29 ; Bindu # Mn CHAM VOWEL SIGN AA
1919
10A0D ; Bindu # Mn KHAROSHTHI SIGN DOUBLE RING BELOW
@@ -47,14 +47,13 @@ AA29 ; Bindu # Mn CHAM VOWEL SIGN AA
4747

4848
# ================================================
4949

50-
# Indic_Syllabic_Category=Gemination_Mark
50+
# Indic_Syllabic_Category=Gemination_Mark
5151
11134 ; Gemination_Mark # Mc CHAKMA MAAYYAA
5252

5353
# ================================================
5454

55-
# Indic_Syllabic_Category=Nukta
55+
# Indic_Syllabic_Category=Nukta
5656
0F71 ; Nukta # Mn TIBETAN VOWEL SIGN AA # Reassigned to get this before an above vowel, but see #22
57-
1BF2..1BF3 ; Nukta # Mc [2] BATAK PANGOLAT..BATAK PANONGONAN # see USE issue #20
5857
113CF ; Nukta # Mc TULU-TIGALARI SIGN LOOPED VIRAMA
5958

6059
# ================================================
@@ -115,7 +114,7 @@ AABD ; Vowel_Independent # Lo TAI VIET VOWEL AN
115114
18B00..18CD5 ; Consonant # Lo [470] KHITAN SMALL SCRIPT CHARACTER-18B00..KHITAN SMALL SCRIPT CHARACTER-18CD5
116115
18CFF ; Consonant # Lo KHITAN SMALL SCRIPT CHARACTER-18CFF
117116
1BC00..1BC6A ; Consonant # Lo [107] DUPLOYAN LETTER H..DUPLOYAN LETTER VOCALIC M
118-
1BC70..1BC7C ; Consonant # Lo [13] DUPLOYAN AFFIX LEFT HORIZONTAL SECANT..DUPLOYAN AFFIX ATTACHED TANGENT HOOK
117+
1BC70..1BC7C ; Consonant # Lo [13] DUPLOYAN AFFIX LEFT HORIZONTAL SECANT..DUPLOYAN AFFIX ATTACHED TANGENT HOOK
119118
1BC80..1BC88 ; Consonant # Lo [9] DUPLOYAN AFFIX HIGH ACUTE..DUPLOYAN AFFIX HIGH VERTICAL
120119
1BC90..1BC99 ; Consonant # Lo [10] DUPLOYAN AFFIX LOW ACUTE..DUPLOYAN AFFIX LOW ARROW
121120
1E100..1E12C ; Consonant # Lo [45] NYIAKENG PUACHUE HMONG LETTER MA..NYIAKENG PUACHUE HMONG LETTER W

src/hb/ot_shaper_use.rs

+1
Original file line number | Diff line number | Diff line change
@@ -101,6 +101,7 @@ pub mod category {
101101
pub const HVM: u8 = 53; // HALANT_OR_VOWEL_MODIFIER
102102
pub const HM: u8 = 54; // HIEROGLYPH_MOD
103103
pub const HR: u8 = 55; // HIEROGLYPH_MIRROR
104+
pub const RK: u8 = 56; // REORDERING_KILLER
104105
}
105106

106107
// These features are applied all at once, before reordering,

src/hb/ot_shaper_use_machine.rl

+2-1
Original file line number | Diff line number | Diff line change
@@ -55,6 +55,7 @@ SE = 52; # HIEROGLYPH_SEGMENT_END
5555
HVM = 53; # HALANT_OR_VOWEL_MODIFIER
5656
HM = 54; # HIEROGLYPH_MOD
5757
HR = 55; # HIEROGLYPH_MIRROR
58+
RK = 56; # REORDERING_KILLER
5859

5960
FAbv = 24; # CONS_FINAL_ABOVE
6061
FBlw = 25; # CONS_FINAL_BELOW
@@ -107,7 +108,7 @@ symbol_cluster_tail = SMAbv+ SMBlw* | SMBlw+;
107108

108109
virama_terminated_cluster_tail =
109110
consonant_modifiers
110-
IS
111+
(IS | RK)
111112
;
112113
virama_terminated_cluster =
113114
complex_syllable_start

0 commit comments

Comments
 (0)