|
17 | 17 | "ancient_greek": "αβγδεζηθικλμνξοπρστυφχψωΑΒΓΔΕΖΗΘΙΚΛΜΝΞΟΠΡΣΤΥΦΧΨΩ", |
18 | 18 | "arabic_letters": "ءآأؤإئابةتثجحخدذرزسشصضطظعغـفقكلمنهوىي", |
19 | 19 | "persian_letters": "پچڢڤگ", |
20 | | - "hindi_digits": "٠١٢٣٤٥٦٧٨٩", |
| 20 | + "arabic_digits": "٠١٢٣٤٥٦٧٨٩", |
21 | 21 | "arabic_diacritics": "ًٌٍَُِّْ", |
22 | 22 | "arabic_punctuation": "؟؛«»—", |
| 23 | + "hindi_letters": "अआइईउऊऋॠऌॡएऐओऔअंअःकखगघङचछजझञटठडढणतथदधनपफबभमयरलवशषसह", |
| 24 | + "hindi_digits": "०१२३४५६७८९", |
| 25 | + "hindi_punctuation": "।,?!:्ॐ॰॥॰", |
| 26 | + "bangla_letters": "অআইঈউঊঋএঐওঔকখগঘঙচছজঝঞটঠডঢণতথদধনপফবভমযরলশষসহ়ঽািীুূৃেৈোৌ্ৎংঃঁ", |
| 27 | + "bangla_digits": "০১২৩৪৫৬৭৮৯", |
23 | 28 | } |
24 | 29 |
|
25 | 30 | VOCABS["latin"] = VOCABS["digits"] + VOCABS["ascii_letters"] + VOCABS["punctuation"] |
|
32 | 37 | VOCABS["german"] = VOCABS["english"] + "äöüßÄÖÜẞ" |
33 | 38 | VOCABS["arabic"] = ( |
34 | 39 | VOCABS["digits"] |
35 | | - + VOCABS["hindi_digits"] |
| 40 | + + VOCABS["arabic_digits"] |
36 | 41 | + VOCABS["arabic_letters"] |
37 | 42 | + VOCABS["persian_letters"] |
38 | 43 | + VOCABS["arabic_diacritics"] |
|
52 | 57 | + "ÁÀẢẠÃĂẮẰẲẴẶÂẤẦẨẪẬÉÈẺẼẸÊẾỀỂỄỆÓÒỎÕỌÔỐỒỔỘỖƠỚỜỞỢỠÚÙỦŨỤƯỨỪỬỮỰIÍÌỈĨỊÝỲỶỸỴ" |
53 | 58 | ) |
54 | 59 | VOCABS["hebrew"] = VOCABS["english"] + "אבגדהוזחטיכלמנסעפצקרשת" + "₪" |
| 60 | +VOCABS["hindi"] = VOCABS["hindi_letters"] + VOCABS["hindi_digits"] + VOCABS["hindi_punctuation"] |
| 61 | +VOCABS["bangla"] = VOCABS["bangla_letters"] + VOCABS["bangla_digits"] |
55 | 62 | VOCABS["multilingual"] = "".join( |
56 | 63 | dict.fromkeys( |
57 | 64 | VOCABS["french"] |
|
0 commit comments