From 9c032a040629f1780c37ebf49a79afb4176b91fd Mon Sep 17 00:00:00 2001 From: Robin Leroy Date: Tue, 3 Oct 2023 01:16:07 +0200 Subject: [PATCH] Regenerate UCD --- .../data/ucd/dev/IndicPositionalCategory.txt | 40 ++++++------- .../data/ucd/dev/IndicSyllabicCategory.txt | 57 ++++++++----------- 2 files changed, 41 insertions(+), 56 deletions(-) diff --git a/unicodetools/data/ucd/dev/IndicPositionalCategory.txt b/unicodetools/data/ucd/dev/IndicPositionalCategory.txt index 1bdddd705..a4d04a2a1 100644 --- a/unicodetools/data/ucd/dev/IndicPositionalCategory.txt +++ b/unicodetools/data/ucd/dev/IndicPositionalCategory.txt @@ -1,30 +1,11 @@ -# Indic_Positional_Category=Right -113B8 ; Right # Mc [3] TULU-TIGALARI VOWEL SIGN AA -113C9..113CA ; Right # Mc [2] TULU-TIGALARI AU LENGTH MARK..TULU-TIGALARI SIGN CANDRA ANUNASIKA -113CC..113CD ; Right # Mc [2] TULU-TIGALARI SIGN ANUSVARA..TULU-TIGALARI SIGN VISARGA -113CF ; Right # Mc TULU-TIGALARI SIGN LOOPED VIRAMA -# Indic_Positional_Category=Left -113C2 ; Left # Mc TULU-TIGALARI VOWEL SIGN EE -113C5 ; Left # Mc TULU-TIGALARI VOWEL SIGN AI -# Indic_Positional_Category=Left_And_Right -113C7..113C8 ; Left_And_Right # Mc [2] TULU-TIGALARI VOWEL SIGN OO..TULU-TIGALARI VOWEL SIGN AU -# Indic_Positional_Category=Top -113CE ; Top # Mn TULU-TIGALARI SIGN VIRAMA -113D1 ; Top # Lo TULU-TIGALARI REPHA -113E1 ; Top # Mn TULU-TIGALARI VEDIC TONE SVARITA -# Indic_Positional_Category=Bottom -113BB..113C0 ; Bottom # Mn [6] TULU-TIGALARI VOWEL SIGN U..TULU-TIGALARI VOWEL SIGN VOCALIC LL -113E2 ; Bottom # Mn TULU-TIGALARI VEDIC TONE ANUDATTA -# Indic_Positional_Category=Top_And_Right -113B9..113BA ; Top_And_Right # Mc [2] TULU-TIGALARI VOWEL SIGN I..TULU-TIGALARI VOWEL SIGN II -# IndicPositionalCategory-15.1.0.txt -# Date: 2023-01-05 +# IndicPositionalCategory-16.0.0.txt +# Date: 2023-10-02, 23:15:32 GMT # © 2023 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. # For terms of use, see https://www.unicode.org/terms_of_use.html # -# For documentation, see UAX #44: Unicode Character Database, -# at https://www.unicode.org/reports/tr44/ +# Unicode Character Database +# For documentation, see https://www.unicode.org/reports/tr44/ # # This file defines the following property: # @@ -277,6 +258,10 @@ ABEC ; Right # Mc MEETEI MAYEK LUM IYEK 1134D ; Right # Mc GRANTHA SIGN VIRAMA 11357 ; Right # Mc GRANTHA AU LENGTH MARK 11362..11363 ; Right # Mc [2] GRANTHA VOWEL SIGN VOCALIC L..GRANTHA VOWEL SIGN VOCALIC LL +113B8 ; Right # Mc TULU-TIGALARI VOWEL SIGN AA +113C9..113CA ; Right # Mc [2] TULU-TIGALARI AU LENGTH MARK..TULU-TIGALARI SIGN CANDRA ANUNASIKA +113CC..113CD ; Right # Mc [2] TULU-TIGALARI SIGN ANUSVARA..TULU-TIGALARI SIGN VISARGA +113CF ; Right # Mc TULU-TIGALARI SIGN LOOPED VIRAMA 11435 ; Right # Mc NEWA VOWEL SIGN AA 11437 ; Right # Mc NEWA VOWEL SIGN II 11440..11441 ; Right # Mc [2] NEWA VOWEL SIGN O..NEWA VOWEL SIGN AU @@ -355,6 +340,8 @@ AAEE ; Left # Mc MEETEI MAYEK VOWEL SIGN AU 111CE ; Left # Mc SHARADA VOWEL SIGN PRISHTHAMATRA E 112E1 ; Left # Mc KHUDAWADI VOWEL SIGN I 11347..11348 ; Left # Mc [2] GRANTHA VOWEL SIGN EE..GRANTHA VOWEL SIGN AI +113C2 ; Left # Mc TULU-TIGALARI VOWEL SIGN EE +113C5 ; Left # Mc TULU-TIGALARI VOWEL SIGN AI 11436 ; Left # Mc NEWA VOWEL SIGN I 114B1 ; Left # Mc TIRHUTA VOWEL SIGN I 114B9 ; Left # Mc TIRHUTA VOWEL SIGN E @@ -401,6 +388,7 @@ AABB..AABC ; Visual_Order_Left # Lo [2] TAI VIET VOWEL AUE..TAI VIET VOWEL 17C4..17C5 ; Left_And_Right # Mc [2] KHMER VOWEL SIGN OO..KHMER VOWEL SIGN AU 1B40..1B41 ; Left_And_Right # Mc [2] BALINESE VOWEL SIGN TALING TEDUNG..BALINESE VOWEL SIGN TALING REPA TEDUNG 1134B..1134C ; Left_And_Right # Mc [2] GRANTHA VOWEL SIGN OO..GRANTHA VOWEL SIGN AU +113C7..113C8 ; Left_And_Right # Mc [2] TULU-TIGALARI VOWEL SIGN OO..TULU-TIGALARI VOWEL SIGN AU 114BC ; Left_And_Right # Mc TIRHUTA VOWEL SIGN O 114BE ; Left_And_Right # Mc TIRHUTA VOWEL SIGN AU 115BA ; Left_And_Right # Mc SIDDHAM VOWEL SIGN O @@ -563,6 +551,9 @@ ABE5 ; Top # Mn MEETEI MAYEK VOWEL SIGN ANAP 11340 ; Top # Mn GRANTHA VOWEL SIGN II 11366..1136C ; Top # Mn [7] COMBINING GRANTHA DIGIT ZERO..COMBINING GRANTHA DIGIT SIX 11370..11374 ; Top # Mn [5] COMBINING GRANTHA LETTER A..COMBINING GRANTHA LETTER PA +113CE ; Top # Mn TULU-TIGALARI SIGN VIRAMA +113D1 ; Top # Lo TULU-TIGALARI REPHA +113E1 ; Top # Mn TULU-TIGALARI VEDIC TONE SVARITA 1143E..1143F ; Top # Mn [2] NEWA VOWEL SIGN E..NEWA VOWEL SIGN AI 11443..11444 ; Top # Mn [2] NEWA SIGN CANDRABINDU..NEWA SIGN ANUSVARA 1145E ; Top # Mn NEWA SANDHI MARK @@ -721,6 +712,8 @@ ABED ; Bottom # Mn MEETEI MAYEK APUN IYEK 112E3..112E4 ; Bottom # Mn [2] KHUDAWADI VOWEL SIGN U..KHUDAWADI VOWEL SIGN UU 112E9..112EA ; Bottom # Mn [2] KHUDAWADI SIGN NUKTA..KHUDAWADI SIGN VIRAMA 1133B..1133C ; Bottom # Mn [2] COMBINING BINDU BELOW..GRANTHA SIGN NUKTA +113BB..113C0 ; Bottom # Mn [6] TULU-TIGALARI VOWEL SIGN U..TULU-TIGALARI VOWEL SIGN VOCALIC LL +113E2 ; Bottom # Mn TULU-TIGALARI VEDIC TONE ANUDATTA 11438..1143D ; Bottom # Mn [6] NEWA VOWEL SIGN U..NEWA VOWEL SIGN VOCALIC LL 11442 ; Bottom # Mn NEWA SIGN VIRAMA 11446 ; Bottom # Mn NEWA SIGN NUKTA @@ -780,6 +773,7 @@ ABED ; Bottom # Mn MEETEI MAYEK APUN IYEK 1B43 ; Top_And_Right # Mc BALINESE VOWEL SIGN PEPET TEDUNG 111BF ; Top_And_Right # Mc SHARADA VOWEL SIGN AU 11232..11233 ; Top_And_Right # Mc [2] KHOJKI VOWEL SIGN O..KHOJKI VOWEL SIGN AU +113B9..113BA ; Top_And_Right # Mc [2] TULU-TIGALARI VOWEL SIGN I..TULU-TIGALARI VOWEL SIGN II # Indic_Positional_Category=Top_And_Left diff --git a/unicodetools/data/ucd/dev/IndicSyllabicCategory.txt b/unicodetools/data/ucd/dev/IndicSyllabicCategory.txt index 68e85e206..f6eefdde8 100644 --- a/unicodetools/data/ucd/dev/IndicSyllabicCategory.txt +++ b/unicodetools/data/ucd/dev/IndicSyllabicCategory.txt @@ -1,39 +1,11 @@ -# Indic_Syllabic_Category=Bindu -113CA ; Bindu # Mc TULU-TIGALARI SIGN CANDRA ANUNASIKA -113CC ; Bindu # Mc TULU-TIGALARI SIGN ANUSVARA -# Indic_Syllabic_Category=Visarga -113CD ; Visarga # Mc TULU-TIGALARI SIGN VISARGA -# Indic_Syllabic_Category=Avagraha -113B7 ; Avagraha # Lo TULU-TIGALARI SIGN AVAGRAHA -# Indic_Syllabic_Category=Pure_Killer -113CE..113CF ; Pure_Killer # Mn [2] TULU-TIGALARI SIGN VIRAMA..TULU-TIGALARI SIGN LOOPED VIRAMA -# Indic_Syllabic_Category=Invisible_Stacker -113D0 ; Invisible_Stacker # Mn TULU-TIGALARI CONJOINER -# Indic_Syllabic_Category=Vowel_Independent -11380..11389 ; Vowel_Independent # Lo [10] TULU-TIGALARI LETTER A..TULU-TIGALARI LETTER VOCALIC LL -1138B ; Vowel_Independent # Lo TULU-TIGALARI LETTER EE -1138E ; Vowel_Independent # Lo TULU-TIGALARI LETTER AI -11390..11391 ; Vowel_Independent # Lo [2] TULU-TIGALARI LETTER OO..TULU-TIGALARI LETTER VOCALIC AU -# Indic_Syllabic_Category=Vowel_Dependent -113B8..113BA ; Vowel_Dependent # Mc [3] TULU-TIGALARI VOWEL SIGN AA..TIGALARI VOWEL SIGN VOCALIC II -113BB..113C0 ; Vowel_Dependent # Mn [6] TULU-TIGALARI VOWEL SIGN U..TIGALARI VOWEL SIGN VOCALIC LL -113C2 ; Vowel_Dependent # Mn TIGALARI VOWEL SIGN EE -113C5 ; Vowel_Dependent # Mn TIGALARI VOWEL SIGN AI -113C7..113C9 ; Vowel_Dependent # Mc [3] TIGALARI VOWEL SIGN OO..TIGALARI VOWEL AU LENGTH MARK -# Indic_Syllabic_Category=Consonant -11392..113B5 ; Consonant # Lo [36] TULU-TIGALARI LETTER KA..TULU-TIGALARI LETTER LLLA -# Indic_Syllabic_Category=Cantillation_Mark -113E1..113E2 ; Cantillation_Mark # Mn [2] TULU-TIGALARI VEDIC TONE SVARITA..TULU-TIGALARI VEDIC TONE ANUDATTA -# Indic_Syllabic_Category=Consonant_Preceding_Repha -113D1 ; Consonant_Preceding_Repha # Lo TULU-TIGALARI REPHA -# IndicSyllabicCategory-15.1.0.txt -# Date: 2023-01-05 +# IndicSyllabicCategory-16.0.0.txt +# Date: 2023-10-02, 23:15:32 GMT # © 2023 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. # For terms of use, see https://www.unicode.org/terms_of_use.html # -# For documentation, see UAX #44: Unicode Character Database, -# at https://www.unicode.org/reports/tr44/ +# Unicode Character Database +# For documentation, see https://www.unicode.org/reports/tr44/ # # This file defines the following property: # @@ -147,6 +119,8 @@ A980..A981 ; Bindu # Mn [2] JAVANESE SIGN PANYANGGA..JAVANESE SIGN CECAK 11300..11301 ; Bindu # Mn [2] GRANTHA SIGN COMBINING ANUSVARA ABOVE..GRANTHA SIGN CANDRABINDU 11302 ; Bindu # Mc GRANTHA SIGN ANUSVARA 1135E..1135F ; Bindu # Lo [2] GRANTHA LETTER VEDIC ANUSVARA..GRANTHA LETTER VEDIC DOUBLE ANUSVARA +113CA ; Bindu # Mc TULU-TIGALARI SIGN CANDRA ANUNASIKA +113CC ; Bindu # Mc TULU-TIGALARI SIGN ANUSVARA 11443..11444 ; Bindu # Mn [2] NEWA SIGN CANDRABINDU..NEWA SIGN ANUSVARA 1145F ; Bindu # Lo NEWA LETTER VEDIC ANUSVARA 114BF..114C0 ; Bindu # Mn [2] TIRHUTA SIGN CANDRABINDU..TIRHUTA SIGN ANUSVARA @@ -197,6 +171,7 @@ AAF5 ; Visarga # Mc MEETEI MAYEK VOWEL SIGN VISARGA 11102 ; Visarga # Mn CHAKMA SIGN VISARGA 11182 ; Visarga # Mc SHARADA SIGN VISARGA 11303 ; Visarga # Mc GRANTHA SIGN VISARGA +113CD ; Visarga # Mc TULU-TIGALARI SIGN VISARGA 11445 ; Visarga # Mc NEWA SIGN VISARGA 114C1 ; Visarga # Mc TIRHUTA SIGN VISARGA 115BE ; Visarga # Mc SIDDHAM SIGN VISARGA @@ -231,6 +206,7 @@ AAF5 ; Visarga # Mc MEETEI MAYEK VOWEL SIGN VISARGA 1BBA ; Avagraha # Lo SUNDANESE AVAGRAHA 111C1 ; Avagraha # Lo SHARADA SIGN AVAGRAHA 1133D ; Avagraha # Lo GRANTHA SIGN AVAGRAHA +113B7 ; Avagraha # Lo TULU-TIGALARI SIGN AVAGRAHA 11447 ; Avagraha # Lo NEWA SIGN AVAGRAHA 114C4 ; Avagraha # Lo TIRHUTA SIGN AVAGRAHA 119E1 ; Avagraha # Lo NANDINAGARI SIGN AVAGRAHA @@ -347,6 +323,8 @@ ABED ; Pure_Killer # Mn MEETEI MAYEK APUN IYEK 11070 ; Pure_Killer # Mn BRAHMI SIGN OLD TAMIL VIRAMA 11134 ; Pure_Killer # Mn CHAKMA MAAYYAA 112EA ; Pure_Killer # Mn KHUDAWADI SIGN VIRAMA +113CE ; Pure_Killer # Mn TULU-TIGALARI SIGN VIRAMA +113CF ; Pure_Killer # Mc TULU-TIGALARI SIGN LOOPED VIRAMA 1172B ; Pure_Killer # Mn AHOM SIGN KILLER 1193D ; Pure_Killer # Mc DIVES AKURU SIGN HALANTA 11A34 ; Pure_Killer # Mn ZANABAZAR SQUARE SIGN VIRAMA @@ -373,6 +351,7 @@ ABED ; Pure_Killer # Mn MEETEI MAYEK APUN IYEK AAF6 ; Invisible_Stacker # Mn MEETEI MAYEK VIRAMA 10A3F ; Invisible_Stacker # Mn KHAROSHTHI VIRAMA 11133 ; Invisible_Stacker # Mn CHAKMA VIRAMA +113D0 ; Invisible_Stacker # Mn TULU-TIGALARI CONJOINER 1193E ; Invisible_Stacker # Mn DIVES AKURU VIRAMA 11A47 ; Invisible_Stacker # Mn ZANABAZAR SQUARE SUBJOINER 11A99 ; Invisible_Stacker # Mn SOYOMBO SUBJOINER @@ -456,6 +435,10 @@ ABD1 ; Vowel_Independent # Lo MEETEI MAYEK LETTER ATIYA 1130F..11310 ; Vowel_Independent # Lo [2] GRANTHA LETTER EE..GRANTHA LETTER AI 11313..11314 ; Vowel_Independent # Lo [2] GRANTHA LETTER OO..GRANTHA LETTER AU 11360..11361 ; Vowel_Independent # Lo [2] GRANTHA LETTER VOCALIC RR..GRANTHA LETTER VOCALIC LL +11380..11389 ; Vowel_Independent # Lo [10] TULU-TIGALARI LETTER A..TULU-TIGALARI LETTER VOCALIC LL +1138B ; Vowel_Independent # Lo TULU-TIGALARI LETTER EE +1138E ; Vowel_Independent # Lo TULU-TIGALARI LETTER AI +11390..11391 ; Vowel_Independent # Lo [2] TULU-TIGALARI LETTER OO..TULU-TIGALARI LETTER AU 11400..1140D ; Vowel_Independent # Lo [14] NEWA LETTER A..NEWA LETTER AU 11481..1148E ; Vowel_Independent # Lo [14] TIRHUTA LETTER A..TIRHUTA LETTER AU 11580..1158D ; Vowel_Independent # Lo [14] SIDDHAM LETTER A..SIDDHAM LETTER AU @@ -683,6 +666,11 @@ ABE9..ABEA ; Vowel_Dependent # Mc [2] MEETEI MAYEK VOWEL SIGN CHEINAP..MEET 1134B..1134C ; Vowel_Dependent # Mc [2] GRANTHA VOWEL SIGN OO..GRANTHA VOWEL SIGN AU 11357 ; Vowel_Dependent # Mc GRANTHA AU LENGTH MARK 11362..11363 ; Vowel_Dependent # Mc [2] GRANTHA VOWEL SIGN VOCALIC L..GRANTHA VOWEL SIGN VOCALIC LL +113B8..113BA ; Vowel_Dependent # Mc [3] TULU-TIGALARI VOWEL SIGN AA..TULU-TIGALARI VOWEL SIGN II +113BB..113C0 ; Vowel_Dependent # Mn [6] TULU-TIGALARI VOWEL SIGN U..TULU-TIGALARI VOWEL SIGN VOCALIC LL +113C2 ; Vowel_Dependent # Mc TULU-TIGALARI VOWEL SIGN EE +113C5 ; Vowel_Dependent # Mc TULU-TIGALARI VOWEL SIGN AI +113C7..113C9 ; Vowel_Dependent # Mc [3] TULU-TIGALARI VOWEL SIGN OO..TULU-TIGALARI AU LENGTH MARK 11435..11437 ; Vowel_Dependent # Mc [3] NEWA VOWEL SIGN AA..NEWA VOWEL SIGN II 11438..1143F ; Vowel_Dependent # Mn [8] NEWA VOWEL SIGN U..NEWA VOWEL SIGN AI 11440..11441 ; Vowel_Dependent # Mc [2] NEWA VOWEL SIGN O..NEWA VOWEL SIGN AU @@ -929,6 +917,7 @@ ABD2..ABDA ; Consonant # Lo [9] MEETEI MAYEK LETTER GOK..MEETEI MAYEK LETTE 1132A..11330 ; Consonant # Lo [7] GRANTHA LETTER PA..GRANTHA LETTER RA 11332..11333 ; Consonant # Lo [2] GRANTHA LETTER LA..GRANTHA LETTER LLA 11335..11339 ; Consonant # Lo [5] GRANTHA LETTER VA..GRANTHA LETTER HA +11392..113B5 ; Consonant # Lo [36] TULU-TIGALARI LETTER KA..TULU-TIGALARI LETTER LLLA 1140E..11434 ; Consonant # Lo [39] NEWA LETTER KA..NEWA LETTER HA 1148F..114AF ; Consonant # Lo [33] TIRHUTA LETTER KA..TIRHUTA LETTER HA 1158E..115AE ; Consonant # Lo [33] SIDDHAM LETTER KA..SIDDHAM LETTER HA @@ -1003,6 +992,7 @@ ABD2..ABDA ; Consonant # Lo [9] MEETEI MAYEK LETTER GOK..MEETEI MAYEK LETTE # [Not derivable] 0D4E ; Consonant_Preceding_Repha # Lo MALAYALAM LETTER DOT REPH +113D1 ; Consonant_Preceding_Repha # Lo TULU-TIGALARI REPHA 11941 ; Consonant_Preceding_Repha # Lo DIVES AKURU INITIAL RA 11D46 ; Consonant_Preceding_Repha # Lo MASARAM GONDI REPHA 11F02 ; Consonant_Preceding_Repha # Lo KAWI SIGN REPHA @@ -1209,6 +1199,7 @@ A8E0..A8F1 ; Cantillation_Mark # Mn [18] COMBINING DEVANAGARI DIGIT ZERO..CO 1123E ; Cantillation_Mark # Mn KHOJKI SIGN SUKUN 11366..1136C ; Cantillation_Mark # Mn [7] COMBINING GRANTHA DIGIT ZERO..COMBINING GRANTHA DIGIT SIX 11370..11374 ; Cantillation_Mark # Mn [5] COMBINING GRANTHA LETTER A..COMBINING GRANTHA LETTER PA +113E1..113E2 ; Cantillation_Mark # Mn [2] TULU-TIGALARI VEDIC TONE SVARITA..TULU-TIGALARI VEDIC TONE ANUDATTA # ================================================ @@ -1363,7 +1354,7 @@ ABF0..ABF9 ; Number # Nd [10] MEETEI MAYEK DIGIT ZERO..MEETEI MAYEK DIGIT NI # script, e.g. in Brahmi) # # Note: These are different from Numbers, in the way that there is no known -# evidence of Brahmi Joining Numbers taking vowels or subjoined consonants. +# evidence of Brahmi Joining Numbers taking vowels or subjoined consonants. # Until such evidence is found, implementations may assume that Brahmi # Joining Numbers only participate in shaping with other Brahmi Joining # Numbers.