Skip to content

Commit

Permalink
Merge remote-tracking branch 'la-vache/main' into cjk-extension-j
Browse files Browse the repository at this point in the history
  • Loading branch information
eggrobin committed Nov 14, 2024
2 parents 7f18dec + 5a39610 commit e8ac7ad
Show file tree
Hide file tree
Showing 20 changed files with 124 additions and 36 deletions.
1 change: 1 addition & 0 deletions unicodetools/data/ucd/dev/Blocks.txt
Original file line number Diff line number Diff line change
Expand Up @@ -228,6 +228,7 @@ FFF0..FFFF; Specials
108E0..108FF; Hatran
10900..1091F; Phoenician
10920..1093F; Lydian
10940..1095C; Sidetic
10980..1099F; Meroitic Hieroglyphs
109A0..109FF; Meroitic Cursive
10A00..10A5F; Kharoshthi
Expand Down
5 changes: 3 additions & 2 deletions unicodetools/data/ucd/dev/DerivedAge.txt
Original file line number Diff line number Diff line change
@@ -1,5 +1,5 @@
# DerivedAge-17.0.0.txt
# Date: 2024-11-14, 15:01:57 GMT
# Date: 2024-11-14, 15:03:59 GMT
# © 2024 Unicode®, Inc.
# Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries.
# For terms of use and license, see https://www.unicode.org/terms_of_use.html
Expand Down Expand Up @@ -2080,9 +2080,10 @@ A7F1 ; 17.0 # MODIFIER LETTER CAPITAL S
FBC3..FBD2 ; 17.0 # [16] ARABIC LIGATURE JALLA WA-ALAA..ARABIC LIGATURE ALAYHI AR-RAHMAH
FD90..FD91 ; 17.0 # [2] ARABIC LIGATURE RAHMATU ALLAAHI ALAYH..ARABIC LIGATURE RAHMATU ALLAAHI ALAYHAA
FDC8..FDCE ; 17.0 # [7] ARABIC LIGATURE RAHIMAHU ALLAAH TAAALAA..ARABIC LIGATURE KARRAMA ALLAAHU WAJHAH
10940..1095C ; 17.0 # [29] SIDETIC LETTER N01..SIDETIC LETTER N29
10ED1..10ED8 ; 17.0 # [8] ARABIC LIGATURE ALAYHAA AS-SALAATU WAS-SALAAM..ARABIC LIGATURE NAWWARA ALLAAHU MARQADAH
323B0..33479 ; 17.0 # [4298] CJK UNIFIED IDEOGRAPH-323B0..CJK UNIFIED IDEOGRAPH-33479

# Total code points: 4370
# Total code points: 4399

# EOF
20 changes: 13 additions & 7 deletions unicodetools/data/ucd/dev/DerivedCoreProperties.txt
Original file line number Diff line number Diff line change
@@ -1,5 +1,5 @@
# DerivedCoreProperties-17.0.0.txt
# Date: 2024-11-14, 15:02:17 GMT
# Date: 2024-11-14, 15:04:19 GMT
# © 2024 Unicode®, Inc.
# Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries.
# For terms of use and license, see https://www.unicode.org/terms_of_use.html
Expand Down Expand Up @@ -1018,6 +1018,7 @@ FFDA..FFDC ; Alphabetic # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANG
108F4..108F5 ; Alphabetic # Lo [2] HATRAN LETTER SHIN..HATRAN LETTER TAW
10900..10915 ; Alphabetic # Lo [22] PHOENICIAN LETTER ALF..PHOENICIAN LETTER TAU
10920..10939 ; Alphabetic # Lo [26] LYDIAN LETTER A..LYDIAN LETTER C
10940..1095C ; Alphabetic # Lo [29] SIDETIC LETTER N01..SIDETIC LETTER N29
10980..109B7 ; Alphabetic # Lo [56] MEROITIC HIEROGLYPHIC LETTER A..MEROITIC CURSIVE LETTER DA
109BE..109BF ; Alphabetic # Lo [2] MEROITIC CURSIVE LOGOGRAM RMT..MEROITIC CURSIVE LOGOGRAM IMN
10A00 ; Alphabetic # Lo KHAROSHTHI LETTER A
Expand Down Expand Up @@ -1439,7 +1440,7 @@ FFDA..FFDC ; Alphabetic # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANG
30000..3134A ; Alphabetic # Lo [4939] CJK UNIFIED IDEOGRAPH-30000..CJK UNIFIED IDEOGRAPH-3134A
31350..33479 ; Alphabetic # Lo [8490] CJK UNIFIED IDEOGRAPH-31350..CJK UNIFIED IDEOGRAPH-33479

# Total code points: 147066
# Total code points: 147095

# ================================================

Expand Down Expand Up @@ -6710,6 +6711,7 @@ FFDA..FFDC ; ID_Start # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGUL
108F4..108F5 ; ID_Start # Lo [2] HATRAN LETTER SHIN..HATRAN LETTER TAW
10900..10915 ; ID_Start # Lo [22] PHOENICIAN LETTER ALF..PHOENICIAN LETTER TAU
10920..10939 ; ID_Start # Lo [26] LYDIAN LETTER A..LYDIAN LETTER C
10940..1095C ; ID_Start # Lo [29] SIDETIC LETTER N01..SIDETIC LETTER N29
10980..109B7 ; ID_Start # Lo [56] MEROITIC HIEROGLYPHIC LETTER A..MEROITIC CURSIVE LETTER DA
109BE..109BF ; ID_Start # Lo [2] MEROITIC CURSIVE LOGOGRAM RMT..MEROITIC CURSIVE LOGOGRAM IMN
10A00 ; ID_Start # Lo KHAROSHTHI LETTER A
Expand Down Expand Up @@ -6970,7 +6972,7 @@ FFDA..FFDC ; ID_Start # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGUL
30000..3134A ; ID_Start # Lo [4939] CJK UNIFIED IDEOGRAPH-30000..CJK UNIFIED IDEOGRAPH-3134A
31350..33479 ; ID_Start # Lo [8490] CJK UNIFIED IDEOGRAPH-31350..CJK UNIFIED IDEOGRAPH-33479

# Total code points: 145576
# Total code points: 145605

# ================================================

Expand Down Expand Up @@ -7864,6 +7866,7 @@ FFDA..FFDC ; ID_Continue # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HAN
108F4..108F5 ; ID_Continue # Lo [2] HATRAN LETTER SHIN..HATRAN LETTER TAW
10900..10915 ; ID_Continue # Lo [22] PHOENICIAN LETTER ALF..PHOENICIAN LETTER TAU
10920..10939 ; ID_Continue # Lo [26] LYDIAN LETTER A..LYDIAN LETTER C
10940..1095C ; ID_Continue # Lo [29] SIDETIC LETTER N01..SIDETIC LETTER N29
10980..109B7 ; ID_Continue # Lo [56] MEROITIC HIEROGLYPHIC LETTER A..MEROITIC CURSIVE LETTER DA
109BE..109BF ; ID_Continue # Lo [2] MEROITIC CURSIVE LOGOGRAM RMT..MEROITIC CURSIVE LOGOGRAM IMN
10A00 ; ID_Continue # Lo KHAROSHTHI LETTER A
Expand Down Expand Up @@ -8377,7 +8380,7 @@ FFDA..FFDC ; ID_Continue # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HAN
31350..33479 ; ID_Continue # Lo [8490] CJK UNIFIED IDEOGRAPH-31350..CJK UNIFIED IDEOGRAPH-33479
E0100..E01EF ; ID_Continue # Mn [240] VARIATION SELECTOR-17..VARIATION SELECTOR-256

# Total code points: 148877
# Total code points: 148906

# ================================================

Expand Down Expand Up @@ -8893,6 +8896,7 @@ FFDA..FFDC ; XID_Start # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGU
108F4..108F5 ; XID_Start # Lo [2] HATRAN LETTER SHIN..HATRAN LETTER TAW
10900..10915 ; XID_Start # Lo [22] PHOENICIAN LETTER ALF..PHOENICIAN LETTER TAU
10920..10939 ; XID_Start # Lo [26] LYDIAN LETTER A..LYDIAN LETTER C
10940..1095C ; XID_Start # Lo [29] SIDETIC LETTER N01..SIDETIC LETTER N29
10980..109B7 ; XID_Start # Lo [56] MEROITIC HIEROGLYPHIC LETTER A..MEROITIC CURSIVE LETTER DA
109BE..109BF ; XID_Start # Lo [2] MEROITIC CURSIVE LOGOGRAM RMT..MEROITIC CURSIVE LOGOGRAM IMN
10A00 ; XID_Start # Lo KHAROSHTHI LETTER A
Expand Down Expand Up @@ -9153,7 +9157,7 @@ FFDA..FFDC ; XID_Start # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGU
30000..3134A ; XID_Start # Lo [4939] CJK UNIFIED IDEOGRAPH-30000..CJK UNIFIED IDEOGRAPH-3134A
31350..33479 ; XID_Start # Lo [8490] CJK UNIFIED IDEOGRAPH-31350..CJK UNIFIED IDEOGRAPH-33479

# Total code points: 145553
# Total code points: 145582

# ================================================

Expand Down Expand Up @@ -10048,6 +10052,7 @@ FFDA..FFDC ; XID_Continue # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HA
108F4..108F5 ; XID_Continue # Lo [2] HATRAN LETTER SHIN..HATRAN LETTER TAW
10900..10915 ; XID_Continue # Lo [22] PHOENICIAN LETTER ALF..PHOENICIAN LETTER TAU
10920..10939 ; XID_Continue # Lo [26] LYDIAN LETTER A..LYDIAN LETTER C
10940..1095C ; XID_Continue # Lo [29] SIDETIC LETTER N01..SIDETIC LETTER N29
10980..109B7 ; XID_Continue # Lo [56] MEROITIC HIEROGLYPHIC LETTER A..MEROITIC CURSIVE LETTER DA
109BE..109BF ; XID_Continue # Lo [2] MEROITIC CURSIVE LOGOGRAM RMT..MEROITIC CURSIVE LOGOGRAM IMN
10A00 ; XID_Continue # Lo KHAROSHTHI LETTER A
Expand Down Expand Up @@ -10561,7 +10566,7 @@ FFDA..FFDC ; XID_Continue # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HA
31350..33479 ; XID_Continue # Lo [8490] CJK UNIFIED IDEOGRAPH-31350..CJK UNIFIED IDEOGRAPH-33479
E0100..E01EF ; XID_Continue # Mn [240] VARIATION SELECTOR-17..VARIATION SELECTOR-256

# Total code points: 148858
# Total code points: 148887

# ================================================

Expand Down Expand Up @@ -12284,6 +12289,7 @@ FFFC..FFFD ; Grapheme_Base # So [2] OBJECT REPLACEMENT CHARACTER..REPLACEME
1091F ; Grapheme_Base # Po PHOENICIAN WORD SEPARATOR
10920..10939 ; Grapheme_Base # Lo [26] LYDIAN LETTER A..LYDIAN LETTER C
1093F ; Grapheme_Base # Po LYDIAN TRIANGULAR MARK
10940..1095C ; Grapheme_Base # Lo [29] SIDETIC LETTER N01..SIDETIC LETTER N29
10980..109B7 ; Grapheme_Base # Lo [56] MEROITIC HIEROGLYPHIC LETTER A..MEROITIC CURSIVE LETTER DA
109BC..109BD ; Grapheme_Base # No [2] MEROITIC CURSIVE FRACTION ELEVEN TWELFTHS..MEROITIC CURSIVE FRACTION ONE HALF
109BE..109BF ; Grapheme_Base # Lo [2] MEROITIC CURSIVE LOGOGRAM RMT..MEROITIC CURSIVE LOGOGRAM IMN
Expand Down Expand Up @@ -12817,7 +12823,7 @@ FFFC..FFFD ; Grapheme_Base # So [2] OBJECT REPLACEMENT CHARACTER..REPLACEME
30000..3134A ; Grapheme_Base # Lo [4939] CJK UNIFIED IDEOGRAPH-30000..CJK UNIFIED IDEOGRAPH-3134A
31350..33479 ; Grapheme_Base # Lo [8490] CJK UNIFIED IDEOGRAPH-31350..CJK UNIFIED IDEOGRAPH-33479

# Total code points: 157071
# Total code points: 157100

# ================================================

Expand Down
3 changes: 2 additions & 1 deletion unicodetools/data/ucd/dev/EastAsianWidth.txt
Original file line number Diff line number Diff line change
@@ -1,5 +1,5 @@
# EastAsianWidth-17.0.0.txt
# Date: 2024-11-14, 15:02:21 GMT
# Date: 2024-11-14, 15:04:25 GMT
# © 2024 Unicode®, Inc.
# Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries.
# For terms of use and license, see https://www.unicode.org/terms_of_use.html
Expand Down Expand Up @@ -1904,6 +1904,7 @@ FFFD ; A # So REPLACEMENT CHARACTER
1091F ; N # Po PHOENICIAN WORD SEPARATOR
10920..10939 ; N # Lo [26] LYDIAN LETTER A..LYDIAN LETTER C
1093F ; N # Po LYDIAN TRIANGULAR MARK
10940..1095C ; N # Lo [29] SIDETIC LETTER N01..SIDETIC LETTER N29
10980..1099F ; N # Lo [32] MEROITIC HIEROGLYPHIC LETTER A..MEROITIC HIEROGLYPHIC SYMBOL VIDJ-2
109A0..109B7 ; N # Lo [24] MEROITIC CURSIVE LETTER A..MEROITIC CURSIVE LETTER DA
109BC..109BD ; N # No [2] MEROITIC CURSIVE FRACTION ELEVEN TWELFTHS..MEROITIC CURSIVE FRACTION ONE HALF
Expand Down
3 changes: 2 additions & 1 deletion unicodetools/data/ucd/dev/LineBreak.txt
Original file line number Diff line number Diff line change
@@ -1,5 +1,5 @@
# LineBreak-17.0.0.txt
# Date: 2024-11-14, 15:02:22 GMT
# Date: 2024-11-14, 15:04:26 GMT
# © 2024 Unicode®, Inc.
# Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries.
# For terms of use and license, see https://www.unicode.org/terms_of_use.html
Expand Down Expand Up @@ -2759,6 +2759,7 @@ FFFD ; AI # So REPLACEMENT CHARACTER
1091F ; BA # Po PHOENICIAN WORD SEPARATOR
10920..10939 ; AL # Lo [26] LYDIAN LETTER A..LYDIAN LETTER C
1093F ; AL # Po LYDIAN TRIANGULAR MARK
10940..1095C ; AL # Lo [29] SIDETIC LETTER N01..SIDETIC LETTER N29
10980..1099F ; AL # Lo [32] MEROITIC HIEROGLYPHIC LETTER A..MEROITIC HIEROGLYPHIC SYMBOL VIDJ-2
109A0..109B7 ; AL # Lo [24] MEROITIC CURSIVE LETTER A..MEROITIC CURSIVE LETTER DA
109BC..109BD ; AL # No [2] MEROITIC CURSIVE FRACTION ELEVEN TWELFTHS..MEROITIC CURSIVE FRACTION ONE HALF
Expand Down
4 changes: 3 additions & 1 deletion unicodetools/data/ucd/dev/PropertyValueAliases.txt
Original file line number Diff line number Diff line change
@@ -1,5 +1,5 @@
# PropertyValueAliases-17.0.0.txt
# Date: 2024-10-16, 13:48:47 GMT
# Date: 2024-11-14, 15:04:37 GMT
# © 2024 Unicode®, Inc.
# Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries.
# For terms of use and license, see https://www.unicode.org/terms_of_use.html
Expand Down Expand Up @@ -424,6 +424,7 @@ blk; Sharada ; Sharada
blk; Shavian ; Shavian
blk; Shorthand_Format_Controls ; Shorthand_Format_Controls
blk; Siddham ; Siddham
blk; Sidetic ; Sidetic
blk; Sinhala ; Sinhala
blk; Sinhala_Archaic_Numbers ; Sinhala_Archaic_Numbers
blk; Small_Forms ; Small_Form_Variants
Expand Down Expand Up @@ -1440,6 +1441,7 @@ sc ; Sgnw ; SignWriting
sc ; Shaw ; Shavian
sc ; Shrd ; Sharada
sc ; Sidd ; Siddham
sc ; Sidt ; Sidetic
sc ; Sind ; Khudawadi
sc ; Sinh ; Sinhala
sc ; Sogd ; Sogdian
Expand Down
4 changes: 2 additions & 2 deletions unicodetools/data/ucd/dev/ScriptExtensions.txt
Original file line number Diff line number Diff line change
@@ -1,5 +1,5 @@
# ScriptExtensions-16.0.0.txt
# Date: 2024-07-30, 19:38:00 GMT
# ScriptExtensions-17.0.0.txt
# Date: 2024-10-16, 17:28:17 GMT
# © 2024 Unicode®, Inc.
# Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries.
# For terms of use and license, see https://www.unicode.org/terms_of_use.html
Expand Down
8 changes: 7 additions & 1 deletion unicodetools/data/ucd/dev/Scripts.txt
Original file line number Diff line number Diff line change
@@ -1,5 +1,5 @@
# Scripts-17.0.0.txt
# Date: 2024-11-14, 15:02:45 GMT
# Date: 2024-11-14, 15:04:49 GMT
# © 2024 Unicode®, Inc.
# Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries.
# For terms of use and license, see https://www.unicode.org/terms_of_use.html
Expand Down Expand Up @@ -3127,4 +3127,10 @@ ABF0..ABF9 ; Meetei_Mayek # Nd [10] MEETEI MAYEK DIGIT ZERO..MEETEI MAYEK DI

# Total code points: 80

# ================================================

10940..1095C ; Sidetic # Lo [29] SIDETIC LETTER N01..SIDETIC LETTER N29

# Total code points: 29

# EOF
29 changes: 29 additions & 0 deletions unicodetools/data/ucd/dev/UnicodeData.txt
Original file line number Diff line number Diff line change
Expand Up @@ -18772,6 +18772,35 @@ FFFD;REPLACEMENT CHARACTER;So;0;ON;;;;;N;;;;;
10938;LYDIAN LETTER NN;Lo;0;R;;;;;N;;;;;
10939;LYDIAN LETTER C;Lo;0;R;;;;;N;;;;;
1093F;LYDIAN TRIANGULAR MARK;Po;0;R;;;;;N;;;;;
10940;SIDETIC LETTER N01;Lo;0;R;;;;;N;;;;;
10941;SIDETIC LETTER N02;Lo;0;R;;;;;N;;;;;
10942;SIDETIC LETTER N03;Lo;0;R;;;;;N;;;;;
10943;SIDETIC LETTER N04;Lo;0;R;;;;;N;;;;;
10944;SIDETIC LETTER N05;Lo;0;R;;;;;N;;;;;
10945;SIDETIC LETTER N06;Lo;0;R;;;;;N;;;;;
10946;SIDETIC LETTER N07;Lo;0;R;;;;;N;;;;;
10947;SIDETIC LETTER N08;Lo;0;R;;;;;N;;;;;
10948;SIDETIC LETTER N09;Lo;0;R;;;;;N;;;;;
10949;SIDETIC LETTER N10;Lo;0;R;;;;;N;;;;;
1094A;SIDETIC LETTER N11;Lo;0;R;;;;;N;;;;;
1094B;SIDETIC LETTER N12;Lo;0;R;;;;;N;;;;;
1094C;SIDETIC LETTER N13;Lo;0;R;;;;;N;;;;;
1094D;SIDETIC LETTER N14;Lo;0;R;;;;;N;;;;;
1094E;SIDETIC LETTER N15;Lo;0;R;;;;;N;;;;;
1094F;SIDETIC LETTER N16;Lo;0;R;;;;;N;;;;;
10950;SIDETIC LETTER N17;Lo;0;R;;;;;N;;;;;
10951;SIDETIC LETTER N18;Lo;0;R;;;;;N;;;;;
10952;SIDETIC LETTER N19;Lo;0;R;;;;;N;;;;;
10953;SIDETIC LETTER N20;Lo;0;R;;;;;N;;;;;
10954;SIDETIC LETTER N21;Lo;0;R;;;;;N;;;;;
10955;SIDETIC LETTER N22;Lo;0;R;;;;;N;;;;;
10956;SIDETIC LETTER N23;Lo;0;R;;;;;N;;;;;
10957;SIDETIC LETTER N24;Lo;0;R;;;;;N;;;;;
10958;SIDETIC LETTER N25;Lo;0;R;;;;;N;;;;;
10959;SIDETIC LETTER N26;Lo;0;R;;;;;N;;;;;
1095A;SIDETIC LETTER N27;Lo;0;R;;;;;N;;;;;
1095B;SIDETIC LETTER N28;Lo;0;R;;;;;N;;;;;
1095C;SIDETIC LETTER N29;Lo;0;R;;;;;N;;;;;
10980;MEROITIC HIEROGLYPHIC LETTER A;Lo;0;R;;;;;N;;;;;
10981;MEROITIC HIEROGLYPHIC LETTER E;Lo;0;R;;;;;N;;;;;
10982;MEROITIC HIEROGLYPHIC LETTER I;Lo;0;R;;;;;N;;;;;
Expand Down
3 changes: 2 additions & 1 deletion unicodetools/data/ucd/dev/VerticalOrientation.txt
Original file line number Diff line number Diff line change
@@ -1,5 +1,5 @@
# VerticalOrientation-17.0.0.txt
# Date: 2024-11-14, 15:02:47 GMT
# Date: 2024-11-14, 15:04:52 GMT
# © 2024 Unicode®, Inc.
# Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries.
# For terms of use and license, see https://www.unicode.org/terms_of_use.html
Expand Down Expand Up @@ -1725,6 +1725,7 @@ FFFC..FFFD ; U # So [2] OBJECT REPLACEMENT CHARACTER..REPLACEMENT CHARA
1091F ; R # Po PHOENICIAN WORD SEPARATOR
10920..10939 ; R # Lo [26] LYDIAN LETTER A..LYDIAN LETTER C
1093F ; R # Po LYDIAN TRIANGULAR MARK
10940..1095C ; R # Lo [29] SIDETIC LETTER N01..SIDETIC LETTER N29
10980..1099F ; U # Lo [32] MEROITIC HIEROGLYPHIC LETTER A..MEROITIC HIEROGLYPHIC SYMBOL VIDJ-2
109A0..109B7 ; R # Lo [24] MEROITIC CURSIVE LETTER A..MEROITIC CURSIVE LETTER DA
109BC..109BD ; R # No [2] MEROITIC CURSIVE FRACTION ELEVEN TWELFTHS..MEROITIC CURSIVE FRACTION ONE HALF
Expand Down
5 changes: 3 additions & 2 deletions unicodetools/data/ucd/dev/auxiliary/SentenceBreakProperty.txt
Original file line number Diff line number Diff line change
@@ -1,5 +1,5 @@
# SentenceBreakProperty-17.0.0.txt
# Date: 2024-11-14, 15:02:45 GMT
# Date: 2024-11-14, 15:04:50 GMT
# © 2024 Unicode®, Inc.
# Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries.
# For terms of use and license, see https://www.unicode.org/terms_of_use.html
Expand Down Expand Up @@ -2372,6 +2372,7 @@ FFDA..FFDC ; OLetter # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGUL
108F4..108F5 ; OLetter # Lo [2] HATRAN LETTER SHIN..HATRAN LETTER TAW
10900..10915 ; OLetter # Lo [22] PHOENICIAN LETTER ALF..PHOENICIAN LETTER TAU
10920..10939 ; OLetter # Lo [26] LYDIAN LETTER A..LYDIAN LETTER C
10940..1095C ; OLetter # Lo [29] SIDETIC LETTER N01..SIDETIC LETTER N29
10980..109B7 ; OLetter # Lo [56] MEROITIC HIEROGLYPHIC LETTER A..MEROITIC CURSIVE LETTER DA
109BE..109BF ; OLetter # Lo [2] MEROITIC CURSIVE LOGOGRAM RMT..MEROITIC CURSIVE LOGOGRAM IMN
10A00 ; OLetter # Lo KHAROSHTHI LETTER A
Expand Down Expand Up @@ -2591,7 +2592,7 @@ FFDA..FFDC ; OLetter # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGUL
30000..3134A ; OLetter # Lo [4939] CJK UNIFIED IDEOGRAPH-30000..CJK UNIFIED IDEOGRAPH-3134A
31350..33479 ; OLetter # Lo [8490] CJK UNIFIED IDEOGRAPH-31350..CJK UNIFIED IDEOGRAPH-33479

# Total code points: 141211
# Total code points: 141240

# ================================================

Expand Down
5 changes: 3 additions & 2 deletions unicodetools/data/ucd/dev/auxiliary/WordBreakProperty.txt
Original file line number Diff line number Diff line change
@@ -1,5 +1,5 @@
# WordBreakProperty-17.0.0.txt
# Date: 2024-11-13, 22:19:12 GMT
# Date: 2024-11-14, 14:37:47 GMT
# © 2024 Unicode®, Inc.
# Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries.
# For terms of use and license, see https://www.unicode.org/terms_of_use.html
Expand Down Expand Up @@ -1114,6 +1114,7 @@ FFDA..FFDC ; ALetter # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGUL
108F4..108F5 ; ALetter # Lo [2] HATRAN LETTER SHIN..HATRAN LETTER TAW
10900..10915 ; ALetter # Lo [22] PHOENICIAN LETTER ALF..PHOENICIAN LETTER TAU
10920..10939 ; ALetter # Lo [26] LYDIAN LETTER A..LYDIAN LETTER C
10940..1095C ; ALetter # Lo [29] SIDETIC LETTER N01..SIDETIC LETTER N29
10980..109B7 ; ALetter # Lo [56] MEROITIC HIEROGLYPHIC LETTER A..MEROITIC CURSIVE LETTER DA
109BE..109BF ; ALetter # Lo [2] MEROITIC CURSIVE LOGOGRAM RMT..MEROITIC CURSIVE LOGOGRAM IMN
10A00 ; ALetter # Lo KHAROSHTHI LETTER A
Expand Down Expand Up @@ -1354,7 +1355,7 @@ FFDA..FFDC ; ALetter # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGUL
1F150..1F169 ; ALetter # So [26] NEGATIVE CIRCLED LATIN CAPITAL LETTER A..NEGATIVE CIRCLED LATIN CAPITAL LETTER Z
1F170..1F189 ; ALetter # So [26] NEGATIVE SQUARED LATIN CAPITAL LETTER A..NEGATIVE SQUARED LATIN CAPITAL LETTER Z

# Total code points: 33800
# Total code points: 33829

# ================================================

Expand Down
6 changes: 4 additions & 2 deletions unicodetools/data/ucd/dev/extracted/DerivedBidiClass.txt
Original file line number Diff line number Diff line change
@@ -1,5 +1,5 @@
# DerivedBidiClass-17.0.0.txt
# Date: 2024-11-14, 15:02:15 GMT
# Date: 2024-11-14, 15:04:17 GMT
# © 2024 Unicode®, Inc.
# Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries.
# For terms of use and license, see https://www.unicode.org/terms_of_use.html
Expand Down Expand Up @@ -67,6 +67,7 @@
# 108E0..108FF Hatran
# 10900..1091F Phoenician
# 10920..1093F Lydian
# 10940..1095C Sidetic
# 10980..1099F Meroitic_Hieroglyphs
# 109A0..109FF Meroitic_Cursive
# 10A00..10A5F Kharoshthi
Expand Down Expand Up @@ -1267,6 +1268,7 @@ FB46..FB4F ; R # Lo [10] HEBREW LETTER TSADI WITH DAGESH..HEBREW LIGATURE AL
10916..1091B ; R # No [6] PHOENICIAN NUMBER ONE..PHOENICIAN NUMBER THREE
10920..10939 ; R # Lo [26] LYDIAN LETTER A..LYDIAN LETTER C
1093F ; R # Po LYDIAN TRIANGULAR MARK
10940..1095C ; R # Lo [29] SIDETIC LETTER N01..SIDETIC LETTER N29
10980..109B7 ; R # Lo [56] MEROITIC HIEROGLYPHIC LETTER A..MEROITIC CURSIVE LETTER DA
109BC..109BD ; R # No [2] MEROITIC CURSIVE FRACTION ELEVEN TWELFTHS..MEROITIC CURSIVE FRACTION ONE HALF
109BE..109BF ; R # Lo [2] MEROITIC CURSIVE LOGOGRAM RMT..MEROITIC CURSIVE LOGOGRAM IMN
Expand Down Expand Up @@ -1325,7 +1327,7 @@ FB46..FB4F ; R # Lo [10] HEBREW LETTER TSADI WITH DAGESH..HEBREW LIGATURE AL
1E950..1E959 ; R # Nd [10] ADLAM DIGIT ZERO..ADLAM DIGIT NINE
1E95E..1E95F ; R # Po [2] ADLAM INITIAL EXCLAMATION MARK..ADLAM INITIAL QUESTION MARK

# The above property value applies to 2087 code points not listed here.
# The above property value applies to 2058 code points not listed here.
# Total code points: 3631

# ================================================
Expand Down
Loading

0 comments on commit e8ac7ad

Please sign in to comment.