From 064c55c7dc2ad1a34e615d1579efe0e229c4226b Mon Sep 17 00:00:00 2001 From: Markus Scherer Date: Sat, 4 May 2024 14:39:31 -0700 Subject: [PATCH] short: ID_Status & ID_Type --- .../data/security/dev/IdentifierStatus.txt | 4 +- .../data/security/dev/IdentifierType.txt | 4 +- .../dev/data/confusablesSummaryIdentifier.txt | 7 +- .../security/dev/data/draft-restrictions.txt | 21 ++- .../data/security/dev/data/review.txt | 122 +++++++++--------- .../java/org/unicode/props/UcdProperty.java | 4 +- .../org/unicode/text/UCD/IdentifierInfo.java | 4 +- .../unicode/props/ExtraPropertyAliases.txt | 6 +- .../props/ExtraPropertyValueAliases.txt | 32 ++--- 9 files changed, 99 insertions(+), 105 deletions(-) diff --git a/unicodetools/data/security/dev/IdentifierStatus.txt b/unicodetools/data/security/dev/IdentifierStatus.txt index 59d3843ff..358bc09f7 100644 --- a/unicodetools/data/security/dev/IdentifierStatus.txt +++ b/unicodetools/data/security/dev/IdentifierStatus.txt @@ -1,5 +1,5 @@ # IdentifierStatus.txt -# Date: 2024-05-03, 03:51:21 GMT +# Date: 2024-05-04, 21:31:06 GMT # © 2024 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. # For terms of use and license, see https://www.unicode.org/terms_of_use.html @@ -16,7 +16,7 @@ # # For the purpose of regular expressions, the property Identifier_Status is defined as # an enumerated property of code points. -# The short name of Identifier_Status is the same as the long name. +# The short name of Identifier_Status is ID_Status. # The possible values are: # Allowed, Restricted # The short name of each value is the same as its long name. diff --git a/unicodetools/data/security/dev/IdentifierType.txt b/unicodetools/data/security/dev/IdentifierType.txt index eaea24b69..2640a29fc 100644 --- a/unicodetools/data/security/dev/IdentifierType.txt +++ b/unicodetools/data/security/dev/IdentifierType.txt @@ -1,5 +1,5 @@ # IdentifierType.txt -# Date: 2024-05-03, 03:51:21 GMT +# Date: 2024-05-04, 21:31:06 GMT # © 2024 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. # For terms of use and license, see https://www.unicode.org/terms_of_use.html @@ -16,7 +16,7 @@ # # For the purpose of regular expressions, the property Identifier_Type is defined as # mapping each code point to a set of enumerated values. -# The short name of Identifier_Type is the same as the long name. +# The short name of Identifier_Type is ID_Type. # The possible values are: # Not_Character, Deprecated, Default_Ignorable, Not_NFKC, Not_XID, # Exclusion, Obsolete, Technical, Uncommon_Use, Limited_Use, Inclusion, Recommended diff --git a/unicodetools/data/security/dev/data/confusablesSummaryIdentifier.txt b/unicodetools/data/security/dev/data/confusablesSummaryIdentifier.txt index ecef0e7a1..5435b8bff 100644 --- a/unicodetools/data/security/dev/data/confusablesSummaryIdentifier.txt +++ b/unicodetools/data/security/dev/data/confusablesSummaryIdentifier.txt @@ -1,5 +1,5 @@ # confusablesSummaryIdentifier.txt -# Date: 2024-05-03, 03:26:41 GMT +# Date: 2024-05-04, 21:31:06 GMT # © 2024 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. # For terms of use and license, see https://www.unicode.org/terms_of_use.html @@ -60,7 +60,7 @@ ← (‎ Θ ‎) 0398 GREEK CAPITAL LETTER THETA # →Ѳ→→О̵→ ← (‎ Ө ‎) 04E8 CYRILLIC CAPITAL LETTER BARRED O # →Ѳ→→О̵→ -# l I 1 | ו ן ا ١ ۱ Ι І +# l I 1 | ו ן ا ١ ۱ Ι І Ӏ (‎ 1 ‎) 0031 DIGIT ONE ← (‎ l ‎) 006C LATIN SMALL LETTER L ← (‎ I ‎) 0049 LATIN CAPITAL LETTER I @@ -72,6 +72,7 @@ ← (‎ ۱ ‎) 06F1 EXTENDED ARABIC-INDIC DIGIT ONE ← (‎ Ι ‎) 0399 GREEK CAPITAL LETTER IOTA # →I→ ← (‎ І ‎) 0406 CYRILLIC CAPITAL LETTER BYELORUSSIAN-UKRAINIAN I # →I→ +← (‎ Ӏ ‎) 04C0 CYRILLIC LETTER PALOCHKA # →I→ # l' 1' וי ױ (‎ 1' ‎) 0031 0027 DIGIT ONE, APOSTROPHE @@ -1838,5 +1839,5 @@ (‎ 鹂 ‎) 9E42 CJK UNIFIED IDEOGRAPH-9E42 ← (‎ 鹃 ‎) 9E43 CJK UNIFIED IDEOGRAPH-9E43 -# total : 634 +# total : 635 diff --git a/unicodetools/data/security/dev/data/draft-restrictions.txt b/unicodetools/data/security/dev/data/draft-restrictions.txt index 635c6ffbc..acb5babdc 100644 --- a/unicodetools/data/security/dev/data/draft-restrictions.txt +++ b/unicodetools/data/security/dev/data/draft-restrictions.txt @@ -22438,14 +22438,14 @@ ABF9 ; ; Limited_Use # (꯹) MEETEI MAYEK DIGIT NINE 0DED ; ; Obsolete # (෭) SINHALA LITH DIGIT SEVEN 0DEE ; ; Obsolete # (෮) SINHALA LITH DIGIT EIGHT 0DEF ; ; Obsolete # (෯) SINHALA LITH DIGIT NINE +10A0..10C5 ; ; Obsolete # [38] (Ⴀ..Ⴥ) GEORGIAN CAPITAL LETTER AN..GEORGIAN CAPITAL LETTER HOE 10F1 ; ; Obsolete # (ჱ) GEORGIAN LETTER HE 10F2 ; ; Obsolete # (ჲ) GEORGIAN LETTER HIE 10F3 ; ; Obsolete # (ჳ) GEORGIAN LETTER WE 10F4 ; ; Obsolete # (ჴ) GEORGIAN LETTER HAR 10F5 ; ; Obsolete # (ჵ) GEORGIAN LETTER HOE 10F6 ; ; Obsolete # (ჶ) GEORGIAN LETTER FI -1100..115E ; ; Obsolete # [95] (ᄀ..ᅞ) HANGUL CHOSEONG KIYEOK..HANGUL CHOSEONG TIKEUT-RIEUL -1161..11FF ; ; Obsolete # [159] (ᅡ..ᇿ) HANGUL JUNGSEONG A..HANGUL JONGSEONG SSANGNIEUN +1100..11FF ; ; Obsolete # [256] (ᄀ..ᇿ) HANGUL CHOSEONG KIYEOK..HANGUL JONGSEONG SSANGNIEUN 1369..1371 ; ; Obsolete # [9] (፩..፱) ETHIOPIC DIGIT ONE..ETHIOPIC DIGIT NINE 1681..169A ; ; Obsolete # [26] (ᚁ..ᚚ) OGHAM LETTER BEITH..OGHAM LETTER PEITH 16A0..16EA ; ; Obsolete # [75] (ᚠ..ᛪ) RUNIC LETTER FEHU FEOH FE F..RUNIC LETTER X @@ -22537,10 +22537,12 @@ ABF9 ; ; Limited_Use # (꯹) MEETEI MAYEK DIGIT NINE 1DE4 ; ; Obsolete # (ᷤ) COMBINING LATIN SMALL LETTER S 1DE5 ; ; Obsolete # (ᷥ) COMBINING LATIN SMALL LETTER LONG S 1DE6 ; ; Obsolete # (ᷦ) COMBINING LATIN SMALL LETTER Z +2132 ; ; Obsolete # (Ⅎ) TURNED CAPITAL F 214E ; ; Obsolete # (ⅎ) TURNED SMALL F 2180 ; ; Obsolete # (ↀ) ROMAN NUMERAL ONE THOUSAND C D 2181 ; ; Obsolete # (ↁ) ROMAN NUMERAL FIVE THOUSAND 2182 ; ; Obsolete # (ↂ) ROMAN NUMERAL TEN THOUSAND +2183 ; ; Obsolete # (Ↄ) ROMAN NUMERAL REVERSED ONE HUNDRED 2184 ; ; Obsolete # (ↄ) LATIN SMALL LETTER REVERSED C 2185 ; ; Obsolete # (ↅ) ROMAN NUMERAL SIX LATE FORM 2186 ; ; Obsolete # (ↆ) ROMAN NUMERAL FIFTY EARLY FORM @@ -23348,7 +23350,7 @@ D7FB ; ; Obsolete # (ퟻ) HANGUL JONGSEONG PHIEUPH-THIEUTH 1D243 ; ; Obsolete # (𝉃) COMBINING GREEK MUSICAL TETRASEME 1D244 ; ; Obsolete # (𝉄) COMBINING GREEK MUSICAL PENTASEME -# Total code points: 1667 +# Total code points: 1709 0180 ; ; Technical # (ƀ) LATIN SMALL LETTER B WITH STROKE 01C0 ; ; Technical # (ǀ) LATIN LETTER DENTAL CLICK @@ -24652,7 +24654,7 @@ AB63 ; ; Uncommon_Use # (ꭣ) LATIN SMALL LETTER UO 04BD ; Allowed ; Recommended # (ҽ) CYRILLIC SMALL LETTER ABKHASIAN CHE 04BE ; Allowed ; Recommended # (Ҿ) CYRILLIC CAPITAL LETTER ABKHASIAN CHE WITH DESCENDER 04BF ; Allowed ; Recommended # (ҿ) CYRILLIC SMALL LETTER ABKHASIAN CHE WITH DESCENDER -04C1 ; Allowed ; Recommended # (Ӂ) CYRILLIC CAPITAL LETTER ZHE WITH BREVE +04C0..04C1 ; Allowed ; Recommended # [2] (Ӏ..Ӂ) CYRILLIC LETTER PALOCHKA..CYRILLIC CAPITAL LETTER ZHE WITH BREVE 04C2 ; Allowed ; Recommended # (ӂ) CYRILLIC SMALL LETTER ZHE WITH BREVE 04C3 ; Allowed ; Recommended # (Ӄ) CYRILLIC CAPITAL LETTER KA WITH HOOK 04C4 ; Allowed ; Recommended # (ӄ) CYRILLIC SMALL LETTER KA WITH HOOK @@ -26517,6 +26519,7 @@ AB63 ; ; Uncommon_Use # (ꭣ) LATIN SMALL LETTER UO 17B1 ; Allowed ; Recommended # (ឱ) KHMER INDEPENDENT VOWEL QOO TYPE ONE 17B2 ; Allowed ; Recommended # (ឲ) KHMER INDEPENDENT VOWEL QOO TYPE TWO 17B3 ; Allowed ; Recommended # (ឳ) KHMER INDEPENDENT VOWEL QAU +17B4..17B5 ; Allowed ; Recommended # [2] (U+17B4..U+17B5) KHMER VOWEL INHERENT AQ..KHMER VOWEL INHERENT AA 17B6 ; Allowed ; Recommended # (ា) KHMER VOWEL SIGN AA 17B7 ; Allowed ; Recommended # (ិ) KHMER VOWEL SIGN I 17B8 ; Allowed ; Recommended # (ី) KHMER VOWEL SIGN II @@ -54814,17 +54817,11 @@ FA29 ; Allowed ; Recommended # (﨩) CJK COMPATIBILITY IDEOGRAPH- 323AF ; Allowed ; Recommended # (𲎯) CJK UNIFIED IDEOGRAPH-323AF E0100..E01EF ; Allowed ; Recommended # [240] (U+E0100..U+E01EF) VARIATION SELECTOR-17..VARIATION SELECTOR-256 -# Total code points: 112998 +# Total code points: 113001 005F ; ~IDNA # (_) LOW LINE -04C0 ; ~IDNA # (Ӏ) CYRILLIC LETTER PALOCHKA -10A0..10C5 ; ~IDNA # [38] (Ⴀ..Ⴥ) GEORGIAN CAPITAL LETTER AN..GEORGIAN CAPITAL LETTER HOE -115F..1160 ; ~IDNA # [2] (U+115F..U+1160) HANGUL CHOSEONG FILLER..HANGUL JUNGSEONG FILLER -17B4..17B5 ; ~IDNA # [2] (U+17B4..U+17B5) KHMER VOWEL INHERENT AQ..KHMER VOWEL INHERENT AA -2132 ; ~IDNA # (Ⅎ) TURNED CAPITAL F -2183 ; ~IDNA # (Ↄ) ROMAN NUMERAL REVERSED ONE HUNDRED -# Total code points: 46 +# Total code points: 1 0000..002F ; ~Unicode Identifier # [48] (U+0000../) ..SOLIDUS 003A..0040 ; ~Unicode Identifier # [7] (:..@) COLON..COMMERCIAL AT diff --git a/unicodetools/data/security/dev/data/review.txt b/unicodetools/data/security/dev/data/review.txt index 1ef760219..a9722908f 100644 --- a/unicodetools/data/security/dev/data/review.txt +++ b/unicodetools/data/security/dev/data/review.txt @@ -1,5 +1,5 @@ # review.txt -# Date: 2024-05-03, 03:51:22 GMT +# Date: 2024-05-04, 21:31:07 GMT # © 2024 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. # For terms of use and license, see https://www.unicode.org/terms_of_use.html @@ -1095,6 +1095,7 @@ 04BD ; output # (ҽ) CYRILLIC SMALL LETTER ABKHASIAN CHE 04BE ; input # (Ҿ) CYRILLIC CAPITAL LETTER ABKHASIAN CHE WITH DESCENDER 04BF ; output # (ҿ) CYRILLIC SMALL LETTER ABKHASIAN CHE WITH DESCENDER +04C0 ; input # (Ӏ) CYRILLIC LETTER PALOCHKA 04C1 ; input # (Ӂ) CYRILLIC CAPITAL LETTER ZHE WITH BREVE 04C2 ; output # (ӂ) CYRILLIC SMALL LETTER ZHE WITH BREVE 04C3 ; input # (Ӄ) CYRILLIC CAPITAL LETTER KA WITH HOOK @@ -3522,6 +3523,44 @@ 109D ; output-nonstarting # (ႝ) MYANMAR VOWEL SIGN AITON AI 109E ; Restricted ; Not_XID # (႞) MYANMAR SYMBOL SHAN ONE 109F ; Restricted ; Not_XID # (႟) MYANMAR SYMBOL SHAN EXCLAMATION +10A0 ; Restricted ; Obsolete # (Ⴀ) GEORGIAN CAPITAL LETTER AN +10A1 ; Restricted ; Obsolete # (Ⴁ) GEORGIAN CAPITAL LETTER BAN +10A2 ; Restricted ; Obsolete # (Ⴂ) GEORGIAN CAPITAL LETTER GAN +10A3 ; Restricted ; Obsolete # (Ⴃ) GEORGIAN CAPITAL LETTER DON +10A4 ; Restricted ; Obsolete # (Ⴄ) GEORGIAN CAPITAL LETTER EN +10A5 ; Restricted ; Obsolete # (Ⴅ) GEORGIAN CAPITAL LETTER VIN +10A6 ; Restricted ; Obsolete # (Ⴆ) GEORGIAN CAPITAL LETTER ZEN +10A7 ; Restricted ; Obsolete # (Ⴇ) GEORGIAN CAPITAL LETTER TAN +10A8 ; Restricted ; Obsolete # (Ⴈ) GEORGIAN CAPITAL LETTER IN +10A9 ; Restricted ; Obsolete # (Ⴉ) GEORGIAN CAPITAL LETTER KAN +10AA ; Restricted ; Obsolete # (Ⴊ) GEORGIAN CAPITAL LETTER LAS +10AB ; Restricted ; Obsolete # (Ⴋ) GEORGIAN CAPITAL LETTER MAN +10AC ; Restricted ; Obsolete # (Ⴌ) GEORGIAN CAPITAL LETTER NAR +10AD ; Restricted ; Obsolete # (Ⴍ) GEORGIAN CAPITAL LETTER ON +10AE ; Restricted ; Obsolete # (Ⴎ) GEORGIAN CAPITAL LETTER PAR +10AF ; Restricted ; Obsolete # (Ⴏ) GEORGIAN CAPITAL LETTER ZHAR +10B0 ; Restricted ; Obsolete # (Ⴐ) GEORGIAN CAPITAL LETTER RAE +10B1 ; Restricted ; Obsolete # (Ⴑ) GEORGIAN CAPITAL LETTER SAN +10B2 ; Restricted ; Obsolete # (Ⴒ) GEORGIAN CAPITAL LETTER TAR +10B3 ; Restricted ; Obsolete # (Ⴓ) GEORGIAN CAPITAL LETTER UN +10B4 ; Restricted ; Obsolete # (Ⴔ) GEORGIAN CAPITAL LETTER PHAR +10B5 ; Restricted ; Obsolete # (Ⴕ) GEORGIAN CAPITAL LETTER KHAR +10B6 ; Restricted ; Obsolete # (Ⴖ) GEORGIAN CAPITAL LETTER GHAN +10B7 ; Restricted ; Obsolete # (Ⴗ) GEORGIAN CAPITAL LETTER QAR +10B8 ; Restricted ; Obsolete # (Ⴘ) GEORGIAN CAPITAL LETTER SHIN +10B9 ; Restricted ; Obsolete # (Ⴙ) GEORGIAN CAPITAL LETTER CHIN +10BA ; Restricted ; Obsolete # (Ⴚ) GEORGIAN CAPITAL LETTER CAN +10BB ; Restricted ; Obsolete # (Ⴛ) GEORGIAN CAPITAL LETTER JIL +10BC ; Restricted ; Obsolete # (Ⴜ) GEORGIAN CAPITAL LETTER CIL +10BD ; Restricted ; Obsolete # (Ⴝ) GEORGIAN CAPITAL LETTER CHAR +10BE ; Restricted ; Obsolete # (Ⴞ) GEORGIAN CAPITAL LETTER XAN +10BF ; Restricted ; Obsolete # (Ⴟ) GEORGIAN CAPITAL LETTER JHAN +10C0 ; Restricted ; Obsolete # (Ⴠ) GEORGIAN CAPITAL LETTER HAE +10C1 ; Restricted ; Obsolete # (Ⴡ) GEORGIAN CAPITAL LETTER HE +10C2 ; Restricted ; Obsolete # (Ⴢ) GEORGIAN CAPITAL LETTER HIE +10C3 ; Restricted ; Obsolete # (Ⴣ) GEORGIAN CAPITAL LETTER WE +10C4 ; Restricted ; Obsolete # (Ⴤ) GEORGIAN CAPITAL LETTER HAR +10C5 ; Restricted ; Obsolete # (Ⴥ) GEORGIAN CAPITAL LETTER HOE 10C7 ; input # (Ⴧ) GEORGIAN CAPITAL LETTER YN 10CD ; input # (Ⴭ) GEORGIAN CAPITAL LETTER AEN 10D0 ; output # (ა) GEORGIAN LETTER AN @@ -3572,8 +3611,7 @@ 10FD ; output # (ჽ) GEORGIAN LETTER AEN 10FE ; output # (ჾ) GEORGIAN LETTER HARD SIGN 10FF ; output # (ჿ) GEORGIAN LETTER LABIAL SIGN -1100..115E ; Restricted ; Obsolete # [95] (ᄀ..ᅞ) HANGUL CHOSEONG KIYEOK..HANGUL CHOSEONG TIKEUT-RIEUL -1161..11FF ; Restricted ; Obsolete # [159] (ᅡ..ᇿ) HANGUL JUNGSEONG A..HANGUL JONGSEONG SSANGNIEUN +1100..11FF ; Restricted ; Obsolete # [256] (ᄀ..ᇿ) HANGUL CHOSEONG KIYEOK..HANGUL JONGSEONG SSANGNIEUN 1200..1248 ; output # [73] (ሀ..ቈ) ETHIOPIC SYLLABLE HA..ETHIOPIC SYLLABLE QWA 124A..124D ; output # [4] (ቊ..ቍ) ETHIOPIC SYLLABLE QWI..ETHIOPIC SYLLABLE QWE 1250..1256 ; output # [7] (ቐ..ቖ) ETHIOPIC SYLLABLE QHA..ETHIOPIC SYLLABLE QHO @@ -3759,6 +3797,7 @@ 17B1 ; output # (ឱ) KHMER INDEPENDENT VOWEL QOO TYPE ONE 17B2 ; output # (ឲ) KHMER INDEPENDENT VOWEL QOO TYPE TWO 17B3 ; output # (ឳ) KHMER INDEPENDENT VOWEL QAU +17B4..17B5 ; Restricted ; output-disallowed # [2] (U+17B4..U+17B5) KHMER VOWEL INHERENT AQ..KHMER VOWEL INHERENT AA 17B6 ; output-nonstarting # (ា) KHMER VOWEL SIGN AA 17B7 ; output-nonstarting # (ិ) KHMER VOWEL SIGN I 17B8 ; output-nonstarting # (ី) KHMER VOWEL SIGN II @@ -3825,11 +3864,13 @@ 1803 ; Restricted ; Not_XID # (᠃) MONGOLIAN FULL STOP 1804 ; Restricted ; Not_XID # (᠄) MONGOLIAN COLON 1805 ; Restricted ; Not_XID # (᠅) MONGOLIAN FOUR DOTS +1806 ; Restricted ; Not_XID # (᠆) MONGOLIAN TODO SOFT HYPHEN 1807 ; Restricted ; Not_XID # (᠇) MONGOLIAN SIBE SYLLABLE BOUNDARY MARKER 1808 ; Restricted ; Not_XID # (᠈) MONGOLIAN MANCHU COMMA 1809 ; Restricted ; Not_XID # (᠉) MONGOLIAN MANCHU FULL STOP 180A ; Restricted ; Not_XID # (᠊) MONGOLIAN NIRUGU 180B..180D ; Restricted ; Exclusion # [3] (U+180B..U+180D) MONGOLIAN FREE VARIATION SELECTOR ONE..MONGOLIAN FREE VARIATION SELECTOR THREE +180E ; Restricted ; Not_XID # (U+180E) MONGOLIAN VOWEL SEPARATOR 180F ; Restricted ; Exclusion # (U+180F) MONGOLIAN FREE VARIATION SELECTOR FOUR 1810 ; Restricted ; Exclusion # (᠐) MONGOLIAN DIGIT ZERO 1811 ; Restricted ; Exclusion # (᠑) MONGOLIAN DIGIT ONE @@ -5651,8 +5692,8 @@ 205C ; Restricted ; Not_XID # (⁜) DOTTED CROSS 205D ; Restricted ; Not_XID # (⁝) TRICOLON 205E ; Restricted ; Not_XID # (⁞) VERTICAL FOUR DOTS -2060 ; Restricted ; Not_XID # (U+2060) WORD JOINER -2064 ; Restricted ; Not_XID # (U+2064) INVISIBLE PLUS +2060..2064 ; Restricted ; Not_XID # [5] (U+2060..U+2064) WORD JOINER..INVISIBLE PLUS +206A..206F ; Restricted ; Deprecated # [6] (U+206A..U+206F) INHIBIT SYMMETRIC SWAPPING..NOMINAL DIGIT SHAPES 2070 ; Restricted ; Not_XID # (⁰) SUPERSCRIPT ZERO 2071 ; input-lenient # (ⁱ) SUPERSCRIPT LATIN SMALL LETTER I 2074 ; Restricted ; Not_XID # (⁴) SUPERSCRIPT FOUR @@ -5799,6 +5840,7 @@ 212F ; input-lenient # (ℯ) SCRIPT SMALL E 2130 ; input-lenient # (ℰ) SCRIPT CAPITAL E 2131 ; input-lenient # (ℱ) SCRIPT CAPITAL F +2132 ; Restricted ; Obsolete # (Ⅎ) TURNED CAPITAL F 2133 ; input-lenient # (ℳ) SCRIPT CAPITAL M 2134 ; input-lenient # (ℴ) SCRIPT SMALL O 2135 ; input-lenient # (ℵ) ALEF SYMBOL @@ -5879,6 +5921,7 @@ 2180 ; Restricted ; Obsolete # (ↀ) ROMAN NUMERAL ONE THOUSAND C D 2181 ; Restricted ; Obsolete # (ↁ) ROMAN NUMERAL FIVE THOUSAND 2182 ; Restricted ; Obsolete # (ↂ) ROMAN NUMERAL TEN THOUSAND +2183 ; Restricted ; Obsolete # (Ↄ) ROMAN NUMERAL REVERSED ONE HUNDRED 2184 ; Restricted ; Obsolete # (ↄ) LATIN SMALL LETTER REVERSED C 2185 ; Restricted ; Obsolete # (ↅ) ROMAN NUMERAL SIX LATE FORM 2186 ; Restricted ; Obsolete # (ↆ) ROMAN NUMERAL FIFTY EARLY FORM @@ -9298,7 +9341,7 @@ 3161 ; Restricted ; Obsolete # (ㅡ) HANGUL LETTER EU 3162 ; Restricted ; Obsolete # (ㅢ) HANGUL LETTER YI 3163 ; Restricted ; Obsolete # (ㅣ) HANGUL LETTER I -3165..318E ; Restricted ; Obsolete # [42] (ㅥ..ㆎ) HANGUL LETTER SSANGNIEUN..HANGUL LETTER ARAEAE +3164..318E ; Restricted ; Obsolete # [43] (U+3164..ㆎ) HANGUL FILLER..HANGUL LETTER ARAEAE 3190 ; Restricted ; Not_XID # (㆐) IDEOGRAPHIC ANNOTATION LINKING MARK 3191 ; Restricted ; Not_XID # (㆑) IDEOGRAPHIC ANNOTATION REVERSE MARK 3192 ; Restricted ; Not_XID # (㆒) IDEOGRAPHIC ANNOTATION ONE MARK @@ -11868,6 +11911,7 @@ FF9C ; input-lenient # (ワ) HALFWIDTH KATAKANA FF9D ; input-lenient # (ン) HALFWIDTH KATAKANA LETTER N FF9E ; input-lenient # (゙) HALFWIDTH KATAKANA VOICED SOUND MARK FF9F ; input-lenient # (゚) HALFWIDTH KATAKANA SEMI-VOICED SOUND MARK +FFA0 ; Restricted ; Obsolete # (U+FFA0) HALFWIDTH HANGUL FILLER FFA1 ; Restricted ; Obsolete # (ᄀ) HALFWIDTH HANGUL LETTER KIYEOK FFA2 ; Restricted ; Obsolete # (ᄁ) HALFWIDTH HANGUL LETTER SSANGKIYEOK FFA3 ; Restricted ; Obsolete # (ᆪ) HALFWIDTH HANGUL LETTER KIYEOK-SIOS @@ -33718,6 +33762,7 @@ FFEE ; Restricted ; Not_XID # (○) HALFWIDTH WHITE CIR 1D165..1D169 ; Restricted ; Technical # [5] (𝅥..𝅩) MUSICAL SYMBOL COMBINING STEM..MUSICAL SYMBOL COMBINING TREMOLO-3 1D16A..1D16C ; Restricted ; Not_XID # [3] (𝅪..𝅬) MUSICAL SYMBOL FINGERED TREMOLO-1..MUSICAL SYMBOL FINGERED TREMOLO-3 1D16D..1D172 ; Restricted ; Technical # [6] (𝅭..𝅲) MUSICAL SYMBOL COMBINING AUGMENTATION DOT..MUSICAL SYMBOL COMBINING FLAG-5 +1D173..1D17A ; Restricted ; Not_XID # [8] (U+1D173..U+1D17A) MUSICAL SYMBOL BEGIN BEAM..MUSICAL SYMBOL END PHRASE 1D17B..1D182 ; Restricted ; Technical # [8] (𝅻..𝆂) MUSICAL SYMBOL COMBINING ACCENT..MUSICAL SYMBOL COMBINING LOURE 1D183..1D184 ; Restricted ; Not_XID # [2] (𝆃..𝆄) MUSICAL SYMBOL ARPEGGIATO UP..MUSICAL SYMBOL ARPEGGIATO DOWN 1D185..1D18B ; Restricted ; Technical # [7] (𝆅..𝆋) MUSICAL SYMBOL COMBINING DOIT..MUSICAL SYMBOL COMBINING TRIPLE TONGUE @@ -56435,6 +56480,7 @@ FFEE ; Restricted ; Not_XID # (○) HALFWIDTH WHITE CIR 2F865 ; input-lenient # (姘) CJK COMPATIBILITY IDEOGRAPH-2F865 2F866 ; input-lenient # (婦) CJK COMPATIBILITY IDEOGRAPH-2F866 2F867 ; input-lenient # (㛮) CJK COMPATIBILITY IDEOGRAPH-2F867 +2F868 ; input-lenient # (㛼) CJK COMPATIBILITY IDEOGRAPH-2F868 2F869 ; input-lenient # (嬈) CJK COMPATIBILITY IDEOGRAPH-2F869 2F86A ; input-lenient # (嬾) CJK COMPATIBILITY IDEOGRAPH-2F86A 2F86B ; input-lenient # (嬾) CJK COMPATIBILITY IDEOGRAPH-2F86B @@ -56446,6 +56492,7 @@ FFEE ; Restricted ; Not_XID # (○) HALFWIDTH WHITE CIR 2F871 ; input-lenient # (𡬘) CJK COMPATIBILITY IDEOGRAPH-2F871 2F872 ; input-lenient # (寿) CJK COMPATIBILITY IDEOGRAPH-2F872 2F873 ; input-lenient # (将) CJK COMPATIBILITY IDEOGRAPH-2F873 +2F874 ; input-lenient # (当) CJK COMPATIBILITY IDEOGRAPH-2F874 2F875 ; input-lenient # (尢) CJK COMPATIBILITY IDEOGRAPH-2F875 2F876 ; input-lenient # (㞁) CJK COMPATIBILITY IDEOGRAPH-2F876 2F877 ; input-lenient # (屠) CJK COMPATIBILITY IDEOGRAPH-2F877 @@ -56616,6 +56663,7 @@ FFEE ; Restricted ; Not_XID # (○) HALFWIDTH WHITE CIR 2F91C ; input-lenient # (煅) CJK COMPATIBILITY IDEOGRAPH-2F91C 2F91D ; input-lenient # (𤉣) CJK COMPATIBILITY IDEOGRAPH-2F91D 2F91E ; input-lenient # (熜) CJK COMPATIBILITY IDEOGRAPH-2F91E +2F91F ; input-lenient # (𤎫) CJK COMPATIBILITY IDEOGRAPH-2F91F 2F920 ; input-lenient # (爨) CJK COMPATIBILITY IDEOGRAPH-2F920 2F921 ; input-lenient # (爵) CJK COMPATIBILITY IDEOGRAPH-2F921 2F922 ; input-lenient # (牐) CJK COMPATIBILITY IDEOGRAPH-2F922 @@ -56679,6 +56727,7 @@ FFEE ; Restricted ; Not_XID # (○) HALFWIDTH WHITE CIR 2F95C ; input-lenient # (𥥼) CJK COMPATIBILITY IDEOGRAPH-2F95C 2F95D ; input-lenient # (𥪧) CJK COMPATIBILITY IDEOGRAPH-2F95D 2F95E ; input-lenient # (𥪧) CJK COMPATIBILITY IDEOGRAPH-2F95E +2F95F ; input-lenient # (竮) CJK COMPATIBILITY IDEOGRAPH-2F95F 2F960 ; input-lenient # (䈂) CJK COMPATIBILITY IDEOGRAPH-2F960 2F961 ; input-lenient # (𥮫) CJK COMPATIBILITY IDEOGRAPH-2F961 2F962 ; input-lenient # (篆) CJK COMPATIBILITY IDEOGRAPH-2F962 @@ -56774,6 +56823,7 @@ FFEE ; Restricted ; Not_XID # (○) HALFWIDTH WHITE CIR 2F9BC ; input-lenient # (蜨) CJK COMPATIBILITY IDEOGRAPH-2F9BC 2F9BD ; input-lenient # (蝫) CJK COMPATIBILITY IDEOGRAPH-2F9BD 2F9BE ; input-lenient # (螆) CJK COMPATIBILITY IDEOGRAPH-2F9BE +2F9BF ; input-lenient # (䗗) CJK COMPATIBILITY IDEOGRAPH-2F9BF 2F9C0 ; input-lenient # (蟡) CJK COMPATIBILITY IDEOGRAPH-2F9C0 2F9C1 ; input-lenient # (蠁) CJK COMPATIBILITY IDEOGRAPH-2F9C1 2F9C2 ; input-lenient # (䗹) CJK COMPATIBILITY IDEOGRAPH-2F9C2 @@ -66001,7 +66051,7 @@ FFEE ; Restricted ; Not_XID # (○) HALFWIDTH WHITE CIR 323AF ; output # (𲎯) CJK UNIFIED IDEOGRAPH-323AF E0100..E01EF ; Restricted ; output-disallowed # [240] (U+E0100..U+E01EF) VARIATION SELECTOR-17..VARIATION SELECTOR-256 -# Total code points: 154398 +# Total code points: 154469 # Characters disallowed in IDNA # The IDNA spec doesn't allow any of these characters, @@ -66119,7 +66169,6 @@ E0100..E01EF ; Restricted ; output-disallowed # [240] (U+E0100..U+E01EF) VARIA 037E ; Restricted ; not in XID+ # (;) GREEK QUESTION MARK 0384 ; Restricted ; not in XID+ # (΄) GREEK TONOS 0385 ; Restricted ; not in XID+ # (΅) GREEK DIALYTIKA TONOS -04C0 ; future? # (Ӏ) CYRILLIC LETTER PALOCHKA 0600 ; Restricted ; not in XID+ # (U+0600) ARABIC NUMBER SIGN 0601 ; Restricted ; not in XID+ # (U+0601) ARABIC SIGN SANAH 0602 ; Restricted ; not in XID+ # (U+0602) ARABIC FOOTNOTE MARKER @@ -66132,49 +66181,7 @@ E0100..E01EF ; Restricted ; output-disallowed # [240] (U+E0100..U+E01EF) VARIA 0890 ; Restricted ; not in XID+ # (U+0890) ARABIC POUND MARK ABOVE 0891 ; Restricted ; not in XID+ # (U+0891) ARABIC PIASTRE MARK ABOVE 08E2 ; Restricted ; not in XID+ # (U+08E2) ARABIC DISPUTED END OF AYAH -10A0 ; future? # (Ⴀ) GEORGIAN CAPITAL LETTER AN -10A1 ; future? # (Ⴁ) GEORGIAN CAPITAL LETTER BAN -10A2 ; future? # (Ⴂ) GEORGIAN CAPITAL LETTER GAN -10A3 ; future? # (Ⴃ) GEORGIAN CAPITAL LETTER DON -10A4 ; future? # (Ⴄ) GEORGIAN CAPITAL LETTER EN -10A5 ; future? # (Ⴅ) GEORGIAN CAPITAL LETTER VIN -10A6 ; future? # (Ⴆ) GEORGIAN CAPITAL LETTER ZEN -10A7 ; future? # (Ⴇ) GEORGIAN CAPITAL LETTER TAN -10A8 ; future? # (Ⴈ) GEORGIAN CAPITAL LETTER IN -10A9 ; future? # (Ⴉ) GEORGIAN CAPITAL LETTER KAN -10AA ; future? # (Ⴊ) GEORGIAN CAPITAL LETTER LAS -10AB ; future? # (Ⴋ) GEORGIAN CAPITAL LETTER MAN -10AC ; future? # (Ⴌ) GEORGIAN CAPITAL LETTER NAR -10AD ; future? # (Ⴍ) GEORGIAN CAPITAL LETTER ON -10AE ; future? # (Ⴎ) GEORGIAN CAPITAL LETTER PAR -10AF ; future? # (Ⴏ) GEORGIAN CAPITAL LETTER ZHAR -10B0 ; future? # (Ⴐ) GEORGIAN CAPITAL LETTER RAE -10B1 ; future? # (Ⴑ) GEORGIAN CAPITAL LETTER SAN -10B2 ; future? # (Ⴒ) GEORGIAN CAPITAL LETTER TAR -10B3 ; future? # (Ⴓ) GEORGIAN CAPITAL LETTER UN -10B4 ; future? # (Ⴔ) GEORGIAN CAPITAL LETTER PHAR -10B5 ; future? # (Ⴕ) GEORGIAN CAPITAL LETTER KHAR -10B6 ; future? # (Ⴖ) GEORGIAN CAPITAL LETTER GHAN -10B7 ; future? # (Ⴗ) GEORGIAN CAPITAL LETTER QAR -10B8 ; future? # (Ⴘ) GEORGIAN CAPITAL LETTER SHIN -10B9 ; future? # (Ⴙ) GEORGIAN CAPITAL LETTER CHIN -10BA ; future? # (Ⴚ) GEORGIAN CAPITAL LETTER CAN -10BB ; future? # (Ⴛ) GEORGIAN CAPITAL LETTER JIL -10BC ; future? # (Ⴜ) GEORGIAN CAPITAL LETTER CIL -10BD ; future? # (Ⴝ) GEORGIAN CAPITAL LETTER CHAR -10BE ; future? # (Ⴞ) GEORGIAN CAPITAL LETTER XAN -10BF ; future? # (Ⴟ) GEORGIAN CAPITAL LETTER JHAN -10C0 ; future? # (Ⴠ) GEORGIAN CAPITAL LETTER HAE -10C1 ; future? # (Ⴡ) GEORGIAN CAPITAL LETTER HE -10C2 ; future? # (Ⴢ) GEORGIAN CAPITAL LETTER HIE -10C3 ; future? # (Ⴣ) GEORGIAN CAPITAL LETTER WE -10C4 ; future? # (Ⴤ) GEORGIAN CAPITAL LETTER HAR -10C5 ; future? # (Ⴥ) GEORGIAN CAPITAL LETTER HOE -115F..1160 ; future? # [2] (U+115F..U+1160) HANGUL CHOSEONG FILLER..HANGUL JUNGSEONG FILLER 1680 ; Restricted ; not in XID+ # (U+1680) OGHAM SPACE MARK -17B4..17B5 ; future? # [2] (U+17B4..U+17B5) KHMER VOWEL INHERENT AQ..KHMER VOWEL INHERENT AA -1806 ; Restricted ; not in XID+ # (᠆) MONGOLIAN TODO SOFT HYPHEN -180E ; Restricted ; not in XID+ # (U+180E) MONGOLIAN VOWEL SEPARATOR 1FBD ; Restricted ; not in XID+ # (᾽) GREEK KORONIS 1FBF ; Restricted ; not in XID+ # (᾿) GREEK PSILI 1FC0 ; Restricted ; not in XID+ # (῀) GREEK PERISPOMENI @@ -66216,8 +66223,7 @@ E0100..E01EF ; Restricted ; output-disallowed # [240] (U+E0100..U+E01EF) VARIA 2048 ; Restricted ; not in XID+ # (⁈) QUESTION EXCLAMATION MARK 2049 ; Restricted ; not in XID+ # (⁉) EXCLAMATION QUESTION MARK 205F ; Restricted ; not in XID+ # (U+205F) MEDIUM MATHEMATICAL SPACE -2061..2063 ; Restricted ; not in XID+ # [3] (U+2061..U+2063) FUNCTION APPLICATION..INVISIBLE SEPARATOR -2066..206F ; Restricted ; not in XID+ # [10] (U+2066..U+206F) LEFT-TO-RIGHT ISOLATE..NOMINAL DIGIT SHAPES +2066..2069 ; Restricted ; not in XID+ # [4] (U+2066..U+2069) LEFT-TO-RIGHT ISOLATE..POP DIRECTIONAL ISOLATE 207A ; Restricted ; not in XID+ # (⁺) SUPERSCRIPT PLUS SIGN 207C ; Restricted ; not in XID+ # (⁼) SUPERSCRIPT EQUALS SIGN 207D ; Restricted ; not in XID+ # (⁽) SUPERSCRIPT LEFT PARENTHESIS @@ -66230,8 +66236,6 @@ E0100..E01EF ; Restricted ; output-disallowed # [240] (U+E0100..U+E01EF) VARIA 2101 ; Restricted ; not in XID+ # (℁) ADDRESSED TO THE SUBJECT 2105 ; Restricted ; not in XID+ # (℅) CARE OF 2106 ; Restricted ; not in XID+ # (℆) CADA UNA -2132 ; future? # (Ⅎ) TURNED CAPITAL F -2183 ; future? # (Ↄ) ROMAN NUMERAL REVERSED ONE HUNDRED 2474..24B5 ; Restricted ; not in XID+ # [66] (⑴..⒵) PARENTHESIZED DIGIT ONE..PARENTHESIZED LATIN SMALL LETTER Z 2A74 ; Restricted ; not in XID+ # (⩴) DOUBLE COLON EQUAL 2A75 ; Restricted ; not in XID+ # (⩵) TWO CONSECUTIVE EQUALS SIGNS @@ -66255,7 +66259,6 @@ E0100..E01EF ; Restricted ; output-disallowed # [240] (U+E0100..U+E01EF) VARIA 3000 ; Restricted ; not in XID+ # (U+3000) IDEOGRAPHIC SPACE 309B ; Restricted ; not in XID+ # (゛) KATAKANA-HIRAGANA VOICED SOUND MARK 309C ; Restricted ; not in XID+ # (゜) KATAKANA-HIRAGANA SEMI-VOICED SOUND MARK -3164 ; future? # (U+3164) HANGUL FILLER 31EF ; Restricted ; not in XID+ # (㇯) IDEOGRAPHIC DESCRIPTION CHARACTER SUBTRACTION 3200 ; Restricted ; not in XID+ # (㈀) PARENTHESIZED HANGUL KIYEOK 3201 ; Restricted ; not in XID+ # (㈁) PARENTHESIZED HANGUL NIEUN @@ -66383,7 +66386,6 @@ FF5B ; Restricted ; not in XID+ # ({) FULLWIDTH LEFT CURLY BRAC FF5C ; Restricted ; not in XID+ # (|) FULLWIDTH VERTICAL LINE FF5D ; Restricted ; not in XID+ # (}) FULLWIDTH RIGHT CURLY BRACKET FF5E ; Restricted ; not in XID+ # (~) FULLWIDTH TILDE -FFA0 ; future? # (U+FFA0) HALFWIDTH HANGUL FILLER FFE3 ; Restricted ; not in XID+ # ( ̄) FULLWIDTH MACRON FFF9 ; Restricted ; not in XID+ # (U+FFF9) INTERLINEAR ANNOTATION ANCHOR FFFA ; Restricted ; not in XID+ # (U+FFFA) INTERLINEAR ANNOTATION SEPARATOR @@ -66408,7 +66410,6 @@ FFFD ; Restricted ; not in XID+ # (�) REPLACEMENT CHARACTER 1343D ; Restricted ; not in XID+ # (U+1343D) EGYPTIAN HIEROGLYPH END ENCLOSURE 1343E ; Restricted ; not in XID+ # (U+1343E) EGYPTIAN HIEROGLYPH BEGIN WALLED ENCLOSURE 1343F ; Restricted ; not in XID+ # (U+1343F) EGYPTIAN HIEROGLYPH END WALLED ENCLOSURE -1D173..1D17A ; Restricted ; not in XID+ # [8] (U+1D173..U+1D17A) MUSICAL SYMBOL BEGIN BEAM..MUSICAL SYMBOL END PHRASE 1F100 ; Restricted ; not in XID+ # (🄀) DIGIT ZERO FULL STOP 1F101 ; Restricted ; not in XID+ # (🄁) DIGIT ZERO COMMA 1F102 ; Restricted ; not in XID+ # (🄂) DIGIT ONE COMMA @@ -66446,12 +66447,7 @@ FFFD ; Restricted ; not in XID+ # (�) REPLACEMENT CHARACTER 1F127 ; Restricted ; not in XID+ # (🄧) PARENTHESIZED LATIN CAPITAL LETTER X 1F128 ; Restricted ; not in XID+ # (🄨) PARENTHESIZED LATIN CAPITAL LETTER Y 1F129 ; Restricted ; not in XID+ # (🄩) PARENTHESIZED LATIN CAPITAL LETTER Z -2F868 ; future? # (㛼) CJK COMPATIBILITY IDEOGRAPH-2F868 -2F874 ; future? # (当) CJK COMPATIBILITY IDEOGRAPH-2F874 -2F91F ; future? # (𤎫) CJK COMPATIBILITY IDEOGRAPH-2F91F -2F95F ; future? # (竮) CJK COMPATIBILITY IDEOGRAPH-2F95F -2F9BF ; future? # (䗗) CJK COMPATIBILITY IDEOGRAPH-2F9BF E0001 ; Restricted ; not in XID+ # (U+E0001) LANGUAGE TAG E0020..E007F ; Restricted ; not in XID+ # [96] (U+E0020..U+E007F) TAG SPACE..CANCEL TAG -# Total code points: 665 +# Total code points: 594 diff --git a/unicodetools/src/main/java/org/unicode/props/UcdProperty.java b/unicodetools/src/main/java/org/unicode/props/UcdProperty.java index 0fa8aa761..0e18f8867 100644 --- a/unicodetools/src/main/java/org/unicode/props/UcdProperty.java +++ b/unicodetools/src/main/java/org/unicode/props/UcdProperty.java @@ -234,12 +234,12 @@ public enum UcdProperty { Grapheme_Cluster_Break( PropertyType.Enumerated, Grapheme_Cluster_Break_Values.class, null, "GCB"), Hangul_Syllable_Type(PropertyType.Enumerated, Hangul_Syllable_Type_Values.class, null, "hst"), - Identifier_Status(PropertyType.Enumerated, Identifier_Status_Values.class, null, "idstatus"), + Identifier_Status(PropertyType.Enumerated, Identifier_Status_Values.class, null, "ID_Status"), Identifier_Type( PropertyType.Enumerated, Identifier_Type_Values.class, ValueCardinality.Unordered, - "idtype"), + "ID_Type"), Idn_2008(PropertyType.Enumerated, Idn_2008_Values.class, null, "idn8"), Idn_Status(PropertyType.Enumerated, Idn_Status_Values.class, null, "idns"), Indic_Conjunct_Break(PropertyType.Enumerated, Indic_Conjunct_Break_Values.class, null, "InCB"), diff --git a/unicodetools/src/main/java/org/unicode/text/UCD/IdentifierInfo.java b/unicodetools/src/main/java/org/unicode/text/UCD/IdentifierInfo.java index 0962a80b9..ce7739a83 100644 --- a/unicodetools/src/main/java/org/unicode/text/UCD/IdentifierInfo.java +++ b/unicodetools/src/main/java/org/unicode/text/UCD/IdentifierInfo.java @@ -1082,7 +1082,7 @@ public int compare(String o1, String o2) { + "# mapping each code point to a set of enumerated values.\n" + "# The short name of " + propName - + " is the same as the long name.\n" + + " is ID_Type.\n" + "# The possible values are:\n" + "# Not_Character, Deprecated, Default_Ignorable, Not_NFKC, Not_XID,\n" + "# Exclusion, Obsolete, Technical, Uncommon_Use, Limited_Use, Inclusion, Recommended\n" @@ -1153,7 +1153,7 @@ private void printIdentifierStatus() throws IOException { + "# an enumerated property of code points.\n" + "# The short name of " + propName - + " is the same as the long name.\n" + + " is ID_Status.\n" + "# The possible values are:\n" + "# Allowed, Restricted\n" + "# The short name of each value is the same as its long name.\n\n" diff --git a/unicodetools/src/main/resources/org/unicode/props/ExtraPropertyAliases.txt b/unicodetools/src/main/resources/org/unicode/props/ExtraPropertyAliases.txt index e7608094e..db657d34b 100644 --- a/unicodetools/src/main/resources/org/unicode/props/ExtraPropertyAliases.txt +++ b/unicodetools/src/main/resources/org/unicode/props/ExtraPropertyAliases.txt @@ -21,8 +21,8 @@ REZS ; RGI_Emoji_Zwj_Sequence ; Emoji_Zwj_Sequence # Enumerated Properties # ================================================ -idstatus ; Identifier_Status -idtype ; Identifier_Type +ID_Status ; Identifier_Status +ID_Type ; Identifier_Type idns ; Idn_Status idn8 ; Idn_2008 @@ -161,4 +161,4 @@ cjkSMSZD2003Readings ; kSMSZD2003Readings cjkVietnameseNumeric ; kVietnameseNumeric cjkZhuangNumeric ; kZhuangNumeric # 16.0 -cjkFanqie ; kFanqie \ No newline at end of file +cjkFanqie ; kFanqie diff --git a/unicodetools/src/main/resources/org/unicode/props/ExtraPropertyValueAliases.txt b/unicodetools/src/main/resources/org/unicode/props/ExtraPropertyValueAliases.txt index d4a0cdde1..465c613c6 100644 --- a/unicodetools/src/main/resources/org/unicode/props/ExtraPropertyValueAliases.txt +++ b/unicodetools/src/main/resources/org/unicode/props/ExtraPropertyValueAliases.txt @@ -126,26 +126,26 @@ idn8 ; na ; na # @missing: 0000..10FFFF; Identifier_Status ; r -idstatus ; r ; Restricted -idstatus ; a ; Allowed +ID_Status ; r ; Restricted +ID_Status ; a ; Allowed # @missing: 0000..10FFFF; Identifier_Type ; nc # @missing: 0000..10FFFF; Identifier_Type ; rec ; v9.0 -idtype ; nc ; Not_Character ; not_chars -idtype ; d ; Deprecated -idtype ; di ; Default_Ignorable -idtype ; nn ; Not_NFKC -idtype ; nx ; Not_XID -idtype ; o ; Obsolete -idtype ; ex ; Exclusion -idtype ; t ; Technical -idtype ; uu ; Uncommon_Use -# idtype ; h ; Historic -idtype ; lu ; Limited_Use -idtype ; a ; Aspirational -idtype ; inc ; Inclusion -idtype ; rec ; Recommended +ID_Type ; nc ; Not_Character ; not_chars +ID_Type ; d ; Deprecated +ID_Type ; di ; Default_Ignorable +ID_Type ; nn ; Not_NFKC +ID_Type ; nx ; Not_XID +ID_Type ; o ; Obsolete +ID_Type ; ex ; Exclusion +ID_Type ; t ; Technical +ID_Type ; uu ; Uncommon_Use +# ID_Type ; h ; Historic +ID_Type ; lu ; Limited_Use +ID_Type ; a ; Aspirational +ID_Type ; inc ; Inclusion +ID_Type ; rec ; Recommended # @missing: 0000..10FFFF; Confusable_SL ; # @missing: 0000..10FFFF; Confusable_SA ;