From 14e095674e44a5cb95347c7ab5e54b9c4d72fbed Mon Sep 17 00:00:00 2001 From: Robin Leroy Date: Wed, 23 Jul 2025 03:37:57 +0200 Subject: [PATCH 1/3] Revert "Revert "Chisoi (#759)"" This reverts commit f1ea28169d94b7b1bbbc520aed5e848524888a53. --- unicodetools/data/ucd/dev/Blocks.txt | 1 + unicodetools/data/ucd/dev/DerivedAge.txt | 6 ++- .../data/ucd/dev/DerivedCoreProperties.txt | 49 ++++++++++++++----- unicodetools/data/ucd/dev/EastAsianWidth.txt | 7 ++- .../data/ucd/dev/IndicPositionalCategory.txt | 4 +- .../data/ucd/dev/IndicSyllabicCategory.txt | 18 ++++++- unicodetools/data/ucd/dev/LineBreak.txt | 7 ++- .../data/ucd/dev/NormalizationTest.txt | 4 +- unicodetools/data/ucd/dev/PropList.txt | 8 +-- .../data/ucd/dev/PropertyValueAliases.txt | 4 +- .../data/ucd/dev/ScriptExtensions.txt | 6 +-- unicodetools/data/ucd/dev/Scripts.txt | 12 ++++- unicodetools/data/ucd/dev/UnicodeData.txt | 40 +++++++++++++++ .../data/ucd/dev/VerticalOrientation.txt | 7 ++- .../dev/auxiliary/GraphemeBreakProperty.txt | 6 ++- .../dev/auxiliary/SentenceBreakProperty.txt | 13 +++-- .../ucd/dev/auxiliary/WordBreakProperty.txt | 13 +++-- .../ucd/dev/extracted/DerivedBidiClass.txt | 13 +++-- .../dev/extracted/DerivedCombiningClass.txt | 13 +++-- .../dev/extracted/DerivedEastAsianWidth.txt | 9 +++- .../dev/extracted/DerivedGeneralCategory.txt | 19 ++++--- .../ucd/dev/extracted/DerivedJoiningType.txt | 6 ++- .../ucd/dev/extracted/DerivedLineBreak.txt | 17 ++++--- .../data/ucd/dev/extracted/DerivedName.txt | 44 ++++++++++++++++- .../ucd/dev/extracted/DerivedNumericType.txt | 5 +- .../dev/extracted/DerivedNumericValues.txt | 32 +++++++----- .../org/unicode/props/UcdPropertyValues.java | 2 + .../org/unicode/text/UCD/ShortBlockNames.txt | 1 + 28 files changed, 290 insertions(+), 76 deletions(-) diff --git a/unicodetools/data/ucd/dev/Blocks.txt b/unicodetools/data/ucd/dev/Blocks.txt index c80741649..a6e3dac65 100644 --- a/unicodetools/data/ucd/dev/Blocks.txt +++ b/unicodetools/data/ucd/dev/Blocks.txt @@ -306,6 +306,7 @@ FFF0..FFFF; Specials 16AD0..16AFF; Bassa Vah 16B00..16B8F; Pahawh Hmong 16D40..16D7F; Kirat Rai +16D80..16DAF; Chisoi 16E40..16E9F; Medefaidrin 16EA0..16EDF; Beria Erfe 16F00..16F9F; Miao diff --git a/unicodetools/data/ucd/dev/DerivedAge.txt b/unicodetools/data/ucd/dev/DerivedAge.txt index 0b3b9dd1c..902f028ff 100644 --- a/unicodetools/data/ucd/dev/DerivedAge.txt +++ b/unicodetools/data/ucd/dev/DerivedAge.txt @@ -1,5 +1,5 @@ # DerivedAge-17.0.0.txt -# Date: 2025-06-30, 06:20:00 GMT +# Date: 2025-07-23, 01:36:45 GMT # © 2025 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. # For terms of use and license, see https://www.unicode.org/terms_of_use.html @@ -2086,6 +2086,8 @@ FDC8..FDCE ; 17.0 # [7] ARABIC LIGATURE RAHIMAHU ALLAAH TAAALAA..ARABIC LIG 11B60..11B67 ; 17.0 # [8] SHARADA VOWEL SIGN OE..SHARADA VOWEL SIGN CANDRA O 11DB0..11DDB ; 17.0 # [44] TOLONG SIKI LETTER I..TOLONG SIKI UNGGA 11DE0..11DE9 ; 17.0 # [10] TOLONG SIKI DIGIT ZERO..TOLONG SIKI DIGIT NINE +16D80..16D9D ; 17.0 # [30] CHISOI LETTER A..CHISOI SIGN SISO +16DA0..16DA9 ; 17.0 # [10] CHISOI DIGIT ZERO..CHISOI DIGIT NINE 16EA0..16EB8 ; 17.0 # [25] BERIA ERFE CAPITAL LETTER ARKAB..BERIA ERFE CAPITAL LETTER AY 16EBB..16ED3 ; 17.0 # [25] BERIA ERFE SMALL LETTER ARKAB..BERIA ERFE SMALL LETTER AY 16FF2..16FF6 ; 17.0 # [5] CHINESE SMALL SIMPLIFIED ER..YANGQIN SIGN SLOW TWO BEATS @@ -2114,6 +2116,6 @@ FDC8..FDCE ; 17.0 # [7] ARABIC LIGATURE RAHIMAHU ALLAAH TAAALAA..ARABIC LIG 2CEA2..2CEAD ; 17.0 # [12] CJK UNIFIED IDEOGRAPH-2CEA2..CJK UNIFIED IDEOGRAPH-2CEAD 323B0..33479 ; 17.0 # [4298] CJK UNIFIED IDEOGRAPH-323B0..CJK UNIFIED IDEOGRAPH-33479 -# Total code points: 4804 +# Total code points: 4844 # EOF diff --git a/unicodetools/data/ucd/dev/DerivedCoreProperties.txt b/unicodetools/data/ucd/dev/DerivedCoreProperties.txt index 208ae0049..e5f64c876 100644 --- a/unicodetools/data/ucd/dev/DerivedCoreProperties.txt +++ b/unicodetools/data/ucd/dev/DerivedCoreProperties.txt @@ -1,5 +1,5 @@ # DerivedCoreProperties-17.0.0.txt -# Date: 2025-06-30, 06:20:18 GMT +# Date: 2025-07-23, 01:37:03 GMT # © 2025 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. # For terms of use and license, see https://www.unicode.org/terms_of_use.html @@ -1321,6 +1321,9 @@ FFDA..FFDC ; Alphabetic # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANG 16D40..16D42 ; Alphabetic # Lm [3] KIRAT RAI SIGN ANUSVARA..KIRAT RAI SIGN VISARGA 16D43..16D6A ; Alphabetic # Lo [40] KIRAT RAI LETTER A..KIRAT RAI VOWEL SIGN AU 16D6B..16D6C ; Alphabetic # Lm [2] KIRAT RAI SIGN VIRAMA..KIRAT RAI SIGN SAAT +16D80..16D97 ; Alphabetic # Lo [24] CHISOI LETTER A..CHISOI LETTER PA +16D98 ; Alphabetic # Mn CHISOI SIGN ANUSVARA +16D99..16D9C ; Alphabetic # Lo [4] CHISOI LETTER YA..CHISOI LETTER JARAHA 16E40..16E7F ; Alphabetic # L& [64] MEDEFAIDRIN CAPITAL LETTER M..MEDEFAIDRIN SMALL LETTER Y 16EA0..16EB8 ; Alphabetic # L& [25] BERIA ERFE CAPITAL LETTER ARKAB..BERIA ERFE CAPITAL LETTER AY 16EBB..16ED3 ; Alphabetic # L& [25] BERIA ERFE SMALL LETTER ARKAB..BERIA ERFE SMALL LETTER AY @@ -1466,7 +1469,7 @@ FFDA..FFDC ; Alphabetic # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANG 30000..3134A ; Alphabetic # Lo [4939] CJK UNIFIED IDEOGRAPH-30000..CJK UNIFIED IDEOGRAPH-3134A 31350..33479 ; Alphabetic # Lo [8490] CJK UNIFIED IDEOGRAPH-31350..CJK UNIFIED IDEOGRAPH-33479 -# Total code points: 147421 +# Total code points: 147450 # ================================================ @@ -3494,6 +3497,8 @@ FFF9..FFFB ; Case_Ignorable # Cf [3] INTERLINEAR ANNOTATION ANCHOR..INTERLI 16B40..16B43 ; Case_Ignorable # Lm [4] PAHAWH HMONG SIGN VOS SEEV..PAHAWH HMONG SIGN IB YAM 16D40..16D42 ; Case_Ignorable # Lm [3] KIRAT RAI SIGN ANUSVARA..KIRAT RAI SIGN VISARGA 16D6B..16D6C ; Case_Ignorable # Lm [2] KIRAT RAI SIGN VIRAMA..KIRAT RAI SIGN SAAT +16D98 ; Case_Ignorable # Mn CHISOI SIGN ANUSVARA +16D9D ; Case_Ignorable # Mn CHISOI SIGN SISO 16F4F ; Case_Ignorable # Mn MIAO SIGN CONSONANT MODIFIER BAR 16F8F..16F92 ; Case_Ignorable # Mn [4] MIAO TONE RIGHT..MIAO TONE BELOW 16F93..16F9F ; Case_Ignorable # Lm [13] MIAO LETTER TONE-2..MIAO LETTER REFORMED TONE-8 @@ -3547,7 +3552,7 @@ E0001 ; Case_Ignorable # Cf LANGUAGE TAG E0020..E007F ; Case_Ignorable # Cf [96] TAG SPACE..CANCEL TAG E0100..E01EF ; Case_Ignorable # Mn [240] VARIATION SELECTOR-17..VARIATION SELECTOR-256 -# Total code points: 2794 +# Total code points: 2796 # ================================================ @@ -6907,6 +6912,8 @@ FFDA..FFDC ; ID_Start # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGUL 16D40..16D42 ; ID_Start # Lm [3] KIRAT RAI SIGN ANUSVARA..KIRAT RAI SIGN VISARGA 16D43..16D6A ; ID_Start # Lo [40] KIRAT RAI LETTER A..KIRAT RAI VOWEL SIGN AU 16D6B..16D6C ; ID_Start # Lm [2] KIRAT RAI SIGN VIRAMA..KIRAT RAI SIGN SAAT +16D80..16D97 ; ID_Start # Lo [24] CHISOI LETTER A..CHISOI LETTER PA +16D99..16D9C ; ID_Start # Lo [4] CHISOI LETTER YA..CHISOI LETTER JARAHA 16E40..16E7F ; ID_Start # L& [64] MEDEFAIDRIN CAPITAL LETTER M..MEDEFAIDRIN SMALL LETTER Y 16EA0..16EB8 ; ID_Start # L& [25] BERIA ERFE CAPITAL LETTER ARKAB..BERIA ERFE CAPITAL LETTER AY 16EBB..16ED3 ; ID_Start # L& [25] BERIA ERFE SMALL LETTER ARKAB..BERIA ERFE SMALL LETTER AY @@ -7033,7 +7040,7 @@ FFDA..FFDC ; ID_Start # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGUL 30000..3134A ; ID_Start # Lo [4939] CJK UNIFIED IDEOGRAPH-30000..CJK UNIFIED IDEOGRAPH-3134A 31350..33479 ; ID_Start # Lo [8490] CJK UNIFIED IDEOGRAPH-31350..CJK UNIFIED IDEOGRAPH-33479 -# Total code points: 145916 +# Total code points: 145944 # ================================================ @@ -8293,6 +8300,11 @@ FFDA..FFDC ; ID_Continue # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HAN 16D43..16D6A ; ID_Continue # Lo [40] KIRAT RAI LETTER A..KIRAT RAI VOWEL SIGN AU 16D6B..16D6C ; ID_Continue # Lm [2] KIRAT RAI SIGN VIRAMA..KIRAT RAI SIGN SAAT 16D70..16D79 ; ID_Continue # Nd [10] KIRAT RAI DIGIT ZERO..KIRAT RAI DIGIT NINE +16D80..16D97 ; ID_Continue # Lo [24] CHISOI LETTER A..CHISOI LETTER PA +16D98 ; ID_Continue # Mn CHISOI SIGN ANUSVARA +16D99..16D9C ; ID_Continue # Lo [4] CHISOI LETTER YA..CHISOI LETTER JARAHA +16D9D ; ID_Continue # Mn CHISOI SIGN SISO +16DA0..16DA9 ; ID_Continue # Nd [10] CHISOI DIGIT ZERO..CHISOI DIGIT NINE 16E40..16E7F ; ID_Continue # L& [64] MEDEFAIDRIN CAPITAL LETTER M..MEDEFAIDRIN SMALL LETTER Y 16EA0..16EB8 ; ID_Continue # L& [25] BERIA ERFE CAPITAL LETTER ARKAB..BERIA ERFE CAPITAL LETTER AY 16EBB..16ED3 ; ID_Continue # L& [25] BERIA ERFE SMALL LETTER ARKAB..BERIA ERFE SMALL LETTER AY @@ -8466,7 +8478,7 @@ FFDA..FFDC ; ID_Continue # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HAN 31350..33479 ; ID_Continue # Lo [8490] CJK UNIFIED IDEOGRAPH-31350..CJK UNIFIED IDEOGRAPH-33479 E0100..E01EF ; ID_Continue # Mn [240] VARIATION SELECTOR-17..VARIATION SELECTOR-256 -# Total code points: 149240 +# Total code points: 149280 # ================================================ @@ -9131,6 +9143,8 @@ FFDA..FFDC ; XID_Start # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGU 16D40..16D42 ; XID_Start # Lm [3] KIRAT RAI SIGN ANUSVARA..KIRAT RAI SIGN VISARGA 16D43..16D6A ; XID_Start # Lo [40] KIRAT RAI LETTER A..KIRAT RAI VOWEL SIGN AU 16D6B..16D6C ; XID_Start # Lm [2] KIRAT RAI SIGN VIRAMA..KIRAT RAI SIGN SAAT +16D80..16D97 ; XID_Start # Lo [24] CHISOI LETTER A..CHISOI LETTER PA +16D99..16D9C ; XID_Start # Lo [4] CHISOI LETTER YA..CHISOI LETTER JARAHA 16E40..16E7F ; XID_Start # L& [64] MEDEFAIDRIN CAPITAL LETTER M..MEDEFAIDRIN SMALL LETTER Y 16EA0..16EB8 ; XID_Start # L& [25] BERIA ERFE CAPITAL LETTER ARKAB..BERIA ERFE CAPITAL LETTER AY 16EBB..16ED3 ; XID_Start # L& [25] BERIA ERFE SMALL LETTER ARKAB..BERIA ERFE SMALL LETTER AY @@ -9257,7 +9271,7 @@ FFDA..FFDC ; XID_Start # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGU 30000..3134A ; XID_Start # Lo [4939] CJK UNIFIED IDEOGRAPH-30000..CJK UNIFIED IDEOGRAPH-3134A 31350..33479 ; XID_Start # Lo [8490] CJK UNIFIED IDEOGRAPH-31350..CJK UNIFIED IDEOGRAPH-33479 -# Total code points: 145893 +# Total code points: 145921 # ================================================ @@ -10518,6 +10532,11 @@ FFDA..FFDC ; XID_Continue # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HA 16D43..16D6A ; XID_Continue # Lo [40] KIRAT RAI LETTER A..KIRAT RAI VOWEL SIGN AU 16D6B..16D6C ; XID_Continue # Lm [2] KIRAT RAI SIGN VIRAMA..KIRAT RAI SIGN SAAT 16D70..16D79 ; XID_Continue # Nd [10] KIRAT RAI DIGIT ZERO..KIRAT RAI DIGIT NINE +16D80..16D97 ; XID_Continue # Lo [24] CHISOI LETTER A..CHISOI LETTER PA +16D98 ; XID_Continue # Mn CHISOI SIGN ANUSVARA +16D99..16D9C ; XID_Continue # Lo [4] CHISOI LETTER YA..CHISOI LETTER JARAHA +16D9D ; XID_Continue # Mn CHISOI SIGN SISO +16DA0..16DA9 ; XID_Continue # Nd [10] CHISOI DIGIT ZERO..CHISOI DIGIT NINE 16E40..16E7F ; XID_Continue # L& [64] MEDEFAIDRIN CAPITAL LETTER M..MEDEFAIDRIN SMALL LETTER Y 16EA0..16EB8 ; XID_Continue # L& [25] BERIA ERFE CAPITAL LETTER ARKAB..BERIA ERFE CAPITAL LETTER AY 16EBB..16ED3 ; XID_Continue # L& [25] BERIA ERFE SMALL LETTER ARKAB..BERIA ERFE SMALL LETTER AY @@ -10691,7 +10710,7 @@ FFDA..FFDC ; XID_Continue # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HA 31350..33479 ; XID_Continue # Lo [8490] CJK UNIFIED IDEOGRAPH-31350..CJK UNIFIED IDEOGRAPH-33479 E0100..E01EF ; XID_Continue # Mn [240] VARIATION SELECTOR-17..VARIATION SELECTOR-256 -# Total code points: 149221 +# Total code points: 149261 # ================================================ @@ -11131,6 +11150,8 @@ FF9E..FF9F ; Grapheme_Extend # Lm [2] HALFWIDTH KATAKANA VOICED SOUND MARK. 1612D..1612F ; Grapheme_Extend # Mn [3] GURUNG KHEMA SIGN ANUSVARA..GURUNG KHEMA SIGN THOLHOMA 16AF0..16AF4 ; Grapheme_Extend # Mn [5] BASSA VAH COMBINING HIGH TONE..BASSA VAH COMBINING HIGH-LOW TONE 16B30..16B36 ; Grapheme_Extend # Mn [7] PAHAWH HMONG MARK CIM TUB..PAHAWH HMONG MARK CIM TAUM +16D98 ; Grapheme_Extend # Mn CHISOI SIGN ANUSVARA +16D9D ; Grapheme_Extend # Mn CHISOI SIGN SISO 16F4F ; Grapheme_Extend # Mn MIAO SIGN CONSONANT MODIFIER BAR 16F8F..16F92 ; Grapheme_Extend # Mn [4] MIAO TONE RIGHT..MIAO TONE BELOW 16FE4 ; Grapheme_Extend # Mn KHITAN SMALL SCRIPT FILLER @@ -11171,7 +11192,7 @@ FF9E..FF9F ; Grapheme_Extend # Lm [2] HALFWIDTH KATAKANA VOICED SOUND MARK. E0020..E007F ; Grapheme_Extend # Cf [96] TAG SPACE..CANCEL TAG E0100..E01EF ; Grapheme_Extend # Mn [240] VARIATION SELECTOR-17..VARIATION SELECTOR-256 -# Total code points: 2232 +# Total code points: 2234 # ================================================ @@ -12749,6 +12770,9 @@ FFFC..FFFD ; Grapheme_Base # So [2] OBJECT REPLACEMENT CHARACTER..REPLACEME 16D6B..16D6C ; Grapheme_Base # Lm [2] KIRAT RAI SIGN VIRAMA..KIRAT RAI SIGN SAAT 16D6D..16D6F ; Grapheme_Base # Po [3] KIRAT RAI SIGN YUPI..KIRAT RAI DOUBLE DANDA 16D70..16D79 ; Grapheme_Base # Nd [10] KIRAT RAI DIGIT ZERO..KIRAT RAI DIGIT NINE +16D80..16D97 ; Grapheme_Base # Lo [24] CHISOI LETTER A..CHISOI LETTER PA +16D99..16D9C ; Grapheme_Base # Lo [4] CHISOI LETTER YA..CHISOI LETTER JARAHA +16DA0..16DA9 ; Grapheme_Base # Nd [10] CHISOI DIGIT ZERO..CHISOI DIGIT NINE 16E40..16E7F ; Grapheme_Base # L& [64] MEDEFAIDRIN CAPITAL LETTER M..MEDEFAIDRIN SMALL LETTER Y 16E80..16E96 ; Grapheme_Base # No [23] MEDEFAIDRIN DIGIT ZERO..MEDEFAIDRIN DIGIT THREE ALTERNATE FORM 16E97..16E9A ; Grapheme_Base # Po [4] MEDEFAIDRIN COMMA..MEDEFAIDRIN EXCLAMATION OH @@ -12980,7 +13004,7 @@ FFFC..FFFD ; Grapheme_Base # So [2] OBJECT REPLACEMENT CHARACTER..REPLACEME 30000..3134A ; Grapheme_Base # Lo [4939] CJK UNIFIED IDEOGRAPH-30000..CJK UNIFIED IDEOGRAPH-3134A 31350..33479 ; Grapheme_Base # Lo [8490] CJK UNIFIED IDEOGRAPH-31350..CJK UNIFIED IDEOGRAPH-33479 -# Total code points: 157495 +# Total code points: 157533 # ================================================ @@ -13052,8 +13076,9 @@ ABED ; Grapheme_Link # Mn MEETEI MAYEK APUN IYEK 11F41 ; Grapheme_Link # Mc KAWI SIGN KILLER 11F42 ; Grapheme_Link # Mn KAWI CONJOINER 1612F ; Grapheme_Link # Mn GURUNG KHEMA SIGN THOLHOMA +16D9D ; Grapheme_Link # Mn CHISOI SIGN SISO -# Total code points: 69 +# Total code points: 70 # ================================================ @@ -13550,6 +13575,8 @@ FF9E..FF9F ; InCB; Extend # Lm [2] HALFWIDTH KATAKANA VOICED SOUND MARK..HA 1612D..1612F ; InCB; Extend # Mn [3] GURUNG KHEMA SIGN ANUSVARA..GURUNG KHEMA SIGN THOLHOMA 16AF0..16AF4 ; InCB; Extend # Mn [5] BASSA VAH COMBINING HIGH TONE..BASSA VAH COMBINING HIGH-LOW TONE 16B30..16B36 ; InCB; Extend # Mn [7] PAHAWH HMONG MARK CIM TUB..PAHAWH HMONG MARK CIM TAUM +16D98 ; InCB; Extend # Mn CHISOI SIGN ANUSVARA +16D9D ; InCB; Extend # Mn CHISOI SIGN SISO 16F4F ; InCB; Extend # Mn MIAO SIGN CONSONANT MODIFIER BAR 16F8F..16F92 ; InCB; Extend # Mn [4] MIAO TONE RIGHT..MIAO TONE BELOW 16FE4 ; InCB; Extend # Mn KHITAN SMALL SCRIPT FILLER @@ -13591,6 +13618,6 @@ FF9E..FF9F ; InCB; Extend # Lm [2] HALFWIDTH KATAKANA VOICED SOUND MARK..HA E0020..E007F ; InCB; Extend # Cf [96] TAG SPACE..CANCEL TAG E0100..E01EF ; InCB; Extend # Mn [240] VARIATION SELECTOR-17..VARIATION SELECTOR-256 -# Total code points: 2217 +# Total code points: 2219 # EOF diff --git a/unicodetools/data/ucd/dev/EastAsianWidth.txt b/unicodetools/data/ucd/dev/EastAsianWidth.txt index 7eb4945ff..03a4b6877 100644 --- a/unicodetools/data/ucd/dev/EastAsianWidth.txt +++ b/unicodetools/data/ucd/dev/EastAsianWidth.txt @@ -1,5 +1,5 @@ # EastAsianWidth-17.0.0.txt -# Date: 2025-06-30, 06:20:23 GMT +# Date: 2025-07-23, 01:37:08 GMT # © 2025 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. # For terms of use and license, see https://www.unicode.org/terms_of_use.html @@ -2360,6 +2360,11 @@ FFFD ; A # So REPLACEMENT CHARACTER 16D6B..16D6C ; N # Lm [2] KIRAT RAI SIGN VIRAMA..KIRAT RAI SIGN SAAT 16D6D..16D6F ; N # Po [3] KIRAT RAI SIGN YUPI..KIRAT RAI DOUBLE DANDA 16D70..16D79 ; N # Nd [10] KIRAT RAI DIGIT ZERO..KIRAT RAI DIGIT NINE +16D80..16D97 ; N # Lo [24] CHISOI LETTER A..CHISOI LETTER PA +16D98 ; N # Mn CHISOI SIGN ANUSVARA +16D99..16D9C ; N # Lo [4] CHISOI LETTER YA..CHISOI LETTER JARAHA +16D9D ; N # Mn CHISOI SIGN SISO +16DA0..16DA9 ; N # Nd [10] CHISOI DIGIT ZERO..CHISOI DIGIT NINE 16E40..16E7F ; N # L& [64] MEDEFAIDRIN CAPITAL LETTER M..MEDEFAIDRIN SMALL LETTER Y 16E80..16E96 ; N # No [23] MEDEFAIDRIN DIGIT ZERO..MEDEFAIDRIN DIGIT THREE ALTERNATE FORM 16E97..16E9A ; N # Po [4] MEDEFAIDRIN COMMA..MEDEFAIDRIN EXCLAMATION OH diff --git a/unicodetools/data/ucd/dev/IndicPositionalCategory.txt b/unicodetools/data/ucd/dev/IndicPositionalCategory.txt index c4e07594c..649afcddf 100644 --- a/unicodetools/data/ucd/dev/IndicPositionalCategory.txt +++ b/unicodetools/data/ucd/dev/IndicPositionalCategory.txt @@ -1,5 +1,5 @@ # IndicPositionalCategory-17.0.0.txt -# Date: 2025-06-30, 06:18:52 GMT +# Date: 2025-07-23, 01:37:10 GMT # © 2025 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. # For terms of use and license, see https://www.unicode.org/terms_of_use.html @@ -618,6 +618,7 @@ ABE5 ; Top # Mn MEETEI MAYEK VOWEL SIGN ANAP 11F5A ; Top # Mn KAWI SIGN NUKTA 1611E..16129 ; Top # Mn [12] GURUNG KHEMA VOWEL SIGN AA..GURUNG KHEMA VOWEL LENGTH MARK 1612D ; Top # Mn GURUNG KHEMA SIGN ANUSVARA +16D98 ; Top # Mn CHISOI SIGN ANUSVARA # Indic_Positional_Category=Bottom @@ -773,6 +774,7 @@ ABED ; Bottom # Mn MEETEI MAYEK APUN IYEK 11EF4 ; Bottom # Mn MAKASAR VOWEL SIGN U 11F38..11F3A ; Bottom # Mn [3] KAWI VOWEL SIGN U..KAWI VOWEL SIGN VOCALIC R 1612E..1612F ; Bottom # Mn [2] GURUNG KHEMA CONSONANT SIGN MEDIAL RA..GURUNG KHEMA SIGN THOLHOMA +16D9D ; Bottom # Mn CHISOI SIGN SISO # Indic_Positional_Category=Top_And_Bottom diff --git a/unicodetools/data/ucd/dev/IndicSyllabicCategory.txt b/unicodetools/data/ucd/dev/IndicSyllabicCategory.txt index 97d53c542..e39223702 100644 --- a/unicodetools/data/ucd/dev/IndicSyllabicCategory.txt +++ b/unicodetools/data/ucd/dev/IndicSyllabicCategory.txt @@ -1,5 +1,5 @@ # IndicSyllabicCategory-17.0.0.txt -# Date: 2025-06-30, 06:20:25 GMT +# Date: 2025-07-23, 01:37:10 GMT # © 2025 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. # For terms of use and license, see https://www.unicode.org/terms_of_use.html @@ -140,6 +140,7 @@ A980..A981 ; Bindu # Mn [2] JAVANESE SIGN PANYANGGA..JAVANESE SIGN CECAK 11F00..11F01 ; Bindu # Mn [2] KAWI SIGN CANDRABINDU..KAWI SIGN ANUSVARA 1612D ; Bindu # Mn GURUNG KHEMA SIGN ANUSVARA 16D40..16D41 ; Bindu # Lm [2] KIRAT RAI SIGN ANUSVARA..KIRAT RAI SIGN TONPI +16D98 ; Bindu # Mn CHISOI SIGN ANUSVARA # ================================================ @@ -338,6 +339,7 @@ ABED ; Pure_Killer # Mn MEETEI MAYEK APUN IYEK 11F41 ; Pure_Killer # Mc KAWI SIGN KILLER 1612F ; Pure_Killer # Mn GURUNG KHEMA SIGN THOLHOMA 16D6B..16D6C ; Pure_Killer # Lm [2] KIRAT RAI SIGN VIRAMA..KIRAT RAI SIGN SAAT +16D9D ; Pure_Killer # Mn CHISOI SIGN SISO # ================================================ @@ -771,6 +773,12 @@ A866 ; Vowel # Lo PHAGS-PA LETTER EE A922..A925 ; Vowel # Lo [4] KAYAH LI LETTER A..KAYAH LI LETTER OO A926..A92A ; Vowel # Mn [5] KAYAH LI VOWEL UE..KAYAH LI VOWEL O 11150..11154 ; Vowel # Lo [5] MAHAJANI LETTER A..MAHAJANI LETTER O +16D80 ; Vowel # Lo CHISOI LETTER A +16D82..16D83 ; Vowel # Lo [2] CHISOI LETTER AI..CHISOI LETTER AA +16D86 ; Vowel # Lo CHISOI LETTER E +16D89 ; Vowel # Lo CHISOI LETTER I +16D8F ; Vowel # Lo CHISOI LETTER U +16D92 ; Vowel # Lo CHISOI LETTER O # ================================================ @@ -979,6 +987,13 @@ ABD2..ABDA ; Consonant # Lo [9] MEETEI MAYEK LETTER GOK..MEETEI MAYEK LETTE 11F12..11F33 ; Consonant # Lo [34] KAWI LETTER KA..KAWI LETTER JNYA 16101..1611D ; Consonant # Lo [29] GURUNG KHEMA LETTER KA..GURUNG KHEMA LETTER SA 16D43..16D62 ; Consonant # Lo [32] KIRAT RAI LETTER A..KIRAT RAI LETTER HA +16D81 ; Consonant # Lo CHISOI LETTER BA +16D84..16D85 ; Consonant # Lo [2] CHISOI LETTER GA..CHISOI LETTER TA +16D87..16D88 ; Consonant # Lo [2] CHISOI LETTER SA..CHISOI LETTER NA +16D8A..16D8E ; Consonant # Lo [5] CHISOI LETTER KA..CHISOI LETTER RRA +16D90..16D91 ; Consonant # Lo [2] CHISOI LETTER DA..CHISOI LETTER LA +16D93..16D97 ; Consonant # Lo [5] CHISOI LETTER NYA..CHISOI LETTER PA +16D99..16D9C ; Consonant # Lo [4] CHISOI LETTER YA..CHISOI LETTER JARAHA # ================================================ @@ -1395,6 +1410,7 @@ ABF0..ABF9 ; Number # Nd [10] MEETEI MAYEK DIGIT ZERO..MEETEI MAYEK DIGIT NI 11F50..11F59 ; Number # Nd [10] KAWI DIGIT ZERO..KAWI DIGIT NINE 16130..16139 ; Number # Nd [10] GURUNG KHEMA DIGIT ZERO..GURUNG KHEMA DIGIT NINE 16D70..16D79 ; Number # Nd [10] KIRAT RAI DIGIT ZERO..KIRAT RAI DIGIT NINE +16DA0..16DA9 ; Number # Nd [10] CHISOI DIGIT ZERO..CHISOI DIGIT NINE # ================================================ diff --git a/unicodetools/data/ucd/dev/LineBreak.txt b/unicodetools/data/ucd/dev/LineBreak.txt index 2a55f1f1f..737c0c1bf 100644 --- a/unicodetools/data/ucd/dev/LineBreak.txt +++ b/unicodetools/data/ucd/dev/LineBreak.txt @@ -1,5 +1,5 @@ # LineBreak-17.0.0.txt -# Date: 2025-06-30, 06:20:25 GMT +# Date: 2025-07-23, 01:37:10 GMT # © 2025 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. # For terms of use and license, see https://www.unicode.org/terms_of_use.html @@ -3269,6 +3269,11 @@ FFFD ; AI # So REPLACEMENT CHARACTER 16D6D ; AL # Po KIRAT RAI SIGN YUPI 16D6E..16D6F ; BA # Po [2] KIRAT RAI DANDA..KIRAT RAI DOUBLE DANDA 16D70..16D79 ; NU # Nd [10] KIRAT RAI DIGIT ZERO..KIRAT RAI DIGIT NINE +16D80..16D97 ; AL # Lo [24] CHISOI LETTER A..CHISOI LETTER PA +16D98 ; CM # Mn CHISOI SIGN ANUSVARA +16D99..16D9C ; AL # Lo [4] CHISOI LETTER YA..CHISOI LETTER JARAHA +16D9D ; CM # Mn CHISOI SIGN SISO +16DA0..16DA9 ; NU # Nd [10] CHISOI DIGIT ZERO..CHISOI DIGIT NINE 16E40..16E7F ; AL # L& [64] MEDEFAIDRIN CAPITAL LETTER M..MEDEFAIDRIN SMALL LETTER Y 16E80..16E96 ; AL # No [23] MEDEFAIDRIN DIGIT ZERO..MEDEFAIDRIN DIGIT THREE ALTERNATE FORM 16E97..16E98 ; BA # Po [2] MEDEFAIDRIN COMMA..MEDEFAIDRIN FULL STOP diff --git a/unicodetools/data/ucd/dev/NormalizationTest.txt b/unicodetools/data/ucd/dev/NormalizationTest.txt index 97b4e4e62..9eee32616 100644 --- a/unicodetools/data/ucd/dev/NormalizationTest.txt +++ b/unicodetools/data/ucd/dev/NormalizationTest.txt @@ -1,5 +1,5 @@ # NormalizationTest-17.0.0.txt -# Date: 2025-06-30, 06:16:16 GMT +# Date: 2025-01-27, 18:09:23 GMT # © 2025 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. # For terms of use and license, see https://www.unicode.org/terms_of_use.html @@ -18891,6 +18891,8 @@ FFEE;FFEE;FFEE;25CB;25CB; # (○; ○; ○; ○; ○; ) HALFWIDTH WHITE CIRCLE 0061 16B35 0315 0300 05AE 0062;0061 05AE 16B35 0300 0315 0062;0061 05AE 16B35 0300 0315 0062;0061 05AE 16B35 0300 0315 0062;0061 05AE 16B35 0300 0315 0062; # (a◌𖬵◌̕◌̀◌֮b; a◌֮◌𖬵◌̀◌̕b; a◌֮◌𖬵◌̀◌̕b; a◌֮◌𖬵◌̀◌̕b; a◌֮◌𖬵◌̀◌̕b; ) LATIN SMALL LETTER A, PAHAWH HMONG MARK CIM HOM, COMBINING COMMA ABOVE RIGHT, COMBINING GRAVE ACCENT, HEBREW ACCENT ZINOR, LATIN SMALL LETTER B 0061 0315 0300 05AE 16B36 0062;00E0 05AE 16B36 0315 0062;0061 05AE 0300 16B36 0315 0062;00E0 05AE 16B36 0315 0062;0061 05AE 0300 16B36 0315 0062; # (a◌̕◌̀◌֮◌𖬶b; à◌֮◌𖬶◌̕b; a◌֮◌̀◌𖬶◌̕b; à◌֮◌𖬶◌̕b; a◌֮◌̀◌𖬶◌̕b; ) LATIN SMALL LETTER A, COMBINING COMMA ABOVE RIGHT, COMBINING GRAVE ACCENT, HEBREW ACCENT ZINOR, PAHAWH HMONG MARK CIM TAUM, LATIN SMALL LETTER B 0061 16B36 0315 0300 05AE 0062;0061 05AE 16B36 0300 0315 0062;0061 05AE 16B36 0300 0315 0062;0061 05AE 16B36 0300 0315 0062;0061 05AE 16B36 0300 0315 0062; # (a◌𖬶◌̕◌̀◌֮b; a◌֮◌𖬶◌̀◌̕b; a◌֮◌𖬶◌̀◌̕b; a◌֮◌𖬶◌̀◌̕b; a◌֮◌𖬶◌̀◌̕b; ) LATIN SMALL LETTER A, PAHAWH HMONG MARK CIM TAUM, COMBINING COMMA ABOVE RIGHT, COMBINING GRAVE ACCENT, HEBREW ACCENT ZINOR, LATIN SMALL LETTER B +0061 05B0 094D 3099 16D9D 0062;0061 3099 094D 16D9D 05B0 0062;0061 3099 094D 16D9D 05B0 0062;0061 3099 094D 16D9D 05B0 0062;0061 3099 094D 16D9D 05B0 0062; # (a◌ְ◌्◌゙◌𖶝b; a◌゙◌्◌𖶝◌ְb; a◌゙◌्◌𖶝◌ְb; a◌゙◌्◌𖶝◌ְb; a◌゙◌्◌𖶝◌ְb; ) LATIN SMALL LETTER A, HEBREW POINT SHEVA, DEVANAGARI SIGN VIRAMA, COMBINING KATAKANA-HIRAGANA VOICED SOUND MARK, CHISOI SIGN SISO, LATIN SMALL LETTER B +0061 16D9D 05B0 094D 3099 0062;0061 3099 16D9D 094D 05B0 0062;0061 3099 16D9D 094D 05B0 0062;0061 3099 16D9D 094D 05B0 0062;0061 3099 16D9D 094D 05B0 0062; # (a◌𖶝◌ְ◌्◌゙b; a◌゙◌𖶝◌्◌ְb; a◌゙◌𖶝◌्◌ְb; a◌゙◌𖶝◌्◌ְb; a◌゙◌𖶝◌्◌ְb; ) LATIN SMALL LETTER A, CHISOI SIGN SISO, HEBREW POINT SHEVA, DEVANAGARI SIGN VIRAMA, COMBINING KATAKANA-HIRAGANA VOICED SOUND MARK, LATIN SMALL LETTER B 0061 093C 16FF0 0334 16FF0 0062;0061 0334 16FF0 16FF0 093C 0062;0061 0334 16FF0 16FF0 093C 0062;0061 0334 16FF0 16FF0 093C 0062;0061 0334 16FF0 16FF0 093C 0062; # (a◌𖿰़◌̴𖿰b; a◌̴𖿰𖿰◌़b; a◌̴𖿰𖿰◌़b; a◌̴𖿰𖿰◌़b; a◌̴𖿰𖿰◌़b; ) LATIN SMALL LETTER A, DEVANAGARI SIGN NUKTA, VIETNAMESE ALTERNATE READING MARK CA, COMBINING TILDE OVERLAY, VIETNAMESE ALTERNATE READING MARK CA, LATIN SMALL LETTER B 0061 16FF0 093C 16FF0 0334 0062;0061 0334 16FF0 16FF0 093C 0062;0061 0334 16FF0 16FF0 093C 0062;0061 0334 16FF0 16FF0 093C 0062;0061 0334 16FF0 16FF0 093C 0062; # (a𖿰◌𖿰़◌̴b; a◌̴𖿰𖿰◌़b; a◌̴𖿰𖿰◌़b; a◌̴𖿰𖿰◌़b; a◌̴𖿰𖿰◌़b; ) LATIN SMALL LETTER A, VIETNAMESE ALTERNATE READING MARK CA, DEVANAGARI SIGN NUKTA, VIETNAMESE ALTERNATE READING MARK CA, COMBINING TILDE OVERLAY, LATIN SMALL LETTER B 0061 093C 16FF0 0334 16FF1 0062;0061 0334 16FF0 16FF1 093C 0062;0061 0334 16FF0 16FF1 093C 0062;0061 0334 16FF0 16FF1 093C 0062;0061 0334 16FF0 16FF1 093C 0062; # (a◌𖿰़◌̴𖿱b; a◌̴𖿰𖿱◌़b; a◌̴𖿰𖿱◌़b; a◌̴𖿰𖿱◌़b; a◌̴𖿰𖿱◌़b; ) LATIN SMALL LETTER A, DEVANAGARI SIGN NUKTA, VIETNAMESE ALTERNATE READING MARK CA, COMBINING TILDE OVERLAY, VIETNAMESE ALTERNATE READING MARK NHAY, LATIN SMALL LETTER B diff --git a/unicodetools/data/ucd/dev/PropList.txt b/unicodetools/data/ucd/dev/PropList.txt index e64b4224d..167bc3eae 100644 --- a/unicodetools/data/ucd/dev/PropList.txt +++ b/unicodetools/data/ucd/dev/PropList.txt @@ -1,5 +1,5 @@ # PropList-17.0.0.txt -# Date: 2025-06-30, 06:19:01 GMT +# Date: 2025-07-23, 01:37:21 GMT # © 2025 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. # For terms of use and license, see https://www.unicode.org/terms_of_use.html @@ -848,6 +848,7 @@ FB1E ; Other_Alphabetic # Mn HEBREW POINT JUDEO-SPANISH VARIKA 1611E..16129 ; Other_Alphabetic # Mn [12] GURUNG KHEMA VOWEL SIGN AA..GURUNG KHEMA VOWEL LENGTH MARK 1612A..1612C ; Other_Alphabetic # Mc [3] GURUNG KHEMA CONSONANT SIGN MEDIAL YA..GURUNG KHEMA CONSONANT SIGN MEDIAL HA 1612D..1612E ; Other_Alphabetic # Mn [2] GURUNG KHEMA SIGN ANUSVARA..GURUNG KHEMA CONSONANT SIGN MEDIAL RA +16D98 ; Other_Alphabetic # Mn CHISOI SIGN ANUSVARA 16F4F ; Other_Alphabetic # Mn MIAO SIGN CONSONANT MODIFIER BAR 16F51..16F87 ; Other_Alphabetic # Mc [55] MIAO SIGN ASPIRATION..MIAO VOWEL SIGN UI 16F8F..16F92 ; Other_Alphabetic # Mn [4] MIAO TONE RIGHT..MIAO TONE BELOW @@ -868,7 +869,7 @@ FB1E ; Other_Alphabetic # Mn HEBREW POINT JUDEO-SPANISH VARIKA 1F150..1F169 ; Other_Alphabetic # So [26] NEGATIVE CIRCLED LATIN CAPITAL LETTER A..NEGATIVE CIRCLED LATIN CAPITAL LETTER Z 1F170..1F189 ; Other_Alphabetic # So [26] NEGATIVE SQUARED LATIN CAPITAL LETTER A..NEGATIVE SQUARED LATIN CAPITAL LETTER Z -# Total code points: 1510 +# Total code points: 1511 # ================================================ @@ -1145,6 +1146,7 @@ FFE3 ; Diacritic # Sk FULLWIDTH MACRON 16AF0..16AF4 ; Diacritic # Mn [5] BASSA VAH COMBINING HIGH TONE..BASSA VAH COMBINING HIGH-LOW TONE 16B30..16B36 ; Diacritic # Mn [7] PAHAWH HMONG MARK CIM TUB..PAHAWH HMONG MARK CIM TAUM 16D6B..16D6C ; Diacritic # Lm [2] KIRAT RAI SIGN VIRAMA..KIRAT RAI SIGN SAAT +16D9D ; Diacritic # Mn CHISOI SIGN SISO 16F8F..16F92 ; Diacritic # Mn [4] MIAO TONE RIGHT..MIAO TONE BELOW 16F93..16F9F ; Diacritic # Lm [13] MIAO LETTER TONE-2..MIAO LETTER REFORMED TONE-8 16FF0..16FF1 ; Diacritic # Mc [2] VIETNAMESE ALTERNATE READING MARK CA..VIETNAMESE ALTERNATE READING MARK NHAY @@ -1167,7 +1169,7 @@ FFE3 ; Diacritic # Sk FULLWIDTH MACRON 1E944..1E946 ; Diacritic # Mn [3] ADLAM ALIF LENGTHENER..ADLAM GEMINATION MARK 1E948..1E94A ; Diacritic # Mn [3] ADLAM CONSONANT MODIFIER..ADLAM NUKTA -# Total code points: 1247 +# Total code points: 1248 # ================================================ diff --git a/unicodetools/data/ucd/dev/PropertyValueAliases.txt b/unicodetools/data/ucd/dev/PropertyValueAliases.txt index 4f56ef3eb..53d035e04 100644 --- a/unicodetools/data/ucd/dev/PropertyValueAliases.txt +++ b/unicodetools/data/ucd/dev/PropertyValueAliases.txt @@ -1,5 +1,5 @@ # PropertyValueAliases-17.0.0.txt -# Date: 2025-06-30, 06:16:21 GMT +# Date: 2025-04-25, 13:37:02 GMT # © 2025 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. # For terms of use and license, see https://www.unicode.org/terms_of_use.html @@ -198,6 +198,7 @@ blk; Cham ; Cham blk; Cherokee ; Cherokee blk; Cherokee_Sup ; Cherokee_Supplement blk; Chess_Symbols ; Chess_Symbols +blk; Chisoi ; Chisoi blk; Chorasmian ; Chorasmian blk; CJK ; CJK_Unified_Ideographs blk; CJK_Compat ; CJK_Compatibility @@ -1342,6 +1343,7 @@ sc ; Cans ; Canadian_Aboriginal sc ; Cari ; Carian sc ; Cham ; Cham sc ; Cher ; Cherokee +sc ; Chis ; Chisoi sc ; Chrs ; Chorasmian sc ; Copt ; Coptic ; Qaac sc ; Cpmn ; Cypro_Minoan diff --git a/unicodetools/data/ucd/dev/ScriptExtensions.txt b/unicodetools/data/ucd/dev/ScriptExtensions.txt index dddbc5c3c..1b852f171 100644 --- a/unicodetools/data/ucd/dev/ScriptExtensions.txt +++ b/unicodetools/data/ucd/dev/ScriptExtensions.txt @@ -1,5 +1,5 @@ # ScriptExtensions-17.0.0.txt -# Date: 2025-06-30, 06:16:32 GMT +# Date: 2025-01-27, 18:09:38 GMT # © 2025 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. # For terms of use and license, see https://www.unicode.org/terms_of_use.html @@ -81,8 +81,8 @@ 06D4 ; Arab Rohg # Po ARABIC FULL STOP 0951 ; Beng Deva Gran Gujr Guru Knda Latn Mlym Orya Shrd Taml Telu Tirh #Mn DEVANAGARI STRESS SIGN UDATTA 0952 ; Beng Deva Gran Gujr Guru Knda Latn Mlym Orya Taml Telu Tirh #Mn DEVANAGARI STRESS SIGN ANUDATTA -0964 ; Beng Deva Dogr Gong Gonm Gran Gujr Guru Knda Mahj Mlym Nand Onao Orya Sind Sinh Sylo Takr Taml Telu Tirh #Po DEVANAGARI DANDA -0965 ; Beng Deva Dogr Gong Gonm Gran Gujr Gukh Guru Knda Limb Mahj Mlym Nand Onao Orya Sind Sinh Sylo Takr Taml Telu Tirh #Po DEVANAGARI DOUBLE DANDA +0964 ; Beng Chis Deva Dogr Gong Gonm Gran Gujr Guru Knda Mahj Mlym Nand Onao Orya Sind Sinh Sylo Takr Taml Telu Tirh #Po DEVANAGARI DANDA +0965 ; Beng Chis Deva Dogr Gong Gonm Gran Gujr Gukh Guru Knda Limb Mahj Mlym Nand Onao Orya Sind Sinh Sylo Takr Taml Telu Tirh #Po DEVANAGARI DOUBLE DANDA 0966..096F ; Deva Dogr Kthi Mahj # Nd [10] DEVANAGARI DIGIT ZERO..DEVANAGARI DIGIT NINE 09E6..09EF ; Beng Cakm Sylo # Nd [10] BENGALI DIGIT ZERO..BENGALI DIGIT NINE 0A66..0A6F ; Guru Mult # Nd [10] GURMUKHI DIGIT ZERO..GURMUKHI DIGIT NINE diff --git a/unicodetools/data/ucd/dev/Scripts.txt b/unicodetools/data/ucd/dev/Scripts.txt index c53490ae4..eb174ed77 100644 --- a/unicodetools/data/ucd/dev/Scripts.txt +++ b/unicodetools/data/ucd/dev/Scripts.txt @@ -1,5 +1,5 @@ # Scripts-17.0.0.txt -# Date: 2025-06-30, 06:20:47 GMT +# Date: 2025-07-23, 01:37:34 GMT # © 2025 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. # For terms of use and license, see https://www.unicode.org/terms_of_use.html @@ -3143,6 +3143,16 @@ ABF0..ABF9 ; Meetei_Mayek # Nd [10] MEETEI MAYEK DIGIT ZERO..MEETEI MAYEK DI # ================================================ +16D80..16D97 ; Chisoi # Lo [24] CHISOI LETTER A..CHISOI LETTER PA +16D98 ; Chisoi # Mn CHISOI SIGN ANUSVARA +16D99..16D9C ; Chisoi # Lo [4] CHISOI LETTER YA..CHISOI LETTER JARAHA +16D9D ; Chisoi # Mn CHISOI SIGN SISO +16DA0..16DA9 ; Chisoi # Nd [10] CHISOI DIGIT ZERO..CHISOI DIGIT NINE + +# Total code points: 40 + +# ================================================ + 10940..10959 ; Sidetic # Lo [26] SIDETIC LETTER N01..SIDETIC LETTER N26 # Total code points: 26 diff --git a/unicodetools/data/ucd/dev/UnicodeData.txt b/unicodetools/data/ucd/dev/UnicodeData.txt index 90effa8dc..1c274ab48 100644 --- a/unicodetools/data/ucd/dev/UnicodeData.txt +++ b/unicodetools/data/ucd/dev/UnicodeData.txt @@ -30197,6 +30197,46 @@ FFFD;REPLACEMENT CHARACTER;So;0;ON;;;;;N;;;;; 16D77;KIRAT RAI DIGIT SEVEN;Nd;0;L;;7;7;7;N;;;;; 16D78;KIRAT RAI DIGIT EIGHT;Nd;0;L;;8;8;8;N;;;;; 16D79;KIRAT RAI DIGIT NINE;Nd;0;L;;9;9;9;N;;;;; +16D80;CHISOI LETTER A;Lo;0;L;;;;;N;;;;; +16D81;CHISOI LETTER BA;Lo;0;L;;;;;N;;;;; +16D82;CHISOI LETTER AI;Lo;0;L;;;;;N;;;;; +16D83;CHISOI LETTER AA;Lo;0;L;;;;;N;;;;; +16D84;CHISOI LETTER GA;Lo;0;L;;;;;N;;;;; +16D85;CHISOI LETTER TA;Lo;0;L;;;;;N;;;;; +16D86;CHISOI LETTER E;Lo;0;L;;;;;N;;;;; +16D87;CHISOI LETTER SA;Lo;0;L;;;;;N;;;;; +16D88;CHISOI LETTER NA;Lo;0;L;;;;;N;;;;; +16D89;CHISOI LETTER I;Lo;0;L;;;;;N;;;;; +16D8A;CHISOI LETTER KA;Lo;0;L;;;;;N;;;;; +16D8B;CHISOI LETTER RA;Lo;0;L;;;;;N;;;;; +16D8C;CHISOI LETTER MA;Lo;0;L;;;;;N;;;;; +16D8D;CHISOI LETTER HA;Lo;0;L;;;;;N;;;;; +16D8E;CHISOI LETTER RRA;Lo;0;L;;;;;N;;;;; +16D8F;CHISOI LETTER U;Lo;0;L;;;;;N;;;;; +16D90;CHISOI LETTER DA;Lo;0;L;;;;;N;;;;; +16D91;CHISOI LETTER LA;Lo;0;L;;;;;N;;;;; +16D92;CHISOI LETTER O;Lo;0;L;;;;;N;;;;; +16D93;CHISOI LETTER NYA;Lo;0;L;;;;;N;;;;; +16D94;CHISOI LETTER NGA;Lo;0;L;;;;;N;;;;; +16D95;CHISOI LETTER CA;Lo;0;L;;;;;N;;;;; +16D96;CHISOI LETTER JA;Lo;0;L;;;;;N;;;;; +16D97;CHISOI LETTER PA;Lo;0;L;;;;;N;;;;; +16D98;CHISOI SIGN ANUSVARA;Mn;0;NSM;;;;;N;;;;; +16D99;CHISOI LETTER YA;Lo;0;L;;;;;N;;;;; +16D9A;CHISOI LETTER DDA;Lo;0;L;;;;;N;;;;; +16D9B;CHISOI LETTER TTA;Lo;0;L;;;;;N;;;;; +16D9C;CHISOI LETTER JARAHA;Lo;0;L;;;;;N;;;;; +16D9D;CHISOI SIGN SISO;Mn;9;NSM;;;;;N;;;;; +16DA0;CHISOI DIGIT ZERO;Nd;0;L;;0;0;0;N;;;;; +16DA1;CHISOI DIGIT ONE;Nd;0;L;;1;1;1;N;;;;; +16DA2;CHISOI DIGIT TWO;Nd;0;L;;2;2;2;N;;;;; +16DA3;CHISOI DIGIT THREE;Nd;0;L;;3;3;3;N;;;;; +16DA4;CHISOI DIGIT FOUR;Nd;0;L;;4;4;4;N;;;;; +16DA5;CHISOI DIGIT FIVE;Nd;0;L;;5;5;5;N;;;;; +16DA6;CHISOI DIGIT SIX;Nd;0;L;;6;6;6;N;;;;; +16DA7;CHISOI DIGIT SEVEN;Nd;0;L;;7;7;7;N;;;;; +16DA8;CHISOI DIGIT EIGHT;Nd;0;L;;8;8;8;N;;;;; +16DA9;CHISOI DIGIT NINE;Nd;0;L;;9;9;9;N;;;;; 16E40;MEDEFAIDRIN CAPITAL LETTER M;Lu;0;L;;;;;N;;;;16E60; 16E41;MEDEFAIDRIN CAPITAL LETTER S;Lu;0;L;;;;;N;;;;16E61; 16E42;MEDEFAIDRIN CAPITAL LETTER V;Lu;0;L;;;;;N;;;;16E62; diff --git a/unicodetools/data/ucd/dev/VerticalOrientation.txt b/unicodetools/data/ucd/dev/VerticalOrientation.txt index 37b394bb2..f3e7ea688 100644 --- a/unicodetools/data/ucd/dev/VerticalOrientation.txt +++ b/unicodetools/data/ucd/dev/VerticalOrientation.txt @@ -1,5 +1,5 @@ # VerticalOrientation-17.0.0.txt -# Date: 2025-06-30, 06:20:49 GMT +# Date: 2025-07-23, 01:37:37 GMT # © 2025 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. # For terms of use and license, see https://www.unicode.org/terms_of_use.html @@ -2195,6 +2195,11 @@ FFFC..FFFD ; U # So [2] OBJECT REPLACEMENT CHARACTER..REPLACEMENT CHARA 16D6B..16D6C ; R # Lm [2] KIRAT RAI SIGN VIRAMA..KIRAT RAI SIGN SAAT 16D6D..16D6F ; R # Po [3] KIRAT RAI SIGN YUPI..KIRAT RAI DOUBLE DANDA 16D70..16D79 ; R # Nd [10] KIRAT RAI DIGIT ZERO..KIRAT RAI DIGIT NINE +16D80..16D97 ; R # Lo [24] CHISOI LETTER A..CHISOI LETTER PA +16D98 ; R # Mn CHISOI SIGN ANUSVARA +16D99..16D9C ; R # Lo [4] CHISOI LETTER YA..CHISOI LETTER JARAHA +16D9D ; R # Mn CHISOI SIGN SISO +16DA0..16DA9 ; R # Nd [10] CHISOI DIGIT ZERO..CHISOI DIGIT NINE 16E40..16E7F ; R # L& [64] MEDEFAIDRIN CAPITAL LETTER M..MEDEFAIDRIN SMALL LETTER Y 16E80..16E96 ; R # No [23] MEDEFAIDRIN DIGIT ZERO..MEDEFAIDRIN DIGIT THREE ALTERNATE FORM 16E97..16E9A ; R # Po [4] MEDEFAIDRIN COMMA..MEDEFAIDRIN EXCLAMATION OH diff --git a/unicodetools/data/ucd/dev/auxiliary/GraphemeBreakProperty.txt b/unicodetools/data/ucd/dev/auxiliary/GraphemeBreakProperty.txt index 19b13571f..33fbda5b3 100644 --- a/unicodetools/data/ucd/dev/auxiliary/GraphemeBreakProperty.txt +++ b/unicodetools/data/ucd/dev/auxiliary/GraphemeBreakProperty.txt @@ -1,5 +1,5 @@ # GraphemeBreakProperty-17.0.0.txt -# Date: 2025-06-30, 06:20:23 GMT +# Date: 2025-07-23, 01:37:08 GMT # © 2025 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. # For terms of use and license, see https://www.unicode.org/terms_of_use.html @@ -461,6 +461,8 @@ FF9E..FF9F ; Extend # Lm [2] HALFWIDTH KATAKANA VOICED SOUND MARK..HALFWIDT 1612D..1612F ; Extend # Mn [3] GURUNG KHEMA SIGN ANUSVARA..GURUNG KHEMA SIGN THOLHOMA 16AF0..16AF4 ; Extend # Mn [5] BASSA VAH COMBINING HIGH TONE..BASSA VAH COMBINING HIGH-LOW TONE 16B30..16B36 ; Extend # Mn [7] PAHAWH HMONG MARK CIM TUB..PAHAWH HMONG MARK CIM TAUM +16D98 ; Extend # Mn CHISOI SIGN ANUSVARA +16D9D ; Extend # Mn CHISOI SIGN SISO 16F4F ; Extend # Mn MIAO SIGN CONSONANT MODIFIER BAR 16F8F..16F92 ; Extend # Mn [4] MIAO TONE RIGHT..MIAO TONE BELOW 16FE4 ; Extend # Mn KHITAN SMALL SCRIPT FILLER @@ -502,7 +504,7 @@ FF9E..FF9F ; Extend # Lm [2] HALFWIDTH KATAKANA VOICED SOUND MARK..HALFWIDT E0020..E007F ; Extend # Cf [96] TAG SPACE..CANCEL TAG E0100..E01EF ; Extend # Mn [240] VARIATION SELECTOR-17..VARIATION SELECTOR-256 -# Total code points: 2237 +# Total code points: 2239 # ================================================ diff --git a/unicodetools/data/ucd/dev/auxiliary/SentenceBreakProperty.txt b/unicodetools/data/ucd/dev/auxiliary/SentenceBreakProperty.txt index c06f4e26a..090ee9070 100644 --- a/unicodetools/data/ucd/dev/auxiliary/SentenceBreakProperty.txt +++ b/unicodetools/data/ucd/dev/auxiliary/SentenceBreakProperty.txt @@ -1,5 +1,5 @@ # SentenceBreakProperty-17.0.0.txt -# Date: 2025-06-30, 06:20:48 GMT +# Date: 2025-07-23, 01:37:35 GMT # © 2025 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. # For terms of use and license, see https://www.unicode.org/terms_of_use.html @@ -556,6 +556,8 @@ FF9E..FF9F ; Extend # Lm [2] HALFWIDTH KATAKANA VOICED SOUND MARK..HALFWIDT 1612D..1612F ; Extend # Mn [3] GURUNG KHEMA SIGN ANUSVARA..GURUNG KHEMA SIGN THOLHOMA 16AF0..16AF4 ; Extend # Mn [5] BASSA VAH COMBINING HIGH TONE..BASSA VAH COMBINING HIGH-LOW TONE 16B30..16B36 ; Extend # Mn [7] PAHAWH HMONG MARK CIM TUB..PAHAWH HMONG MARK CIM TAUM +16D98 ; Extend # Mn CHISOI SIGN ANUSVARA +16D9D ; Extend # Mn CHISOI SIGN SISO 16F4F ; Extend # Mn MIAO SIGN CONSONANT MODIFIER BAR 16F51..16F87 ; Extend # Mc [55] MIAO SIGN ASPIRATION..MIAO VOWEL SIGN UI 16F8F..16F92 ; Extend # Mn [4] MIAO TONE RIGHT..MIAO TONE BELOW @@ -597,7 +599,7 @@ FF9E..FF9F ; Extend # Lm [2] HALFWIDTH KATAKANA VOICED SOUND MARK..HALFWIDT E0020..E007F ; Extend # Cf [96] TAG SPACE..CANCEL TAG E0100..E01EF ; Extend # Mn [240] VARIATION SELECTOR-17..VARIATION SELECTOR-256 -# Total code points: 2643 +# Total code points: 2645 # ================================================ @@ -2528,6 +2530,8 @@ FFDA..FFDC ; OLetter # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGUL 16D40..16D42 ; OLetter # Lm [3] KIRAT RAI SIGN ANUSVARA..KIRAT RAI SIGN VISARGA 16D43..16D6A ; OLetter # Lo [40] KIRAT RAI LETTER A..KIRAT RAI VOWEL SIGN AU 16D6B..16D6C ; OLetter # Lm [2] KIRAT RAI SIGN VIRAMA..KIRAT RAI SIGN SAAT +16D80..16D97 ; OLetter # Lo [24] CHISOI LETTER A..CHISOI LETTER PA +16D99..16D9C ; OLetter # Lo [4] CHISOI LETTER YA..CHISOI LETTER JARAHA 16F00..16F4A ; OLetter # Lo [75] MIAO LETTER PA..MIAO LETTER RTE 16F50 ; OLetter # Lo MIAO LETTER NASALIZATION 16F93..16F9F ; OLetter # Lm [13] MIAO LETTER TONE-2..MIAO LETTER REFORMED TONE-8 @@ -2616,7 +2620,7 @@ FFDA..FFDC ; OLetter # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGUL 30000..3134A ; OLetter # Lo [4939] CJK UNIFIED IDEOGRAPH-30000..CJK UNIFIED IDEOGRAPH-3134A 31350..33479 ; OLetter # Lo [8490] CJK UNIFIED IDEOGRAPH-31350..CJK UNIFIED IDEOGRAPH-33479 -# Total code points: 141501 +# Total code points: 141529 # ================================================ @@ -2692,6 +2696,7 @@ FF10..FF19 ; Numeric # Nd [10] FULLWIDTH DIGIT ZERO..FULLWIDTH DIGIT NINE 16AC0..16AC9 ; Numeric # Nd [10] TANGSA DIGIT ZERO..TANGSA DIGIT NINE 16B50..16B59 ; Numeric # Nd [10] PAHAWH HMONG DIGIT ZERO..PAHAWH HMONG DIGIT NINE 16D70..16D79 ; Numeric # Nd [10] KIRAT RAI DIGIT ZERO..KIRAT RAI DIGIT NINE +16DA0..16DA9 ; Numeric # Nd [10] CHISOI DIGIT ZERO..CHISOI DIGIT NINE 1CCF0..1CCF9 ; Numeric # Nd [10] OUTLINED DIGIT ZERO..OUTLINED DIGIT NINE 1D7CE..1D7FF ; Numeric # Nd [50] MATHEMATICAL BOLD DIGIT ZERO..MATHEMATICAL MONOSPACE DIGIT NINE 1E140..1E149 ; Numeric # Nd [10] NYIAKENG PUACHUE HMONG DIGIT ZERO..NYIAKENG PUACHUE HMONG DIGIT NINE @@ -2701,7 +2706,7 @@ FF10..FF19 ; Numeric # Nd [10] FULLWIDTH DIGIT ZERO..FULLWIDTH DIGIT NINE 1E950..1E959 ; Numeric # Nd [10] ADLAM DIGIT ZERO..ADLAM DIGIT NINE 1FBF0..1FBF9 ; Numeric # Nd [10] SEGMENTED DIGIT ZERO..SEGMENTED DIGIT NINE -# Total code points: 785 +# Total code points: 795 # ================================================ diff --git a/unicodetools/data/ucd/dev/auxiliary/WordBreakProperty.txt b/unicodetools/data/ucd/dev/auxiliary/WordBreakProperty.txt index 20fa24e37..50e3c1f23 100644 --- a/unicodetools/data/ucd/dev/auxiliary/WordBreakProperty.txt +++ b/unicodetools/data/ucd/dev/auxiliary/WordBreakProperty.txt @@ -1,5 +1,5 @@ # WordBreakProperty-17.0.0.txt -# Date: 2025-06-30, 06:20:49 GMT +# Date: 2025-07-23, 01:37:37 GMT # © 2025 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. # For terms of use and license, see https://www.unicode.org/terms_of_use.html @@ -592,6 +592,8 @@ FF9E..FF9F ; Extend # Lm [2] HALFWIDTH KATAKANA VOICED SOUND MARK..HALFWIDT 1612D..1612F ; Extend # Mn [3] GURUNG KHEMA SIGN ANUSVARA..GURUNG KHEMA SIGN THOLHOMA 16AF0..16AF4 ; Extend # Mn [5] BASSA VAH COMBINING HIGH TONE..BASSA VAH COMBINING HIGH-LOW TONE 16B30..16B36 ; Extend # Mn [7] PAHAWH HMONG MARK CIM TUB..PAHAWH HMONG MARK CIM TAUM +16D98 ; Extend # Mn CHISOI SIGN ANUSVARA +16D9D ; Extend # Mn CHISOI SIGN SISO 16F4F ; Extend # Mn MIAO SIGN CONSONANT MODIFIER BAR 16F51..16F87 ; Extend # Mc [55] MIAO SIGN ASPIRATION..MIAO VOWEL SIGN UI 16F8F..16F92 ; Extend # Mn [4] MIAO TONE RIGHT..MIAO TONE BELOW @@ -634,7 +636,7 @@ FF9E..FF9F ; Extend # Lm [2] HALFWIDTH KATAKANA VOICED SOUND MARK..HALFWIDT E0020..E007F ; Extend # Cf [96] TAG SPACE..CANCEL TAG E0100..E01EF ; Extend # Mn [240] VARIATION SELECTOR-17..VARIATION SELECTOR-256 -# Total code points: 2647 +# Total code points: 2649 # ================================================ @@ -1272,6 +1274,8 @@ FFDA..FFDC ; ALetter # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGUL 16D40..16D42 ; ALetter # Lm [3] KIRAT RAI SIGN ANUSVARA..KIRAT RAI SIGN VISARGA 16D43..16D6A ; ALetter # Lo [40] KIRAT RAI LETTER A..KIRAT RAI VOWEL SIGN AU 16D6B..16D6C ; ALetter # Lm [2] KIRAT RAI SIGN VIRAMA..KIRAT RAI SIGN SAAT +16D80..16D97 ; ALetter # Lo [24] CHISOI LETTER A..CHISOI LETTER PA +16D99..16D9C ; ALetter # Lo [4] CHISOI LETTER YA..CHISOI LETTER JARAHA 16E40..16E7F ; ALetter # L& [64] MEDEFAIDRIN CAPITAL LETTER M..MEDEFAIDRIN SMALL LETTER Y 16EA0..16EB8 ; ALetter # L& [25] BERIA ERFE CAPITAL LETTER ARKAB..BERIA ERFE CAPITAL LETTER AY 16EBB..16ED3 ; ALetter # L& [25] BERIA ERFE SMALL LETTER ARKAB..BERIA ERFE SMALL LETTER AY @@ -1379,7 +1383,7 @@ FFDA..FFDC ; ALetter # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGUL 1F150..1F169 ; ALetter # So [26] NEGATIVE CIRCLED LATIN CAPITAL LETTER A..NEGATIVE CIRCLED LATIN CAPITAL LETTER Z 1F170..1F189 ; ALetter # So [26] NEGATIVE SQUARED LATIN CAPITAL LETTER A..NEGATIVE SQUARED LATIN CAPITAL LETTER Z -# Total code points: 33973 +# Total code points: 34001 # ================================================ @@ -1498,6 +1502,7 @@ FF10..FF19 ; Numeric # Nd [10] FULLWIDTH DIGIT ZERO..FULLWIDTH DIGIT NINE 16AC0..16AC9 ; Numeric # Nd [10] TANGSA DIGIT ZERO..TANGSA DIGIT NINE 16B50..16B59 ; Numeric # Nd [10] PAHAWH HMONG DIGIT ZERO..PAHAWH HMONG DIGIT NINE 16D70..16D79 ; Numeric # Nd [10] KIRAT RAI DIGIT ZERO..KIRAT RAI DIGIT NINE +16DA0..16DA9 ; Numeric # Nd [10] CHISOI DIGIT ZERO..CHISOI DIGIT NINE 1CCF0..1CCF9 ; Numeric # Nd [10] OUTLINED DIGIT ZERO..OUTLINED DIGIT NINE 1D7CE..1D7FF ; Numeric # Nd [50] MATHEMATICAL BOLD DIGIT ZERO..MATHEMATICAL MONOSPACE DIGIT NINE 1E140..1E149 ; Numeric # Nd [10] NYIAKENG PUACHUE HMONG DIGIT ZERO..NYIAKENG PUACHUE HMONG DIGIT NINE @@ -1507,7 +1512,7 @@ FF10..FF19 ; Numeric # Nd [10] FULLWIDTH DIGIT ZERO..FULLWIDTH DIGIT NINE 1E950..1E959 ; Numeric # Nd [10] ADLAM DIGIT ZERO..ADLAM DIGIT NINE 1FBF0..1FBF9 ; Numeric # Nd [10] SEGMENTED DIGIT ZERO..SEGMENTED DIGIT NINE -# Total code points: 784 +# Total code points: 794 # ================================================ diff --git a/unicodetools/data/ucd/dev/extracted/DerivedBidiClass.txt b/unicodetools/data/ucd/dev/extracted/DerivedBidiClass.txt index bb2824f56..3bb75eee8 100644 --- a/unicodetools/data/ucd/dev/extracted/DerivedBidiClass.txt +++ b/unicodetools/data/ucd/dev/extracted/DerivedBidiClass.txt @@ -1,5 +1,5 @@ # DerivedBidiClass-17.0.0.txt -# Date: 2025-06-30, 06:20:17 GMT +# Date: 2025-07-23, 01:37:02 GMT # © 2025 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. # For terms of use and license, see https://www.unicode.org/terms_of_use.html @@ -1098,6 +1098,9 @@ FFDA..FFDC ; L # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGUL LETTER 16D6B..16D6C ; L # Lm [2] KIRAT RAI SIGN VIRAMA..KIRAT RAI SIGN SAAT 16D6D..16D6F ; L # Po [3] KIRAT RAI SIGN YUPI..KIRAT RAI DOUBLE DANDA 16D70..16D79 ; L # Nd [10] KIRAT RAI DIGIT ZERO..KIRAT RAI DIGIT NINE +16D80..16D97 ; L # Lo [24] CHISOI LETTER A..CHISOI LETTER PA +16D99..16D9C ; L # Lo [4] CHISOI LETTER YA..CHISOI LETTER JARAHA +16DA0..16DA9 ; L # Nd [10] CHISOI DIGIT ZERO..CHISOI DIGIT NINE 16E40..16E7F ; L # L& [64] MEDEFAIDRIN CAPITAL LETTER M..MEDEFAIDRIN SMALL LETTER Y 16E80..16E96 ; L # No [23] MEDEFAIDRIN DIGIT ZERO..MEDEFAIDRIN DIGIT THREE ALTERNATE FORM 16E97..16E9A ; L # Po [4] MEDEFAIDRIN COMMA..MEDEFAIDRIN EXCLAMATION OH @@ -1229,8 +1232,8 @@ FFDA..FFDC ; L # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGUL LETTER F0000..FFFFD ; L # Co [65534] .. 100000..10FFFD; L # Co [65534] .. -# The above property value applies to 810614 code points not listed here. -# Total code points: 1095406 +# The above property value applies to 810574 code points not listed here. +# Total code points: 1095404 # ================================================ @@ -2405,6 +2408,8 @@ FE20..FE2F ; NSM # Mn [16] COMBINING LIGATURE LEFT HALF..COMBINING CYRILLIC 1612D..1612F ; NSM # Mn [3] GURUNG KHEMA SIGN ANUSVARA..GURUNG KHEMA SIGN THOLHOMA 16AF0..16AF4 ; NSM # Mn [5] BASSA VAH COMBINING HIGH TONE..BASSA VAH COMBINING HIGH-LOW TONE 16B30..16B36 ; NSM # Mn [7] PAHAWH HMONG MARK CIM TUB..PAHAWH HMONG MARK CIM TAUM +16D98 ; NSM # Mn CHISOI SIGN ANUSVARA +16D9D ; NSM # Mn CHISOI SIGN SISO 16F4F ; NSM # Mn MIAO SIGN CONSONANT MODIFIER BAR 16F8F..16F92 ; NSM # Mn [4] MIAO TONE RIGHT..MIAO TONE BELOW 16FE4 ; NSM # Mn KHITAN SMALL SCRIPT FILLER @@ -2441,7 +2446,7 @@ FE20..FE2F ; NSM # Mn [16] COMBINING LIGATURE LEFT HALF..COMBINING CYRILLIC 1E944..1E94A ; NSM # Mn [7] ADLAM ALIF LENGTHENER..ADLAM NUKTA E0100..E01EF ; NSM # Mn [240] VARIATION SELECTOR-17..VARIATION SELECTOR-256 -# Total code points: 2067 +# Total code points: 2069 # ================================================ diff --git a/unicodetools/data/ucd/dev/extracted/DerivedCombiningClass.txt b/unicodetools/data/ucd/dev/extracted/DerivedCombiningClass.txt index c14c80b0e..13dfde458 100644 --- a/unicodetools/data/ucd/dev/extracted/DerivedCombiningClass.txt +++ b/unicodetools/data/ucd/dev/extracted/DerivedCombiningClass.txt @@ -1,5 +1,5 @@ # DerivedCombiningClass-17.0.0.txt -# Date: 2025-06-30, 06:20:18 GMT +# Date: 2025-07-23, 01:37:03 GMT # © 2025 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. # For terms of use and license, see https://www.unicode.org/terms_of_use.html @@ -1839,6 +1839,10 @@ FFFC..FFFD ; 0 # So [2] OBJECT REPLACEMENT CHARACTER..REPLACEMENT CHARACTER 16D6B..16D6C ; 0 # Lm [2] KIRAT RAI SIGN VIRAMA..KIRAT RAI SIGN SAAT 16D6D..16D6F ; 0 # Po [3] KIRAT RAI SIGN YUPI..KIRAT RAI DOUBLE DANDA 16D70..16D79 ; 0 # Nd [10] KIRAT RAI DIGIT ZERO..KIRAT RAI DIGIT NINE +16D80..16D97 ; 0 # Lo [24] CHISOI LETTER A..CHISOI LETTER PA +16D98 ; 0 # Mn CHISOI SIGN ANUSVARA +16D99..16D9C ; 0 # Lo [4] CHISOI LETTER YA..CHISOI LETTER JARAHA +16DA0..16DA9 ; 0 # Nd [10] CHISOI DIGIT ZERO..CHISOI DIGIT NINE 16E40..16E7F ; 0 # L& [64] MEDEFAIDRIN CAPITAL LETTER M..MEDEFAIDRIN SMALL LETTER Y 16E80..16E96 ; 0 # No [23] MEDEFAIDRIN DIGIT ZERO..MEDEFAIDRIN DIGIT THREE ALTERNATE FORM 16E97..16E9A ; 0 # Po [4] MEDEFAIDRIN COMMA..MEDEFAIDRIN EXCLAMATION OH @@ -2089,8 +2093,8 @@ E0100..E01EF ; 0 # Mn [240] VARIATION SELECTOR-17..VARIATION SELECTOR-256 F0000..FFFFD ; 0 # Co [65534] .. 100000..10FFFD; 0 # Co [65534] .. -# The above property value applies to 816777 code points not listed here. -# Total code points: 1113144 +# The above property value applies to 816737 code points not listed here. +# Total code points: 1113143 # ================================================ @@ -2227,8 +2231,9 @@ ABED ; 9 # Mn MEETEI MAYEK APUN IYEK 11F41 ; 9 # Mc KAWI SIGN KILLER 11F42 ; 9 # Mn KAWI CONJOINER 1612F ; 9 # Mn GURUNG KHEMA SIGN THOLHOMA +16D9D ; 9 # Mn CHISOI SIGN SISO -# Total code points: 69 +# Total code points: 70 # ================================================ diff --git a/unicodetools/data/ucd/dev/extracted/DerivedEastAsianWidth.txt b/unicodetools/data/ucd/dev/extracted/DerivedEastAsianWidth.txt index ef85ad819..f5e743133 100644 --- a/unicodetools/data/ucd/dev/extracted/DerivedEastAsianWidth.txt +++ b/unicodetools/data/ucd/dev/extracted/DerivedEastAsianWidth.txt @@ -1,5 +1,5 @@ # DerivedEastAsianWidth-17.0.0.txt -# Date: 2025-06-30, 06:20:19 GMT +# Date: 2025-07-23, 01:37:05 GMT # © 2025 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. # For terms of use and license, see https://www.unicode.org/terms_of_use.html @@ -1880,6 +1880,11 @@ FFFC ; N # So OBJECT REPLACEMENT CHARACTER 16D6B..16D6C ; N # Lm [2] KIRAT RAI SIGN VIRAMA..KIRAT RAI SIGN SAAT 16D6D..16D6F ; N # Po [3] KIRAT RAI SIGN YUPI..KIRAT RAI DOUBLE DANDA 16D70..16D79 ; N # Nd [10] KIRAT RAI DIGIT ZERO..KIRAT RAI DIGIT NINE +16D80..16D97 ; N # Lo [24] CHISOI LETTER A..CHISOI LETTER PA +16D98 ; N # Mn CHISOI SIGN ANUSVARA +16D99..16D9C ; N # Lo [4] CHISOI LETTER YA..CHISOI LETTER JARAHA +16D9D ; N # Mn CHISOI SIGN SISO +16DA0..16DA9 ; N # Nd [10] CHISOI DIGIT ZERO..CHISOI DIGIT NINE 16E40..16E7F ; N # L& [64] MEDEFAIDRIN CAPITAL LETTER M..MEDEFAIDRIN SMALL LETTER Y 16E80..16E96 ; N # No [23] MEDEFAIDRIN DIGIT ZERO..MEDEFAIDRIN DIGIT THREE ALTERNATE FORM 16E97..16E9A ; N # Po [4] MEDEFAIDRIN COMMA..MEDEFAIDRIN EXCLAMATION OH @@ -2136,7 +2141,7 @@ FFFC ; N # So OBJECT REPLACEMENT CHARACTER E0001 ; N # Cf LANGUAGE TAG E0020..E007F ; N # Cf [96] TAG SPACE..CANCEL TAG -# The above property value applies to 760611 code points not listed here. +# The above property value applies to 760571 code points not listed here. # Total code points: 792262 # ================================================ diff --git a/unicodetools/data/ucd/dev/extracted/DerivedGeneralCategory.txt b/unicodetools/data/ucd/dev/extracted/DerivedGeneralCategory.txt index 0696c57fa..85058a0b7 100644 --- a/unicodetools/data/ucd/dev/extracted/DerivedGeneralCategory.txt +++ b/unicodetools/data/ucd/dev/extracted/DerivedGeneralCategory.txt @@ -1,5 +1,5 @@ # DerivedGeneralCategory-17.0.0.txt -# Date: 2025-06-30, 06:20:20 GMT +# Date: 2025-07-23, 01:37:05 GMT # © 2025 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. # For terms of use and license, see https://www.unicode.org/terms_of_use.html @@ -569,7 +569,9 @@ FFFE..FFFF ; Cn # [2] .. 16B62 ; Cn # 16B78..16B7C ; Cn # [5] .. 16B90..16D3F ; Cn # [432] .. -16D7A..16E3F ; Cn # [198] .. +16D7A..16D7F ; Cn # [6] .. +16D9E..16D9F ; Cn # [2] .. +16DAA..16E3F ; Cn # [150] .. 16E9B..16E9F ; Cn # [5] .. 16EB9..16EBA ; Cn # [2] .. 16ED4..16EFF ; Cn # [44] .. @@ -751,7 +753,7 @@ E01F0..EFFFF ; Cn # [65040] .. FFFFE..FFFFF ; Cn # [2] .. 10FFFE..10FFFF; Cn # [2] .. -# Total code points: 814729 +# Total code points: 814689 # ================================================ @@ -2655,6 +2657,8 @@ FFDA..FFDC ; Lo # [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGUL LETTER I 16B63..16B77 ; Lo # [21] PAHAWH HMONG SIGN VOS LUB..PAHAWH HMONG SIGN CIM NRES TOS 16B7D..16B8F ; Lo # [19] PAHAWH HMONG CLAN SIGN TSHEEJ..PAHAWH HMONG CLAN SIGN VWJ 16D43..16D6A ; Lo # [40] KIRAT RAI LETTER A..KIRAT RAI VOWEL SIGN AU +16D80..16D97 ; Lo # [24] CHISOI LETTER A..CHISOI LETTER PA +16D99..16D9C ; Lo # [4] CHISOI LETTER YA..CHISOI LETTER JARAHA 16F00..16F4A ; Lo # [75] MIAO LETTER PA..MIAO LETTER RTE 16F50 ; Lo # MIAO LETTER NASALIZATION 17000..18CD5 ; Lo # [7382] TANGUT IDEOGRAPH-17000..KHITAN SMALL SCRIPT CHARACTER-18CD5 @@ -2731,7 +2735,7 @@ FFDA..FFDC ; Lo # [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGUL LETTER I 30000..3134A ; Lo # [4939] CJK UNIFIED IDEOGRAPH-30000..CJK UNIFIED IDEOGRAPH-3134A 31350..33479 ; Lo # [8490] CJK UNIFIED IDEOGRAPH-31350..CJK UNIFIED IDEOGRAPH-33479 -# Total code points: 141062 +# Total code points: 141090 # ================================================ @@ -3067,6 +3071,8 @@ FE20..FE2F ; Mn # [16] COMBINING LIGATURE LEFT HALF..COMBINING CYRILLIC TITL 1612D..1612F ; Mn # [3] GURUNG KHEMA SIGN ANUSVARA..GURUNG KHEMA SIGN THOLHOMA 16AF0..16AF4 ; Mn # [5] BASSA VAH COMBINING HIGH TONE..BASSA VAH COMBINING HIGH-LOW TONE 16B30..16B36 ; Mn # [7] PAHAWH HMONG MARK CIM TUB..PAHAWH HMONG MARK CIM TAUM +16D98 ; Mn # CHISOI SIGN ANUSVARA +16D9D ; Mn # CHISOI SIGN SISO 16F4F ; Mn # MIAO SIGN CONSONANT MODIFIER BAR 16F8F..16F92 ; Mn # [4] MIAO TONE RIGHT..MIAO TONE BELOW 16FE4 ; Mn # KHITAN SMALL SCRIPT FILLER @@ -3103,7 +3109,7 @@ FE20..FE2F ; Mn # [16] COMBINING LIGATURE LEFT HALF..COMBINING CYRILLIC TITL 1E944..1E94A ; Mn # [7] ADLAM ALIF LENGTHENER..ADLAM NUKTA E0100..E01EF ; Mn # [240] VARIATION SELECTOR-17..VARIATION SELECTOR-256 -# Total code points: 2059 +# Total code points: 2061 # ================================================ @@ -3385,6 +3391,7 @@ FF10..FF19 ; Nd # [10] FULLWIDTH DIGIT ZERO..FULLWIDTH DIGIT NINE 16AC0..16AC9 ; Nd # [10] TANGSA DIGIT ZERO..TANGSA DIGIT NINE 16B50..16B59 ; Nd # [10] PAHAWH HMONG DIGIT ZERO..PAHAWH HMONG DIGIT NINE 16D70..16D79 ; Nd # [10] KIRAT RAI DIGIT ZERO..KIRAT RAI DIGIT NINE +16DA0..16DA9 ; Nd # [10] CHISOI DIGIT ZERO..CHISOI DIGIT NINE 1CCF0..1CCF9 ; Nd # [10] OUTLINED DIGIT ZERO..OUTLINED DIGIT NINE 1D7CE..1D7FF ; Nd # [50] MATHEMATICAL BOLD DIGIT ZERO..MATHEMATICAL MONOSPACE DIGIT NINE 1E140..1E149 ; Nd # [10] NYIAKENG PUACHUE HMONG DIGIT ZERO..NYIAKENG PUACHUE HMONG DIGIT NINE @@ -3394,7 +3401,7 @@ FF10..FF19 ; Nd # [10] FULLWIDTH DIGIT ZERO..FULLWIDTH DIGIT NINE 1E950..1E959 ; Nd # [10] ADLAM DIGIT ZERO..ADLAM DIGIT NINE 1FBF0..1FBF9 ; Nd # [10] SEGMENTED DIGIT ZERO..SEGMENTED DIGIT NINE -# Total code points: 770 +# Total code points: 780 # ================================================ diff --git a/unicodetools/data/ucd/dev/extracted/DerivedJoiningType.txt b/unicodetools/data/ucd/dev/extracted/DerivedJoiningType.txt index 9e6aa70d0..6f97ef821 100644 --- a/unicodetools/data/ucd/dev/extracted/DerivedJoiningType.txt +++ b/unicodetools/data/ucd/dev/extracted/DerivedJoiningType.txt @@ -1,5 +1,5 @@ # DerivedJoiningType-17.0.0.txt -# Date: 2025-06-30, 06:20:20 GMT +# Date: 2025-07-23, 01:37:06 GMT # © 2025 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. # For terms of use and license, see https://www.unicode.org/terms_of_use.html @@ -550,6 +550,8 @@ FFF9..FFFB ; T # Cf [3] INTERLINEAR ANNOTATION ANCHOR..INTERLINEAR ANNOTATI 1612D..1612F ; T # Mn [3] GURUNG KHEMA SIGN ANUSVARA..GURUNG KHEMA SIGN THOLHOMA 16AF0..16AF4 ; T # Mn [5] BASSA VAH COMBINING HIGH TONE..BASSA VAH COMBINING HIGH-LOW TONE 16B30..16B36 ; T # Mn [7] PAHAWH HMONG MARK CIM TUB..PAHAWH HMONG MARK CIM TAUM +16D98 ; T # Mn CHISOI SIGN ANUSVARA +16D9D ; T # Mn CHISOI SIGN SISO 16F4F ; T # Mn MIAO SIGN CONSONANT MODIFIER BAR 16F8F..16F92 ; T # Mn [4] MIAO TONE RIGHT..MIAO TONE BELOW 16FE4 ; T # Mn KHITAN SMALL SCRIPT FILLER @@ -591,6 +593,6 @@ E0001 ; T # Cf LANGUAGE TAG E0020..E007F ; T # Cf [96] TAG SPACE..CANCEL TAG E0100..E01EF ; T # Mn [240] VARIATION SELECTOR-17..VARIATION SELECTOR-256 -# Total code points: 2224 +# Total code points: 2226 # EOF diff --git a/unicodetools/data/ucd/dev/extracted/DerivedLineBreak.txt b/unicodetools/data/ucd/dev/extracted/DerivedLineBreak.txt index 4fb501c97..7e8219b11 100644 --- a/unicodetools/data/ucd/dev/extracted/DerivedLineBreak.txt +++ b/unicodetools/data/ucd/dev/extracted/DerivedLineBreak.txt @@ -1,5 +1,5 @@ # DerivedLineBreak-17.0.0.txt -# Date: 2025-06-30, 06:20:21 GMT +# Date: 2025-07-23, 01:37:06 GMT # © 2025 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. # For terms of use and license, see https://www.unicode.org/terms_of_use.html @@ -70,8 +70,8 @@ E000..F8FF ; XX # Co [6400] .. F0000..FFFFD ; XX # Co [65534] .. 100000..10FFFD; XX # Co [65534] .. -# The above property value applies to 757182 code points not listed here. -# Total code points: 894650 +# The above property value applies to 757142 code points not listed here. +# Total code points: 894610 # ================================================ @@ -551,6 +551,7 @@ ABF0..ABF9 ; NU # Nd [10] MEETEI MAYEK DIGIT ZERO..MEETEI MAYEK DIGIT NINE 16AC0..16AC9 ; NU # Nd [10] TANGSA DIGIT ZERO..TANGSA DIGIT NINE 16B50..16B59 ; NU # Nd [10] PAHAWH HMONG DIGIT ZERO..PAHAWH HMONG DIGIT NINE 16D70..16D79 ; NU # Nd [10] KIRAT RAI DIGIT ZERO..KIRAT RAI DIGIT NINE +16DA0..16DA9 ; NU # Nd [10] CHISOI DIGIT ZERO..CHISOI DIGIT NINE 1CCF0..1CCF9 ; NU # Nd [10] OUTLINED DIGIT ZERO..OUTLINED DIGIT NINE 1D7CE..1D7FF ; NU # Nd [50] MATHEMATICAL BOLD DIGIT ZERO..MATHEMATICAL MONOSPACE DIGIT NINE 1E140..1E149 ; NU # Nd [10] NYIAKENG PUACHUE HMONG DIGIT ZERO..NYIAKENG PUACHUE HMONG DIGIT NINE @@ -560,7 +561,7 @@ ABF0..ABF9 ; NU # Nd [10] MEETEI MAYEK DIGIT ZERO..MEETEI MAYEK DIGIT NINE 1E950..1E959 ; NU # Nd [10] ADLAM DIGIT ZERO..ADLAM DIGIT NINE 1FBF0..1FBF9 ; NU # Nd [10] SEGMENTED DIGIT ZERO..SEGMENTED DIGIT NINE -# Total code points: 705 +# Total code points: 715 # ================================================ @@ -1447,6 +1448,8 @@ FFED..FFEE ; AL # So [2] HALFWIDTH BLACK SQUARE..HALFWIDTH WHITE CIRCLE 16D43..16D6A ; AL # Lo [40] KIRAT RAI LETTER A..KIRAT RAI VOWEL SIGN AU 16D6B..16D6C ; AL # Lm [2] KIRAT RAI SIGN VIRAMA..KIRAT RAI SIGN SAAT 16D6D ; AL # Po KIRAT RAI SIGN YUPI +16D80..16D97 ; AL # Lo [24] CHISOI LETTER A..CHISOI LETTER PA +16D99..16D9C ; AL # Lo [4] CHISOI LETTER YA..CHISOI LETTER JARAHA 16E40..16E7F ; AL # L& [64] MEDEFAIDRIN CAPITAL LETTER M..MEDEFAIDRIN SMALL LETTER Y 16E80..16E96 ; AL # No [23] MEDEFAIDRIN DIGIT ZERO..MEDEFAIDRIN DIGIT THREE ALTERNATE FORM 16E99..16E9A ; AL # Po [2] MEDEFAIDRIN SYMBOL AIVA..MEDEFAIDRIN EXCLAMATION OH @@ -1638,7 +1641,7 @@ FFED..FFEE ; AL # So [2] HALFWIDTH BLACK SQUARE..HALFWIDTH WHITE CIRCLE 1FB94..1FBEF ; AL # So [92] LEFT HALF INVERSE MEDIUM SHADE AND RIGHT HALF BLOCK..TOP LEFT JUSTIFIED LOWER RIGHT QUARTER BLACK CIRCLE 1FBFA ; AL # So ALARM BELL SYMBOL -# Total code points: 26955 +# Total code points: 26983 # ================================================ @@ -2381,6 +2384,8 @@ FFF9..FFFB ; CM # Cf [3] INTERLINEAR ANNOTATION ANCHOR..INTERLINEAR ANNOTAT 1612D..1612F ; CM # Mn [3] GURUNG KHEMA SIGN ANUSVARA..GURUNG KHEMA SIGN THOLHOMA 16AF0..16AF4 ; CM # Mn [5] BASSA VAH COMBINING HIGH TONE..BASSA VAH COMBINING HIGH-LOW TONE 16B30..16B36 ; CM # Mn [7] PAHAWH HMONG MARK CIM TUB..PAHAWH HMONG MARK CIM TAUM +16D98 ; CM # Mn CHISOI SIGN ANUSVARA +16D9D ; CM # Mn CHISOI SIGN SISO 16F4F ; CM # Mn MIAO SIGN CONSONANT MODIFIER BAR 16F51..16F87 ; CM # Mc [55] MIAO SIGN ASPIRATION..MIAO VOWEL SIGN UI 16F8F..16F92 ; CM # Mn [4] MIAO TONE RIGHT..MIAO TONE BELOW @@ -2424,7 +2429,7 @@ E0001 ; CM # Cf LANGUAGE TAG E0020..E007F ; CM # Cf [96] TAG SPACE..CANCEL TAG E0100..E01EF ; CM # Mn [240] VARIATION SELECTOR-17..VARIATION SELECTOR-256 -# Total code points: 2512 +# Total code points: 2514 # ================================================ diff --git a/unicodetools/data/ucd/dev/extracted/DerivedName.txt b/unicodetools/data/ucd/dev/extracted/DerivedName.txt index e1b94d582..1c5e1d678 100644 --- a/unicodetools/data/ucd/dev/extracted/DerivedName.txt +++ b/unicodetools/data/ucd/dev/extracted/DerivedName.txt @@ -1,5 +1,5 @@ # DerivedName-17.0.0.txt -# Date: 2025-06-30, 06:20:21 GMT +# Date: 2025-07-23, 01:37:06 GMT # © 2025 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. # For terms of use and license, see https://www.unicode.org/terms_of_use.html @@ -36868,6 +36868,46 @@ FFFD ; REPLACEMENT CHARACTER 16D77 ; KIRAT RAI DIGIT SEVEN 16D78 ; KIRAT RAI DIGIT EIGHT 16D79 ; KIRAT RAI DIGIT NINE +16D80 ; CHISOI LETTER A +16D81 ; CHISOI LETTER BA +16D82 ; CHISOI LETTER AI +16D83 ; CHISOI LETTER AA +16D84 ; CHISOI LETTER GA +16D85 ; CHISOI LETTER TA +16D86 ; CHISOI LETTER E +16D87 ; CHISOI LETTER SA +16D88 ; CHISOI LETTER NA +16D89 ; CHISOI LETTER I +16D8A ; CHISOI LETTER KA +16D8B ; CHISOI LETTER RA +16D8C ; CHISOI LETTER MA +16D8D ; CHISOI LETTER HA +16D8E ; CHISOI LETTER RRA +16D8F ; CHISOI LETTER U +16D90 ; CHISOI LETTER DA +16D91 ; CHISOI LETTER LA +16D92 ; CHISOI LETTER O +16D93 ; CHISOI LETTER NYA +16D94 ; CHISOI LETTER NGA +16D95 ; CHISOI LETTER CA +16D96 ; CHISOI LETTER JA +16D97 ; CHISOI LETTER PA +16D98 ; CHISOI SIGN ANUSVARA +16D99 ; CHISOI LETTER YA +16D9A ; CHISOI LETTER DDA +16D9B ; CHISOI LETTER TTA +16D9C ; CHISOI LETTER JARAHA +16D9D ; CHISOI SIGN SISO +16DA0 ; CHISOI DIGIT ZERO +16DA1 ; CHISOI DIGIT ONE +16DA2 ; CHISOI DIGIT TWO +16DA3 ; CHISOI DIGIT THREE +16DA4 ; CHISOI DIGIT FOUR +16DA5 ; CHISOI DIGIT FIVE +16DA6 ; CHISOI DIGIT SIX +16DA7 ; CHISOI DIGIT SEVEN +16DA8 ; CHISOI DIGIT EIGHT +16DA9 ; CHISOI DIGIT NINE 16E40 ; MEDEFAIDRIN CAPITAL LETTER M 16E41 ; MEDEFAIDRIN CAPITAL LETTER S 16E42 ; MEDEFAIDRIN CAPITAL LETTER V @@ -45824,6 +45864,6 @@ E01ED ; VARIATION SELECTOR-254 E01EE ; VARIATION SELECTOR-255 E01EF ; VARIATION SELECTOR-256 -# Total code points: 159802 +# Total code points: 159842 # EOF diff --git a/unicodetools/data/ucd/dev/extracted/DerivedNumericType.txt b/unicodetools/data/ucd/dev/extracted/DerivedNumericType.txt index cc6eb00ad..fb22d8cde 100644 --- a/unicodetools/data/ucd/dev/extracted/DerivedNumericType.txt +++ b/unicodetools/data/ucd/dev/extracted/DerivedNumericType.txt @@ -1,5 +1,5 @@ # DerivedNumericType-17.0.0.txt -# Date: 2025-06-30, 06:20:22 GMT +# Date: 2025-07-23, 01:37:07 GMT # © 2025 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. # For terms of use and license, see https://www.unicode.org/terms_of_use.html @@ -293,6 +293,7 @@ FF10..FF19 ; Decimal # Nd [10] FULLWIDTH DIGIT ZERO..FULLWIDTH DIGIT NINE 16AC0..16AC9 ; Decimal # Nd [10] TANGSA DIGIT ZERO..TANGSA DIGIT NINE 16B50..16B59 ; Decimal # Nd [10] PAHAWH HMONG DIGIT ZERO..PAHAWH HMONG DIGIT NINE 16D70..16D79 ; Decimal # Nd [10] KIRAT RAI DIGIT ZERO..KIRAT RAI DIGIT NINE +16DA0..16DA9 ; Decimal # Nd [10] CHISOI DIGIT ZERO..CHISOI DIGIT NINE 1CCF0..1CCF9 ; Decimal # Nd [10] OUTLINED DIGIT ZERO..OUTLINED DIGIT NINE 1D7CE..1D7FF ; Decimal # Nd [50] MATHEMATICAL BOLD DIGIT ZERO..MATHEMATICAL MONOSPACE DIGIT NINE 1E140..1E149 ; Decimal # Nd [10] NYIAKENG PUACHUE HMONG DIGIT ZERO..NYIAKENG PUACHUE HMONG DIGIT NINE @@ -302,6 +303,6 @@ FF10..FF19 ; Decimal # Nd [10] FULLWIDTH DIGIT ZERO..FULLWIDTH DIGIT NINE 1E950..1E959 ; Decimal # Nd [10] ADLAM DIGIT ZERO..ADLAM DIGIT NINE 1FBF0..1FBF9 ; Decimal # Nd [10] SEGMENTED DIGIT ZERO..SEGMENTED DIGIT NINE -# Total code points: 770 +# Total code points: 780 # EOF diff --git a/unicodetools/data/ucd/dev/extracted/DerivedNumericValues.txt b/unicodetools/data/ucd/dev/extracted/DerivedNumericValues.txt index 8613d3585..4df8badc0 100644 --- a/unicodetools/data/ucd/dev/extracted/DerivedNumericValues.txt +++ b/unicodetools/data/ucd/dev/extracted/DerivedNumericValues.txt @@ -1,5 +1,5 @@ # DerivedNumericValues-17.0.0.txt -# Date: 2025-06-30, 06:20:22 GMT +# Date: 2025-07-23, 01:37:08 GMT # © 2025 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. # For terms of use and license, see https://www.unicode.org/terms_of_use.html @@ -117,6 +117,7 @@ FF10 ; 0.0 ; ; 0 # Nd FULLWIDTH DIGIT ZERO 16AC0 ; 0.0 ; ; 0 # Nd TANGSA DIGIT ZERO 16B50 ; 0.0 ; ; 0 # Nd PAHAWH HMONG DIGIT ZERO 16D70 ; 0.0 ; ; 0 # Nd KIRAT RAI DIGIT ZERO +16DA0 ; 0.0 ; ; 0 # Nd CHISOI DIGIT ZERO 16E80 ; 0.0 ; ; 0 # No MEDEFAIDRIN DIGIT ZERO 1CCF0 ; 0.0 ; ; 0 # Nd OUTLINED DIGIT ZERO 1D2C0 ; 0.0 ; ; 0 # No KAKTOVIK NUMERAL ZERO @@ -135,7 +136,7 @@ FF10 ; 0.0 ; ; 0 # Nd FULLWIDTH DIGIT ZERO 1F10B..1F10C ; 0.0 ; ; 0 # No [2] DINGBAT CIRCLED SANS-SERIF DIGIT ZERO..DINGBAT NEGATIVE CIRCLED SANS-SERIF DIGIT ZERO 1FBF0 ; 0.0 ; ; 0 # Nd SEGMENTED DIGIT ZERO -# Total code points: 97 +# Total code points: 98 # ================================================ @@ -548,6 +549,7 @@ FF11 ; 1.0 ; ; 1 # Nd FULLWIDTH DIGIT ONE 16AC1 ; 1.0 ; ; 1 # Nd TANGSA DIGIT ONE 16B51 ; 1.0 ; ; 1 # Nd PAHAWH HMONG DIGIT ONE 16D71 ; 1.0 ; ; 1 # Nd KIRAT RAI DIGIT ONE +16DA1 ; 1.0 ; ; 1 # Nd CHISOI DIGIT ONE 16E81 ; 1.0 ; ; 1 # No MEDEFAIDRIN DIGIT ONE 16E94 ; 1.0 ; ; 1 # No MEDEFAIDRIN DIGIT ONE ALTERNATE FORM 16FF4 ; 1.0 ; ; 1 # Nl YANGQIN SIGN SLOW ONE BEAT @@ -576,7 +578,7 @@ FF11 ; 1.0 ; ; 1 # Nd FULLWIDTH DIGIT ONE 1FBF1 ; 1.0 ; ; 1 # Nd SEGMENTED DIGIT ONE 2092A ; 1.0 ; ; 1 # Lo CJK UNIFIED IDEOGRAPH-2092A -# Total code points: 158 +# Total code points: 159 # ================================================ @@ -715,6 +717,7 @@ FF12 ; 2.0 ; ; 2 # Nd FULLWIDTH DIGIT TWO 16AC2 ; 2.0 ; ; 2 # Nd TANGSA DIGIT TWO 16B52 ; 2.0 ; ; 2 # Nd PAHAWH HMONG DIGIT TWO 16D72 ; 2.0 ; ; 2 # Nd KIRAT RAI DIGIT TWO +16DA2 ; 2.0 ; ; 2 # Nd CHISOI DIGIT TWO 16E82 ; 2.0 ; ; 2 # No MEDEFAIDRIN DIGIT TWO 16E95 ; 2.0 ; ; 2 # No MEDEFAIDRIN DIGIT TWO ALTERNATE FORM 16FF6 ; 2.0 ; ; 2 # Nl YANGQIN SIGN SLOW TWO BEATS @@ -743,7 +746,7 @@ FF12 ; 2.0 ; ; 2 # Nd FULLWIDTH DIGIT TWO 1FBF2 ; 2.0 ; ; 2 # Nd SEGMENTED DIGIT TWO 22390 ; 2.0 ; ; 2 # Lo CJK UNIFIED IDEOGRAPH-22390 -# Total code points: 158 +# Total code points: 159 # ================================================ @@ -872,6 +875,7 @@ FF13 ; 3.0 ; ; 3 # Nd FULLWIDTH DIGIT THREE 16AC3 ; 3.0 ; ; 3 # Nd TANGSA DIGIT THREE 16B53 ; 3.0 ; ; 3 # Nd PAHAWH HMONG DIGIT THREE 16D73 ; 3.0 ; ; 3 # Nd KIRAT RAI DIGIT THREE +16DA3 ; 3.0 ; ; 3 # Nd CHISOI DIGIT THREE 16E83 ; 3.0 ; ; 3 # No MEDEFAIDRIN DIGIT THREE 16E96 ; 3.0 ; ; 3 # No MEDEFAIDRIN DIGIT THREE ALTERNATE FORM 1CCF3 ; 3.0 ; ; 3 # Nd OUTLINED DIGIT THREE @@ -901,7 +905,7 @@ FF13 ; 3.0 ; ; 3 # Nd FULLWIDTH DIGIT THREE 22998 ; 3.0 ; ; 3 # Lo CJK UNIFIED IDEOGRAPH-22998 23B1B ; 3.0 ; ; 3 # Lo CJK UNIFIED IDEOGRAPH-23B1B -# Total code points: 154 +# Total code points: 155 # ================================================ @@ -1024,6 +1028,7 @@ FF14 ; 4.0 ; ; 4 # Nd FULLWIDTH DIGIT FOUR 16AC4 ; 4.0 ; ; 4 # Nd TANGSA DIGIT FOUR 16B54 ; 4.0 ; ; 4 # Nd PAHAWH HMONG DIGIT FOUR 16D74 ; 4.0 ; ; 4 # Nd KIRAT RAI DIGIT FOUR +16DA4 ; 4.0 ; ; 4 # Nd CHISOI DIGIT FOUR 16E84 ; 4.0 ; ; 4 # No MEDEFAIDRIN DIGIT FOUR 1CCF4 ; 4.0 ; ; 4 # Nd OUTLINED DIGIT FOUR 1D2C4 ; 4.0 ; ; 4 # No KAKTOVIK NUMERAL FOUR @@ -1051,7 +1056,7 @@ FF14 ; 4.0 ; ; 4 # Nd FULLWIDTH DIGIT FOUR 200E2 ; 4.0 ; ; 4 # Lo CJK UNIFIED IDEOGRAPH-200E2 2626D ; 4.0 ; ; 4 # Lo CJK UNIFIED IDEOGRAPH-2626D -# Total code points: 144 +# Total code points: 145 # ================================================ @@ -1177,6 +1182,7 @@ FF15 ; 5.0 ; ; 5 # Nd FULLWIDTH DIGIT FIVE 16AC5 ; 5.0 ; ; 5 # Nd TANGSA DIGIT FIVE 16B55 ; 5.0 ; ; 5 # Nd PAHAWH HMONG DIGIT FIVE 16D75 ; 5.0 ; ; 5 # Nd KIRAT RAI DIGIT FIVE +16DA5 ; 5.0 ; ; 5 # Nd CHISOI DIGIT FIVE 16E85 ; 5.0 ; ; 5 # No MEDEFAIDRIN DIGIT FIVE 1CCF5 ; 5.0 ; ; 5 # Nd OUTLINED DIGIT FIVE 1D2C5 ; 5.0 ; ; 5 # No KAKTOVIK NUMERAL FIVE @@ -1203,7 +1209,7 @@ FF15 ; 5.0 ; ; 5 # Nd FULLWIDTH DIGIT FIVE 1FBF5 ; 5.0 ; ; 5 # Nd SEGMENTED DIGIT FIVE 20121 ; 5.0 ; ; 5 # Lo CJK UNIFIED IDEOGRAPH-20121 -# Total code points: 142 +# Total code points: 143 # ================================================ @@ -1316,6 +1322,7 @@ FF16 ; 6.0 ; ; 6 # Nd FULLWIDTH DIGIT SIX 16AC6 ; 6.0 ; ; 6 # Nd TANGSA DIGIT SIX 16B56 ; 6.0 ; ; 6 # Nd PAHAWH HMONG DIGIT SIX 16D76 ; 6.0 ; ; 6 # Nd KIRAT RAI DIGIT SIX +16DA6 ; 6.0 ; ; 6 # Nd CHISOI DIGIT SIX 16E86 ; 6.0 ; ; 6 # No MEDEFAIDRIN DIGIT SIX 1CCF6 ; 6.0 ; ; 6 # Nd OUTLINED DIGIT SIX 1D2C6 ; 6.0 ; ; 6 # No KAKTOVIK NUMERAL SIX @@ -1340,7 +1347,7 @@ FF16 ; 6.0 ; ; 6 # Nd FULLWIDTH DIGIT SIX 1FBF6 ; 6.0 ; ; 6 # Nd SEGMENTED DIGIT SIX 20AEA ; 6.0 ; ; 6 # Lo CJK UNIFIED IDEOGRAPH-20AEA -# Total code points: 126 +# Total code points: 127 # ================================================ @@ -1451,6 +1458,7 @@ FF17 ; 7.0 ; ; 7 # Nd FULLWIDTH DIGIT SEVEN 16AC7 ; 7.0 ; ; 7 # Nd TANGSA DIGIT SEVEN 16B57 ; 7.0 ; ; 7 # Nd PAHAWH HMONG DIGIT SEVEN 16D77 ; 7.0 ; ; 7 # Nd KIRAT RAI DIGIT SEVEN +16DA7 ; 7.0 ; ; 7 # Nd CHISOI DIGIT SEVEN 16E87 ; 7.0 ; ; 7 # No MEDEFAIDRIN DIGIT SEVEN 1CCF7 ; 7.0 ; ; 7 # Nd OUTLINED DIGIT SEVEN 1D2C7 ; 7.0 ; ; 7 # No KAKTOVIK NUMERAL SEVEN @@ -1475,7 +1483,7 @@ FF17 ; 7.0 ; ; 7 # Nd FULLWIDTH DIGIT SEVEN 1FBF7 ; 7.0 ; ; 7 # Nd SEGMENTED DIGIT SEVEN 20001 ; 7.0 ; ; 7 # Lo CJK UNIFIED IDEOGRAPH-20001 -# Total code points: 126 +# Total code points: 127 # ================================================ @@ -1583,6 +1591,7 @@ FF18 ; 8.0 ; ; 8 # Nd FULLWIDTH DIGIT EIGHT 16AC8 ; 8.0 ; ; 8 # Nd TANGSA DIGIT EIGHT 16B58 ; 8.0 ; ; 8 # Nd PAHAWH HMONG DIGIT EIGHT 16D78 ; 8.0 ; ; 8 # Nd KIRAT RAI DIGIT EIGHT +16DA8 ; 8.0 ; ; 8 # Nd CHISOI DIGIT EIGHT 16E88 ; 8.0 ; ; 8 # No MEDEFAIDRIN DIGIT EIGHT 1CCF8 ; 8.0 ; ; 8 # Nd OUTLINED DIGIT EIGHT 1D2C8 ; 8.0 ; ; 8 # No KAKTOVIK NUMERAL EIGHT @@ -1606,7 +1615,7 @@ FF18 ; 8.0 ; ; 8 # Nd FULLWIDTH DIGIT EIGHT 1F109 ; 8.0 ; ; 8 # No DIGIT EIGHT COMMA 1FBF8 ; 8.0 ; ; 8 # Nd SEGMENTED DIGIT EIGHT -# Total code points: 121 +# Total code points: 122 # ================================================ @@ -1717,6 +1726,7 @@ FF19 ; 9.0 ; ; 9 # Nd FULLWIDTH DIGIT NINE 16AC9 ; 9.0 ; ; 9 # Nd TANGSA DIGIT NINE 16B59 ; 9.0 ; ; 9 # Nd PAHAWH HMONG DIGIT NINE 16D79 ; 9.0 ; ; 9 # Nd KIRAT RAI DIGIT NINE +16DA9 ; 9.0 ; ; 9 # Nd CHISOI DIGIT NINE 16E89 ; 9.0 ; ; 9 # No MEDEFAIDRIN DIGIT NINE 1CCF9 ; 9.0 ; ; 9 # Nd OUTLINED DIGIT NINE 1D2C9 ; 9.0 ; ; 9 # No KAKTOVIK NUMERAL NINE @@ -1741,7 +1751,7 @@ FF19 ; 9.0 ; ; 9 # Nd FULLWIDTH DIGIT NINE 1FBF9 ; 9.0 ; ; 9 # Nd SEGMENTED DIGIT NINE 2F890 ; 9.0 ; ; 9 # Lo CJK COMPATIBILITY IDEOGRAPH-2F890 -# Total code points: 127 +# Total code points: 128 # ================================================ diff --git a/unicodetools/src/main/java/org/unicode/props/UcdPropertyValues.java b/unicodetools/src/main/java/org/unicode/props/UcdPropertyValues.java index 70e081b3e..cbbd126d9 100644 --- a/unicodetools/src/main/java/org/unicode/props/UcdPropertyValues.java +++ b/unicodetools/src/main/java/org/unicode/props/UcdPropertyValues.java @@ -222,6 +222,7 @@ public enum Block_Values implements Named { Cherokee("Cherokee"), Cherokee_Supplement("Cherokee_Sup"), Chess_Symbols("Chess_Symbols"), + Chisoi("Chisoi"), Chorasmian("Chorasmian"), CJK_Unified_Ideographs("CJK"), CJK_Compatibility("CJK_Compat"), @@ -2073,6 +2074,7 @@ public enum Script_Values implements Named { Carian("Cari"), Cham("Cham"), Cherokee("Cher"), + Chisoi("Chis"), Chorasmian("Chrs"), Coptic("Copt", "Qaac"), Cypro_Minoan("Cpmn"), diff --git a/unicodetools/src/main/resources/org/unicode/text/UCD/ShortBlockNames.txt b/unicodetools/src/main/resources/org/unicode/text/UCD/ShortBlockNames.txt index 9b03e59ed..d5da74c45 100644 --- a/unicodetools/src/main/resources/org/unicode/text/UCD/ShortBlockNames.txt +++ b/unicodetools/src/main/resources/org/unicode/text/UCD/ShortBlockNames.txt @@ -43,6 +43,7 @@ Cham ; Cham Cherokee ; Cherokee Cherokee_Sup ; Cherokee_Supplement Chess_Symbols ; Chess_Symbols +Chisoi ; Chisoi Chorasmian ; Chorasmian CJK_Compat ; CJK_Compatibility CJK_Compat_Forms ; CJK_Compatibility_Forms From 0624daaeda80be1a8dde88bed23f294351c0c5a8 Mon Sep 17 00:00:00 2001 From: Robin Leroy Date: Wed, 23 Jul 2025 03:43:06 +0200 Subject: [PATCH 2/3] UTC-184-C25 Change the name of code point U+16D82 approved by 181-C61 from CHISOI LETTER AI to CHISOI LETTER AAI --- unicodetools/data/ucd/dev/UnicodeData.txt | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/unicodetools/data/ucd/dev/UnicodeData.txt b/unicodetools/data/ucd/dev/UnicodeData.txt index 1c274ab48..5e4bb9ed2 100644 --- a/unicodetools/data/ucd/dev/UnicodeData.txt +++ b/unicodetools/data/ucd/dev/UnicodeData.txt @@ -30199,7 +30199,7 @@ FFFD;REPLACEMENT CHARACTER;So;0;ON;;;;;N;;;;; 16D79;KIRAT RAI DIGIT NINE;Nd;0;L;;9;9;9;N;;;;; 16D80;CHISOI LETTER A;Lo;0;L;;;;;N;;;;; 16D81;CHISOI LETTER BA;Lo;0;L;;;;;N;;;;; -16D82;CHISOI LETTER AI;Lo;0;L;;;;;N;;;;; +16D82;CHISOI LETTER AAI;Lo;0;L;;;;;N;;;;; 16D83;CHISOI LETTER AA;Lo;0;L;;;;;N;;;;; 16D84;CHISOI LETTER GA;Lo;0;L;;;;;N;;;;; 16D85;CHISOI LETTER TA;Lo;0;L;;;;;N;;;;; From 57792445637082631c4f39e6ec611900ffdb276e Mon Sep 17 00:00:00 2001 From: Robin Leroy Date: Wed, 23 Jul 2025 03:51:54 +0200 Subject: [PATCH 3/3] Regenerate UCD --- unicodetools/data/ucd/dev/IndicSyllabicCategory.txt | 4 ++-- unicodetools/data/ucd/dev/extracted/DerivedName.txt | 4 ++-- 2 files changed, 4 insertions(+), 4 deletions(-) diff --git a/unicodetools/data/ucd/dev/IndicSyllabicCategory.txt b/unicodetools/data/ucd/dev/IndicSyllabicCategory.txt index e39223702..57fc3ba6d 100644 --- a/unicodetools/data/ucd/dev/IndicSyllabicCategory.txt +++ b/unicodetools/data/ucd/dev/IndicSyllabicCategory.txt @@ -1,5 +1,5 @@ # IndicSyllabicCategory-17.0.0.txt -# Date: 2025-07-23, 01:37:10 GMT +# Date: 2025-07-23, 01:44:19 GMT # © 2025 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. # For terms of use and license, see https://www.unicode.org/terms_of_use.html @@ -774,7 +774,7 @@ A922..A925 ; Vowel # Lo [4] KAYAH LI LETTER A..KAYAH LI LETTER OO A926..A92A ; Vowel # Mn [5] KAYAH LI VOWEL UE..KAYAH LI VOWEL O 11150..11154 ; Vowel # Lo [5] MAHAJANI LETTER A..MAHAJANI LETTER O 16D80 ; Vowel # Lo CHISOI LETTER A -16D82..16D83 ; Vowel # Lo [2] CHISOI LETTER AI..CHISOI LETTER AA +16D82..16D83 ; Vowel # Lo [2] CHISOI LETTER AAI..CHISOI LETTER AA 16D86 ; Vowel # Lo CHISOI LETTER E 16D89 ; Vowel # Lo CHISOI LETTER I 16D8F ; Vowel # Lo CHISOI LETTER U diff --git a/unicodetools/data/ucd/dev/extracted/DerivedName.txt b/unicodetools/data/ucd/dev/extracted/DerivedName.txt index 1c5e1d678..e4f7e28eb 100644 --- a/unicodetools/data/ucd/dev/extracted/DerivedName.txt +++ b/unicodetools/data/ucd/dev/extracted/DerivedName.txt @@ -1,5 +1,5 @@ # DerivedName-17.0.0.txt -# Date: 2025-07-23, 01:37:06 GMT +# Date: 2025-07-23, 01:44:14 GMT # © 2025 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. # For terms of use and license, see https://www.unicode.org/terms_of_use.html @@ -36870,7 +36870,7 @@ FFFD ; REPLACEMENT CHARACTER 16D79 ; KIRAT RAI DIGIT NINE 16D80 ; CHISOI LETTER A 16D81 ; CHISOI LETTER BA -16D82 ; CHISOI LETTER AI +16D82 ; CHISOI LETTER AAI 16D83 ; CHISOI LETTER AA 16D84 ; CHISOI LETTER GA 16D85 ; CHISOI LETTER TA