diff --git a/icu4c/source/common/unicode/uchar.h b/icu4c/source/common/unicode/uchar.h index 2d2511e6654..3c2fc9ac2ad 100644 --- a/icu4c/source/common/unicode/uchar.h +++ b/icu4c/source/common/unicode/uchar.h @@ -1885,6 +1885,21 @@ enum UBlockCode { /** @stable ICU 70 */ UBLOCK_ZNAMENNY_MUSICAL_NOTATION = 320, /*[1CF00]*/ + /** @stable ICU 72 */ + UBLOCK_ARABIC_EXTENDED_C = 321, /*[10EC0]*/ + /** @stable ICU 72 */ + UBLOCK_CJK_UNIFIED_IDEOGRAPHS_EXTENSION_H = 322, /*[31350]*/ + /** @stable ICU 72 */ + UBLOCK_CYRILLIC_EXTENDED_D = 323, /*[1E030]*/ + /** @stable ICU 72 */ + UBLOCK_DEVANAGARI_EXTENDED_A = 324, /*[11B00]*/ + /** @stable ICU 72 */ + UBLOCK_KAKTOVIK_NUMERALS = 325, /*[1D2C0]*/ + /** @stable ICU 72 */ + UBLOCK_KAWI = 326, /*[11F00]*/ + /** @stable ICU 72 */ + UBLOCK_NAG_MUNDARI = 327, /*[1E4D0]*/ + #ifndef U_HIDE_DEPRECATED_API /** * One more than the highest normal UBlockCode value. @@ -1892,7 +1907,7 @@ enum UBlockCode { * * @deprecated ICU 58 The numeric value may change over time, see ICU ticket #12420. */ - UBLOCK_COUNT = 321, + UBLOCK_COUNT = 328, #endif // U_HIDE_DEPRECATED_API /** @stable ICU 2.0 */ diff --git a/icu4c/source/common/unicode/uscript.h b/icu4c/source/common/unicode/uscript.h index 6cb15328085..dc97ab2ba56 100644 --- a/icu4c/source/common/unicode/uscript.h +++ b/icu4c/source/common/unicode/uscript.h @@ -495,6 +495,11 @@ typedef enum UScriptCode { /** @stable ICU 70 */ USCRIPT_VITHKUQI = 197,/* Vith */ + /** @stable ICU 72 */ + USCRIPT_KAWI = 198,/* Kawi */ + /** @stable ICU 72 */ + USCRIPT_NAG_MUNDARI = 199,/* Nagm */ + #ifndef U_HIDE_DEPRECATED_API /** * One more than the highest normal UScriptCode value. @@ -502,7 +507,7 @@ typedef enum UScriptCode { * * @deprecated ICU 58 The numeric value may change over time, see ICU ticket #12420. */ - USCRIPT_CODE_LIMIT = 198 + USCRIPT_CODE_LIMIT = 200 #endif // U_HIDE_DEPRECATED_API } UScriptCode; diff --git a/icu4c/source/common/uscript_props.cpp b/icu4c/source/common/uscript_props.cpp index 07bae251ea3..886acfafa88 100644 --- a/icu4c/source/common/uscript_props.cpp +++ b/icu4c/source/common/uscript_props.cpp @@ -242,6 +242,8 @@ const int32_t SCRIPT_PROPS[] = { 0x16ABC | EXCLUSION, // Tnsa 0x1E290 | EXCLUSION, // Toto 0x10582 | EXCLUSION | CASED, // Vith + 0x11F1B | EXCLUSION | LB_LETTERS, // Kawi + 0x1E4E6 | EXCLUSION, // Nagm // End copy-paste from parsescriptmetadata.py }; diff --git a/icu4c/source/data/unidata/CaseFolding.txt b/icu4c/source/data/unidata/CaseFolding.txt index 932ace29e6d..65aa0fcd6b3 100644 --- a/icu4c/source/data/unidata/CaseFolding.txt +++ b/icu4c/source/data/unidata/CaseFolding.txt @@ -1,11 +1,11 @@ -# CaseFolding-14.0.0.txt -# Date: 2021-03-08, 19:35:41 GMT -# © 2021 Unicode®, Inc. +# CaseFolding-15.0.0.txt +# Date: 2022-02-02, 23:35:35 GMT +# © 2022 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. -# For terms of use, see http://www.unicode.org/terms_of_use.html +# For terms of use, see https://www.unicode.org/terms_of_use.html # # Unicode Character Database -# For documentation, see http://www.unicode.org/reports/tr44/ +# For documentation, see https://www.unicode.org/reports/tr44/ # # Case Folding Properties # diff --git a/icu4c/source/data/unidata/DerivedCoreProperties.txt b/icu4c/source/data/unidata/DerivedCoreProperties.txt index 443d1a5dceb..e55b7f1ab49 100644 --- a/icu4c/source/data/unidata/DerivedCoreProperties.txt +++ b/icu4c/source/data/unidata/DerivedCoreProperties.txt @@ -1,11 +1,11 @@ -# DerivedCoreProperties-14.0.0.txt -# Date: 2021-08-12, 23:12:53 GMT -# © 2021 Unicode®, Inc. +# DerivedCoreProperties-15.0.0.txt +# Date: 2022-04-26, 23:14:31 GMT +# © 2022 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. -# For terms of use, see http://www.unicode.org/terms_of_use.html +# For terms of use, see https://www.unicode.org/terms_of_use.html # # Unicode Character Database -# For documentation, see http://www.unicode.org/reports/tr44/ +# For documentation, see https://www.unicode.org/reports/tr44/ # ================================================ @@ -497,6 +497,7 @@ FFE9..FFEC ; Math 0CE0..0CE1 ; Alphabetic 0CE2..0CE3 ; Alphabetic 0CF1..0CF2 ; Alphabetic +0CF3 ; Alphabetic 0D00..0D01 ; Alphabetic 0D02..0D03 ; Alphabetic 0D04..0D0C ; Alphabetic @@ -1089,6 +1090,8 @@ FFDA..FFDC ; Alphabetic 11234 ; Alphabetic 11237 ; Alphabetic 1123E ; Alphabetic +1123F..11240 ; Alphabetic +11241 ; Alphabetic 11280..11286 ; Alphabetic 11288 ; Alphabetic 1128A..1128D ; Alphabetic @@ -1243,12 +1246,22 @@ FFDA..FFDC ; Alphabetic 11EE0..11EF2 ; Alphabetic 11EF3..11EF4 ; Alphabetic 11EF5..11EF6 ; Alphabetic +11F00..11F01 ; Alphabetic +11F02 ; Alphabetic +11F03 ; Alphabetic +11F04..11F10 ; Alphabetic +11F12..11F33 ; Alphabetic +11F34..11F35 ; Alphabetic +11F36..11F3A ; Alphabetic +11F3E..11F3F ; Alphabetic +11F40 ; Alphabetic 11FB0 ; Alphabetic 12000..12399 ; Alphabetic 12400..1246E ; Alphabetic 12480..12543 ; Alphabetic 12F90..12FF0 ; Alphabetic -13000..1342E ; Alphabetic +13000..1342F ; Alphabetic +13441..13446 ; Alphabetic 14400..14646 ; Alphabetic 16800..16A38 ; Alphabetic 16A40..16A5E ; Alphabetic @@ -1275,7 +1288,9 @@ FFDA..FFDC ; Alphabetic 1AFF5..1AFFB ; Alphabetic 1AFFD..1AFFE ; Alphabetic 1B000..1B122 ; Alphabetic +1B132 ; Alphabetic 1B150..1B152 ; Alphabetic +1B155 ; Alphabetic 1B164..1B167 ; Alphabetic 1B170..1B2FB ; Alphabetic 1BC00..1BC6A ; Alphabetic @@ -1316,16 +1331,21 @@ FFDA..FFDC ; Alphabetic 1DF00..1DF09 ; Alphabetic 1DF0A ; Alphabetic 1DF0B..1DF1E ; Alphabetic +1DF25..1DF2A ; Alphabetic 1E000..1E006 ; Alphabetic 1E008..1E018 ; Alphabetic 1E01B..1E021 ; Alphabetic 1E023..1E024 ; Alphabetic 1E026..1E02A ; Alphabetic +1E030..1E06D ; Alphabetic +1E08F ; Alphabetic 1E100..1E12C ; Alphabetic 1E137..1E13D ; Alphabetic 1E14E ; Alphabetic 1E290..1E2AD ; Alphabetic 1E2C0..1E2EB ; Alphabetic +1E4D0..1E4EA ; Alphabetic +1E4EB ; Alphabetic 1E7E0..1E7E6 ; Alphabetic 1E7E8..1E7EB ; Alphabetic 1E7ED..1E7EE ; Alphabetic @@ -1371,14 +1391,15 @@ FFDA..FFDC ; Alphabetic 1F150..1F169 ; Alphabetic 1F170..1F189 ; Alphabetic 20000..2A6DF ; Alphabetic -2A700..2B738 ; Alphabetic +2A700..2B739 ; Alphabetic 2B740..2B81D ; Alphabetic 2B820..2CEA1 ; Alphabetic 2CEB0..2EBE0 ; Alphabetic 2F800..2FA1D ; Alphabetic 30000..3134A ; Alphabetic +31350..323AF ; Alphabetic -# Total code points: 133396 +# Total code points: 137760 # ================================================ @@ -2065,9 +2086,11 @@ FF41..FF5A ; Lowercase 1D7CB ; Lowercase 1DF00..1DF09 ; Lowercase 1DF0B..1DF1E ; Lowercase +1DF25..1DF2A ; Lowercase +1E030..1E06C ; Lowercase 1E922..1E943 ; Lowercase -# Total code points: 2471 +# Total code points: 2538 # ================================================ @@ -2899,12 +2922,14 @@ FF41..FF5A ; Cased 1D7C4..1D7CB ; Cased 1DF00..1DF09 ; Cased 1DF0B..1DF1E ; Cased +1DF25..1DF2A ; Cased +1E030..1E06C ; Cased 1E900..1E943 ; Cased 1F130..1F149 ; Cased 1F150..1F169 ; Cased 1F170..1F189 ; Cased -# Total code points: 4453 +# Total code points: 4520 # ================================================ @@ -3054,7 +3079,7 @@ FF41..FF5A ; Cased 0EB1 ; Case_Ignorable 0EB4..0EBC ; Case_Ignorable 0EC6 ; Case_Ignorable -0EC8..0ECD ; Case_Ignorable +0EC8..0ECE ; Case_Ignorable 0F18..0F19 ; Case_Ignorable 0F35 ; Case_Ignorable 0F37 ; Case_Ignorable @@ -3263,6 +3288,7 @@ FFF9..FFFB ; Case_Ignorable 10AE5..10AE6 ; Case_Ignorable 10D24..10D27 ; Case_Ignorable 10EAB..10EAC ; Case_Ignorable +10EFD..10EFF ; Case_Ignorable 10F46..10F50 ; Case_Ignorable 10F82..10F85 ; Case_Ignorable 11001 ; Case_Ignorable @@ -3287,6 +3313,7 @@ FFF9..FFFB ; Case_Ignorable 11234 ; Case_Ignorable 11236..11237 ; Case_Ignorable 1123E ; Case_Ignorable +11241 ; Case_Ignorable 112DF ; Case_Ignorable 112E3..112EA ; Case_Ignorable 11300..11301 ; Case_Ignorable @@ -3348,7 +3375,13 @@ FFF9..FFFB ; Case_Ignorable 11D95 ; Case_Ignorable 11D97 ; Case_Ignorable 11EF3..11EF4 ; Case_Ignorable -13430..13438 ; Case_Ignorable +11F00..11F01 ; Case_Ignorable +11F36..11F3A ; Case_Ignorable +11F40 ; Case_Ignorable +11F42 ; Case_Ignorable +13430..1343F ; Case_Ignorable +13440 ; Case_Ignorable +13447..13455 ; Case_Ignorable 16AF0..16AF4 ; Case_Ignorable 16B30..16B36 ; Case_Ignorable 16B40..16B43 ; Case_Ignorable @@ -3382,10 +3415,14 @@ FFF9..FFFB ; Case_Ignorable 1E01B..1E021 ; Case_Ignorable 1E023..1E024 ; Case_Ignorable 1E026..1E02A ; Case_Ignorable +1E030..1E06D ; Case_Ignorable +1E08F ; Case_Ignorable 1E130..1E136 ; Case_Ignorable 1E137..1E13D ; Case_Ignorable 1E2AE ; Case_Ignorable 1E2EC..1E2EF ; Case_Ignorable +1E4EB ; Case_Ignorable +1E4EC..1E4EF ; Case_Ignorable 1E8D0..1E8D6 ; Case_Ignorable 1E944..1E94A ; Case_Ignorable 1E94B ; Case_Ignorable @@ -3394,7 +3431,7 @@ E0001 ; Case_Ignorable E0020..E007F ; Case_Ignorable E0100..E01EF ; Case_Ignorable -# Total code points: 2602 +# Total code points: 2707 # ================================================ @@ -6617,6 +6654,7 @@ FFDA..FFDC ; ID_Start 111DC ; ID_Start 11200..11211 ; ID_Start 11213..1122B ; ID_Start +1123F..11240 ; ID_Start 11280..11286 ; ID_Start 11288 ; ID_Start 1128A..1128D ; ID_Start @@ -6679,12 +6717,16 @@ FFDA..FFDC ; ID_Start 11D6A..11D89 ; ID_Start 11D98 ; ID_Start 11EE0..11EF2 ; ID_Start +11F02 ; ID_Start +11F04..11F10 ; ID_Start +11F12..11F33 ; ID_Start 11FB0 ; ID_Start 12000..12399 ; ID_Start 12400..1246E ; ID_Start 12480..12543 ; ID_Start 12F90..12FF0 ; ID_Start -13000..1342E ; ID_Start +13000..1342F ; ID_Start +13441..13446 ; ID_Start 14400..14646 ; ID_Start 16800..16A38 ; ID_Start 16A40..16A5E ; ID_Start @@ -6707,7 +6749,9 @@ FFDA..FFDC ; ID_Start 1AFF5..1AFFB ; ID_Start 1AFFD..1AFFE ; ID_Start 1B000..1B122 ; ID_Start +1B132 ; ID_Start 1B150..1B152 ; ID_Start +1B155 ; ID_Start 1B164..1B167 ; ID_Start 1B170..1B2FB ; ID_Start 1BC00..1BC6A ; ID_Start @@ -6747,11 +6791,15 @@ FFDA..FFDC ; ID_Start 1DF00..1DF09 ; ID_Start 1DF0A ; ID_Start 1DF0B..1DF1E ; ID_Start +1DF25..1DF2A ; ID_Start +1E030..1E06D ; ID_Start 1E100..1E12C ; ID_Start 1E137..1E13D ; ID_Start 1E14E ; ID_Start 1E290..1E2AD ; ID_Start 1E2C0..1E2EB ; ID_Start +1E4D0..1E4EA ; ID_Start +1E4EB ; ID_Start 1E7E0..1E7E6 ; ID_Start 1E7E8..1E7EB ; ID_Start 1E7ED..1E7EE ; ID_Start @@ -6793,14 +6841,15 @@ FFDA..FFDC ; ID_Start 1EEA5..1EEA9 ; ID_Start 1EEAB..1EEBB ; ID_Start 20000..2A6DF ; ID_Start -2A700..2B738 ; ID_Start +2A700..2B739 ; ID_Start 2B740..2B81D ; ID_Start 2B820..2CEA1 ; ID_Start 2CEB0..2EBE0 ; ID_Start 2F800..2FA1D ; ID_Start 30000..3134A ; ID_Start +31350..323AF ; ID_Start -# Total code points: 131997 +# Total code points: 136345 # ================================================ @@ -7083,6 +7132,7 @@ FFDA..FFDC ; ID_Start 0CE2..0CE3 ; ID_Continue 0CE6..0CEF ; ID_Continue 0CF1..0CF2 ; ID_Continue +0CF3 ; ID_Continue 0D00..0D01 ; ID_Continue 0D02..0D03 ; ID_Continue 0D04..0D0C ; ID_Continue @@ -7136,7 +7186,7 @@ FFDA..FFDC ; ID_Start 0EBD ; ID_Continue 0EC0..0EC4 ; ID_Continue 0EC6 ; ID_Continue -0EC8..0ECD ; ID_Continue +0EC8..0ECE ; ID_Continue 0ED0..0ED9 ; ID_Continue 0EDC..0EDF ; ID_Continue 0F00 ; ID_Continue @@ -7719,6 +7769,7 @@ FFDA..FFDC ; ID_Continue 10E80..10EA9 ; ID_Continue 10EAB..10EAC ; ID_Continue 10EB0..10EB1 ; ID_Continue +10EFD..10EFF ; ID_Continue 10F00..10F1C ; ID_Continue 10F27 ; ID_Continue 10F30..10F45 ; ID_Continue @@ -7781,6 +7832,8 @@ FFDA..FFDC ; ID_Continue 11235 ; ID_Continue 11236..11237 ; ID_Continue 1123E ; ID_Continue +1123F..11240 ; ID_Continue +11241 ; ID_Continue 11280..11286 ; ID_Continue 11288 ; ID_Continue 1128A..1128D ; ID_Continue @@ -7963,12 +8016,27 @@ FFDA..FFDC ; ID_Continue 11EE0..11EF2 ; ID_Continue 11EF3..11EF4 ; ID_Continue 11EF5..11EF6 ; ID_Continue +11F00..11F01 ; ID_Continue +11F02 ; ID_Continue +11F03 ; ID_Continue +11F04..11F10 ; ID_Continue +11F12..11F33 ; ID_Continue +11F34..11F35 ; ID_Continue +11F36..11F3A ; ID_Continue +11F3E..11F3F ; ID_Continue +11F40 ; ID_Continue +11F41 ; ID_Continue +11F42 ; ID_Continue +11F50..11F59 ; ID_Continue 11FB0 ; ID_Continue 12000..12399 ; ID_Continue 12400..1246E ; ID_Continue 12480..12543 ; ID_Continue 12F90..12FF0 ; ID_Continue -13000..1342E ; ID_Continue +13000..1342F ; ID_Continue +13440 ; ID_Continue +13441..13446 ; ID_Continue +13447..13455 ; ID_Continue 14400..14646 ; ID_Continue 16800..16A38 ; ID_Continue 16A40..16A5E ; ID_Continue @@ -8001,7 +8069,9 @@ FFDA..FFDC ; ID_Continue 1AFF5..1AFFB ; ID_Continue 1AFFD..1AFFE ; ID_Continue 1B000..1B122 ; ID_Continue +1B132 ; ID_Continue 1B150..1B152 ; ID_Continue +1B155 ; ID_Continue 1B164..1B167 ; ID_Continue 1B170..1B2FB ; ID_Continue 1BC00..1BC6A ; ID_Continue @@ -8058,11 +8128,14 @@ FFDA..FFDC ; ID_Continue 1DF00..1DF09 ; ID_Continue 1DF0A ; ID_Continue 1DF0B..1DF1E ; ID_Continue +1DF25..1DF2A ; ID_Continue 1E000..1E006 ; ID_Continue 1E008..1E018 ; ID_Continue 1E01B..1E021 ; ID_Continue 1E023..1E024 ; ID_Continue 1E026..1E02A ; ID_Continue +1E030..1E06D ; ID_Continue +1E08F ; ID_Continue 1E100..1E12C ; ID_Continue 1E130..1E136 ; ID_Continue 1E137..1E13D ; ID_Continue @@ -8073,6 +8146,10 @@ FFDA..FFDC ; ID_Continue 1E2C0..1E2EB ; ID_Continue 1E2EC..1E2EF ; ID_Continue 1E2F0..1E2F9 ; ID_Continue +1E4D0..1E4EA ; ID_Continue +1E4EB ; ID_Continue +1E4EC..1E4EF ; ID_Continue +1E4F0..1E4F9 ; ID_Continue 1E7E0..1E7E6 ; ID_Continue 1E7E8..1E7EB ; ID_Continue 1E7ED..1E7EE ; ID_Continue @@ -8118,15 +8195,16 @@ FFDA..FFDC ; ID_Continue 1EEAB..1EEBB ; ID_Continue 1FBF0..1FBF9 ; ID_Continue 20000..2A6DF ; ID_Continue -2A700..2B738 ; ID_Continue +2A700..2B739 ; ID_Continue 2B740..2B81D ; ID_Continue 2B820..2CEA1 ; ID_Continue 2CEB0..2EBE0 ; ID_Continue 2F800..2FA1D ; ID_Continue 30000..3134A ; ID_Continue +31350..323AF ; ID_Continue E0100..E01EF ; ID_Continue -# Total code points: 135072 +# Total code points: 139482 # ================================================ @@ -8685,6 +8763,7 @@ FFDA..FFDC ; XID_Start 111DC ; XID_Start 11200..11211 ; XID_Start 11213..1122B ; XID_Start +1123F..11240 ; XID_Start 11280..11286 ; XID_Start 11288 ; XID_Start 1128A..1128D ; XID_Start @@ -8747,12 +8826,16 @@ FFDA..FFDC ; XID_Start 11D6A..11D89 ; XID_Start 11D98 ; XID_Start 11EE0..11EF2 ; XID_Start +11F02 ; XID_Start +11F04..11F10 ; XID_Start +11F12..11F33 ; XID_Start 11FB0 ; XID_Start 12000..12399 ; XID_Start 12400..1246E ; XID_Start 12480..12543 ; XID_Start 12F90..12FF0 ; XID_Start -13000..1342E ; XID_Start +13000..1342F ; XID_Start +13441..13446 ; XID_Start 14400..14646 ; XID_Start 16800..16A38 ; XID_Start 16A40..16A5E ; XID_Start @@ -8775,7 +8858,9 @@ FFDA..FFDC ; XID_Start 1AFF5..1AFFB ; XID_Start 1AFFD..1AFFE ; XID_Start 1B000..1B122 ; XID_Start +1B132 ; XID_Start 1B150..1B152 ; XID_Start +1B155 ; XID_Start 1B164..1B167 ; XID_Start 1B170..1B2FB ; XID_Start 1BC00..1BC6A ; XID_Start @@ -8815,11 +8900,15 @@ FFDA..FFDC ; XID_Start 1DF00..1DF09 ; XID_Start 1DF0A ; XID_Start 1DF0B..1DF1E ; XID_Start +1DF25..1DF2A ; XID_Start +1E030..1E06D ; XID_Start 1E100..1E12C ; XID_Start 1E137..1E13D ; XID_Start 1E14E ; XID_Start 1E290..1E2AD ; XID_Start 1E2C0..1E2EB ; XID_Start +1E4D0..1E4EA ; XID_Start +1E4EB ; XID_Start 1E7E0..1E7E6 ; XID_Start 1E7E8..1E7EB ; XID_Start 1E7ED..1E7EE ; XID_Start @@ -8861,14 +8950,15 @@ FFDA..FFDC ; XID_Start 1EEA5..1EEA9 ; XID_Start 1EEAB..1EEBB ; XID_Start 20000..2A6DF ; XID_Start -2A700..2B738 ; XID_Start +2A700..2B739 ; XID_Start 2B740..2B81D ; XID_Start 2B820..2CEA1 ; XID_Start 2CEB0..2EBE0 ; XID_Start 2F800..2FA1D ; XID_Start 30000..3134A ; XID_Start +31350..323AF ; XID_Start -# Total code points: 131974 +# Total code points: 136322 # ================================================ @@ -9147,6 +9237,7 @@ FFDA..FFDC ; XID_Start 0CE2..0CE3 ; XID_Continue 0CE6..0CEF ; XID_Continue 0CF1..0CF2 ; XID_Continue +0CF3 ; XID_Continue 0D00..0D01 ; XID_Continue 0D02..0D03 ; XID_Continue 0D04..0D0C ; XID_Continue @@ -9200,7 +9291,7 @@ FFDA..FFDC ; XID_Start 0EBD ; XID_Continue 0EC0..0EC4 ; XID_Continue 0EC6 ; XID_Continue -0EC8..0ECD ; XID_Continue +0EC8..0ECE ; XID_Continue 0ED0..0ED9 ; XID_Continue 0EDC..0EDF ; XID_Continue 0F00 ; XID_Continue @@ -9788,6 +9879,7 @@ FFDA..FFDC ; XID_Continue 10E80..10EA9 ; XID_Continue 10EAB..10EAC ; XID_Continue 10EB0..10EB1 ; XID_Continue +10EFD..10EFF ; XID_Continue 10F00..10F1C ; XID_Continue 10F27 ; XID_Continue 10F30..10F45 ; XID_Continue @@ -9850,6 +9942,8 @@ FFDA..FFDC ; XID_Continue 11235 ; XID_Continue 11236..11237 ; XID_Continue 1123E ; XID_Continue +1123F..11240 ; XID_Continue +11241 ; XID_Continue 11280..11286 ; XID_Continue 11288 ; XID_Continue 1128A..1128D ; XID_Continue @@ -10032,12 +10126,27 @@ FFDA..FFDC ; XID_Continue 11EE0..11EF2 ; XID_Continue 11EF3..11EF4 ; XID_Continue 11EF5..11EF6 ; XID_Continue +11F00..11F01 ; XID_Continue +11F02 ; XID_Continue +11F03 ; XID_Continue +11F04..11F10 ; XID_Continue +11F12..11F33 ; XID_Continue +11F34..11F35 ; XID_Continue +11F36..11F3A ; XID_Continue +11F3E..11F3F ; XID_Continue +11F40 ; XID_Continue +11F41 ; XID_Continue +11F42 ; XID_Continue +11F50..11F59 ; XID_Continue 11FB0 ; XID_Continue 12000..12399 ; XID_Continue 12400..1246E ; XID_Continue 12480..12543 ; XID_Continue 12F90..12FF0 ; XID_Continue -13000..1342E ; XID_Continue +13000..1342F ; XID_Continue +13440 ; XID_Continue +13441..13446 ; XID_Continue +13447..13455 ; XID_Continue 14400..14646 ; XID_Continue 16800..16A38 ; XID_Continue 16A40..16A5E ; XID_Continue @@ -10070,7 +10179,9 @@ FFDA..FFDC ; XID_Continue 1AFF5..1AFFB ; XID_Continue 1AFFD..1AFFE ; XID_Continue 1B000..1B122 ; XID_Continue +1B132 ; XID_Continue 1B150..1B152 ; XID_Continue +1B155 ; XID_Continue 1B164..1B167 ; XID_Continue 1B170..1B2FB ; XID_Continue 1BC00..1BC6A ; XID_Continue @@ -10127,11 +10238,14 @@ FFDA..FFDC ; XID_Continue 1DF00..1DF09 ; XID_Continue 1DF0A ; XID_Continue 1DF0B..1DF1E ; XID_Continue +1DF25..1DF2A ; XID_Continue 1E000..1E006 ; XID_Continue 1E008..1E018 ; XID_Continue 1E01B..1E021 ; XID_Continue 1E023..1E024 ; XID_Continue 1E026..1E02A ; XID_Continue +1E030..1E06D ; XID_Continue +1E08F ; XID_Continue 1E100..1E12C ; XID_Continue 1E130..1E136 ; XID_Continue 1E137..1E13D ; XID_Continue @@ -10142,6 +10256,10 @@ FFDA..FFDC ; XID_Continue 1E2C0..1E2EB ; XID_Continue 1E2EC..1E2EF ; XID_Continue 1E2F0..1E2F9 ; XID_Continue +1E4D0..1E4EA ; XID_Continue +1E4EB ; XID_Continue +1E4EC..1E4EF ; XID_Continue +1E4F0..1E4F9 ; XID_Continue 1E7E0..1E7E6 ; XID_Continue 1E7E8..1E7EB ; XID_Continue 1E7ED..1E7EE ; XID_Continue @@ -10187,15 +10305,16 @@ FFDA..FFDC ; XID_Continue 1EEAB..1EEBB ; XID_Continue 1FBF0..1FBF9 ; XID_Continue 20000..2A6DF ; XID_Continue -2A700..2B738 ; XID_Continue +2A700..2B739 ; XID_Continue 2B740..2B81D ; XID_Continue 2B820..2CEA1 ; XID_Continue 2CEB0..2EBE0 ; XID_Continue 2F800..2FA1D ; XID_Continue 30000..3134A ; XID_Continue +31350..323AF ; XID_Continue E0100..E01EF ; XID_Continue -# Total code points: 135053 +# Total code points: 139463 # ================================================ @@ -10206,7 +10325,7 @@ E0100..E01EF ; XID_Continue # + Variation_Selector # - White_Space # - FFF9..FFFB (Interlinear annotation format characters) -# - 13430..13438 (Egyptian hieroglyph format characters) +# - 13430..13440 (Egyptian hieroglyph format characters) # - Prepended_Concatenation_Mark (Exceptional format characters that should be visible) 00AD ; Default_Ignorable_Code_Point @@ -10351,7 +10470,7 @@ E01F0..E0FFF ; Default_Ignorable_Code_Point 0E47..0E4E ; Grapheme_Extend 0EB1 ; Grapheme_Extend 0EB4..0EBC ; Grapheme_Extend -0EC8..0ECD ; Grapheme_Extend +0EC8..0ECE ; Grapheme_Extend 0F18..0F19 ; Grapheme_Extend 0F35 ; Grapheme_Extend 0F37 ; Grapheme_Extend @@ -10490,6 +10609,7 @@ FF9E..FF9F ; Grapheme_Extend 10AE5..10AE6 ; Grapheme_Extend 10D24..10D27 ; Grapheme_Extend 10EAB..10EAC ; Grapheme_Extend +10EFD..10EFF ; Grapheme_Extend 10F46..10F50 ; Grapheme_Extend 10F82..10F85 ; Grapheme_Extend 11001 ; Grapheme_Extend @@ -10512,6 +10632,7 @@ FF9E..FF9F ; Grapheme_Extend 11234 ; Grapheme_Extend 11236..11237 ; Grapheme_Extend 1123E ; Grapheme_Extend +11241 ; Grapheme_Extend 112DF ; Grapheme_Extend 112E3..112EA ; Grapheme_Extend 11300..11301 ; Grapheme_Extend @@ -10579,6 +10700,12 @@ FF9E..FF9F ; Grapheme_Extend 11D95 ; Grapheme_Extend 11D97 ; Grapheme_Extend 11EF3..11EF4 ; Grapheme_Extend +11F00..11F01 ; Grapheme_Extend +11F36..11F3A ; Grapheme_Extend +11F40 ; Grapheme_Extend +11F42 ; Grapheme_Extend +13440 ; Grapheme_Extend +13447..13455 ; Grapheme_Extend 16AF0..16AF4 ; Grapheme_Extend 16B30..16B36 ; Grapheme_Extend 16F4F ; Grapheme_Extend @@ -10605,15 +10732,17 @@ FF9E..FF9F ; Grapheme_Extend 1E01B..1E021 ; Grapheme_Extend 1E023..1E024 ; Grapheme_Extend 1E026..1E02A ; Grapheme_Extend +1E08F ; Grapheme_Extend 1E130..1E136 ; Grapheme_Extend 1E2AE ; Grapheme_Extend 1E2EC..1E2EF ; Grapheme_Extend +1E4EC..1E4EF ; Grapheme_Extend 1E8D0..1E8D6 ; Grapheme_Extend 1E944..1E94A ; Grapheme_Extend E0020..E007F ; Grapheme_Extend E0100..E01EF ; Grapheme_Extend -# Total code points: 2090 +# Total code points: 2125 # ================================================ @@ -10913,6 +11042,7 @@ E0100..E01EF ; Grapheme_Extend 0CE0..0CE1 ; Grapheme_Base 0CE6..0CEF ; Grapheme_Base 0CF1..0CF2 ; Grapheme_Base +0CF3 ; Grapheme_Base 0D02..0D03 ; Grapheme_Base 0D04..0D0C ; Grapheme_Base 0D0E..0D10 ; Grapheme_Base @@ -11965,6 +12095,7 @@ FFFC..FFFD ; Grapheme_Base 11232..11233 ; Grapheme_Base 11235 ; Grapheme_Base 11238..1123D ; Grapheme_Base +1123F..11240 ; Grapheme_Base 11280..11286 ; Grapheme_Base 11288 ; Grapheme_Base 1128A..1128D ; Grapheme_Base @@ -12080,6 +12211,7 @@ FFFC..FFFD ; Grapheme_Base 11A9D ; Grapheme_Base 11A9E..11AA2 ; Grapheme_Base 11AB0..11AF8 ; Grapheme_Base +11B00..11B09 ; Grapheme_Base 11C00..11C08 ; Grapheme_Base 11C0A..11C2E ; Grapheme_Base 11C2F ; Grapheme_Base @@ -12109,6 +12241,15 @@ FFFC..FFFD ; Grapheme_Base 11EE0..11EF2 ; Grapheme_Base 11EF5..11EF6 ; Grapheme_Base 11EF7..11EF8 ; Grapheme_Base +11F02 ; Grapheme_Base +11F03 ; Grapheme_Base +11F04..11F10 ; Grapheme_Base +11F12..11F33 ; Grapheme_Base +11F34..11F35 ; Grapheme_Base +11F3E..11F3F ; Grapheme_Base +11F41 ; Grapheme_Base +11F43..11F4F ; Grapheme_Base +11F50..11F59 ; Grapheme_Base 11FB0 ; Grapheme_Base 11FC0..11FD4 ; Grapheme_Base 11FD5..11FDC ; Grapheme_Base @@ -12121,7 +12262,8 @@ FFFC..FFFD ; Grapheme_Base 12480..12543 ; Grapheme_Base 12F90..12FF0 ; Grapheme_Base 12FF1..12FF2 ; Grapheme_Base -13000..1342E ; Grapheme_Base +13000..1342F ; Grapheme_Base +13441..13446 ; Grapheme_Base 14400..14646 ; Grapheme_Base 16800..16A38 ; Grapheme_Base 16A40..16A5E ; Grapheme_Base @@ -12159,7 +12301,9 @@ FFFC..FFFD ; Grapheme_Base 1AFF5..1AFFB ; Grapheme_Base 1AFFD..1AFFE ; Grapheme_Base 1B000..1B122 ; Grapheme_Base +1B132 ; Grapheme_Base 1B150..1B152 ; Grapheme_Base +1B155 ; Grapheme_Base 1B164..1B167 ; Grapheme_Base 1B170..1B2FB ; Grapheme_Base 1BC00..1BC6A ; Grapheme_Base @@ -12180,6 +12324,7 @@ FFFC..FFFD ; Grapheme_Base 1D1AE..1D1EA ; Grapheme_Base 1D200..1D241 ; Grapheme_Base 1D245 ; Grapheme_Base +1D2C0..1D2D3 ; Grapheme_Base 1D2E0..1D2F3 ; Grapheme_Base 1D300..1D356 ; Grapheme_Base 1D360..1D378 ; Grapheme_Base @@ -12233,6 +12378,8 @@ FFFC..FFFD ; Grapheme_Base 1DF00..1DF09 ; Grapheme_Base 1DF0A ; Grapheme_Base 1DF0B..1DF1E ; Grapheme_Base +1DF25..1DF2A ; Grapheme_Base +1E030..1E06D ; Grapheme_Base 1E100..1E12C ; Grapheme_Base 1E137..1E13D ; Grapheme_Base 1E140..1E149 ; Grapheme_Base @@ -12242,6 +12389,9 @@ FFFC..FFFD ; Grapheme_Base 1E2C0..1E2EB ; Grapheme_Base 1E2F0..1E2F9 ; Grapheme_Base 1E2FF ; Grapheme_Base +1E4D0..1E4EA ; Grapheme_Base +1E4EB ; Grapheme_Base +1E4F0..1E4F9 ; Grapheme_Base 1E7E0..1E7E6 ; Grapheme_Base 1E7E8..1E7EB ; Grapheme_Base 1E7ED..1E7EE ; Grapheme_Base @@ -12310,10 +12460,10 @@ FFFC..FFFD ; Grapheme_Base 1F300..1F3FA ; Grapheme_Base 1F3FB..1F3FF ; Grapheme_Base 1F400..1F6D7 ; Grapheme_Base -1F6DD..1F6EC ; Grapheme_Base +1F6DC..1F6EC ; Grapheme_Base 1F6F0..1F6FC ; Grapheme_Base -1F700..1F773 ; Grapheme_Base -1F780..1F7D8 ; Grapheme_Base +1F700..1F776 ; Grapheme_Base +1F77B..1F7D9 ; Grapheme_Base 1F7E0..1F7EB ; Grapheme_Base 1F7F0 ; Grapheme_Base 1F800..1F80B ; Grapheme_Base @@ -12324,27 +12474,26 @@ FFFC..FFFD ; Grapheme_Base 1F8B0..1F8B1 ; Grapheme_Base 1F900..1FA53 ; Grapheme_Base 1FA60..1FA6D ; Grapheme_Base -1FA70..1FA74 ; Grapheme_Base -1FA78..1FA7C ; Grapheme_Base -1FA80..1FA86 ; Grapheme_Base -1FA90..1FAAC ; Grapheme_Base -1FAB0..1FABA ; Grapheme_Base -1FAC0..1FAC5 ; Grapheme_Base -1FAD0..1FAD9 ; Grapheme_Base -1FAE0..1FAE7 ; Grapheme_Base -1FAF0..1FAF6 ; Grapheme_Base +1FA70..1FA7C ; Grapheme_Base +1FA80..1FA88 ; Grapheme_Base +1FA90..1FABD ; Grapheme_Base +1FABF..1FAC5 ; Grapheme_Base +1FACE..1FADB ; Grapheme_Base +1FAE0..1FAE8 ; Grapheme_Base +1FAF0..1FAF8 ; Grapheme_Base 1FB00..1FB92 ; Grapheme_Base 1FB94..1FBCA ; Grapheme_Base 1FBF0..1FBF9 ; Grapheme_Base 20000..2A6DF ; Grapheme_Base -2A700..2B738 ; Grapheme_Base +2A700..2B739 ; Grapheme_Base 2B740..2B81D ; Grapheme_Base 2B820..2CEA1 ; Grapheme_Base 2CEB0..2EBE0 ; Grapheme_Base 2F800..2FA1D ; Grapheme_Base 30000..3134A ; Grapheme_Base +31350..323AF ; Grapheme_Base -# Total code points: 142539 +# Total code points: 146986 # ================================================ @@ -12410,7 +12559,9 @@ ABED ; Grapheme_Link 11C3F ; Grapheme_Link 11D44..11D45 ; Grapheme_Link 11D97 ; Grapheme_Link +11F41 ; Grapheme_Link +11F42 ; Grapheme_Link -# Total code points: 63 +# Total code points: 65 # EOF diff --git a/icu4c/source/data/unidata/DerivedNormalizationProps.txt b/icu4c/source/data/unidata/DerivedNormalizationProps.txt index f583aba3164..9d1a44f3fd8 100644 --- a/icu4c/source/data/unidata/DerivedNormalizationProps.txt +++ b/icu4c/source/data/unidata/DerivedNormalizationProps.txt @@ -1,11 +1,11 @@ -# DerivedNormalizationProps-14.0.0.txt -# Date: 2021-06-04, 02:19:20 GMT -# © 2021 Unicode®, Inc. +# DerivedNormalizationProps-15.0.0.txt +# Date: 2022-04-02, 01:29:03 GMT +# © 2022 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. -# For terms of use, see http://www.unicode.org/terms_of_use.html +# For terms of use, see https://www.unicode.org/terms_of_use.html # # Unicode Character Database -# For documentation, see http://www.unicode.org/reports/tr44/ +# For documentation, see https://www.unicode.org/reports/tr44/ # ================================================ @@ -1652,6 +1652,7 @@ FFED..FFEE ; NFKD_QC; N 1D7C3 ; NFKD_QC; N 1D7C4..1D7CB ; NFKD_QC; N 1D7CE..1D7FF ; NFKD_QC; N +1E030..1E06D ; NFKD_QC; N 1EE00..1EE03 ; NFKD_QC; N 1EE05..1EE1F ; NFKD_QC; N 1EE21..1EE22 ; NFKD_QC; N @@ -1697,7 +1698,7 @@ FFED..FFEE ; NFKD_QC; N 1FBF0..1FBF9 ; NFKD_QC; N 2F800..2FA1D ; NFKD_QC; N -# Total code points: 16967 +# Total code points: 17029 # ================================================ @@ -2060,6 +2061,7 @@ FFED..FFEE ; NFKC_QC; N 1D7C3 ; NFKC_QC; N 1D7C4..1D7CB ; NFKC_QC; N 1D7CE..1D7FF ; NFKC_QC; N +1E030..1E06D ; NFKC_QC; N 1EE00..1EE03 ; NFKC_QC; N 1EE05..1EE1F ; NFKC_QC; N 1EE21..1EE22 ; NFKC_QC; N @@ -2105,7 +2107,7 @@ FFED..FFEE ; NFKC_QC; N 1FBF0..1FBF9 ; NFKC_QC; N 2F800..2FA1D ; NFKC_QC; N -# Total code points: 4866 +# Total code points: 4928 # ================================================ @@ -8076,6 +8078,68 @@ FFF0..FFF8 ; NFKC_CF; 1D7FD ; NFKC_CF; 0037 1D7FE ; NFKC_CF; 0038 1D7FF ; NFKC_CF; 0039 +1E030 ; NFKC_CF; 0430 +1E031 ; NFKC_CF; 0431 +1E032 ; NFKC_CF; 0432 +1E033 ; NFKC_CF; 0433 +1E034 ; NFKC_CF; 0434 +1E035 ; NFKC_CF; 0435 +1E036 ; NFKC_CF; 0436 +1E037 ; NFKC_CF; 0437 +1E038 ; NFKC_CF; 0438 +1E039 ; NFKC_CF; 043A +1E03A ; NFKC_CF; 043B +1E03B ; NFKC_CF; 043C +1E03C ; NFKC_CF; 043E +1E03D ; NFKC_CF; 043F +1E03E ; NFKC_CF; 0440 +1E03F ; NFKC_CF; 0441 +1E040 ; NFKC_CF; 0442 +1E041 ; NFKC_CF; 0443 +1E042 ; NFKC_CF; 0444 +1E043 ; NFKC_CF; 0445 +1E044 ; NFKC_CF; 0446 +1E045 ; NFKC_CF; 0447 +1E046 ; NFKC_CF; 0448 +1E047 ; NFKC_CF; 044B +1E048 ; NFKC_CF; 044D +1E049 ; NFKC_CF; 044E +1E04A ; NFKC_CF; A689 +1E04B ; NFKC_CF; 04D9 +1E04C ; NFKC_CF; 0456 +1E04D ; NFKC_CF; 0458 +1E04E ; NFKC_CF; 04E9 +1E04F ; NFKC_CF; 04AF +1E050 ; NFKC_CF; 04CF +1E051 ; NFKC_CF; 0430 +1E052 ; NFKC_CF; 0431 +1E053 ; NFKC_CF; 0432 +1E054 ; NFKC_CF; 0433 +1E055 ; NFKC_CF; 0434 +1E056 ; NFKC_CF; 0435 +1E057 ; NFKC_CF; 0436 +1E058 ; NFKC_CF; 0437 +1E059 ; NFKC_CF; 0438 +1E05A ; NFKC_CF; 043A +1E05B ; NFKC_CF; 043B +1E05C ; NFKC_CF; 043E +1E05D ; NFKC_CF; 043F +1E05E ; NFKC_CF; 0441 +1E05F ; NFKC_CF; 0443 +1E060 ; NFKC_CF; 0444 +1E061 ; NFKC_CF; 0445 +1E062 ; NFKC_CF; 0446 +1E063 ; NFKC_CF; 0447 +1E064 ; NFKC_CF; 0448 +1E065 ; NFKC_CF; 044A +1E066 ; NFKC_CF; 044B +1E067 ; NFKC_CF; 0491 +1E068 ; NFKC_CF; 0456 +1E069 ; NFKC_CF; 0455 +1E06A ; NFKC_CF; 045F +1E06B ; NFKC_CF; 04AB +1E06C ; NFKC_CF; A651 +1E06D ; NFKC_CF; 04B1 1E900 ; NFKC_CF; 1E922 1E901 ; NFKC_CF; 1E923 1E902 ; NFKC_CF; 1E924 @@ -8937,7 +9001,7 @@ E0080..E00FF ; NFKC_CF; E0100..E01EF ; NFKC_CF; E01F0..E0FFF ; NFKC_CF; -# Total code points: 10429 +# Total code points: 10491 # ================================================ @@ -9895,6 +9959,7 @@ FFF0..FFF8 ; Changes_When_NFKC_Casefolded 1D7C3 ; Changes_When_NFKC_Casefolded 1D7C4..1D7CB ; Changes_When_NFKC_Casefolded 1D7CE..1D7FF ; Changes_When_NFKC_Casefolded +1E030..1E06D ; Changes_When_NFKC_Casefolded 1E900..1E921 ; Changes_When_NFKC_Casefolded 1EE00..1EE03 ; Changes_When_NFKC_Casefolded 1EE05..1EE1F ; Changes_When_NFKC_Casefolded @@ -9948,6 +10013,6 @@ E0080..E00FF ; Changes_When_NFKC_Casefolded E0100..E01EF ; Changes_When_NFKC_Casefolded E01F0..E0FFF ; Changes_When_NFKC_Casefolded -# Total code points: 10429 +# Total code points: 10491 # EOF diff --git a/icu4c/source/data/unidata/NormalizationCorrections.txt b/icu4c/source/data/unidata/NormalizationCorrections.txt index a1a34d6bb6f..f992c0d53ce 100644 --- a/icu4c/source/data/unidata/NormalizationCorrections.txt +++ b/icu4c/source/data/unidata/NormalizationCorrections.txt @@ -1,10 +1,10 @@ -# NormalizationCorrections-14.0.0.txt -# Date: 2021-03-16, 22:07:00 GMT [KW, LI] -# © 2021 Unicode®, Inc. -# For terms of use, see http://www.unicode.org/terms_of_use.html +# NormalizationCorrections-15.0.0.txt +# Date: 2022-05-03, 18:53:00 GMT [KW, LI] +# © 2022 Unicode®, Inc. +# For terms of use, see https://www.unicode.org/terms_of_use.html # # Unicode Character Database -# For documentation, see http://www.unicode.org/reports/tr44/ +# For documentation, see https://www.unicode.org/reports/tr44/ # # This file is a normative contributory data file in the # Unicode Character Database. diff --git a/icu4c/source/data/unidata/NormalizationTest.txt b/icu4c/source/data/unidata/NormalizationTest.txt index 7f45760cf95..b7d2fd1f84a 100644 --- a/icu4c/source/data/unidata/NormalizationTest.txt +++ b/icu4c/source/data/unidata/NormalizationTest.txt @@ -1,11 +1,11 @@ -# NormalizationTest-14.0.0.txt -# Date: 2021-05-28, 21:49:12 GMT -# © 2021 Unicode®, Inc. +# NormalizationTest-15.0.0.txt +# Date: 2022-04-02, 01:29:09 GMT +# © 2022 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. -# For terms of use, see http://www.unicode.org/terms_of_use.html +# For terms of use, see https://www.unicode.org/terms_of_use.html # # Unicode Character Database -# For documentation, see http://www.unicode.org/reports/tr44/ +# For documentation, see https://www.unicode.org/reports/tr44/ # # Normalization Test Suite # Format: @@ -16208,6 +16208,68 @@ FFEE;FFEE;FFEE;25CB;25CB; 1D7FD;1D7FD;1D7FD;0037;0037; 1D7FE;1D7FE;1D7FE;0038;0038; 1D7FF;1D7FF;1D7FF;0039;0039; +1E030;1E030;1E030;0430;0430; +1E031;1E031;1E031;0431;0431; +1E032;1E032;1E032;0432;0432; +1E033;1E033;1E033;0433;0433; +1E034;1E034;1E034;0434;0434; +1E035;1E035;1E035;0435;0435; +1E036;1E036;1E036;0436;0436; +1E037;1E037;1E037;0437;0437; +1E038;1E038;1E038;0438;0438; +1E039;1E039;1E039;043A;043A; +1E03A;1E03A;1E03A;043B;043B; +1E03B;1E03B;1E03B;043C;043C; +1E03C;1E03C;1E03C;043E;043E; +1E03D;1E03D;1E03D;043F;043F; +1E03E;1E03E;1E03E;0440;0440; +1E03F;1E03F;1E03F;0441;0441; +1E040;1E040;1E040;0442;0442; +1E041;1E041;1E041;0443;0443; +1E042;1E042;1E042;0444;0444; +1E043;1E043;1E043;0445;0445; +1E044;1E044;1E044;0446;0446; +1E045;1E045;1E045;0447;0447; +1E046;1E046;1E046;0448;0448; +1E047;1E047;1E047;044B;044B; +1E048;1E048;1E048;044D;044D; +1E049;1E049;1E049;044E;044E; +1E04A;1E04A;1E04A;A689;A689; +1E04B;1E04B;1E04B;04D9;04D9; +1E04C;1E04C;1E04C;0456;0456; +1E04D;1E04D;1E04D;0458;0458; +1E04E;1E04E;1E04E;04E9;04E9; +1E04F;1E04F;1E04F;04AF;04AF; +1E050;1E050;1E050;04CF;04CF; +1E051;1E051;1E051;0430;0430; +1E052;1E052;1E052;0431;0431; +1E053;1E053;1E053;0432;0432; +1E054;1E054;1E054;0433;0433; +1E055;1E055;1E055;0434;0434; +1E056;1E056;1E056;0435;0435; +1E057;1E057;1E057;0436;0436; +1E058;1E058;1E058;0437;0437; +1E059;1E059;1E059;0438;0438; +1E05A;1E05A;1E05A;043A;043A; +1E05B;1E05B;1E05B;043B;043B; +1E05C;1E05C;1E05C;043E;043E; +1E05D;1E05D;1E05D;043F;043F; +1E05E;1E05E;1E05E;0441;0441; +1E05F;1E05F;1E05F;0443;0443; +1E060;1E060;1E060;0444;0444; +1E061;1E061;1E061;0445;0445; +1E062;1E062;1E062;0446;0446; +1E063;1E063;1E063;0447;0447; +1E064;1E064;1E064;0448;0448; +1E065;1E065;1E065;044A;044A; +1E066;1E066;1E066;044B;044B; +1E067;1E067;1E067;0491;0491; +1E068;1E068;1E068;0456;0456; +1E069;1E069;1E069;0455;0455; +1E06A;1E06A;1E06A;045F;045F; +1E06B;1E06B;1E06B;04AB;04AB; +1E06C;1E06C;1E06C;A651;A651; +1E06D;1E06D;1E06D;04B1;04B1; 1EE00;1EE00;1EE00;0627;0627; 1EE01;1EE01;1EE01;0628;0628; 1EE02;1EE02;1EE02;062C;062C; @@ -18496,6 +18558,12 @@ FFEE;FFEE;FFEE;25CB;25CB; 0061 10EAB 0315 0300 05AE 0062;0061 05AE 10EAB 0300 0315 0062;0061 05AE 10EAB 0300 0315 0062;0061 05AE 10EAB 0300 0315 0062;0061 05AE 10EAB 0300 0315 0062; 0061 0315 0300 05AE 10EAC 0062;00E0 05AE 10EAC 0315 0062;0061 05AE 0300 10EAC 0315 0062;00E0 05AE 10EAC 0315 0062;0061 05AE 0300 10EAC 0315 0062; 0061 10EAC 0315 0300 05AE 0062;0061 05AE 10EAC 0300 0315 0062;0061 05AE 10EAC 0300 0315 0062;0061 05AE 10EAC 0300 0315 0062;0061 05AE 10EAC 0300 0315 0062; +0061 059A 0316 1DFA 10EFD 0062;0061 1DFA 0316 10EFD 059A 0062;0061 1DFA 0316 10EFD 059A 0062;0061 1DFA 0316 10EFD 059A 0062;0061 1DFA 0316 10EFD 059A 0062; +0061 10EFD 059A 0316 1DFA 0062;0061 1DFA 10EFD 0316 059A 0062;0061 1DFA 10EFD 0316 059A 0062;0061 1DFA 10EFD 0316 059A 0062;0061 1DFA 10EFD 0316 059A 0062; +0061 059A 0316 1DFA 10EFE 0062;0061 1DFA 0316 10EFE 059A 0062;0061 1DFA 0316 10EFE 059A 0062;0061 1DFA 0316 10EFE 059A 0062;0061 1DFA 0316 10EFE 059A 0062; +0061 10EFE 059A 0316 1DFA 0062;0061 1DFA 10EFE 0316 059A 0062;0061 1DFA 10EFE 0316 059A 0062;0061 1DFA 10EFE 0316 059A 0062;0061 1DFA 10EFE 0316 059A 0062; +0061 059A 0316 1DFA 10EFF 0062;0061 1DFA 0316 10EFF 059A 0062;0061 1DFA 0316 10EFF 059A 0062;0061 1DFA 0316 10EFF 059A 0062;0061 1DFA 0316 10EFF 059A 0062; +0061 10EFF 059A 0316 1DFA 0062;0061 1DFA 10EFF 0316 059A 0062;0061 1DFA 10EFF 0316 059A 0062;0061 1DFA 10EFF 0316 059A 0062;0061 1DFA 10EFF 0316 059A 0062; 0061 059A 0316 1DFA 10F46 0062;0061 1DFA 0316 10F46 059A 0062;0061 1DFA 0316 10F46 059A 0062;0061 1DFA 0316 10F46 059A 0062;0061 1DFA 0316 10F46 059A 0062; 0061 10F46 059A 0316 1DFA 0062;0061 1DFA 10F46 0316 059A 0062;0061 1DFA 10F46 0316 059A 0062;0061 1DFA 10F46 0316 059A 0062;0061 1DFA 10F46 0316 059A 0062; 0061 059A 0316 1DFA 10F47 0062;0061 1DFA 0316 10F47 059A 0062;0061 1DFA 0316 10F47 059A 0062;0061 1DFA 0316 10F47 059A 0062;0061 1DFA 0316 10F47 059A 0062; @@ -18640,6 +18708,10 @@ FFEE;FFEE;FFEE;25CB;25CB; 0061 11D45 05B0 094D 3099 0062;0061 3099 11D45 094D 05B0 0062;0061 3099 11D45 094D 05B0 0062;0061 3099 11D45 094D 05B0 0062;0061 3099 11D45 094D 05B0 0062; 0061 05B0 094D 3099 11D97 0062;0061 3099 094D 11D97 05B0 0062;0061 3099 094D 11D97 05B0 0062;0061 3099 094D 11D97 05B0 0062;0061 3099 094D 11D97 05B0 0062; 0061 11D97 05B0 094D 3099 0062;0061 3099 11D97 094D 05B0 0062;0061 3099 11D97 094D 05B0 0062;0061 3099 11D97 094D 05B0 0062;0061 3099 11D97 094D 05B0 0062; +0061 05B0 094D 3099 11F41 0062;0061 3099 094D 11F41 05B0 0062;0061 3099 094D 11F41 05B0 0062;0061 3099 094D 11F41 05B0 0062;0061 3099 094D 11F41 05B0 0062; +0061 11F41 05B0 094D 3099 0062;0061 3099 11F41 094D 05B0 0062;0061 3099 11F41 094D 05B0 0062;0061 3099 11F41 094D 05B0 0062;0061 3099 11F41 094D 05B0 0062; +0061 05B0 094D 3099 11F42 0062;0061 3099 094D 11F42 05B0 0062;0061 3099 094D 11F42 05B0 0062;0061 3099 094D 11F42 05B0 0062;0061 3099 094D 11F42 05B0 0062; +0061 11F42 05B0 094D 3099 0062;0061 3099 11F42 094D 05B0 0062;0061 3099 11F42 094D 05B0 0062;0061 3099 11F42 094D 05B0 0062;0061 3099 11F42 094D 05B0 0062; 0061 16FF0 0334 16AF0 0062;0061 0334 16AF0 16FF0 0062;0061 0334 16AF0 16FF0 0062;0061 0334 16AF0 16FF0 0062;0061 0334 16AF0 16FF0 0062; 0061 16AF0 16FF0 0334 0062;0061 16AF0 0334 16FF0 0062;0061 16AF0 0334 16FF0 0062;0061 16AF0 0334 16FF0 0062;0061 16AF0 0334 16FF0 0062; 0061 16FF0 0334 16AF1 0062;0061 0334 16AF1 16FF0 0062;0061 0334 16AF1 16FF0 0062;0061 0334 16AF1 16FF0 0062;0061 0334 16AF1 16FF0 0062; @@ -18812,6 +18884,8 @@ FFEE;FFEE;FFEE;25CB;25CB; 0061 1E029 0315 0300 05AE 0062;0061 05AE 1E029 0300 0315 0062;0061 05AE 1E029 0300 0315 0062;0061 05AE 1E029 0300 0315 0062;0061 05AE 1E029 0300 0315 0062; 0061 0315 0300 05AE 1E02A 0062;00E0 05AE 1E02A 0315 0062;0061 05AE 0300 1E02A 0315 0062;00E0 05AE 1E02A 0315 0062;0061 05AE 0300 1E02A 0315 0062; 0061 1E02A 0315 0300 05AE 0062;0061 05AE 1E02A 0300 0315 0062;0061 05AE 1E02A 0300 0315 0062;0061 05AE 1E02A 0300 0315 0062;0061 05AE 1E02A 0300 0315 0062; +0061 0315 0300 05AE 1E08F 0062;00E0 05AE 1E08F 0315 0062;0061 05AE 0300 1E08F 0315 0062;00E0 05AE 1E08F 0315 0062;0061 05AE 0300 1E08F 0315 0062; +0061 1E08F 0315 0300 05AE 0062;0061 05AE 1E08F 0300 0315 0062;0061 05AE 1E08F 0300 0315 0062;0061 05AE 1E08F 0300 0315 0062;0061 05AE 1E08F 0300 0315 0062; 0061 0315 0300 05AE 1E130 0062;00E0 05AE 1E130 0315 0062;0061 05AE 0300 1E130 0315 0062;00E0 05AE 1E130 0315 0062;0061 05AE 0300 1E130 0315 0062; 0061 1E130 0315 0300 05AE 0062;0061 05AE 1E130 0300 0315 0062;0061 05AE 1E130 0300 0315 0062;0061 05AE 1E130 0300 0315 0062;0061 05AE 1E130 0300 0315 0062; 0061 0315 0300 05AE 1E131 0062;00E0 05AE 1E131 0315 0062;0061 05AE 0300 1E131 0315 0062;00E0 05AE 1E131 0315 0062;0061 05AE 0300 1E131 0315 0062; @@ -18836,6 +18910,14 @@ FFEE;FFEE;FFEE;25CB;25CB; 0061 1E2EE 0315 0300 05AE 0062;0061 05AE 1E2EE 0300 0315 0062;0061 05AE 1E2EE 0300 0315 0062;0061 05AE 1E2EE 0300 0315 0062;0061 05AE 1E2EE 0300 0315 0062; 0061 0315 0300 05AE 1E2EF 0062;00E0 05AE 1E2EF 0315 0062;0061 05AE 0300 1E2EF 0315 0062;00E0 05AE 1E2EF 0315 0062;0061 05AE 0300 1E2EF 0315 0062; 0061 1E2EF 0315 0300 05AE 0062;0061 05AE 1E2EF 0300 0315 0062;0061 05AE 1E2EF 0300 0315 0062;0061 05AE 1E2EF 0300 0315 0062;0061 05AE 1E2EF 0300 0315 0062; +0061 035C 0315 0300 1E4EC 0062;00E0 0315 1E4EC 035C 0062;0061 0300 0315 1E4EC 035C 0062;00E0 0315 1E4EC 035C 0062;0061 0300 0315 1E4EC 035C 0062; +0061 1E4EC 035C 0315 0300 0062;00E0 1E4EC 0315 035C 0062;0061 0300 1E4EC 0315 035C 0062;00E0 1E4EC 0315 035C 0062;0061 0300 1E4EC 0315 035C 0062; +0061 035C 0315 0300 1E4ED 0062;00E0 0315 1E4ED 035C 0062;0061 0300 0315 1E4ED 035C 0062;00E0 0315 1E4ED 035C 0062;0061 0300 0315 1E4ED 035C 0062; +0061 1E4ED 035C 0315 0300 0062;00E0 1E4ED 0315 035C 0062;0061 0300 1E4ED 0315 035C 0062;00E0 1E4ED 0315 035C 0062;0061 0300 1E4ED 0315 035C 0062; +0061 059A 0316 1DFA 1E4EE 0062;0061 1DFA 0316 1E4EE 059A 0062;0061 1DFA 0316 1E4EE 059A 0062;0061 1DFA 0316 1E4EE 059A 0062;0061 1DFA 0316 1E4EE 059A 0062; +0061 1E4EE 059A 0316 1DFA 0062;0061 1DFA 1E4EE 0316 059A 0062;0061 1DFA 1E4EE 0316 059A 0062;0061 1DFA 1E4EE 0316 059A 0062;0061 1DFA 1E4EE 0316 059A 0062; +0061 0315 0300 05AE 1E4EF 0062;00E0 05AE 1E4EF 0315 0062;0061 05AE 0300 1E4EF 0315 0062;00E0 05AE 1E4EF 0315 0062;0061 05AE 0300 1E4EF 0315 0062; +0061 1E4EF 0315 0300 05AE 0062;0061 05AE 1E4EF 0300 0315 0062;0061 05AE 1E4EF 0300 0315 0062;0061 05AE 1E4EF 0300 0315 0062;0061 05AE 1E4EF 0300 0315 0062; 0061 059A 0316 1DFA 1E8D0 0062;0061 1DFA 0316 1E8D0 059A 0062;0061 1DFA 0316 1E8D0 059A 0062;0061 1DFA 0316 1E8D0 059A 0062;0061 1DFA 0316 1E8D0 059A 0062; 0061 1E8D0 059A 0316 1DFA 0062;0061 1DFA 1E8D0 0316 059A 0062;0061 1DFA 1E8D0 0316 059A 0062;0061 1DFA 1E8D0 0316 059A 0062;0061 1DFA 1E8D0 0316 059A 0062; 0061 059A 0316 1DFA 1E8D1 0062;0061 1DFA 0316 1E8D1 059A 0062;0061 1DFA 0316 1E8D1 059A 0062;0061 1DFA 0316 1E8D1 059A 0062;0061 1DFA 0316 1E8D1 059A 0062; diff --git a/icu4c/source/data/unidata/SpecialCasing.txt b/icu4c/source/data/unidata/SpecialCasing.txt index 1c2e968a8c4..08d04fa9421 100644 --- a/icu4c/source/data/unidata/SpecialCasing.txt +++ b/icu4c/source/data/unidata/SpecialCasing.txt @@ -1,11 +1,11 @@ -# SpecialCasing-14.0.0.txt -# Date: 2021-03-08, 19:35:55 GMT -# © 2021 Unicode®, Inc. +# SpecialCasing-15.0.0.txt +# Date: 2022-02-02, 23:35:52 GMT +# © 2022 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. -# For terms of use, see http://www.unicode.org/terms_of_use.html +# For terms of use, see https://www.unicode.org/terms_of_use.html # # Unicode Character Database -# For documentation, see http://www.unicode.org/reports/tr44/ +# For documentation, see https://www.unicode.org/reports/tr44/ # # Special Casing # diff --git a/icu4c/source/data/unidata/UnicodeData.txt b/icu4c/source/data/unidata/UnicodeData.txt index b5abef7ed43..249ec55863e 100644 --- a/icu4c/source/data/unidata/UnicodeData.txt +++ b/icu4c/source/data/unidata/UnicodeData.txt @@ -2975,6 +2975,7 @@ 0CEF;KANNADA DIGIT NINE;Nd;0;L;;9;9;9;N;;;;; 0CF1;KANNADA SIGN JIHVAMULIYA;Lo;0;L;;;;;N;;;;; 0CF2;KANNADA SIGN UPADHMANIYA;Lo;0;L;;;;;N;;;;; +0CF3;KANNADA SIGN COMBINING ANUSVARA ABOVE RIGHT;Mc;0;L;;;;;N;;;;; 0D00;MALAYALAM SIGN COMBINING ANUSVARA ABOVE;Mn;0;NSM;;;;;N;;;;; 0D01;MALAYALAM SIGN CANDRABINDU;Mn;0;NSM;;;;;N;;;;; 0D02;MALAYALAM SIGN ANUSVARA;Mc;0;L;;;;;N;;;;; @@ -3339,6 +3340,7 @@ 0ECB;LAO TONE MAI CATAWA;Mn;122;NSM;;;;;N;;;;; 0ECC;LAO CANCELLATION MARK;Mn;0;NSM;;;;;N;;;;; 0ECD;LAO NIGGAHITA;Mn;0;NSM;;;;;N;;;;; +0ECE;LAO YAMAKKAN;Mn;0;NSM;;;;;N;;;;; 0ED0;LAO DIGIT ZERO;Nd;0;L;;0;0;0;N;;;;; 0ED1;LAO DIGIT ONE;Nd;0;L;;1;1;1;N;;;;; 0ED2;LAO DIGIT TWO;Nd;0;L;;2;2;2;N;;;;; @@ -19393,6 +19395,9 @@ FFFD;REPLACEMENT CHARACTER;So;0;ON;;;;;N;;;;; 10EAD;YEZIDI HYPHENATION MARK;Pd;0;R;;;;;N;;;;; 10EB0;YEZIDI LETTER LAM WITH DOT ABOVE;Lo;0;R;;;;;N;;;;; 10EB1;YEZIDI LETTER YOT WITH CIRCUMFLEX ABOVE;Lo;0;R;;;;;N;;;;; +10EFD;ARABIC SMALL LOW WORD SAKTA;Mn;220;NSM;;;;;N;;;;; +10EFE;ARABIC SMALL LOW WORD QASR;Mn;220;NSM;;;;;N;;;;; +10EFF;ARABIC SMALL LOW WORD MADDA;Mn;220;NSM;;;;;N;;;;; 10F00;OLD SOGDIAN LETTER ALEPH;Lo;0;R;;;;;N;;;;; 10F01;OLD SOGDIAN LETTER FINAL ALEPH;Lo;0;R;;;;;N;;;;; 10F02;OLD SOGDIAN LETTER BETH;Lo;0;R;;;;;N;;;;; @@ -20058,6 +20063,9 @@ FFFD;REPLACEMENT CHARACTER;So;0;ON;;;;;N;;;;; 1123C;KHOJKI DOUBLE SECTION MARK;Po;0;L;;;;;N;;;;; 1123D;KHOJKI ABBREVIATION SIGN;Po;0;L;;;;;N;;;;; 1123E;KHOJKI SIGN SUKUN;Mn;0;NSM;;;;;N;;;;; +1123F;KHOJKI LETTER QA;Lo;0;L;;;;;N;;;;; +11240;KHOJKI LETTER SHORT I;Lo;0;L;;;;;N;;;;; +11241;KHOJKI VOWEL SIGN VOCALIC R;Mn;0;NSM;;;;;N;;;;; 11280;MULTANI LETTER A;Lo;0;L;;;;;N;;;;; 11281;MULTANI LETTER I;Lo;0;L;;;;;N;;;;; 11282;MULTANI LETTER U;Lo;0;L;;;;;N;;;;; @@ -21256,6 +21264,16 @@ FFFD;REPLACEMENT CHARACTER;So;0;ON;;;;;N;;;;; 11AF6;PAU CIN HAU LOW-FALLING TONE LONG FINAL;Lo;0;L;;;;;N;;;;; 11AF7;PAU CIN HAU LOW-FALLING TONE FINAL;Lo;0;L;;;;;N;;;;; 11AF8;PAU CIN HAU GLOTTAL STOP FINAL;Lo;0;L;;;;;N;;;;; +11B00;DEVANAGARI HEAD MARK;Po;0;L;;;;;N;;;;; +11B01;DEVANAGARI HEAD MARK WITH HEADSTROKE;Po;0;L;;;;;N;;;;; +11B02;DEVANAGARI SIGN BHALE;Po;0;L;;;;;N;;;;; +11B03;DEVANAGARI SIGN BHALE WITH HOOK;Po;0;L;;;;;N;;;;; +11B04;DEVANAGARI SIGN EXTENDED BHALE;Po;0;L;;;;;N;;;;; +11B05;DEVANAGARI SIGN EXTENDED BHALE WITH HOOK;Po;0;L;;;;;N;;;;; +11B06;DEVANAGARI SIGN WESTERN FIVE-LIKE BHALE;Po;0;L;;;;;N;;;;; +11B07;DEVANAGARI SIGN WESTERN NINE-LIKE BHALE;Po;0;L;;;;;N;;;;; +11B08;DEVANAGARI SIGN REVERSED NINE-LIKE BHALE;Po;0;L;;;;;N;;;;; +11B09;DEVANAGARI SIGN MINDU;Po;0;L;;;;;N;;;;; 11C00;BHAIKSUKI LETTER A;Lo;0;L;;;;;N;;;;; 11C01;BHAIKSUKI LETTER AA;Lo;0;L;;;;;N;;;;; 11C02;BHAIKSUKI LETTER I;Lo;0;L;;;;;N;;;;; @@ -21584,6 +21602,92 @@ FFFD;REPLACEMENT CHARACTER;So;0;ON;;;;;N;;;;; 11EF6;MAKASAR VOWEL SIGN O;Mc;0;L;;;;;N;;;;; 11EF7;MAKASAR PASSIMBANG;Po;0;L;;;;;N;;;;; 11EF8;MAKASAR END OF SECTION;Po;0;L;;;;;N;;;;; +11F00;KAWI SIGN CANDRABINDU;Mn;0;NSM;;;;;N;;;;; +11F01;KAWI SIGN ANUSVARA;Mn;0;NSM;;;;;N;;;;; +11F02;KAWI SIGN REPHA;Lo;0;L;;;;;N;;;;; +11F03;KAWI SIGN VISARGA;Mc;0;L;;;;;N;;;;; +11F04;KAWI LETTER A;Lo;0;L;;;;;N;;;;; +11F05;KAWI LETTER AA;Lo;0;L;;;;;N;;;;; +11F06;KAWI LETTER I;Lo;0;L;;;;;N;;;;; +11F07;KAWI LETTER II;Lo;0;L;;;;;N;;;;; +11F08;KAWI LETTER U;Lo;0;L;;;;;N;;;;; +11F09;KAWI LETTER UU;Lo;0;L;;;;;N;;;;; +11F0A;KAWI LETTER VOCALIC R;Lo;0;L;;;;;N;;;;; +11F0B;KAWI LETTER VOCALIC RR;Lo;0;L;;;;;N;;;;; +11F0C;KAWI LETTER VOCALIC L;Lo;0;L;;;;;N;;;;; +11F0D;KAWI LETTER VOCALIC LL;Lo;0;L;;;;;N;;;;; +11F0E;KAWI LETTER E;Lo;0;L;;;;;N;;;;; +11F0F;KAWI LETTER AI;Lo;0;L;;;;;N;;;;; +11F10;KAWI LETTER O;Lo;0;L;;;;;N;;;;; +11F12;KAWI LETTER KA;Lo;0;L;;;;;N;;;;; +11F13;KAWI LETTER KHA;Lo;0;L;;;;;N;;;;; +11F14;KAWI LETTER GA;Lo;0;L;;;;;N;;;;; +11F15;KAWI LETTER GHA;Lo;0;L;;;;;N;;;;; +11F16;KAWI LETTER NGA;Lo;0;L;;;;;N;;;;; +11F17;KAWI LETTER CA;Lo;0;L;;;;;N;;;;; +11F18;KAWI LETTER CHA;Lo;0;L;;;;;N;;;;; +11F19;KAWI LETTER JA;Lo;0;L;;;;;N;;;;; +11F1A;KAWI LETTER JHA;Lo;0;L;;;;;N;;;;; +11F1B;KAWI LETTER NYA;Lo;0;L;;;;;N;;;;; +11F1C;KAWI LETTER TTA;Lo;0;L;;;;;N;;;;; +11F1D;KAWI LETTER TTHA;Lo;0;L;;;;;N;;;;; +11F1E;KAWI LETTER DDA;Lo;0;L;;;;;N;;;;; +11F1F;KAWI LETTER DDHA;Lo;0;L;;;;;N;;;;; +11F20;KAWI LETTER NNA;Lo;0;L;;;;;N;;;;; +11F21;KAWI LETTER TA;Lo;0;L;;;;;N;;;;; +11F22;KAWI LETTER THA;Lo;0;L;;;;;N;;;;; +11F23;KAWI LETTER DA;Lo;0;L;;;;;N;;;;; +11F24;KAWI LETTER DHA;Lo;0;L;;;;;N;;;;; +11F25;KAWI LETTER NA;Lo;0;L;;;;;N;;;;; +11F26;KAWI LETTER PA;Lo;0;L;;;;;N;;;;; +11F27;KAWI LETTER PHA;Lo;0;L;;;;;N;;;;; +11F28;KAWI LETTER BA;Lo;0;L;;;;;N;;;;; +11F29;KAWI LETTER BHA;Lo;0;L;;;;;N;;;;; +11F2A;KAWI LETTER MA;Lo;0;L;;;;;N;;;;; +11F2B;KAWI LETTER YA;Lo;0;L;;;;;N;;;;; +11F2C;KAWI LETTER RA;Lo;0;L;;;;;N;;;;; +11F2D;KAWI LETTER LA;Lo;0;L;;;;;N;;;;; +11F2E;KAWI LETTER WA;Lo;0;L;;;;;N;;;;; +11F2F;KAWI LETTER SHA;Lo;0;L;;;;;N;;;;; +11F30;KAWI LETTER SSA;Lo;0;L;;;;;N;;;;; +11F31;KAWI LETTER SA;Lo;0;L;;;;;N;;;;; +11F32;KAWI LETTER HA;Lo;0;L;;;;;N;;;;; +11F33;KAWI LETTER JNYA;Lo;0;L;;;;;N;;;;; +11F34;KAWI VOWEL SIGN AA;Mc;0;L;;;;;N;;;;; +11F35;KAWI VOWEL SIGN ALTERNATE AA;Mc;0;L;;;;;N;;;;; +11F36;KAWI VOWEL SIGN I;Mn;0;NSM;;;;;N;;;;; +11F37;KAWI VOWEL SIGN II;Mn;0;NSM;;;;;N;;;;; +11F38;KAWI VOWEL SIGN U;Mn;0;NSM;;;;;N;;;;; +11F39;KAWI VOWEL SIGN UU;Mn;0;NSM;;;;;N;;;;; +11F3A;KAWI VOWEL SIGN VOCALIC R;Mn;0;NSM;;;;;N;;;;; +11F3E;KAWI VOWEL SIGN E;Mc;0;L;;;;;N;;;;; +11F3F;KAWI VOWEL SIGN AI;Mc;0;L;;;;;N;;;;; +11F40;KAWI VOWEL SIGN EU;Mn;0;NSM;;;;;N;;;;; +11F41;KAWI SIGN KILLER;Mc;9;L;;;;;N;;;;; +11F42;KAWI CONJOINER;Mn;9;NSM;;;;;N;;;;; +11F43;KAWI DANDA;Po;0;L;;;;;N;;;;; +11F44;KAWI DOUBLE DANDA;Po;0;L;;;;;N;;;;; +11F45;KAWI PUNCTUATION SECTION MARKER;Po;0;L;;;;;N;;;;; +11F46;KAWI PUNCTUATION ALTERNATE SECTION MARKER;Po;0;L;;;;;N;;;;; +11F47;KAWI PUNCTUATION FLOWER;Po;0;L;;;;;N;;;;; +11F48;KAWI PUNCTUATION SPACE FILLER;Po;0;L;;;;;N;;;;; +11F49;KAWI PUNCTUATION DOT;Po;0;L;;;;;N;;;;; +11F4A;KAWI PUNCTUATION DOUBLE DOT;Po;0;L;;;;;N;;;;; +11F4B;KAWI PUNCTUATION TRIPLE DOT;Po;0;L;;;;;N;;;;; +11F4C;KAWI PUNCTUATION CIRCLE;Po;0;L;;;;;N;;;;; +11F4D;KAWI PUNCTUATION FILLED CIRCLE;Po;0;L;;;;;N;;;;; +11F4E;KAWI PUNCTUATION SPIRAL;Po;0;L;;;;;N;;;;; +11F4F;KAWI PUNCTUATION CLOSING SPIRAL;Po;0;L;;;;;N;;;;; +11F50;KAWI DIGIT ZERO;Nd;0;L;;0;0;0;N;;;;; +11F51;KAWI DIGIT ONE;Nd;0;L;;1;1;1;N;;;;; +11F52;KAWI DIGIT TWO;Nd;0;L;;2;2;2;N;;;;; +11F53;KAWI DIGIT THREE;Nd;0;L;;3;3;3;N;;;;; +11F54;KAWI DIGIT FOUR;Nd;0;L;;4;4;4;N;;;;; +11F55;KAWI DIGIT FIVE;Nd;0;L;;5;5;5;N;;;;; +11F56;KAWI DIGIT SIX;Nd;0;L;;6;6;6;N;;;;; +11F57;KAWI DIGIT SEVEN;Nd;0;L;;7;7;7;N;;;;; +11F58;KAWI DIGIT EIGHT;Nd;0;L;;8;8;8;N;;;;; +11F59;KAWI DIGIT NINE;Nd;0;L;;9;9;9;N;;;;; 11FB0;LISU LETTER YHA;Lo;0;L;;;;;N;;;;; 11FC0;TAMIL FRACTION ONE THREE-HUNDRED-AND-TWENTIETH;No;0;L;;;;1/320;N;;;;; 11FC1;TAMIL FRACTION ONE ONE-HUNDRED-AND-SIXTIETH;No;0;L;;;;1/160;N;;;;; @@ -24040,6 +24144,7 @@ FFFD;REPLACEMENT CHARACTER;So;0;ON;;;;;N;;;;; 1342C;EGYPTIAN HIEROGLYPH AA030;Lo;0;L;;;;;N;;;;; 1342D;EGYPTIAN HIEROGLYPH AA031;Lo;0;L;;;;;N;;;;; 1342E;EGYPTIAN HIEROGLYPH AA032;Lo;0;L;;;;;N;;;;; +1342F;EGYPTIAN HIEROGLYPH V011D;Lo;0;L;;;;;N;;;;; 13430;EGYPTIAN HIEROGLYPH VERTICAL JOINER;Cf;0;L;;;;;N;;;;; 13431;EGYPTIAN HIEROGLYPH HORIZONTAL JOINER;Cf;0;L;;;;;N;;;;; 13432;EGYPTIAN HIEROGLYPH INSERT AT TOP START;Cf;0;L;;;;;N;;;;; @@ -24049,6 +24154,35 @@ FFFD;REPLACEMENT CHARACTER;So;0;ON;;;;;N;;;;; 13436;EGYPTIAN HIEROGLYPH OVERLAY MIDDLE;Cf;0;L;;;;;N;;;;; 13437;EGYPTIAN HIEROGLYPH BEGIN SEGMENT;Cf;0;L;;;;;N;;;;; 13438;EGYPTIAN HIEROGLYPH END SEGMENT;Cf;0;L;;;;;N;;;;; +13439;EGYPTIAN HIEROGLYPH INSERT AT MIDDLE;Cf;0;L;;;;;N;;;;; +1343A;EGYPTIAN HIEROGLYPH INSERT AT TOP;Cf;0;L;;;;;N;;;;; +1343B;EGYPTIAN HIEROGLYPH INSERT AT BOTTOM;Cf;0;L;;;;;N;;;;; +1343C;EGYPTIAN HIEROGLYPH BEGIN ENCLOSURE;Cf;0;L;;;;;N;;;;; +1343D;EGYPTIAN HIEROGLYPH END ENCLOSURE;Cf;0;L;;;;;N;;;;; +1343E;EGYPTIAN HIEROGLYPH BEGIN WALLED ENCLOSURE;Cf;0;L;;;;;N;;;;; +1343F;EGYPTIAN HIEROGLYPH END WALLED ENCLOSURE;Cf;0;L;;;;;N;;;;; +13440;EGYPTIAN HIEROGLYPH MIRROR HORIZONTALLY;Mn;0;NSM;;;;;N;;;;; +13441;EGYPTIAN HIEROGLYPH FULL BLANK;Lo;0;L;;;;;N;;;;; +13442;EGYPTIAN HIEROGLYPH HALF BLANK;Lo;0;L;;;;;N;;;;; +13443;EGYPTIAN HIEROGLYPH LOST SIGN;Lo;0;L;;;;;N;;;;; +13444;EGYPTIAN HIEROGLYPH HALF LOST SIGN;Lo;0;L;;;;;N;;;;; +13445;EGYPTIAN HIEROGLYPH TALL LOST SIGN;Lo;0;L;;;;;N;;;;; +13446;EGYPTIAN HIEROGLYPH WIDE LOST SIGN;Lo;0;L;;;;;N;;;;; +13447;EGYPTIAN HIEROGLYPH MODIFIER DAMAGED AT TOP START;Mn;0;NSM;;;;;N;;;;; +13448;EGYPTIAN HIEROGLYPH MODIFIER DAMAGED AT BOTTOM START;Mn;0;NSM;;;;;N;;;;; +13449;EGYPTIAN HIEROGLYPH MODIFIER DAMAGED AT START;Mn;0;NSM;;;;;N;;;;; +1344A;EGYPTIAN HIEROGLYPH MODIFIER DAMAGED AT TOP END;Mn;0;NSM;;;;;N;;;;; +1344B;EGYPTIAN HIEROGLYPH MODIFIER DAMAGED AT TOP;Mn;0;NSM;;;;;N;;;;; +1344C;EGYPTIAN HIEROGLYPH MODIFIER DAMAGED AT BOTTOM START AND TOP END;Mn;0;NSM;;;;;N;;;;; +1344D;EGYPTIAN HIEROGLYPH MODIFIER DAMAGED AT START AND TOP;Mn;0;NSM;;;;;N;;;;; +1344E;EGYPTIAN HIEROGLYPH MODIFIER DAMAGED AT BOTTOM END;Mn;0;NSM;;;;;N;;;;; +1344F;EGYPTIAN HIEROGLYPH MODIFIER DAMAGED AT TOP START AND BOTTOM END;Mn;0;NSM;;;;;N;;;;; +13450;EGYPTIAN HIEROGLYPH MODIFIER DAMAGED AT BOTTOM;Mn;0;NSM;;;;;N;;;;; +13451;EGYPTIAN HIEROGLYPH MODIFIER DAMAGED AT START AND BOTTOM;Mn;0;NSM;;;;;N;;;;; +13452;EGYPTIAN HIEROGLYPH MODIFIER DAMAGED AT END;Mn;0;NSM;;;;;N;;;;; +13453;EGYPTIAN HIEROGLYPH MODIFIER DAMAGED AT TOP AND END;Mn;0;NSM;;;;;N;;;;; +13454;EGYPTIAN HIEROGLYPH MODIFIER DAMAGED AT BOTTOM AND END;Mn;0;NSM;;;;;N;;;;; +13455;EGYPTIAN HIEROGLYPH MODIFIER DAMAGED;Mn;0;NSM;;;;;N;;;;; 14400;ANATOLIAN HIEROGLYPH A001;Lo;0;L;;;;;N;;;;; 14401;ANATOLIAN HIEROGLYPH A002;Lo;0;L;;;;;N;;;;; 14402;ANATOLIAN HIEROGLYPH A003;Lo;0;L;;;;;N;;;;; @@ -27289,9 +27423,11 @@ FFFD;REPLACEMENT CHARACTER;So;0;ON;;;;;N;;;;; 1B120;KATAKANA LETTER ARCHAIC YI;Lo;0;L;;;;;N;;;;; 1B121;KATAKANA LETTER ARCHAIC YE;Lo;0;L;;;;;N;;;;; 1B122;KATAKANA LETTER ARCHAIC WU;Lo;0;L;;;;;N;;;;; +1B132;HIRAGANA LETTER SMALL KO;Lo;0;L;;;;;N;;;;; 1B150;HIRAGANA LETTER SMALL WI;Lo;0;L;;;;;N;;;;; 1B151;HIRAGANA LETTER SMALL WE;Lo;0;L;;;;;N;;;;; 1B152;HIRAGANA LETTER SMALL WO;Lo;0;L;;;;;N;;;;; +1B155;KATAKANA LETTER SMALL KO;Lo;0;L;;;;;N;;;;; 1B164;KATAKANA LETTER SMALL WI;Lo;0;L;;;;;N;;;;; 1B165;KATAKANA LETTER SMALL WE;Lo;0;L;;;;;N;;;;; 1B166;KATAKANA LETTER SMALL WO;Lo;0;L;;;;;N;;;;; @@ -28573,6 +28709,26 @@ FFFD;REPLACEMENT CHARACTER;So;0;ON;;;;;N;;;;; 1D243;COMBINING GREEK MUSICAL TETRASEME;Mn;230;NSM;;;;;N;;;;; 1D244;COMBINING GREEK MUSICAL PENTASEME;Mn;230;NSM;;;;;N;;;;; 1D245;GREEK MUSICAL LEIMMA;So;0;ON;;;;;N;;;;; +1D2C0;KAKTOVIK NUMERAL ZERO;No;0;ON;;;;0;N;;;;; +1D2C1;KAKTOVIK NUMERAL ONE;No;0;ON;;;;1;N;;;;; +1D2C2;KAKTOVIK NUMERAL TWO;No;0;ON;;;;2;N;;;;; +1D2C3;KAKTOVIK NUMERAL THREE;No;0;ON;;;;3;N;;;;; +1D2C4;KAKTOVIK NUMERAL FOUR;No;0;ON;;;;4;N;;;;; +1D2C5;KAKTOVIK NUMERAL FIVE;No;0;ON;;;;5;N;;;;; +1D2C6;KAKTOVIK NUMERAL SIX;No;0;ON;;;;6;N;;;;; +1D2C7;KAKTOVIK NUMERAL SEVEN;No;0;ON;;;;7;N;;;;; +1D2C8;KAKTOVIK NUMERAL EIGHT;No;0;ON;;;;8;N;;;;; +1D2C9;KAKTOVIK NUMERAL NINE;No;0;ON;;;;9;N;;;;; +1D2CA;KAKTOVIK NUMERAL TEN;No;0;ON;;;;10;N;;;;; +1D2CB;KAKTOVIK NUMERAL ELEVEN;No;0;ON;;;;11;N;;;;; +1D2CC;KAKTOVIK NUMERAL TWELVE;No;0;ON;;;;12;N;;;;; +1D2CD;KAKTOVIK NUMERAL THIRTEEN;No;0;ON;;;;13;N;;;;; +1D2CE;KAKTOVIK NUMERAL FOURTEEN;No;0;ON;;;;14;N;;;;; +1D2CF;KAKTOVIK NUMERAL FIFTEEN;No;0;ON;;;;15;N;;;;; +1D2D0;KAKTOVIK NUMERAL SIXTEEN;No;0;ON;;;;16;N;;;;; +1D2D1;KAKTOVIK NUMERAL SEVENTEEN;No;0;ON;;;;17;N;;;;; +1D2D2;KAKTOVIK NUMERAL EIGHTEEN;No;0;ON;;;;18;N;;;;; +1D2D3;KAKTOVIK NUMERAL NINETEEN;No;0;ON;;;;19;N;;;;; 1D2E0;MAYAN NUMERAL ZERO;No;0;L;;;;0;N;;;;; 1D2E1;MAYAN NUMERAL ONE;No;0;L;;;;1;N;;;;; 1D2E2;MAYAN NUMERAL TWO;No;0;L;;;;2;N;;;;; @@ -30404,6 +30560,12 @@ FFFD;REPLACEMENT CHARACTER;So;0;ON;;;;;N;;;;; 1DF1C;LATIN SMALL LETTER TESH DIGRAPH WITH RETROFLEX HOOK;Ll;0;L;;;;;N;;;;; 1DF1D;LATIN SMALL LETTER C WITH RETROFLEX HOOK;Ll;0;L;;;;;N;;;;; 1DF1E;LATIN SMALL LETTER S WITH CURL;Ll;0;L;;;;;N;;;;; +1DF25;LATIN SMALL LETTER D WITH MID-HEIGHT LEFT HOOK;Ll;0;L;;;;;N;;;;; +1DF26;LATIN SMALL LETTER L WITH MID-HEIGHT LEFT HOOK;Ll;0;L;;;;;N;;;;; +1DF27;LATIN SMALL LETTER N WITH MID-HEIGHT LEFT HOOK;Ll;0;L;;;;;N;;;;; +1DF28;LATIN SMALL LETTER R WITH MID-HEIGHT LEFT HOOK;Ll;0;L;;;;;N;;;;; +1DF29;LATIN SMALL LETTER S WITH MID-HEIGHT LEFT HOOK;Ll;0;L;;;;;N;;;;; +1DF2A;LATIN SMALL LETTER T WITH MID-HEIGHT LEFT HOOK;Ll;0;L;;;;;N;;;;; 1E000;COMBINING GLAGOLITIC LETTER AZU;Mn;230;NSM;;;;;N;;;;; 1E001;COMBINING GLAGOLITIC LETTER BUKY;Mn;230;NSM;;;;;N;;;;; 1E002;COMBINING GLAGOLITIC LETTER VEDE;Mn;230;NSM;;;;;N;;;;; @@ -30442,6 +30604,69 @@ FFFD;REPLACEMENT CHARACTER;So;0;ON;;;;;N;;;;; 1E028;COMBINING GLAGOLITIC LETTER BIG YUS;Mn;230;NSM;;;;;N;;;;; 1E029;COMBINING GLAGOLITIC LETTER IOTATED BIG YUS;Mn;230;NSM;;;;;N;;;;; 1E02A;COMBINING GLAGOLITIC LETTER FITA;Mn;230;NSM;;;;;N;;;;; +1E030;MODIFIER LETTER CYRILLIC SMALL A;Lm;0;L; 0430;;;;N;;;;; +1E031;MODIFIER LETTER CYRILLIC SMALL BE;Lm;0;L; 0431;;;;N;;;;; +1E032;MODIFIER LETTER CYRILLIC SMALL VE;Lm;0;L; 0432;;;;N;;;;; +1E033;MODIFIER LETTER CYRILLIC SMALL GHE;Lm;0;L; 0433;;;;N;;;;; +1E034;MODIFIER LETTER CYRILLIC SMALL DE;Lm;0;L; 0434;;;;N;;;;; +1E035;MODIFIER LETTER CYRILLIC SMALL IE;Lm;0;L; 0435;;;;N;;;;; +1E036;MODIFIER LETTER CYRILLIC SMALL ZHE;Lm;0;L; 0436;;;;N;;;;; +1E037;MODIFIER LETTER CYRILLIC SMALL ZE;Lm;0;L; 0437;;;;N;;;;; +1E038;MODIFIER LETTER CYRILLIC SMALL I;Lm;0;L; 0438;;;;N;;;;; +1E039;MODIFIER LETTER CYRILLIC SMALL KA;Lm;0;L; 043A;;;;N;;;;; +1E03A;MODIFIER LETTER CYRILLIC SMALL EL;Lm;0;L; 043B;;;;N;;;;; +1E03B;MODIFIER LETTER CYRILLIC SMALL EM;Lm;0;L; 043C;;;;N;;;;; +1E03C;MODIFIER LETTER CYRILLIC SMALL O;Lm;0;L; 043E;;;;N;;;;; +1E03D;MODIFIER LETTER CYRILLIC SMALL PE;Lm;0;L; 043F;;;;N;;;;; +1E03E;MODIFIER LETTER CYRILLIC SMALL ER;Lm;0;L; 0440;;;;N;;;;; +1E03F;MODIFIER LETTER CYRILLIC SMALL ES;Lm;0;L; 0441;;;;N;;;;; +1E040;MODIFIER LETTER CYRILLIC SMALL TE;Lm;0;L; 0442;;;;N;;;;; +1E041;MODIFIER LETTER CYRILLIC SMALL U;Lm;0;L; 0443;;;;N;;;;; +1E042;MODIFIER LETTER CYRILLIC SMALL EF;Lm;0;L; 0444;;;;N;;;;; +1E043;MODIFIER LETTER CYRILLIC SMALL HA;Lm;0;L; 0445;;;;N;;;;; +1E044;MODIFIER LETTER CYRILLIC SMALL TSE;Lm;0;L; 0446;;;;N;;;;; +1E045;MODIFIER LETTER CYRILLIC SMALL CHE;Lm;0;L; 0447;;;;N;;;;; +1E046;MODIFIER LETTER CYRILLIC SMALL SHA;Lm;0;L; 0448;;;;N;;;;; +1E047;MODIFIER LETTER CYRILLIC SMALL YERU;Lm;0;L; 044B;;;;N;;;;; +1E048;MODIFIER LETTER CYRILLIC SMALL E;Lm;0;L; 044D;;;;N;;;;; +1E049;MODIFIER LETTER CYRILLIC SMALL YU;Lm;0;L; 044E;;;;N;;;;; +1E04A;MODIFIER LETTER CYRILLIC SMALL DZZE;Lm;0;L; A689;;;;N;;;;; +1E04B;MODIFIER LETTER CYRILLIC SMALL SCHWA;Lm;0;L; 04D9;;;;N;;;;; +1E04C;MODIFIER LETTER CYRILLIC SMALL BYELORUSSIAN-UKRAINIAN I;Lm;0;L; 0456;;;;N;;;;; +1E04D;MODIFIER LETTER CYRILLIC SMALL JE;Lm;0;L; 0458;;;;N;;;;; +1E04E;MODIFIER LETTER CYRILLIC SMALL BARRED O;Lm;0;L; 04E9;;;;N;;;;; +1E04F;MODIFIER LETTER CYRILLIC SMALL STRAIGHT U;Lm;0;L; 04AF;;;;N;;;;; +1E050;MODIFIER LETTER CYRILLIC SMALL PALOCHKA;Lm;0;L; 04CF;;;;N;;;;; +1E051;CYRILLIC SUBSCRIPT SMALL LETTER A;Lm;0;L; 0430;;;;N;;;;; +1E052;CYRILLIC SUBSCRIPT SMALL LETTER BE;Lm;0;L; 0431;;;;N;;;;; +1E053;CYRILLIC SUBSCRIPT SMALL LETTER VE;Lm;0;L; 0432;;;;N;;;;; +1E054;CYRILLIC SUBSCRIPT SMALL LETTER GHE;Lm;0;L; 0433;;;;N;;;;; +1E055;CYRILLIC SUBSCRIPT SMALL LETTER DE;Lm;0;L; 0434;;;;N;;;;; +1E056;CYRILLIC SUBSCRIPT SMALL LETTER IE;Lm;0;L; 0435;;;;N;;;;; +1E057;CYRILLIC SUBSCRIPT SMALL LETTER ZHE;Lm;0;L; 0436;;;;N;;;;; +1E058;CYRILLIC SUBSCRIPT SMALL LETTER ZE;Lm;0;L; 0437;;;;N;;;;; +1E059;CYRILLIC SUBSCRIPT SMALL LETTER I;Lm;0;L; 0438;;;;N;;;;; +1E05A;CYRILLIC SUBSCRIPT SMALL LETTER KA;Lm;0;L; 043A;;;;N;;;;; +1E05B;CYRILLIC SUBSCRIPT SMALL LETTER EL;Lm;0;L; 043B;;;;N;;;;; +1E05C;CYRILLIC SUBSCRIPT SMALL LETTER O;Lm;0;L; 043E;;;;N;;;;; +1E05D;CYRILLIC SUBSCRIPT SMALL LETTER PE;Lm;0;L; 043F;;;;N;;;;; +1E05E;CYRILLIC SUBSCRIPT SMALL LETTER ES;Lm;0;L; 0441;;;;N;;;;; +1E05F;CYRILLIC SUBSCRIPT SMALL LETTER U;Lm;0;L; 0443;;;;N;;;;; +1E060;CYRILLIC SUBSCRIPT SMALL LETTER EF;Lm;0;L; 0444;;;;N;;;;; +1E061;CYRILLIC SUBSCRIPT SMALL LETTER HA;Lm;0;L; 0445;;;;N;;;;; +1E062;CYRILLIC SUBSCRIPT SMALL LETTER TSE;Lm;0;L; 0446;;;;N;;;;; +1E063;CYRILLIC SUBSCRIPT SMALL LETTER CHE;Lm;0;L; 0447;;;;N;;;;; +1E064;CYRILLIC SUBSCRIPT SMALL LETTER SHA;Lm;0;L; 0448;;;;N;;;;; +1E065;CYRILLIC SUBSCRIPT SMALL LETTER HARD SIGN;Lm;0;L; 044A;;;;N;;;;; +1E066;CYRILLIC SUBSCRIPT SMALL LETTER YERU;Lm;0;L; 044B;;;;N;;;;; +1E067;CYRILLIC SUBSCRIPT SMALL LETTER GHE WITH UPTURN;Lm;0;L; 0491;;;;N;;;;; +1E068;CYRILLIC SUBSCRIPT SMALL LETTER BYELORUSSIAN-UKRAINIAN I;Lm;0;L; 0456;;;;N;;;;; +1E069;CYRILLIC SUBSCRIPT SMALL LETTER DZE;Lm;0;L; 0455;;;;N;;;;; +1E06A;CYRILLIC SUBSCRIPT SMALL LETTER DZHE;Lm;0;L; 045F;;;;N;;;;; +1E06B;MODIFIER LETTER CYRILLIC SMALL ES WITH DESCENDER;Lm;0;L; 04AB;;;;N;;;;; +1E06C;MODIFIER LETTER CYRILLIC SMALL YERU WITH BACK YER;Lm;0;L; A651;;;;N;;;;; +1E06D;MODIFIER LETTER CYRILLIC SMALL STRAIGHT U WITH STROKE;Lm;0;L; 04B1;;;;N;;;;; +1E08F;COMBINING CYRILLIC SMALL LETTER BYELORUSSIAN-UKRAINIAN I;Mn;230;NSM;;;;;N;;;;; 1E100;NYIAKENG PUACHUE HMONG LETTER MA;Lo;0;L;;;;;N;;;;; 1E101;NYIAKENG PUACHUE HMONG LETTER TSA;Lo;0;L;;;;;N;;;;; 1E102;NYIAKENG PUACHUE HMONG LETTER NTA;Lo;0;L;;;;;N;;;;; @@ -30603,6 +30828,48 @@ FFFD;REPLACEMENT CHARACTER;So;0;ON;;;;;N;;;;; 1E2F8;WANCHO DIGIT EIGHT;Nd;0;L;;8;8;8;N;;;;; 1E2F9;WANCHO DIGIT NINE;Nd;0;L;;9;9;9;N;;;;; 1E2FF;WANCHO NGUN SIGN;Sc;0;ET;;;;;N;;;;; +1E4D0;NAG MUNDARI LETTER O;Lo;0;L;;;;;N;;;;; +1E4D1;NAG MUNDARI LETTER OP;Lo;0;L;;;;;N;;;;; +1E4D2;NAG MUNDARI LETTER OL;Lo;0;L;;;;;N;;;;; +1E4D3;NAG MUNDARI LETTER OY;Lo;0;L;;;;;N;;;;; +1E4D4;NAG MUNDARI LETTER ONG;Lo;0;L;;;;;N;;;;; +1E4D5;NAG MUNDARI LETTER A;Lo;0;L;;;;;N;;;;; +1E4D6;NAG MUNDARI LETTER AJ;Lo;0;L;;;;;N;;;;; +1E4D7;NAG MUNDARI LETTER AB;Lo;0;L;;;;;N;;;;; +1E4D8;NAG MUNDARI LETTER ANY;Lo;0;L;;;;;N;;;;; +1E4D9;NAG MUNDARI LETTER AH;Lo;0;L;;;;;N;;;;; +1E4DA;NAG MUNDARI LETTER I;Lo;0;L;;;;;N;;;;; +1E4DB;NAG MUNDARI LETTER IS;Lo;0;L;;;;;N;;;;; +1E4DC;NAG MUNDARI LETTER IDD;Lo;0;L;;;;;N;;;;; +1E4DD;NAG MUNDARI LETTER IT;Lo;0;L;;;;;N;;;;; +1E4DE;NAG MUNDARI LETTER IH;Lo;0;L;;;;;N;;;;; +1E4DF;NAG MUNDARI LETTER U;Lo;0;L;;;;;N;;;;; +1E4E0;NAG MUNDARI LETTER UC;Lo;0;L;;;;;N;;;;; +1E4E1;NAG MUNDARI LETTER UD;Lo;0;L;;;;;N;;;;; +1E4E2;NAG MUNDARI LETTER UK;Lo;0;L;;;;;N;;;;; +1E4E3;NAG MUNDARI LETTER UR;Lo;0;L;;;;;N;;;;; +1E4E4;NAG MUNDARI LETTER E;Lo;0;L;;;;;N;;;;; +1E4E5;NAG MUNDARI LETTER ENN;Lo;0;L;;;;;N;;;;; +1E4E6;NAG MUNDARI LETTER EG;Lo;0;L;;;;;N;;;;; +1E4E7;NAG MUNDARI LETTER EM;Lo;0;L;;;;;N;;;;; +1E4E8;NAG MUNDARI LETTER EN;Lo;0;L;;;;;N;;;;; +1E4E9;NAG MUNDARI LETTER ETT;Lo;0;L;;;;;N;;;;; +1E4EA;NAG MUNDARI LETTER ELL;Lo;0;L;;;;;N;;;;; +1E4EB;NAG MUNDARI SIGN OJOD;Lm;0;L;;;;;N;;;;; +1E4EC;NAG MUNDARI SIGN MUHOR;Mn;232;NSM;;;;;N;;;;; +1E4ED;NAG MUNDARI SIGN TOYOR;Mn;232;NSM;;;;;N;;;;; +1E4EE;NAG MUNDARI SIGN IKIR;Mn;220;NSM;;;;;N;;;;; +1E4EF;NAG MUNDARI SIGN SUTUH;Mn;230;NSM;;;;;N;;;;; +1E4F0;NAG MUNDARI DIGIT ZERO;Nd;0;L;;0;0;0;N;;;;; +1E4F1;NAG MUNDARI DIGIT ONE;Nd;0;L;;1;1;1;N;;;;; +1E4F2;NAG MUNDARI DIGIT TWO;Nd;0;L;;2;2;2;N;;;;; +1E4F3;NAG MUNDARI DIGIT THREE;Nd;0;L;;3;3;3;N;;;;; +1E4F4;NAG MUNDARI DIGIT FOUR;Nd;0;L;;4;4;4;N;;;;; +1E4F5;NAG MUNDARI DIGIT FIVE;Nd;0;L;;5;5;5;N;;;;; +1E4F6;NAG MUNDARI DIGIT SIX;Nd;0;L;;6;6;6;N;;;;; +1E4F7;NAG MUNDARI DIGIT SEVEN;Nd;0;L;;7;7;7;N;;;;; +1E4F8;NAG MUNDARI DIGIT EIGHT;Nd;0;L;;8;8;8;N;;;;; +1E4F9;NAG MUNDARI DIGIT NINE;Nd;0;L;;9;9;9;N;;;;; 1E7E0;ETHIOPIC SYLLABLE HHYA;Lo;0;L;;;;;N;;;;; 1E7E1;ETHIOPIC SYLLABLE HHYU;Lo;0;L;;;;;N;;;;; 1E7E2;ETHIOPIC SYLLABLE HHYI;Lo;0;L;;;;;N;;;;; @@ -32678,6 +32945,7 @@ FFFD;REPLACEMENT CHARACTER;So;0;ON;;;;;N;;;;; 1F6D5;HINDU TEMPLE;So;0;ON;;;;;N;;;;; 1F6D6;HUT;So;0;ON;;;;;N;;;;; 1F6D7;ELEVATOR;So;0;ON;;;;;N;;;;; +1F6DC;WIRELESS;So;0;ON;;;;;N;;;;; 1F6DD;PLAYGROUND SLIDE;So;0;ON;;;;;N;;;;; 1F6DE;WHEEL;So;0;ON;;;;;N;;;;; 1F6DF;RING BUOY;So;0;ON;;;;;N;;;;; @@ -32823,6 +33091,14 @@ FFFD;REPLACEMENT CHARACTER;So;0;ON;;;;;N;;;;; 1F771;ALCHEMICAL SYMBOL FOR MONTH;So;0;ON;;;;;N;;;;; 1F772;ALCHEMICAL SYMBOL FOR HALF DRAM;So;0;ON;;;;;N;;;;; 1F773;ALCHEMICAL SYMBOL FOR HALF OUNCE;So;0;ON;;;;;N;;;;; +1F774;LOT OF FORTUNE;So;0;ON;;;;;N;;;;; +1F775;OCCULTATION;So;0;ON;;;;;N;;;;; +1F776;LUNAR ECLIPSE;So;0;ON;;;;;N;;;;; +1F77B;HAUMEA;So;0;ON;;;;;N;;;;; +1F77C;MAKEMAKE;So;0;ON;;;;;N;;;;; +1F77D;GONGGONG;So;0;ON;;;;;N;;;;; +1F77E;QUAOAR;So;0;ON;;;;;N;;;;; +1F77F;ORCUS;So;0;ON;;;;;N;;;;; 1F780;BLACK LEFT-POINTING ISOSCELES RIGHT TRIANGLE;So;0;ON;;;;;N;;;;; 1F781;BLACK UP-POINTING ISOSCELES RIGHT TRIANGLE;So;0;ON;;;;;N;;;;; 1F782;BLACK RIGHT-POINTING ISOSCELES RIGHT TRIANGLE;So;0;ON;;;;;N;;;;; @@ -32912,6 +33188,7 @@ FFFD;REPLACEMENT CHARACTER;So;0;ON;;;;;N;;;;; 1F7D6;NEGATIVE CIRCLED TRIANGLE;So;0;ON;;;;;N;;;;; 1F7D7;CIRCLED SQUARE;So;0;ON;;;;;N;;;;; 1F7D8;NEGATIVE CIRCLED SQUARE;So;0;ON;;;;;N;;;;; +1F7D9;NINE POINTED WHITE STAR;So;0;ON;;;;;N;;;;; 1F7E0;LARGE ORANGE CIRCLE;So;0;ON;;;;;N;;;;; 1F7E1;LARGE YELLOW CIRCLE;So;0;ON;;;;;N;;;;; 1F7E2;LARGE GREEN CIRCLE;So;0;ON;;;;;N;;;;; @@ -33434,6 +33711,9 @@ FFFD;REPLACEMENT CHARACTER;So;0;ON;;;;;N;;;;; 1FA72;BRIEFS;So;0;ON;;;;;N;;;;; 1FA73;SHORTS;So;0;ON;;;;;N;;;;; 1FA74;THONG SANDAL;So;0;ON;;;;;N;;;;; +1FA75;LIGHT BLUE HEART;So;0;ON;;;;;N;;;;; +1FA76;GREY HEART;So;0;ON;;;;;N;;;;; +1FA77;PINK HEART;So;0;ON;;;;;N;;;;; 1FA78;DROP OF BLOOD;So;0;ON;;;;;N;;;;; 1FA79;ADHESIVE BANDAGE;So;0;ON;;;;;N;;;;; 1FA7A;STETHOSCOPE;So;0;ON;;;;;N;;;;; @@ -33446,6 +33726,8 @@ FFFD;REPLACEMENT CHARACTER;So;0;ON;;;;;N;;;;; 1FA84;MAGIC WAND;So;0;ON;;;;;N;;;;; 1FA85;PINATA;So;0;ON;;;;;N;;;;; 1FA86;NESTING DOLLS;So;0;ON;;;;;N;;;;; +1FA87;MARACAS;So;0;ON;;;;;N;;;;; +1FA88;FLUTE;So;0;ON;;;;;N;;;;; 1FA90;RINGED PLANET;So;0;ON;;;;;N;;;;; 1FA91;CHAIR;So;0;ON;;;;;N;;;;; 1FA92;RAZOR;So;0;ON;;;;;N;;;;; @@ -33475,6 +33757,9 @@ FFFD;REPLACEMENT CHARACTER;So;0;ON;;;;;N;;;;; 1FAAA;IDENTIFICATION CARD;So;0;ON;;;;;N;;;;; 1FAAB;LOW BATTERY;So;0;ON;;;;;N;;;;; 1FAAC;HAMSA;So;0;ON;;;;;N;;;;; +1FAAD;FOLDING HAND FAN;So;0;ON;;;;;N;;;;; +1FAAE;HAIR PICK;So;0;ON;;;;;N;;;;; +1FAAF;KHANDA;So;0;ON;;;;;N;;;;; 1FAB0;FLY;So;0;ON;;;;;N;;;;; 1FAB1;WORM;So;0;ON;;;;;N;;;;; 1FAB2;BEETLE;So;0;ON;;;;;N;;;;; @@ -33486,12 +33771,18 @@ FFFD;REPLACEMENT CHARACTER;So;0;ON;;;;;N;;;;; 1FAB8;CORAL;So;0;ON;;;;;N;;;;; 1FAB9;EMPTY NEST;So;0;ON;;;;;N;;;;; 1FABA;NEST WITH EGGS;So;0;ON;;;;;N;;;;; +1FABB;HYACINTH;So;0;ON;;;;;N;;;;; +1FABC;JELLYFISH;So;0;ON;;;;;N;;;;; +1FABD;WING;So;0;ON;;;;;N;;;;; +1FABF;GOOSE;So;0;ON;;;;;N;;;;; 1FAC0;ANATOMICAL HEART;So;0;ON;;;;;N;;;;; 1FAC1;LUNGS;So;0;ON;;;;;N;;;;; 1FAC2;PEOPLE HUGGING;So;0;ON;;;;;N;;;;; 1FAC3;PREGNANT MAN;So;0;ON;;;;;N;;;;; 1FAC4;PREGNANT PERSON;So;0;ON;;;;;N;;;;; 1FAC5;PERSON WITH CROWN;So;0;ON;;;;;N;;;;; +1FACE;MOOSE;So;0;ON;;;;;N;;;;; +1FACF;DONKEY;So;0;ON;;;;;N;;;;; 1FAD0;BLUEBERRIES;So;0;ON;;;;;N;;;;; 1FAD1;BELL PEPPER;So;0;ON;;;;;N;;;;; 1FAD2;OLIVE;So;0;ON;;;;;N;;;;; @@ -33502,6 +33793,8 @@ FFFD;REPLACEMENT CHARACTER;So;0;ON;;;;;N;;;;; 1FAD7;POURING LIQUID;So;0;ON;;;;;N;;;;; 1FAD8;BEANS;So;0;ON;;;;;N;;;;; 1FAD9;JAR;So;0;ON;;;;;N;;;;; +1FADA;GINGER ROOT;So;0;ON;;;;;N;;;;; +1FADB;PEA POD;So;0;ON;;;;;N;;;;; 1FAE0;MELTING FACE;So;0;ON;;;;;N;;;;; 1FAE1;SALUTING FACE;So;0;ON;;;;;N;;;;; 1FAE2;FACE WITH OPEN EYES AND HAND OVER MOUTH;So;0;ON;;;;;N;;;;; @@ -33510,6 +33803,7 @@ FFFD;REPLACEMENT CHARACTER;So;0;ON;;;;;N;;;;; 1FAE5;DOTTED LINE FACE;So;0;ON;;;;;N;;;;; 1FAE6;BITING LIP;So;0;ON;;;;;N;;;;; 1FAE7;BUBBLES;So;0;ON;;;;;N;;;;; +1FAE8;SHAKING FACE;So;0;ON;;;;;N;;;;; 1FAF0;HAND WITH INDEX FINGER AND THUMB CROSSED;So;0;ON;;;;;N;;;;; 1FAF1;RIGHTWARDS HAND;So;0;ON;;;;;N;;;;; 1FAF2;LEFTWARDS HAND;So;0;ON;;;;;N;;;;; @@ -33517,6 +33811,8 @@ FFFD;REPLACEMENT CHARACTER;So;0;ON;;;;;N;;;;; 1FAF4;PALM UP HAND;So;0;ON;;;;;N;;;;; 1FAF5;INDEX POINTING AT THE VIEWER;So;0;ON;;;;;N;;;;; 1FAF6;HEART HANDS;So;0;ON;;;;;N;;;;; +1FAF7;LEFTWARDS PUSHING HAND;So;0;ON;;;;;N;;;;; +1FAF8;RIGHTWARDS PUSHING HAND;So;0;ON;;;;;N;;;;; 1FB00;BLOCK SEXTANT-1;So;0;ON;;;;;N;;;;; 1FB01;BLOCK SEXTANT-2;So;0;ON;;;;;N;;;;; 1FB02;BLOCK SEXTANT-12;So;0;ON;;;;;N;;;;; @@ -33732,7 +34028,7 @@ FFFD;REPLACEMENT CHARACTER;So;0;ON;;;;;N;;;;; 20000;;Lo;0;L;;;;;N;;;;; 2A6DF;;Lo;0;L;;;;;N;;;;; 2A700;;Lo;0;L;;;;;N;;;;; -2B738;;Lo;0;L;;;;;N;;;;; +2B739;;Lo;0;L;;;;;N;;;;; 2B740;;Lo;0;L;;;;;N;;;;; 2B81D;;Lo;0;L;;;;;N;;;;; 2B820;;Lo;0;L;;;;;N;;;;; @@ -34283,6 +34579,8 @@ FFFD;REPLACEMENT CHARACTER;So;0;ON;;;;;N;;;;; 2FA1D;CJK COMPATIBILITY IDEOGRAPH-2FA1D;Lo;0;L;2A600;;;;N;;;;; 30000;;Lo;0;L;;;;;N;;;;; 3134A;;Lo;0;L;;;;;N;;;;; +31350;;Lo;0;L;;;;;N;;;;; +323AF;;Lo;0;L;;;;;N;;;;; E0001;LANGUAGE TAG;Cf;0;BN;;;;;N;;;;; E0020;TAG SPACE;Cf;0;BN;;;;;N;;;;; E0021;TAG EXCLAMATION MARK;Cf;0;BN;;;;;N;;;;; diff --git a/icu4c/source/data/unidata/changes.txt b/icu4c/source/data/unidata/changes.txt index 031b75584c3..d928abb17e0 100644 --- a/icu4c/source/data/unidata/changes.txt +++ b/icu4c/source/data/unidata/changes.txt @@ -68,15 +68,22 @@ export LD_LIBRARY_PATH=$ICU_ROOT/dbg/icu4c/lib - mkdir -p $UNICODE_DATA - download Unicode files into $UNICODE_DATA + subfolders: emoji, idna, security, ucd, uca - + inside ucd: extract Unihan.zip to "here" (.../ucd/Unihan/*.txt), delete Unihan.zip - + split Unihan into single-property files - ~/unitools/mine/src$ py/splitunihan.py $UNICODE_DATA/ucd/Unihan + + old way of fetching files: from the "Public" area on unicode.org + ~ inside ucd: extract Unihan.zip to "here" (.../ucd/Unihan/*.txt), delete Unihan.zip + ~ split Unihan into single-property files + ~/unitools/mine/src$ py/splitunihan.py $UNICODE_DATA/ucd/Unihan + + new way of fetching files, if available: + copy the files from a Unicode Tools workspace that is up to date with + https://github.com/unicode-org/unicodetools + and which might at this point be *ahead* of "Public" + ~ before the Unicode release copy files from "dev" subfolders, for example + https://github.com/unicode-org/unicodetools/tree/main/unicodetools/data/ucd/dev + get GraphemeBreakTest-cldr.txt from $CLDR_SRC/common/properties/segments/GraphemeBreakTest.txt or from the UCD/cldr/ output folder of the Unicode Tools: Since Unicode 12/CLDR 35/ICU 64 CLDR uses modified break rules. cp $CLDR_SRC/common/properties/segments/GraphemeBreakTest.txt icu4c/source/test/testdata or - cp ~/unitools/mine/Generated/UCD/d19/cldr/GraphemeBreakTest-cldr-14.0.0d19.txt icu4c/source/test/testdata/GraphemeBreakTest.txt + cp ~/unitools/mine/Generated/UCD/15.0.0/cldr/GraphemeBreakTest-cldr.txt icu4c/source/test/testdata/GraphemeBreakTest.txt * for manual diffs and for Unicode Tools input data updates: remove version suffixes from the file names @@ -94,52 +101,32 @@ export LD_LIBRARY_PATH=$ICU_ROOT/dbg/icu4c/lib * new constants for new property values - preparseucd.py error: - ValueError: missing uchar.h enum constants for some property values: - [(u'blk', set([u'Toto', u'Tangsa', u'Cypro_Minoan', u'Arabic_Ext_B', u'Vithkuqi', u'Old_Uyghur', u'Latin_Ext_F', u'UCAS_Ext_A', u'Kana_Ext_B', u'Ethiopic_Ext_B', u'Latin_Ext_G', u'Znamenny_Music'])), - (u'jg', set([u'Vertical_Tail', u'Thin_Yeh'])), - (u'sc', set([u'Toto', u'Ougr', u'Vith', u'Tnsa', u'Cpmn']))] + ValueError: missing uchar.h enum constants for some property values: [('blk', {'Nag_Mundari', 'CJK_Ext_H', 'Kawi', 'Kaktovik_Numerals', 'Devanagari_Ext_A', 'Arabic_Ext_C', 'Cyrillic_Ext_D'}), ('sc', {'Nagm', 'Kawi'})] = PropertyValueAliases.txt new property values (diff old & new .txt files) - ~/unidata$ diff -u uni13/20200304/ucd/PropertyValueAliases.txt uni14/20210609/ucd/PropertyValueAliases.txt | egrep '^[-+][a-zA-Z]' - +age; 14.0 ; V14_0 - +blk; Arabic_Ext_B ; Arabic_Extended_B - +blk; Cypro_Minoan ; Cypro_Minoan - +blk; Ethiopic_Ext_B ; Ethiopic_Extended_B - +blk; Kana_Ext_B ; Kana_Extended_B - +blk; Latin_Ext_F ; Latin_Extended_F - +blk; Latin_Ext_G ; Latin_Extended_G - +blk; Old_Uyghur ; Old_Uyghur - +blk; Tangsa ; Tangsa - +blk; Toto ; Toto - +blk; UCAS_Ext_A ; Unified_Canadian_Aboriginal_Syllabics_Extended_A - +blk; Vithkuqi ; Vithkuqi - +blk; Znamenny_Music ; Znamenny_Musical_Notation - +jg ; Thin_Yeh ; Thin_Yeh - +jg ; Vertical_Tail ; Vertical_Tail - +sc ; Cpmn ; Cypro_Minoan - +sc ; Ougr ; Old_Uyghur - +sc ; Tnsa ; Tangsa - +sc ; Toto ; Toto - +sc ; Vith ; Vithkuqi + ~/unidata$ diff -u uni14/20210922/ucd/PropertyValueAliases.txt uni15/beta/ucd/PropertyValueAliases.txt | egrep '^[-+][a-zA-Z]' + +age; 15.0 ; V15_0 + +blk; Arabic_Ext_C ; Arabic_Extended_C + +blk; CJK_Ext_H ; CJK_Unified_Ideographs_Extension_H + +blk; Cyrillic_Ext_D ; Cyrillic_Extended_D + +blk; Devanagari_Ext_A ; Devanagari_Extended_A + +blk; Kaktovik_Numerals ; Kaktovik_Numerals + +blk; Kawi ; Kawi + +blk; Nag_Mundari ; Nag_Mundari + +sc ; Kawi ; Kawi + +sc ; Nagm ; Nag_Mundari -> add new blocks to uchar.h before UBLOCK_COUNT use long property names for enum constants, for the trailing comment get the block start code point: diff old & new Blocks.txt - ~/unidata$ diff -u uni13/20200304/ucd/Blocks.txt uni14/20210609/ucd/Blocks.txt | egrep '^[-+][0-9A-Z]' - +0870..089F; Arabic Extended-B - +10570..105BF; Vithkuqi - +10780..107BF; Latin Extended-F - +10F70..10FAF; Old Uyghur - -11700..1173F; Ahom - +11700..1174F; Ahom - +11AB0..11ABF; Unified Canadian Aboriginal Syllabics Extended-A - +12F90..12FFF; Cypro-Minoan - +16A70..16ACF; Tangsa - -18D00..18D8F; Tangut Supplement - +18D00..18D7F; Tangut Supplement - +1AFF0..1AFFF; Kana Extended-B - +1CF00..1CFCF; Znamenny Musical Notation - +1DF00..1DFFF; Latin Extended-G - +1E290..1E2BF; Toto - +1E7E0..1E7FF; Ethiopic Extended-B + ~/unidata$ diff -u uni14/20210922/ucd/Blocks.txt uni15/beta/ucd/Blocks.txt | egrep '^[-+][0-9A-Z]' + +10EC0..10EFF; Arabic Extended-C + +11B00..11B5F; Devanagari Extended-A + +11F00..11F5F; Kawi + -13430..1343F; Egyptian Hieroglyph Format Controls + +13430..1345F; Egyptian Hieroglyph Format Controls + +1D2C0..1D2DF; Kaktovik Numerals + +1E030..1E08F; Cyrillic Extended-D + +1E4D0..1E4FF; Nag Mundari + +31350..323AF; CJK Unified Ideographs Extension H (ignore blocks whose end code point changed) -> add new blocks to UCharacter.UnicodeBlock IDs Eclipse find UBLOCK_([^ ]+) = ([0-9]+), (/.+) @@ -152,7 +139,6 @@ export LD_LIBRARY_PATH=$ICU_ROOT/dbg/icu4c/lib replace public static final int \1 = \2; \3 -> for new scripts: fix expectedLong names in cintltst/cucdapi.c/TestUScriptCodeAPI() and in com.ibm.icu.dev.test.lang.TestUScript.java - -> add new joining groups to uchar.h & UCharacter.JoiningGroup * update Script metadata: SCRIPT_PROPS[] in uscript_props.cpp & UScript.ScriptMetadata (not strictly necessary for NOT_ENCODED scripts) @@ -163,6 +149,8 @@ export LD_LIBRARY_PATH=$ICU_ROOT/dbg/icu4c/lib $ICU_ROOT/dbg/icu4c$ echo;echo; date; make -j7 tests &> out.txt ; tail -n 30 out.txt ; date +TODO + * update spoof checker UnicodeSet initializers: inclusionPat & recommendedPat in i18n/uspoof.cpp INCLUSION & RECOMMENDED in SpoofChecker.java diff --git a/icu4c/source/data/unidata/confusables.txt b/icu4c/source/data/unidata/confusables.txt index 371612c607c..3b65d309f9a 100644 --- a/icu4c/source/data/unidata/confusables.txt +++ b/icu4c/source/data/unidata/confusables.txt @@ -1,13 +1,13 @@ # confusables.txt -# Date: 2021-05-29, 22:09:29 GMT -# © 2021 Unicode®, Inc. +# Date: 2022-05-18, 21:51:56 GMT +# © 2022 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. -# For terms of use, see http://www.unicode.org/terms_of_use.html +# For terms of use, see https://www.unicode.org/terms_of_use.html # # Unicode Security Mechanisms for UTS #39 -# Version: 14.0.0 +# Version: 15.0.0 # -# For documentation and usage, see http://www.unicode.org/reports/tr39 +# For documentation and usage, see https://www.unicode.org/reports/tr39 # 05AD ; 0596 ; MA # ( ֭ → ֖ ) HEBREW ACCENT DEHI → HEBREW ACCENT TIPEHA # @@ -2761,11 +2761,11 @@ FE87 ; 006C 0655 ; MA # ( ‎ﺇ‎ → lٕ ) ARABIC LETTER ALEF WITH HAMZA BELO 02AB ; 006C 007A ; MA # ( ʫ → lz ) LATIN SMALL LETTER LZ DIGRAPH → LATIN SMALL LETTER L, LATIN SMALL LETTER Z # +0675 ; 006C 0674 ; MA # ( ‎ٵ‎ → ‎lٴ‎ ) ARABIC LETTER HIGH HAMZA ALEF → LATIN SMALL LETTER L, ARABIC LETTER HIGH HAMZA # →‎اٴ‎→ 0623 ; 006C 0674 ; MA # ( ‎أ‎ → ‎lٴ‎ ) ARABIC LETTER ALEF WITH HAMZA ABOVE → LATIN SMALL LETTER L, ARABIC LETTER HIGH HAMZA # →‎ٵ‎→→‎اٴ‎→ FE84 ; 006C 0674 ; MA # ( ‎ﺄ‎ → ‎lٴ‎ ) ARABIC LETTER ALEF WITH HAMZA ABOVE FINAL FORM → LATIN SMALL LETTER L, ARABIC LETTER HIGH HAMZA # →‎أ‎→→‎ٵ‎→→‎اٴ‎→ FE83 ; 006C 0674 ; MA # ( ‎ﺃ‎ → ‎lٴ‎ ) ARABIC LETTER ALEF WITH HAMZA ABOVE ISOLATED FORM → LATIN SMALL LETTER L, ARABIC LETTER HIGH HAMZA # →‎ٵ‎→→‎اٴ‎→ 0672 ; 006C 0674 ; MA # ( ‎ٲ‎ → ‎lٴ‎ ) ARABIC LETTER ALEF WITH WAVY HAMZA ABOVE → LATIN SMALL LETTER L, ARABIC LETTER HIGH HAMZA # →‎أ‎→→‎ٵ‎→→‎اٴ‎→ -0675 ; 006C 0674 ; MA # ( ‎ٵ‎ → ‎lٴ‎ ) ARABIC LETTER HIGH HAMZA ALEF → LATIN SMALL LETTER L, ARABIC LETTER HIGH HAMZA # →‎اٴ‎→ FDF3 ; 006C 0643 0628 0631 ; MA # ( ‎ﷳ‎ → ‎lكبر‎ ) ARABIC LIGATURE AKBAR ISOLATED FORM → LATIN SMALL LETTER L, ARABIC LETTER KAF, ARABIC LETTER BEH, ARABIC LETTER REH # →‎اكبر‎→ @@ -5351,10 +5351,10 @@ FBE2 ; 0648 0302 ; MA # ( ‎ﯢ‎ → ‎و̂‎ ) ARABIC LETTER KIRGHIZ YU IS FBDC ; 0648 0670 ; MA # ( ‎ﯜ‎ → ‎وٰ‎ ) ARABIC LETTER YU FINAL FORM → ARABIC LETTER WAW, ARABIC LETTER SUPERSCRIPT ALEF # →‎ۈ‎→ FBDB ; 0648 0670 ; MA # ( ‎ﯛ‎ → ‎وٰ‎ ) ARABIC LETTER YU ISOLATED FORM → ARABIC LETTER WAW, ARABIC LETTER SUPERSCRIPT ALEF # →‎ۈ‎→ +0676 ; 0648 0674 ; MA # ( ‎ٶ‎ → ‎وٴ‎ ) ARABIC LETTER HIGH HAMZA WAW → ARABIC LETTER WAW, ARABIC LETTER HIGH HAMZA # 0624 ; 0648 0674 ; MA # ( ‎ؤ‎ → ‎وٴ‎ ) ARABIC LETTER WAW WITH HAMZA ABOVE → ARABIC LETTER WAW, ARABIC LETTER HIGH HAMZA # →‎ٶ‎→ FE86 ; 0648 0674 ; MA # ( ‎ﺆ‎ → ‎وٴ‎ ) ARABIC LETTER WAW WITH HAMZA ABOVE FINAL FORM → ARABIC LETTER WAW, ARABIC LETTER HIGH HAMZA # →‎ٶ‎→ FE85 ; 0648 0674 ; MA # ( ‎ﺅ‎ → ‎وٴ‎ ) ARABIC LETTER WAW WITH HAMZA ABOVE ISOLATED FORM → ARABIC LETTER WAW, ARABIC LETTER HIGH HAMZA # →‎ٶ‎→ -0676 ; 0648 0674 ; MA # ( ‎ٶ‎ → ‎وٴ‎ ) ARABIC LETTER HIGH HAMZA WAW → ARABIC LETTER WAW, ARABIC LETTER HIGH HAMZA # 0677 ; 0648 0313 0674 ; MA # ( ‎ٷ‎ → ‎و̓ٴ‎ ) ARABIC LETTER U WITH HAMZA ABOVE → ARABIC LETTER WAW, COMBINING COMMA ABOVE, ARABIC LETTER HIGH HAMZA # →‎ۇٴ‎→ FBDD ; 0648 0313 0674 ; MA # ( ‎ﯝ‎ → ‎و̓ٴ‎ ) ARABIC LETTER U WITH HAMZA ABOVE ISOLATED FORM → ARABIC LETTER WAW, COMBINING COMMA ABOVE, ARABIC LETTER HIGH HAMZA # →‎ۇٴ‎→ @@ -5446,12 +5446,12 @@ FCF1 ; 0649 006F ; MA # ( ‎ﳱ‎ → ‎ىo‎ ) ARABIC LIGATURE YEH WITH HEH FCE6 ; 0649 06DB 006F ; MA # ( ‎ﳦ‎ → ‎ىۛo‎ ) ARABIC LIGATURE THEH WITH HEH MEDIAL FORM → ARABIC LETTER ALEF MAKSURA, ARABIC SMALL HIGH THREE DOTS, LATIN SMALL LETTER O # →‎ثه‎→ +0678 ; 0649 0674 ; MA # ( ‎ٸ‎ → ‎ىٴ‎ ) ARABIC LETTER HIGH HAMZA YEH → ARABIC LETTER ALEF MAKSURA, ARABIC LETTER HIGH HAMZA # →‎يٴ‎→ 0626 ; 0649 0674 ; MA # ( ‎ئ‎ → ‎ىٴ‎ ) ARABIC LETTER YEH WITH HAMZA ABOVE → ARABIC LETTER ALEF MAKSURA, ARABIC LETTER HIGH HAMZA # →‎ٸ‎→→‎يٴ‎→ FE8B ; 0649 0674 ; MA # ( ‎ﺋ‎ → ‎ىٴ‎ ) ARABIC LETTER YEH WITH HAMZA ABOVE INITIAL FORM → ARABIC LETTER ALEF MAKSURA, ARABIC LETTER HIGH HAMZA # →‎ئ‎→→‎ٸ‎→→‎يٴ‎→ FE8C ; 0649 0674 ; MA # ( ‎ﺌ‎ → ‎ىٴ‎ ) ARABIC LETTER YEH WITH HAMZA ABOVE MEDIAL FORM → ARABIC LETTER ALEF MAKSURA, ARABIC LETTER HIGH HAMZA # →‎ئ‎→→‎ٸ‎→→‎يٴ‎→ FE8A ; 0649 0674 ; MA # ( ‎ﺊ‎ → ‎ىٴ‎ ) ARABIC LETTER YEH WITH HAMZA ABOVE FINAL FORM → ARABIC LETTER ALEF MAKSURA, ARABIC LETTER HIGH HAMZA # →‎ئ‎→→‎ٸ‎→→‎يٴ‎→ FE89 ; 0649 0674 ; MA # ( ‎ﺉ‎ → ‎ىٴ‎ ) ARABIC LETTER YEH WITH HAMZA ABOVE ISOLATED FORM → ARABIC LETTER ALEF MAKSURA, ARABIC LETTER HIGH HAMZA # →‎ٸ‎→→‎يٴ‎→ -0678 ; 0649 0674 ; MA # ( ‎ٸ‎ → ‎ىٴ‎ ) ARABIC LETTER HIGH HAMZA YEH → ARABIC LETTER ALEF MAKSURA, ARABIC LETTER HIGH HAMZA # →‎يٴ‎→ FBEB ; 0649 0674 006C ; MA # ( ‎ﯫ‎ → ‎ىٴl‎ ) ARABIC LIGATURE YEH WITH HAMZA ABOVE WITH ALEF FINAL FORM → ARABIC LETTER ALEF MAKSURA, ARABIC LETTER HIGH HAMZA, LATIN SMALL LETTER L # →‎ئا‎→ FBEA ; 0649 0674 006C ; MA # ( ‎ﯪ‎ → ‎ىٴl‎ ) ARABIC LIGATURE YEH WITH HAMZA ABOVE WITH ALEF ISOLATED FORM → ARABIC LETTER ALEF MAKSURA, ARABIC LETTER HIGH HAMZA, LATIN SMALL LETTER L # →‎ئا‎→ diff --git a/icu4c/source/data/unidata/emoji-sequences.txt b/icu4c/source/data/unidata/emoji-sequences.txt index e8aa0fc97fd..f137a9831f9 100644 --- a/icu4c/source/data/unidata/emoji-sequences.txt +++ b/icu4c/source/data/unidata/emoji-sequences.txt @@ -1,13 +1,13 @@ # emoji-sequences.txt -# Date: 2021-08-26, 17:22:22 GMT -# © 2021 Unicode®, Inc. +# Date: 2022-05-06, 16:14:52 GMT +# © 2022 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. -# For terms of use, see http://www.unicode.org/terms_of_use.html +# For terms of use, see https://www.unicode.org/terms_of_use.html # # Emoji Sequence Data for UTS #51 -# Version: 14.0 +# Version: 15.0 # -# For documentation and usage, see http://www.unicode.org/reports/tr51 +# For documentation and usage, see https://www.unicode.org/reports/tr51 # # Format: # code_point(s) ; type_field ; description # comments @@ -238,6 +238,7 @@ 1F6D1..1F6D2 ; Basic_Emoji ; stop sign # E3.0 [2] (🛑..🛒) 1F6D5 ; Basic_Emoji ; hindu temple # E12.0 [1] (🛕) 1F6D6..1F6D7 ; Basic_Emoji ; hut # E13.0 [2] (🛖..🛗) +1F6DC ; Basic_Emoji ; wireless # E15.0 [1] (🛜) 1F6DD..1F6DF ; Basic_Emoji ; playground slide # E14.0 [3] (🛝..🛟) 1F6EB..1F6EC ; Basic_Emoji ; airplane departure # E1.0 [2] (🛫..🛬) 1F6F4..1F6F6 ; Basic_Emoji ; kick scooter # E3.0 [3] (🛴..🛶) @@ -294,21 +295,30 @@ 1F9E7..1F9FF ; Basic_Emoji ; red envelope # E11.0 [25] (🧧..🧿) 1FA70..1FA73 ; Basic_Emoji ; ballet shoes # E12.0 [4] (🩰..🩳) 1FA74 ; Basic_Emoji ; thong sandal # E13.0 [1] (🩴) +1FA75..1FA77 ; Basic_Emoji ; light blue heart # E15.0 [3] (🩵..🩷) 1FA78..1FA7A ; Basic_Emoji ; drop of blood # E12.0 [3] (🩸..🩺) 1FA7B..1FA7C ; Basic_Emoji ; x-ray # E14.0 [2] (🩻..🩼) 1FA80..1FA82 ; Basic_Emoji ; yo-yo # E12.0 [3] (🪀..🪂) 1FA83..1FA86 ; Basic_Emoji ; boomerang # E13.0 [4] (🪃..🪆) +1FA87..1FA88 ; Basic_Emoji ; maracas # E15.0 [2] (🪇..🪈) 1FA90..1FA95 ; Basic_Emoji ; ringed planet # E12.0 [6] (🪐..🪕) 1FA96..1FAA8 ; Basic_Emoji ; military helmet # E13.0 [19] (🪖..🪨) 1FAA9..1FAAC ; Basic_Emoji ; mirror ball # E14.0 [4] (🪩..🪬) +1FAAD..1FAAF ; Basic_Emoji ; folding hand fan # E15.0 [3] (🪭..🪯) 1FAB0..1FAB6 ; Basic_Emoji ; fly # E13.0 [7] (🪰..🪶) 1FAB7..1FABA ; Basic_Emoji ; lotus # E14.0 [4] (🪷..🪺) +1FABB..1FABD ; Basic_Emoji ; hyacinth # E15.0 [3] (🪻..🪽) +1FABF ; Basic_Emoji ; goose # E15.0 [1] (🪿) 1FAC0..1FAC2 ; Basic_Emoji ; anatomical heart # E13.0 [3] (🫀..🫂) 1FAC3..1FAC5 ; Basic_Emoji ; pregnant man # E14.0 [3] (🫃..🫅) +1FACE..1FACF ; Basic_Emoji ; moose # E15.0 [2] (🫎..🫏) 1FAD0..1FAD6 ; Basic_Emoji ; blueberries # E13.0 [7] (🫐..🫖) 1FAD7..1FAD9 ; Basic_Emoji ; pouring liquid # E14.0 [3] (🫗..🫙) +1FADA..1FADB ; Basic_Emoji ; ginger root # E15.0 [2] (🫚..🫛) 1FAE0..1FAE7 ; Basic_Emoji ; melting face # E14.0 [8] (🫠..🫧) +1FAE8 ; Basic_Emoji ; shaking face # E15.0 [1] (🫨) 1FAF0..1FAF6 ; Basic_Emoji ; hand with index finger and thumb crossed # E14.0 [7] (🫰..🫶) +1FAF7..1FAF8 ; Basic_Emoji ; leftwards pushing hand # E15.0 [2] (🫷..🫸) 00A9 FE0F ; Basic_Emoji ; copyright # E0.6 [1] (©️) 00AE FE0F ; Basic_Emoji ; registered # E0.6 [1] (®️) 203C FE0F ; Basic_Emoji ; double exclamation mark # E0.6 [1] (‼️) @@ -517,7 +527,7 @@ 1F6F0 FE0F ; Basic_Emoji ; satellite # E0.7 [1] (🛰️) 1F6F3 FE0F ; Basic_Emoji ; passenger ship # E0.7 [1] (🛳️) -# Total elements: 1366 +# Total elements: 1386 # ================================================ @@ -1463,7 +1473,17 @@ 1FAF6 1F3FD ; RGI_Emoji_Modifier_Sequence ; heart hands: medium skin tone # E14.0 [1] (🫶🏽) 1FAF6 1F3FE ; RGI_Emoji_Modifier_Sequence ; heart hands: medium-dark skin tone # E14.0 [1] (🫶🏾) 1FAF6 1F3FF ; RGI_Emoji_Modifier_Sequence ; heart hands: dark skin tone # E14.0 [1] (🫶🏿) +1FAF7 1F3FB ; RGI_Emoji_Modifier_Sequence ; leftwards pushing hand: light skin tone # E15.0 [1] (🫷🏻) +1FAF7 1F3FC ; RGI_Emoji_Modifier_Sequence ; leftwards pushing hand: medium-light skin tone # E15.0 [1] (🫷🏼) +1FAF7 1F3FD ; RGI_Emoji_Modifier_Sequence ; leftwards pushing hand: medium skin tone # E15.0 [1] (🫷🏽) +1FAF7 1F3FE ; RGI_Emoji_Modifier_Sequence ; leftwards pushing hand: medium-dark skin tone # E15.0 [1] (🫷🏾) +1FAF7 1F3FF ; RGI_Emoji_Modifier_Sequence ; leftwards pushing hand: dark skin tone # E15.0 [1] (🫷🏿) +1FAF8 1F3FB ; RGI_Emoji_Modifier_Sequence ; rightwards pushing hand: light skin tone # E15.0 [1] (🫸🏻) +1FAF8 1F3FC ; RGI_Emoji_Modifier_Sequence ; rightwards pushing hand: medium-light skin tone # E15.0 [1] (🫸🏼) +1FAF8 1F3FD ; RGI_Emoji_Modifier_Sequence ; rightwards pushing hand: medium skin tone # E15.0 [1] (🫸🏽) +1FAF8 1F3FE ; RGI_Emoji_Modifier_Sequence ; rightwards pushing hand: medium-dark skin tone # E15.0 [1] (🫸🏾) +1FAF8 1F3FF ; RGI_Emoji_Modifier_Sequence ; rightwards pushing hand: dark skin tone # E15.0 [1] (🫸🏿) -# Total elements: 645 +# Total elements: 655 #EOF diff --git a/icu4c/source/data/unidata/emoji-zwj-sequences.txt b/icu4c/source/data/unidata/emoji-zwj-sequences.txt index 1d64edcdc70..c71fe183ad4 100644 --- a/icu4c/source/data/unidata/emoji-zwj-sequences.txt +++ b/icu4c/source/data/unidata/emoji-zwj-sequences.txt @@ -1,13 +1,13 @@ # emoji-zwj-sequences.txt -# Date: 2021-06-08, 05:19:16 GMT -# © 2021 Unicode®, Inc. +# Date: 2022-05-06, 16:14:52 GMT +# © 2022 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. -# For terms of use, see http://www.unicode.org/terms_of_use.html +# For terms of use, see https://www.unicode.org/terms_of_use.html # # Emoji ZWJ Sequences for UTS #51 -# Version: 14.0 +# Version: 15.0 # -# For documentation and usage, see http://www.unicode.org/reports/tr51 +# For documentation and usage, see https://www.unicode.org/reports/tr51 # # Format: # code_point(s) ; type_field ; description # comments @@ -1398,6 +1398,7 @@ 1F3F4 200D 2620 FE0F ; RGI_Emoji_ZWJ_Sequence ; pirate flag # E11.0 [1] (🏴‍☠️) 1F408 200D 2B1B ; RGI_Emoji_ZWJ_Sequence ; black cat # E13.0 [1] (🐈‍⬛) 1F415 200D 1F9BA ; RGI_Emoji_ZWJ_Sequence ; service dog # E12.0 [1] (🐕‍🦺) +1F426 200D 2B1B ; RGI_Emoji_ZWJ_Sequence ; black bird # E15.0 [1] (🐦‍⬛) 1F43B 200D 2744 FE0F ; RGI_Emoji_ZWJ_Sequence ; polar bear # E13.0 [1] (🐻‍❄️) 1F441 FE0F 200D 1F5E8 FE0F ; RGI_Emoji_ZWJ_Sequence ; eye in speech bubble # E2.0 [1] (👁️‍🗨️) 1F62E 200D 1F4A8 ; RGI_Emoji_ZWJ_Sequence ; face exhaling # E13.1 [1] (😮‍💨) @@ -1405,6 +1406,6 @@ 1F636 200D 1F32B FE0F ; RGI_Emoji_ZWJ_Sequence ; face in clouds # E13.1 [1] (😶‍🌫️) 1F9D1 200D 1F384 ; RGI_Emoji_ZWJ_Sequence ; mx claus # E13.0 [1] (🧑‍🎄) -# Total elements: 13 +# Total elements: 14 #EOF diff --git a/icu4c/source/data/unidata/norm2/nfc.txt b/icu4c/source/data/unidata/norm2/nfc.txt index c9168ad4c50..dcf35f8fece 100644 --- a/icu4c/source/data/unidata/norm2/nfc.txt +++ b/icu4c/source/data/unidata/norm2/nfc.txt @@ -9,7 +9,7 @@ # # Complete data for Unicode NFC normalization. -* Unicode 14.0.0 +* Unicode 15.0.0 # Canonical_Combining_Class (ccc) values 0300..0314:230 @@ -320,6 +320,7 @@ FE2E..FE2F:230 10AE6:220 10D24..10D27:230 10EAB..10EAC:230 +10EFD..10EFF:220 10F46..10F47:220 10F48..10F4A:230 10F4B:220 @@ -370,6 +371,7 @@ FE2E..FE2F:230 11D42:7 11D44..11D45:9 11D97:9 +11F41..11F42:9 16AF0..16AF4:1 16B30..16B36:230 16FF0..16FF1:6 @@ -388,9 +390,13 @@ FE2E..FE2F:230 1E01B..1E021:230 1E023..1E024:230 1E026..1E02A:230 +1E08F:230 1E130..1E136:230 1E2AE:230 1E2EC..1E2EF:230 +1E4EC..1E4ED:232 +1E4EE:220 +1E4EF:230 1E8D0..1E8D6:220 1E944..1E949:230 1E94A:7 diff --git a/icu4c/source/data/unidata/norm2/nfkc.txt b/icu4c/source/data/unidata/norm2/nfkc.txt index 566468419a2..7d2f642e3a6 100644 --- a/icu4c/source/data/unidata/norm2/nfkc.txt +++ b/icu4c/source/data/unidata/norm2/nfkc.txt @@ -13,7 +13,7 @@ # to NFKC one-way mappings. # Use this file as the second gennorm2 input file after nfc.txt. -* Unicode 14.0.0 +* Unicode 15.0.0 00A0>0020 00A8>0020 0308 @@ -3474,6 +3474,68 @@ FFEE>25CB 1D7FD>0037 1D7FE>0038 1D7FF>0039 +1E030>0430 +1E031>0431 +1E032>0432 +1E033>0433 +1E034>0434 +1E035>0435 +1E036>0436 +1E037>0437 +1E038>0438 +1E039>043A +1E03A>043B +1E03B>043C +1E03C>043E +1E03D>043F +1E03E>0440 +1E03F>0441 +1E040>0442 +1E041>0443 +1E042>0444 +1E043>0445 +1E044>0446 +1E045>0447 +1E046>0448 +1E047>044B +1E048>044D +1E049>044E +1E04A>A689 +1E04B>04D9 +1E04C>0456 +1E04D>0458 +1E04E>04E9 +1E04F>04AF +1E050>04CF +1E051>0430 +1E052>0431 +1E053>0432 +1E054>0433 +1E055>0434 +1E056>0435 +1E057>0436 +1E058>0437 +1E059>0438 +1E05A>043A +1E05B>043B +1E05C>043E +1E05D>043F +1E05E>0441 +1E05F>0443 +1E060>0444 +1E061>0445 +1E062>0446 +1E063>0447 +1E064>0448 +1E065>044A +1E066>044B +1E067>0491 +1E068>0456 +1E069>0455 +1E06A>045F +1E06B>04AB +1E06C>A651 +1E06D>04B1 1EE00>0627 1EE01>0628 1EE02>062C diff --git a/icu4c/source/data/unidata/norm2/nfkc_cf.txt b/icu4c/source/data/unidata/norm2/nfkc_cf.txt index fe677510e60..8c5deec0035 100644 --- a/icu4c/source/data/unidata/norm2/nfkc_cf.txt +++ b/icu4c/source/data/unidata/norm2/nfkc_cf.txt @@ -12,7 +12,7 @@ # and reformatted into syntax for the gennorm2 Normalizer2 data generator tool. # Use this file as the third gennorm2 input file after nfc.txt and nfkc.txt. -* Unicode 14.0.0 +* Unicode 15.0.0 0041>0061 0042>0062 @@ -5179,6 +5179,68 @@ FFF0..FFF8> 1D7FD>0037 1D7FE>0038 1D7FF>0039 +1E030>0430 +1E031>0431 +1E032>0432 +1E033>0433 +1E034>0434 +1E035>0435 +1E036>0436 +1E037>0437 +1E038>0438 +1E039>043A +1E03A>043B +1E03B>043C +1E03C>043E +1E03D>043F +1E03E>0440 +1E03F>0441 +1E040>0442 +1E041>0443 +1E042>0444 +1E043>0445 +1E044>0446 +1E045>0447 +1E046>0448 +1E047>044B +1E048>044D +1E049>044E +1E04A>A689 +1E04B>04D9 +1E04C>0456 +1E04D>0458 +1E04E>04E9 +1E04F>04AF +1E050>04CF +1E051>0430 +1E052>0431 +1E053>0432 +1E054>0433 +1E055>0434 +1E056>0435 +1E057>0436 +1E058>0437 +1E059>0438 +1E05A>043A +1E05B>043B +1E05C>043E +1E05D>043F +1E05E>0441 +1E05F>0443 +1E060>0444 +1E061>0445 +1E062>0446 +1E063>0447 +1E064>0448 +1E065>044A +1E066>044B +1E067>0491 +1E068>0456 +1E069>0455 +1E06A>045F +1E06B>04AB +1E06C>A651 +1E06D>04B1 1E900>1E922 1E901>1E923 1E902>1E924 diff --git a/icu4c/source/data/unidata/norm2/uts46.txt b/icu4c/source/data/unidata/norm2/uts46.txt index a96f08b55a0..20bb7088601 100644 --- a/icu4c/source/data/unidata/norm2/uts46.txt +++ b/icu4c/source/data/unidata/norm2/uts46.txt @@ -1,14 +1,14 @@ # Original file: # IdnaMappingTable.txt -# Date: 2021-07-10, 00:49:51 GMT -# © 2021 Unicode®, Inc. +# Date: 2022-05-02, 19:29:26 GMT +# © 2022 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. -# For terms of use, see http://www.unicode.org/terms_of_use.html +# For terms of use, see https://www.unicode.org/terms_of_use.html # # Unicode IDNA Compatible Preprocessing for UTS #46 -# Version: 14.0.0 +# Version: 15.0.0 # -# For documentation and usage, see http://www.unicode.org/reports/tr46 +# For documentation and usage, see https://www.unicode.org/reports/tr46 # ================================================ # This file has been reformatted into syntax for the @@ -1295,7 +1295,8 @@ # 0CE6..0CEF valid # 1.1 KANNADA DIGIT ZERO..KANNADA DIGIT NINE 0CF0 >FFFD # NA # 0CF1..0CF2 valid # 5.0 KANNADA SIGN JIHVAMULIYA..KANNADA SIGN UPADHMANIYA -0CF3..0CFF >FFFD # NA .. +# 0CF3 valid # 15.0 KANNADA SIGN COMBINING ANUSVARA ABOVE RIGHT +0CF4..0CFF >FFFD # NA .. # 0D00 valid # 10.0 MALAYALAM SIGN COMBINING ANUSVARA ABOVE # 0D01 valid # 7.0 MALAYALAM SIGN CANDRABINDU # 0D02..0D03 valid # 1.1 MALAYALAM SIGN ANUSVARA..MALAYALAM SIGN VISARGA @@ -1403,7 +1404,8 @@ # 0EC6 valid # 1.1 LAO KO LA 0EC7 >FFFD # NA # 0EC8..0ECD valid # 1.1 LAO TONE MAI EK..LAO NIGGAHITA -0ECE..0ECF >FFFD # NA .. +# 0ECE valid # 15.0 LAO YAMAKKAN +0ECF >FFFD # NA # 0ED0..0ED9 valid # 1.1 LAO DIGIT ZERO..LAO DIGIT NINE 0EDA..0EDB >FFFD # NA .. 0EDC >0EAB 0E99 # 1.1 LAO HO NO @@ -6223,7 +6225,8 @@ FFFE..FFFF >FFFD # 1.1 ..FFFD # NA .. # 10EB0..10EB1valid # 13.0 YEZIDI LETTER LAM WITH DOT ABOVE..YEZIDI LETTER YOT WITH CIRCUMFLEX ABOVE -10EB2..10EFF >FFFD # NA .. +10EB2..10EFC >FFFD # NA .. +# 10EFD..10EFFvalid # 15.0 ARABIC SMALL LOW WORD SAKTA..ARABIC SMALL LOW WORD MADDA # 10F00..10F1Cvalid # 11.0 OLD SOGDIAN LETTER ALEPH..OLD SOGDIAN LETTER FINAL TAW WITH VERTICAL TAIL # 10F1D..10F26valid # 11.0 OLD SOGDIAN NUMBER ONE..OLD SOGDIAN FRACTION ONE HALF # 10F27 valid # 11.0 OLD SOGDIAN LIGATURE AYIN-DALETH @@ -6288,7 +6291,8 @@ FFFE..FFFF >FFFD # 1.1 ..FFFD # NA .. +# 1123F..11241valid # 15.0 KHOJKI LETTER QA..KHOJKI VOWEL SIGN VOCALIC R +11242..1127F >FFFD # NA .. # 11280..11286valid # 8.0 MULTANI LETTER A..MULTANI LETTER GA 11287 >FFFD # NA # 11288 valid # 8.0 MULTANI LETTER GHA @@ -6460,7 +6464,9 @@ FFFE..FFFF >FFFD # 1.1 ..FFFD # NA .. # 11AB0..11ABFvalid # 14.0 CANADIAN SYLLABICS NATTILIK HI..CANADIAN SYLLABICS SPA # 11AC0..11AF8valid # 7.0 PAU CIN HAU LETTER PA..PAU CIN HAU GLOTTAL STOP FINAL -11AF9..11BFF >FFFD # NA .. +11AF9..11AFF >FFFD # NA .. +# 11B00..11B09valid # 15.0 DEVANAGARI HEAD MARK..DEVANAGARI SIGN MINDU +11B0A..11BFF >FFFD # NA .. # 11C00..11C08valid # 9.0 BHAIKSUKI LETTER A..BHAIKSUKI LETTER VOCALIC L 11C09 >FFFD # NA # 11C0A..11C36valid # 9.0 BHAIKSUKI LETTER E..BHAIKSUKI VOWEL SIGN VOCALIC L @@ -6506,7 +6512,15 @@ FFFE..FFFF >FFFD # 1.1 ..FFFD # NA .. # 11EE0..11EF6valid # 11.0 MAKASAR LETTER KA..MAKASAR VOWEL SIGN O # 11EF7..11EF8valid # 11.0 MAKASAR PASSIMBANG..MAKASAR END OF SECTION -11EF9..11FAF >FFFD # NA .. +11EF9..11EFF >FFFD # NA .. +# 11F00..11F10valid # 15.0 KAWI SIGN CANDRABINDU..KAWI LETTER O +11F11 >FFFD # NA +# 11F12..11F3Avalid # 15.0 KAWI LETTER KA..KAWI VOWEL SIGN VOCALIC R +11F3B..11F3D >FFFD # NA .. +# 11F3E..11F42valid # 15.0 KAWI VOWEL SIGN E..KAWI CONJOINER +# 11F43..11F4Fvalid # 15.0 KAWI DANDA..KAWI PUNCTUATION CLOSING SPIRAL +# 11F50..11F59valid # 15.0 KAWI DIGIT ZERO..KAWI DIGIT NINE +11F5A..11FAF >FFFD # NA .. # 11FB0 valid # 13.0 LISU LETTER YHA 11FB1..11FBF >FFFD # NA .. # 11FC0..11FF1valid # 12.0 TAMIL FRACTION ONE THREE-HUNDRED-AND-TWENTIETH..TAMIL SIGN VAKAIYARAA @@ -6528,9 +6542,11 @@ FFFE..FFFF >FFFD # 1.1 ..FFFD # NA .. # 13000..1342Evalid # 5.2 EGYPTIAN HIEROGLYPH A001..EGYPTIAN HIEROGLYPH AA032 -1342F >FFFD # NA +# 1342F valid # 15.0 EGYPTIAN HIEROGLYPH V011D 13430..13438 >FFFD # 12.0 EGYPTIAN HIEROGLYPH VERTICAL JOINER..EGYPTIAN HIEROGLYPH END SEGMENT -13439..143FF >FFFD # NA .. +13439..1343F >FFFD # 15.0 EGYPTIAN HIEROGLYPH INSERT AT MIDDLE..EGYPTIAN HIEROGLYPH END WALLED ENCLOSURE +# 13440..13455valid # 15.0 EGYPTIAN HIEROGLYPH MIRROR HORIZONTALLY..EGYPTIAN HIEROGLYPH MODIFIER DAMAGED +13456..143FF >FFFD # NA .. # 14400..14646valid # 8.0 ANATOLIAN HIEROGLYPH A001..ANATOLIAN HIEROGLYPH A530 14647..167FF >FFFD # NA .. # 16800..16A38valid # 6.0 BAMUM LETTER PHASE-A NGKUE MFON..BAMUM LETTER PHASE-F VUEQ @@ -6632,9 +6648,13 @@ FFFE..FFFF >FFFD # 1.1 ..FFFD # NA .. +1B123..1B131 >FFFD # NA .. +# 1B132 valid # 15.0 HIRAGANA LETTER SMALL KO +1B133..1B14F >FFFD # NA .. # 1B150..1B152valid # 12.0 HIRAGANA LETTER SMALL WI..HIRAGANA LETTER SMALL WO -1B153..1B163 >FFFD # NA .. +1B153..1B154 >FFFD # NA .. +# 1B155 valid # 15.0 KATAKANA LETTER SMALL KO +1B156..1B163 >FFFD # NA .. # 1B164..1B167valid # 12.0 KATAKANA LETTER SMALL WI..KATAKANA LETTER SMALL N 1B168..1B16F >FFFD # NA .. # 1B170..1B2FBvalid # 10.0 NUSHU CHARACTER-1B170..NUSHU CHARACTER-1B2FB @@ -6685,7 +6705,9 @@ FFFE..FFFF >FFFD # 1.1 ..FFFD # NA .. # 1D200..1D245valid # 4.1 GREEK VOCAL NOTATION SYMBOL-1..GREEK MUSICAL LEIMMA -1D246..1D2DF >FFFD # NA .. +1D246..1D2BF >FFFD # NA .. +# 1D2C0..1D2D3valid # 15.0 KAKTOVIK NUMERAL ZERO..KAKTOVIK NUMERAL NINETEEN +1D2D4..1D2DF >FFFD # NA .. # 1D2E0..1D2F3valid # 11.0 MAYAN NUMERAL ZERO..MAYAN NUMERAL NINETEEN 1D2F4..1D2FF >FFFD # NA .. # 1D300..1D356valid # 4.0 MONOGRAM FOR EARTH..TETRAGRAM FOR FOSTERING @@ -7718,7 +7740,9 @@ FFFE..FFFF >FFFD # 1.1 ..FFFD # NA .. # 1DF00..1DF1Evalid # 14.0 LATIN SMALL LETTER FENG DIGRAPH WITH TRILL..LATIN SMALL LETTER S WITH CURL -1DF1F..1DFFF >FFFD # NA .. +1DF1F..1DF24 >FFFD # NA .. +# 1DF25..1DF2Avalid # 15.0 LATIN SMALL LETTER D WITH MID-HEIGHT LEFT HOOK..LATIN SMALL LETTER T WITH MID-HEIGHT LEFT HOOK +1DF2B..1DFFF >FFFD # NA .. # 1E000..1E006valid # 9.0 COMBINING GLAGOLITIC LETTER AZU..COMBINING GLAGOLITIC LETTER ZHIVETE 1E007 >FFFD # NA # 1E008..1E018valid # 9.0 COMBINING GLAGOLITIC LETTER ZEMLJA..COMBINING GLAGOLITIC LETTER HERU @@ -7728,7 +7752,72 @@ FFFE..FFFF >FFFD # 1.1 ..FFFD # NA # 1E026..1E02Avalid # 9.0 COMBINING GLAGOLITIC LETTER YO..COMBINING GLAGOLITIC LETTER FITA -1E02B..1E0FF >FFFD # NA .. +1E02B..1E02F >FFFD # NA .. +1E030 >0430 # 15.0 MODIFIER LETTER CYRILLIC SMALL A +1E031 >0431 # 15.0 MODIFIER LETTER CYRILLIC SMALL BE +1E032 >0432 # 15.0 MODIFIER LETTER CYRILLIC SMALL VE +1E033 >0433 # 15.0 MODIFIER LETTER CYRILLIC SMALL GHE +1E034 >0434 # 15.0 MODIFIER LETTER CYRILLIC SMALL DE +1E035 >0435 # 15.0 MODIFIER LETTER CYRILLIC SMALL IE +1E036 >0436 # 15.0 MODIFIER LETTER CYRILLIC SMALL ZHE +1E037 >0437 # 15.0 MODIFIER LETTER CYRILLIC SMALL ZE +1E038 >0438 # 15.0 MODIFIER LETTER CYRILLIC SMALL I +1E039 >043A # 15.0 MODIFIER LETTER CYRILLIC SMALL KA +1E03A >043B # 15.0 MODIFIER LETTER CYRILLIC SMALL EL +1E03B >043C # 15.0 MODIFIER LETTER CYRILLIC SMALL EM +1E03C >043E # 15.0 MODIFIER LETTER CYRILLIC SMALL O +1E03D >043F # 15.0 MODIFIER LETTER CYRILLIC SMALL PE +1E03E >0440 # 15.0 MODIFIER LETTER CYRILLIC SMALL ER +1E03F >0441 # 15.0 MODIFIER LETTER CYRILLIC SMALL ES +1E040 >0442 # 15.0 MODIFIER LETTER CYRILLIC SMALL TE +1E041 >0443 # 15.0 MODIFIER LETTER CYRILLIC SMALL U +1E042 >0444 # 15.0 MODIFIER LETTER CYRILLIC SMALL EF +1E043 >0445 # 15.0 MODIFIER LETTER CYRILLIC SMALL HA +1E044 >0446 # 15.0 MODIFIER LETTER CYRILLIC SMALL TSE +1E045 >0447 # 15.0 MODIFIER LETTER CYRILLIC SMALL CHE +1E046 >0448 # 15.0 MODIFIER LETTER CYRILLIC SMALL SHA +1E047 >044B # 15.0 MODIFIER LETTER CYRILLIC SMALL YERU +1E048 >044D # 15.0 MODIFIER LETTER CYRILLIC SMALL E +1E049 >044E # 15.0 MODIFIER LETTER CYRILLIC SMALL YU +1E04A >A689 # 15.0 MODIFIER LETTER CYRILLIC SMALL DZZE +1E04B >04D9 # 15.0 MODIFIER LETTER CYRILLIC SMALL SCHWA +1E04C >0456 # 15.0 MODIFIER LETTER CYRILLIC SMALL BYELORUSSIAN-UKRAINIAN I +1E04D >0458 # 15.0 MODIFIER LETTER CYRILLIC SMALL JE +1E04E >04E9 # 15.0 MODIFIER LETTER CYRILLIC SMALL BARRED O +1E04F >04AF # 15.0 MODIFIER LETTER CYRILLIC SMALL STRAIGHT U +1E050 >04CF # 15.0 MODIFIER LETTER CYRILLIC SMALL PALOCHKA +1E051 >0430 # 15.0 CYRILLIC SUBSCRIPT SMALL LETTER A +1E052 >0431 # 15.0 CYRILLIC SUBSCRIPT SMALL LETTER BE +1E053 >0432 # 15.0 CYRILLIC SUBSCRIPT SMALL LETTER VE +1E054 >0433 # 15.0 CYRILLIC SUBSCRIPT SMALL LETTER GHE +1E055 >0434 # 15.0 CYRILLIC SUBSCRIPT SMALL LETTER DE +1E056 >0435 # 15.0 CYRILLIC SUBSCRIPT SMALL LETTER IE +1E057 >0436 # 15.0 CYRILLIC SUBSCRIPT SMALL LETTER ZHE +1E058 >0437 # 15.0 CYRILLIC SUBSCRIPT SMALL LETTER ZE +1E059 >0438 # 15.0 CYRILLIC SUBSCRIPT SMALL LETTER I +1E05A >043A # 15.0 CYRILLIC SUBSCRIPT SMALL LETTER KA +1E05B >043B # 15.0 CYRILLIC SUBSCRIPT SMALL LETTER EL +1E05C >043E # 15.0 CYRILLIC SUBSCRIPT SMALL LETTER O +1E05D >043F # 15.0 CYRILLIC SUBSCRIPT SMALL LETTER PE +1E05E >0441 # 15.0 CYRILLIC SUBSCRIPT SMALL LETTER ES +1E05F >0443 # 15.0 CYRILLIC SUBSCRIPT SMALL LETTER U +1E060 >0444 # 15.0 CYRILLIC SUBSCRIPT SMALL LETTER EF +1E061 >0445 # 15.0 CYRILLIC SUBSCRIPT SMALL LETTER HA +1E062 >0446 # 15.0 CYRILLIC SUBSCRIPT SMALL LETTER TSE +1E063 >0447 # 15.0 CYRILLIC SUBSCRIPT SMALL LETTER CHE +1E064 >0448 # 15.0 CYRILLIC SUBSCRIPT SMALL LETTER SHA +1E065 >044A # 15.0 CYRILLIC SUBSCRIPT SMALL LETTER HARD SIGN +1E066 >044B # 15.0 CYRILLIC SUBSCRIPT SMALL LETTER YERU +1E067 >0491 # 15.0 CYRILLIC SUBSCRIPT SMALL LETTER GHE WITH UPTURN +1E068 >0456 # 15.0 CYRILLIC SUBSCRIPT SMALL LETTER BYELORUSSIAN-UKRAINIAN I +1E069 >0455 # 15.0 CYRILLIC SUBSCRIPT SMALL LETTER DZE +1E06A >045F # 15.0 CYRILLIC SUBSCRIPT SMALL LETTER DZHE +1E06B >04AB # 15.0 MODIFIER LETTER CYRILLIC SMALL ES WITH DESCENDER +1E06C >A651 # 15.0 MODIFIER LETTER CYRILLIC SMALL YERU WITH BACK YER +1E06D >04B1 # 15.0 MODIFIER LETTER CYRILLIC SMALL STRAIGHT U WITH STROKE +1E06E..1E08E >FFFD # NA .. +# 1E08F valid # 15.0 COMBINING CYRILLIC SMALL LETTER BYELORUSSIAN-UKRAINIAN I +1E090..1E0FF >FFFD # NA .. # 1E100..1E12Cvalid # 12.0 NYIAKENG PUACHUE HMONG LETTER MA..NYIAKENG PUACHUE HMONG LETTER W 1E12D..1E12F >FFFD # NA .. # 1E130..1E13Dvalid # 12.0 NYIAKENG PUACHUE HMONG TONE-B..NYIAKENG PUACHUE HMONG SYLLABLE LENGTHENER @@ -7743,7 +7832,9 @@ FFFE..FFFF >FFFD # 1.1 ..FFFD # NA .. # 1E2FF valid # 12.0 WANCHO NGUN SIGN -1E300..1E7DF >FFFD # NA .. +1E300..1E4CF >FFFD # NA .. +# 1E4D0..1E4F9valid # 15.0 NAG MUNDARI LETTER O..NAG MUNDARI DIGIT NINE +1E4FA..1E7DF >FFFD # NA .. # 1E7E0..1E7E6valid # 14.0 ETHIOPIC SYLLABLE HHYA..ETHIOPIC SYLLABLE HHYO 1E7E7 >FFFD # NA # 1E7E8..1E7EBvalid # 14.0 ETHIOPIC SYLLABLE GURAGE HHWA..ETHIOPIC SYLLABLE HHWE @@ -8230,7 +8321,8 @@ FFFE..FFFF >FFFD # 1.1 ..FFFD # NA .. +1F6D8..1F6DB >FFFD # NA .. +# 1F6DC valid # 15.0 WIRELESS # 1F6DD..1F6DFvalid # 14.0 PLAYGROUND SLIDE..RING BUOY # 1F6E0..1F6ECvalid # 7.0 HAMMER AND WRENCH..AIRPLANE ARRIVING 1F6ED..1F6EF >FFFD # NA .. @@ -8242,10 +8334,13 @@ FFFE..FFFF >FFFD # 1.1 ..FFFD # NA .. # 1F700..1F773valid # 6.0 ALCHEMICAL SYMBOL FOR QUINTESSENCE..ALCHEMICAL SYMBOL FOR HALF OUNCE -1F774..1F77F >FFFD # NA .. +# 1F774..1F776valid # 15.0 LOT OF FORTUNE..LUNAR ECLIPSE +1F777..1F77A >FFFD # NA .. +# 1F77B..1F77Fvalid # 15.0 HAUMEA..ORCUS # 1F780..1F7D4valid # 7.0 BLACK LEFT-POINTING ISOSCELES RIGHT TRIANGLE..HEAVY TWELVE POINTED PINWHEEL STAR # 1F7D5..1F7D8valid # 11.0 CIRCLED TRIANGLE..NEGATIVE CIRCLED SQUARE -1F7D9..1F7DF >FFFD # NA .. +# 1F7D9 valid # 15.0 NINE POINTED WHITE STAR +1F7DA..1F7DF >FFFD # NA .. # 1F7E0..1F7EBvalid # 12.0 LARGE ORANGE CIRCLE..LARGE BROWN SQUARE 1F7EC..1F7EF >FFFD # NA .. # 1F7F0 valid # 14.0 HEAVY EQUALS SIGN @@ -8312,30 +8407,37 @@ FFFE..FFFF >FFFD # 1.1 ..FFFD # NA .. # 1FA70..1FA73valid # 12.0 BALLET SHOES..SHORTS # 1FA74 valid # 13.0 THONG SANDAL -1FA75..1FA77 >FFFD # NA .. +# 1FA75..1FA77valid # 15.0 LIGHT BLUE HEART..PINK HEART # 1FA78..1FA7Avalid # 12.0 DROP OF BLOOD..STETHOSCOPE # 1FA7B..1FA7Cvalid # 14.0 X-RAY..CRUTCH 1FA7D..1FA7F >FFFD # NA .. # 1FA80..1FA82valid # 12.0 YO-YO..PARACHUTE # 1FA83..1FA86valid # 13.0 BOOMERANG..NESTING DOLLS -1FA87..1FA8F >FFFD # NA .. +# 1FA87..1FA88valid # 15.0 MARACAS..FLUTE +1FA89..1FA8F >FFFD # NA .. # 1FA90..1FA95valid # 12.0 RINGED PLANET..BANJO # 1FA96..1FAA8valid # 13.0 MILITARY HELMET..ROCK # 1FAA9..1FAACvalid # 14.0 MIRROR BALL..HAMSA -1FAAD..1FAAF >FFFD # NA .. +# 1FAAD..1FAAFvalid # 15.0 FOLDING HAND FAN..KHANDA # 1FAB0..1FAB6valid # 13.0 FLY..FEATHER # 1FAB7..1FABAvalid # 14.0 LOTUS..NEST WITH EGGS -1FABB..1FABF >FFFD # NA .. +# 1FABB..1FABDvalid # 15.0 HYACINTH..WING +1FABE >FFFD # NA +# 1FABF valid # 15.0 GOOSE # 1FAC0..1FAC2valid # 13.0 ANATOMICAL HEART..PEOPLE HUGGING # 1FAC3..1FAC5valid # 14.0 PREGNANT MAN..PERSON WITH CROWN -1FAC6..1FACF >FFFD # NA .. +1FAC6..1FACD >FFFD # NA .. +# 1FACE..1FACFvalid # 15.0 MOOSE..DONKEY # 1FAD0..1FAD6valid # 13.0 BLUEBERRIES..TEAPOT # 1FAD7..1FAD9valid # 14.0 POURING LIQUID..JAR -1FADA..1FADF >FFFD # NA .. +# 1FADA..1FADBvalid # 15.0 GINGER ROOT..PEA POD +1FADC..1FADF >FFFD # NA .. # 1FAE0..1FAE7valid # 14.0 MELTING FACE..BUBBLES -1FAE8..1FAEF >FFFD # NA .. +# 1FAE8 valid # 15.0 SHAKING FACE +1FAE9..1FAEF >FFFD # NA .. # 1FAF0..1FAF6valid # 14.0 HAND WITH INDEX FINGER AND THUMB CROSSED..HEART HANDS -1FAF7..1FAFF >FFFD # NA .. +# 1FAF7..1FAF8valid # 15.0 LEFTWARDS PUSHING HAND..RIGHTWARDS PUSHING HAND +1FAF9..1FAFF >FFFD # NA .. # 1FB00..1FB92valid # 13.0 BLOCK SEXTANT-1..UPPER HALF INVERSE MEDIUM SHADE AND LOWER HALF BLOCK 1FB93 >FFFD # NA # 1FB94..1FBCAvalid # 13.0 LEFT HALF INVERSE MEDIUM SHADE AND RIGHT HALF BLOCK..WHITE UP-POINTING CHEVRON @@ -8358,7 +8460,8 @@ FFFE..FFFF >FFFD # 1.1 ..FFFD # NA .. # 2A700..2B734valid # 5.2 CJK UNIFIED IDEOGRAPH-2A700..CJK UNIFIED IDEOGRAPH-2B734 # 2B735..2B738valid # 14.0 CJK UNIFIED IDEOGRAPH-2B735..CJK UNIFIED IDEOGRAPH-2B738 -2B739..2B73F >FFFD # NA .. +# 2B739 valid # 15.0 CJK UNIFIED IDEOGRAPH-2B739 +2B73A..2B73F >FFFD # NA .. # 2B740..2B81Dvalid # 6.0 CJK UNIFIED IDEOGRAPH-2B740..CJK UNIFIED IDEOGRAPH-2B81D 2B81E..2B81F >FFFD # NA .. # 2B820..2CEA1valid # 8.0 CJK UNIFIED IDEOGRAPH-2B820..CJK UNIFIED IDEOGRAPH-2CEA1 @@ -8900,7 +9003,9 @@ FFFE..FFFF >FFFD # 1.1 ..FFFD # NA .. 2FFFE..2FFFF >FFFD # 2.0 .. # 30000..3134Avalid # 13.0 CJK UNIFIED IDEOGRAPH-30000..CJK UNIFIED IDEOGRAPH-3134A -3134B..3FFFD >FFFD # NA .. +3134B..3134F >FFFD # NA .. +# 31350..323AFvalid # 15.0 CJK UNIFIED IDEOGRAPH-31350..CJK UNIFIED IDEOGRAPH-323AF +323B0..3FFFD >FFFD # NA .. 3FFFE..3FFFF >FFFD # 2.0 .. 40000..4FFFD >FFFD # NA .. 4FFFE..4FFFF >FFFD # 2.0 .. diff --git a/icu4c/source/data/unidata/ppucd.txt b/icu4c/source/data/unidata/ppucd.txt index f0a0fd79f7f..3865e80f182 100644 --- a/icu4c/source/data/unidata/ppucd.txt +++ b/icu4c/source/data/unidata/ppucd.txt @@ -1,7 +1,7 @@ # Preparsed UCD generated by ICU preparseucd.py # Copyright (C) 1991 and later: Unicode, Inc. and others. # License & terms of use: http://www.unicode.org/copyright.html -ucd;14.0.0 +ucd;15.0.0 property;Catalog;age;Age property;Binary;AHex;ASCII_Hex_Digit @@ -134,6 +134,7 @@ value;age;12.0;V12_0 value;age;12.1;V12_1 value;age;13.0;V13_0 value;age;14.0;V14_0 +value;age;15.0;V15_0 value;age;2.0;V2_0 value;age;2.1;V2_1 value;age;3.0;V3_0 @@ -188,6 +189,7 @@ value;blk;Ancient_Symbols;Ancient_Symbols value;blk;Arabic;Arabic value;blk;Arabic_Ext_A;Arabic_Extended_A value;blk;Arabic_Ext_B;Arabic_Extended_B +value;blk;Arabic_Ext_C;Arabic_Extended_C value;blk;Arabic_Math;Arabic_Mathematical_Alphabetic_Symbols value;blk;Arabic_PF_A;Arabic_Presentation_Forms_A;Arabic_Presentation_Forms-A value;blk;Arabic_PF_B;Arabic_Presentation_Forms_B @@ -223,6 +225,7 @@ value;blk;CJK_Ext_D;CJK_Unified_Ideographs_Extension_D value;blk;CJK_Ext_E;CJK_Unified_Ideographs_Extension_E value;blk;CJK_Ext_F;CJK_Unified_Ideographs_Extension_F value;blk;CJK_Ext_G;CJK_Unified_Ideographs_Extension_G +value;blk;CJK_Ext_H;CJK_Unified_Ideographs_Extension_H value;blk;CJK_Radicals_Sup;CJK_Radicals_Supplement value;blk;CJK_Strokes;CJK_Strokes value;blk;CJK_Symbols;CJK_Symbols_And_Punctuation @@ -248,10 +251,12 @@ value;blk;Cyrillic;Cyrillic value;blk;Cyrillic_Ext_A;Cyrillic_Extended_A value;blk;Cyrillic_Ext_B;Cyrillic_Extended_B value;blk;Cyrillic_Ext_C;Cyrillic_Extended_C +value;blk;Cyrillic_Ext_D;Cyrillic_Extended_D value;blk;Cyrillic_Sup;Cyrillic_Supplement;Cyrillic_Supplementary value;blk;Deseret;Deseret value;blk;Devanagari;Devanagari value;blk;Devanagari_Ext;Devanagari_Extended +value;blk;Devanagari_Ext_A;Devanagari_Extended_A value;blk;Diacriticals;Combining_Diacritical_Marks value;blk;Diacriticals_Ext;Combining_Diacritical_Marks_Extended value;blk;Diacriticals_For_Symbols;Combining_Diacritical_Marks_For_Symbols;Combining_Marks_For_Symbols @@ -313,6 +318,7 @@ value;blk;Jamo_Ext_A;Hangul_Jamo_Extended_A value;blk;Jamo_Ext_B;Hangul_Jamo_Extended_B value;blk;Javanese;Javanese value;blk;Kaithi;Kaithi +value;blk;Kaktovik_Numerals;Kaktovik_Numerals value;blk;Kana_Ext_A;Kana_Extended_A value;blk;Kana_Ext_B;Kana_Extended_B value;blk;Kana_Sup;Kana_Supplement @@ -321,6 +327,7 @@ value;blk;Kangxi;Kangxi_Radicals value;blk;Kannada;Kannada value;blk;Katakana;Katakana value;blk;Katakana_Ext;Katakana_Phonetic_Extensions +value;blk;Kawi;Kawi value;blk;Kayah_Li;Kayah_Li value;blk;Kharoshthi;Kharoshthi value;blk;Khitan_Small_Script;Khitan_Small_Script @@ -387,6 +394,7 @@ value;blk;Myanmar_Ext_B;Myanmar_Extended_B value;blk;NB;No_Block value;blk;NKo;NKo value;blk;Nabataean;Nabataean +value;blk;Nag_Mundari;Nag_Mundari value;blk;Nandinagari;Nandinagari value;blk;New_Tai_Lue;New_Tai_Lue value;blk;Newa;Newa @@ -1048,6 +1056,7 @@ value;sc;Jpan;Jpan value;sc;Jurc;Jurc value;sc;Kali;Kayah_Li value;sc;Kana;Katakana +value;sc;Kawi;Kawi value;sc;Khar;Kharoshthi value;sc;Khmr;Khmer value;sc;Khoj;Khojki @@ -1087,6 +1096,7 @@ value;sc;Mroo;Mro value;sc;Mtei;Meetei_Mayek value;sc;Mult;Multani value;sc;Mymr;Myanmar +value;sc;Nagm;Nag_Mundari value;sc;Nand;Nandinagari value;sc;Narb;Old_North_Arabian value;sc;Nbat;Nabataean @@ -1287,7 +1297,7 @@ cp;0015;bc=BN;ea=N;GCB=CN;-Gr_Base;lb=CM;Name_Alias=control=NEGATIVE ACKNOWLEDGE cp;0016;bc=BN;ea=N;GCB=CN;-Gr_Base;lb=CM;Name_Alias=control=SYNCHRONOUS IDLE,abbreviation=SYN cp;0017;bc=BN;ea=N;GCB=CN;-Gr_Base;lb=CM;Name_Alias=control=END OF TRANSMISSION BLOCK,abbreviation=ETB cp;0018;bc=BN;ea=N;GCB=CN;-Gr_Base;lb=CM;Name_Alias=control=CANCEL,abbreviation=CAN -cp;0019;bc=BN;ea=N;GCB=CN;-Gr_Base;lb=CM;Name_Alias=control=END OF MEDIUM,abbreviation=EOM +cp;0019;bc=BN;ea=N;GCB=CN;-Gr_Base;lb=CM;Name_Alias=control=END OF MEDIUM,abbreviation=EOM,abbreviation=EM cp;001A;bc=BN;ea=N;GCB=CN;-Gr_Base;lb=CM;Name_Alias=control=SUBSTITUTE,abbreviation=SUB cp;001B;bc=BN;ea=N;GCB=CN;-Gr_Base;lb=CM;Name_Alias=control=ESCAPE,abbreviation=ESC cp;001C;bc=B;ea=N;GCB=CN;-Gr_Base;lb=CM;Name_Alias=control=INFORMATION SEPARATOR FOUR,control=FILE SEPARATOR,abbreviation=FS @@ -3895,8 +3905,8 @@ cp;0950;InSC=Other;na=DEVANAGARI OM cp;0951;-Alpha;bc=NSM;ccc=230;CI;Dia;gc=Mn;GCB=EX;-Gr_Base;Gr_Ext;-IDS;InPC=Top;InSC=Cantillation_Mark;jt=T;lb=CM;na=DEVANAGARI STRESS SIGN UDATTA;SB=EX;sc=Zinh;scx=Beng Deva Gran Gujr Guru Knda Latn Mlym Orya Shrd Taml Telu Tirh;WB=Extend;-XIDS cp;0952;-Alpha;bc=NSM;ccc=220;CI;Dia;gc=Mn;GCB=EX;-Gr_Base;Gr_Ext;-IDS;InPC=Bottom;InSC=Cantillation_Mark;jt=T;lb=CM;na=DEVANAGARI STRESS SIGN ANUDATTA;SB=EX;sc=Zinh;scx=Beng Deva Gran Gujr Guru Knda Latn Mlym Orya Taml Telu Tirh;WB=Extend;-XIDS # Accent marks -cp;0953;-Alpha;bc=NSM;ccc=230;CI;Dia;gc=Mn;GCB=EX;-Gr_Base;Gr_Ext;-IDS;InPC=Top;InSC=Other;jt=T;lb=CM;na=DEVANAGARI GRAVE ACCENT;SB=EX;sc=Zinh;WB=Extend;-XIDS -cp;0954;-Alpha;bc=NSM;ccc=230;CI;Dia;gc=Mn;GCB=EX;-Gr_Base;Gr_Ext;-IDS;InPC=Top;InSC=Other;jt=T;lb=CM;na=DEVANAGARI ACUTE ACCENT;SB=EX;sc=Zinh;WB=Extend;-XIDS +cp;0953;-Alpha;bc=NSM;ccc=230;CI;Dia;gc=Mn;GCB=EX;-Gr_Base;Gr_Ext;-IDS;InSC=Other;jt=T;lb=CM;na=DEVANAGARI GRAVE ACCENT;SB=EX;sc=Zinh;WB=Extend;-XIDS +cp;0954;-Alpha;bc=NSM;ccc=230;CI;Dia;gc=Mn;GCB=EX;-Gr_Base;Gr_Ext;-IDS;InSC=Other;jt=T;lb=CM;na=DEVANAGARI ACUTE ACCENT;SB=EX;sc=Zinh;WB=Extend;-XIDS # Dependent vowel sign cp;0955;age=5.2;bc=NSM;CI;gc=Mn;GCB=EX;-Gr_Base;Gr_Ext;-IDS;InPC=Top;InSC=Vowel_Dependent;jt=T;lb=CM;na=DEVANAGARI VOWEL SIGN CANDRA LONG E;SB=EX;WB=Extend;-XIDS # Dependent vowel signs for Kashmiri @@ -4317,7 +4327,7 @@ unassigned;0AF2..0AF8 cp;0AF9;age=8.0;na=GUJARATI LETTER ZHA # Transliteration signs cp;0AFA;age=10.0;bc=NSM;CI;gc=Mn;GCB=EX;-Gr_Base;Gr_Ext;-IDS;InPC=Top;InSC=Cantillation_Mark;jt=T;lb=CM;na=GUJARATI SIGN SUKUN;SB=EX;WB=Extend;-XIDS -cp;0AFB;age=10.0;bc=NSM;CI;gc=Mn;GCB=EX;-Gr_Base;Gr_Ext;-IDS;InPC=Top;InSC=Cantillation_Mark;jt=T;lb=CM;na=GUJARATI SIGN SHADDA;SB=EX;WB=Extend;-XIDS +cp;0AFB;age=10.0;bc=NSM;CI;gc=Mn;GCB=EX;-Gr_Base;Gr_Ext;-IDS;InPC=Top;InSC=Gemination_Mark;jt=T;lb=CM;na=GUJARATI SIGN SHADDA;SB=EX;WB=Extend;-XIDS cp;0AFC;age=10.0;bc=NSM;CI;gc=Mn;GCB=EX;-Gr_Base;Gr_Ext;-IDS;InPC=Top;InSC=Cantillation_Mark;jt=T;lb=CM;na=GUJARATI SIGN MADDAH;SB=EX;WB=Extend;-XIDS cp;0AFD;age=10.0;-Alpha;bc=NSM;CI;Dia;gc=Mn;GCB=EX;-Gr_Base;Gr_Ext;-IDS;InPC=Top;InSC=Nukta;jt=T;lb=CM;na=GUJARATI SIGN THREE-DOT NUKTA ABOVE;SB=EX;WB=Extend;-XIDS cp;0AFE;age=10.0;-Alpha;bc=NSM;CI;Dia;gc=Mn;GCB=EX;-Gr_Base;Gr_Ext;-IDS;InPC=Top;InSC=Nukta;jt=T;lb=CM;na=GUJARATI SIGN CIRCLE NUKTA ABOVE;SB=EX;WB=Extend;-XIDS @@ -4803,7 +4813,8 @@ unassigned;0CF0 # Signs used in Sanskrit cp;0CF1;age=5.0;InSC=Consonant_With_Stacker;na=KANNADA SIGN JIHVAMULIYA cp;0CF2;age=5.0;InSC=Consonant_With_Stacker;na=KANNADA SIGN UPADHMANIYA -unassigned;0CF3..0CFF +cp;0CF3;age=15.0;gc=Mc;GCB=SM;-IDS;InPC=Right;InSC=Bindu;lb=CM;na=KANNADA SIGN COMBINING ANUSVARA ABOVE RIGHT;SB=EX;WB=Extend;-XIDS +unassigned;0CF4..0CFF block;0D00..0D7F;age=1.1;Alpha;blk=Malayalam;gc=Lo;Gr_Base;IDC;IDS;InSC=Consonant;lb=AL;SB=LE;sc=Mlym;WB=LE;XIDC;XIDS # 0D00..0D7F Malayalam @@ -5265,7 +5276,8 @@ cp;0ECB;-Alpha;bc=NSM;ccc=122;CI;Dia;gc=Mn;GCB=EX;-Gr_Base;Gr_Ext;-IDS;InPC=Top; # Signs cp;0ECC;-Alpha;bc=NSM;CI;Dia;gc=Mn;GCB=EX;-Gr_Base;Gr_Ext;-IDS;InPC=Top;InSC=Other;jt=T;na=LAO CANCELLATION MARK;SB=EX;WB=Extend;-XIDS cp;0ECD;bc=NSM;CI;gc=Mn;GCB=EX;-Gr_Base;Gr_Ext;-IDS;InPC=Top;InSC=Bindu;jt=T;na=LAO NIGGAHITA;SB=EX;WB=Extend;-XIDS -unassigned;0ECE..0ECF +cp;0ECE;age=15.0;-Alpha;bc=NSM;CI;gc=Mn;GCB=EX;-Gr_Base;Gr_Ext;-IDS;InPC=Top;InSC=Syllable_Modifier;jt=T;na=LAO YAMAKKAN;SB=EX;WB=Extend;-XIDS +unassigned;0ECF # Digits cp;0ED0;-Alpha;gc=Nd;-IDS;InSC=Number;lb=NU;na=LAO DIGIT ZERO;nt=De;nv=0;SB=NU;WB=NU;-XIDS cp;0ED1;-Alpha;gc=Nd;-IDS;InSC=Number;lb=NU;na=LAO DIGIT ONE;nt=De;nv=1;SB=NU;WB=NU;-XIDS @@ -8595,7 +8607,7 @@ cp;1BBA;age=6.1;InSC=Avagraha;na=SUNDANESE AVAGRAHA # Historic letters cp;1BBB;age=6.1;na=SUNDANESE LETTER REU cp;1BBC;age=6.1;na=SUNDANESE LETTER LEU -cp;1BBD;age=6.1;na=SUNDANESE LETTER BHA +cp;1BBD;age=6.1;na=SUNDANESE LETTER BHA;Name_Alias=correction=SUNDANESE LETTER ARCHAIC I cp;1BBE;age=6.1;InSC=Consonant_Final;na=SUNDANESE LETTER FINAL K cp;1BBF;age=6.1;InSC=Consonant_Final;na=SUNDANESE LETTER FINAL M @@ -17847,11 +17859,11 @@ cp;A91E;na=KAYAH LI LETTER THA cp;A91F;na=KAYAH LI LETTER HA cp;A920;na=KAYAH LI LETTER VA cp;A921;na=KAYAH LI LETTER CA +# Vowels cp;A922;InSC=Vowel;na=KAYAH LI LETTER A cp;A923;InSC=Vowel;na=KAYAH LI LETTER OE cp;A924;InSC=Vowel;na=KAYAH LI LETTER I cp;A925;InSC=Vowel;na=KAYAH LI LETTER OO -# Vowels cp;A926;bc=NSM;CI;gc=Mn;GCB=EX;-Gr_Base;Gr_Ext;-IDS;InSC=Vowel;jt=T;lb=CM;na=KAYAH LI VOWEL UE;SB=EX;WB=Extend;-XIDS cp;A927;bc=NSM;CI;gc=Mn;GCB=EX;-Gr_Base;Gr_Ext;-IDS;InSC=Vowel;jt=T;lb=CM;na=KAYAH LI VOWEL E;SB=EX;WB=Extend;-XIDS cp;A928;bc=NSM;CI;gc=Mn;GCB=EX;-Gr_Base;Gr_Ext;-IDS;InSC=Vowel;jt=T;lb=CM;na=KAYAH LI VOWEL U;SB=EX;WB=Extend;-XIDS @@ -24126,8 +24138,13 @@ cp;10EB0;na=YEZIDI LETTER LAM WITH DOT ABOVE cp;10EB1;na=YEZIDI LETTER YOT WITH CIRCUMFLEX ABOVE unassigned;10EB2..10EBF;bc=R -# No block -unassigned;10EC0..10EFF;bc=R +block;10EC0..10EFF;age=15.0;bc=NSM;blk=Arabic_Ext_C;ccc=220;CI;Dia;gc=Mn;GCB=EX;Gr_Ext;IDC;jt=T;lb=CM;SB=EX;sc=Arab;WB=Extend;XIDC +# 10EC0..10EFF Arabic Extended-C +unassigned;10EC0..10EFC;bc=AL +# Quranic marks used in Turkey +cp;10EFD;na=ARABIC SMALL LOW WORD SAKTA +cp;10EFE;na=ARABIC SMALL LOW WORD QASR +cp;10EFF;na=ARABIC SMALL LOW WORD MADDA block;10F00..10F2F;age=11.0;Alpha;bc=R;blk=Old_Sogdian;gc=Lo;Gr_Base;IDC;IDS;lb=AL;SB=LE;sc=Sogo;WB=LE;XIDC;XIDS # 10F00..10F2F Old Sogdian @@ -24928,7 +24945,13 @@ cp;1123C;-Alpha;gc=Po;-IDC;-IDS;InSC=Other;lb=BA;na=KHOJKI DOUBLE SECTION MARK;S cp;1123D;-Alpha;gc=Po;-IDC;-IDS;InSC=Other;na=KHOJKI ABBREVIATION SIGN;SB=XX;WB=XX;-XIDC;-XIDS # Sign cp;1123E;age=9.0;bc=NSM;CI;gc=Mn;GCB=EX;-Gr_Base;Gr_Ext;-IDS;InPC=Top;InSC=Cantillation_Mark;jt=T;lb=CM;na=KHOJKI SIGN SUKUN;SB=EX;WB=Extend;-XIDS -unassigned;1123F..1124F +# Consonant +cp;1123F;age=15.0;na=KHOJKI LETTER QA +# Independent vowel +cp;11240;age=15.0;InSC=Vowel_Independent;na=KHOJKI LETTER SHORT I +# Dependent vowel sign +cp;11241;age=15.0;bc=NSM;CI;gc=Mn;GCB=EX;-Gr_Base;Gr_Ext;-IDS;InPC=Bottom;InSC=Vowel_Dependent;jt=T;lb=CM;na=KHOJKI VOWEL SIGN VOCALIC R;SB=EX;WB=Extend;-XIDS +unassigned;11242..1124F block;11280..112AF;age=8.0;Alpha;blk=Multani;gc=Lo;Gr_Base;IDC;IDS;InSC=Consonant;lb=AL;SB=LE;sc=Mult;WB=LE;XIDC;XIDS # 11280..112AF Multani @@ -26368,6 +26391,22 @@ cp;11AF7;na=PAU CIN HAU LOW-FALLING TONE FINAL cp;11AF8;na=PAU CIN HAU GLOTTAL STOP FINAL unassigned;11AF9..11AFF +block;11B00..11B5F;age=15.0;blk=Devanagari_Ext_A;gc=Po;Gr_Base;lb=BB;sc=Deva +# 11B00..11B5F Devanagari Extended-A +# Head marks +cp;11B00;na=DEVANAGARI HEAD MARK +cp;11B01;na=DEVANAGARI HEAD MARK WITH HEADSTROKE +# Auspicious signs +cp;11B02;na=DEVANAGARI SIGN BHALE +cp;11B03;na=DEVANAGARI SIGN BHALE WITH HOOK +cp;11B04;na=DEVANAGARI SIGN EXTENDED BHALE +cp;11B05;na=DEVANAGARI SIGN EXTENDED BHALE WITH HOOK +cp;11B06;na=DEVANAGARI SIGN WESTERN FIVE-LIKE BHALE +cp;11B07;na=DEVANAGARI SIGN WESTERN NINE-LIKE BHALE +cp;11B08;na=DEVANAGARI SIGN REVERSED NINE-LIKE BHALE +cp;11B09;na=DEVANAGARI SIGN MINDU +unassigned;11B0A..11B5F + block;11C00..11C6F;age=9.0;Alpha;blk=Bhaiksuki;gc=Lo;Gr_Base;IDC;InSC=Consonant;lb=AL;SB=LE;sc=Bhks;WB=LE;XIDC # 11C00..11C6F Bhaiksuki # Independent vowels @@ -26764,6 +26803,105 @@ cp;11EF7;-Alpha;gc=Po;-IDC;-IDS;InSC=Other;na=MAKASAR PASSIMBANG;SB=ST;STerm;Ter cp;11EF8;-Alpha;gc=Po;-IDC;-IDS;InSC=Other;na=MAKASAR END OF SECTION;SB=ST;STerm;Term;WB=XX;-XIDC;-XIDS unassigned;11EF9..11EFF +block;11F00..11F5F;age=15.0;Alpha;blk=Kawi;gc=Lo;Gr_Base;IDC;InSC=Consonant;lb=AL;SB=LE;sc=Kawi;WB=LE;XIDC;XIDS +# 11F00..11F5F Kawi +# Signs +cp;11F00;bc=NSM;CI;gc=Mn;GCB=EX;-Gr_Base;Gr_Ext;InPC=Top;InSC=Bindu;jt=T;lb=CM;na=KAWI SIGN CANDRABINDU;SB=EX;WB=Extend;-XIDS +cp;11F01;bc=NSM;CI;gc=Mn;GCB=EX;-Gr_Base;Gr_Ext;InPC=Top;InSC=Bindu;jt=T;lb=CM;na=KAWI SIGN ANUSVARA;SB=EX;WB=Extend;-XIDS +cp;11F02;GCB=PP;IDS;InPC=Top;InSC=Consonant_Preceding_Repha;na=KAWI SIGN REPHA +cp;11F03;gc=Mc;GCB=SM;InPC=Right;InSC=Visarga;lb=CM;na=KAWI SIGN VISARGA;SB=EX;WB=Extend;-XIDS +# Independent vowels +cp;11F04;IDS;InSC=Vowel_Independent;na=KAWI LETTER A +cp;11F05;IDS;InSC=Vowel_Independent;na=KAWI LETTER AA +cp;11F06;IDS;InSC=Vowel_Independent;na=KAWI LETTER I +cp;11F07;IDS;InSC=Vowel_Independent;na=KAWI LETTER II +cp;11F08;IDS;InSC=Vowel_Independent;na=KAWI LETTER U +cp;11F09;IDS;InSC=Vowel_Independent;na=KAWI LETTER UU +cp;11F0A;IDS;InSC=Vowel_Independent;na=KAWI LETTER VOCALIC R +cp;11F0B;IDS;InSC=Vowel_Independent;na=KAWI LETTER VOCALIC RR +cp;11F0C;IDS;InSC=Vowel_Independent;na=KAWI LETTER VOCALIC L +cp;11F0D;IDS;InSC=Vowel_Independent;na=KAWI LETTER VOCALIC LL +cp;11F0E;IDS;InSC=Vowel_Independent;na=KAWI LETTER E +cp;11F0F;IDS;InSC=Vowel_Independent;na=KAWI LETTER AI +cp;11F10;IDS;InSC=Vowel_Independent;na=KAWI LETTER O +unassigned;11F11 +# Consonants +cp;11F12;IDS;na=KAWI LETTER KA +cp;11F13;IDS;na=KAWI LETTER KHA +cp;11F14;IDS;na=KAWI LETTER GA +cp;11F15;IDS;na=KAWI LETTER GHA +cp;11F16;IDS;na=KAWI LETTER NGA +cp;11F17;IDS;na=KAWI LETTER CA +cp;11F18;IDS;na=KAWI LETTER CHA +cp;11F19;IDS;na=KAWI LETTER JA +cp;11F1A;IDS;na=KAWI LETTER JHA +cp;11F1B;IDS;na=KAWI LETTER NYA +cp;11F1C;IDS;na=KAWI LETTER TTA +cp;11F1D;IDS;na=KAWI LETTER TTHA +cp;11F1E;IDS;na=KAWI LETTER DDA +cp;11F1F;IDS;na=KAWI LETTER DDHA +cp;11F20;IDS;na=KAWI LETTER NNA +cp;11F21;IDS;na=KAWI LETTER TA +cp;11F22;IDS;na=KAWI LETTER THA +cp;11F23;IDS;na=KAWI LETTER DA +cp;11F24;IDS;na=KAWI LETTER DHA +cp;11F25;IDS;na=KAWI LETTER NA +cp;11F26;IDS;na=KAWI LETTER PA +cp;11F27;IDS;na=KAWI LETTER PHA +cp;11F28;IDS;na=KAWI LETTER BA +cp;11F29;IDS;na=KAWI LETTER BHA +cp;11F2A;IDS;na=KAWI LETTER MA +cp;11F2B;IDS;na=KAWI LETTER YA +cp;11F2C;IDS;na=KAWI LETTER RA +cp;11F2D;IDS;na=KAWI LETTER LA +cp;11F2E;IDS;na=KAWI LETTER WA +cp;11F2F;IDS;na=KAWI LETTER SHA +cp;11F30;IDS;na=KAWI LETTER SSA +cp;11F31;IDS;na=KAWI LETTER SA +cp;11F32;IDS;na=KAWI LETTER HA +cp;11F33;IDS;na=KAWI LETTER JNYA +# Dependent vowel signs +cp;11F34;gc=Mc;GCB=SM;InPC=Right;InSC=Vowel_Dependent;lb=CM;na=KAWI VOWEL SIGN AA;SB=EX;WB=Extend;-XIDS +cp;11F35;gc=Mc;GCB=SM;InPC=Right;InSC=Vowel_Dependent;lb=CM;na=KAWI VOWEL SIGN ALTERNATE AA;SB=EX;WB=Extend;-XIDS +cp;11F36;bc=NSM;CI;gc=Mn;GCB=EX;-Gr_Base;Gr_Ext;InPC=Top;InSC=Vowel_Dependent;jt=T;lb=CM;na=KAWI VOWEL SIGN I;SB=EX;WB=Extend;-XIDS +cp;11F37;bc=NSM;CI;gc=Mn;GCB=EX;-Gr_Base;Gr_Ext;InPC=Top;InSC=Vowel_Dependent;jt=T;lb=CM;na=KAWI VOWEL SIGN II;SB=EX;WB=Extend;-XIDS +cp;11F38;bc=NSM;CI;gc=Mn;GCB=EX;-Gr_Base;Gr_Ext;InPC=Bottom;InSC=Vowel_Dependent;jt=T;lb=CM;na=KAWI VOWEL SIGN U;SB=EX;WB=Extend;-XIDS +cp;11F39;bc=NSM;CI;gc=Mn;GCB=EX;-Gr_Base;Gr_Ext;InPC=Bottom;InSC=Vowel_Dependent;jt=T;lb=CM;na=KAWI VOWEL SIGN UU;SB=EX;WB=Extend;-XIDS +cp;11F3A;bc=NSM;CI;gc=Mn;GCB=EX;-Gr_Base;Gr_Ext;InPC=Bottom;InSC=Vowel_Dependent;jt=T;lb=CM;na=KAWI VOWEL SIGN VOCALIC R;SB=EX;WB=Extend;-XIDS +unassigned;11F3B..11F3D +cp;11F3E;gc=Mc;GCB=SM;InPC=Left;InSC=Vowel_Dependent;lb=CM;na=KAWI VOWEL SIGN E;SB=EX;WB=Extend;-XIDS +cp;11F3F;gc=Mc;GCB=SM;InPC=Left;InSC=Vowel_Dependent;lb=CM;na=KAWI VOWEL SIGN AI;SB=EX;WB=Extend;-XIDS +cp;11F40;bc=NSM;CI;gc=Mn;GCB=EX;-Gr_Base;Gr_Ext;InPC=Top;InSC=Vowel_Dependent;jt=T;lb=CM;na=KAWI VOWEL SIGN EU;SB=EX;WB=Extend;-XIDS +# Viramas +cp;11F41;-Alpha;ccc=9;gc=Mc;GCB=SM;Gr_Link;InPC=Right;InSC=Pure_Killer;lb=CM;na=KAWI SIGN KILLER;SB=EX;WB=Extend;-XIDS +cp;11F42;-Alpha;bc=NSM;ccc=9;CI;gc=Mn;GCB=EX;-Gr_Base;Gr_Ext;Gr_Link;InSC=Invisible_Stacker;jt=T;lb=CM;na=KAWI CONJOINER;SB=EX;WB=Extend;-XIDS +# Punctuation +cp;11F43;-Alpha;gc=Po;-IDC;InSC=Other;lb=BA;na=KAWI DANDA;SB=ST;STerm;Term;WB=XX;-XIDC;-XIDS +cp;11F44;-Alpha;gc=Po;-IDC;InSC=Other;lb=BA;na=KAWI DOUBLE DANDA;SB=ST;STerm;Term;WB=XX;-XIDC;-XIDS +cp;11F45;-Alpha;gc=Po;-IDC;InSC=Other;lb=ID;na=KAWI PUNCTUATION SECTION MARKER;SB=XX;WB=XX;-XIDC;-XIDS +cp;11F46;-Alpha;gc=Po;-IDC;InSC=Other;lb=ID;na=KAWI PUNCTUATION ALTERNATE SECTION MARKER;SB=XX;WB=XX;-XIDC;-XIDS +cp;11F47;-Alpha;gc=Po;-IDC;InSC=Other;lb=ID;na=KAWI PUNCTUATION FLOWER;SB=XX;WB=XX;-XIDC;-XIDS +cp;11F48;-Alpha;gc=Po;-IDC;InSC=Other;lb=ID;na=KAWI PUNCTUATION SPACE FILLER;SB=XX;WB=XX;-XIDC;-XIDS +cp;11F49;-Alpha;gc=Po;-IDC;InSC=Other;lb=ID;na=KAWI PUNCTUATION DOT;SB=XX;WB=XX;-XIDC;-XIDS +cp;11F4A;-Alpha;gc=Po;-IDC;InSC=Other;lb=ID;na=KAWI PUNCTUATION DOUBLE DOT;SB=XX;WB=XX;-XIDC;-XIDS +cp;11F4B;-Alpha;gc=Po;-IDC;InSC=Other;lb=ID;na=KAWI PUNCTUATION TRIPLE DOT;SB=XX;WB=XX;-XIDC;-XIDS +cp;11F4C;-Alpha;gc=Po;-IDC;InSC=Other;lb=ID;na=KAWI PUNCTUATION CIRCLE;SB=XX;WB=XX;-XIDC;-XIDS +cp;11F4D;-Alpha;gc=Po;-IDC;InSC=Other;lb=ID;na=KAWI PUNCTUATION FILLED CIRCLE;SB=XX;WB=XX;-XIDC;-XIDS +cp;11F4E;-Alpha;gc=Po;-IDC;InSC=Other;lb=ID;na=KAWI PUNCTUATION SPIRAL;SB=XX;WB=XX;-XIDC;-XIDS +cp;11F4F;-Alpha;gc=Po;-IDC;InSC=Other;lb=ID;na=KAWI PUNCTUATION CLOSING SPIRAL;SB=XX;WB=XX;-XIDC;-XIDS +# Digits +cp;11F50;-Alpha;gc=Nd;InSC=Number;lb=NU;na=KAWI DIGIT ZERO;nt=De;nv=0;SB=NU;WB=NU;-XIDS +cp;11F51;-Alpha;gc=Nd;InSC=Number;lb=NU;na=KAWI DIGIT ONE;nt=De;nv=1;SB=NU;WB=NU;-XIDS +cp;11F52;-Alpha;gc=Nd;InSC=Number;lb=NU;na=KAWI DIGIT TWO;nt=De;nv=2;SB=NU;WB=NU;-XIDS +cp;11F53;-Alpha;gc=Nd;InSC=Number;lb=NU;na=KAWI DIGIT THREE;nt=De;nv=3;SB=NU;WB=NU;-XIDS +cp;11F54;-Alpha;gc=Nd;InSC=Number;lb=NU;na=KAWI DIGIT FOUR;nt=De;nv=4;SB=NU;WB=NU;-XIDS +cp;11F55;-Alpha;gc=Nd;InSC=Number;lb=NU;na=KAWI DIGIT FIVE;nt=De;nv=5;SB=NU;WB=NU;-XIDS +cp;11F56;-Alpha;gc=Nd;InSC=Number;lb=NU;na=KAWI DIGIT SIX;nt=De;nv=6;SB=NU;WB=NU;-XIDS +cp;11F57;-Alpha;gc=Nd;InSC=Number;lb=NU;na=KAWI DIGIT SEVEN;nt=De;nv=7;SB=NU;WB=NU;-XIDS +cp;11F58;-Alpha;gc=Nd;InSC=Number;lb=NU;na=KAWI DIGIT EIGHT;nt=De;nv=8;SB=NU;WB=NU;-XIDS +cp;11F59;-Alpha;gc=Nd;InSC=Number;lb=NU;na=KAWI DIGIT NINE;nt=De;nv=9;SB=NU;WB=NU;-XIDS +unassigned;11F5A..11F5F + block;11FB0..11FBF;age=13.0;Alpha;blk=Lisu_Sup;gc=Lo;Gr_Base;IDC;IDS;lb=AL;na=LISU LETTER YHA;SB=LE;sc=Lisu;WB=LE;XIDC;XIDS # 11FB0..11FBF Lisu Supplement # Letter @@ -29295,24 +29433,59 @@ cp;1342B;na=EGYPTIAN HIEROGLYPH AA029 cp;1342C;na=EGYPTIAN HIEROGLYPH AA030 cp;1342D;na=EGYPTIAN HIEROGLYPH AA031 cp;1342E;na=EGYPTIAN HIEROGLYPH AA032 -unassigned;1342F;vo=U +# Addition to group V +cp;1342F;age=15.0;na=EGYPTIAN HIEROGLYPH V011D -block;13430..1343F;age=12.0;blk=Egyptian_Hieroglyph_Format_Controls;CI;gc=Cf;GCB=CN;jt=T;lb=GL;SB=FO;sc=Egyp;vo=U;WB=FO -# 13430..1343F Egyptian Hieroglyph Format Controls +block;13430..1345F;age=15.0;blk=Egyptian_Hieroglyph_Format_Controls;CI;gc=Cf;GCB=CN;IDC;jt=T;lb=CM;SB=EX;sc=Egyp;vo=U;WB=Extend;XIDC +# 13430..1345F Egyptian Hieroglyph Format Controls # Joiners -cp;13430;na=EGYPTIAN HIEROGLYPH VERTICAL JOINER -cp;13431;na=EGYPTIAN HIEROGLYPH HORIZONTAL JOINER +cp;13430;age=12.0;-IDC;lb=GL;na=EGYPTIAN HIEROGLYPH VERTICAL JOINER;SB=FO;WB=FO;-XIDC +cp;13431;age=12.0;-IDC;lb=GL;na=EGYPTIAN HIEROGLYPH HORIZONTAL JOINER;SB=FO;WB=FO;-XIDC # Sign insertion controls -cp;13432;na=EGYPTIAN HIEROGLYPH INSERT AT TOP START -cp;13433;na=EGYPTIAN HIEROGLYPH INSERT AT BOTTOM START -cp;13434;na=EGYPTIAN HIEROGLYPH INSERT AT TOP END -cp;13435;na=EGYPTIAN HIEROGLYPH INSERT AT BOTTOM END +cp;13432;age=12.0;-IDC;lb=GL;na=EGYPTIAN HIEROGLYPH INSERT AT TOP START;SB=FO;WB=FO;-XIDC +cp;13433;age=12.0;-IDC;lb=GL;na=EGYPTIAN HIEROGLYPH INSERT AT BOTTOM START;SB=FO;WB=FO;-XIDC +cp;13434;age=12.0;-IDC;lb=GL;na=EGYPTIAN HIEROGLYPH INSERT AT TOP END;SB=FO;WB=FO;-XIDC +cp;13435;age=12.0;-IDC;lb=GL;na=EGYPTIAN HIEROGLYPH INSERT AT BOTTOM END;SB=FO;WB=FO;-XIDC # Sign stacking control -cp;13436;na=EGYPTIAN HIEROGLYPH OVERLAY MIDDLE +cp;13436;age=12.0;-IDC;lb=GL;na=EGYPTIAN HIEROGLYPH OVERLAY MIDDLE;SB=FO;WB=FO;-XIDC # Segment scoping delimiters -cp;13437;lb=OP;na=EGYPTIAN HIEROGLYPH BEGIN SEGMENT -cp;13438;lb=CL;na=EGYPTIAN HIEROGLYPH END SEGMENT -unassigned;13439..1343F;vo=U +cp;13437;age=12.0;-IDC;lb=OP;na=EGYPTIAN HIEROGLYPH BEGIN SEGMENT;SB=FO;WB=FO;-XIDC +cp;13438;age=12.0;-IDC;lb=CL;na=EGYPTIAN HIEROGLYPH END SEGMENT;SB=FO;WB=FO;-XIDC +# Sign insertion controls +cp;13439;-IDC;lb=GL;na=EGYPTIAN HIEROGLYPH INSERT AT MIDDLE;SB=FO;WB=FO;-XIDC +cp;1343A;-IDC;lb=GL;na=EGYPTIAN HIEROGLYPH INSERT AT TOP;SB=FO;WB=FO;-XIDC +cp;1343B;-IDC;lb=GL;na=EGYPTIAN HIEROGLYPH INSERT AT BOTTOM;SB=FO;WB=FO;-XIDC +# Enclosure controls +cp;1343C;-IDC;lb=OP;na=EGYPTIAN HIEROGLYPH BEGIN ENCLOSURE;SB=FO;WB=FO;-XIDC +cp;1343D;-IDC;lb=CL;na=EGYPTIAN HIEROGLYPH END ENCLOSURE;SB=FO;WB=FO;-XIDC +cp;1343E;-IDC;lb=OP;na=EGYPTIAN HIEROGLYPH BEGIN WALLED ENCLOSURE;SB=FO;WB=FO;-XIDC +cp;1343F;-IDC;lb=CL;na=EGYPTIAN HIEROGLYPH END WALLED ENCLOSURE;SB=FO;WB=FO;-XIDC +# Mirror control +cp;13440;bc=NSM;gc=Mn;GCB=EX;Gr_Ext;na=EGYPTIAN HIEROGLYPH MIRROR HORIZONTALLY +# Blank and lost signs +cp;13441;Alpha;-CI;gc=Lo;GCB=XX;Gr_Base;IDS;jt=U;lb=AL;na=EGYPTIAN HIEROGLYPH FULL BLANK;SB=LE;WB=LE;XIDS +cp;13442;Alpha;-CI;gc=Lo;GCB=XX;Gr_Base;IDS;jt=U;lb=AL;na=EGYPTIAN HIEROGLYPH HALF BLANK;SB=LE;WB=LE;XIDS +cp;13443;Alpha;-CI;gc=Lo;GCB=XX;Gr_Base;IDS;jt=U;lb=AL;na=EGYPTIAN HIEROGLYPH LOST SIGN;SB=LE;WB=LE;XIDS +cp;13444;Alpha;-CI;gc=Lo;GCB=XX;Gr_Base;IDS;jt=U;lb=AL;na=EGYPTIAN HIEROGLYPH HALF LOST SIGN;SB=LE;WB=LE;XIDS +cp;13445;Alpha;-CI;gc=Lo;GCB=XX;Gr_Base;IDS;jt=U;lb=AL;na=EGYPTIAN HIEROGLYPH TALL LOST SIGN;SB=LE;WB=LE;XIDS +cp;13446;Alpha;-CI;gc=Lo;GCB=XX;Gr_Base;IDS;jt=U;lb=AL;na=EGYPTIAN HIEROGLYPH WIDE LOST SIGN;SB=LE;WB=LE;XIDS +# Damage modifiers +cp;13447;bc=NSM;Dia;gc=Mn;GCB=EX;Gr_Ext;na=EGYPTIAN HIEROGLYPH MODIFIER DAMAGED AT TOP START +cp;13448;bc=NSM;Dia;gc=Mn;GCB=EX;Gr_Ext;na=EGYPTIAN HIEROGLYPH MODIFIER DAMAGED AT BOTTOM START +cp;13449;bc=NSM;Dia;gc=Mn;GCB=EX;Gr_Ext;na=EGYPTIAN HIEROGLYPH MODIFIER DAMAGED AT START +cp;1344A;bc=NSM;Dia;gc=Mn;GCB=EX;Gr_Ext;na=EGYPTIAN HIEROGLYPH MODIFIER DAMAGED AT TOP END +cp;1344B;bc=NSM;Dia;gc=Mn;GCB=EX;Gr_Ext;na=EGYPTIAN HIEROGLYPH MODIFIER DAMAGED AT TOP +cp;1344C;bc=NSM;Dia;gc=Mn;GCB=EX;Gr_Ext;na=EGYPTIAN HIEROGLYPH MODIFIER DAMAGED AT BOTTOM START AND TOP END +cp;1344D;bc=NSM;Dia;gc=Mn;GCB=EX;Gr_Ext;na=EGYPTIAN HIEROGLYPH MODIFIER DAMAGED AT START AND TOP +cp;1344E;bc=NSM;Dia;gc=Mn;GCB=EX;Gr_Ext;na=EGYPTIAN HIEROGLYPH MODIFIER DAMAGED AT BOTTOM END +cp;1344F;bc=NSM;Dia;gc=Mn;GCB=EX;Gr_Ext;na=EGYPTIAN HIEROGLYPH MODIFIER DAMAGED AT TOP START AND BOTTOM END +cp;13450;bc=NSM;Dia;gc=Mn;GCB=EX;Gr_Ext;na=EGYPTIAN HIEROGLYPH MODIFIER DAMAGED AT BOTTOM +cp;13451;bc=NSM;Dia;gc=Mn;GCB=EX;Gr_Ext;na=EGYPTIAN HIEROGLYPH MODIFIER DAMAGED AT START AND BOTTOM +cp;13452;bc=NSM;Dia;gc=Mn;GCB=EX;Gr_Ext;na=EGYPTIAN HIEROGLYPH MODIFIER DAMAGED AT END +cp;13453;bc=NSM;Dia;gc=Mn;GCB=EX;Gr_Ext;na=EGYPTIAN HIEROGLYPH MODIFIER DAMAGED AT TOP AND END +cp;13454;bc=NSM;Dia;gc=Mn;GCB=EX;Gr_Ext;na=EGYPTIAN HIEROGLYPH MODIFIER DAMAGED AT BOTTOM AND END +cp;13455;bc=NSM;Dia;gc=Mn;GCB=EX;Gr_Ext;na=EGYPTIAN HIEROGLYPH MODIFIER DAMAGED +unassigned;13456..1345F;vo=U block;14400..1467F;age=8.0;Alpha;blk=Anatolian_Hieroglyphs;gc=Lo;Gr_Base;IDC;IDS;lb=AL;SB=LE;sc=Hluw;vo=U;WB=LE;XIDC;XIDS # 14400..1467F Anatolian Hieroglyphs @@ -32729,13 +32902,17 @@ unassigned;1B123..1B12F;vo=U block;1B130..1B16F;age=12.0;Alpha;blk=Small_Kana_Ext;ea=W;gc=Lo;Gr_Base;IDC;IDS;lb=CJ;SB=LE;sc=Kana;vo=U;XIDC;XIDS # 1B130..1B16F Small Kana Extension -unassigned;1B130..1B14F;vo=U +unassigned;1B130..1B131;vo=U # Historic small hiragana letters +cp;1B132;age=15.0;na=HIRAGANA LETTER SMALL KO;sc=Hira +unassigned;1B133..1B14F;vo=U cp;1B150;na=HIRAGANA LETTER SMALL WI;sc=Hira cp;1B151;na=HIRAGANA LETTER SMALL WE;sc=Hira cp;1B152;na=HIRAGANA LETTER SMALL WO;sc=Hira -unassigned;1B153..1B163;vo=U +unassigned;1B153..1B154;vo=U # Historic small katakana letters +cp;1B155;age=15.0;na=KATAKANA LETTER SMALL KO;WB=KA +unassigned;1B156..1B163;vo=U cp;1B164;na=KATAKANA LETTER SMALL WI;WB=KA cp;1B165;na=KATAKANA LETTER SMALL WE;WB=KA cp;1B166;na=KATAKANA LETTER SMALL WO;WB=KA @@ -34152,6 +34329,31 @@ cp;1D244;bc=NSM;ccc=230;CI;gc=Mn;GCB=EX;-Gr_Base;Gr_Ext;IDC;jt=T;lb=CM;na=COMBIN cp;1D245;na=GREEK MUSICAL LEIMMA unassigned;1D246..1D24F +block;1D2C0..1D2DF;age=15.0;bc=ON;blk=Kaktovik_Numerals;gc=No;Gr_Base;lb=AL;nt=Nu;sc=Zyyy +# 1D2C0..1D2DF Kaktovik Numerals +# Numerals +cp;1D2C0;na=KAKTOVIK NUMERAL ZERO;nv=0 +cp;1D2C1;na=KAKTOVIK NUMERAL ONE;nv=1 +cp;1D2C2;na=KAKTOVIK NUMERAL TWO;nv=2 +cp;1D2C3;na=KAKTOVIK NUMERAL THREE;nv=3 +cp;1D2C4;na=KAKTOVIK NUMERAL FOUR;nv=4 +cp;1D2C5;na=KAKTOVIK NUMERAL FIVE;nv=5 +cp;1D2C6;na=KAKTOVIK NUMERAL SIX;nv=6 +cp;1D2C7;na=KAKTOVIK NUMERAL SEVEN;nv=7 +cp;1D2C8;na=KAKTOVIK NUMERAL EIGHT;nv=8 +cp;1D2C9;na=KAKTOVIK NUMERAL NINE;nv=9 +cp;1D2CA;na=KAKTOVIK NUMERAL TEN;nv=10 +cp;1D2CB;na=KAKTOVIK NUMERAL ELEVEN;nv=11 +cp;1D2CC;na=KAKTOVIK NUMERAL TWELVE;nv=12 +cp;1D2CD;na=KAKTOVIK NUMERAL THIRTEEN;nv=13 +cp;1D2CE;na=KAKTOVIK NUMERAL FOURTEEN;nv=14 +cp;1D2CF;na=KAKTOVIK NUMERAL FIFTEEN;nv=15 +cp;1D2D0;na=KAKTOVIK NUMERAL SIXTEEN;nv=16 +cp;1D2D1;na=KAKTOVIK NUMERAL SEVENTEEN;nv=17 +cp;1D2D2;na=KAKTOVIK NUMERAL EIGHTEEN;nv=18 +cp;1D2D3;na=KAKTOVIK NUMERAL NINETEEN;nv=19 +unassigned;1D2D4..1D2DF + block;1D2E0..1D2FF;age=11.0;blk=Mayan_Numerals;gc=No;Gr_Base;lb=AL;nt=Nu;sc=Zyyy;vo=U # 1D2E0..1D2FF Mayan Numerals # Mayan numerals @@ -36089,7 +36291,15 @@ cp;1DF1C;na=LATIN SMALL LETTER TESH DIGRAPH WITH RETROFLEX HOOK cp;1DF1D;na=LATIN SMALL LETTER C WITH RETROFLEX HOOK # IPA extension cp;1DF1E;na=LATIN SMALL LETTER S WITH CURL -unassigned;1DF1F..1DFFF +unassigned;1DF1F..1DF24 +# Letters for Malayalam transliteration +cp;1DF25;age=15.0;na=LATIN SMALL LETTER D WITH MID-HEIGHT LEFT HOOK +cp;1DF26;age=15.0;na=LATIN SMALL LETTER L WITH MID-HEIGHT LEFT HOOK +cp;1DF27;age=15.0;na=LATIN SMALL LETTER N WITH MID-HEIGHT LEFT HOOK +cp;1DF28;age=15.0;na=LATIN SMALL LETTER R WITH MID-HEIGHT LEFT HOOK +cp;1DF29;age=15.0;na=LATIN SMALL LETTER S WITH MID-HEIGHT LEFT HOOK +cp;1DF2A;age=15.0;na=LATIN SMALL LETTER T WITH MID-HEIGHT LEFT HOOK +unassigned;1DF2B..1DFFF block;1E000..1E02F;age=9.0;Alpha;bc=NSM;blk=Glagolitic_Sup;ccc=230;CI;gc=Mn;GCB=EX;Gr_Ext;IDC;jt=T;lb=CM;SB=EX;sc=Glag;WB=Extend;XIDC # 1E000..1E02F Glagolitic Supplement @@ -36138,6 +36348,77 @@ cp;1E029;na=COMBINING GLAGOLITIC LETTER IOTATED BIG YUS cp;1E02A;na=COMBINING GLAGOLITIC LETTER FITA unassigned;1E02B..1E02F +block;1E030..1E08F;age=15.0;Alpha;blk=Cyrillic_Ext_D;Cased;CI;CWKCF;Dia;dt=Sup;gc=Lm;Gr_Base;IDC;IDS;lb=AL;Lower;NFKC_QC=N;NFKD_QC=N;SB=LO;sc=Cyrl;WB=LE;XIDC;XIDS +# 1E030..1E08F Cyrillic Extended-D +# Superscript modifier letters +cp;1E030;dm=0430;na=MODIFIER LETTER CYRILLIC SMALL A;NFKC_CF=0430 +cp;1E031;dm=0431;na=MODIFIER LETTER CYRILLIC SMALL BE;NFKC_CF=0431 +cp;1E032;dm=0432;na=MODIFIER LETTER CYRILLIC SMALL VE;NFKC_CF=0432 +cp;1E033;dm=0433;na=MODIFIER LETTER CYRILLIC SMALL GHE;NFKC_CF=0433 +cp;1E034;dm=0434;na=MODIFIER LETTER CYRILLIC SMALL DE;NFKC_CF=0434 +cp;1E035;dm=0435;na=MODIFIER LETTER CYRILLIC SMALL IE;NFKC_CF=0435 +cp;1E036;dm=0436;na=MODIFIER LETTER CYRILLIC SMALL ZHE;NFKC_CF=0436 +cp;1E037;dm=0437;na=MODIFIER LETTER CYRILLIC SMALL ZE;NFKC_CF=0437 +cp;1E038;dm=0438;na=MODIFIER LETTER CYRILLIC SMALL I;NFKC_CF=0438 +cp;1E039;dm=043A;na=MODIFIER LETTER CYRILLIC SMALL KA;NFKC_CF=043A +cp;1E03A;dm=043B;na=MODIFIER LETTER CYRILLIC SMALL EL;NFKC_CF=043B +cp;1E03B;dm=043C;na=MODIFIER LETTER CYRILLIC SMALL EM;NFKC_CF=043C +cp;1E03C;dm=043E;na=MODIFIER LETTER CYRILLIC SMALL O;NFKC_CF=043E +cp;1E03D;dm=043F;na=MODIFIER LETTER CYRILLIC SMALL PE;NFKC_CF=043F +cp;1E03E;dm=0440;na=MODIFIER LETTER CYRILLIC SMALL ER;NFKC_CF=0440 +cp;1E03F;dm=0441;na=MODIFIER LETTER CYRILLIC SMALL ES;NFKC_CF=0441 +cp;1E040;dm=0442;na=MODIFIER LETTER CYRILLIC SMALL TE;NFKC_CF=0442 +cp;1E041;dm=0443;na=MODIFIER LETTER CYRILLIC SMALL U;NFKC_CF=0443 +cp;1E042;dm=0444;na=MODIFIER LETTER CYRILLIC SMALL EF;NFKC_CF=0444 +cp;1E043;dm=0445;na=MODIFIER LETTER CYRILLIC SMALL HA;NFKC_CF=0445 +cp;1E044;dm=0446;na=MODIFIER LETTER CYRILLIC SMALL TSE;NFKC_CF=0446 +cp;1E045;dm=0447;na=MODIFIER LETTER CYRILLIC SMALL CHE;NFKC_CF=0447 +cp;1E046;dm=0448;na=MODIFIER LETTER CYRILLIC SMALL SHA;NFKC_CF=0448 +cp;1E047;dm=044B;na=MODIFIER LETTER CYRILLIC SMALL YERU;NFKC_CF=044B +cp;1E048;dm=044D;na=MODIFIER LETTER CYRILLIC SMALL E;NFKC_CF=044D +cp;1E049;dm=044E;na=MODIFIER LETTER CYRILLIC SMALL YU;NFKC_CF=044E +cp;1E04A;dm=A689;na=MODIFIER LETTER CYRILLIC SMALL DZZE;NFKC_CF=A689 +cp;1E04B;dm=04D9;na=MODIFIER LETTER CYRILLIC SMALL SCHWA;NFKC_CF=04D9 +cp;1E04C;dm=0456;na=MODIFIER LETTER CYRILLIC SMALL BYELORUSSIAN-UKRAINIAN I;NFKC_CF=0456 +cp;1E04D;dm=0458;na=MODIFIER LETTER CYRILLIC SMALL JE;NFKC_CF=0458 +cp;1E04E;dm=04E9;na=MODIFIER LETTER CYRILLIC SMALL BARRED O;NFKC_CF=04E9 +cp;1E04F;dm=04AF;na=MODIFIER LETTER CYRILLIC SMALL STRAIGHT U;NFKC_CF=04AF +cp;1E050;dm=04CF;na=MODIFIER LETTER CYRILLIC SMALL PALOCHKA;NFKC_CF=04CF +# Subscript modifier letters +cp;1E051;dm=0430;dt=Sub;na=CYRILLIC SUBSCRIPT SMALL LETTER A;NFKC_CF=0430 +cp;1E052;dm=0431;dt=Sub;na=CYRILLIC SUBSCRIPT SMALL LETTER BE;NFKC_CF=0431 +cp;1E053;dm=0432;dt=Sub;na=CYRILLIC SUBSCRIPT SMALL LETTER VE;NFKC_CF=0432 +cp;1E054;dm=0433;dt=Sub;na=CYRILLIC SUBSCRIPT SMALL LETTER GHE;NFKC_CF=0433 +cp;1E055;dm=0434;dt=Sub;na=CYRILLIC SUBSCRIPT SMALL LETTER DE;NFKC_CF=0434 +cp;1E056;dm=0435;dt=Sub;na=CYRILLIC SUBSCRIPT SMALL LETTER IE;NFKC_CF=0435 +cp;1E057;dm=0436;dt=Sub;na=CYRILLIC SUBSCRIPT SMALL LETTER ZHE;NFKC_CF=0436 +cp;1E058;dm=0437;dt=Sub;na=CYRILLIC SUBSCRIPT SMALL LETTER ZE;NFKC_CF=0437 +cp;1E059;dm=0438;dt=Sub;na=CYRILLIC SUBSCRIPT SMALL LETTER I;NFKC_CF=0438 +cp;1E05A;dm=043A;dt=Sub;na=CYRILLIC SUBSCRIPT SMALL LETTER KA;NFKC_CF=043A +cp;1E05B;dm=043B;dt=Sub;na=CYRILLIC SUBSCRIPT SMALL LETTER EL;NFKC_CF=043B +cp;1E05C;dm=043E;dt=Sub;na=CYRILLIC SUBSCRIPT SMALL LETTER O;NFKC_CF=043E +cp;1E05D;dm=043F;dt=Sub;na=CYRILLIC SUBSCRIPT SMALL LETTER PE;NFKC_CF=043F +cp;1E05E;dm=0441;dt=Sub;na=CYRILLIC SUBSCRIPT SMALL LETTER ES;NFKC_CF=0441 +cp;1E05F;dm=0443;dt=Sub;na=CYRILLIC SUBSCRIPT SMALL LETTER U;NFKC_CF=0443 +cp;1E060;dm=0444;dt=Sub;na=CYRILLIC SUBSCRIPT SMALL LETTER EF;NFKC_CF=0444 +cp;1E061;dm=0445;dt=Sub;na=CYRILLIC SUBSCRIPT SMALL LETTER HA;NFKC_CF=0445 +cp;1E062;dm=0446;dt=Sub;na=CYRILLIC SUBSCRIPT SMALL LETTER TSE;NFKC_CF=0446 +cp;1E063;dm=0447;dt=Sub;na=CYRILLIC SUBSCRIPT SMALL LETTER CHE;NFKC_CF=0447 +cp;1E064;dm=0448;dt=Sub;na=CYRILLIC SUBSCRIPT SMALL LETTER SHA;NFKC_CF=0448 +cp;1E065;dm=044A;dt=Sub;na=CYRILLIC SUBSCRIPT SMALL LETTER HARD SIGN;NFKC_CF=044A +cp;1E066;dm=044B;dt=Sub;na=CYRILLIC SUBSCRIPT SMALL LETTER YERU;NFKC_CF=044B +cp;1E067;dm=0491;dt=Sub;na=CYRILLIC SUBSCRIPT SMALL LETTER GHE WITH UPTURN;NFKC_CF=0491 +cp;1E068;dm=0456;dt=Sub;na=CYRILLIC SUBSCRIPT SMALL LETTER BYELORUSSIAN-UKRAINIAN I;NFKC_CF=0456 +cp;1E069;dm=0455;dt=Sub;na=CYRILLIC SUBSCRIPT SMALL LETTER DZE;NFKC_CF=0455 +cp;1E06A;dm=045F;dt=Sub;na=CYRILLIC SUBSCRIPT SMALL LETTER DZHE;NFKC_CF=045F +# Superscript modifier letters +cp;1E06B;dm=04AB;na=MODIFIER LETTER CYRILLIC SMALL ES WITH DESCENDER;NFKC_CF=04AB +cp;1E06C;dm=A651;na=MODIFIER LETTER CYRILLIC SMALL YERU WITH BACK YER;NFKC_CF=A651 +cp;1E06D;-Cased;dm=04B1;-Lower;na=MODIFIER LETTER CYRILLIC SMALL STRAIGHT U WITH STROKE;NFKC_CF=04B1;SB=LE +unassigned;1E06E..1E08E +# Diacritical mark +cp;1E08F;bc=NSM;-Cased;ccc=230;-CWKCF;-Dia;dt=None;gc=Mn;GCB=EX;-Gr_Base;Gr_Ext;-IDS;jt=T;lb=CM;-Lower;na=COMBINING CYRILLIC SMALL LETTER BYELORUSSIAN-UKRAINIAN I;NFKC_QC=Y;NFKD_QC=Y;SB=EX;WB=Extend;-XIDS + block;1E100..1E14F;age=12.0;Alpha;blk=Nyiakeng_Puachue_Hmong;gc=Lo;Gr_Base;IDC;IDS;lb=AL;SB=LE;sc=Hmnp;WB=LE;XIDC;XIDS # 1E100..1E14F Nyiakeng Puachue Hmong # Consonant onsets @@ -36328,6 +36609,55 @@ unassigned;1E2FA..1E2FE # Currency symbol cp;1E2FF;-Alpha;bc=ET;gc=Sc;-IDC;-IDS;lb=PR;na=WANCHO NGUN SIGN;SB=XX;WB=XX;-XIDC;-XIDS +block;1E4D0..1E4FF;age=15.0;Alpha;blk=Nag_Mundari;gc=Lo;Gr_Base;IDC;IDS;lb=AL;SB=LE;sc=Nagm;WB=LE;XIDC;XIDS +# 1E4D0..1E4FF Nag Mundari +# Letters +cp;1E4D0;na=NAG MUNDARI LETTER O +cp;1E4D1;na=NAG MUNDARI LETTER OP +cp;1E4D2;na=NAG MUNDARI LETTER OL +cp;1E4D3;na=NAG MUNDARI LETTER OY +cp;1E4D4;na=NAG MUNDARI LETTER ONG +cp;1E4D5;na=NAG MUNDARI LETTER A +cp;1E4D6;na=NAG MUNDARI LETTER AJ +cp;1E4D7;na=NAG MUNDARI LETTER AB +cp;1E4D8;na=NAG MUNDARI LETTER ANY +cp;1E4D9;na=NAG MUNDARI LETTER AH +cp;1E4DA;na=NAG MUNDARI LETTER I +cp;1E4DB;na=NAG MUNDARI LETTER IS +cp;1E4DC;na=NAG MUNDARI LETTER IDD +cp;1E4DD;na=NAG MUNDARI LETTER IT +cp;1E4DE;na=NAG MUNDARI LETTER IH +cp;1E4DF;na=NAG MUNDARI LETTER U +cp;1E4E0;na=NAG MUNDARI LETTER UC +cp;1E4E1;na=NAG MUNDARI LETTER UD +cp;1E4E2;na=NAG MUNDARI LETTER UK +cp;1E4E3;na=NAG MUNDARI LETTER UR +cp;1E4E4;na=NAG MUNDARI LETTER E +cp;1E4E5;na=NAG MUNDARI LETTER ENN +cp;1E4E6;na=NAG MUNDARI LETTER EG +cp;1E4E7;na=NAG MUNDARI LETTER EM +cp;1E4E8;na=NAG MUNDARI LETTER EN +cp;1E4E9;na=NAG MUNDARI LETTER ETT +cp;1E4EA;na=NAG MUNDARI LETTER ELL +# Various signs +cp;1E4EB;CI;gc=Lm;na=NAG MUNDARI SIGN OJOD +cp;1E4EC;-Alpha;bc=NSM;ccc=232;CI;gc=Mn;GCB=EX;-Gr_Base;Gr_Ext;-IDS;jt=T;na=NAG MUNDARI SIGN MUHOR;SB=EX;WB=Extend;-XIDS +cp;1E4ED;-Alpha;bc=NSM;ccc=232;CI;gc=Mn;GCB=EX;-Gr_Base;Gr_Ext;-IDS;jt=T;na=NAG MUNDARI SIGN TOYOR;SB=EX;WB=Extend;-XIDS +cp;1E4EE;-Alpha;bc=NSM;ccc=220;CI;gc=Mn;GCB=EX;-Gr_Base;Gr_Ext;-IDS;jt=T;na=NAG MUNDARI SIGN IKIR;SB=EX;WB=Extend;-XIDS +cp;1E4EF;-Alpha;bc=NSM;ccc=230;CI;gc=Mn;GCB=EX;-Gr_Base;Gr_Ext;-IDS;jt=T;na=NAG MUNDARI SIGN SUTUH;SB=EX;WB=Extend;-XIDS +# Digits +cp;1E4F0;-Alpha;gc=Nd;-IDS;lb=NU;na=NAG MUNDARI DIGIT ZERO;nt=De;nv=0;SB=NU;WB=NU;-XIDS +cp;1E4F1;-Alpha;gc=Nd;-IDS;lb=NU;na=NAG MUNDARI DIGIT ONE;nt=De;nv=1;SB=NU;WB=NU;-XIDS +cp;1E4F2;-Alpha;gc=Nd;-IDS;lb=NU;na=NAG MUNDARI DIGIT TWO;nt=De;nv=2;SB=NU;WB=NU;-XIDS +cp;1E4F3;-Alpha;gc=Nd;-IDS;lb=NU;na=NAG MUNDARI DIGIT THREE;nt=De;nv=3;SB=NU;WB=NU;-XIDS +cp;1E4F4;-Alpha;gc=Nd;-IDS;lb=NU;na=NAG MUNDARI DIGIT FOUR;nt=De;nv=4;SB=NU;WB=NU;-XIDS +cp;1E4F5;-Alpha;gc=Nd;-IDS;lb=NU;na=NAG MUNDARI DIGIT FIVE;nt=De;nv=5;SB=NU;WB=NU;-XIDS +cp;1E4F6;-Alpha;gc=Nd;-IDS;lb=NU;na=NAG MUNDARI DIGIT SIX;nt=De;nv=6;SB=NU;WB=NU;-XIDS +cp;1E4F7;-Alpha;gc=Nd;-IDS;lb=NU;na=NAG MUNDARI DIGIT SEVEN;nt=De;nv=7;SB=NU;WB=NU;-XIDS +cp;1E4F8;-Alpha;gc=Nd;-IDS;lb=NU;na=NAG MUNDARI DIGIT EIGHT;nt=De;nv=8;SB=NU;WB=NU;-XIDS +cp;1E4F9;-Alpha;gc=Nd;-IDS;lb=NU;na=NAG MUNDARI DIGIT NINE;nt=De;nv=9;SB=NU;WB=NU;-XIDS +unassigned;1E4FA..1E4FF + block;1E7E0..1E7FF;age=14.0;Alpha;blk=Ethiopic_Ext_B;gc=Lo;Gr_Base;IDC;IDS;lb=AL;SB=LE;sc=Ethi;WB=LE;XIDC;XIDS # 1E7E0..1E7FF Ethiopic Extended-B # Syllables for Gurage @@ -38732,8 +39062,9 @@ cp;1F6D4;age=10.0;ea=N;-Emoji;-EPres;na=PAGODA cp;1F6D5;age=12.0;na=HINDU TEMPLE cp;1F6D6;age=13.0;na=HUT cp;1F6D7;age=13.0;na=ELEVATOR -unassigned;1F6D8..1F6DC;ExtPict;lb=ID;vo=U +unassigned;1F6D8..1F6DB;ExtPict;lb=ID;vo=U # Miscellaneous symbols +cp;1F6DC;age=15.0;na=WIRELESS cp;1F6DD;age=14.0;na=PLAYGROUND SLIDE cp;1F6DE;age=14.0;na=WHEEL cp;1F6DF;age=14.0;na=RING BUOY @@ -38899,7 +39230,18 @@ cp;1F771;na=ALCHEMICAL SYMBOL FOR MONTH # Measures cp;1F772;na=ALCHEMICAL SYMBOL FOR HALF DRAM cp;1F773;na=ALCHEMICAL SYMBOL FOR HALF OUNCE -unassigned;1F774..1F77F;ExtPict;lb=ID;vo=U +# Other symbol +cp;1F774;age=15.0;ExtPict;lb=ID;na=LOT OF FORTUNE +# Eclipse symbols +cp;1F775;age=15.0;ExtPict;lb=ID;na=OCCULTATION +cp;1F776;age=15.0;ExtPict;lb=ID;na=LUNAR ECLIPSE +unassigned;1F777..1F77A;ExtPict;lb=ID;vo=U +# Symbols for dwarf planets +cp;1F77B;age=15.0;ExtPict;lb=ID;na=HAUMEA +cp;1F77C;age=15.0;ExtPict;lb=ID;na=MAKEMAKE +cp;1F77D;age=15.0;ExtPict;lb=ID;na=GONGGONG +cp;1F77E;age=15.0;ExtPict;lb=ID;na=QUAOAR +cp;1F77F;age=15.0;ExtPict;lb=ID;na=ORCUS block;1F780..1F7FF;age=7.0;bc=ON;blk=Geometric_Shapes_Ext;gc=So;Gr_Base;lb=AL;sc=Zyyy;vo=U # 1F780..1F7FF Geometric Shapes Extended @@ -39018,7 +39360,9 @@ cp;1F7D5;age=11.0;ExtPict;lb=ID;na=CIRCLED TRIANGLE cp;1F7D6;age=11.0;ExtPict;lb=ID;na=NEGATIVE CIRCLED TRIANGLE cp;1F7D7;age=11.0;ExtPict;lb=ID;na=CIRCLED SQUARE cp;1F7D8;age=11.0;ExtPict;lb=ID;na=NEGATIVE CIRCLED SQUARE -unassigned;1F7D9..1F7DF;ExtPict;lb=ID;vo=U +# Nine pointed star +cp;1F7D9;age=15.0;ExtPict;lb=ID;na=NINE POINTED WHITE STAR +unassigned;1F7DA..1F7DF;ExtPict;lb=ID;vo=U # Colored circles cp;1F7E0;age=12.0;ea=W;Emoji;EPres;ExtPict;lb=ID;na=LARGE ORANGE CIRCLE cp;1F7E1;age=12.0;ea=W;Emoji;EPres;ExtPict;lb=ID;na=LARGE YELLOW CIRCLE @@ -39621,7 +39965,10 @@ cp;1FA71;age=12.0;na=ONE-PIECE SWIMSUIT cp;1FA72;age=12.0;na=BRIEFS cp;1FA73;age=12.0;na=SHORTS cp;1FA74;na=THONG SANDAL -unassigned;1FA75..1FA77;ExtPict;lb=ID;vo=U +# Colored heart symbols +cp;1FA75;age=15.0;na=LIGHT BLUE HEART +cp;1FA76;age=15.0;na=GREY HEART +cp;1FA77;age=15.0;na=PINK HEART # Medical symbols cp;1FA78;age=12.0;na=DROP OF BLOOD cp;1FA79;age=12.0;na=ADHESIVE BANDAGE @@ -39637,7 +39984,10 @@ cp;1FA83;na=BOOMERANG cp;1FA84;na=MAGIC WAND cp;1FA85;na=PINATA cp;1FA86;na=NESTING DOLLS -unassigned;1FA87..1FA8F;ExtPict;lb=ID;vo=U +# Musical instruments +cp;1FA87;age=15.0;na=MARACAS +cp;1FA88;age=15.0;na=FLUTE +unassigned;1FA89..1FA8F;ExtPict;lb=ID;vo=U # Miscellaneous objects cp;1FA90;age=12.0;na=RINGED PLANET cp;1FA91;age=12.0;na=CHAIR @@ -39668,7 +40018,10 @@ cp;1FAA9;age=14.0;na=MIRROR BALL cp;1FAAA;age=14.0;na=IDENTIFICATION CARD cp;1FAAB;age=14.0;na=LOW BATTERY cp;1FAAC;age=14.0;na=HAMSA -unassigned;1FAAD..1FAAF;ExtPict;lb=ID;vo=U +cp;1FAAD;age=15.0;na=FOLDING HAND FAN +cp;1FAAE;age=15.0;na=HAIR PICK +# Religious symbol +cp;1FAAF;age=15.0;na=KHANDA # Animals and nature cp;1FAB0;na=FLY cp;1FAB1;na=WORM @@ -39681,7 +40034,11 @@ cp;1FAB7;age=14.0;na=LOTUS cp;1FAB8;age=14.0;na=CORAL cp;1FAB9;age=14.0;na=EMPTY NEST cp;1FABA;age=14.0;na=NEST WITH EGGS -unassigned;1FABB..1FABF;ExtPict;lb=ID;vo=U +cp;1FABB;age=15.0;na=HYACINTH +cp;1FABC;age=15.0;na=JELLYFISH +cp;1FABD;age=15.0;na=WING +unassigned;1FABE;ea=W;ExtPict;lb=ID;vo=U +cp;1FABF;age=15.0;na=GOOSE # Body parts cp;1FAC0;na=ANATOMICAL HEART cp;1FAC1;na=LUNGS @@ -39690,7 +40047,10 @@ cp;1FAC2;na=PEOPLE HUGGING cp;1FAC3;age=14.0;EBase;lb=EB;na=PREGNANT MAN cp;1FAC4;age=14.0;EBase;lb=EB;na=PREGNANT PERSON cp;1FAC5;age=14.0;EBase;lb=EB;na=PERSON WITH CROWN -unassigned;1FAC6..1FACF;ExtPict;lb=ID;vo=U +unassigned;1FAC6..1FACD;ExtPict;lb=ID;vo=U +# Animals and nature +cp;1FACE;age=15.0;na=MOOSE +cp;1FACF;age=15.0;na=DONKEY # Food and drink cp;1FAD0;na=BLUEBERRIES cp;1FAD1;na=BELL PEPPER @@ -39702,7 +40062,9 @@ cp;1FAD6;na=TEAPOT cp;1FAD7;age=14.0;na=POURING LIQUID cp;1FAD8;age=14.0;na=BEANS cp;1FAD9;age=14.0;na=JAR -unassigned;1FADA..1FADF;ExtPict;lb=ID;vo=U +cp;1FADA;age=15.0;na=GINGER ROOT +cp;1FADB;age=15.0;na=PEA POD +unassigned;1FADC..1FADF;ExtPict;lb=ID;vo=U # Faces cp;1FAE0;age=14.0;na=MELTING FACE cp;1FAE1;age=14.0;na=SALUTING FACE @@ -39713,7 +40075,9 @@ cp;1FAE5;age=14.0;na=DOTTED LINE FACE # Emotion cp;1FAE6;age=14.0;na=BITING LIP cp;1FAE7;age=14.0;na=BUBBLES -unassigned;1FAE8..1FAEF;ExtPict;lb=ID;vo=U +# Face +cp;1FAE8;age=15.0;na=SHAKING FACE +unassigned;1FAE9..1FAEF;ExtPict;lb=ID;vo=U # Hand symbols cp;1FAF0;age=14.0;EBase;lb=EB;na=HAND WITH INDEX FINGER AND THUMB CROSSED cp;1FAF1;age=14.0;EBase;lb=EB;na=RIGHTWARDS HAND @@ -39722,7 +40086,9 @@ cp;1FAF3;age=14.0;EBase;lb=EB;na=PALM DOWN HAND cp;1FAF4;age=14.0;EBase;lb=EB;na=PALM UP HAND cp;1FAF5;age=14.0;EBase;lb=EB;na=INDEX POINTING AT THE VIEWER cp;1FAF6;age=14.0;EBase;lb=EB;na=HEART HANDS -unassigned;1FAF7..1FAFF;ExtPict;lb=ID;vo=U +cp;1FAF7;age=15.0;EBase;lb=EB;na=LEFTWARDS PUSHING HAND +cp;1FAF8;age=15.0;EBase;lb=EB;na=RIGHTWARDS PUSHING HAND +unassigned;1FAF9..1FAFF;ExtPict;lb=ID;vo=U block;1FB00..1FBFF;age=13.0;bc=ON;blk=Symbols_For_Legacy_Computing;gc=So;Gr_Base;lb=AL;sc=Zyyy # 1FB00..1FBFF Symbols for Legacy Computing @@ -39989,11 +40355,12 @@ cp;2A6DE..2A6DF;age=14.0 unassigned;2A6E0..2A6FF;ea=W;lb=ID;vo=U block;2A700..2B73F;Alpha;blk=CJK_Ext_C;ea=W;gc=Lo;Gr_Base;IDC;Ideo;IDS;lb=ID;SB=LE;sc=Hani;UIdeo;vo=U;XIDC;XIDS -# 2A700..2B738 CJK Unified Ideographs Extension C -algnamesrange;2A700..2B738;han;CJK UNIFIED IDEOGRAPH- +# 2A700..2B739 CJK Unified Ideographs Extension C +algnamesrange;2A700..2B739;han;CJK UNIFIED IDEOGRAPH- cp;2A700..2B734;age=5.2 cp;2B735..2B738;age=14.0 -unassigned;2B739..2B73F;ea=W;lb=ID;vo=U +cp;2B739;age=15.0 +unassigned;2B73A..2B73F;ea=W;lb=ID;vo=U block;2B740..2B81F;age=6.0;Alpha;blk=CJK_Ext_D;ea=W;gc=Lo;Gr_Base;IDC;Ideo;IDS;lb=ID;SB=LE;sc=Hani;UIdeo;vo=U;XIDC;XIDS # 2B740..2B81D CJK Unified Ideographs Extension D @@ -40572,8 +40939,12 @@ block;30000..3134F;age=13.0;Alpha;blk=CJK_Ext_G;ea=W;gc=Lo;Gr_Base;IDC;Ideo;IDS; algnamesrange;30000..3134A;han;CJK UNIFIED IDEOGRAPH- unassigned;3134B..3134F;ea=W;lb=ID;vo=U +block;31350..323AF;age=15.0;Alpha;blk=CJK_Ext_H;ea=W;gc=Lo;Gr_Base;IDC;Ideo;IDS;lb=ID;SB=LE;sc=Hani;UIdeo;vo=U;XIDC;XIDS +# 31350..323AF CJK Unified Ideographs Extension H +algnamesrange;31350..323AF;han;CJK UNIFIED IDEOGRAPH- + # No block -unassigned;31350..3FF7F;ea=W;lb=ID;vo=U +unassigned;323B0..3FF7F;ea=W;lb=ID;vo=U # 3FF80..3FFFF Unassigned unassigned;3FF80..3FFFD;ea=W;lb=ID;vo=U # Noncharacters diff --git a/icu4c/source/test/cintltst/cucdapi.c b/icu4c/source/test/cintltst/cucdapi.c index 6501e585fba..e6beb1d7f1e 100644 --- a/icu4c/source/test/cintltst/cucdapi.c +++ b/icu4c/source/test/cintltst/cucdapi.c @@ -423,6 +423,8 @@ void TestUScriptCodeAPI(){ "Chorasmian", "Dives_Akuru", "Khitan_Small_Script", "Yezidi", // new in ICU 70 "Cypro_Minoan", "Old_Uyghur", "Tangsa", "Toto", "Vithkuqi", + // new in ICU 72 + "Kawi", "Nag_Mundari", }; static const char* expectedShort[] = { "Bali", "Batk", "Blis", "Brah", "Cham", "Cirt", "Cyrs", "Egyd", "Egyh", "Egyp", @@ -461,6 +463,8 @@ void TestUScriptCodeAPI(){ "Chrs", "Diak", "Kits", "Yezi", // new in ICU 70 "Cpmn", "Ougr", "Tnsa", "Toto", "Vith", + // new in ICU 72 + "Kawi", "Nagm", }; int32_t j = 0; if(UPRV_LENGTHOF(expectedLong)!=(USCRIPT_CODE_LIMIT-USCRIPT_BALINESE)) { diff --git a/icu4c/source/test/testdata/BidiTest.txt b/icu4c/source/test/testdata/BidiTest.txt index 2df6fe230e1..5e75ef42556 100644 --- a/icu4c/source/test/testdata/BidiTest.txt +++ b/icu4c/source/test/testdata/BidiTest.txt @@ -1,11 +1,11 @@ -# BidiTest-14.0.0.txt -# Date: 2021-03-08, 19:35:40 GMT -# © 2021 Unicode®, Inc. +# BidiTest-15.0.0.txt +# Date: 2022-02-02, 23:35:34 GMT +# © 2022 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. -# For terms of use, see http://www.unicode.org/terms_of_use.html +# For terms of use, see https://www.unicode.org/terms_of_use.html # # Unicode Character Database -# For documentation, see http://www.unicode.org/reports/tr44/ +# For documentation, see https://www.unicode.org/reports/tr44/ # # This file provides a conformance test for UBA (Unicode Bidi Algorithm) implementations. # It is designed to be reasonably compact, and yet provide a thorough test of all cases up to diff --git a/icu4c/source/test/testdata/GraphemeBreakTest.txt b/icu4c/source/test/testdata/GraphemeBreakTest.txt index 0e3949c32dc..91ab748f1d0 100644 --- a/icu4c/source/test/testdata/GraphemeBreakTest.txt +++ b/icu4c/source/test/testdata/GraphemeBreakTest.txt @@ -1,11 +1,11 @@ -# GraphemeBreakTest-cldr-14.0.0.txt -# Date: 2021-08-17, 04:43:19 GMT -# © 2021 Unicode®, Inc. +# GraphemeBreakTest-cldr-15.0.0.txt +# Date: 2022-05-11, 21:35:20 GMT +# © 2022 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. -# For terms of use, see http://www.unicode.org/terms_of_use.html +# For terms of use, see https://www.unicode.org/terms_of_use.html # # Unicode Character Database -# For documentation, see http://www.unicode.org/reports/tr44/ +# For documentation, see https://www.unicode.org/reports/tr44/ # # Default Grapheme_Cluster_Break Test # diff --git a/icu4c/source/test/testdata/IdnaTestV2.txt b/icu4c/source/test/testdata/IdnaTestV2.txt index 42e09043567..d8b87030b7c 100644 --- a/icu4c/source/test/testdata/IdnaTestV2.txt +++ b/icu4c/source/test/testdata/IdnaTestV2.txt @@ -1,13 +1,13 @@ # IdnaTestV2.txt -# Date: 2021-08-17, 19:34:01 GMT -# © 2021 Unicode®, Inc. +# Date: 2022-05-04, 23:03:45 GMT +# © 2022 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. -# For terms of use, see http://www.unicode.org/terms_of_use.html +# For terms of use, see https://www.unicode.org/terms_of_use.html # # Unicode IDNA Compatible Preprocessing for UTS #46 -# Version: 14.0.0 +# Version: 15.0.0 # -# For documentation and usage, see http://www.unicode.org/reports/tr46 +# For documentation and usage, see https://www.unicode.org/reports/tr46 # # Test cases for verifying UTS #46 conformance. # @@ -1516,14 +1516,14 @@ xn--0ug27500a.xn--2b7hs861pl540a; 𯻼‌.𞶞򻙤񥘇; [B2, B3, B6, C1, V6]; xn 𑑄≯。𑜤; 𑑄≯.𑜤; [P1, V5, V6]; xn--hdh5636g.xn--ci2d; ; ; # 𑑄≯.𑜤 𑑄≯。𑜤; 𑑄≯.𑜤; [P1, V5, V6]; xn--hdh5636g.xn--ci2d; ; ; # 𑑄≯.𑜤 xn--hdh5636g.xn--ci2d; 𑑄≯.𑜤; [V5, V6]; xn--hdh5636g.xn--ci2d; ; ; # 𑑄≯.𑜤 -Ⴋ≮𱲆。‍ާ𐋣; Ⴋ≮𱲆.‍ާ𐋣; [C2, P1, V6]; xn--jnd802gsm17c.xn--lrb506jqr4n; ; xn--jnd802gsm17c.xn--lrb6479j; [P1, V5, V6] # Ⴋ≮.ާ𐋣 -Ⴋ≮𱲆。‍ާ𐋣; Ⴋ≮𱲆.‍ާ𐋣; [C2, P1, V6]; xn--jnd802gsm17c.xn--lrb506jqr4n; ; xn--jnd802gsm17c.xn--lrb6479j; [P1, V5, V6] # Ⴋ≮.ާ𐋣 -ⴋ≮𱲆。‍ާ𐋣; ⴋ≮𱲆.‍ާ𐋣; [C2, P1, V6]; xn--gdhz03bxt42d.xn--lrb506jqr4n; ; xn--gdhz03bxt42d.xn--lrb6479j; [P1, V5, V6] # ⴋ≮.ާ𐋣 -ⴋ≮𱲆。‍ާ𐋣; ⴋ≮𱲆.‍ާ𐋣; [C2, P1, V6]; xn--gdhz03bxt42d.xn--lrb506jqr4n; ; xn--gdhz03bxt42d.xn--lrb6479j; [P1, V5, V6] # ⴋ≮.ާ𐋣 -xn--gdhz03bxt42d.xn--lrb6479j; ⴋ≮𱲆.ާ𐋣; [V5, V6]; xn--gdhz03bxt42d.xn--lrb6479j; ; ; # ⴋ≮.ާ𐋣 -xn--gdhz03bxt42d.xn--lrb506jqr4n; ⴋ≮𱲆.‍ާ𐋣; [C2, V6]; xn--gdhz03bxt42d.xn--lrb506jqr4n; ; ; # ⴋ≮.ާ𐋣 -xn--jnd802gsm17c.xn--lrb6479j; Ⴋ≮𱲆.ާ𐋣; [V5, V6]; xn--jnd802gsm17c.xn--lrb6479j; ; ; # Ⴋ≮.ާ𐋣 -xn--jnd802gsm17c.xn--lrb506jqr4n; Ⴋ≮𱲆.‍ާ𐋣; [C2, V6]; xn--jnd802gsm17c.xn--lrb506jqr4n; ; ; # Ⴋ≮.ާ𐋣 +Ⴋ≮𱲆。‍ާ𐋣; Ⴋ≮𱲆.‍ާ𐋣; [C2, P1, V6]; xn--jnd802gsm17c.xn--lrb506jqr4n; ; xn--jnd802gsm17c.xn--lrb6479j; [P1, V5, V6] # Ⴋ≮𱲆.ާ𐋣 +Ⴋ≮𱲆。‍ާ𐋣; Ⴋ≮𱲆.‍ާ𐋣; [C2, P1, V6]; xn--jnd802gsm17c.xn--lrb506jqr4n; ; xn--jnd802gsm17c.xn--lrb6479j; [P1, V5, V6] # Ⴋ≮𱲆.ާ𐋣 +ⴋ≮𱲆。‍ާ𐋣; ⴋ≮𱲆.‍ާ𐋣; [C2, P1, V6]; xn--gdhz03bxt42d.xn--lrb506jqr4n; ; xn--gdhz03bxt42d.xn--lrb6479j; [P1, V5, V6] # ⴋ≮𱲆.ާ𐋣 +ⴋ≮𱲆。‍ާ𐋣; ⴋ≮𱲆.‍ާ𐋣; [C2, P1, V6]; xn--gdhz03bxt42d.xn--lrb506jqr4n; ; xn--gdhz03bxt42d.xn--lrb6479j; [P1, V5, V6] # ⴋ≮𱲆.ާ𐋣 +xn--gdhz03bxt42d.xn--lrb6479j; ⴋ≮𱲆.ާ𐋣; [V5, V6]; xn--gdhz03bxt42d.xn--lrb6479j; ; ; # ⴋ≮𱲆.ާ𐋣 +xn--gdhz03bxt42d.xn--lrb506jqr4n; ⴋ≮𱲆.‍ާ𐋣; [C2, V6]; xn--gdhz03bxt42d.xn--lrb506jqr4n; ; ; # ⴋ≮𱲆.ާ𐋣 +xn--jnd802gsm17c.xn--lrb6479j; Ⴋ≮𱲆.ާ𐋣; [V5, V6]; xn--jnd802gsm17c.xn--lrb6479j; ; ; # Ⴋ≮𱲆.ާ𐋣 +xn--jnd802gsm17c.xn--lrb506jqr4n; Ⴋ≮𱲆.‍ާ𐋣; [C2, V6]; xn--jnd802gsm17c.xn--lrb506jqr4n; ; ; # Ⴋ≮𱲆.ާ𐋣 ្.򆽒≯; ; [P1, V5, V6]; xn--u4e.xn--hdhx0084f; ; ; # ្.≯ ្.򆽒≯; ្.򆽒≯; [P1, V5, V6]; xn--u4e.xn--hdhx0084f; ; ; # ្.≯ xn--u4e.xn--hdhx0084f; ្.򆽒≯; [V5, V6]; xn--u4e.xn--hdhx0084f; ; ; # ្.≯ @@ -2051,8 +2051,8 @@ xn--7-xmb182aez5a.xn--wy1ao4929b; ߢς‍7.蔑򛖢; [B2, C2, V6]; xn--7-xmb182ae ߢσ‍𝟳。蔑򛖢; ߢσ‍7.蔑򛖢; [B2, C2, P1, V6]; xn--7-zmb872aez5a.xn--wy1ao4929b; ; xn--7-zmb872a.xn--wy1ao4929b; [B2, P1, V6] # ߢσ7.蔑 𐹰.؀; ; [B1, P1, V6]; xn--oo0d.xn--ifb; ; ; # 𐹰. xn--oo0d.xn--ifb; 𐹰.؀; [B1, V6]; xn--oo0d.xn--ifb; ; ; # 𐹰. --ࢨ.𱠖; ; [B1, P1, V3, V6]; xn----mod.xn--5o9n; ; ; # -ࢨ. -xn----mod.xn--5o9n; -ࢨ.𱠖; [B1, V3, V6]; xn----mod.xn--5o9n; ; ; # -ࢨ. +-ࢨ.𱠖; ; [B1, V3]; xn----mod.xn--5o9n; ; ; # -ࢨ.𱠖 +xn----mod.xn--5o9n; -ࢨ.𱠖; [B1, V3]; xn----mod.xn--5o9n; ; ; # -ࢨ.𱠖 ≯𞱸󠇀。誆⒈; ≯𞱸.誆⒈; [B1, P1, V6]; xn--hdh7151p.xn--tsh1248a; ; ; # ≯𞱸.誆⒈ ≯𞱸󠇀。誆⒈; ≯𞱸.誆⒈; [B1, P1, V6]; xn--hdh7151p.xn--tsh1248a; ; ; # ≯𞱸.誆⒈ ≯𞱸󠇀。誆1.; ≯𞱸.誆1.; [B1, P1, V6]; xn--hdh7151p.xn--1-dy1d.; ; ; # ≯𞱸.誆1. @@ -2931,14 +2931,14 @@ xn--tshz828m.xn--3kj4524l; 𝉃⒈.ⴌ𞱓; [B1, B5, B6, V5, V6]; xn--tshz828m.x xn--1ug68oq348b.xn--3kj4524l; 𝉃‍⒈.ⴌ𞱓; [B1, B5, B6, C2, V5, V6]; xn--1ug68oq348b.xn--3kj4524l; ; ; # 𝉃⒈.ⴌ xn--tshz828m.xn--knd8464v; 𝉃⒈.Ⴌ𞱓; [B1, B5, B6, V5, V6]; xn--tshz828m.xn--knd8464v; ; ; # 𝉃⒈.Ⴌ xn--1ug68oq348b.xn--knd8464v; 𝉃‍⒈.Ⴌ𞱓; [B1, B5, B6, C2, V5, V6]; xn--1ug68oq348b.xn--knd8464v; ; ; # 𝉃⒈.Ⴌ -󠣙੍𱫘𞤸.ς񵯞􈰔; ; [B1, P1, V6]; xn--ybc0236vjvxgt5q0g.xn--3xa03737giye6b; ; xn--ybc0236vjvxgt5q0g.xn--4xa82737giye6b; # ੍𞤸.ς -󠣙੍𱫘𞤖.Σ񵯞􈰔; 󠣙੍𱫘𞤸.σ񵯞􈰔; [B1, P1, V6]; xn--ybc0236vjvxgt5q0g.xn--4xa82737giye6b; ; ; # ੍𞤸.σ -󠣙੍𱫘𞤸.σ񵯞􈰔; ; [B1, P1, V6]; xn--ybc0236vjvxgt5q0g.xn--4xa82737giye6b; ; ; # ੍𞤸.σ -󠣙੍𱫘𞤖.σ񵯞􈰔; 󠣙੍𱫘𞤸.σ񵯞􈰔; [B1, P1, V6]; xn--ybc0236vjvxgt5q0g.xn--4xa82737giye6b; ; ; # ੍𞤸.σ -xn--ybc0236vjvxgt5q0g.xn--4xa82737giye6b; 󠣙੍𱫘𞤸.σ񵯞􈰔; [B1, V6]; xn--ybc0236vjvxgt5q0g.xn--4xa82737giye6b; ; ; # ੍𞤸.σ -󠣙੍𱫘𞤖.ς񵯞􈰔; 󠣙੍𱫘𞤸.ς񵯞􈰔; [B1, P1, V6]; xn--ybc0236vjvxgt5q0g.xn--3xa03737giye6b; ; xn--ybc0236vjvxgt5q0g.xn--4xa82737giye6b; # ੍𞤸.ς -xn--ybc0236vjvxgt5q0g.xn--3xa03737giye6b; 󠣙੍𱫘𞤸.ς񵯞􈰔; [B1, V6]; xn--ybc0236vjvxgt5q0g.xn--3xa03737giye6b; ; ; # ੍𞤸.ς -󠣙੍𱫘𞤸.Σ񵯞􈰔; 󠣙੍𱫘𞤸.σ񵯞􈰔; [B1, P1, V6]; xn--ybc0236vjvxgt5q0g.xn--4xa82737giye6b; ; ; # ੍𞤸.σ +󠣙੍𱫘𞤸.ς񵯞􈰔; ; [B1, P1, V6]; xn--ybc0236vjvxgt5q0g.xn--3xa03737giye6b; ; xn--ybc0236vjvxgt5q0g.xn--4xa82737giye6b; # ੍𱫘𞤸.ς +󠣙੍𱫘𞤖.Σ񵯞􈰔; 󠣙੍𱫘𞤸.σ񵯞􈰔; [B1, P1, V6]; xn--ybc0236vjvxgt5q0g.xn--4xa82737giye6b; ; ; # ੍𱫘𞤸.σ +󠣙੍𱫘𞤸.σ񵯞􈰔; ; [B1, P1, V6]; xn--ybc0236vjvxgt5q0g.xn--4xa82737giye6b; ; ; # ੍𱫘𞤸.σ +󠣙੍𱫘𞤖.σ񵯞􈰔; 󠣙੍𱫘𞤸.σ񵯞􈰔; [B1, P1, V6]; xn--ybc0236vjvxgt5q0g.xn--4xa82737giye6b; ; ; # ੍𱫘𞤸.σ +xn--ybc0236vjvxgt5q0g.xn--4xa82737giye6b; 󠣙੍𱫘𞤸.σ񵯞􈰔; [B1, V6]; xn--ybc0236vjvxgt5q0g.xn--4xa82737giye6b; ; ; # ੍𱫘𞤸.σ +󠣙੍𱫘𞤖.ς񵯞􈰔; 󠣙੍𱫘𞤸.ς񵯞􈰔; [B1, P1, V6]; xn--ybc0236vjvxgt5q0g.xn--3xa03737giye6b; ; xn--ybc0236vjvxgt5q0g.xn--4xa82737giye6b; # ੍𱫘𞤸.ς +xn--ybc0236vjvxgt5q0g.xn--3xa03737giye6b; 󠣙੍𱫘𞤸.ς񵯞􈰔; [B1, V6]; xn--ybc0236vjvxgt5q0g.xn--3xa03737giye6b; ; ; # ੍𱫘𞤸.ς +󠣙੍𱫘𞤸.Σ񵯞􈰔; 󠣙੍𱫘𞤸.σ񵯞􈰔; [B1, P1, V6]; xn--ybc0236vjvxgt5q0g.xn--4xa82737giye6b; ; ; # ੍𱫘𞤸.σ ߓ。‌𐫀򞭱; ߓ.‌𐫀򞭱; [B1, C1, P1, V6]; xn--usb.xn--0ug9553gm3v5d; ; xn--usb.xn--pw9ci1099a; [B2, B3, P1, V6] # ߓ.𐫀 xn--usb.xn--pw9ci1099a; ߓ.𐫀򞭱; [B2, B3, V6]; xn--usb.xn--pw9ci1099a; ; ; # ߓ.𐫀 xn--usb.xn--0ug9553gm3v5d; ߓ.‌𐫀򞭱; [B1, C1, V6]; xn--usb.xn--0ug9553gm3v5d; ; ; # ߓ.𐫀 @@ -3801,12 +3801,12 @@ xn--nmw.xn--1ugx6gs128a1134j; 歷.𐹻≯󳛽‍; [B1, C2, V6]; xn--nmw.xn--1ugx ໋‍.鎁󠰑; ; [C2, P1, V5, V6]; xn--t8c059f.xn--iz4a43209d; ; xn--t8c.xn--iz4a43209d; [P1, V5, V6] # ໋.鎁 xn--t8c.xn--iz4a43209d; ໋.鎁󠰑; [V5, V6]; xn--t8c.xn--iz4a43209d; ; ; # ໋.鎁 xn--t8c059f.xn--iz4a43209d; ໋‍.鎁󠰑; [C2, V5, V6]; xn--t8c059f.xn--iz4a43209d; ; ; # ໋.鎁 -‍‌𞤀。𱘅𐶃; ‍‌𞤢.𱘅𐶃; [B1, B5, B6, C1, C2, P1, V6]; xn--0ugb45126a.xn--wh0dj799f; ; xn--9d6h.xn--wh0dj799f; [B5, B6, P1, V6] # 𞤢. -‍‌𞤀。𱘅𐶃; ‍‌𞤢.𱘅𐶃; [B1, B5, B6, C1, C2, P1, V6]; xn--0ugb45126a.xn--wh0dj799f; ; xn--9d6h.xn--wh0dj799f; [B5, B6, P1, V6] # 𞤢. -‍‌𞤢。𱘅𐶃; ‍‌𞤢.𱘅𐶃; [B1, B5, B6, C1, C2, P1, V6]; xn--0ugb45126a.xn--wh0dj799f; ; xn--9d6h.xn--wh0dj799f; [B5, B6, P1, V6] # 𞤢. -xn--9d6h.xn--wh0dj799f; 𞤢.𱘅𐶃; [B5, B6, V6]; xn--9d6h.xn--wh0dj799f; ; ; # 𞤢. -xn--0ugb45126a.xn--wh0dj799f; ‍‌𞤢.𱘅𐶃; [B1, B5, B6, C1, C2, V6]; xn--0ugb45126a.xn--wh0dj799f; ; ; # 𞤢. -‍‌𞤢。𱘅𐶃; ‍‌𞤢.𱘅𐶃; [B1, B5, B6, C1, C2, P1, V6]; xn--0ugb45126a.xn--wh0dj799f; ; xn--9d6h.xn--wh0dj799f; [B5, B6, P1, V6] # 𞤢. +‍‌𞤀。𱘅𐶃; ‍‌𞤢.𱘅𐶃; [B1, B5, B6, C1, C2, P1, V6]; xn--0ugb45126a.xn--wh0dj799f; ; xn--9d6h.xn--wh0dj799f; [B5, B6, P1, V6] # 𞤢.𱘅 +‍‌𞤀。𱘅𐶃; ‍‌𞤢.𱘅𐶃; [B1, B5, B6, C1, C2, P1, V6]; xn--0ugb45126a.xn--wh0dj799f; ; xn--9d6h.xn--wh0dj799f; [B5, B6, P1, V6] # 𞤢.𱘅 +‍‌𞤢。𱘅𐶃; ‍‌𞤢.𱘅𐶃; [B1, B5, B6, C1, C2, P1, V6]; xn--0ugb45126a.xn--wh0dj799f; ; xn--9d6h.xn--wh0dj799f; [B5, B6, P1, V6] # 𞤢.𱘅 +xn--9d6h.xn--wh0dj799f; 𞤢.𱘅𐶃; [B5, B6, V6]; xn--9d6h.xn--wh0dj799f; ; ; # 𞤢.𱘅 +xn--0ugb45126a.xn--wh0dj799f; ‍‌𞤢.𱘅𐶃; [B1, B5, B6, C1, C2, V6]; xn--0ugb45126a.xn--wh0dj799f; ; ; # 𞤢.𱘅 +‍‌𞤢。𱘅𐶃; ‍‌𞤢.𱘅𐶃; [B1, B5, B6, C1, C2, P1, V6]; xn--0ugb45126a.xn--wh0dj799f; ; xn--9d6h.xn--wh0dj799f; [B5, B6, P1, V6] # 𞤢.𱘅 ب≠𝟫-.ς⒍𐹦≠; ب≠9-.ς⒍𐹦≠; [B3, B5, B6, P1, V3, V6]; xn--9--etd0100a.xn--3xa097mzpbzz04b; ; xn--9--etd0100a.xn--4xa887mzpbzz04b; # ب≠9-.ς⒍𐹦≠ ب≠𝟫-.ς⒍𐹦≠; ب≠9-.ς⒍𐹦≠; [B3, B5, B6, P1, V3, V6]; xn--9--etd0100a.xn--3xa097mzpbzz04b; ; xn--9--etd0100a.xn--4xa887mzpbzz04b; # ب≠9-.ς⒍𐹦≠ ب≠9-.ς6.𐹦≠; ; [B1, B3, P1, V3, V6]; xn--9--etd0100a.xn--6-xmb.xn--1ch8704g; ; xn--9--etd0100a.xn--6-zmb.xn--1ch8704g; # ب≠9-.ς6.𐹦≠ @@ -5925,10 +5925,10 @@ xn--qib.xn--4xa21s; ٱ.σߜ; [B5, B6]; xn--qib.xn--4xa21s; ; ; # ٱ.σߜ xn--qib.xn--3xa41s; ٱ.ςߜ; [B5, B6]; xn--qib.xn--3xa41s; ; ; # ٱ.ςߜ ٱ.Σߜ; ٱ.σߜ; [B5, B6]; xn--qib.xn--4xa21s; ; ; # ٱ.σߜ ٱ.σߜ; ٱ.σߜ; [B5, B6]; xn--qib.xn--4xa21s; ; ; # ٱ.σߜ -񼈶؅.ࣁ‍𑑂𱼱; 񼈶؅.ࣁ‍𑑂𱼱; [B2, B3, B5, B6, C2, P1, V6]; xn--nfb17942h.xn--nzb240jv06otevq; ; xn--nfb17942h.xn--nzb6708kx3pn; [B2, B3, B5, B6, P1, V6] # .ࣁ𑑂 -񼈶؅.ࣁ‍𑑂𱼱; ; [B2, B3, B5, B6, C2, P1, V6]; xn--nfb17942h.xn--nzb240jv06otevq; ; xn--nfb17942h.xn--nzb6708kx3pn; [B2, B3, B5, B6, P1, V6] # .ࣁ𑑂 -xn--nfb17942h.xn--nzb6708kx3pn; 񼈶؅.ࣁ𑑂𱼱; [B2, B3, B5, B6, V6]; xn--nfb17942h.xn--nzb6708kx3pn; ; ; # .ࣁ𑑂 -xn--nfb17942h.xn--nzb240jv06otevq; 񼈶؅.ࣁ‍𑑂𱼱; [B2, B3, B5, B6, C2, V6]; xn--nfb17942h.xn--nzb240jv06otevq; ; ; # .ࣁ𑑂 +񼈶؅.ࣁ‍𑑂𱼱; 񼈶؅.ࣁ‍𑑂𱼱; [B2, B3, B5, B6, C2, P1, V6]; xn--nfb17942h.xn--nzb240jv06otevq; ; xn--nfb17942h.xn--nzb6708kx3pn; [B2, B3, B5, B6, P1, V6] # .ࣁ𑑂𱼱 +񼈶؅.ࣁ‍𑑂𱼱; ; [B2, B3, B5, B6, C2, P1, V6]; xn--nfb17942h.xn--nzb240jv06otevq; ; xn--nfb17942h.xn--nzb6708kx3pn; [B2, B3, B5, B6, P1, V6] # .ࣁ𑑂𱼱 +xn--nfb17942h.xn--nzb6708kx3pn; 񼈶؅.ࣁ𑑂𱼱; [B2, B3, B5, B6, V6]; xn--nfb17942h.xn--nzb6708kx3pn; ; ; # .ࣁ𑑂𱼱 +xn--nfb17942h.xn--nzb240jv06otevq; 񼈶؅.ࣁ‍𑑂𱼱; [B2, B3, B5, B6, C2, V6]; xn--nfb17942h.xn--nzb240jv06otevq; ; ; # .ࣁ𑑂𱼱 𐹾𐋩𞵜。᯲; 𐹾𐋩𞵜.᯲; [B1, P1, V5, V6]; xn--d97cn8rn44p.xn--0zf; ; ; # 𐹾𐋩.᯲ 𐹾𐋩𞵜。᯲; 𐹾𐋩𞵜.᯲; [B1, P1, V5, V6]; xn--d97cn8rn44p.xn--0zf; ; ; # 𐹾𐋩.᯲ xn--d97cn8rn44p.xn--0zf; 𐹾𐋩𞵜.᯲; [B1, V5, V6]; xn--d97cn8rn44p.xn--0zf; ; ; # 𐹾𐋩.᯲ diff --git a/icu4c/source/test/testdata/LineBreakTest.txt b/icu4c/source/test/testdata/LineBreakTest.txt index 8d1cef0f785..3122a2e21ec 100644 --- a/icu4c/source/test/testdata/LineBreakTest.txt +++ b/icu4c/source/test/testdata/LineBreakTest.txt @@ -1,11 +1,11 @@ -# LineBreakTest-14.0.0.txt -# Date: 2021-08-20, 21:08:45 GMT -# © 2021 Unicode®, Inc. +# LineBreakTest-15.0.0.txt +# Date: 2022-02-26, 00:38:39 GMT +# © 2022 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. -# For terms of use, see http://www.unicode.org/terms_of_use.html +# For terms of use, see https://www.unicode.org/terms_of_use.html # # Unicode Character Database -# For documentation, see http://www.unicode.org/reports/tr44/ +# For documentation, see https://www.unicode.org/reports/tr44/ # # Default Line_Break Test # diff --git a/icu4c/source/test/testdata/SentenceBreakTest.txt b/icu4c/source/test/testdata/SentenceBreakTest.txt index 61ea42cf1a2..be53fe95e73 100644 --- a/icu4c/source/test/testdata/SentenceBreakTest.txt +++ b/icu4c/source/test/testdata/SentenceBreakTest.txt @@ -1,11 +1,11 @@ -# SentenceBreakTest-14.0.0.txt -# Date: 2021-03-08, 06:22:40 GMT -# © 2021 Unicode®, Inc. +# SentenceBreakTest-15.0.0.txt +# Date: 2022-02-26, 00:39:00 GMT +# © 2022 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. -# For terms of use, see http://www.unicode.org/terms_of_use.html +# For terms of use, see https://www.unicode.org/terms_of_use.html # # Unicode Character Database -# For documentation, see http://www.unicode.org/reports/tr44/ +# For documentation, see https://www.unicode.org/reports/tr44/ # # Default Sentence_Break Test # diff --git a/icu4c/source/test/testdata/WordBreakTest.txt b/icu4c/source/test/testdata/WordBreakTest.txt index 1d1435bfc76..27f64bfeeed 100644 --- a/icu4c/source/test/testdata/WordBreakTest.txt +++ b/icu4c/source/test/testdata/WordBreakTest.txt @@ -1,11 +1,11 @@ -# WordBreakTest-14.0.0.txt -# Date: 2021-03-08, 06:22:40 GMT -# © 2021 Unicode®, Inc. +# WordBreakTest-15.0.0.txt +# Date: 2022-02-26, 00:39:00 GMT +# © 2022 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. -# For terms of use, see http://www.unicode.org/terms_of_use.html +# For terms of use, see https://www.unicode.org/terms_of_use.html # # Unicode Character Database -# For documentation, see http://www.unicode.org/reports/tr44/ +# For documentation, see https://www.unicode.org/reports/tr44/ # # Default Word_Break Test # diff --git a/icu4j/main/classes/core/src/com/ibm/icu/lang/UCharacter.java b/icu4j/main/classes/core/src/com/ibm/icu/lang/UCharacter.java index 2bdfcf380b3..00db9291115 100644 --- a/icu4j/main/classes/core/src/com/ibm/icu/lang/UCharacter.java +++ b/icu4j/main/classes/core/src/com/ibm/icu/lang/UCharacter.java @@ -1292,6 +1292,21 @@ public final class UCharacter implements ECharacterCategory, ECharacterDirection /** @stable ICU 70 */ public static final int ZNAMENNY_MUSICAL_NOTATION_ID = 320; /*[1CF00]*/ + /** @stable ICU 72 */ + public static final int ARABIC_EXTENDED_C_ID = 321; /*[10EC0]*/ + /** @stable ICU 72 */ + public static final int CJK_UNIFIED_IDEOGRAPHS_EXTENSION_H_ID = 322; /*[31350]*/ + /** @stable ICU 72 */ + public static final int CYRILLIC_EXTENDED_D_ID = 323; /*[1E030]*/ + /** @stable ICU 72 */ + public static final int DEVANAGARI_EXTENDED_A_ID = 324; /*[11B00]*/ + /** @stable ICU 72 */ + public static final int KAKTOVIK_NUMERALS_ID = 325; /*[1D2C0]*/ + /** @stable ICU 72 */ + public static final int KAWI_ID = 326; /*[11F00]*/ + /** @stable ICU 72 */ + public static final int NAG_MUNDARI_ID = 327; /*[1E4D0]*/ + /** * One more than the highest normal UnicodeBlock value. * The highest value is available via UCharacter.getIntPropertyMaxValue(UProperty.BLOCK). @@ -1299,7 +1314,7 @@ public final class UCharacter implements ECharacterCategory, ECharacterDirection * @deprecated ICU 58 The numeric value may change over time, see ICU ticket #12420. */ @Deprecated - public static final int COUNT = 321; + public static final int COUNT = 328; // blocks objects --------------------------------------------------- @@ -2706,6 +2721,28 @@ public final class UCharacter implements ECharacterCategory, ECharacterDirection new UnicodeBlock("ZNAMENNY_MUSICAL_NOTATION", ZNAMENNY_MUSICAL_NOTATION_ID); /*[1CF00]*/ + /** @stable ICU 72 */ + public static final UnicodeBlock ARABIC_EXTENDED_C = + new UnicodeBlock("ARABIC_EXTENDED_C", ARABIC_EXTENDED_C_ID); /*[10EC0]*/ + /** @stable ICU 72 */ + public static final UnicodeBlock CJK_UNIFIED_IDEOGRAPHS_EXTENSION_H = + new UnicodeBlock("CJK_UNIFIED_IDEOGRAPHS_EXTENSION_H", + CJK_UNIFIED_IDEOGRAPHS_EXTENSION_H_ID); /*[31350]*/ + /** @stable ICU 72 */ + public static final UnicodeBlock CYRILLIC_EXTENDED_D = + new UnicodeBlock("CYRILLIC_EXTENDED_D", CYRILLIC_EXTENDED_D_ID); /*[1E030]*/ + /** @stable ICU 72 */ + public static final UnicodeBlock DEVANAGARI_EXTENDED_A = + new UnicodeBlock("DEVANAGARI_EXTENDED_A", DEVANAGARI_EXTENDED_A_ID); /*[11B00]*/ + /** @stable ICU 72 */ + public static final UnicodeBlock KAKTOVIK_NUMERALS = + new UnicodeBlock("KAKTOVIK_NUMERALS", KAKTOVIK_NUMERALS_ID); /*[1D2C0]*/ + /** @stable ICU 72 */ + public static final UnicodeBlock KAWI = new UnicodeBlock("KAWI", KAWI_ID); /*[11F00]*/ + /** @stable ICU 72 */ + public static final UnicodeBlock NAG_MUNDARI = + new UnicodeBlock("NAG_MUNDARI", NAG_MUNDARI_ID); /*[1E4D0]*/ + /** * @stable ICU 2.4 */ diff --git a/icu4j/main/classes/core/src/com/ibm/icu/lang/UScript.java b/icu4j/main/classes/core/src/com/ibm/icu/lang/UScript.java index 23da513971f..abf37ff335e 100644 --- a/icu4j/main/classes/core/src/com/ibm/icu/lang/UScript.java +++ b/icu4j/main/classes/core/src/com/ibm/icu/lang/UScript.java @@ -1060,6 +1060,11 @@ public final class UScript { /** @stable ICU 70 */ public static final int VITHKUQI = 197; /* Vith */ + /** @stable ICU 72 */ + public static final int KAWI = 198; /* Kawi */ + /** @stable ICU 72 */ + public static final int NAG_MUNDARI = 199; /* Nagm */ + /** * One more than the highest normal UScript code. * The highest value is available via UCharacter.getIntPropertyMaxValue(UProperty.SCRIPT). @@ -1067,7 +1072,7 @@ public final class UScript { * @deprecated ICU 58 The numeric value may change over time, see ICU ticket #12420. */ @Deprecated - public static final int CODE_LIMIT = 198; + public static final int CODE_LIMIT = 200; private static int[] getCodesFromLocale(ULocale locale) { // Multi-script languages, equivalent to the LocaleScript data @@ -1547,6 +1552,8 @@ public final class UScript { 0x16ABC | EXCLUSION, // Tnsa 0x1E290 | EXCLUSION, // Toto 0x10582 | EXCLUSION | CASED, // Vith + 0x11F1B | EXCLUSION | LB_LETTERS, // Kawi + 0x1E4E6 | EXCLUSION, // Nagm // End copy-paste from parsescriptmetadata.py }; diff --git a/icu4j/main/tests/core/src/com/ibm/icu/dev/test/lang/TestUScript.java b/icu4j/main/tests/core/src/com/ibm/icu/dev/test/lang/TestUScript.java index bfb6f843f77..54e017edbb1 100644 --- a/icu4j/main/tests/core/src/com/ibm/icu/dev/test/lang/TestUScript.java +++ b/icu4j/main/tests/core/src/com/ibm/icu/dev/test/lang/TestUScript.java @@ -335,6 +335,8 @@ public class TestUScript extends TestFmwk { "Chorasmian", "Dives_Akuru", "Khitan_Small_Script", "Yezidi", // new in ICU 70 "Cypro_Minoan", "Old_Uyghur", "Tangsa", "Toto", "Vithkuqi", + // new in ICU 72 + "Kawi", "Nag_Mundari", }; String[] expectedShort = new String[]{ "Bali", "Batk", "Blis", "Brah", "Cham", "Cirt", "Cyrs", "Egyd", "Egyh", "Egyp", @@ -373,6 +375,8 @@ public class TestUScript extends TestFmwk { "Chrs", "Diak", "Kits", "Yezi", // new in ICU 70 "Cpmn", "Ougr", "Tnsa", "Toto", "Vith", + // new in ICU 72 + "Kawi", "Nagm", }; if(expectedLong.length!=(UScript.CODE_LIMIT-UScript.BALINESE)) { errln("need to add new script codes in lang.TestUScript.java!"); diff --git a/tools/unicode/c/genprops/pnames_data.h b/tools/unicode/c/genprops/pnames_data.h index f3facc382cd..1403d365529 100644 --- a/tools/unicode/c/genprops/pnames_data.h +++ b/tools/unicode/c/genprops/pnames_data.h @@ -7,7 +7,7 @@ * machine-generated by: icu/tools/unicode/py/preparseucd.py */ -#define UNICODE_VERSION { 14, 0, 0, 0 } +#define UNICODE_VERSION { 15, 0, 0, 0 } static const Value VALUES_binprop[2] = { Value(0, "N No F False"), @@ -40,7 +40,7 @@ static const Value VALUES_bc[23] = { Value(U_POP_DIRECTIONAL_ISOLATE, "PDI Pop_Directional_Isolate"), }; -static const Value VALUES_blk[321] = { +static const Value VALUES_blk[328] = { Value(UBLOCK_NO_BLOCK, "NB No_Block"), Value(UBLOCK_BASIC_LATIN, "ASCII Basic_Latin"), Value(UBLOCK_LATIN_1_SUPPLEMENT, "Latin_1_Sup Latin_1_Supplement Latin_1"), @@ -362,6 +362,13 @@ static const Value VALUES_blk[321] = { Value(UBLOCK_UNIFIED_CANADIAN_ABORIGINAL_SYLLABICS_EXTENDED_A, "UCAS_Ext_A Unified_Canadian_Aboriginal_Syllabics_Extended_A"), Value(UBLOCK_VITHKUQI, "Vithkuqi Vithkuqi"), Value(UBLOCK_ZNAMENNY_MUSICAL_NOTATION, "Znamenny_Music Znamenny_Musical_Notation"), + Value(UBLOCK_ARABIC_EXTENDED_C, "Arabic_Ext_C Arabic_Extended_C"), + Value(UBLOCK_CJK_UNIFIED_IDEOGRAPHS_EXTENSION_H, "CJK_Ext_H CJK_Unified_Ideographs_Extension_H"), + Value(UBLOCK_CYRILLIC_EXTENDED_D, "Cyrillic_Ext_D Cyrillic_Extended_D"), + Value(UBLOCK_DEVANAGARI_EXTENDED_A, "Devanagari_Ext_A Devanagari_Extended_A"), + Value(UBLOCK_KAKTOVIK_NUMERALS, "Kaktovik_Numerals Kaktovik_Numerals"), + Value(UBLOCK_KAWI, "Kawi Kawi"), + Value(UBLOCK_NAG_MUNDARI, "Nag_Mundari Nag_Mundari"), }; static const Value VALUES_ccc[58] = { @@ -657,7 +664,7 @@ static const Value VALUES_nt[4] = { Value(U_NT_NUMERIC, "Nu Numeric"), }; -static const Value VALUES_sc[198] = { +static const Value VALUES_sc[200] = { Value(USCRIPT_COMMON, "Zyyy Common"), Value(USCRIPT_INHERITED, "Zinh Inherited Qaai"), Value(USCRIPT_ARABIC, "Arab Arabic"), @@ -856,6 +863,8 @@ static const Value VALUES_sc[198] = { Value(USCRIPT_TANGSA, "Tnsa Tangsa"), Value(USCRIPT_TOTO, "Toto Toto"), Value(USCRIPT_VITHKUQI, "Vith Vithkuqi"), + Value(USCRIPT_KAWI, "Kawi Kawi"), + Value(USCRIPT_NAG_MUNDARI, "Nagm Nag_Mundari"), }; static const Value VALUES_hst[6] = { @@ -1262,7 +1271,7 @@ static const Property PROPERTIES[114] = { Property(UCHAR_RGI_EMOJI_ZWJ_SEQUENCE, "RGI_Emoji_ZWJ_Sequence RGI_Emoji_ZWJ_Sequence"), Property(UCHAR_RGI_EMOJI, "RGI_Emoji RGI_Emoji"), Property(UCHAR_BIDI_CLASS, "bc Bidi_Class", VALUES_bc, 23), - Property(UCHAR_BLOCK, "blk Block", VALUES_blk, 321), + Property(UCHAR_BLOCK, "blk Block", VALUES_blk, 328), Property(UCHAR_CANONICAL_COMBINING_CLASS, "ccc Canonical_Combining_Class", VALUES_ccc, 58), Property(UCHAR_DECOMPOSITION_TYPE, "dt Decomposition_Type", VALUES_dt, 18), Property(UCHAR_EAST_ASIAN_WIDTH, "ea East_Asian_Width", VALUES_ea, 6), @@ -1271,7 +1280,7 @@ static const Property PROPERTIES[114] = { Property(UCHAR_JOINING_TYPE, "jt Joining_Type", VALUES_jt, 6), Property(UCHAR_LINE_BREAK, "lb Line_Break", VALUES_lb, 43), Property(UCHAR_NUMERIC_TYPE, "nt Numeric_Type", VALUES_nt, 4), - Property(UCHAR_SCRIPT, "sc Script", VALUES_sc, 198), + Property(UCHAR_SCRIPT, "sc Script", VALUES_sc, 200), Property(UCHAR_HANGUL_SYLLABLE_TYPE, "hst Hangul_Syllable_Type", VALUES_hst, 6), Property(UCHAR_NFD_QUICK_CHECK, "NFD_QC NFD_Quick_Check", VALUES_NFD_QC, 2), Property(UCHAR_NFKD_QUICK_CHECK, "NFKD_QC NFKD_Quick_Check", VALUES_NFKD_QC, 2), diff --git a/tools/unicode/py/parsescriptmetadata.py b/tools/unicode/py/parsescriptmetadata.py index 5b60b1a6109..8c93905c514 100755 --- a/tools/unicode/py/parsescriptmetadata.py +++ b/tools/unicode/py/parsescriptmetadata.py @@ -1,4 +1,4 @@ -#!/usr/bin/python -B +#!/usr/bin/python3 -B # -*- coding: utf-8 -*- # # Copyright (C) 2017 and later: Unicode, Inc. and others.