From b3a9efcd9273c00f3c3214e0a06696ac2ba20c3b Mon Sep 17 00:00:00 2001 From: "Steven R. Loomis" Date: Tue, 9 Aug 2022 14:55:02 -0500 Subject: [PATCH 1/4] fix(jsps): fix UpdateJspFiles path For: #271 --- .../src/main/java/org/unicode/tools/UpdateJspFiles.java | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/unicodetools/src/main/java/org/unicode/tools/UpdateJspFiles.java b/unicodetools/src/main/java/org/unicode/tools/UpdateJspFiles.java index 7be631ca94..fc336e37c4 100644 --- a/unicodetools/src/main/java/org/unicode/tools/UpdateJspFiles.java +++ b/unicodetools/src/main/java/org/unicode/tools/UpdateJspFiles.java @@ -140,7 +140,7 @@ private static void generateSubtagNames() throws IOException { private static void copyOtherProps(VersionInfo fromVersion) throws IOException { copyTextFiles( - UNICODE_TOOLS_DIR.resolve("org/unicode/props"), // TODO: will break with mavenize + UNICODE_TOOLS_DIR.resolve("src/main/resources/org/unicode/props"), // TODO: will break with mavenize JSP_RESOURCE_DATA.resolve("data"), "ExtraPropertyAliases.txt", "ExtraPropertyValueAliases.txt"); From 151db1a3f9d9cac3b05d0a61e6fecfde072f4d43 Mon Sep 17 00:00:00 2001 From: "Steven R. Loomis" Date: Tue, 9 Aug 2022 15:03:50 -0500 Subject: [PATCH 2/4] fix(jsps): update docs to fix jetty:run - Instead of mvn jetty:run, suggest a more verbose command line that does succeed Fixes: #165 --- docs/unicodejsps/index.md | 10 +++++++--- .../main/java/org/unicode/tools/UpdateJspFiles.java | 7 +++++-- 2 files changed, 12 insertions(+), 5 deletions(-) diff --git a/docs/unicodejsps/index.md b/docs/unicodejsps/index.md index 0422bb4504..ba4f4fcec4 100644 --- a/docs/unicodejsps/index.md +++ b/docs/unicodejsps/index.md @@ -27,17 +27,21 @@ If you already have `UnicodeJsps` in eclipse, it might be better to remove it fr ### Command Line ```shell -mvn jetty:run +mvn org.eclipse.jetty:jetty-maven-plugin:run ``` You can now connect to as suggested from the command line. Use Control-C to stop the server. +> Note: this used to be `mvn jetty:run` but a more verbose command is needed at present. + ### Running from within Eclipse -This screenshot shows creating a `jetty:run` maven run configuration. +This screenshot shows creating a `org.eclipse.jetty:jetty-maven-plugin:run` maven run configuration. + +![Running org.eclipse.jetty:jetty-maven-plugin:run from eclipse](eclipse-jetty-run.png) -![Running jetty:run from eclipse](eclipse-jetty-run.png) +> Note: Please change the Goal to `org.eclipse.jetty:jetty-maven-plugin:run` instead of `jetty:run` ### Debugging from within eclipse diff --git a/unicodetools/src/main/java/org/unicode/tools/UpdateJspFiles.java b/unicodetools/src/main/java/org/unicode/tools/UpdateJspFiles.java index fc336e37c4..69202fc161 100644 --- a/unicodetools/src/main/java/org/unicode/tools/UpdateJspFiles.java +++ b/unicodetools/src/main/java/org/unicode/tools/UpdateJspFiles.java @@ -54,7 +54,8 @@ public static void main(String args[]) throws IOException { System.out.println("Sublaunching CopyPropsToUnicodeJsp"); CopyPropsToUnicodeJsp.main(args); - System.out.println("DONE! Now go run 'mvn jetty:run' to fire up the JSP"); + System.out.println( + "DONE! Now go run 'mvn org.eclipse.jetty:jetty-maven-plugin:run' to fire up the JSP"); } private static void copyTextFiles(VersionInfo fromVersion) throws IOException { @@ -140,7 +141,9 @@ private static void generateSubtagNames() throws IOException { private static void copyOtherProps(VersionInfo fromVersion) throws IOException { copyTextFiles( - UNICODE_TOOLS_DIR.resolve("src/main/resources/org/unicode/props"), // TODO: will break with mavenize + UNICODE_TOOLS_DIR.resolve("src/main/resources/org/unicode/props"), // TODO: will + // break with + // mavenize JSP_RESOURCE_DATA.resolve("data"), "ExtraPropertyAliases.txt", "ExtraPropertyValueAliases.txt"); From adf0edbadbccf01085174e1dc6f82535c0e4b84f Mon Sep 17 00:00:00 2001 From: "Steven R. Loomis" Date: Tue, 9 Aug 2022 14:57:36 -0500 Subject: [PATCH 3/4] chore(jsps): update JSPs to U15 For: #271 --- .../org/unicode/jsp/IdentifierStatus.txt | 26 +- .../org/unicode/jsp/IdentifierType.txt | 77 +- .../org/unicode/jsp/IdnaMappingTable.txt | 174 ++- .../resources/org/unicode/jsp/NameAliases.txt | 17 +- .../resources/org/unicode/jsp/NamesList.txt | 1019 ++++++++++++++++- .../org/unicode/jsp/ScriptExtensions.txt | 10 +- .../org/unicode/jsp/StandardizedVariants.txt | 115 +- .../resources/org/unicode/jsp/confusables.txt | 16 +- .../org/unicode/jsp/data/PropertyAliases.txt | 10 +- .../unicode/jsp/data/PropertyValueAliases.txt | 24 +- .../org/unicode/jsp/emoji-sequences.txt | 36 +- .../org/unicode/jsp/emoji-zwj-sequences.txt | 13 +- .../org/unicode/jsp/props/ASCII_Hex_Digit.bin | Bin 41 -> 40 bytes .../resources/org/unicode/jsp/props/Age.bin | Bin 2783 -> 2846 bytes .../org/unicode/jsp/props/Alphabetic.bin | Bin 1164 -> 1182 bytes .../org/unicode/jsp/props/Basic_Emoji.bin | Bin 683 -> 680 bytes .../org/unicode/jsp/props/Bidi_Class.bin | Bin 1459 -> 1478 bytes .../org/unicode/jsp/props/Bidi_Control.bin | Bin 45 -> 44 bytes .../org/unicode/jsp/props/Bidi_Mirrored.bin | Bin 223 -> 223 bytes .../jsp/props/Bidi_Mirroring_Glyph.bin | Bin 1623 -> 1623 bytes .../unicode/jsp/props/Bidi_Paired_Bracket.bin | Bin 536 -> 536 bytes .../jsp/props/Bidi_Paired_Bracket_Type.bin | Bin 150 -> 147 bytes .../resources/org/unicode/jsp/props/Block.bin | Bin 3345 -> 3374 bytes .../org/unicode/jsp/props/CJK_Radical.bin | Bin 1671 -> 1687 bytes .../jsp/props/Canonical_Combining_Class.bin | Bin 2066 -> 2094 bytes .../org/unicode/jsp/props/Case_Folding.bin | Bin 5854 -> 5854 bytes .../org/unicode/jsp/props/Case_Ignorable.bin | Bin 745 -> 762 bytes .../resources/org/unicode/jsp/props/Cased.bin | Bin 318 -> 328 bytes .../jsp/props/Changes_When_Casefolded.bin | Bin 321 -> 320 bytes .../jsp/props/Changes_When_Casemapped.bin | Bin 289 -> 288 bytes .../jsp/props/Changes_When_Lowercased.bin | Bin 297 -> 296 bytes .../props/Changes_When_NFKC_Casefolded.bin | Bin 655 -> 660 bytes .../jsp/props/Changes_When_Titlecased.bin | Bin 331 -> 330 bytes .../jsp/props/Changes_When_Uppercased.bin | Bin 340 -> 339 bytes .../org/unicode/jsp/props/Confusable_MA.bin | Bin 31054 -> 30776 bytes .../resources/org/unicode/jsp/props/Dash.bin | Bin 94 -> 94 bytes .../unicode/jsp/props/Decomposition_Type.bin | Bin 1008 -> 1017 bytes .../props/Default_Ignorable_Code_Point.bin | Bin 90 -> 89 bytes .../org/unicode/jsp/props/Deprecated.bin | Bin 59 -> 59 bytes .../org/unicode/jsp/props/Diacritic.bin | Bin 432 -> 439 bytes .../unicode/jsp/props/East_Asian_Width.bin | Bin 636 -> 637 bytes .../resources/org/unicode/jsp/props/Emoji.bin | Bin 286 -> 283 bytes .../org/unicode/jsp/props/Emoji_Component.bin | Bin 67 -> 66 bytes .../org/unicode/jsp/props/Emoji_Modifier.bin | Bin 38 -> 38 bytes .../unicode/jsp/props/Emoji_Modifier_Base.bin | Bin 129 -> 128 bytes .../unicode/jsp/props/Emoji_Presentation.bin | Bin 208 -> 202 bytes .../props/Equivalent_Unified_Ideograph.bin | Bin 1452 -> 1458 bytes .../jsp/props/Extended_Pictographic.bin | Bin 212 -> 211 bytes .../org/unicode/jsp/props/Extender.bin | Bin 135 -> 134 bytes .../unicode/jsp/props/General_Category.bin | Bin 3421 -> 3462 bytes .../jsp/props/Grapheme_Cluster_Break.bin | Bin 1035 -> 1059 bytes .../jsp/props/Hangul_Syllable_Type.bin | Bin 136 -> 136 bytes .../org/unicode/jsp/props/Hex_Digit.bin | Bin 46 -> 45 bytes .../unicode/jsp/props/IDS_Binary_Operator.bin | Bin 41 -> 40 bytes .../jsp/props/IDS_Trinary_Operator.bin | Bin 38 -> 38 bytes .../org/unicode/jsp/props/ID_Continue.bin | Bin 1210 -> 1224 bytes .../org/unicode/jsp/props/ID_Start.bin | Bin 1082 -> 1102 bytes .../unicode/jsp/props/Identifier_Status.bin | Bin 600 -> 610 bytes .../org/unicode/jsp/props/Identifier_Type.bin | Bin 2667 -> 2721 bytes .../org/unicode/jsp/props/Ideographic.bin | Bin 106 -> 108 bytes .../org/unicode/jsp/props/Idn_2008.bin | Bin 731 -> 738 bytes .../org/unicode/jsp/props/Idn_Mapping.bin | Bin 18729 -> 18792 bytes .../org/unicode/jsp/props/Idn_Status.bin | Bin 1881 -> 1901 bytes .../jsp/props/Indic_Positional_Category.bin | Bin 926 -> 941 bytes .../jsp/props/Indic_Syllabic_Category.bin | Bin 1463 -> 1479 bytes .../org/unicode/jsp/props/Join_Control.bin | Bin 38 -> 38 bytes .../org/unicode/jsp/props/Joining_Group.bin | Bin 990 -> 985 bytes .../org/unicode/jsp/props/Joining_Type.bin | Bin 345 -> 345 bytes .../org/unicode/jsp/props/Line_Break.bin | Bin 3029 -> 3070 bytes .../jsp/props/Logical_Order_Exception.bin | Bin 54 -> 53 bytes .../org/unicode/jsp/props/Lowercase.bin | Bin 380 -> 391 bytes .../unicode/jsp/props/Lowercase_Mapping.bin | Bin 383 -> 383 bytes .../resources/org/unicode/jsp/props/Math.bin | Bin 269 -> 268 bytes .../org/unicode/jsp/props/NFC_Quick_Check.bin | Bin 273 -> 271 bytes .../org/unicode/jsp/props/NFD_Quick_Check.bin | Bin 367 -> 366 bytes .../org/unicode/jsp/props/NFKC_Casefold.bin | Bin 19014 -> 19072 bytes .../unicode/jsp/props/NFKC_Quick_Check.bin | Bin 556 -> 560 bytes .../unicode/jsp/props/NFKD_Quick_Check.bin | Bin 611 -> 613 bytes .../resources/org/unicode/jsp/props/Name.bin | Bin 282051 -> 284209 bytes .../org/unicode/jsp/props/Name_Alias.bin | Bin 2739 -> 2794 bytes .../org/unicode/jsp/props/Named_Sequences.bin | Bin 3401 -> 3600 bytes .../jsp/props/Named_Sequences_Prov.bin | Bin 222 -> 25 bytes .../jsp/props/Noncharacter_Code_Point.bin | Bin 46 -> 47 bytes .../org/unicode/jsp/props/Numeric_Type.bin | Bin 606 -> 611 bytes .../org/unicode/jsp/props/Numeric_Value.bin | Bin 1625 -> 1636 bytes .../org/unicode/jsp/props/Pattern_Syntax.bin | Bin 103 -> 102 bytes .../unicode/jsp/props/Pattern_White_Space.bin | Bin 47 -> 46 bytes .../props/Prepended_Concatenation_Mark.bin | Bin 54 -> 54 bytes .../org/unicode/jsp/props/Quotation_Mark.bin | Bin 69 -> 68 bytes .../jsp/props/RGI_Emoji_Flag_Sequence.bin | Bin 584 -> 584 bytes .../jsp/props/RGI_Emoji_Keycap_Sequence.bin | Bin 74 -> 74 bytes .../jsp/props/RGI_Emoji_Modifier_Sequence.bin | Bin 1279 -> 1295 bytes .../jsp/props/RGI_Emoji_Tag_Sequence.bin | Bin 58 -> 58 bytes .../jsp/props/RGI_Emoji_Zwj_Sequence.bin | Bin 3881 -> 3884 bytes .../org/unicode/jsp/props/Radical.bin | Bin 45 -> 44 bytes .../unicode/jsp/props/Regional_Indicator.bin | Bin 38 -> 38 bytes .../org/unicode/jsp/props/Script.bin | Bin 3046 -> 3156 bytes .../unicode/jsp/props/Script_Extensions.bin | Bin 3743 -> 3836 bytes .../org/unicode/jsp/props/Sentence_Break.bin | Bin 2369 -> 2410 bytes .../unicode/jsp/props/Sentence_Terminal.bin | Bin 227 -> 228 bytes .../unicode/jsp/props/Simple_Case_Folding.bin | Bin 5565 -> 5565 bytes .../jsp/props/Simple_Lowercase_Mapping.bin | Bin 5477 -> 5477 bytes .../jsp/props/Simple_Titlecase_Mapping.bin | Bin 5587 -> 5587 bytes .../jsp/props/Simple_Uppercase_Mapping.bin | Bin 5589 -> 5589 bytes .../org/unicode/jsp/props/Soft_Dotted.bin | Bin 93 -> 98 bytes .../jsp/props/Standardized_Variant.bin | Bin 9676 -> 10082 bytes .../jsp/props/Terminal_Punctuation.bin | Bin 280 -> 282 bytes .../unicode/jsp/props/Titlecase_Mapping.bin | Bin 420 -> 420 bytes .../unicode/jsp/props/Unified_Ideograph.bin | Bin 82 -> 84 bytes .../org/unicode/jsp/props/Uppercase.bin | Bin 356 -> 355 bytes .../unicode/jsp/props/Uppercase_Mapping.bin | Bin 414 -> 414 bytes .../unicode/jsp/props/Variation_Selector.bin | Bin 49 -> 48 bytes .../jsp/props/Vertical_Orientation.bin | Bin 372 -> 372 bytes .../org/unicode/jsp/props/White_Space.bin | Bin 59 -> 59 bytes .../org/unicode/jsp/props/Word_Break.bin | Bin 1889 -> 1921 bytes .../org/unicode/jsp/props/XID_Continue.bin | Bin 1218 -> 1234 bytes .../org/unicode/jsp/props/XID_Start.bin | Bin 1090 -> 1110 bytes .../unicode/jsp/props/kAccountingNumeric.bin | Bin 157 -> 157 bytes .../org/unicode/jsp/props/kOtherNumeric.bin | Bin 175 -> 175 bytes .../org/unicode/jsp/props/kPrimaryNumeric.bin | Bin 136 -> 136 bytes .../unicode/jsp/props/kSimplifiedVariant.bin | Bin 31693 -> 32882 bytes .../unicode/jsp/props/kTraditionalVariant.bin | Bin 30897 -> 32704 bytes .../resources/org/unicode/jsp/subtagNames.txt | 101 +- 123 files changed, 1457 insertions(+), 181 deletions(-) diff --git a/UnicodeJsps/src/main/resources/org/unicode/jsp/IdentifierStatus.txt b/UnicodeJsps/src/main/resources/org/unicode/jsp/IdentifierStatus.txt index 35ca61ec25..ea76f87f3b 100644 --- a/UnicodeJsps/src/main/resources/org/unicode/jsp/IdentifierStatus.txt +++ b/UnicodeJsps/src/main/resources/org/unicode/jsp/IdentifierStatus.txt @@ -1,13 +1,13 @@ # IdentifierStatus.txt -# Date: 2021-06-03, 22:26:01 GMT -# © 2021 Unicode®, Inc. +# Date: 2022-05-18, 21:51:57 GMT +# © 2022 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. -# For terms of use, see http://www.unicode.org/terms_of_use.html +# For terms of use, see https://www.unicode.org/terms_of_use.html # # Unicode Security Mechanisms for UTS #39 -# Version: 14.0.0 +# Version: 15.0.0 # -# For documentation and usage, see http://www.unicode.org/reports/tr39 +# For documentation and usage, see https://www.unicode.org/reports/tr39 # # Format # @@ -284,6 +284,7 @@ 0CE2..0CE3 ; Allowed # 5.0 [2] KANNADA VOWEL SIGN VOCALIC L..KANNADA VOWEL SIGN VOCALIC LL 0CE6..0CEF ; Allowed # 1.1 [10] KANNADA DIGIT ZERO..KANNADA DIGIT NINE 0CF1..0CF2 ; Allowed # 5.0 [2] KANNADA SIGN JIHVAMULIYA..KANNADA SIGN UPADHMANIYA +0CF3 ; Allowed # 15.0 KANNADA SIGN COMBINING ANUSVARA ABOVE RIGHT 0D00 ; Allowed # 10.0 MALAYALAM SIGN COMBINING ANUSVARA ABOVE 0D02..0D03 ; Allowed # 1.1 [2] MALAYALAM SIGN ANUSVARA..MALAYALAM SIGN VISARGA 0D05..0D0C ; Allowed # 1.1 [8] MALAYALAM LETTER A..MALAYALAM LETTER VOCALIC L @@ -345,6 +346,7 @@ 0EC0..0EC4 ; Allowed # 1.1 [5] LAO VOWEL SIGN E..LAO VOWEL SIGN AI 0EC6 ; Allowed # 1.1 LAO KO LA 0EC8..0ECD ; Allowed # 1.1 [6] LAO TONE MAI EK..LAO NIGGAHITA +0ECE ; Allowed # 15.0 LAO YAMAKKAN 0ED0..0ED9 ; Allowed # 1.1 [10] LAO DIGIT ZERO..LAO DIGIT NINE 0EDE..0EDF ; Allowed # 6.1 [2] LAO LETTER KHMU GO..LAO LETTER KHMU NYO 0F00 ; Allowed # 2.0 TIBETAN SYLLABLE OM @@ -441,7 +443,8 @@ 1780..17A2 ; Allowed # 3.0 [35] KHMER LETTER KA..KHMER LETTER QA 17A5..17A7 ; Allowed # 3.0 [3] KHMER INDEPENDENT VOWEL QI..KHMER INDEPENDENT VOWEL QU 17A9..17B3 ; Allowed # 3.0 [11] KHMER INDEPENDENT VOWEL QUU..KHMER INDEPENDENT VOWEL QAU -17B6..17CA ; Allowed # 3.0 [21] KHMER VOWEL SIGN AA..KHMER SIGN TRIISAP +17B6..17CD ; Allowed # 3.0 [24] KHMER VOWEL SIGN AA..KHMER SIGN TOANDAKHIAT +17D0 ; Allowed # 3.0 KHMER SIGN SAMYOK SANNYA 17D2 ; Allowed # 3.0 KHMER SIGN COENG 17D7 ; Allowed # 3.0 KHMER SIGN LEK TOO 17DC ; Allowed # 3.0 KHMER SIGN AVAKRAHASANYA @@ -482,7 +485,6 @@ 1FF6..1FF8 ; Allowed # 1.1 [3] GREEK SMALL LETTER OMEGA WITH PERISPOMENI..GREEK CAPITAL LETTER OMICRON WITH VARIA 1FFA ; Allowed # 1.1 GREEK CAPITAL LETTER OMEGA WITH VARIA 1FFC ; Allowed # 1.1 GREEK CAPITAL LETTER OMEGA WITH PROSGEGRAMMENI -200C..200D ; Allowed # 1.1 [2] ZERO WIDTH NON-JOINER..ZERO WIDTH JOINER 2010 ; Allowed # 1.1 HYPHEN 2019 ; Allowed # 1.1 RIGHT SINGLE QUOTATION MARK 2027 ; Allowed # 1.1 HYPHENATION POINT @@ -561,11 +563,15 @@ FA27..FA29 ; Allowed # 1.1 [3] CJK COMPATIBILITY IDEOGRAPH-FA27..CJK CO 1133C ; Allowed # 7.0 GRANTHA SIGN NUKTA 16FF0..16FF1 ; Allowed # 13.0 [2] VIETNAMESE ALTERNATE READING MARK CA..VIETNAMESE ALTERNATE READING MARK NHAY 1B11F..1B122 ; Allowed # 14.0 [4] HIRAGANA LETTER ARCHAIC WU..KATAKANA LETTER ARCHAIC WU +1B132 ; Allowed # 15.0 HIRAGANA LETTER SMALL KO 1B150..1B152 ; Allowed # 12.0 [3] HIRAGANA LETTER SMALL WI..HIRAGANA LETTER SMALL WO +1B155 ; Allowed # 15.0 KATAKANA LETTER SMALL KO 1B164..1B167 ; Allowed # 12.0 [4] KATAKANA LETTER SMALL WI..KATAKANA LETTER SMALL N 1DF00..1DF1E ; Allowed # 14.0 [31] LATIN SMALL LETTER FENG DIGRAPH WITH TRILL..LATIN SMALL LETTER S WITH CURL +1DF25..1DF2A ; Allowed # 15.0 [6] LATIN SMALL LETTER D WITH MID-HEIGHT LEFT HOOK..LATIN SMALL LETTER T WITH MID-HEIGHT LEFT HOOK +1E08F ; Allowed # 15.0 COMBINING CYRILLIC SMALL LETTER BYELORUSSIAN-UKRAINIAN I 1E7E0..1E7E6 ; Allowed # 14.0 [7] ETHIOPIC SYLLABLE HHYA..ETHIOPIC SYLLABLE HHYO -1E7E8..1E7EB ; Allowed # 14.0 [4] ETHIOPIC SYLLABLE GURAGE HHWA..ETHIOPIC SYLLABLE HWE +1E7E8..1E7EB ; Allowed # 14.0 [4] ETHIOPIC SYLLABLE GURAGE HHWA..ETHIOPIC SYLLABLE HHWE 1E7ED..1E7EE ; Allowed # 14.0 [2] ETHIOPIC SYLLABLE GURAGE MWI..ETHIOPIC SYLLABLE GURAGE MWEE 1E7F0..1E7FE ; Allowed # 14.0 [15] ETHIOPIC SYLLABLE GURAGE QWI..ETHIOPIC SYLLABLE GURAGE PWEE 20000..2A6D6 ; Allowed # 3.1 [42711] CJK UNIFIED IDEOGRAPH-20000..CJK UNIFIED IDEOGRAPH-2A6D6 @@ -573,9 +579,11 @@ FA27..FA29 ; Allowed # 1.1 [3] CJK COMPATIBILITY IDEOGRAPH-FA27..CJK CO 2A6DE..2A6DF ; Allowed # 14.0 [2] CJK UNIFIED IDEOGRAPH-2A6DE..CJK UNIFIED IDEOGRAPH-2A6DF 2A700..2B734 ; Allowed # 5.2 [4149] CJK UNIFIED IDEOGRAPH-2A700..CJK UNIFIED IDEOGRAPH-2B734 2B735..2B738 ; Allowed # 14.0 [4] CJK UNIFIED IDEOGRAPH-2B735..CJK UNIFIED IDEOGRAPH-2B738 +2B739 ; Allowed # 15.0 CJK UNIFIED IDEOGRAPH-2B739 2B740..2B81D ; Allowed # 6.0 [222] CJK UNIFIED IDEOGRAPH-2B740..CJK UNIFIED IDEOGRAPH-2B81D 2B820..2CEA1 ; Allowed # 8.0 [5762] CJK UNIFIED IDEOGRAPH-2B820..CJK UNIFIED IDEOGRAPH-2CEA1 2CEB0..2EBE0 ; Allowed # 10.0 [7473] CJK UNIFIED IDEOGRAPH-2CEB0..CJK UNIFIED IDEOGRAPH-2EBE0 30000..3134A ; Allowed # 13.0 [4939] CJK UNIFIED IDEOGRAPH-30000..CJK UNIFIED IDEOGRAPH-3134A +31350..323AF ; Allowed # 15.0 [4192] CJK UNIFIED IDEOGRAPH-31350..CJK UNIFIED IDEOGRAPH-323AF -# Total code points: 107953 +# Total code points: 112159 diff --git a/UnicodeJsps/src/main/resources/org/unicode/jsp/IdentifierType.txt b/UnicodeJsps/src/main/resources/org/unicode/jsp/IdentifierType.txt index 066bed3ef3..df8b3f04e0 100644 --- a/UnicodeJsps/src/main/resources/org/unicode/jsp/IdentifierType.txt +++ b/UnicodeJsps/src/main/resources/org/unicode/jsp/IdentifierType.txt @@ -1,13 +1,13 @@ # IdentifierType.txt -# Date: 2021-06-03, 22:26:01 GMT -# © 2021 Unicode®, Inc. +# Date: 2022-05-18, 21:51:56 GMT +# © 2022 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. -# For terms of use, see http://www.unicode.org/terms_of_use.html +# For terms of use, see https://www.unicode.org/terms_of_use.html # # Unicode Security Mechanisms for UTS #39 -# Version: 14.0.0 +# Version: 15.0.0 # -# For documentation and usage, see http://www.unicode.org/reports/tr39 +# For documentation and usage, see https://www.unicode.org/reports/tr39 # # Format # @@ -281,6 +281,7 @@ 0CE2..0CE3 ; Recommended # 5.0 [2] KANNADA VOWEL SIGN VOCALIC L..KANNADA VOWEL SIGN VOCALIC LL 0CE6..0CEF ; Recommended # 1.1 [10] KANNADA DIGIT ZERO..KANNADA DIGIT NINE 0CF1..0CF2 ; Recommended # 5.0 [2] KANNADA SIGN JIHVAMULIYA..KANNADA SIGN UPADHMANIYA +0CF3 ; Recommended # 15.0 KANNADA SIGN COMBINING ANUSVARA ABOVE RIGHT 0D00 ; Recommended # 10.0 MALAYALAM SIGN COMBINING ANUSVARA ABOVE 0D02..0D03 ; Recommended # 1.1 [2] MALAYALAM SIGN ANUSVARA..MALAYALAM SIGN VISARGA 0D05..0D0C ; Recommended # 1.1 [8] MALAYALAM LETTER A..MALAYALAM LETTER VOCALIC L @@ -342,6 +343,7 @@ 0EC0..0EC4 ; Recommended # 1.1 [5] LAO VOWEL SIGN E..LAO VOWEL SIGN AI 0EC6 ; Recommended # 1.1 LAO KO LA 0EC8..0ECD ; Recommended # 1.1 [6] LAO TONE MAI EK..LAO NIGGAHITA +0ECE ; Recommended # 15.0 LAO YAMAKKAN 0ED0..0ED9 ; Recommended # 1.1 [10] LAO DIGIT ZERO..LAO DIGIT NINE 0EDE..0EDF ; Recommended # 6.1 [2] LAO LETTER KHMU GO..LAO LETTER KHMU NYO 0F00 ; Recommended # 2.0 TIBETAN SYLLABLE OM @@ -437,7 +439,8 @@ 1780..17A2 ; Recommended # 3.0 [35] KHMER LETTER KA..KHMER LETTER QA 17A5..17A7 ; Recommended # 3.0 [3] KHMER INDEPENDENT VOWEL QI..KHMER INDEPENDENT VOWEL QU 17A9..17B3 ; Recommended # 3.0 [11] KHMER INDEPENDENT VOWEL QUU..KHMER INDEPENDENT VOWEL QAU -17B6..17CA ; Recommended # 3.0 [21] KHMER VOWEL SIGN AA..KHMER SIGN TRIISAP +17B6..17CD ; Recommended # 3.0 [24] KHMER VOWEL SIGN AA..KHMER SIGN TOANDAKHIAT +17D0 ; Recommended # 3.0 KHMER SIGN SAMYOK SANNYA 17D2 ; Recommended # 3.0 KHMER SIGN COENG 17D7 ; Recommended # 3.0 KHMER SIGN LEK TOO 17DC ; Recommended # 3.0 KHMER SIGN AVAKRAHASANYA @@ -553,11 +556,15 @@ FA27..FA29 ; Recommended # 1.1 [3] CJK COMPATIBILITY ID 1133C ; Recommended # 7.0 GRANTHA SIGN NUKTA 16FF0..16FF1 ; Recommended # 13.0 [2] VIETNAMESE ALTERNATE READING MARK CA..VIETNAMESE ALTERNATE READING MARK NHAY 1B11F..1B122 ; Recommended # 14.0 [4] HIRAGANA LETTER ARCHAIC WU..KATAKANA LETTER ARCHAIC WU +1B132 ; Recommended # 15.0 HIRAGANA LETTER SMALL KO 1B150..1B152 ; Recommended # 12.0 [3] HIRAGANA LETTER SMALL WI..HIRAGANA LETTER SMALL WO +1B155 ; Recommended # 15.0 KATAKANA LETTER SMALL KO 1B164..1B167 ; Recommended # 12.0 [4] KATAKANA LETTER SMALL WI..KATAKANA LETTER SMALL N 1DF00..1DF1E ; Recommended # 14.0 [31] LATIN SMALL LETTER FENG DIGRAPH WITH TRILL..LATIN SMALL LETTER S WITH CURL +1DF25..1DF2A ; Recommended # 15.0 [6] LATIN SMALL LETTER D WITH MID-HEIGHT LEFT HOOK..LATIN SMALL LETTER T WITH MID-HEIGHT LEFT HOOK +1E08F ; Recommended # 15.0 COMBINING CYRILLIC SMALL LETTER BYELORUSSIAN-UKRAINIAN I 1E7E0..1E7E6 ; Recommended # 14.0 [7] ETHIOPIC SYLLABLE HHYA..ETHIOPIC SYLLABLE HHYO -1E7E8..1E7EB ; Recommended # 14.0 [4] ETHIOPIC SYLLABLE GURAGE HHWA..ETHIOPIC SYLLABLE HWE +1E7E8..1E7EB ; Recommended # 14.0 [4] ETHIOPIC SYLLABLE GURAGE HHWA..ETHIOPIC SYLLABLE HHWE 1E7ED..1E7EE ; Recommended # 14.0 [2] ETHIOPIC SYLLABLE GURAGE MWI..ETHIOPIC SYLLABLE GURAGE MWEE 1E7F0..1E7FE ; Recommended # 14.0 [15] ETHIOPIC SYLLABLE GURAGE QWI..ETHIOPIC SYLLABLE GURAGE PWEE 20000..2A6D6 ; Recommended # 3.1 [42711] CJK UNIFIED IDEOGRAPH-20000..CJK UNIFIED IDEOGRAPH-2A6D6 @@ -565,12 +572,14 @@ FA27..FA29 ; Recommended # 1.1 [3] CJK COMPATIBILITY ID 2A6DE..2A6DF ; Recommended # 14.0 [2] CJK UNIFIED IDEOGRAPH-2A6DE..CJK UNIFIED IDEOGRAPH-2A6DF 2A700..2B734 ; Recommended # 5.2 [4149] CJK UNIFIED IDEOGRAPH-2A700..CJK UNIFIED IDEOGRAPH-2B734 2B735..2B738 ; Recommended # 14.0 [4] CJK UNIFIED IDEOGRAPH-2B735..CJK UNIFIED IDEOGRAPH-2B738 +2B739 ; Recommended # 15.0 CJK UNIFIED IDEOGRAPH-2B739 2B740..2B81D ; Recommended # 6.0 [222] CJK UNIFIED IDEOGRAPH-2B740..CJK UNIFIED IDEOGRAPH-2B81D 2B820..2CEA1 ; Recommended # 8.0 [5762] CJK UNIFIED IDEOGRAPH-2B820..CJK UNIFIED IDEOGRAPH-2CEA1 2CEB0..2EBE0 ; Recommended # 10.0 [7473] CJK UNIFIED IDEOGRAPH-2CEB0..CJK UNIFIED IDEOGRAPH-2EBE0 30000..3134A ; Recommended # 13.0 [4939] CJK UNIFIED IDEOGRAPH-30000..CJK UNIFIED IDEOGRAPH-3134A +31350..323AF ; Recommended # 15.0 [4192] CJK UNIFIED IDEOGRAPH-31350..CJK UNIFIED IDEOGRAPH-323AF -# Total code points: 107934 +# Total code points: 112142 # Identifier_Type: Inclusion @@ -583,14 +592,13 @@ FA27..FA29 ; Recommended # 1.1 [3] CJK COMPATIBILITY ID 05F3..05F4 ; Inclusion # 1.1 [2] HEBREW PUNCTUATION GERESH..HEBREW PUNCTUATION GERSHAYIM 06FD..06FE ; Inclusion # 3.0 [2] ARABIC SIGN SINDHI AMPERSAND..ARABIC SIGN SINDHI POSTPOSITION MEN 0F0B ; Inclusion # 2.0 TIBETAN MARK INTERSYLLABIC TSHEG -200C..200D ; Inclusion # 1.1 [2] ZERO WIDTH NON-JOINER..ZERO WIDTH JOINER 2010 ; Inclusion # 1.1 HYPHEN 2019 ; Inclusion # 1.1 RIGHT SINGLE QUOTATION MARK 2027 ; Inclusion # 1.1 HYPHENATION POINT 30A0 ; Inclusion # 3.2 KATAKANA-HIRAGANA DOUBLE HYPHEN 30FB ; Inclusion # 1.1 KATAKANA MIDDLE DOT -# Total code points: 19 +# Total code points: 17 # Identifier_Type: Limited_Use @@ -852,11 +860,12 @@ A78F ; Uncommon_Use # 8.0 LATIN LETTER SINOLOG A7B2..A7B7 ; Uncommon_Use # 8.0 [6] LATIN CAPITAL LETTER J WITH CROSSED-TAIL..LATIN SMALL LETTER OMEGA AB60..AB63 ; Uncommon_Use # 8.0 [4] LATIN SMALL LETTER SAKHA YAT..LATIN SMALL LETTER UO 10780 ; Uncommon_Use # 14.0 MODIFIER LETTER SMALL CAPITAL AA +10EFD..10EFF ; Uncommon_Use # 15.0 [3] ARABIC SMALL LOW WORD SAKTA..ARABIC SMALL LOW WORD MADDA 1AFF0..1AFF3 ; Uncommon_Use # 14.0 [4] KATAKANA LETTER MINNAN TONE-2..KATAKANA LETTER MINNAN TONE-5 1AFF5..1AFFB ; Uncommon_Use # 14.0 [7] KATAKANA LETTER MINNAN TONE-7..KATAKANA LETTER MINNAN NASALIZED TONE-5 1AFFD..1AFFE ; Uncommon_Use # 14.0 [2] KATAKANA LETTER MINNAN NASALIZED TONE-7..KATAKANA LETTER MINNAN NASALIZED TONE-8 -# Total code points: 308 +# Total code points: 311 # Identifier_Type: Uncommon_Use Technical @@ -962,7 +971,7 @@ A8FC ; Uncommon_Use Obsolete Not_XID # 8.0 DEVANAGARI SIGN SIDD 0953..0954 ; Technical # 1.1 [2] DEVANAGARI GRAVE ACCENT..DEVANAGARI ACUTE ACCENT 0D81 ; Technical # 13.0 SINHALA SIGN CANDRABINDU 0F18..0F19 ; Technical # 2.0 [2] TIBETAN ASTROLOGICAL SIGN -KHYUD PA..TIBETAN ASTROLOGICAL SIGN SDONG TSHUGS -17CB..17D0 ; Technical # 3.0 [6] KHMER SIGN BANTOC..KHMER SIGN SAMYOK SANNYA +17CE..17CF ; Technical # 3.0 [2] KHMER SIGN KAKABAT..KHMER SIGN AHSDA 1ABF..1AC0 ; Technical # 13.0 [2] COMBINING LATIN SMALL LETTER W BELOW..COMBINING LATIN SMALL LETTER TURNED W BELOW 1D00..1D2B ; Technical # 4.0 [44] LATIN LETTER SMALL CAPITAL A..CYRILLIC LETTER SMALL CAPITAL EL 1D2F ; Technical # 4.0 MODIFIER LETTER CAPITAL BARRED B @@ -1015,7 +1024,7 @@ FE73 ; Technical # 3.2 ARABIC TAIL FRAGMENT 1D185..1D18B ; Technical # 3.1 [7] MUSICAL SYMBOL COMBINING DOIT..MUSICAL SYMBOL COMBINING TRIPLE TONGUE 1D1AA..1D1AD ; Technical # 3.1 [4] MUSICAL SYMBOL COMBINING DOWN BOW..MUSICAL SYMBOL COMBINING SNAP PIZZICATO -# Total code points: 504 +# Total code points: 500 # Identifier_Type: Technical Exclusion @@ -1221,6 +1230,7 @@ A930..A953 ; Exclusion # 5.1 [36] REJANG LETTER KA..RE 11200..11211 ; Exclusion # 7.0 [18] KHOJKI LETTER A..KHOJKI LETTER JJA 11213..11237 ; Exclusion # 7.0 [37] KHOJKI LETTER NYA..KHOJKI SIGN SHADDA 1123E ; Exclusion # 9.0 KHOJKI SIGN SUKUN +1123F..11241 ; Exclusion # 15.0 [3] KHOJKI LETTER QA..KHOJKI VOWEL SIGN VOCALIC R 11280..11286 ; Exclusion # 8.0 [7] MULTANI LETTER A..MULTANI LETTER GA 11288 ; Exclusion # 8.0 MULTANI LETTER GHA 1128A..1128D ; Exclusion # 8.0 [4] MULTANI LETTER CA..MULTANI LETTER JJA @@ -1298,14 +1308,20 @@ A930..A953 ; Exclusion # 5.1 [36] REJANG LETTER KA..RE 11D3F..11D47 ; Exclusion # 10.0 [9] MASARAM GONDI VOWEL SIGN AU..MASARAM GONDI RA-KARA 11D50..11D59 ; Exclusion # 10.0 [10] MASARAM GONDI DIGIT ZERO..MASARAM GONDI DIGIT NINE 11EE0..11EF6 ; Exclusion # 11.0 [23] MAKASAR LETTER KA..MAKASAR VOWEL SIGN O +11F00..11F10 ; Exclusion # 15.0 [17] KAWI SIGN CANDRABINDU..KAWI LETTER O +11F12..11F3A ; Exclusion # 15.0 [41] KAWI LETTER KA..KAWI VOWEL SIGN VOCALIC R +11F3E..11F42 ; Exclusion # 15.0 [5] KAWI VOWEL SIGN E..KAWI CONJOINER +11F50..11F59 ; Exclusion # 15.0 [10] KAWI DIGIT ZERO..KAWI DIGIT NINE 12000..1236E ; Exclusion # 5.0 [879] CUNEIFORM SIGN A..CUNEIFORM SIGN ZUM 1236F..12398 ; Exclusion # 7.0 [42] CUNEIFORM SIGN KAP ELAMITE..CUNEIFORM SIGN UM TIMES ME 12399 ; Exclusion # 8.0 CUNEIFORM SIGN U U 12400..12462 ; Exclusion # 5.0 [99] CUNEIFORM NUMERIC SIGN TWO ASH..CUNEIFORM NUMERIC SIGN OLD ASSYRIAN ONE QUARTER 12463..1246E ; Exclusion # 7.0 [12] CUNEIFORM NUMERIC SIGN ONE QUARTER GUR..CUNEIFORM NUMERIC SIGN NINE U VARIANT FORM 12480..12543 ; Exclusion # 8.0 [196] CUNEIFORM SIGN AB TIMES NUN TENU..CUNEIFORM SIGN ZU5 TIMES THREE DISH TENU -12F90..12FF2 ; Exclusion # 14.0 [99] CYPRO-MINOAN SIGN CM001..CYPRO-MINOAN SIGN CM302 +12F90..12FF0 ; Exclusion # 14.0 [97] CYPRO-MINOAN SIGN CM001..CYPRO-MINOAN SIGN CM114 13000..1342E ; Exclusion # 5.2 [1071] EGYPTIAN HIEROGLYPH A001..EGYPTIAN HIEROGLYPH AA032 +1342F ; Exclusion # 15.0 EGYPTIAN HIEROGLYPH V011D +13440..13455 ; Exclusion # 15.0 [22] EGYPTIAN HIEROGLYPH MIRROR HORIZONTALLY..EGYPTIAN HIEROGLYPH MODIFIER DAMAGED 14400..14646 ; Exclusion # 8.0 [583] ANATOLIAN HIEROGLYPH A001..ANATOLIAN HIEROGLYPH A530 16A70..16ABE ; Exclusion # 14.0 [79] TANGSA LETTER OZ..TANGSA LETTER ZA 16AC0..16AC9 ; Exclusion # 14.0 [10] TANGSA DIGIT ZERO..TANGSA DIGIT NINE @@ -1344,10 +1360,11 @@ A930..A953 ; Exclusion # 5.1 [36] REJANG LETTER KA..RE 1E023..1E024 ; Exclusion # 9.0 [2] COMBINING GLAGOLITIC LETTER YU..COMBINING GLAGOLITIC LETTER SMALL YUS 1E026..1E02A ; Exclusion # 9.0 [5] COMBINING GLAGOLITIC LETTER YO..COMBINING GLAGOLITIC LETTER FITA 1E290..1E2AE ; Exclusion # 14.0 [31] TOTO LETTER PA..TOTO SIGN RISING TONE +1E4D0..1E4F9 ; Exclusion # 15.0 [42] NAG MUNDARI LETTER O..NAG MUNDARI DIGIT NINE 1E800..1E8C4 ; Exclusion # 7.0 [197] MENDE KIKAKUI SYLLABLE M001 KI..MENDE KIKAKUI SYLLABLE M060 NYON 1E8D0..1E8D6 ; Exclusion # 7.0 [7] MENDE KIKAKUI COMBINING NUMBER TEENS..MENDE KIKAKUI COMBINING NUMBER MILLIONS -# Total code points: 15932 +# Total code points: 16071 # Identifier_Type: Exclusion Not_XID @@ -1428,9 +1445,12 @@ A95F ; Exclusion Not_XID # 5.1 REJANG SECTION MARK 11C5A..11C6C ; Exclusion Not_XID # 9.0 [19] BHAIKSUKI NUMBER ONE..BHAIKSUKI HUNDREDS UNIT MARK 11C70..11C71 ; Exclusion Not_XID # 9.0 [2] MARCHEN HEAD MARK..MARCHEN MARK SHAD 11EF7..11EF8 ; Exclusion Not_XID # 11.0 [2] MAKASAR PASSIMBANG..MAKASAR END OF SECTION +11F43..11F4F ; Exclusion Not_XID # 15.0 [13] KAWI DANDA..KAWI PUNCTUATION CLOSING SPIRAL 12470..12473 ; Exclusion Not_XID # 5.0 [4] CUNEIFORM PUNCTUATION SIGN OLD ASSYRIAN WORD DIVIDER..CUNEIFORM PUNCTUATION SIGN DIAGONAL TRICOLON 12474 ; Exclusion Not_XID # 7.0 CUNEIFORM PUNCTUATION SIGN DIAGONAL QUADCOLON +12FF1..12FF2 ; Exclusion Not_XID # 14.0 [2] CYPRO-MINOAN SIGN CM301..CYPRO-MINOAN SIGN CM302 13430..13438 ; Exclusion Not_XID # 12.0 [9] EGYPTIAN HIEROGLYPH VERTICAL JOINER..EGYPTIAN HIEROGLYPH END SEGMENT +13439..1343F ; Exclusion Not_XID # 15.0 [7] EGYPTIAN HIEROGLYPH INSERT AT MIDDLE..EGYPTIAN HIEROGLYPH END WALLED ENCLOSURE 16A6E..16A6F ; Exclusion Not_XID # 7.0 [2] MRO DANDA..MRO DOUBLE DANDA 16AF5 ; Exclusion Not_XID # 7.0 BASSA VAH FULL STOP 16B37..16B3F ; Exclusion Not_XID # 7.0 [9] PAHAWH HMONG SIGN VOS THOM..PAHAWH HMONG SIGN XYEEM FAIB @@ -1446,7 +1466,7 @@ A95F ; Exclusion Not_XID # 5.1 REJANG SECTION MARK 1DA85..1DA8B ; Exclusion Not_XID # 8.0 [7] SIGNWRITING LOCATION TORSO..SIGNWRITING PARENTHESIS 1E8C7..1E8CF ; Exclusion Not_XID # 7.0 [9] MENDE KIKAKUI DIGIT ONE..MENDE KIKAKUI DIGIT NINE -# Total code points: 1103 +# Total code points: 1125 # Identifier_Type: Obsolete @@ -1901,9 +1921,11 @@ FFFD ; Not_XID # 1.1 REPLACEMENT CHARACTE 101A0 ; Not_XID # 7.0 GREEK SYMBOL TAU RHO 10E60..10E7E ; Not_XID # 5.2 [31] RUMI DIGIT ONE..RUMI FRACTION TWO THIRDS 111E1..111F4 ; Not_XID # 7.0 [20] SINHALA ARCHAIC DIGIT ONE..SINHALA ARCHAIC NUMBER ONE THOUSAND +11B00..11B09 ; Not_XID # 15.0 [10] DEVANAGARI HEAD MARK..DEVANAGARI SIGN MINDU 11FC0..11FF1 ; Not_XID # 12.0 [50] TAMIL FRACTION ONE THREE-HUNDRED-AND-TWENTIETH..TAMIL SIGN VAKAIYARAA 11FFF ; Not_XID # 12.0 TAMIL PUNCTUATION END OF TEXT 16FE2 ; Not_XID # 12.0 OLD CHINESE HOOK MARK +1D2C0..1D2D3 ; Not_XID # 15.0 [20] KAKTOVIK NUMERAL ZERO..KAKTOVIK NUMERAL NINETEEN 1D2E0..1D2F3 ; Not_XID # 11.0 [20] MAYAN NUMERAL ZERO..MAYAN NUMERAL NINETEEN 1D360..1D371 ; Not_XID # 5.0 [18] COUNTING ROD UNIT DIGIT ONE..COUNTING ROD TENS DIGIT NINE 1D372..1D378 ; Not_XID # 11.0 [7] IDEOGRAPHIC TALLY MARK ONE..TALLY MARK FIVE @@ -2014,6 +2036,7 @@ FFFD ; Not_XID # 1.1 REPLACEMENT CHARACTE 1F6D3..1F6D4 ; Not_XID # 10.0 [2] STUPA..PAGODA 1F6D5 ; Not_XID # 12.0 HINDU TEMPLE 1F6D6..1F6D7 ; Not_XID # 13.0 [2] HUT..ELEVATOR +1F6DC ; Not_XID # 15.0 WIRELESS 1F6DD..1F6DF ; Not_XID # 14.0 [3] PLAYGROUND SLIDE..RING BUOY 1F6E0..1F6EC ; Not_XID # 7.0 [13] HAMMER AND WRENCH..AIRPLANE ARRIVING 1F6F0..1F6F3 ; Not_XID # 7.0 [4] SATELLITE..PASSENGER SHIP @@ -2023,8 +2046,11 @@ FFFD ; Not_XID # 1.1 REPLACEMENT CHARACTE 1F6FA ; Not_XID # 12.0 AUTO RICKSHAW 1F6FB..1F6FC ; Not_XID # 13.0 [2] PICKUP TRUCK..ROLLER SKATE 1F700..1F773 ; Not_XID # 6.0 [116] ALCHEMICAL SYMBOL FOR QUINTESSENCE..ALCHEMICAL SYMBOL FOR HALF OUNCE +1F774..1F776 ; Not_XID # 15.0 [3] LOT OF FORTUNE..LUNAR ECLIPSE +1F77B..1F77F ; Not_XID # 15.0 [5] HAUMEA..ORCUS 1F780..1F7D4 ; Not_XID # 7.0 [85] BLACK LEFT-POINTING ISOSCELES RIGHT TRIANGLE..HEAVY TWELVE POINTED PINWHEEL STAR 1F7D5..1F7D8 ; Not_XID # 11.0 [4] CIRCLED TRIANGLE..NEGATIVE CIRCLED SQUARE +1F7D9 ; Not_XID # 15.0 NINE POINTED WHITE STAR 1F7E0..1F7EB ; Not_XID # 12.0 [12] LARGE ORANGE CIRCLE..LARGE BROWN SQUARE 1F7F0 ; Not_XID # 14.0 HEAVY EQUALS SIGN 1F800..1F80B ; Not_XID # 7.0 [12] LEFTWARDS ARROW WITH SMALL TRIANGLE ARROWHEAD..DOWNWARDS ARROW WITH LARGE TRIANGLE ARROWHEAD @@ -2081,25 +2107,34 @@ FFFD ; Not_XID # 1.1 REPLACEMENT CHARACTE 1FA60..1FA6D ; Not_XID # 11.0 [14] XIANGQI RED GENERAL..XIANGQI BLACK SOLDIER 1FA70..1FA73 ; Not_XID # 12.0 [4] BALLET SHOES..SHORTS 1FA74 ; Not_XID # 13.0 THONG SANDAL +1FA75..1FA77 ; Not_XID # 15.0 [3] LIGHT BLUE HEART..PINK HEART 1FA78..1FA7A ; Not_XID # 12.0 [3] DROP OF BLOOD..STETHOSCOPE 1FA7B..1FA7C ; Not_XID # 14.0 [2] X-RAY..CRUTCH 1FA80..1FA82 ; Not_XID # 12.0 [3] YO-YO..PARACHUTE 1FA83..1FA86 ; Not_XID # 13.0 [4] BOOMERANG..NESTING DOLLS +1FA87..1FA88 ; Not_XID # 15.0 [2] MARACAS..FLUTE 1FA90..1FA95 ; Not_XID # 12.0 [6] RINGED PLANET..BANJO 1FA96..1FAA8 ; Not_XID # 13.0 [19] MILITARY HELMET..ROCK 1FAA9..1FAAC ; Not_XID # 14.0 [4] MIRROR BALL..HAMSA +1FAAD..1FAAF ; Not_XID # 15.0 [3] FOLDING HAND FAN..KHANDA 1FAB0..1FAB6 ; Not_XID # 13.0 [7] FLY..FEATHER 1FAB7..1FABA ; Not_XID # 14.0 [4] LOTUS..NEST WITH EGGS +1FABB..1FABD ; Not_XID # 15.0 [3] HYACINTH..WING +1FABF ; Not_XID # 15.0 GOOSE 1FAC0..1FAC2 ; Not_XID # 13.0 [3] ANATOMICAL HEART..PEOPLE HUGGING 1FAC3..1FAC5 ; Not_XID # 14.0 [3] PREGNANT MAN..PERSON WITH CROWN +1FACE..1FACF ; Not_XID # 15.0 [2] MOOSE..DONKEY 1FAD0..1FAD6 ; Not_XID # 13.0 [7] BLUEBERRIES..TEAPOT 1FAD7..1FAD9 ; Not_XID # 14.0 [3] POURING LIQUID..JAR +1FADA..1FADB ; Not_XID # 15.0 [2] GINGER ROOT..PEA POD 1FAE0..1FAE7 ; Not_XID # 14.0 [8] MELTING FACE..BUBBLES +1FAE8 ; Not_XID # 15.0 SHAKING FACE 1FAF0..1FAF6 ; Not_XID # 14.0 [7] HAND WITH INDEX FINGER AND THUMB CROSSED..HEART HANDS +1FAF7..1FAF8 ; Not_XID # 15.0 [2] LEFTWARDS PUSHING HAND..RIGHTWARDS PUSHING HAND 1FB00..1FB92 ; Not_XID # 13.0 [147] BLOCK SEXTANT-1..UPPER HALF INVERSE MEDIUM SHADE AND LOWER HALF BLOCK 1FB94..1FBCA ; Not_XID # 13.0 [55] LEFT HALF INVERSE MEDIUM SHADE AND RIGHT HALF BLOCK..WHITE UP-POINTING CHEVRON -# Total code points: 5640 +# Total code points: 5699 # Identifier_Type: Not_NFKC @@ -2350,6 +2385,7 @@ FFE8..FFEE ; Not_NFKC # 1.1 [7] HALFWIDTH FORMS LIGH 1D6A8..1D7C9 ; Not_NFKC # 3.1 [290] MATHEMATICAL BOLD CAPITAL ALPHA..MATHEMATICAL SANS-SERIF BOLD ITALIC PI SYMBOL 1D7CA..1D7CB ; Not_NFKC # 5.0 [2] MATHEMATICAL BOLD CAPITAL DIGAMMA..MATHEMATICAL BOLD SMALL DIGAMMA 1D7CE..1D7FF ; Not_NFKC # 3.1 [50] MATHEMATICAL BOLD DIGIT ZERO..MATHEMATICAL MONOSPACE DIGIT NINE +1E030..1E06D ; Not_NFKC # 15.0 [62] MODIFIER LETTER CYRILLIC SMALL A..MODIFIER LETTER CYRILLIC SMALL STRAIGHT U WITH STROKE 1EE00..1EE03 ; Not_NFKC # 6.1 [4] ARABIC MATHEMATICAL ALEF..ARABIC MATHEMATICAL DAL 1EE05..1EE1F ; Not_NFKC # 6.1 [27] ARABIC MATHEMATICAL WAW..ARABIC MATHEMATICAL DOTLESS QAF 1EE21..1EE22 ; Not_NFKC # 6.1 [2] ARABIC MATHEMATICAL INITIAL BEH..ARABIC MATHEMATICAL INITIAL JEEM @@ -2411,7 +2447,7 @@ FFE8..FFEE ; Not_NFKC # 1.1 [7] HALFWIDTH FORMS LIGH 1FBF0..1FBF9 ; Not_NFKC # 13.0 [10] SEGMENTED DIGIT ZERO..SEGMENTED DIGIT NINE 2F800..2FA1D ; Not_NFKC # 3.1 [542] CJK COMPATIBILITY IDEOGRAPH-2F800..CJK COMPATIBILITY IDEOGRAPH-2FA1D -# Total code points: 4859 +# Total code points: 4921 # Identifier_Type: Default_Ignorable @@ -2423,8 +2459,7 @@ FFE8..FFEE ; Not_NFKC # 1.1 [7] HALFWIDTH FORMS LIGH 180B..180D ; Default_Ignorable # 3.0 [3] MONGOLIAN FREE VARIATION SELECTOR ONE..MONGOLIAN FREE VARIATION SELECTOR THREE 180E ; Default_Ignorable # 3.0 MONGOLIAN VOWEL SEPARATOR 180F ; Default_Ignorable # 14.0 MONGOLIAN FREE VARIATION SELECTOR FOUR -200B ; Default_Ignorable # 1.1 ZERO WIDTH SPACE -200E..200F ; Default_Ignorable # 1.1 [2] LEFT-TO-RIGHT MARK..RIGHT-TO-LEFT MARK +200B..200F ; Default_Ignorable # 1.1 [5] ZERO WIDTH SPACE..RIGHT-TO-LEFT MARK 202A..202E ; Default_Ignorable # 1.1 [5] LEFT-TO-RIGHT EMBEDDING..RIGHT-TO-LEFT OVERRIDE 2060..2063 ; Default_Ignorable # 3.2 [4] WORD JOINER..INVISIBLE SEPARATOR 2064 ; Default_Ignorable # 5.1 INVISIBLE PLUS @@ -2438,7 +2473,7 @@ FFA0 ; Default_Ignorable # 1.1 HALFWIDTH HANGUL FIL E0020..E007F ; Default_Ignorable # 3.1 [96] TAG SPACE..CANCEL TAG E0100..E01EF ; Default_Ignorable # 4.0 [240] VARIATION SELECTOR-17..VARIATION SELECTOR-256 -# Total code points: 396 +# Total code points: 398 # Identifier_Type: Deprecated diff --git a/UnicodeJsps/src/main/resources/org/unicode/jsp/IdnaMappingTable.txt b/UnicodeJsps/src/main/resources/org/unicode/jsp/IdnaMappingTable.txt index 183760d1f1..e1ce2b36b4 100644 --- a/UnicodeJsps/src/main/resources/org/unicode/jsp/IdnaMappingTable.txt +++ b/UnicodeJsps/src/main/resources/org/unicode/jsp/IdnaMappingTable.txt @@ -1,13 +1,13 @@ # IdnaMappingTable.txt -# Date: 2021-05-29, 15:44:58 GMT -# © 2021 Unicode®, Inc. +# Date: 2022-05-02, 19:29:26 GMT +# © 2022 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. -# For terms of use, see http://www.unicode.org/terms_of_use.html +# For terms of use, see https://www.unicode.org/terms_of_use.html # # Unicode IDNA Compatible Preprocessing for UTS #46 -# Version: 14.0.0 +# Version: 15.0.0 # -# For documentation and usage, see http://www.unicode.org/reports/tr46 +# For documentation and usage, see https://www.unicode.org/reports/tr46 # 0000..002C ; disallowed_STD3_valid # 1.1 ..COMMA 002D..002E ; valid # 1.1 HYPHEN-MINUS..FULL STOP @@ -1278,7 +1278,8 @@ 0CE6..0CEF ; valid # 1.1 KANNADA DIGIT ZERO..KANNADA DIGIT NINE 0CF0 ; disallowed # NA 0CF1..0CF2 ; valid # 5.0 KANNADA SIGN JIHVAMULIYA..KANNADA SIGN UPADHMANIYA -0CF3..0CFF ; disallowed # NA .. +0CF3 ; valid # 15.0 KANNADA SIGN COMBINING ANUSVARA ABOVE RIGHT +0CF4..0CFF ; disallowed # NA .. 0D00 ; valid # 10.0 MALAYALAM SIGN COMBINING ANUSVARA ABOVE 0D01 ; valid # 7.0 MALAYALAM SIGN CANDRABINDU 0D02..0D03 ; valid # 1.1 MALAYALAM SIGN ANUSVARA..MALAYALAM SIGN VISARGA @@ -1386,7 +1387,8 @@ 0EC6 ; valid # 1.1 LAO KO LA 0EC7 ; disallowed # NA 0EC8..0ECD ; valid # 1.1 LAO TONE MAI EK..LAO NIGGAHITA -0ECE..0ECF ; disallowed # NA .. +0ECE ; valid # 15.0 LAO YAMAKKAN +0ECF ; disallowed # NA 0ED0..0ED9 ; valid # 1.1 LAO DIGIT ZERO..LAO DIGIT NINE 0EDA..0EDB ; disallowed # NA .. 0EDC ; mapped ; 0EAB 0E99 # 1.1 LAO HO NO @@ -6206,7 +6208,8 @@ FFFE..FFFF ; disallowed # 1.1 .. 10EB0..10EB1 ; valid # 13.0 YEZIDI LETTER LAM WITH DOT ABOVE..YEZIDI LETTER YOT WITH CIRCUMFLEX ABOVE -10EB2..10EFF ; disallowed # NA .. +10EB2..10EFC ; disallowed # NA .. +10EFD..10EFF ; valid # 15.0 ARABIC SMALL LOW WORD SAKTA..ARABIC SMALL LOW WORD MADDA 10F00..10F1C ; valid # 11.0 OLD SOGDIAN LETTER ALEPH..OLD SOGDIAN LETTER FINAL TAW WITH VERTICAL TAIL 10F1D..10F26 ; valid ; ; NV8 # 11.0 OLD SOGDIAN NUMBER ONE..OLD SOGDIAN FRACTION ONE HALF 10F27 ; valid # 11.0 OLD SOGDIAN LIGATURE AYIN-DALETH @@ -6271,7 +6274,8 @@ FFFE..FFFF ; disallowed # 1.1 .. +1123F..11241 ; valid # 15.0 KHOJKI LETTER QA..KHOJKI VOWEL SIGN VOCALIC R +11242..1127F ; disallowed # NA .. 11280..11286 ; valid # 8.0 MULTANI LETTER A..MULTANI LETTER GA 11287 ; disallowed # NA 11288 ; valid # 8.0 MULTANI LETTER GHA @@ -6443,7 +6447,9 @@ FFFE..FFFF ; disallowed # 1.1 .. 11AB0..11ABF ; valid # 14.0 CANADIAN SYLLABICS NATTILIK HI..CANADIAN SYLLABICS SPA 11AC0..11AF8 ; valid # 7.0 PAU CIN HAU LETTER PA..PAU CIN HAU GLOTTAL STOP FINAL -11AF9..11BFF ; disallowed # NA .. +11AF9..11AFF ; disallowed # NA .. +11B00..11B09 ; valid ; ; NV8 # 15.0 DEVANAGARI HEAD MARK..DEVANAGARI SIGN MINDU +11B0A..11BFF ; disallowed # NA .. 11C00..11C08 ; valid # 9.0 BHAIKSUKI LETTER A..BHAIKSUKI LETTER VOCALIC L 11C09 ; disallowed # NA 11C0A..11C36 ; valid # 9.0 BHAIKSUKI LETTER E..BHAIKSUKI VOWEL SIGN VOCALIC L @@ -6489,7 +6495,15 @@ FFFE..FFFF ; disallowed # 1.1 .. 11EE0..11EF6 ; valid # 11.0 MAKASAR LETTER KA..MAKASAR VOWEL SIGN O 11EF7..11EF8 ; valid ; ; NV8 # 11.0 MAKASAR PASSIMBANG..MAKASAR END OF SECTION -11EF9..11FAF ; disallowed # NA .. +11EF9..11EFF ; disallowed # NA .. +11F00..11F10 ; valid # 15.0 KAWI SIGN CANDRABINDU..KAWI LETTER O +11F11 ; disallowed # NA +11F12..11F3A ; valid # 15.0 KAWI LETTER KA..KAWI VOWEL SIGN VOCALIC R +11F3B..11F3D ; disallowed # NA .. +11F3E..11F42 ; valid # 15.0 KAWI VOWEL SIGN E..KAWI CONJOINER +11F43..11F4F ; valid ; ; NV8 # 15.0 KAWI DANDA..KAWI PUNCTUATION CLOSING SPIRAL +11F50..11F59 ; valid # 15.0 KAWI DIGIT ZERO..KAWI DIGIT NINE +11F5A..11FAF ; disallowed # NA .. 11FB0 ; valid # 13.0 LISU LETTER YHA 11FB1..11FBF ; disallowed # NA .. 11FC0..11FF1 ; valid ; ; NV8 # 12.0 TAMIL FRACTION ONE THREE-HUNDRED-AND-TWENTIETH..TAMIL SIGN VAKAIYARAA @@ -6507,12 +6521,15 @@ FFFE..FFFF ; disallowed # 1.1 .. 12480..12543 ; valid # 8.0 CUNEIFORM SIGN AB TIMES NUN TENU..CUNEIFORM SIGN ZU5 TIMES THREE DISH TENU 12544..12F8F ; disallowed # NA .. -12F90..12FF2 ; valid # 14.0 CYPRO-MINOAN SIGN CM001..CYPRO-MINOAN SIGN CM302 +12F90..12FF0 ; valid # 14.0 CYPRO-MINOAN SIGN CM001..CYPRO-MINOAN SIGN CM114 +12FF1..12FF2 ; valid ; ; NV8 # 14.0 CYPRO-MINOAN SIGN CM301..CYPRO-MINOAN SIGN CM302 12FF3..12FFF ; disallowed # NA .. 13000..1342E ; valid # 5.2 EGYPTIAN HIEROGLYPH A001..EGYPTIAN HIEROGLYPH AA032 -1342F ; disallowed # NA +1342F ; valid # 15.0 EGYPTIAN HIEROGLYPH V011D 13430..13438 ; disallowed # 12.0 EGYPTIAN HIEROGLYPH VERTICAL JOINER..EGYPTIAN HIEROGLYPH END SEGMENT -13439..143FF ; disallowed # NA .. +13439..1343F ; disallowed # 15.0 EGYPTIAN HIEROGLYPH INSERT AT MIDDLE..EGYPTIAN HIEROGLYPH END WALLED ENCLOSURE +13440..13455 ; valid # 15.0 EGYPTIAN HIEROGLYPH MIRROR HORIZONTALLY..EGYPTIAN HIEROGLYPH MODIFIER DAMAGED +13456..143FF ; disallowed # NA .. 14400..14646 ; valid # 8.0 ANATOLIAN HIEROGLYPH A001..ANATOLIAN HIEROGLYPH A530 14647..167FF ; disallowed # NA .. 16800..16A38 ; valid # 6.0 BAMUM LETTER PHASE-A NGKUE MFON..BAMUM LETTER PHASE-F VUEQ @@ -6614,9 +6631,13 @@ FFFE..FFFF ; disallowed # 1.1 .. +1B123..1B131 ; disallowed # NA .. +1B132 ; valid # 15.0 HIRAGANA LETTER SMALL KO +1B133..1B14F ; disallowed # NA .. 1B150..1B152 ; valid # 12.0 HIRAGANA LETTER SMALL WI..HIRAGANA LETTER SMALL WO -1B153..1B163 ; disallowed # NA .. +1B153..1B154 ; disallowed # NA .. +1B155 ; valid # 15.0 KATAKANA LETTER SMALL KO +1B156..1B163 ; disallowed # NA .. 1B164..1B167 ; valid # 12.0 KATAKANA LETTER SMALL WI..KATAKANA LETTER SMALL N 1B168..1B16F ; disallowed # NA .. 1B170..1B2FB ; valid # 10.0 NUSHU CHARACTER-1B170..NUSHU CHARACTER-1B2FB @@ -6667,7 +6688,9 @@ FFFE..FFFF ; disallowed # 1.1 .. 1D200..1D245 ; valid ; ; NV8 # 4.1 GREEK VOCAL NOTATION SYMBOL-1..GREEK MUSICAL LEIMMA -1D246..1D2DF ; disallowed # NA .. +1D246..1D2BF ; disallowed # NA .. +1D2C0..1D2D3 ; valid ; ; NV8 # 15.0 KAKTOVIK NUMERAL ZERO..KAKTOVIK NUMERAL NINETEEN +1D2D4..1D2DF ; disallowed # NA .. 1D2E0..1D2F3 ; valid ; ; NV8 # 11.0 MAYAN NUMERAL ZERO..MAYAN NUMERAL NINETEEN 1D2F4..1D2FF ; disallowed # NA .. 1D300..1D356 ; valid ; ; NV8 # 4.0 MONOGRAM FOR EARTH..TETRAGRAM FOR FOSTERING @@ -7700,7 +7723,9 @@ FFFE..FFFF ; disallowed # 1.1 .. 1DF00..1DF1E ; valid # 14.0 LATIN SMALL LETTER FENG DIGRAPH WITH TRILL..LATIN SMALL LETTER S WITH CURL -1DF1F..1DFFF ; disallowed # NA .. +1DF1F..1DF24 ; disallowed # NA .. +1DF25..1DF2A ; valid # 15.0 LATIN SMALL LETTER D WITH MID-HEIGHT LEFT HOOK..LATIN SMALL LETTER T WITH MID-HEIGHT LEFT HOOK +1DF2B..1DFFF ; disallowed # NA .. 1E000..1E006 ; valid # 9.0 COMBINING GLAGOLITIC LETTER AZU..COMBINING GLAGOLITIC LETTER ZHIVETE 1E007 ; disallowed # NA 1E008..1E018 ; valid # 9.0 COMBINING GLAGOLITIC LETTER ZEMLJA..COMBINING GLAGOLITIC LETTER HERU @@ -7710,7 +7735,72 @@ FFFE..FFFF ; disallowed # 1.1 1E026..1E02A ; valid # 9.0 COMBINING GLAGOLITIC LETTER YO..COMBINING GLAGOLITIC LETTER FITA -1E02B..1E0FF ; disallowed # NA .. +1E02B..1E02F ; disallowed # NA .. +1E030 ; mapped ; 0430 # 15.0 MODIFIER LETTER CYRILLIC SMALL A +1E031 ; mapped ; 0431 # 15.0 MODIFIER LETTER CYRILLIC SMALL BE +1E032 ; mapped ; 0432 # 15.0 MODIFIER LETTER CYRILLIC SMALL VE +1E033 ; mapped ; 0433 # 15.0 MODIFIER LETTER CYRILLIC SMALL GHE +1E034 ; mapped ; 0434 # 15.0 MODIFIER LETTER CYRILLIC SMALL DE +1E035 ; mapped ; 0435 # 15.0 MODIFIER LETTER CYRILLIC SMALL IE +1E036 ; mapped ; 0436 # 15.0 MODIFIER LETTER CYRILLIC SMALL ZHE +1E037 ; mapped ; 0437 # 15.0 MODIFIER LETTER CYRILLIC SMALL ZE +1E038 ; mapped ; 0438 # 15.0 MODIFIER LETTER CYRILLIC SMALL I +1E039 ; mapped ; 043A # 15.0 MODIFIER LETTER CYRILLIC SMALL KA +1E03A ; mapped ; 043B # 15.0 MODIFIER LETTER CYRILLIC SMALL EL +1E03B ; mapped ; 043C # 15.0 MODIFIER LETTER CYRILLIC SMALL EM +1E03C ; mapped ; 043E # 15.0 MODIFIER LETTER CYRILLIC SMALL O +1E03D ; mapped ; 043F # 15.0 MODIFIER LETTER CYRILLIC SMALL PE +1E03E ; mapped ; 0440 # 15.0 MODIFIER LETTER CYRILLIC SMALL ER +1E03F ; mapped ; 0441 # 15.0 MODIFIER LETTER CYRILLIC SMALL ES +1E040 ; mapped ; 0442 # 15.0 MODIFIER LETTER CYRILLIC SMALL TE +1E041 ; mapped ; 0443 # 15.0 MODIFIER LETTER CYRILLIC SMALL U +1E042 ; mapped ; 0444 # 15.0 MODIFIER LETTER CYRILLIC SMALL EF +1E043 ; mapped ; 0445 # 15.0 MODIFIER LETTER CYRILLIC SMALL HA +1E044 ; mapped ; 0446 # 15.0 MODIFIER LETTER CYRILLIC SMALL TSE +1E045 ; mapped ; 0447 # 15.0 MODIFIER LETTER CYRILLIC SMALL CHE +1E046 ; mapped ; 0448 # 15.0 MODIFIER LETTER CYRILLIC SMALL SHA +1E047 ; mapped ; 044B # 15.0 MODIFIER LETTER CYRILLIC SMALL YERU +1E048 ; mapped ; 044D # 15.0 MODIFIER LETTER CYRILLIC SMALL E +1E049 ; mapped ; 044E # 15.0 MODIFIER LETTER CYRILLIC SMALL YU +1E04A ; mapped ; A689 # 15.0 MODIFIER LETTER CYRILLIC SMALL DZZE +1E04B ; mapped ; 04D9 # 15.0 MODIFIER LETTER CYRILLIC SMALL SCHWA +1E04C ; mapped ; 0456 # 15.0 MODIFIER LETTER CYRILLIC SMALL BYELORUSSIAN-UKRAINIAN I +1E04D ; mapped ; 0458 # 15.0 MODIFIER LETTER CYRILLIC SMALL JE +1E04E ; mapped ; 04E9 # 15.0 MODIFIER LETTER CYRILLIC SMALL BARRED O +1E04F ; mapped ; 04AF # 15.0 MODIFIER LETTER CYRILLIC SMALL STRAIGHT U +1E050 ; mapped ; 04CF # 15.0 MODIFIER LETTER CYRILLIC SMALL PALOCHKA +1E051 ; mapped ; 0430 # 15.0 CYRILLIC SUBSCRIPT SMALL LETTER A +1E052 ; mapped ; 0431 # 15.0 CYRILLIC SUBSCRIPT SMALL LETTER BE +1E053 ; mapped ; 0432 # 15.0 CYRILLIC SUBSCRIPT SMALL LETTER VE +1E054 ; mapped ; 0433 # 15.0 CYRILLIC SUBSCRIPT SMALL LETTER GHE +1E055 ; mapped ; 0434 # 15.0 CYRILLIC SUBSCRIPT SMALL LETTER DE +1E056 ; mapped ; 0435 # 15.0 CYRILLIC SUBSCRIPT SMALL LETTER IE +1E057 ; mapped ; 0436 # 15.0 CYRILLIC SUBSCRIPT SMALL LETTER ZHE +1E058 ; mapped ; 0437 # 15.0 CYRILLIC SUBSCRIPT SMALL LETTER ZE +1E059 ; mapped ; 0438 # 15.0 CYRILLIC SUBSCRIPT SMALL LETTER I +1E05A ; mapped ; 043A # 15.0 CYRILLIC SUBSCRIPT SMALL LETTER KA +1E05B ; mapped ; 043B # 15.0 CYRILLIC SUBSCRIPT SMALL LETTER EL +1E05C ; mapped ; 043E # 15.0 CYRILLIC SUBSCRIPT SMALL LETTER O +1E05D ; mapped ; 043F # 15.0 CYRILLIC SUBSCRIPT SMALL LETTER PE +1E05E ; mapped ; 0441 # 15.0 CYRILLIC SUBSCRIPT SMALL LETTER ES +1E05F ; mapped ; 0443 # 15.0 CYRILLIC SUBSCRIPT SMALL LETTER U +1E060 ; mapped ; 0444 # 15.0 CYRILLIC SUBSCRIPT SMALL LETTER EF +1E061 ; mapped ; 0445 # 15.0 CYRILLIC SUBSCRIPT SMALL LETTER HA +1E062 ; mapped ; 0446 # 15.0 CYRILLIC SUBSCRIPT SMALL LETTER TSE +1E063 ; mapped ; 0447 # 15.0 CYRILLIC SUBSCRIPT SMALL LETTER CHE +1E064 ; mapped ; 0448 # 15.0 CYRILLIC SUBSCRIPT SMALL LETTER SHA +1E065 ; mapped ; 044A # 15.0 CYRILLIC SUBSCRIPT SMALL LETTER HARD SIGN +1E066 ; mapped ; 044B # 15.0 CYRILLIC SUBSCRIPT SMALL LETTER YERU +1E067 ; mapped ; 0491 # 15.0 CYRILLIC SUBSCRIPT SMALL LETTER GHE WITH UPTURN +1E068 ; mapped ; 0456 # 15.0 CYRILLIC SUBSCRIPT SMALL LETTER BYELORUSSIAN-UKRAINIAN I +1E069 ; mapped ; 0455 # 15.0 CYRILLIC SUBSCRIPT SMALL LETTER DZE +1E06A ; mapped ; 045F # 15.0 CYRILLIC SUBSCRIPT SMALL LETTER DZHE +1E06B ; mapped ; 04AB # 15.0 MODIFIER LETTER CYRILLIC SMALL ES WITH DESCENDER +1E06C ; mapped ; A651 # 15.0 MODIFIER LETTER CYRILLIC SMALL YERU WITH BACK YER +1E06D ; mapped ; 04B1 # 15.0 MODIFIER LETTER CYRILLIC SMALL STRAIGHT U WITH STROKE +1E06E..1E08E ; disallowed # NA .. +1E08F ; valid # 15.0 COMBINING CYRILLIC SMALL LETTER BYELORUSSIAN-UKRAINIAN I +1E090..1E0FF ; disallowed # NA .. 1E100..1E12C ; valid # 12.0 NYIAKENG PUACHUE HMONG LETTER MA..NYIAKENG PUACHUE HMONG LETTER W 1E12D..1E12F ; disallowed # NA .. 1E130..1E13D ; valid # 12.0 NYIAKENG PUACHUE HMONG TONE-B..NYIAKENG PUACHUE HMONG SYLLABLE LENGTHENER @@ -7725,10 +7815,12 @@ FFFE..FFFF ; disallowed # 1.1 .. 1E2FF ; valid ; ; NV8 # 12.0 WANCHO NGUN SIGN -1E300..1E7DF ; disallowed # NA .. +1E300..1E4CF ; disallowed # NA .. +1E4D0..1E4F9 ; valid # 15.0 NAG MUNDARI LETTER O..NAG MUNDARI DIGIT NINE +1E4FA..1E7DF ; disallowed # NA .. 1E7E0..1E7E6 ; valid # 14.0 ETHIOPIC SYLLABLE HHYA..ETHIOPIC SYLLABLE HHYO 1E7E7 ; disallowed # NA -1E7E8..1E7EB ; valid # 14.0 ETHIOPIC SYLLABLE GURAGE HHWA..ETHIOPIC SYLLABLE HWE +1E7E8..1E7EB ; valid # 14.0 ETHIOPIC SYLLABLE GURAGE HHWA..ETHIOPIC SYLLABLE HHWE 1E7EC ; disallowed # NA 1E7ED..1E7EE ; valid # 14.0 ETHIOPIC SYLLABLE GURAGE MWI..ETHIOPIC SYLLABLE GURAGE MWEE 1E7EF ; disallowed # NA @@ -8212,7 +8304,8 @@ FFFE..FFFF ; disallowed # 1.1 .. +1F6D8..1F6DB ; disallowed # NA .. +1F6DC ; valid ; ; NV8 # 15.0 WIRELESS 1F6DD..1F6DF ; valid ; ; NV8 # 14.0 PLAYGROUND SLIDE..RING BUOY 1F6E0..1F6EC ; valid ; ; NV8 # 7.0 HAMMER AND WRENCH..AIRPLANE ARRIVING 1F6ED..1F6EF ; disallowed # NA .. @@ -8224,10 +8317,13 @@ FFFE..FFFF ; disallowed # 1.1 .. 1F700..1F773 ; valid ; ; NV8 # 6.0 ALCHEMICAL SYMBOL FOR QUINTESSENCE..ALCHEMICAL SYMBOL FOR HALF OUNCE -1F774..1F77F ; disallowed # NA .. +1F774..1F776 ; valid ; ; NV8 # 15.0 LOT OF FORTUNE..LUNAR ECLIPSE +1F777..1F77A ; disallowed # NA .. +1F77B..1F77F ; valid ; ; NV8 # 15.0 HAUMEA..ORCUS 1F780..1F7D4 ; valid ; ; NV8 # 7.0 BLACK LEFT-POINTING ISOSCELES RIGHT TRIANGLE..HEAVY TWELVE POINTED PINWHEEL STAR 1F7D5..1F7D8 ; valid ; ; NV8 # 11.0 CIRCLED TRIANGLE..NEGATIVE CIRCLED SQUARE -1F7D9..1F7DF ; disallowed # NA .. +1F7D9 ; valid ; ; NV8 # 15.0 NINE POINTED WHITE STAR +1F7DA..1F7DF ; disallowed # NA .. 1F7E0..1F7EB ; valid ; ; NV8 # 12.0 LARGE ORANGE CIRCLE..LARGE BROWN SQUARE 1F7EC..1F7EF ; disallowed # NA .. 1F7F0 ; valid ; ; NV8 # 14.0 HEAVY EQUALS SIGN @@ -8294,30 +8390,37 @@ FFFE..FFFF ; disallowed # 1.1 .. 1FA70..1FA73 ; valid ; ; NV8 # 12.0 BALLET SHOES..SHORTS 1FA74 ; valid ; ; NV8 # 13.0 THONG SANDAL -1FA75..1FA77 ; disallowed # NA .. +1FA75..1FA77 ; valid ; ; NV8 # 15.0 LIGHT BLUE HEART..PINK HEART 1FA78..1FA7A ; valid ; ; NV8 # 12.0 DROP OF BLOOD..STETHOSCOPE 1FA7B..1FA7C ; valid ; ; NV8 # 14.0 X-RAY..CRUTCH 1FA7D..1FA7F ; disallowed # NA .. 1FA80..1FA82 ; valid ; ; NV8 # 12.0 YO-YO..PARACHUTE 1FA83..1FA86 ; valid ; ; NV8 # 13.0 BOOMERANG..NESTING DOLLS -1FA87..1FA8F ; disallowed # NA .. +1FA87..1FA88 ; valid ; ; NV8 # 15.0 MARACAS..FLUTE +1FA89..1FA8F ; disallowed # NA .. 1FA90..1FA95 ; valid ; ; NV8 # 12.0 RINGED PLANET..BANJO 1FA96..1FAA8 ; valid ; ; NV8 # 13.0 MILITARY HELMET..ROCK 1FAA9..1FAAC ; valid ; ; NV8 # 14.0 MIRROR BALL..HAMSA -1FAAD..1FAAF ; disallowed # NA .. +1FAAD..1FAAF ; valid ; ; NV8 # 15.0 FOLDING HAND FAN..KHANDA 1FAB0..1FAB6 ; valid ; ; NV8 # 13.0 FLY..FEATHER 1FAB7..1FABA ; valid ; ; NV8 # 14.0 LOTUS..NEST WITH EGGS -1FABB..1FABF ; disallowed # NA .. +1FABB..1FABD ; valid ; ; NV8 # 15.0 HYACINTH..WING +1FABE ; disallowed # NA +1FABF ; valid ; ; NV8 # 15.0 GOOSE 1FAC0..1FAC2 ; valid ; ; NV8 # 13.0 ANATOMICAL HEART..PEOPLE HUGGING 1FAC3..1FAC5 ; valid ; ; NV8 # 14.0 PREGNANT MAN..PERSON WITH CROWN -1FAC6..1FACF ; disallowed # NA .. +1FAC6..1FACD ; disallowed # NA .. +1FACE..1FACF ; valid ; ; NV8 # 15.0 MOOSE..DONKEY 1FAD0..1FAD6 ; valid ; ; NV8 # 13.0 BLUEBERRIES..TEAPOT 1FAD7..1FAD9 ; valid ; ; NV8 # 14.0 POURING LIQUID..JAR -1FADA..1FADF ; disallowed # NA .. +1FADA..1FADB ; valid ; ; NV8 # 15.0 GINGER ROOT..PEA POD +1FADC..1FADF ; disallowed # NA .. 1FAE0..1FAE7 ; valid ; ; NV8 # 14.0 MELTING FACE..BUBBLES -1FAE8..1FAEF ; disallowed # NA .. +1FAE8 ; valid ; ; NV8 # 15.0 SHAKING FACE +1FAE9..1FAEF ; disallowed # NA .. 1FAF0..1FAF6 ; valid ; ; NV8 # 14.0 HAND WITH INDEX FINGER AND THUMB CROSSED..HEART HANDS -1FAF7..1FAFF ; disallowed # NA .. +1FAF7..1FAF8 ; valid ; ; NV8 # 15.0 LEFTWARDS PUSHING HAND..RIGHTWARDS PUSHING HAND +1FAF9..1FAFF ; disallowed # NA .. 1FB00..1FB92 ; valid ; ; NV8 # 13.0 BLOCK SEXTANT-1..UPPER HALF INVERSE MEDIUM SHADE AND LOWER HALF BLOCK 1FB93 ; disallowed # NA 1FB94..1FBCA ; valid ; ; NV8 # 13.0 LEFT HALF INVERSE MEDIUM SHADE AND RIGHT HALF BLOCK..WHITE UP-POINTING CHEVRON @@ -8340,7 +8443,8 @@ FFFE..FFFF ; disallowed # 1.1 .. 2A700..2B734 ; valid # 5.2 CJK UNIFIED IDEOGRAPH-2A700..CJK UNIFIED IDEOGRAPH-2B734 2B735..2B738 ; valid # 14.0 CJK UNIFIED IDEOGRAPH-2B735..CJK UNIFIED IDEOGRAPH-2B738 -2B739..2B73F ; disallowed # NA .. +2B739 ; valid # 15.0 CJK UNIFIED IDEOGRAPH-2B739 +2B73A..2B73F ; disallowed # NA .. 2B740..2B81D ; valid # 6.0 CJK UNIFIED IDEOGRAPH-2B740..CJK UNIFIED IDEOGRAPH-2B81D 2B81E..2B81F ; disallowed # NA .. 2B820..2CEA1 ; valid # 8.0 CJK UNIFIED IDEOGRAPH-2B820..CJK UNIFIED IDEOGRAPH-2CEA1 @@ -8882,7 +8986,9 @@ FFFE..FFFF ; disallowed # 1.1 .. 2FFFE..2FFFF ; disallowed # 2.0 .. 30000..3134A ; valid # 13.0 CJK UNIFIED IDEOGRAPH-30000..CJK UNIFIED IDEOGRAPH-3134A -3134B..3FFFD ; disallowed # NA .. +3134B..3134F ; disallowed # NA .. +31350..323AF ; valid # 15.0 CJK UNIFIED IDEOGRAPH-31350..CJK UNIFIED IDEOGRAPH-323AF +323B0..3FFFD ; disallowed # NA .. 3FFFE..3FFFF ; disallowed # 2.0 .. 40000..4FFFD ; disallowed # NA .. 4FFFE..4FFFF ; disallowed # 2.0 .. diff --git a/UnicodeJsps/src/main/resources/org/unicode/jsp/NameAliases.txt b/UnicodeJsps/src/main/resources/org/unicode/jsp/NameAliases.txt index 8519284d89..db3a863a92 100644 --- a/UnicodeJsps/src/main/resources/org/unicode/jsp/NameAliases.txt +++ b/UnicodeJsps/src/main/resources/org/unicode/jsp/NameAliases.txt @@ -1,10 +1,10 @@ -# NameAliases-14.0.0.txt -# Date: 2020-10-21, 22:28:00 GMT [KW, LI] -# © 2020 Unicode®, Inc. -# For terms of use, see http://www.unicode.org/terms_of_use.html +# NameAliases-15.0.0.txt +# Date: 2022-07-26, 20:13:00 GMT [KW] +# © 2022 Unicode®, Inc. +# For terms of use, see https://www.unicode.org/terms_of_use.html # # Unicode Character Database -# For documentation, see http://www.unicode.org/reports/tr44/ +# For documentation, see https://www.unicode.org/reports/tr44/ # # This file is a normative contributory data file in the # Unicode Character Database. @@ -40,7 +40,7 @@ # control codes (which for historical reasons have no Unicode character name) # or for format characters. # -# For documentation, see NamesList.html and http://www.unicode.org/reports/tr44/ +# For documentation, see NamesList.html and https://www.unicode.org/reports/tr44/ # # FORMAT # @@ -135,6 +135,7 @@ 0018;CAN;abbreviation 0019;END OF MEDIUM;control 0019;EOM;abbreviation +0019;EM;abbreviation 001A;SUBSTITUTE;control 001A;SUB;abbreviation 001B;ESCAPE;control @@ -163,7 +164,7 @@ # (and corresponding abbreviations) for these code # points are included here because these names leaked # out from the draft documents and were published in -# at least one RFC whose names for code points was +# at least one RFC whose names for code points were # implemented in Perl regex expressions. 0080;PADDING CHARACTER;figment @@ -254,6 +255,7 @@ 01A2;LATIN CAPITAL LETTER GHA;correction 01A3;LATIN SMALL LETTER GHA;correction 034F;CGJ;abbreviation +0616;ARABIC SMALL HIGH LIGATURE ALEF WITH YEH BARREE;correction 061C;ALM;abbreviation 0709;SYRIAC SUBLINEAR COLON SKEWED LEFT;correction 0CDE;KANNADA LETTER LLLA;correction @@ -271,6 +273,7 @@ 180D;FVS3;abbreviation 180E;MVS;abbreviation 180F;FVS4;abbreviation +1BBD;SUNDANESE LETTER ARCHAIC I;correction 200B;ZWSP;abbreviation 200C;ZWNJ;abbreviation 200D;ZWJ;abbreviation diff --git a/UnicodeJsps/src/main/resources/org/unicode/jsp/NamesList.txt b/UnicodeJsps/src/main/resources/org/unicode/jsp/NamesList.txt index 8b4d2444f0..dc619b7fb9 100644 --- a/UnicodeJsps/src/main/resources/org/unicode/jsp/NamesList.txt +++ b/UnicodeJsps/src/main/resources/org/unicode/jsp/NamesList.txt @@ -1,19 +1,30 @@ ; charset=UTF-8 -@@@ The Unicode Standard 14.0.0 -@@@+ U14M210706.lst - Unicode 14.0.0 names list, tenth delta. - Repertoire synched with UnicodeData-14.0.0d13.txt. - Removed alias for 1FA79. - Added xref for 1F7F0. - Adjusted text of subhead at 1DF00. - Corrected typos in names of 3 Ethiopian Extended-B additions. +@@@ The Unicode Standard 15.0.0 +@@@+ U15M220504.lst + Unicode 15.0.0 names list, fourth delta. + Repertoire synched with UnicodeData-15.0.0d4.txt. + Rollup of alpha review fixes. + Adjusted alias and added xref for 1F728. + Added annotations for 1F772, 1F773. + Fixed typos in annotations for 1342F and 13430. + Added cross-references to 20E6. + Added cross-references between 1FAAF and 262C. + Updated annotation for 26A5. + Added annotation for 33D7. + Added annotation for 11F52. + Added cross-references between 10EFD and 08DD. + Added cross-references for 11B00 and 11B09. + Added name alias of type correction for 1BBD. + Added annotation and cross-reference for 2E95. + Extended the range for CJK Unified Ideographs Extension C to 2B739. + Added some annotations for Old Hungarian. This file is semi-automatically derived from UnicodeData.txt and a set of manually created annotations using a script to select or suppress information from the data file. The rules used for this process are aimed at readability for the human reader, at the expense of some details; therefore, this file should not be parsed for machine-readable information. -@+ © 2021 Unicode®, Inc. +@+ © 2022 Unicode®, Inc. For terms of use, see https://www.unicode.org/terms_of_use.html @@ 0000 C0 Controls and Basic Latin (Basic Latin) 007F @@+ @@ -104,6 +115,9 @@ x (zero width space - 200B) x (narrow no-break space - 202F) x (word joiner - 2060) + x (symbol for space - 2420) + x (blank symbol - 2422) + x (open box - 2423) x (ideographic space - 3000) x (zero width no-break space - FEFF) 0021 EXCLAMATION MARK @@ -113,27 +127,42 @@ x (latin letter retroflex click - 01C3) x (double exclamation mark - 203C) x (interrobang - 203D) + x (warning sign - 26A0) + x (heavy exclamation mark symbol - 2757) x (heavy exclamation mark ornament - 2762) + x (medieval exclamation mark - 2E53) + x (modifier letter raised exclamation mark - A71D) 0022 QUOTATION MARK + = double quote * neutral (vertical), used as opening or closing quotation mark * preferred characters in English for paired quotation marks are 201C & 201D * 05F4 is preferred for gershayim when writing Hebrew x (modifier letter double prime - 02BA) + x (double acute accent - 02DD) + x (modifier letter double apostrophe - 02EE) x (combining double acute accent - 030B) x (combining double vertical line above - 030E) x (hebrew punctuation gershayim - 05F4) + x (left double quotation mark - 201C) + x (right double quotation mark - 201D) x (double prime - 2033) x (ditto mark - 3003) 0023 NUMBER SIGN - = pound sign, hash, crosshatch, octothorpe + = pound sign (weight) + = hashtag, hash + = crosshatch, octothorpe + * for denoting musical sharp 266F is preferred x (l b bar symbol - 2114) + x (numero sign - 2116) x (viewdata square - 2317) x (music sharp sign - 266F) + x (equals sign and slanted parallel - 29E3) 0024 DOLLAR SIGN = milréis, escudo * used for many peso currencies in Latin America and elsewhere * glyph may have one or two vertical bars * other currency symbol characters start at 20A0 + x (cent sign - 00A2) x (currency sign - 00A4) x (peso sign - 20B1) x (heavy dollar sign - 1F4B2) @@ -143,11 +172,14 @@ x (per ten thousand sign - 2031) x (commercial minus sign - 2052) 0026 AMPERSAND + = and + * originally derived from a ligature of 'e' and 't' x (tironian sign et - 204A) x (turned ampersand - 214B) x (heavy ampersand ornament - 1F674) 0027 APOSTROPHE = apostrophe-quote (1.0) + = single quote = APL quote * neutral (vertical) glyph with mixed usage * 2019 is preferred for apostrophe @@ -157,7 +189,10 @@ x (modifier letter apostrophe - 02BC) x (modifier letter vertical line - 02C8) x (combining acute accent - 0301) + x (combining vertical line above - 030D) x (hebrew punctuation geresh - 05F3) + x (left single quotation mark - 2018) + x (right single quotation mark - 2019) x (prime - 2032) x (latin small letter saltillo - A78C) 0028 LEFT PARENTHESIS @@ -166,43 +201,65 @@ = closing parenthesis (1.0) * see discussion on semantics of paired bracketing characters 002A ASTERISK - = star (on phone keypads) + = star + * can have five or six spokes x (arabic five pointed star - 066D) + x (asterism - 2042) x (low asterisk - 204E) + x (two asterisks aligned vertically - 2051) + x (combining asterisk above - 20F0) x (asterisk operator - 2217) x (sextile - 26B9) x (heavy asterisk - 2731) + x (slavonic asterisk - A673) + x (medium six spoked asterisk - 1F7B6) +@ ASCII math operator 002B PLUS SIGN + x (modifier letter plus sign - 02D6) + x (minus sign - 2212) x (heavy plus sign - 2795) + x (hebrew letter alternative plus sign - FB29) + x (light greek cross - 1F7A2) +@ ASCII punctuation 002C COMMA = decimal separator x (arabic comma - 060C) + x (arabic decimal separator - 066B) x (single low-9 quotation mark - 201A) x (reversed comma - 2E41) x (medieval comma - 2E4C) x (ideographic comma - 3001) 002D HYPHEN-MINUS - = hyphen or minus sign - * used for either hyphen or minus sign + = hyphen, dash + = minus sign + * used generically for hyphen, minus sign or en dash, all of which have dedicated alternatives + x (soft hyphen - 00AD) + x (modifier letter minus sign - 02D7) x (hyphen - 2010) x (non-breaking hyphen - 2011) x (figure dash - 2012) x (en dash - 2013) + x (hyphenation point - 2027) x (hyphen bullet - 2043) x (minus sign - 2212) x (roman uncia sign - 10191) 002E FULL STOP = period, dot, decimal point + * the use as decimal point is locale dependent * may be rendered as a raised decimal point in old style numbers x (arabic full stop - 06D4) + x (one dot leader - 2024) + x (horizontal ellipsis - 2026) + x (raised dot - 2E33) x (stenographic full stop - 2E3C) x (ideographic full stop - 3002) 002F SOLIDUS - = slash, virgule - x (latin letter dental click - 01C0) + = slash, forward slash, virgule x (combining long solidus overlay - 0338) x (fraction slash - 2044) x (division slash - 2215) + x (mathematical rising diagonal - 27CB) + x (big solidus - 29F8) x (dotted solidus - 2E4A) @ ASCII digits 0030 DIGIT ZERO @@ -216,42 +273,65 @@ 0037 DIGIT SEVEN 0038 DIGIT EIGHT 0039 DIGIT NINE -@ ASCII punctuation and symbols +@ ASCII punctuation 003A COLON * also used to denote division or scale; for that mathematical use 2236 is preferred + * in Finnish and Swedish, also used as intra-word punctation (abbreviation mark) + x (modifier letter triangular colon - 02D0) + x (modifier letter raised colon - 02F8) x (armenian full stop - 0589) x (hebrew punctuation sof pasuq - 05C3) + x (ethiopic wordspace - 1361) + x (ethiopic colon - 1365) + x (two dot punctuation - 205A) + x (tricolon - 205D) x (ratio - 2236) x (modifier letter colon - A789) + x (presentation form for vertical two dot leader - FE30) 003B SEMICOLON * this, and not 037E, is the preferred character for 'Greek question mark' x (greek question mark - 037E) x (arabic semicolon - 061B) x (reversed semicolon - 204F) + x (turned semicolon - 2E35) +@ ASCII mathematical operators +@+ Other mathematical operators start at 2200. 003C LESS-THAN SIGN + * paired with 003E for ASCII-based angle bracket markup conventions + x (modifier letter left arrowhead - 02C2) x (single left-pointing angle quotation mark - 2039) x (left-pointing angle bracket - 2329) x (mathematical left angle bracket - 27E8) x (left angle bracket - 3008) 003D EQUALS SIGN * other related characters: 2241-2263 + x (canadian syllabics hyphen - 1400) + x (almost equal to - 2248) x (not equal to - 2260) x (identical to - 2261) + x (double hyphen - 2E40) + x (katakana-hiragana double hyphen - 30A0) x (modifier letter short equals sign - A78A) x (roman sextans sign - 10190) x (heavy equals sign - 1F7F0) 003E GREATER-THAN SIGN + x (modifier letter right arrowhead - 02C3) x (single right-pointing angle quotation mark - 203A) x (right-pointing angle bracket - 232A) x (mathematical right angle bracket - 27E9) x (right angle bracket - 3009) +@ ASCII punctuation 003F QUESTION MARK x (inverted question mark - 00BF) x (greek question mark - 037E) x (arabic question mark - 061F) x (interrobang - 203D) - x (question exclamation mark - 2048) - x (exclamation question mark - 2049) + x (double question mark - 2047) + x (black question mark ornament - 2753) + x (uncertainty sign - 2BD1) + x (reversed question mark - 2E2E) + x (medieval question mark - 2E54) + x (replacement character - FFFD) 0040 COMMERCIAL AT = at sign @ Uppercase Latin alphabet @@ -260,12 +340,16 @@ x (script capital b - 212C) 0043 LATIN CAPITAL LETTER C x (double-struck capital c - 2102) + x (degree celsius - 2103) x (black-letter capital c - 212D) + x (roman numeral one hundred - 216D) 0044 LATIN CAPITAL LETTER D + x (roman numeral five hundred - 216E) 0045 LATIN CAPITAL LETTER E x (euler constant - 2107) x (script capital e - 2130) 0046 LATIN CAPITAL LETTER F + x (degree fahrenheit - 2109) x (script capital f - 2131) x (turned capital f - 2132) 0047 LATIN CAPITAL LETTER G @@ -276,8 +360,6 @@ 0049 LATIN CAPITAL LETTER I * Turkish and Azerbaijani use 0131 for lowercase x (latin capital letter i with dot above - 0130) - x (cyrillic capital letter byelorussian-ukrainian i - 0406) - x (cyrillic letter palochka - 04C0) x (script capital i - 2110) x (black-letter capital i - 2111) x (roman numeral one - 2160) @@ -288,13 +370,16 @@ x (script capital l - 2112) 004D LATIN CAPITAL LETTER M x (script capital m - 2133) + x (roman numeral one thousand - 216F) 004E LATIN CAPITAL LETTER N x (double-struck capital n - 2115) 004F LATIN CAPITAL LETTER O 0050 LATIN CAPITAL LETTER P + x (script capital p - 2118) x (double-struck capital p - 2119) 0051 LATIN CAPITAL LETTER Q x (double-struck capital q - 211A) + x (rotated capital q - 213A) 0052 LATIN CAPITAL LETTER R x (script capital r - 211B) x (black-letter capital r - 211C) @@ -306,6 +391,7 @@ x (roman numeral five - 2164) 0057 LATIN CAPITAL LETTER W 0058 LATIN CAPITAL LETTER X + x (roman numeral ten - 2169) 0059 LATIN CAPITAL LETTER Y 005A LATIN CAPITAL LETTER Z x (double-struck capital z - 2124) @@ -318,10 +404,13 @@ = backslash x (combining reverse solidus overlay - 20E5) x (set minus - 2216) + x (mathematical falling diagonal - 27CD) + x (big reverse solidus - 29F9) 005D RIGHT SQUARE BRACKET = closing square bracket (1.0) 005E CIRCUMFLEX ACCENT * this is a spacing character + * used in ASCII-based representation of exponentiation x (modifier letter up arrowhead - 02C4) x (modifier letter circumflex accent - 02C6) x (combining circumflex accent - 0302) @@ -330,10 +419,12 @@ 005F LOW LINE = spacing underscore (1.0) * this is a spacing character + * joins with adjacent instances of itself x (modifier letter low macron - 02CD) x (combining macron below - 0331) x (combining low line - 0332) x (double low line - 2017) + x (combining conjoining macron below - FE2D) 0060 GRAVE ACCENT * this is a spacing character x (modifier letter grave accent - 02CB) @@ -347,6 +438,7 @@ 0065 LATIN SMALL LETTER E x (estimated symbol - 212E) x (script small e - 212F) + x (latin small letter blackletter e - AB32) 0066 LATIN SMALL LETTER F 0067 LATIN SMALL LETTER G x (latin small letter script g - 0261) @@ -357,6 +449,7 @@ 0069 LATIN SMALL LETTER I * Turkish and Azerbaijani use 0130 for uppercase x (latin small letter dotless i - 0131) + x (superscript latin small letter i - 2071) x (mathematical italic small dotless i - 1D6A4) 006A LATIN SMALL LETTER J x (latin small letter dotless j - 0237) @@ -370,15 +463,18 @@ x (superscript latin small letter n - 207F) 006F LATIN SMALL LETTER O x (script small o - 2134) + x (latin small letter blackletter o - AB3D) 0070 LATIN SMALL LETTER P 0071 LATIN SMALL LETTER Q 0072 LATIN SMALL LETTER R 0073 LATIN SMALL LETTER S + x (latin small letter long s - 017F) 0074 LATIN SMALL LETTER T 0075 LATIN SMALL LETTER U 0076 LATIN SMALL LETTER V 0077 LATIN SMALL LETTER W 0078 LATIN SMALL LETTER X + x (multiplication sign - 00D7) 0079 LATIN SMALL LETTER Y 007A LATIN SMALL LETTER Z x (latin small letter z with stroke - 01B6) @@ -387,10 +483,14 @@ = opening curly bracket (1.0) = left brace 007C VERTICAL LINE - = vertical bar + = vertical bar, pipe * used in pairs to indicate absolute value + * also used as an unpaired separator or as a fence + x (broken bar - 00A6) x (latin letter dental click - 01C0) x (hebrew punctuation paseq - 05C0) + x (devanagari danda - 0964) + x (combining long vertical line overlay - 20D2) x (divides - 2223) x (light vertical bar - 2758) 007D RIGHT CURLY BRACKET @@ -400,8 +500,12 @@ * this is a spacing character x (small tilde - 02DC) x (combining tilde - 0303) + x (combining tilde overlay - 0334) x (swung dash - 2053) x (tilde operator - 223C) + x (tilde with ring above - 2E1B) + x (vertical tilde - 2E2F) + x (wave dash - 301C) x (fullwidth tilde - FF5E) @ Control character 007F @@ -481,31 +585,42 @@ x (figure space - 2007) x (narrow no-break space - 202F) x (word joiner - 2060) + x (shouldered open box - 237D) x (zero width no-break space - FEFF) # 0020 00A1 INVERTED EXCLAMATION MARK * Spanish, Asturian, Galician * used in extended IPA to represent sublaminal lower alveolar percussive x (exclamation mark - 0021) + x (modifier letter raised inverted exclamation mark - A71E) 00A2 CENT SIGN + x (latin small letter c with stroke - 023C) + x (mill sign - 20A5) + x (cedi sign - 20B5) + x (musical symbol cut time - 1D135) 00A3 POUND SIGN - = pound sterling, Irish punt, Italian lira, Turkish lira, etc. + = pound sterling, Irish punt, lira, etc. + * glyph may have one or two crossbars, in distinction from 20A4 x (lira sign - 20A4) x (turkish lira sign - 20BA) x (roman semuncia sign - 10192) 00A4 CURRENCY SIGN - * other currency symbol characters: 20A0-20BF + * generic or unknown currency + * other currency symbol characters start at 20A0 x (dollar sign - 0024) 00A5 YEN SIGN - = yuan sign + = yuan sign (renminbi) * glyph may have one or two crossbars, but the official symbol in Japan and China has two + * in native context, specific ideographs may be used for units of these currencies x 5143 x 5186 00A6 BROKEN BAR = broken vertical bar (1.0) = parted rule (in typography) + x (vertical line - 007C) 00A7 SECTION SIGN - * paragraph sign in some European usage + * used in referencing numbered sections or paragraphs + x (top half section sign - 2E39) 00A8 DIAERESIS * this is a spacing character x (combining diaeresis - 0308) @@ -517,6 +632,7 @@ x (mask work symbol - 1F1AD) 00AA FEMININE ORDINAL INDICATOR * Spanish + x (modifier letter small a - 1D43) # 0061 00AB LEFT-POINTING DOUBLE ANGLE QUOTATION MARK = left guillemet @@ -527,26 +643,37 @@ 00AC NOT SIGN = angled dash (in typography) x (reversed not sign - 2310) + x (turned not sign - 2319) 00AD SOFT HYPHEN = discretionary hyphen * commonly abbreviated as SHY + * an invisible format character indicating a possible hyphenation location 00AE REGISTERED SIGN = registered trade mark sign (1.0) + x (trade mark sign - 2122) x (circled latin capital letter r - 24C7) + x (raised md sign - 1F16B) + x (raised mr sign - 1F16C) 00AF MACRON = overline, APL overbar * this is a spacing character + * unlike 203E, adjacent instances of this character do not join x (modifier letter macron - 02C9) x (combining macron - 0304) x (combining overline - 0305) + x (overline - 203E) + x (combining conjoining macron - FE26) # 0020 0304 00B0 DEGREE SIGN * this is a spacing character x (ring above - 02DA) x (combining ring above - 030A) x (superscript zero - 2070) + x (degree celsius - 2103) + x (degree fahrenheit - 2109) x (ring operator - 2218) 00B1 PLUS-MINUS SIGN + = biquintile (astrological aspect: 144°) x (minus-or-plus sign - 2213) 00B2 SUPERSCRIPT TWO = squared @@ -562,6 +689,8 @@ x (modifier letter prime - 02B9) x (modifier letter acute accent - 02CA) x (combining acute accent - 0301) + x (greek tonos - 0384) + x (greek oxia - 1FFD) x (prime - 2032) # 0020 0301 00B5 MICRO SIGN @@ -577,6 +706,8 @@ = Georgian comma = Greek middle dot (ano teleia) * also used as a raised decimal point or to denote multiplication; for multiplication 22C5 is preferred + x (full stop - 002E) + x (dot above - 02D9) x (greek ano teleia - 0387) x (runic single punctuation - 16EB) x (bullet - 2022) @@ -596,9 +727,12 @@ 00B9 SUPERSCRIPT ONE x (superscript two - 00B2) x (superscript three - 00B3) + x (superscript zero - 2070) # 0031 00BA MASCULINE ORDINAL INDICATOR * Spanish + x (modifier letter small o - 1D52) + x (numero sign - 2116) # 006F 00BB RIGHT-POINTING DOUBLE ANGLE QUOTATION MARK = right guillemet @@ -657,6 +791,7 @@ * lowercase is 00F0 x (latin capital letter d with stroke - 0110) x (latin capital letter african d - 0189) + x (latin capital letter d with short stroke overlay - A7C7) 00D1 LATIN CAPITAL LETTER N WITH TILDE : 004E 0303 00D2 LATIN CAPITAL LETTER O WITH GRAVE @@ -672,9 +807,14 @@ @ Mathematical operator 00D7 MULTIPLICATION SIGN = z notation Cartesian product + x (latin small letter x - 0078) + x (saltire - 2613) x (multiplication x - 2715) + x (heavy ballot x - 2718) x (cross mark - 274C) x (vector or cross product - 2A2F) + x (cancellation x - 1F5D9) + x (light saltire - 1F7A9) @ Letters 00D8 LATIN CAPITAL LETTER O WITH STROKE = o slash @@ -694,9 +834,12 @@ = Eszett * German * not used in Swiss High German - * uppercase is "SS" or 1E9E + * uppercase is "SS" (standard case mapping), alternatively 1E9E * typographically the glyph for this character can be based on a ligature of 017F with either 0073 or with an old-style glyph for 007A (the latter similar in appearance to 0292). Both forms exist interchangeably today. + x (latin small letter long s - 017F) + x (latin small letter ezh - 0292) x (greek small letter beta - 03B2) + x (latin capital letter sharp s - 1E9E) 00E0 LATIN SMALL LETTER A WITH GRAVE : 0061 0300 00E1 LATIN SMALL LETTER A WITH ACUTE @@ -739,6 +882,7 @@ 00F0 LATIN SMALL LETTER ETH * Icelandic, Faroese, Old English, IPA * uppercase is 00D0 + x (latin small letter d with stroke - 0111) x (greek small letter delta - 03B4) x (partial differential - 2202) 00F1 LATIN SMALL LETTER N WITH TILDE @@ -757,7 +901,7 @@ @ Mathematical operator 00F7 DIVISION SIGN = obelus - * occasionally used as an alternate, more visually distinct version of 2212 or 2011 in some contexts + * occasionally used as an alternate, more visually distinct shape for a hyphen in some contexts * historically used as a punctuation mark to denote questionable passages in manuscripts x (syriac harklean obelus - 070B) x (commercial minus sign - 2052) @@ -766,6 +910,8 @@ x (divides - 2223) x (ratio - 2236) x (heavy division sign - 2797) + x (long division - 27CC) + x (dotted obelos - 2E13) @ Letters 00F8 LATIN SMALL LETTER O WITH STROKE = o slash @@ -3939,14 +4085,18 @@ * Kazakh, Jawi * forms digraphs @ Digraphic letters for Kazakh -@+ Use of these characters is discouraged. They were encoded for Kazakh digraphs, but their decompositions do not reflect the preferred order of representation. +@+ Use of these characters is discouraged. They were encoded for Kazakh digraphs, but their decompositions do not reflect the preferred order of representation. Accordingly, the representation of these Kazakh digraphs should instead use the preferred two-character spellings with the correct order of elements. 0675 ARABIC LETTER HIGH HAMZA ALEF + * preferred spelling is 0674 0627 # 0627 0674 0676 ARABIC LETTER HIGH HAMZA WAW + * preferred spelling is 0674 0648 # 0648 0674 0677 ARABIC LETTER U WITH HAMZA ABOVE + * preferred spelling is 0674 06C7 # 06C7 0674 0678 ARABIC LETTER HIGH HAMZA YEH + * preferred spelling is 0674 0649 # 064A 0674 @ Extended Arabic letters 0679 ARABIC LETTER TTEH @@ -4879,6 +5029,7 @@ 08DB ARABIC SMALL HIGH WORD AS-SAJDA 08DC ARABIC SMALL HIGH WORD AN-NISF 08DD ARABIC SMALL HIGH WORD SAKTA + x (arabic small low word sakta - 10EFD) 08DE ARABIC SMALL HIGH WORD QIF 08DF ARABIC SMALL HIGH WORD WAQFA 08E0 ARABIC SMALL HIGH FOOTNOTE MARKER @@ -5957,6 +6108,7 @@ 0C80 KANNADA SIGN SPACING CANDRABINDU 0C81 KANNADA SIGN CANDRABINDU 0C82 KANNADA SIGN ANUSVARA + * used in Konkani, Havyaka Kannada (Havigannada) and Awadhi texts to indicate regular anusvara 0C83 KANNADA SIGN VISARGA 0C84 KANNADA SIGN SIDDHAM = siddhirastu @@ -6079,6 +6231,8 @@ x (vedic sign jihvamuliya - 1CF5) 0CF2 KANNADA SIGN UPADHMANIYA x (vedic sign upadhmaniya - 1CF6) +0CF3 KANNADA SIGN COMBINING ANUSVARA ABOVE RIGHT + * used in Konkani, Havyaka Kannada (Havigannada) and Awadhi texts to indicate anunāsikā @@ 0D00 Malayalam 0D7F @ Various signs 0D00 MALAYALAM SIGN COMBINING ANUSVARA ABOVE @@ -6585,6 +6739,7 @@ = nikkhahit * final nasal 0E4E THAI CHARACTER YAMAKKAN + x (lao yamakkan - 0ECE) 0E4F THAI CHARACTER FONGMAN * used as a bullet x (khmer sign phnaek muan - 17D9) @@ -6728,6 +6883,9 @@ 0ECC LAO CANCELLATION MARK 0ECD LAO NIGGAHITA * final nasal or long o vowel +0ECE LAO YAMAKKAN + * marks a consonant that is simultaneously a part of two consonant clusters in Pali text + x (thai character yamakkan - 0E4E) @ Digits 0ED0 LAO DIGIT ZERO 0ED1 LAO DIGIT ONE @@ -10641,14 +10799,19 @@ 1BB9 SUNDANESE DIGIT NINE @ Sign 1BBA SUNDANESE AVAGRAHA + = gemination mark @ Historic letters 1BBB SUNDANESE LETTER REU * vocalic r 1BBC SUNDANESE LETTER LEU * vocalic l 1BBD SUNDANESE LETTER BHA + % SUNDANESE LETTER ARCHAIC I + * character was originally misidentified, so its name is a misnomer 1BBE SUNDANESE LETTER FINAL K 1BBF SUNDANESE LETTER FINAL M + * used in a 21st century document + * for actual final m, use the sequence 1B99 1BAA @@ 1BC0 Batak 1BFF @ Letters @+ Annotations for letters indicate different usage among the various alphabets sharing the Batak script. @@ -13227,6 +13390,9 @@ 20E6 COMBINING DOUBLE VERTICAL STROKE OVERLAY = z notation finite function diacritic x (double vertical line - 2016) + x (rightwards arrow with double vertical stroke - 21FB) + x (rightwards two-headed arrow with double vertical stroke - 2901) + x (rightwards arrow with tail with double vertical stroke - 2915) 20E7 COMBINING ANNUITY SYMBOL = actuarial bend x (right ceiling - 2309) @@ -14091,7 +14257,9 @@ : 2261 0338 2263 STRICTLY EQUIVALENT TO 2264 LESS-THAN OR EQUAL TO + x (less-than sign - 003C) 2265 GREATER-THAN OR EQUAL TO + x (greater-than sign - 003E) 2266 LESS-THAN OVER EQUAL TO 2267 GREATER-THAN OVER EQUAL TO 2268 LESS-THAN BUT NOT EQUAL TO @@ -14198,6 +14366,7 @@ x (circled crossing lanes - 26D2) x (n-ary circled times operator - 2A02) x (circled x - 2BBE) + x (lot of fortune - 1F774) ~ 2297 FE00 with white rim 2298 CIRCLED DIVISION SLASH 2299 CIRCLED DOT OPERATOR @@ -14311,6 +14480,9 @@ x (black star - 2605) x (white medium star - 2B50) 22C7 DIVISION TIMES + x (multiplication sign - 00D7) + x (division sign - 00F7) + x (multiplication x - 2715) @ Relation 22C8 BOWTIE x (ocr bow tie - 2445) @@ -14472,7 +14644,7 @@ 231B HOURGLASS = alchemical symbol for hour @ Quine corners -@+ These form a set of four quine corners, for quincuncial arrangement. They are also used in upper and lower pairs in mathematic, or more rarely in editorial usage as alternatives to half brackets. +@+ These form a set of four quine corners, for quincuncial arrangement. They are also used in upper and lower pairs in mathematics, or more rarely in editorial usage as alternatives to half brackets. 231C TOP LEFT CORNER x (right angle substitution marker - 2E00) x (top left half bracket - 2E22) @@ -15741,7 +15913,9 @@ x (alchemical symbol for purify - 1F763) 260C CONJUNCTION = alchemical symbol for day + x (occultation - 1F775) 260D OPPOSITION + x (lunar eclipse - 1F776) @ Miscellaneous symbols 260E BLACK TELEPHONE x (telephone sign - 2121) @@ -15827,6 +16001,7 @@ 262C ADI SHAKTI = khanda * Sikh religious symbol + x (khanda - 1FAAF) 262D HAMMER AND SICKLE 262E PEACE SYMBOL 262F YIN YANG @@ -16105,7 +16280,7 @@ = heterosexuality 26A5 MALE AND FEMALE SIGN = intersex, androgynous - = hermaphrodite (in entomology) + = hermaphroditic (in botany) 26A6 MALE WITH STROKE SIGN = transgender = alchemical symbol for iron or crocus of iron @@ -19279,7 +19454,9 @@ 2E94 CJK RADICAL SNOUT ONE x 5F51 2E95 CJK RADICAL SNOUT TWO + * actually a form of the radical for hand, despite its resemblance in shape to the radical for snout x 5F50 + x 2B739 2E96 CJK RADICAL HEART ONE * form used on left side x 5FC4 @@ -21932,6 +22109,7 @@ 33D6 SQUARE MOL # 006D 006F 006C 33D7 SQUARE PH + * casing inconsistency in the compatibility decomposition is a known anomaly dating from glyph presentations in very early versions of the standard # 0050 0048 33D8 SQUARE PM # 0070 002E 006D 002E @@ -24779,11 +24957,13 @@ A91E KAYAH LI LETTER THA A91F KAYAH LI LETTER HA A920 KAYAH LI LETTER VA A921 KAYAH LI LETTER CA +@ Vowels A922 KAYAH LI LETTER A + * serves as a vowel carrier for vowels indicated with combining marks A923 KAYAH LI LETTER OE + * also serves as a vowel carrier A924 KAYAH LI LETTER I A925 KAYAH LI LETTER OO -@ Vowels A926 KAYAH LI VOWEL UE A927 KAYAH LI VOWEL E A928 KAYAH LI VOWEL U @@ -32165,6 +32345,7 @@ FFFF 10C47 OLD TURKIC LETTER ORKHON OT 10C48 OLD TURKIC LETTER ORKHON BASH @@ 10C80 Old Hungarian 10CFF +@+ This script has contemporary usage in Hungary, where users often prefer the name Szekely-Hungarian Rovas. @ Uppercase letters @+ The use of uppercase letters is a modern innovation. 10C80 OLD HUNGARIAN CAPITAL LETTER A @@ -32352,6 +32533,7 @@ FFFF * in earlier literature called "tprus" (later recognized as an abbreviation for "temperius") 10CF2 OLD HUNGARIAN SMALL LETTER US @ Numbers +@+ The numbers for one, five, and ten have a clear relationship to Roman numerals. 10CFA OLD HUNGARIAN NUMBER ONE 10CFB OLD HUNGARIAN NUMBER FIVE 10CFC OLD HUNGARIAN NUMBER TEN @@ -32517,6 +32699,12 @@ FFFF @ Historical letters with diacritics 10EB0 YEZIDI LETTER LAM WITH DOT ABOVE 10EB1 YEZIDI LETTER YOT WITH CIRCUMFLEX ABOVE +@@ 10EC0 Arabic Extended-C 10EFF +@ Quranic marks used in Turkey +10EFD ARABIC SMALL LOW WORD SAKTA + x (arabic small high word sakta - 08DD) +10EFE ARABIC SMALL LOW WORD QASR +10EFF ARABIC SMALL LOW WORD MADDA @@ 10F00 Old Sogdian 10F2F @+ This block unifies the scripts used in the Ancient Letters and the Kultobe and Upper Indus inscriptions. @ Letters @@ -33330,6 +33518,12 @@ FFFF @ Sign 1123E KHOJKI SIGN SUKUN * used for Arabic transliteration +@ Consonant +1123F KHOJKI LETTER QA +@ Independent vowel +11240 KHOJKI LETTER SHORT I +@ Dependent vowel sign +11241 KHOJKI VOWEL SIGN VOCALIC R @@ 11280 Multani 112AF @ Vowels 11280 MULTANI LETTER A @@ -34821,6 +35015,22 @@ FFFF 11AF6 PAU CIN HAU LOW-FALLING TONE LONG FINAL 11AF7 PAU CIN HAU LOW-FALLING TONE FINAL 11AF8 PAU CIN HAU GLOTTAL STOP FINAL +@@ 11B00 Devanagari Extended-A 11B5F +@ Head marks +11B00 DEVANAGARI HEAD MARK + x (devanagari double danda - 0965) +11B01 DEVANAGARI HEAD MARK WITH HEADSTROKE +@ Auspicious signs +@+ These are used for representing bhale mīndu signs. +11B02 DEVANAGARI SIGN BHALE +11B03 DEVANAGARI SIGN BHALE WITH HOOK +11B04 DEVANAGARI SIGN EXTENDED BHALE +11B05 DEVANAGARI SIGN EXTENDED BHALE WITH HOOK +11B06 DEVANAGARI SIGN WESTERN FIVE-LIKE BHALE +11B07 DEVANAGARI SIGN WESTERN NINE-LIKE BHALE +11B08 DEVANAGARI SIGN REVERSED NINE-LIKE BHALE +11B09 DEVANAGARI SIGN MINDU + x (devanagari digit zero - 0966) @@ 11C00 Bhaiksuki 11C6F @ Independent vowels 11C00 BHAIKSUKI LETTER A @@ -35195,6 +35405,106 @@ FFFF @ Punctuation 11EF7 MAKASAR PASSIMBANG 11EF8 MAKASAR END OF SECTION +@@ 11F00 Kawi 11F5F +@ Signs +11F00 KAWI SIGN CANDRABINDU +11F01 KAWI SIGN ANUSVARA +11F02 KAWI SIGN REPHA + * cluster-initial form of 11F2C + * also used as final r +11F03 KAWI SIGN VISARGA +@ Independent vowels +11F04 KAWI LETTER A +11F05 KAWI LETTER AA +11F06 KAWI LETTER I +11F07 KAWI LETTER II +11F08 KAWI LETTER U +11F09 KAWI LETTER UU +11F0A KAWI LETTER VOCALIC R +11F0B KAWI LETTER VOCALIC RR +11F0C KAWI LETTER VOCALIC L +11F0D KAWI LETTER VOCALIC LL +11F0E KAWI LETTER E +11F0F KAWI LETTER AI +11F10 KAWI LETTER O +@ Consonants +11F12 KAWI LETTER KA +11F13 KAWI LETTER KHA +11F14 KAWI LETTER GA +11F15 KAWI LETTER GHA +11F16 KAWI LETTER NGA +11F17 KAWI LETTER CA +11F18 KAWI LETTER CHA +11F19 KAWI LETTER JA +11F1A KAWI LETTER JHA +11F1B KAWI LETTER NYA +11F1C KAWI LETTER TTA +11F1D KAWI LETTER TTHA +11F1E KAWI LETTER DDA +11F1F KAWI LETTER DDHA +11F20 KAWI LETTER NNA +11F21 KAWI LETTER TA +11F22 KAWI LETTER THA +11F23 KAWI LETTER DA +11F24 KAWI LETTER DHA +11F25 KAWI LETTER NA +11F26 KAWI LETTER PA +11F27 KAWI LETTER PHA +11F28 KAWI LETTER BA +11F29 KAWI LETTER BHA +11F2A KAWI LETTER MA +11F2B KAWI LETTER YA +11F2C KAWI LETTER RA +11F2D KAWI LETTER LA +11F2E KAWI LETTER WA +11F2F KAWI LETTER SHA +11F30 KAWI LETTER SSA +11F31 KAWI LETTER SA +11F32 KAWI LETTER HA +11F33 KAWI LETTER JNYA +@ Dependent vowel signs +11F34 KAWI VOWEL SIGN AA +11F35 KAWI VOWEL SIGN ALTERNATE AA +11F36 KAWI VOWEL SIGN I +11F37 KAWI VOWEL SIGN II +11F38 KAWI VOWEL SIGN U +11F39 KAWI VOWEL SIGN UU +11F3A KAWI VOWEL SIGN VOCALIC R +11F3E KAWI VOWEL SIGN E +11F3F KAWI VOWEL SIGN AI +11F40 KAWI VOWEL SIGN EU + * represents schwa [ǝ] +@ Viramas +11F41 KAWI SIGN KILLER + * vowel killer, always rendered visibly +11F42 KAWI CONJOINER + * used for producing below-base and post-base conjunct forms +@ Punctuation +11F43 KAWI DANDA +11F44 KAWI DOUBLE DANDA +11F45 KAWI PUNCTUATION SECTION MARKER +11F46 KAWI PUNCTUATION ALTERNATE SECTION MARKER +11F47 KAWI PUNCTUATION FLOWER +11F48 KAWI PUNCTUATION SPACE FILLER +11F49 KAWI PUNCTUATION DOT +11F4A KAWI PUNCTUATION DOUBLE DOT +11F4B KAWI PUNCTUATION TRIPLE DOT +11F4C KAWI PUNCTUATION CIRCLE +11F4D KAWI PUNCTUATION FILLED CIRCLE +11F4E KAWI PUNCTUATION SPIRAL +11F4F KAWI PUNCTUATION CLOSING SPIRAL +@ Digits +11F50 KAWI DIGIT ZERO +11F51 KAWI DIGIT ONE +11F52 KAWI DIGIT TWO + * also used as letter ro +11F53 KAWI DIGIT THREE +11F54 KAWI DIGIT FOUR +11F55 KAWI DIGIT FIVE +11F56 KAWI DIGIT SIX +11F57 KAWI DIGIT SEVEN +11F58 KAWI DIGIT EIGHT +11F59 KAWI DIGIT NINE @@ 11FB0 Lisu Supplement 11FBF @ Letter 11FB0 LISU LETTER YHA @@ -36784,7 +37094,9 @@ FFFF 1305B EGYPTIAN HIEROGLYPH C002 1305C EGYPTIAN HIEROGLYPH C002A 1305D EGYPTIAN HIEROGLYPH C002B + * mirrored version of 1305C 1305E EGYPTIAN HIEROGLYPH C002C + * mirrored version of 1305B 1305F EGYPTIAN HIEROGLYPH C003 13060 EGYPTIAN HIEROGLYPH C004 13061 EGYPTIAN HIEROGLYPH C005 @@ -36798,8 +37110,10 @@ FFFF * 1,000,000 13069 EGYPTIAN HIEROGLYPH C012 1306A EGYPTIAN HIEROGLYPH C013 + * mirrored version of 13069 1306B EGYPTIAN HIEROGLYPH C014 1306C EGYPTIAN HIEROGLYPH C015 + * mirrored version of 1306B 1306D EGYPTIAN HIEROGLYPH C016 1306E EGYPTIAN HIEROGLYPH C017 1306F EGYPTIAN HIEROGLYPH C018 @@ -36824,6 +37138,8 @@ FFFF 13081 EGYPTIAN HIEROGLYPH D011 * 1/2 13082 EGYPTIAN HIEROGLYPH D012 + * pupil of the eye + * not to be confused with 131F3 or 133F8 * 1/4 13083 EGYPTIAN HIEROGLYPH D013 * 1/8 @@ -36838,6 +37154,8 @@ FFFF 13089 EGYPTIAN HIEROGLYPH D019 1308A EGYPTIAN HIEROGLYPH D020 1308B EGYPTIAN HIEROGLYPH D021 + * mouth + * not to be confused with 133AB * transliterated as r 1308C EGYPTIAN HIEROGLYPH D022 1308D EGYPTIAN HIEROGLYPH D023 @@ -36845,8 +37163,11 @@ FFFF 1308F EGYPTIAN HIEROGLYPH D025 13090 EGYPTIAN HIEROGLYPH D026 13091 EGYPTIAN HIEROGLYPH D027 + ~ 13091 FE00 rotated 90 degrees 13092 EGYPTIAN HIEROGLYPH D027A + ~ 13092 FE00 rotated 90 degrees 13093 EGYPTIAN HIEROGLYPH D028 + ~ 13093 FE01 rotated 180 degrees 13094 EGYPTIAN HIEROGLYPH D029 13095 EGYPTIAN HIEROGLYPH D030 13096 EGYPTIAN HIEROGLYPH D031 @@ -36873,10 +37194,13 @@ FFFF * transliterated as d 130A8 EGYPTIAN HIEROGLYPH D046A 130A9 EGYPTIAN HIEROGLYPH D047 + ~ 130A9 FE01 rotated 180 degrees 130AA EGYPTIAN HIEROGLYPH D048 130AB EGYPTIAN HIEROGLYPH D048A 130AC EGYPTIAN HIEROGLYPH D049 130AD EGYPTIAN HIEROGLYPH D050 + * classifier 'accurate, finger' + * not to be confused with 130B7 * 10,000 130AE EGYPTIAN HIEROGLYPH D050A * 20,000 @@ -36897,12 +37221,16 @@ FFFF 130B6 EGYPTIAN HIEROGLYPH D050I * 50,000 130B7 EGYPTIAN HIEROGLYPH D051 + * classifier 'measure, nail, scratching, taking' + * not to be confused with 130AD 130B8 EGYPTIAN HIEROGLYPH D052 130B9 EGYPTIAN HIEROGLYPH D052A 130BA EGYPTIAN HIEROGLYPH D053 130BB EGYPTIAN HIEROGLYPH D054 + * (forward) motion 130BC EGYPTIAN HIEROGLYPH D054A 130BD EGYPTIAN HIEROGLYPH D055 + * backward motion 130BE EGYPTIAN HIEROGLYPH D056 130BF EGYPTIAN HIEROGLYPH D057 130C0 EGYPTIAN HIEROGLYPH D058 @@ -36917,6 +37245,7 @@ FFFF 130C8 EGYPTIAN HIEROGLYPH D066 130C9 EGYPTIAN HIEROGLYPH D067 * 1 heqat measure + * not to be confused with 13212 130CA EGYPTIAN HIEROGLYPH D067A * 2 heqat measures 130CB EGYPTIAN HIEROGLYPH D067B @@ -36935,7 +37264,10 @@ FFFF * 9 heqat measures @ E. Mammals 130D2 EGYPTIAN HIEROGLYPH E001 + * bull, classifier 'cattle' + * not to be confused with 130FD 130D3 EGYPTIAN HIEROGLYPH E002 + * aggressive bull 130D4 EGYPTIAN HIEROGLYPH E003 130D5 EGYPTIAN HIEROGLYPH E004 130D6 EGYPTIAN HIEROGLYPH E005 @@ -36975,9 +37307,12 @@ FFFF 130F8 EGYPTIAN HIEROGLYPH E033 130F9 EGYPTIAN HIEROGLYPH E034 130FA EGYPTIAN HIEROGLYPH E034A + * stylistic variant, use of 130F9 is preferred 130FB EGYPTIAN HIEROGLYPH E036 130FC EGYPTIAN HIEROGLYPH E037 130FD EGYPTIAN HIEROGLYPH E038 + * cow + * not to be confused with 130D2 @ F. Parts of mammals 130FE EGYPTIAN HIEROGLYPH F001 130FF EGYPTIAN HIEROGLYPH F001A @@ -36994,34 +37329,43 @@ FFFF 1310A EGYPTIAN HIEROGLYPH F012 1310B EGYPTIAN HIEROGLYPH F013 1310C EGYPTIAN HIEROGLYPH F013A + * stylistic variant, use of 1310B is preferred 1310D EGYPTIAN HIEROGLYPH F014 1310E EGYPTIAN HIEROGLYPH F015 1310F EGYPTIAN HIEROGLYPH F016 + ~ 1310F FE00 rotated 90 degrees 13110 EGYPTIAN HIEROGLYPH F017 13111 EGYPTIAN HIEROGLYPH F018 13112 EGYPTIAN HIEROGLYPH F019 13113 EGYPTIAN HIEROGLYPH F020 13114 EGYPTIAN HIEROGLYPH F021 13115 EGYPTIAN HIEROGLYPH F021A + * from hieratic 13116 EGYPTIAN HIEROGLYPH F022 13117 EGYPTIAN HIEROGLYPH F023 + ~ 13117 FE02 rotated 270 degrees 13118 EGYPTIAN HIEROGLYPH F024 + * mirrored version of 13117 13119 EGYPTIAN HIEROGLYPH F025 1311A EGYPTIAN HIEROGLYPH F026 1311B EGYPTIAN HIEROGLYPH F027 1311C EGYPTIAN HIEROGLYPH F028 + ~ 1311C FE00 rotated 90 degrees 1311D EGYPTIAN HIEROGLYPH F029 1311E EGYPTIAN HIEROGLYPH F030 1311F EGYPTIAN HIEROGLYPH F031 13120 EGYPTIAN HIEROGLYPH F031A + * cursive variant of 1311F 13121 EGYPTIAN HIEROGLYPH F032 * transliterated as 1E96 + ~ 13121 FE00 rotated 90 degrees 13122 EGYPTIAN HIEROGLYPH F033 13123 EGYPTIAN HIEROGLYPH F034 13124 EGYPTIAN HIEROGLYPH F035 13125 EGYPTIAN HIEROGLYPH F036 13126 EGYPTIAN HIEROGLYPH F037 13127 EGYPTIAN HIEROGLYPH F037A + ~ 13127 FE00 rotated 90 degrees 13128 EGYPTIAN HIEROGLYPH F038 13129 EGYPTIAN HIEROGLYPH F038A 1312A EGYPTIAN HIEROGLYPH F039 @@ -37034,25 +37378,37 @@ FFFF 13131 EGYPTIAN HIEROGLYPH F045A 13132 EGYPTIAN HIEROGLYPH F046 13133 EGYPTIAN HIEROGLYPH F046A + * rotated version of 13132 13134 EGYPTIAN HIEROGLYPH F047 + * mirrored version of 13132 13135 EGYPTIAN HIEROGLYPH F047A + * mirrored version of 13133 13136 EGYPTIAN HIEROGLYPH F048 13137 EGYPTIAN HIEROGLYPH F049 + * mirrored version of 13136 13138 EGYPTIAN HIEROGLYPH F050 13139 EGYPTIAN HIEROGLYPH F051 + ~ 13139 FE00 rotated 90 degrees + ~ 13139 FE02 rotated 270 degrees 1313A EGYPTIAN HIEROGLYPH F051A 1313B EGYPTIAN HIEROGLYPH F051B + * variant of 1313A 1313C EGYPTIAN HIEROGLYPH F051C + * rotated version of 13139 1313D EGYPTIAN HIEROGLYPH F052 1313E EGYPTIAN HIEROGLYPH F053 @ G. Birds 1313F EGYPTIAN HIEROGLYPH G001 + * Egyptian vulture, Egyptological alef + * not to be confused with 13142 * transliterated as A723 x (hebrew letter alef - 05D0) x (arabic letter alef with hamza above - 0623) 13140 EGYPTIAN HIEROGLYPH G002 13141 EGYPTIAN HIEROGLYPH G003 13142 EGYPTIAN HIEROGLYPH G004 + * phonogram 'tw' + * not to be confused with 1313F 13143 EGYPTIAN HIEROGLYPH G005 13144 EGYPTIAN HIEROGLYPH G006 13145 EGYPTIAN HIEROGLYPH G006A @@ -37093,10 +37449,14 @@ FFFF 13167 EGYPTIAN HIEROGLYPH G035 13168 EGYPTIAN HIEROGLYPH G036 13169 EGYPTIAN HIEROGLYPH G036A + * stylistic variant, use of 13168 is preferred 1316A EGYPTIAN HIEROGLYPH G037 1316B EGYPTIAN HIEROGLYPH G037A + * stylistic variant, use of 1316A is preferred 1316C EGYPTIAN HIEROGLYPH G038 + * goose 1316D EGYPTIAN HIEROGLYPH G039 + * duck 1316E EGYPTIAN HIEROGLYPH G040 1316F EGYPTIAN HIEROGLYPH G041 13170 EGYPTIAN HIEROGLYPH G042 @@ -37121,10 +37481,13 @@ FFFF 13181 EGYPTIAN HIEROGLYPH H003 13182 EGYPTIAN HIEROGLYPH H004 13183 EGYPTIAN HIEROGLYPH H005 + ~ 13183 FE02 rotated 270 degrees 13184 EGYPTIAN HIEROGLYPH H006 13185 EGYPTIAN HIEROGLYPH H006A + * from hieratic 13186 EGYPTIAN HIEROGLYPH H007 13187 EGYPTIAN HIEROGLYPH H008 + ~ 13187 FE01 rotated 180 degrees @ I. Amphibious animals, reptiles, etc. 13188 EGYPTIAN HIEROGLYPH I001 13189 EGYPTIAN HIEROGLYPH I002 @@ -37155,6 +37518,8 @@ FFFF 1319E EGYPTIAN HIEROGLYPH K004 1319F EGYPTIAN HIEROGLYPH K005 131A0 EGYPTIAN HIEROGLYPH K006 + ~ 131A0 FE00 rotated 90 degrees + ~ 131A0 FE02 rotated 270 degrees 131A1 EGYPTIAN HIEROGLYPH K007 131A2 EGYPTIAN HIEROGLYPH K008 @ L. Invertebrata and lesser animals @@ -37166,6 +37531,7 @@ FFFF 131A8 EGYPTIAN HIEROGLYPH L005 131A9 EGYPTIAN HIEROGLYPH L006 131AA EGYPTIAN HIEROGLYPH L006A + * mirrored version of 131A9 131AB EGYPTIAN HIEROGLYPH L007 131AC EGYPTIAN HIEROGLYPH L008 @ M. Trees and plants @@ -37174,6 +37540,8 @@ FFFF 131AF EGYPTIAN HIEROGLYPH M001B 131B0 EGYPTIAN HIEROGLYPH M002 131B1 EGYPTIAN HIEROGLYPH M003 + ~ 131B1 FE00 rotated 90 degrees + ~ 131B1 FE01 rotated 180 degrees 131B2 EGYPTIAN HIEROGLYPH M003A 131B3 EGYPTIAN HIEROGLYPH M004 131B4 EGYPTIAN HIEROGLYPH M005 @@ -37181,8 +37549,11 @@ FFFF 131B6 EGYPTIAN HIEROGLYPH M007 131B7 EGYPTIAN HIEROGLYPH M008 131B8 EGYPTIAN HIEROGLYPH M009 + ~ 131B8 FE00 rotated 90 degrees 131B9 EGYPTIAN HIEROGLYPH M010 + ~ 131B9 FE00 rotated 90 degrees 131BA EGYPTIAN HIEROGLYPH M010A + ~ 131BA FE02 rotated 270 degrees 131BB EGYPTIAN HIEROGLYPH M011 131BC EGYPTIAN HIEROGLYPH M012 * 1,000 @@ -37209,18 +37580,22 @@ FFFF 131C9 EGYPTIAN HIEROGLYPH M016 131CA EGYPTIAN HIEROGLYPH M016A 131CB EGYPTIAN HIEROGLYPH M017 - * yod + * egyptological yod + * transliterated as A7BD x (hebrew letter yod - 05D9) x (arabic letter yeh - 064A) + ~ 131CB FE00 rotated 90 degrees 131CC EGYPTIAN HIEROGLYPH M017A - * transliterated as y + * phonogram 'y' x (egyptian hieroglyph z004 - 133ED) 131CD EGYPTIAN HIEROGLYPH M018 131CE EGYPTIAN HIEROGLYPH M019 131CF EGYPTIAN HIEROGLYPH M020 131D0 EGYPTIAN HIEROGLYPH M021 131D1 EGYPTIAN HIEROGLYPH M022 + * classifier 'bud, lotus bud' 131D2 EGYPTIAN HIEROGLYPH M022A + *phonogram 'nn' 131D3 EGYPTIAN HIEROGLYPH M023 131D4 EGYPTIAN HIEROGLYPH M024 131D5 EGYPTIAN HIEROGLYPH M024A @@ -37236,41 +37611,65 @@ FFFF 131DF EGYPTIAN HIEROGLYPH M032 131E0 EGYPTIAN HIEROGLYPH M033 131E1 EGYPTIAN HIEROGLYPH M033A + * variant of 131E0 131E2 EGYPTIAN HIEROGLYPH M033B + * variant of 131E0 131E3 EGYPTIAN HIEROGLYPH M034 131E4 EGYPTIAN HIEROGLYPH M035 131E5 EGYPTIAN HIEROGLYPH M036 131E6 EGYPTIAN HIEROGLYPH M037 + * older variant of 131E5 131E7 EGYPTIAN HIEROGLYPH M038 131E8 EGYPTIAN HIEROGLYPH M039 131E9 EGYPTIAN HIEROGLYPH M040 + * phonogram 'js' + * not to be confused with 132A7 or 1342A 131EA EGYPTIAN HIEROGLYPH M040A 131EB EGYPTIAN HIEROGLYPH M041 131EC EGYPTIAN HIEROGLYPH M042 131ED EGYPTIAN HIEROGLYPH M043 131EE EGYPTIAN HIEROGLYPH M044 + * thorn + * not to be confused with 133DA + ~ 131EE FE01 rotated 180 degrees + ~ 131EE FE02 rotated 270 degrees @ N. Sky, earth, water 131EF EGYPTIAN HIEROGLYPH N001 131F0 EGYPTIAN HIEROGLYPH N002 131F1 EGYPTIAN HIEROGLYPH N003 + * older variant of 131F0 131F2 EGYPTIAN HIEROGLYPH N004 131F3 EGYPTIAN HIEROGLYPH N005 + * sun + * not to be confused with 13082 or 133F8 131F4 EGYPTIAN HIEROGLYPH N006 131F5 EGYPTIAN HIEROGLYPH N007 131F6 EGYPTIAN HIEROGLYPH N008 131F7 EGYPTIAN HIEROGLYPH N009 + * variant of 131F8 131F8 EGYPTIAN HIEROGLYPH N010 + * variant of 131F7 + ~ 131F8 FE01 rotated 180 degrees 131F9 EGYPTIAN HIEROGLYPH N011 + ~ 131F9 FE00 rotated 90 degrees + ~ 131F9 FE01 rotated 180 degrees 131FA EGYPTIAN HIEROGLYPH N012 + ~ 131FA FE00 rotated 90 degrees + ~ 131FA FE01 rotated 180 degrees 131FB EGYPTIAN HIEROGLYPH N013 131FC EGYPTIAN HIEROGLYPH N014 131FD EGYPTIAN HIEROGLYPH N015 131FE EGYPTIAN HIEROGLYPH N016 131FF EGYPTIAN HIEROGLYPH N017 + * land + * variant of 131FE 13200 EGYPTIAN HIEROGLYPH N018 + * island + * not to be confused with 132F0, 133D4, or 133F3 13201 EGYPTIAN HIEROGLYPH N018A 13202 EGYPTIAN HIEROGLYPH N018B 13203 EGYPTIAN HIEROGLYPH N019 + * logogram 'akhti' 13204 EGYPTIAN HIEROGLYPH N020 13205 EGYPTIAN HIEROGLYPH N021 13206 EGYPTIAN HIEROGLYPH N022 @@ -37278,10 +37677,13 @@ FFFF 13208 EGYPTIAN HIEROGLYPH N024 13209 EGYPTIAN HIEROGLYPH N025 1320A EGYPTIAN HIEROGLYPH N025A + * stylistic variant, use of 13209 is preferred 1320B EGYPTIAN HIEROGLYPH N026 1320C EGYPTIAN HIEROGLYPH N027 1320D EGYPTIAN HIEROGLYPH N028 1320E EGYPTIAN HIEROGLYPH N029 + * hill + * not to be confused with 133D8 * transliterated as q or as 1E33 x (hebrew letter qof - 05E7) x (arabic letter qaf - 0642) @@ -37289,21 +37691,34 @@ FFFF 13210 EGYPTIAN HIEROGLYPH N031 13211 EGYPTIAN HIEROGLYPH N032 13212 EGYPTIAN HIEROGLYPH N033 + * classifier 'granule, grain' + * not to be confused with 130C9 13213 EGYPTIAN HIEROGLYPH N033A + * classifier 'granules, grains' + * not to be confused with 133E7 13214 EGYPTIAN HIEROGLYPH N034 13215 EGYPTIAN HIEROGLYPH N034A + * stylistic variant, use of 13214 is preferred 13216 EGYPTIAN HIEROGLYPH N035 * transliterated as n + ~ 13216 FE02 rotated 270 degrees 13217 EGYPTIAN HIEROGLYPH N035A + * classifier 'liquid' 13218 EGYPTIAN HIEROGLYPH N036 13219 EGYPTIAN HIEROGLYPH N037 + * lake * transliterated as 0161 + * not to be confused with 1328C 1321A EGYPTIAN HIEROGLYPH N037A + * variant of 13219 1321B EGYPTIAN HIEROGLYPH N038 + * variant of 13219 1321C EGYPTIAN HIEROGLYPH N039 + * variant of 13219 1321D EGYPTIAN HIEROGLYPH N040 1321E EGYPTIAN HIEROGLYPH N041 1321F EGYPTIAN HIEROGLYPH N042 + * variant of 1321E @ NL. Nomes of Lower Egypt 13220 EGYPTIAN HIEROGLYPH NL001 13221 EGYPTIAN HIEROGLYPH NL002 @@ -37365,7 +37780,9 @@ FFFF x (arabic letter heh - 0647) 13255 EGYPTIAN HIEROGLYPH O005 13256 EGYPTIAN HIEROGLYPH O005A + * mirrored version of 13255 13257 EGYPTIAN HIEROGLYPH O006 + ~ 13257 FE01 rotated 180 degrees 13258 EGYPTIAN HIEROGLYPH O006A * beginning of hwt or serekh enclosure x (egyptian hieroglyph o033a - 13282) @@ -37409,12 +37826,19 @@ FFFF 13279 EGYPTIAN HIEROGLYPH O027 1327A EGYPTIAN HIEROGLYPH O028 1327B EGYPTIAN HIEROGLYPH O029 + ~ 1327B FE02 rotated 270 degrees 1327C EGYPTIAN HIEROGLYPH O029A + * rotated variant of 1327B 1327D EGYPTIAN HIEROGLYPH O030 + * supporting pole + * not to be confused with 13361 1327E EGYPTIAN HIEROGLYPH O030A 1327F EGYPTIAN HIEROGLYPH O031 + ~ 1327F FE00 rotated 90 degrees + ~ 1327F FE01 rotated 180 degrees 13280 EGYPTIAN HIEROGLYPH O032 13281 EGYPTIAN HIEROGLYPH O033 + * classifier 'serekh' 13282 EGYPTIAN HIEROGLYPH O033A * end of serekh enclosure x (egyptian hieroglyph o006a - 13258) @@ -37423,6 +37847,7 @@ FFFF x (egyptian hieroglyph s029 - 132F4) 13284 EGYPTIAN HIEROGLYPH O035 13285 EGYPTIAN HIEROGLYPH O036 + ~ 13285 FE00 rotated 90 degrees 13286 EGYPTIAN HIEROGLYPH O036A * beginning of fortified wall cartouche 13287 EGYPTIAN HIEROGLYPH O036B @@ -37434,10 +37859,14 @@ FFFF 1328A EGYPTIAN HIEROGLYPH O037 1328B EGYPTIAN HIEROGLYPH O038 1328C EGYPTIAN HIEROGLYPH O039 + * stone, brick + * not to be confused with 13219 + ~ 1328C FE00 rotated 90 degrees 1328D EGYPTIAN HIEROGLYPH O040 1328E EGYPTIAN HIEROGLYPH O041 1328F EGYPTIAN HIEROGLYPH O042 13290 EGYPTIAN HIEROGLYPH O043 + * older variant of 1328F 13291 EGYPTIAN HIEROGLYPH O044 13292 EGYPTIAN HIEROGLYPH O045 13293 EGYPTIAN HIEROGLYPH O046 @@ -37447,26 +37876,36 @@ FFFF 13297 EGYPTIAN HIEROGLYPH O050 13298 EGYPTIAN HIEROGLYPH O050A 13299 EGYPTIAN HIEROGLYPH O050B + * mirrored version of 13298 1329A EGYPTIAN HIEROGLYPH O051 @ P. Ships and parts of ships 1329B EGYPTIAN HIEROGLYPH P001 + * classifier 'ship, travel' 1329C EGYPTIAN HIEROGLYPH P001A + * classifier 'upset, overturn' 1329D EGYPTIAN HIEROGLYPH P002 1329E EGYPTIAN HIEROGLYPH P003 + * sacred ship 1329F EGYPTIAN HIEROGLYPH P003A + * mirrored variant of 1329E 132A0 EGYPTIAN HIEROGLYPH P004 132A1 EGYPTIAN HIEROGLYPH P005 132A2 EGYPTIAN HIEROGLYPH P006 132A3 EGYPTIAN HIEROGLYPH P007 132A4 EGYPTIAN HIEROGLYPH P008 + ~ 132A4 FE01 rotated 180 degrees + ~ 132A4 FE02 rotated 270 degrees 132A5 EGYPTIAN HIEROGLYPH P009 132A6 EGYPTIAN HIEROGLYPH P010 132A7 EGYPTIAN HIEROGLYPH P011 + * mooring post + * not to be confused with 131E9 or 1342A @ Q. Domestic and funerary furniture 132A8 EGYPTIAN HIEROGLYPH Q001 132A9 EGYPTIAN HIEROGLYPH Q002 132AA EGYPTIAN HIEROGLYPH Q003 * transliterated as p + ~ 132AA FE00 rotated 90 degrees 132AB EGYPTIAN HIEROGLYPH Q004 132AC EGYPTIAN HIEROGLYPH Q005 132AD EGYPTIAN HIEROGLYPH Q006 @@ -37501,6 +37940,7 @@ FFFF 132C9 EGYPTIAN HIEROGLYPH R022 132CA EGYPTIAN HIEROGLYPH R023 132CB EGYPTIAN HIEROGLYPH R024 + ~ 132CB FE00 rotated 90 degrees 132CC EGYPTIAN HIEROGLYPH R025 132CD EGYPTIAN HIEROGLYPH R026 132CE EGYPTIAN HIEROGLYPH R027 @@ -37519,6 +37959,7 @@ FFFF 132DA EGYPTIAN HIEROGLYPH S008 132DB EGYPTIAN HIEROGLYPH S009 132DC EGYPTIAN HIEROGLYPH S010 + ~ 132DC FE00 rotated 90 degrees 132DD EGYPTIAN HIEROGLYPH S011 132DE EGYPTIAN HIEROGLYPH S012 132DF EGYPTIAN HIEROGLYPH S013 @@ -37530,8 +37971,11 @@ FFFF 132E5 EGYPTIAN HIEROGLYPH S017 132E6 EGYPTIAN HIEROGLYPH S017A 132E7 EGYPTIAN HIEROGLYPH S018 + ~ 132E7 FE00 rotated 90 degrees + ~ 132E7 FE02 rotated 270 degrees 132E8 EGYPTIAN HIEROGLYPH S019 132E9 EGYPTIAN HIEROGLYPH S020 + ~ 132E9 FE02 rotated 270 degrees 132EA EGYPTIAN HIEROGLYPH S021 132EB EGYPTIAN HIEROGLYPH S022 132EC EGYPTIAN HIEROGLYPH S023 @@ -37539,6 +37983,8 @@ FFFF 132EE EGYPTIAN HIEROGLYPH S025 132EF EGYPTIAN HIEROGLYPH S026 132F0 EGYPTIAN HIEROGLYPH S026A + * loin-cloth + * not to be confused with 13200, 133D4, or 133F3 132F1 EGYPTIAN HIEROGLYPH S026B 132F2 EGYPTIAN HIEROGLYPH S027 132F3 EGYPTIAN HIEROGLYPH S028 @@ -37549,24 +37995,36 @@ FFFF 132F6 EGYPTIAN HIEROGLYPH S031 132F7 EGYPTIAN HIEROGLYPH S032 132F8 EGYPTIAN HIEROGLYPH S033 + ~ 132F8 FE02 rotated 270 degrees 132F9 EGYPTIAN HIEROGLYPH S034 132FA EGYPTIAN HIEROGLYPH S035 132FB EGYPTIAN HIEROGLYPH S035A + * variant of 132FA 132FC EGYPTIAN HIEROGLYPH S036 + * older variant of 132FA 132FD EGYPTIAN HIEROGLYPH S037 + ~ 132FD FE02 rotated 270 degrees 132FE EGYPTIAN HIEROGLYPH S038 132FF EGYPTIAN HIEROGLYPH S039 13300 EGYPTIAN HIEROGLYPH S040 + * phonogram 'wꜣs' 13301 EGYPTIAN HIEROGLYPH S041 + * phonogram 'ḏꜣm' 13302 EGYPTIAN HIEROGLYPH S042 + ~ 13302 FE02 rotated 270 degrees 13303 EGYPTIAN HIEROGLYPH S043 + ~ 13303 FE02 rotated 270 degrees 13304 EGYPTIAN HIEROGLYPH S044 13305 EGYPTIAN HIEROGLYPH S045 13306 EGYPTIAN HIEROGLYPH S046 @ T. Warfare, hunting, butchery 13307 EGYPTIAN HIEROGLYPH T001 + ~ 13307 FE00 rotated 90 degrees 13308 EGYPTIAN HIEROGLYPH T002 + * classifier 'striking, hitting' + ~ 13308 FE01 rotated 180 degrees 13309 EGYPTIAN HIEROGLYPH T003 + * classifier 'mace' 1330A EGYPTIAN HIEROGLYPH T003A 1330B EGYPTIAN HIEROGLYPH T004 1330C EGYPTIAN HIEROGLYPH T005 @@ -37574,51 +38032,86 @@ FFFF 1330E EGYPTIAN HIEROGLYPH T007 1330F EGYPTIAN HIEROGLYPH T007A 13310 EGYPTIAN HIEROGLYPH T008 + * older variant of 13311 + ~ 13310 FE02 rotated 270 degrees 13311 EGYPTIAN HIEROGLYPH T008A + ~ 13311 FE02 rotated 270 degrees 13312 EGYPTIAN HIEROGLYPH T009 + ~ 13312 FE01 rotated 180 degrees + ~ 13312 FE02 rotated 270 degrees 13313 EGYPTIAN HIEROGLYPH T009A + * older variant of 13312 + ~ 13313 FE01 rotated 180 degrees + ~ 13313 FE02 rotated 270 degrees 13314 EGYPTIAN HIEROGLYPH T010 + ~ 13314 FE01 rotated 180 degrees + ~ 13314 FE02 rotated 270 degrees 13315 EGYPTIAN HIEROGLYPH T011 13316 EGYPTIAN HIEROGLYPH T011A 13317 EGYPTIAN HIEROGLYPH T012 13318 EGYPTIAN HIEROGLYPH T013 13319 EGYPTIAN HIEROGLYPH T014 1331A EGYPTIAN HIEROGLYPH T015 + * older variant of 13319 1331B EGYPTIAN HIEROGLYPH T016 + ~ 1331B FE00 rotated 90 degrees + ~ 1331B FE01 rotated 180 degrees 1331C EGYPTIAN HIEROGLYPH T016A + ~ 1331C FE02 rotated 270 degrees 1331D EGYPTIAN HIEROGLYPH T017 1331E EGYPTIAN HIEROGLYPH T018 1331F EGYPTIAN HIEROGLYPH T019 13320 EGYPTIAN HIEROGLYPH T020 + * older variant of 1331F 13321 EGYPTIAN HIEROGLYPH T021 + ~ 13321 FE01 rotated 180 degrees + ~ 13321 FE02 rotated 270 degrees 13322 EGYPTIAN HIEROGLYPH T022 + ~ 13322 FE00 rotated 90 degrees + ~ 13322 FE01 rotated 180 degrees 13323 EGYPTIAN HIEROGLYPH T023 + * more recent variant of 13322 13324 EGYPTIAN HIEROGLYPH T024 13325 EGYPTIAN HIEROGLYPH T025 13326 EGYPTIAN HIEROGLYPH T026 13327 EGYPTIAN HIEROGLYPH T027 + * older variant of 13326 13328 EGYPTIAN HIEROGLYPH T028 13329 EGYPTIAN HIEROGLYPH T029 1332A EGYPTIAN HIEROGLYPH T030 + * classifier 'knife, cutting' 1332B EGYPTIAN HIEROGLYPH T031 + * phonogram 'sšm' 1332C EGYPTIAN HIEROGLYPH T032 1332D EGYPTIAN HIEROGLYPH T032A 1332E EGYPTIAN HIEROGLYPH T033 + * older variant of 13326 1332F EGYPTIAN HIEROGLYPH T033A 13330 EGYPTIAN HIEROGLYPH T034 13331 EGYPTIAN HIEROGLYPH T035 + * variant of 13330 + ~ 13331 FE01 rotated 180 degrees + ~ 13331 FE02 rotated 270 degrees 13332 EGYPTIAN HIEROGLYPH T036 @ U. Agriculture, crafts, and professions 13333 EGYPTIAN HIEROGLYPH U001 13334 EGYPTIAN HIEROGLYPH U002 + * stylistic variant of 13333 13335 EGYPTIAN HIEROGLYPH U003 13336 EGYPTIAN HIEROGLYPH U004 13337 EGYPTIAN HIEROGLYPH U005 + * stylistic variant of 13336 13338 EGYPTIAN HIEROGLYPH U006 13339 EGYPTIAN HIEROGLYPH U006A + * stylistic variant of 13338 1333A EGYPTIAN HIEROGLYPH U006B + * mirrored version of 13339 1333B EGYPTIAN HIEROGLYPH U007 + * variant of 13338 + ~ 1333B FE00 rotated 90 degrees 1333C EGYPTIAN HIEROGLYPH U008 + * variant of 1333B + ~ 1333C FE00 rotated 90 degrees 1333D EGYPTIAN HIEROGLYPH U009 1333E EGYPTIAN HIEROGLYPH U010 1333F EGYPTIAN HIEROGLYPH U011 @@ -37629,18 +38122,25 @@ FFFF 13344 EGYPTIAN HIEROGLYPH U016 13345 EGYPTIAN HIEROGLYPH U017 13346 EGYPTIAN HIEROGLYPH U018 + * variant of 13345 13347 EGYPTIAN HIEROGLYPH U019 13348 EGYPTIAN HIEROGLYPH U020 + * older variant of 13347 13349 EGYPTIAN HIEROGLYPH U021 1334A EGYPTIAN HIEROGLYPH U022 + ~ 1334A FE02 rotated 270 degrees 1334B EGYPTIAN HIEROGLYPH U023 1334C EGYPTIAN HIEROGLYPH U023A + * stylistic variant of 1334B 1334D EGYPTIAN HIEROGLYPH U024 1334E EGYPTIAN HIEROGLYPH U025 + * older variant of 1334D 1334F EGYPTIAN HIEROGLYPH U026 13350 EGYPTIAN HIEROGLYPH U027 + * older variant of 1334F 13351 EGYPTIAN HIEROGLYPH U028 13352 EGYPTIAN HIEROGLYPH U029 + * older variant of 13351 13353 EGYPTIAN HIEROGLYPH U029A 13354 EGYPTIAN HIEROGLYPH U030 13355 EGYPTIAN HIEROGLYPH U031 @@ -37654,11 +38154,17 @@ FFFF 1335D EGYPTIAN HIEROGLYPH U038 1335E EGYPTIAN HIEROGLYPH U039 1335F EGYPTIAN HIEROGLYPH U040 + * cursive variant of 1335E 13360 EGYPTIAN HIEROGLYPH U041 13361 EGYPTIAN HIEROGLYPH U042 + * pitchfork + * not to be confused with 1327D + ~ 13361 FE02 rotated 270 degrees @ V. Rope, fiber, baskets, bags, etc. 13362 EGYPTIAN HIEROGLYPH V001 * 100 + * classifier 'cord, rope' + * not to be confused with 133F2 13363 EGYPTIAN HIEROGLYPH V001A * 200 13364 EGYPTIAN HIEROGLYPH V001B @@ -37683,13 +38189,21 @@ FFFF 1336F EGYPTIAN HIEROGLYPH V004 13370 EGYPTIAN HIEROGLYPH V005 13371 EGYPTIAN HIEROGLYPH V006 + * phonogram 'šs' 13372 EGYPTIAN HIEROGLYPH V007 + * phonogram 'šn' 13373 EGYPTIAN HIEROGLYPH V007A + ~ 13373 FE02 rotated 270 degrees 13374 EGYPTIAN HIEROGLYPH V007B 13375 EGYPTIAN HIEROGLYPH V008 13376 EGYPTIAN HIEROGLYPH V009 13377 EGYPTIAN HIEROGLYPH V010 + * logogram 'name' + ~ 13377 FE00 rotated 90 degrees 13378 EGYPTIAN HIEROGLYPH V011 + * classifier 'restrain, split' + x (egyptian hieroglyph v011d - 1342F) + ~ 13378 FE00 rotated 90 degrees 13379 EGYPTIAN HIEROGLYPH V011A * beginning of cartouche 1337A EGYPTIAN HIEROGLYPH V011B @@ -37698,19 +38212,25 @@ FFFF * end of knotless cartouche 1337C EGYPTIAN HIEROGLYPH V012 1337D EGYPTIAN HIEROGLYPH V012A + ~ 1337D FE02 rotated 270 degrees 1337E EGYPTIAN HIEROGLYPH V012B 1337F EGYPTIAN HIEROGLYPH V013 * transliterated as 1E6F 13380 EGYPTIAN HIEROGLYPH V014 + * variant of 1337F 13381 EGYPTIAN HIEROGLYPH V015 13382 EGYPTIAN HIEROGLYPH V016 13383 EGYPTIAN HIEROGLYPH V017 13384 EGYPTIAN HIEROGLYPH V018 + * older variant of 13383 13385 EGYPTIAN HIEROGLYPH V019 + ~ 13385 FE02 rotated 270 degrees 13386 EGYPTIAN HIEROGLYPH V020 * 10 + * not to be confused with 133AD 13387 EGYPTIAN HIEROGLYPH V020A * 20 + * not to be confused with 133AE 13388 EGYPTIAN HIEROGLYPH V020B * 30 13389 EGYPTIAN HIEROGLYPH V020C @@ -37727,20 +38247,29 @@ FFFF * 90 1338F EGYPTIAN HIEROGLYPH V020I * 20 + * variant of 13387 13390 EGYPTIAN HIEROGLYPH V020J * 30 + * variant of 13388 13391 EGYPTIAN HIEROGLYPH V020K * 40 + * variant of 13389 13392 EGYPTIAN HIEROGLYPH V020L * 50 + * variant of 1338A 13393 EGYPTIAN HIEROGLYPH V021 13394 EGYPTIAN HIEROGLYPH V022 13395 EGYPTIAN HIEROGLYPH V023 + * older variant of 13394 13396 EGYPTIAN HIEROGLYPH V023A 13397 EGYPTIAN HIEROGLYPH V024 13398 EGYPTIAN HIEROGLYPH V025 + * more recent variant of 13397 13399 EGYPTIAN HIEROGLYPH V026 + ~ 13399 FE00 rotated 90 degrees 1339A EGYPTIAN HIEROGLYPH V027 + * older variant of 13399 + ~ 1339A FE00 rotated 90 degrees 1339B EGYPTIAN HIEROGLYPH V028 * transliterated as 1E25 x (arabic letter hah - 062D) @@ -37749,30 +38278,40 @@ FFFF 1339E EGYPTIAN HIEROGLYPH V029A 1339F EGYPTIAN HIEROGLYPH V030 133A0 EGYPTIAN HIEROGLYPH V030A + * stylistic variant, use of 1339F is preferred 133A1 EGYPTIAN HIEROGLYPH V031 * transliterated as k x (hebrew letter kaf - 05DB) x (arabic letter kaf - 0643) 133A2 EGYPTIAN HIEROGLYPH V031A + * from hieratic 133A3 EGYPTIAN HIEROGLYPH V032 133A4 EGYPTIAN HIEROGLYPH V033 133A5 EGYPTIAN HIEROGLYPH V033A 133A6 EGYPTIAN HIEROGLYPH V034 + * more recent variant of 133A4 133A7 EGYPTIAN HIEROGLYPH V035 133A8 EGYPTIAN HIEROGLYPH V036 133A9 EGYPTIAN HIEROGLYPH V037 133AA EGYPTIAN HIEROGLYPH V037A 133AB EGYPTIAN HIEROGLYPH V038 + * bandage + * not to be confused with 1308B 133AC EGYPTIAN HIEROGLYPH V039 133AD EGYPTIAN HIEROGLYPH V040 * 10 in dates + * not to be confused with 13386 133AE EGYPTIAN HIEROGLYPH V040A * 20 in dates + * not to be confused with 13387 @ W. Vessels of stone and earthenware 133AF EGYPTIAN HIEROGLYPH W001 + ~ 133AF FE02 rotated 270 degrees 133B0 EGYPTIAN HIEROGLYPH W002 + ~ 133B0 FE02 rotated 270 degrees 133B1 EGYPTIAN HIEROGLYPH W003 133B2 EGYPTIAN HIEROGLYPH W003A + * stylistic variant, use of 133B1 is preferred 133B3 EGYPTIAN HIEROGLYPH W004 133B4 EGYPTIAN HIEROGLYPH W005 133B5 EGYPTIAN HIEROGLYPH W006 @@ -37780,93 +38319,142 @@ FFFF 133B7 EGYPTIAN HIEROGLYPH W008 133B8 EGYPTIAN HIEROGLYPH W009 133B9 EGYPTIAN HIEROGLYPH W009A + * mirrored version of 133B8 133BA EGYPTIAN HIEROGLYPH W010 133BB EGYPTIAN HIEROGLYPH W010A 133BC EGYPTIAN HIEROGLYPH W011 * transliterated as g 133BD EGYPTIAN HIEROGLYPH W012 + * older variant of 133BC 133BE EGYPTIAN HIEROGLYPH W013 133BF EGYPTIAN HIEROGLYPH W014 + ~ 133BF FE02 rotated 270 degrees 133C0 EGYPTIAN HIEROGLYPH W014A 133C1 EGYPTIAN HIEROGLYPH W015 133C2 EGYPTIAN HIEROGLYPH W016 133C3 EGYPTIAN HIEROGLYPH W017 133C4 EGYPTIAN HIEROGLYPH W017A + * cursive variant of 133C3 133C5 EGYPTIAN HIEROGLYPH W018 + * older variant of 133C3 133C6 EGYPTIAN HIEROGLYPH W018A + * cursive variant of 133C5 133C7 EGYPTIAN HIEROGLYPH W019 133C8 EGYPTIAN HIEROGLYPH W020 133C9 EGYPTIAN HIEROGLYPH W021 133CA EGYPTIAN HIEROGLYPH W022 133CB EGYPTIAN HIEROGLYPH W023 133CC EGYPTIAN HIEROGLYPH W024 + * phonogram 'nw' 133CD EGYPTIAN HIEROGLYPH W024A + * monogram 'nw(n)' or 'nww' 133CE EGYPTIAN HIEROGLYPH W025 @ X. Loaves and cakes 133CF EGYPTIAN HIEROGLYPH X001 * transliterated as t 133D0 EGYPTIAN HIEROGLYPH X002 133D1 EGYPTIAN HIEROGLYPH X003 + * variant of 133D0 133D2 EGYPTIAN HIEROGLYPH X004 133D3 EGYPTIAN HIEROGLYPH X004A + * variant of 133D2 + ~ 133D3 FE00 rotated 90 degrees 133D4 EGYPTIAN HIEROGLYPH X004B + * cake + * variant of 133D2 + * not to be confused with 13200, 132F0, or 133F3 133D5 EGYPTIAN HIEROGLYPH X005 + * hieratic + * variant of 133D4 133D6 EGYPTIAN HIEROGLYPH X006 133D7 EGYPTIAN HIEROGLYPH X006A 133D8 EGYPTIAN HIEROGLYPH X007 + * classifier 'food' + * not to be confused with 1320E 133D9 EGYPTIAN HIEROGLYPH X008 133DA EGYPTIAN HIEROGLYPH X008A + * bread + * variant of 133D9 + * not to be confused with 131EE @ Y. Writings, games, music 133DB EGYPTIAN HIEROGLYPH Y001 133DC EGYPTIAN HIEROGLYPH Y001A + * rotated variant of 133DB 133DD EGYPTIAN HIEROGLYPH Y002 + * older variant of 133DB + ~ 133DD FE02 rotated 270 degrees 133DE EGYPTIAN HIEROGLYPH Y003 133DF EGYPTIAN HIEROGLYPH Y004 + * mirrored version of 133DE 133E0 EGYPTIAN HIEROGLYPH Y005 133E1 EGYPTIAN HIEROGLYPH Y006 133E2 EGYPTIAN HIEROGLYPH Y007 133E3 EGYPTIAN HIEROGLYPH Y008 @ Z. Strokes, signs derived from Hieratic, geometrical figures 133E4 EGYPTIAN HIEROGLYPH Z001 - x (egyptian hieroglyph z015 - 133FA) + * semogram index + * classifier 'single' + * not to be confused with 133FA 133E5 EGYPTIAN HIEROGLYPH Z002 - * plurality - x (egyptian hieroglyph z015b - 133FC) + * classifier 'plural' + * not to be confused with 133FC 133E6 EGYPTIAN HIEROGLYPH Z002A + * stylistic variant of 133E5 133E7 EGYPTIAN HIEROGLYPH Z002B + * classifier 'plural' + * not to be confused with 13213 133E8 EGYPTIAN HIEROGLYPH Z002C + * variant of 133E6 133E9 EGYPTIAN HIEROGLYPH Z002D + * variant of 133E8 133EA EGYPTIAN HIEROGLYPH Z003 + * variant of 133E5 133EB EGYPTIAN HIEROGLYPH Z003A + * variant of 133EA 133EC EGYPTIAN HIEROGLYPH Z003B - * 3 + * variant of 133E7 133ED EGYPTIAN HIEROGLYPH Z004 - * duality + * classifier 'dual' * transliterated as y x (egyptian hieroglyph m017a - 131CC) 133EE EGYPTIAN HIEROGLYPH Z004A - * duality - x (egyptian hieroglyph z015a - 133FB) + * variant of 133ED + * classifier 'dual' + * transliterated as y + * not to be confused with 133FB 133EF EGYPTIAN HIEROGLYPH Z005 133F0 EGYPTIAN HIEROGLYPH Z005A + * variant of 133EF 133F1 EGYPTIAN HIEROGLYPH Z006 133F2 EGYPTIAN HIEROGLYPH Z007 + * phonogram 'w' + * not to be confused with 13362 + ~ 133F2 FE00 rotated 90 degrees 133F3 EGYPTIAN HIEROGLYPH Z008 + * oval + * not to be confused with 13200, 132F0, or 133D4 133F4 EGYPTIAN HIEROGLYPH Z009 133F5 EGYPTIAN HIEROGLYPH Z010 + * older variant of 133F4 + ~ 133F5 FE00 rotated 90 degrees 133F6 EGYPTIAN HIEROGLYPH Z011 + ~ 133F6 FE00 rotated 90 degrees 133F7 EGYPTIAN HIEROGLYPH Z012 + * hieratic 133F8 EGYPTIAN HIEROGLYPH Z013 + * circle, unmarked round sign + * not to be confused with 13082 or 131F3 133F9 EGYPTIAN HIEROGLYPH Z014 + * hieratic 133FA EGYPTIAN HIEROGLYPH Z015 * 1 - x (egyptian hieroglyph z001 - 133E4) + * not to be confused with 133E4 133FB EGYPTIAN HIEROGLYPH Z015A * 2 - x (egyptian hieroglyph z004a - 133EE) + * not to be confused with 133EE 133FC EGYPTIAN HIEROGLYPH Z015B * 3 - x (egyptian hieroglyph z002 - 133E5) + * not to be confused with 133E5 x (egyptian hieroglyph z003 - 133EA) 133FD EGYPTIAN HIEROGLYPH Z015C * 4 @@ -37882,6 +38470,7 @@ FFFF * 9 13403 EGYPTIAN HIEROGLYPH Z015I * 5 + ~ 13403 FE00 rotated 90 degrees 13404 EGYPTIAN HIEROGLYPH Z016 * 1 in dates 13405 EGYPTIAN HIEROGLYPH Z016A @@ -37911,34 +38500,58 @@ FFFF 13412 EGYPTIAN HIEROGLYPH AA006 13413 EGYPTIAN HIEROGLYPH AA007 13414 EGYPTIAN HIEROGLYPH AA007A + * mirrored version of 13413 13415 EGYPTIAN HIEROGLYPH AA007B 13416 EGYPTIAN HIEROGLYPH AA008 + ~ 13416 FE00 rotated 90 degrees 13417 EGYPTIAN HIEROGLYPH AA009 13418 EGYPTIAN HIEROGLYPH AA010 13419 EGYPTIAN HIEROGLYPH AA011 + ~ 13419 FE00 rotated 90 degrees + ~ 13419 FE01 rotated 180 degrees + ~ 13419 FE02 rotated 270 degrees 1341A EGYPTIAN HIEROGLYPH AA012 + * older variant of 13419 + ~ 1341A FE00 rotated 90 degrees 1341B EGYPTIAN HIEROGLYPH AA013 1341C EGYPTIAN HIEROGLYPH AA014 + * older variant of 1341B 1341D EGYPTIAN HIEROGLYPH AA015 1341E EGYPTIAN HIEROGLYPH AA016 + * variant of 1341D 1341F EGYPTIAN HIEROGLYPH AA017 13420 EGYPTIAN HIEROGLYPH AA018 + * more recent variant of 1341F 13421 EGYPTIAN HIEROGLYPH AA019 13422 EGYPTIAN HIEROGLYPH AA020 13423 EGYPTIAN HIEROGLYPH AA021 + ~ 13423 FE00 rotated 90 degrees 13424 EGYPTIAN HIEROGLYPH AA022 13425 EGYPTIAN HIEROGLYPH AA023 13426 EGYPTIAN HIEROGLYPH AA024 + * older variant of 13425 13427 EGYPTIAN HIEROGLYPH AA025 13428 EGYPTIAN HIEROGLYPH AA026 13429 EGYPTIAN HIEROGLYPH AA027 1342A EGYPTIAN HIEROGLYPH AA028 + * phonogram 'qd' + * not to be confused with 131E9 and 132A7 1342B EGYPTIAN HIEROGLYPH AA029 + * older variant of 1342A 1342C EGYPTIAN HIEROGLYPH AA030 + ~ 1342C FE02 rotated 270 degrees 1342D EGYPTIAN HIEROGLYPH AA031 + * older variant of 1342C 1342E EGYPTIAN HIEROGLYPH AA032 -@@ 13430 Egyptian Hieroglyph Format Controls 1343F -@+ These format controls are used to render Egyptian hieroglyphic quadrats. + ~ 1342E FE02 rotated 270 degrees +@ Addition to group V +@+ This is part of the cartouche set: 13379, 1337A, 1337B, and 1342F. +1342F EGYPTIAN HIEROGLYPH V011D + * knotted beginning of cartouche + * not to be confused with 13378 +@~ ! +@@ 13430 Egyptian Hieroglyph Format Controls 1345F +@+ These format controls are used to render Egyptian hieroglyphic spatial arrangements, including quadrats, overlays, insertions, and blank, lost or damaged sections. @ Joiners 13430 EGYPTIAN HIEROGLYPH VERTICAL JOINER = sign separator: subordination (Manuel de Codage) @@ -37954,6 +38567,45 @@ FFFF @ Segment scoping delimiters 13437 EGYPTIAN HIEROGLYPH BEGIN SEGMENT 13438 EGYPTIAN HIEROGLYPH END SEGMENT +@ Sign insertion controls +13439 EGYPTIAN HIEROGLYPH INSERT AT MIDDLE +1343A EGYPTIAN HIEROGLYPH INSERT AT TOP +1343B EGYPTIAN HIEROGLYPH INSERT AT BOTTOM +@ Enclosure controls +1343C EGYPTIAN HIEROGLYPH BEGIN ENCLOSURE +1343D EGYPTIAN HIEROGLYPH END ENCLOSURE +1343E EGYPTIAN HIEROGLYPH BEGIN WALLED ENCLOSURE +1343F EGYPTIAN HIEROGLYPH END WALLED ENCLOSURE +@ Mirror control +13440 EGYPTIAN HIEROGLYPH MIRROR HORIZONTALLY +@ Blank and lost signs +13441 EGYPTIAN HIEROGLYPH FULL BLANK +13442 EGYPTIAN HIEROGLYPH HALF BLANK +13443 EGYPTIAN HIEROGLYPH LOST SIGN + ~ 13443 FE00 expanded +13444 EGYPTIAN HIEROGLYPH HALF LOST SIGN + ~ 13444 FE00 expanded +13445 EGYPTIAN HIEROGLYPH TALL LOST SIGN + ~ 13445 FE00 expanded +13446 EGYPTIAN HIEROGLYPH WIDE LOST SIGN + ~ 13446 FE00 expanded +@ Damage modifiers +13447 EGYPTIAN HIEROGLYPH MODIFIER DAMAGED AT TOP START +13448 EGYPTIAN HIEROGLYPH MODIFIER DAMAGED AT BOTTOM START +13449 EGYPTIAN HIEROGLYPH MODIFIER DAMAGED AT START +1344A EGYPTIAN HIEROGLYPH MODIFIER DAMAGED AT TOP END +1344B EGYPTIAN HIEROGLYPH MODIFIER DAMAGED AT TOP +1344C EGYPTIAN HIEROGLYPH MODIFIER DAMAGED AT BOTTOM START AND TOP END +1344D EGYPTIAN HIEROGLYPH MODIFIER DAMAGED AT START AND TOP +1344E EGYPTIAN HIEROGLYPH MODIFIER DAMAGED AT BOTTOM END +1344F EGYPTIAN HIEROGLYPH MODIFIER DAMAGED AT TOP START AND BOTTOM END +13450 EGYPTIAN HIEROGLYPH MODIFIER DAMAGED AT BOTTOM +13451 EGYPTIAN HIEROGLYPH MODIFIER DAMAGED AT START AND BOTTOM +13452 EGYPTIAN HIEROGLYPH MODIFIER DAMAGED AT END +13453 EGYPTIAN HIEROGLYPH MODIFIER DAMAGED AT TOP AND END +13454 EGYPTIAN HIEROGLYPH MODIFIER DAMAGED AT BOTTOM AND END +13455 EGYPTIAN HIEROGLYPH MODIFIER DAMAGED +@~ ! @@ 14400 Anatolian Hieroglyphs 1467F @+ In the names list, most of the comments are in Latin. Those which have a Luwian phonetic value are identified as syllabic. @ A. The human body and clothing @@ -41373,6 +42025,7 @@ FFFF 18BDC KHITAN SMALL SCRIPT CHARACTER-18BDC 18BDD KHITAN SMALL SCRIPT CHARACTER-18BDD 18BDE KHITAN SMALL SCRIPT CHARACTER-18BDE + x (khitan small script character-18cca - 18CCA) 18BDF KHITAN SMALL SCRIPT CHARACTER-18BDF 18BE0 KHITAN SMALL SCRIPT CHARACTER-18BE0 18BE1 KHITAN SMALL SCRIPT CHARACTER-18BE1 @@ -41621,6 +42274,7 @@ FFFF 18CC8 KHITAN SMALL SCRIPT CHARACTER-18CC8 18CC9 KHITAN SMALL SCRIPT CHARACTER-18CC9 18CCA KHITAN SMALL SCRIPT CHARACTER-18CCA + x (khitan small script character-18bde - 18BDE) 18CCB KHITAN SMALL SCRIPT CHARACTER-18CCB @ Radical-19 18CCC KHITAN SMALL SCRIPT CHARACTER-18CCC @@ -41639,7 +42293,6 @@ FFFF @+ This block contains tone marks occasionally used in furigana extensions to annotate Minnan Chinese. @ Tone marks 1AFF0 KATAKANA LETTER MINNAN TONE-2 - * also used for tone six 1AFF1 KATAKANA LETTER MINNAN TONE-3 1AFF2 KATAKANA LETTER MINNAN TONE-4 1AFF3 KATAKANA LETTER MINNAN TONE-5 @@ -41648,7 +42301,6 @@ FFFF @ Nasalized tone marks 1AFF7 KATAKANA LETTER MINNAN NASALIZED TONE-1 1AFF8 KATAKANA LETTER MINNAN NASALIZED TONE-2 - * also used for tone six 1AFF9 KATAKANA LETTER MINNAN NASALIZED TONE-3 1AFFA KATAKANA LETTER MINNAN NASALIZED TONE-4 1AFFB KATAKANA LETTER MINNAN NASALIZED TONE-5 @@ -42243,10 +42895,12 @@ FFFF 1B122 KATAKANA LETTER ARCHAIC WU @@ 1B130 Small Kana Extension 1B16F @ Historic small hiragana letters +1B132 HIRAGANA LETTER SMALL KO 1B150 HIRAGANA LETTER SMALL WI 1B151 HIRAGANA LETTER SMALL WE 1B152 HIRAGANA LETTER SMALL WO @ Historic small katakana letters +1B155 KATAKANA LETTER SMALL KO 1B164 KATAKANA LETTER SMALL WI 1B165 KATAKANA LETTER SMALL WE 1B166 KATAKANA LETTER SMALL WO @@ -44132,6 +44786,28 @@ FFFF 1D244 COMBINING GREEK MUSICAL PENTASEME x (metrical pentaseme - 23D9) 1D245 GREEK MUSICAL LEIMMA +@@ 1D2C0 Kaktovik Numerals 1D2DF +@ Numerals +1D2C0 KAKTOVIK NUMERAL ZERO +1D2C1 KAKTOVIK NUMERAL ONE +1D2C2 KAKTOVIK NUMERAL TWO +1D2C3 KAKTOVIK NUMERAL THREE +1D2C4 KAKTOVIK NUMERAL FOUR +1D2C5 KAKTOVIK NUMERAL FIVE +1D2C6 KAKTOVIK NUMERAL SIX +1D2C7 KAKTOVIK NUMERAL SEVEN +1D2C8 KAKTOVIK NUMERAL EIGHT +1D2C9 KAKTOVIK NUMERAL NINE +1D2CA KAKTOVIK NUMERAL TEN +1D2CB KAKTOVIK NUMERAL ELEVEN +1D2CC KAKTOVIK NUMERAL TWELVE +1D2CD KAKTOVIK NUMERAL THIRTEEN +1D2CE KAKTOVIK NUMERAL FOURTEEN +1D2CF KAKTOVIK NUMERAL FIFTEEN +1D2D0 KAKTOVIK NUMERAL SIXTEEN +1D2D1 KAKTOVIK NUMERAL SEVENTEEN +1D2D2 KAKTOVIK NUMERAL EIGHTEEN +1D2D3 KAKTOVIK NUMERAL NINETEEN @@ 1D2E0 Mayan Numerals 1D2FF @ Mayan numerals 1D2E0 MAYAN NUMERAL ZERO @@ -47147,6 +47823,13 @@ FFFF 1DF1D LATIN SMALL LETTER C WITH RETROFLEX HOOK @ IPA extension 1DF1E LATIN SMALL LETTER S WITH CURL +@ Letters for Malayalam transliteration +1DF25 LATIN SMALL LETTER D WITH MID-HEIGHT LEFT HOOK +1DF26 LATIN SMALL LETTER L WITH MID-HEIGHT LEFT HOOK +1DF27 LATIN SMALL LETTER N WITH MID-HEIGHT LEFT HOOK +1DF28 LATIN SMALL LETTER R WITH MID-HEIGHT LEFT HOOK +1DF29 LATIN SMALL LETTER S WITH MID-HEIGHT LEFT HOOK +1DF2A LATIN SMALL LETTER T WITH MID-HEIGHT LEFT HOOK @@ 1E000 Glagolitic Supplement 1E02F @ Combining letters 1E000 COMBINING GLAGOLITIC LETTER AZU @@ -47187,6 +47870,140 @@ FFFF 1E028 COMBINING GLAGOLITIC LETTER BIG YUS 1E029 COMBINING GLAGOLITIC LETTER IOTATED BIG YUS 1E02A COMBINING GLAGOLITIC LETTER FITA +@@ 1E030 Cyrillic Extended-D 1E08F +@+ These are phonetic extensions, used in a manner analogous to IPA. Additional Cyrillic modifier letters are found in other blocks. + x (modifier letter cyrillic en - 1D78) + x (modifier letter cyrillic hard sign - A69C) + x (modifier letter cyrillic soft sign - A69D) +@ Superscript modifier letters +1E030 MODIFIER LETTER CYRILLIC SMALL A + # 0430 +1E031 MODIFIER LETTER CYRILLIC SMALL BE + # 0431 +1E032 MODIFIER LETTER CYRILLIC SMALL VE + # 0432 +1E033 MODIFIER LETTER CYRILLIC SMALL GHE + # 0433 +1E034 MODIFIER LETTER CYRILLIC SMALL DE + # 0434 +1E035 MODIFIER LETTER CYRILLIC SMALL IE + # 0435 +1E036 MODIFIER LETTER CYRILLIC SMALL ZHE + # 0436 +1E037 MODIFIER LETTER CYRILLIC SMALL ZE + # 0437 +1E038 MODIFIER LETTER CYRILLIC SMALL I + # 0438 +1E039 MODIFIER LETTER CYRILLIC SMALL KA + # 043A +1E03A MODIFIER LETTER CYRILLIC SMALL EL + # 043B +1E03B MODIFIER LETTER CYRILLIC SMALL EM + # 043C +1E03C MODIFIER LETTER CYRILLIC SMALL O + # 043E +1E03D MODIFIER LETTER CYRILLIC SMALL PE + # 043F +1E03E MODIFIER LETTER CYRILLIC SMALL ER + # 0440 +1E03F MODIFIER LETTER CYRILLIC SMALL ES + # 0441 +1E040 MODIFIER LETTER CYRILLIC SMALL TE + # 0442 +1E041 MODIFIER LETTER CYRILLIC SMALL U + # 0443 +1E042 MODIFIER LETTER CYRILLIC SMALL EF + # 0444 +1E043 MODIFIER LETTER CYRILLIC SMALL HA + # 0445 +1E044 MODIFIER LETTER CYRILLIC SMALL TSE + # 0446 +1E045 MODIFIER LETTER CYRILLIC SMALL CHE + # 0447 +1E046 MODIFIER LETTER CYRILLIC SMALL SHA + # 0448 +1E047 MODIFIER LETTER CYRILLIC SMALL YERU + # 044B +1E048 MODIFIER LETTER CYRILLIC SMALL E + # 044D +1E049 MODIFIER LETTER CYRILLIC SMALL YU + # 044E +1E04A MODIFIER LETTER CYRILLIC SMALL DZZE + # A689 +1E04B MODIFIER LETTER CYRILLIC SMALL SCHWA + # 04D9 +1E04C MODIFIER LETTER CYRILLIC SMALL BYELORUSSIAN-UKRAINIAN I + # 0456 +1E04D MODIFIER LETTER CYRILLIC SMALL JE + # 0458 +1E04E MODIFIER LETTER CYRILLIC SMALL BARRED O + # 04E9 +1E04F MODIFIER LETTER CYRILLIC SMALL STRAIGHT U + # 04AF +1E050 MODIFIER LETTER CYRILLIC SMALL PALOCHKA + # 04CF +@ Subscript modifier letters +1E051 CYRILLIC SUBSCRIPT SMALL LETTER A + # 0430 +1E052 CYRILLIC SUBSCRIPT SMALL LETTER BE + # 0431 +1E053 CYRILLIC SUBSCRIPT SMALL LETTER VE + # 0432 +1E054 CYRILLIC SUBSCRIPT SMALL LETTER GHE + # 0433 +1E055 CYRILLIC SUBSCRIPT SMALL LETTER DE + # 0434 +1E056 CYRILLIC SUBSCRIPT SMALL LETTER IE + # 0435 +1E057 CYRILLIC SUBSCRIPT SMALL LETTER ZHE + # 0436 +1E058 CYRILLIC SUBSCRIPT SMALL LETTER ZE + # 0437 +1E059 CYRILLIC SUBSCRIPT SMALL LETTER I + # 0438 +1E05A CYRILLIC SUBSCRIPT SMALL LETTER KA + # 043A +1E05B CYRILLIC SUBSCRIPT SMALL LETTER EL + # 043B +1E05C CYRILLIC SUBSCRIPT SMALL LETTER O + # 043E +1E05D CYRILLIC SUBSCRIPT SMALL LETTER PE + # 043F +1E05E CYRILLIC SUBSCRIPT SMALL LETTER ES + # 0441 +1E05F CYRILLIC SUBSCRIPT SMALL LETTER U + # 0443 +1E060 CYRILLIC SUBSCRIPT SMALL LETTER EF + # 0444 +1E061 CYRILLIC SUBSCRIPT SMALL LETTER HA + # 0445 +1E062 CYRILLIC SUBSCRIPT SMALL LETTER TSE + # 0446 +1E063 CYRILLIC SUBSCRIPT SMALL LETTER CHE + # 0447 +1E064 CYRILLIC SUBSCRIPT SMALL LETTER SHA + # 0448 +1E065 CYRILLIC SUBSCRIPT SMALL LETTER HARD SIGN + # 044A +1E066 CYRILLIC SUBSCRIPT SMALL LETTER YERU + # 044B +1E067 CYRILLIC SUBSCRIPT SMALL LETTER GHE WITH UPTURN + # 0491 +1E068 CYRILLIC SUBSCRIPT SMALL LETTER BYELORUSSIAN-UKRAINIAN I + # 0456 +1E069 CYRILLIC SUBSCRIPT SMALL LETTER DZE + # 0455 +1E06A CYRILLIC SUBSCRIPT SMALL LETTER DZHE + # 045F +@ Superscript modifier letters +1E06B MODIFIER LETTER CYRILLIC SMALL ES WITH DESCENDER + # 04AB +1E06C MODIFIER LETTER CYRILLIC SMALL YERU WITH BACK YER + # A651 +1E06D MODIFIER LETTER CYRILLIC SMALL STRAIGHT U WITH STROKE + # 04B1 +@ Diacritical mark +1E08F COMBINING CYRILLIC SMALL LETTER BYELORUSSIAN-UKRAINIAN I @@ 1E100 Nyiakeng Puachue Hmong 1E14F @+ The Nyiakeng Puachue Hmong script (Nyiaj Keeb Puaj Txwm in RPA orthography) is also known as Pa Dao (Paj Ntaub) and Chervang script (Txawj Vaag). @ Consonant onsets @@ -47405,6 +48222,58 @@ FFFF 1E2FF WANCHO NGUN SIGN = rupee x (indian rupee sign - 20B9) +@@ 1E4D0 Nag Mundari 1E4FF +@ Letters +1E4D0 NAG MUNDARI LETTER O +1E4D1 NAG MUNDARI LETTER OP +1E4D2 NAG MUNDARI LETTER OL +1E4D3 NAG MUNDARI LETTER OY +1E4D4 NAG MUNDARI LETTER ONG +1E4D5 NAG MUNDARI LETTER A +1E4D6 NAG MUNDARI LETTER AJ +1E4D7 NAG MUNDARI LETTER AB +1E4D8 NAG MUNDARI LETTER ANY +1E4D9 NAG MUNDARI LETTER AH +1E4DA NAG MUNDARI LETTER I +1E4DB NAG MUNDARI LETTER IS +1E4DC NAG MUNDARI LETTER IDD +1E4DD NAG MUNDARI LETTER IT +1E4DE NAG MUNDARI LETTER IH +1E4DF NAG MUNDARI LETTER U +1E4E0 NAG MUNDARI LETTER UC +1E4E1 NAG MUNDARI LETTER UD +1E4E2 NAG MUNDARI LETTER UK +1E4E3 NAG MUNDARI LETTER UR +1E4E4 NAG MUNDARI LETTER E +1E4E5 NAG MUNDARI LETTER ENN +1E4E6 NAG MUNDARI LETTER EG +1E4E7 NAG MUNDARI LETTER EM +1E4E8 NAG MUNDARI LETTER EN +1E4E9 NAG MUNDARI LETTER ETT +1E4EA NAG MUNDARI LETTER ELL +@ Various signs +1E4EB NAG MUNDARI SIGN OJOD + * precedes modified letters such as AB or UD + * may indicate consonant gemination +1E4EC NAG MUNDARI SIGN MUHOR + * vowel nasalization +1E4ED NAG MUNDARI SIGN TOYOR + * indicates a long vowel +1E4EE NAG MUNDARI SIGN IKIR + * vowel preceded by the 'w' sound +1E4EF NAG MUNDARI SIGN SUTUH + * mostly used for close transliteration of other languages +@ Digits +1E4F0 NAG MUNDARI DIGIT ZERO +1E4F1 NAG MUNDARI DIGIT ONE +1E4F2 NAG MUNDARI DIGIT TWO +1E4F3 NAG MUNDARI DIGIT THREE +1E4F4 NAG MUNDARI DIGIT FOUR +1E4F5 NAG MUNDARI DIGIT FIVE +1E4F6 NAG MUNDARI DIGIT SIX +1E4F7 NAG MUNDARI DIGIT SEVEN +1E4F8 NAG MUNDARI DIGIT EIGHT +1E4F9 NAG MUNDARI DIGIT NINE @@ 1E7E0 Ethiopic Extended-B 1E7FF @ Syllables for Gurage 1E7E0 ETHIOPIC SYLLABLE HHYA @@ -49996,6 +50865,7 @@ FFFF x (heavy black heart - 2764) x (white heart - 1F90D) x (orange heart - 1F9E1) + x (light blue heart - 1FA75) 1F49A GREEN HEART 1F49B YELLOW HEART 1F49C PURPLE HEART @@ -51006,6 +51876,7 @@ FFFF 1F6D6 HUT 1F6D7 ELEVATOR @ Miscellaneous symbols +1F6DC WIRELESS 1F6DD PLAYGROUND SLIDE 1F6DE WHEEL 1F6DF RING BUOY @@ -51140,8 +52011,9 @@ FFFF x (alchemical symbol for sal-ammoniac - 1F739) 1F728 ALCHEMICAL SYMBOL FOR VERDIGRIS = aes viride, copper subacetate - = early astronomical symbol for earth + = astronomical symbol for earth x (circled plus - 2295) + x (earth - 2641) @ Symbols for tin and lead ore 1F729 ALCHEMICAL SYMBOL FOR TIN ORE x (jupiter - 2643) @@ -51280,10 +52152,27 @@ FFFF @ Measures 1F772 ALCHEMICAL SYMBOL FOR HALF DRAM = drachma semis + * handwritten ligature of 0292 + 00DF, typically spelled out as ʒss x (latin small letter ezh - 0292) 1F773 ALCHEMICAL SYMBOL FOR HALF OUNCE = uncia semis + * handwritten ligature of 2125 + 00DF, typically spelled out as 2125 ss x (ounce sign - 2125) +@ Other symbol +1F774 LOT OF FORTUNE + = pars fortunae + x (circled times - 2297) +@ Eclipse symbols +1F775 OCCULTATION + x (conjunction - 260C) +1F776 LUNAR ECLIPSE + x (opposition - 260D) +@ Symbols for dwarf planets +1F77B HAUMEA +1F77C MAKEMAKE +1F77D GONGGONG +1F77E QUAOAR +1F77F ORCUS @@ 1F780 Geometric Shapes Extended 1F7FF @+ These geometric shapes originate from the Webdings/Wingdings collections. @ Isosceles right triangles @@ -51437,6 +52326,9 @@ FFFF 1F7D6 NEGATIVE CIRCLED TRIANGLE 1F7D7 CIRCLED SQUARE 1F7D8 NEGATIVE CIRCLED SQUARE +@ Nine pointed star +1F7D9 NINE POINTED WHITE STAR + * commonly used by members of the Bahá'í faith @ Colored circles @+ For use with emoji. Constitute a set as follows: 26AA, 26AB, 1F534, 1F535, 1F7E0-1F7E4 1F7E0 LARGE ORANGE CIRCLE @@ -51664,7 +52556,7 @@ FFFF @ Hand symbol 1F90C PINCHED FINGERS @ Colored heart symbols -@+ For use with emoji. Constitute a set as follows: 2764, 1F499-1F49C, 1F5A4, 1F90D, 1F90E, and 1F9E1. +@+ For use with emoji. Constitute a set as follows: 2764, 1F499-1F49C, 1F5A4, 1F90D, 1F90E, 1F9E1, and 1FA75-1FA77. 1F90D WHITE HEART 1F90E BROWN HEART @ Hand symbol @@ -52184,6 +53076,11 @@ FFFF 1FA73 SHORTS 1FA74 THONG SANDAL = flip flop +@ Colored heart symbols +@+ For use with emoji. Constitute a set as follows: 2764, 1F499-1F49C, 1F5A4, 1F90D, 1F90E, 1F9E1, and 1FA75-1FA77. +1FA75 LIGHT BLUE HEART +1FA76 GREY HEART +1FA77 PINK HEART @ Medical symbols 1FA78 DROP OF BLOOD x (droplet - 1F4A7) @@ -52199,6 +53096,9 @@ FFFF 1FA84 MAGIC WAND 1FA85 PINATA 1FA86 NESTING DOLLS +@ Musical instruments +1FA87 MARACAS +1FA88 FLUTE @ Miscellaneous objects 1FA90 RINGED PLANET 1FA91 CHAIR @@ -52231,6 +53131,11 @@ FFFF 1FAAB LOW BATTERY x (battery - 1F50B) 1FAAC HAMSA +1FAAD FOLDING HAND FAN +1FAAE HAIR PICK +@ Religious symbol +1FAAF KHANDA + x (adi shakti - 262C) @ Animals and nature 1FAB0 FLY 1FAB1 WORM @@ -52243,6 +53148,10 @@ FFFF 1FAB8 CORAL 1FAB9 EMPTY NEST 1FABA NEST WITH EGGS +1FABB HYACINTH +1FABC JELLYFISH +1FABD WING +1FABF GOOSE @ Body parts 1FAC0 ANATOMICAL HEART 1FAC1 LUNGS @@ -52253,6 +53162,9 @@ FFFF x (pregnant woman - 1F930) 1FAC5 PERSON WITH CROWN x (princess - 1F478) +@ Animals and nature +1FACE MOOSE +1FACF DONKEY @ Food and drink 1FAD0 BLUEBERRIES 1FAD1 BELL PEPPER @@ -52265,6 +53177,8 @@ FFFF x (glass of milk - 1F95B) 1FAD8 BEANS 1FAD9 JAR +1FADA GINGER ROOT +1FADB PEA POD @ Faces 1FAE0 MELTING FACE 1FAE1 SALUTING FACE @@ -52276,6 +53190,8 @@ FFFF 1FAE6 BITING LIP x (lips - 1F5E2) 1FAE7 BUBBLES +@ Face +1FAE8 SHAKING FACE @ Hand symbols 1FAF0 HAND WITH INDEX FINGER AND THUMB CROSSED x (hand with index and middle fingers crossed - 1F91E) @@ -52285,6 +53201,8 @@ FFFF 1FAF4 PALM UP HAND 1FAF5 INDEX POINTING AT THE VIEWER 1FAF6 HEART HANDS +1FAF7 LEFTWARDS PUSHING HAND +1FAF8 RIGHTWARDS PUSHING HAND @@ 1FB00 Symbols for Legacy Computing 1FBFF @ Block mosaic terminal graphic characters @+ The term "sextant" refers to block mosaics divided into six parts. @@ -52601,7 +53519,7 @@ FFFF 1FFFE 1FFFF @@ 20000 CJK Unified Ideographs Extension B 2A6DF -@@ 2A700 CJK Unified Ideographs Extension C 2B738 +@@ 2A700 CJK Unified Ideographs Extension C 2B739 @@ 2B740 CJK Unified Ideographs Extension D 2B81D @@ 2B820 CJK Unified Ideographs Extension E 2CEA1 @@ 2CEB0 CJK Unified Ideographs Extension F 2EBE0 @@ -53722,6 +54640,7 @@ FFFF 2FFFE 2FFFF @@ 30000 CJK Unified Ideographs Extension G 3134A +@@ 31350 CJK Unified Ideographs Extension H 323AF @@ 3FF80 Unassigned 3FFFF @ Noncharacters @+ These codes are intended for process-internal uses. diff --git a/UnicodeJsps/src/main/resources/org/unicode/jsp/ScriptExtensions.txt b/UnicodeJsps/src/main/resources/org/unicode/jsp/ScriptExtensions.txt index 3f5cd1c0db..2f5a1727e3 100644 --- a/UnicodeJsps/src/main/resources/org/unicode/jsp/ScriptExtensions.txt +++ b/UnicodeJsps/src/main/resources/org/unicode/jsp/ScriptExtensions.txt @@ -1,11 +1,11 @@ -# ScriptExtensions-14.0.0.txt -# Date: 2021-06-04, 02:19:38 GMT -# © 2021 Unicode®, Inc. +# ScriptExtensions-15.0.0.txt +# Date: 2022-02-02, 00:57:11 GMT +# © 2022 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. -# For terms of use, see http://www.unicode.org/terms_of_use.html +# For terms of use, see https://www.unicode.org/terms_of_use.html # # Unicode Character Database -# For documentation, see http://www.unicode.org/reports/tr44/ +# For documentation, see https://www.unicode.org/reports/tr44/ # # The Script_Extensions property indicates which characters are commonly used # with more than one script, but with a limited number of scripts. diff --git a/UnicodeJsps/src/main/resources/org/unicode/jsp/StandardizedVariants.txt b/UnicodeJsps/src/main/resources/org/unicode/jsp/StandardizedVariants.txt index 5c3c0149ba..04b93de342 100644 --- a/UnicodeJsps/src/main/resources/org/unicode/jsp/StandardizedVariants.txt +++ b/UnicodeJsps/src/main/resources/org/unicode/jsp/StandardizedVariants.txt @@ -1,6 +1,6 @@ -# StandardizedVariants-14.0.0.txt -# Date: 2021-01-26, 18:20:00 GMT [KW, LI, RP] -# © 2021 Unicode®, Inc. +# StandardizedVariants-15.0.0.txt +# Date: 2022-01-28, 21:31:00 GMT [KW] +# © 2022 Unicode®, Inc. # For terms of use, see https://www.unicode.org/terms_of_use.html # # Specification of the variation sequences that are defined in the @@ -26,7 +26,7 @@ # # For more information on standardized variation sequences, # see Section 23.4, Variation Selectors, -# in The Unicode Standard, Version 14.0. +# in The Unicode Standard, Version 15.0. # # For more information on the Ideographic Variation Database, # see https://www.unicode.org/ivd/ @@ -262,6 +262,113 @@ A868 FE00; phags-pa letter reversed shaping subjoined ya; # PHAGS-PA SUBJOINED L 1888 180B; second form; final # MONGOLIAN LETTER ALI GALI I 188A 180B; second form; initial medial # MONGOLIAN LETTER ALI GALI NGA +# Egyptian hieroglyph rotational variants + +# Rotations are clockwise for when rendered normally as left-to-right. +# Rotations are counter-clockwise when text is mirrored right-to-left. + +13091 FE00; rotated 90 degrees; # EGYPTIAN HIEROGLYPH D027 +13092 FE00; rotated 90 degrees; # EGYPTIAN HIEROGLYPH D027A +13093 FE01; rotated 180 degrees; # EGYPTIAN HIEROGLYPH D028 +130A9 FE01; rotated 180 degrees; # EGYPTIAN HIEROGLYPH D047 +1310F FE00; rotated 90 degrees; # EGYPTIAN HIEROGLYPH F016 +13117 FE02; rotated 270 degrees; # EGYPTIAN HIEROGLYPH F023 +1311C FE00; rotated 90 degrees; # EGYPTIAN HIEROGLYPH F028 +13121 FE00; rotated 90 degrees; # EGYPTIAN HIEROGLYPH F032 +13127 FE00; rotated 90 degrees; # EGYPTIAN HIEROGLYPH F037A +13139 FE00; rotated 90 degrees; # EGYPTIAN HIEROGLYPH F051 +13139 FE02; rotated 270 degrees; # EGYPTIAN HIEROGLYPH F051 +13183 FE02; rotated 270 degrees; # EGYPTIAN HIEROGLYPH H005 +13187 FE01; rotated 180 degrees; # EGYPTIAN HIEROGLYPH H008 +131A0 FE00; rotated 90 degrees; # EGYPTIAN HIEROGLYPH K006 +131A0 FE02; rotated 270 degrees; # EGYPTIAN HIEROGLYPH K006 +131B1 FE00; rotated 90 degrees; # EGYPTIAN HIEROGLYPH M003 +131B1 FE01; rotated 180 degrees; # EGYPTIAN HIEROGLYPH M003 +131B8 FE00; rotated 90 degrees; # EGYPTIAN HIEROGLYPH M009 +131B9 FE00; rotated 90 degrees; # EGYPTIAN HIEROGLYPH M010 +131BA FE02; rotated 270 degrees; # EGYPTIAN HIEROGLYPH M010A +131CB FE00; rotated 90 degrees; # EGYPTIAN HIEROGLYPH M017 +131EE FE01; rotated 180 degrees; # EGYPTIAN HIEROGLYPH M044 +131EE FE02; rotated 270 degrees; # EGYPTIAN HIEROGLYPH M044 +131F8 FE01; rotated 180 degrees; # EGYPTIAN HIEROGLYPH N010 +131F9 FE00; rotated 90 degrees; # EGYPTIAN HIEROGLYPH N011 +131F9 FE01; rotated 180 degrees; # EGYPTIAN HIEROGLYPH N011 +131FA FE00; rotated 90 degrees; # EGYPTIAN HIEROGLYPH N012 +131FA FE01; rotated 180 degrees; # EGYPTIAN HIEROGLYPH N012 +13216 FE02; rotated 270 degrees; # EGYPTIAN HIEROGLYPH N035 +13257 FE01; rotated 180 degrees; # EGYPTIAN HIEROGLYPH O006 +1327B FE02; rotated 270 degrees; # EGYPTIAN HIEROGLYPH O029 +1327F FE00; rotated 90 degrees; # EGYPTIAN HIEROGLYPH O031 +1327F FE01; rotated 180 degrees; # EGYPTIAN HIEROGLYPH O031 +13285 FE00; rotated 90 degrees; # EGYPTIAN HIEROGLYPH O036 +1328C FE00; rotated 90 degrees; # EGYPTIAN HIEROGLYPH O039 +132A4 FE01; rotated 180 degrees; # EGYPTIAN HIEROGLYPH P008 +132A4 FE02; rotated 270 degrees; # EGYPTIAN HIEROGLYPH P008 +132AA FE00; rotated 90 degrees; # EGYPTIAN HIEROGLYPH Q003 +132CB FE00; rotated 90 degrees; # EGYPTIAN HIEROGLYPH R024 +132DC FE00; rotated 90 degrees; # EGYPTIAN HIEROGLYPH S010 +132E7 FE00; rotated 90 degrees; # EGYPTIAN HIEROGLYPH S018 +132E7 FE02; rotated 270 degrees; # EGYPTIAN HIEROGLYPH S018 +132E9 FE02; rotated 270 degrees; # EGYPTIAN HIEROGLYPH S020 +132F8 FE02; rotated 270 degrees; # EGYPTIAN HIEROGLYPH S033 +132FD FE02; rotated 270 degrees; # EGYPTIAN HIEROGLYPH S037 +13302 FE02; rotated 270 degrees; # EGYPTIAN HIEROGLYPH S042 +13303 FE02; rotated 270 degrees; # EGYPTIAN HIEROGLYPH S043 +13307 FE00; rotated 90 degrees; # EGYPTIAN HIEROGLYPH T001 +13308 FE01; rotated 180 degrees; # EGYPTIAN HIEROGLYPH T002 +13310 FE02; rotated 270 degrees; # EGYPTIAN HIEROGLYPH T008 +13311 FE02; rotated 270 degrees; # EGYPTIAN HIEROGLYPH T008A +13312 FE01; rotated 180 degrees; # EGYPTIAN HIEROGLYPH T009 +13312 FE02; rotated 270 degrees; # EGYPTIAN HIEROGLYPH T009 +13313 FE01; rotated 180 degrees; # EGYPTIAN HIEROGLYPH T009A +13313 FE02; rotated 270 degrees; # EGYPTIAN HIEROGLYPH T009A +13314 FE01; rotated 180 degrees; # EGYPTIAN HIEROGLYPH T010 +13314 FE02; rotated 270 degrees; # EGYPTIAN HIEROGLYPH T010 +1331B FE00; rotated 90 degrees; # EGYPTIAN HIEROGLYPH T016 +1331B FE01; rotated 180 degrees; # EGYPTIAN HIEROGLYPH T016 +1331C FE02; rotated 270 degrees; # EGYPTIAN HIEROGLYPH T016A +13321 FE01; rotated 180 degrees; # EGYPTIAN HIEROGLYPH T021 +13321 FE02; rotated 270 degrees; # EGYPTIAN HIEROGLYPH T021 +13322 FE00; rotated 90 degrees; # EGYPTIAN HIEROGLYPH T022 +13322 FE01; rotated 180 degrees; # EGYPTIAN HIEROGLYPH T022 +13331 FE01; rotated 180 degrees; # EGYPTIAN HIEROGLYPH T035 +13331 FE02; rotated 270 degrees; # EGYPTIAN HIEROGLYPH T035 +1333B FE00; rotated 90 degrees; # EGYPTIAN HIEROGLYPH U007 +1333C FE00; rotated 90 degrees; # EGYPTIAN HIEROGLYPH U008 +1334A FE02; rotated 270 degrees; # EGYPTIAN HIEROGLYPH U022 +13361 FE02; rotated 270 degrees; # EGYPTIAN HIEROGLYPH U042 +13373 FE02; rotated 270 degrees; # EGYPTIAN HIEROGLYPH V007A +13377 FE00; rotated 90 degrees; # EGYPTIAN HIEROGLYPH V010 +13378 FE00; rotated 90 degrees; # EGYPTIAN HIEROGLYPH V011 +1337D FE02; rotated 270 degrees; # EGYPTIAN HIEROGLYPH V012A +13385 FE02; rotated 270 degrees; # EGYPTIAN HIEROGLYPH V019 +13399 FE00; rotated 90 degrees; # EGYPTIAN HIEROGLYPH V026 +1339A FE00; rotated 90 degrees; # EGYPTIAN HIEROGLYPH V027 +133AF FE02; rotated 270 degrees; # EGYPTIAN HIEROGLYPH W001 +133B0 FE02; rotated 270 degrees; # EGYPTIAN HIEROGLYPH W002 +133BF FE02; rotated 270 degrees; # EGYPTIAN HIEROGLYPH W014 +133D3 FE00; rotated 90 degrees; # EGYPTIAN HIEROGLYPH X004A +133DD FE02; rotated 270 degrees; # EGYPTIAN HIEROGLYPH Y002 +133F2 FE00; rotated 90 degrees; # EGYPTIAN HIEROGLYPH Z007 +133F5 FE00; rotated 90 degrees; # EGYPTIAN HIEROGLYPH Z010 +133F6 FE00; rotated 90 degrees; # EGYPTIAN HIEROGLYPH Z011 +13403 FE00; rotated 90 degrees; # EGYPTIAN HIEROGLYPH Z015I +13416 FE00; rotated 90 degrees; # EGYPTIAN HIEROGLYPH AA008 +13419 FE00; rotated 90 degrees; # EGYPTIAN HIEROGLYPH AA011 +13419 FE01; rotated 180 degrees; # EGYPTIAN HIEROGLYPH AA011 +13419 FE02; rotated 270 degrees; # EGYPTIAN HIEROGLYPH AA011 +1341A FE00; rotated 90 degrees; # EGYPTIAN HIEROGLYPH AA012 +13423 FE00; rotated 90 degrees; # EGYPTIAN HIEROGLYPH AA021 +1342C FE02; rotated 270 degrees; # EGYPTIAN HIEROGLYPH AA030 +1342E FE02; rotated 270 degrees; # EGYPTIAN HIEROGLYPH AA032 + +# Egyptian hieroglyph expanded variants + +13443 FE00; expanded ; # LOST SIGN +13444 FE00; expanded ; # HALF LOST SIGN +13445 FE00; expanded ; # TALL LOST SIGN +13446 FE00; expanded ; # WIDE LOST SIGN + # CJK compatibility ideographs # Note: In the entries for CJK compatibility ideographs, field 1 diff --git a/UnicodeJsps/src/main/resources/org/unicode/jsp/confusables.txt b/UnicodeJsps/src/main/resources/org/unicode/jsp/confusables.txt index 371612c607..3b65d309f9 100644 --- a/UnicodeJsps/src/main/resources/org/unicode/jsp/confusables.txt +++ b/UnicodeJsps/src/main/resources/org/unicode/jsp/confusables.txt @@ -1,13 +1,13 @@ # confusables.txt -# Date: 2021-05-29, 22:09:29 GMT -# © 2021 Unicode®, Inc. +# Date: 2022-05-18, 21:51:56 GMT +# © 2022 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. -# For terms of use, see http://www.unicode.org/terms_of_use.html +# For terms of use, see https://www.unicode.org/terms_of_use.html # # Unicode Security Mechanisms for UTS #39 -# Version: 14.0.0 +# Version: 15.0.0 # -# For documentation and usage, see http://www.unicode.org/reports/tr39 +# For documentation and usage, see https://www.unicode.org/reports/tr39 # 05AD ; 0596 ; MA # ( ֭ → ֖ ) HEBREW ACCENT DEHI → HEBREW ACCENT TIPEHA # @@ -2761,11 +2761,11 @@ FE87 ; 006C 0655 ; MA # ( ‎ﺇ‎ → lٕ ) ARABIC LETTER ALEF WITH HAMZA BELO 02AB ; 006C 007A ; MA # ( ʫ → lz ) LATIN SMALL LETTER LZ DIGRAPH → LATIN SMALL LETTER L, LATIN SMALL LETTER Z # +0675 ; 006C 0674 ; MA # ( ‎ٵ‎ → ‎lٴ‎ ) ARABIC LETTER HIGH HAMZA ALEF → LATIN SMALL LETTER L, ARABIC LETTER HIGH HAMZA # →‎اٴ‎→ 0623 ; 006C 0674 ; MA # ( ‎أ‎ → ‎lٴ‎ ) ARABIC LETTER ALEF WITH HAMZA ABOVE → LATIN SMALL LETTER L, ARABIC LETTER HIGH HAMZA # →‎ٵ‎→→‎اٴ‎→ FE84 ; 006C 0674 ; MA # ( ‎ﺄ‎ → ‎lٴ‎ ) ARABIC LETTER ALEF WITH HAMZA ABOVE FINAL FORM → LATIN SMALL LETTER L, ARABIC LETTER HIGH HAMZA # →‎أ‎→→‎ٵ‎→→‎اٴ‎→ FE83 ; 006C 0674 ; MA # ( ‎ﺃ‎ → ‎lٴ‎ ) ARABIC LETTER ALEF WITH HAMZA ABOVE ISOLATED FORM → LATIN SMALL LETTER L, ARABIC LETTER HIGH HAMZA # →‎ٵ‎→→‎اٴ‎→ 0672 ; 006C 0674 ; MA # ( ‎ٲ‎ → ‎lٴ‎ ) ARABIC LETTER ALEF WITH WAVY HAMZA ABOVE → LATIN SMALL LETTER L, ARABIC LETTER HIGH HAMZA # →‎أ‎→→‎ٵ‎→→‎اٴ‎→ -0675 ; 006C 0674 ; MA # ( ‎ٵ‎ → ‎lٴ‎ ) ARABIC LETTER HIGH HAMZA ALEF → LATIN SMALL LETTER L, ARABIC LETTER HIGH HAMZA # →‎اٴ‎→ FDF3 ; 006C 0643 0628 0631 ; MA # ( ‎ﷳ‎ → ‎lكبر‎ ) ARABIC LIGATURE AKBAR ISOLATED FORM → LATIN SMALL LETTER L, ARABIC LETTER KAF, ARABIC LETTER BEH, ARABIC LETTER REH # →‎اكبر‎→ @@ -5351,10 +5351,10 @@ FBE2 ; 0648 0302 ; MA # ( ‎ﯢ‎ → ‎و̂‎ ) ARABIC LETTER KIRGHIZ YU IS FBDC ; 0648 0670 ; MA # ( ‎ﯜ‎ → ‎وٰ‎ ) ARABIC LETTER YU FINAL FORM → ARABIC LETTER WAW, ARABIC LETTER SUPERSCRIPT ALEF # →‎ۈ‎→ FBDB ; 0648 0670 ; MA # ( ‎ﯛ‎ → ‎وٰ‎ ) ARABIC LETTER YU ISOLATED FORM → ARABIC LETTER WAW, ARABIC LETTER SUPERSCRIPT ALEF # →‎ۈ‎→ +0676 ; 0648 0674 ; MA # ( ‎ٶ‎ → ‎وٴ‎ ) ARABIC LETTER HIGH HAMZA WAW → ARABIC LETTER WAW, ARABIC LETTER HIGH HAMZA # 0624 ; 0648 0674 ; MA # ( ‎ؤ‎ → ‎وٴ‎ ) ARABIC LETTER WAW WITH HAMZA ABOVE → ARABIC LETTER WAW, ARABIC LETTER HIGH HAMZA # →‎ٶ‎→ FE86 ; 0648 0674 ; MA # ( ‎ﺆ‎ → ‎وٴ‎ ) ARABIC LETTER WAW WITH HAMZA ABOVE FINAL FORM → ARABIC LETTER WAW, ARABIC LETTER HIGH HAMZA # →‎ٶ‎→ FE85 ; 0648 0674 ; MA # ( ‎ﺅ‎ → ‎وٴ‎ ) ARABIC LETTER WAW WITH HAMZA ABOVE ISOLATED FORM → ARABIC LETTER WAW, ARABIC LETTER HIGH HAMZA # →‎ٶ‎→ -0676 ; 0648 0674 ; MA # ( ‎ٶ‎ → ‎وٴ‎ ) ARABIC LETTER HIGH HAMZA WAW → ARABIC LETTER WAW, ARABIC LETTER HIGH HAMZA # 0677 ; 0648 0313 0674 ; MA # ( ‎ٷ‎ → ‎و̓ٴ‎ ) ARABIC LETTER U WITH HAMZA ABOVE → ARABIC LETTER WAW, COMBINING COMMA ABOVE, ARABIC LETTER HIGH HAMZA # →‎ۇٴ‎→ FBDD ; 0648 0313 0674 ; MA # ( ‎ﯝ‎ → ‎و̓ٴ‎ ) ARABIC LETTER U WITH HAMZA ABOVE ISOLATED FORM → ARABIC LETTER WAW, COMBINING COMMA ABOVE, ARABIC LETTER HIGH HAMZA # →‎ۇٴ‎→ @@ -5446,12 +5446,12 @@ FCF1 ; 0649 006F ; MA # ( ‎ﳱ‎ → ‎ىo‎ ) ARABIC LIGATURE YEH WITH HEH FCE6 ; 0649 06DB 006F ; MA # ( ‎ﳦ‎ → ‎ىۛo‎ ) ARABIC LIGATURE THEH WITH HEH MEDIAL FORM → ARABIC LETTER ALEF MAKSURA, ARABIC SMALL HIGH THREE DOTS, LATIN SMALL LETTER O # →‎ثه‎→ +0678 ; 0649 0674 ; MA # ( ‎ٸ‎ → ‎ىٴ‎ ) ARABIC LETTER HIGH HAMZA YEH → ARABIC LETTER ALEF MAKSURA, ARABIC LETTER HIGH HAMZA # →‎يٴ‎→ 0626 ; 0649 0674 ; MA # ( ‎ئ‎ → ‎ىٴ‎ ) ARABIC LETTER YEH WITH HAMZA ABOVE → ARABIC LETTER ALEF MAKSURA, ARABIC LETTER HIGH HAMZA # →‎ٸ‎→→‎يٴ‎→ FE8B ; 0649 0674 ; MA # ( ‎ﺋ‎ → ‎ىٴ‎ ) ARABIC LETTER YEH WITH HAMZA ABOVE INITIAL FORM → ARABIC LETTER ALEF MAKSURA, ARABIC LETTER HIGH HAMZA # →‎ئ‎→→‎ٸ‎→→‎يٴ‎→ FE8C ; 0649 0674 ; MA # ( ‎ﺌ‎ → ‎ىٴ‎ ) ARABIC LETTER YEH WITH HAMZA ABOVE MEDIAL FORM → ARABIC LETTER ALEF MAKSURA, ARABIC LETTER HIGH HAMZA # →‎ئ‎→→‎ٸ‎→→‎يٴ‎→ FE8A ; 0649 0674 ; MA # ( ‎ﺊ‎ → ‎ىٴ‎ ) ARABIC LETTER YEH WITH HAMZA ABOVE FINAL FORM → ARABIC LETTER ALEF MAKSURA, ARABIC LETTER HIGH HAMZA # →‎ئ‎→→‎ٸ‎→→‎يٴ‎→ FE89 ; 0649 0674 ; MA # ( ‎ﺉ‎ → ‎ىٴ‎ ) ARABIC LETTER YEH WITH HAMZA ABOVE ISOLATED FORM → ARABIC LETTER ALEF MAKSURA, ARABIC LETTER HIGH HAMZA # →‎ٸ‎→→‎يٴ‎→ -0678 ; 0649 0674 ; MA # ( ‎ٸ‎ → ‎ىٴ‎ ) ARABIC LETTER HIGH HAMZA YEH → ARABIC LETTER ALEF MAKSURA, ARABIC LETTER HIGH HAMZA # →‎يٴ‎→ FBEB ; 0649 0674 006C ; MA # ( ‎ﯫ‎ → ‎ىٴl‎ ) ARABIC LIGATURE YEH WITH HAMZA ABOVE WITH ALEF FINAL FORM → ARABIC LETTER ALEF MAKSURA, ARABIC LETTER HIGH HAMZA, LATIN SMALL LETTER L # →‎ئا‎→ FBEA ; 0649 0674 006C ; MA # ( ‎ﯪ‎ → ‎ىٴl‎ ) ARABIC LIGATURE YEH WITH HAMZA ABOVE WITH ALEF ISOLATED FORM → ARABIC LETTER ALEF MAKSURA, ARABIC LETTER HIGH HAMZA, LATIN SMALL LETTER L # →‎ئا‎→ diff --git a/UnicodeJsps/src/main/resources/org/unicode/jsp/data/PropertyAliases.txt b/UnicodeJsps/src/main/resources/org/unicode/jsp/data/PropertyAliases.txt index 3e4b429e45..2de24e26f6 100644 --- a/UnicodeJsps/src/main/resources/org/unicode/jsp/data/PropertyAliases.txt +++ b/UnicodeJsps/src/main/resources/org/unicode/jsp/data/PropertyAliases.txt @@ -1,11 +1,11 @@ -# PropertyAliases-14.0.0.txt -# Date: 2021-03-08, 19:35:48 GMT -# © 2021 Unicode®, Inc. +# PropertyAliases-15.0.0.txt +# Date: 2022-02-02, 23:35:44 GMT +# © 2022 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. -# For terms of use, see http://www.unicode.org/terms_of_use.html +# For terms of use, see https://www.unicode.org/terms_of_use.html # # Unicode Character Database -# For documentation, see http://www.unicode.org/reports/tr44/ +# For documentation, see https://www.unicode.org/reports/tr44/ # # This file contains aliases for properties used in the UCD. # These names can be used for XML formats of UCD data, for regular-expression diff --git a/UnicodeJsps/src/main/resources/org/unicode/jsp/data/PropertyValueAliases.txt b/UnicodeJsps/src/main/resources/org/unicode/jsp/data/PropertyValueAliases.txt index f0cb26bdab..863301b1e1 100644 --- a/UnicodeJsps/src/main/resources/org/unicode/jsp/data/PropertyValueAliases.txt +++ b/UnicodeJsps/src/main/resources/org/unicode/jsp/data/PropertyValueAliases.txt @@ -1,11 +1,11 @@ -# PropertyValueAliases-14.0.0.txt -# Date: 2021-05-10, 21:08:53 GMT -# © 2021 Unicode®, Inc. +# PropertyValueAliases-15.0.0.txt +# Date: 2022-08-05, 23:42:17 GMT +# © 2022 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. -# For terms of use, see http://www.unicode.org/terms_of_use.html +# For terms of use, see https://www.unicode.org/terms_of_use.html # # Unicode Character Database -# For documentation, see http://www.unicode.org/reports/tr44/ +# For documentation, see https://www.unicode.org/reports/tr44/ # # This file contains aliases for property values used in the UCD. # These names can be used for XML formats of UCD data, for regular-expression @@ -90,6 +90,7 @@ age; 12.0 ; V12_0 age; 12.1 ; V12_1 age; 13.0 ; V13_0 age; 14.0 ; V14_0 +age; 15.0 ; V15_0 age; NA ; Unassigned # Alphabetic (Alpha) @@ -135,7 +136,6 @@ Bidi_M; Y ; Yes ; T # Bidi_Mirroring_Glyph (bmg) -# @missing: 0000..10FFFF; Bidi_Mirroring_Glyph; # Bidi_Paired_Bracket (bpb) @@ -162,6 +162,7 @@ blk; Ancient_Symbols ; Ancient_Symbols blk; Arabic ; Arabic blk; Arabic_Ext_A ; Arabic_Extended_A blk; Arabic_Ext_B ; Arabic_Extended_B +blk; Arabic_Ext_C ; Arabic_Extended_C blk; Arabic_Math ; Arabic_Mathematical_Alphabetic_Symbols blk; Arabic_PF_A ; Arabic_Presentation_Forms_A ; Arabic_Presentation_Forms-A blk; Arabic_PF_B ; Arabic_Presentation_Forms_B @@ -206,6 +207,7 @@ blk; CJK_Ext_D ; CJK_Unified_Ideographs_Extension_D blk; CJK_Ext_E ; CJK_Unified_Ideographs_Extension_E blk; CJK_Ext_F ; CJK_Unified_Ideographs_Extension_F blk; CJK_Ext_G ; CJK_Unified_Ideographs_Extension_G +blk; CJK_Ext_H ; CJK_Unified_Ideographs_Extension_H blk; CJK_Radicals_Sup ; CJK_Radicals_Supplement blk; CJK_Strokes ; CJK_Strokes blk; CJK_Symbols ; CJK_Symbols_And_Punctuation @@ -223,10 +225,12 @@ blk; Cyrillic ; Cyrillic blk; Cyrillic_Ext_A ; Cyrillic_Extended_A blk; Cyrillic_Ext_B ; Cyrillic_Extended_B blk; Cyrillic_Ext_C ; Cyrillic_Extended_C +blk; Cyrillic_Ext_D ; Cyrillic_Extended_D blk; Cyrillic_Sup ; Cyrillic_Supplement ; Cyrillic_Supplementary blk; Deseret ; Deseret blk; Devanagari ; Devanagari blk; Devanagari_Ext ; Devanagari_Extended +blk; Devanagari_Ext_A ; Devanagari_Extended_A blk; Diacriticals ; Combining_Diacritical_Marks blk; Diacriticals_Ext ; Combining_Diacritical_Marks_Extended blk; Diacriticals_For_Symbols ; Combining_Diacritical_Marks_For_Symbols; Combining_Marks_For_Symbols @@ -288,6 +292,7 @@ blk; Jamo_Ext_A ; Hangul_Jamo_Extended_A blk; Jamo_Ext_B ; Hangul_Jamo_Extended_B blk; Javanese ; Javanese blk; Kaithi ; Kaithi +blk; Kaktovik_Numerals ; Kaktovik_Numerals blk; Kana_Ext_A ; Kana_Extended_A blk; Kana_Ext_B ; Kana_Extended_B blk; Kana_Sup ; Kana_Supplement @@ -296,6 +301,7 @@ blk; Kangxi ; Kangxi_Radicals blk; Kannada ; Kannada blk; Katakana ; Katakana blk; Katakana_Ext ; Katakana_Phonetic_Extensions +blk; Kawi ; Kawi blk; Kayah_Li ; Kayah_Li blk; Kharoshthi ; Kharoshthi blk; Khitan_Small_Script ; Khitan_Small_Script @@ -360,6 +366,7 @@ blk; Myanmar ; Myanmar blk; Myanmar_Ext_A ; Myanmar_Extended_A blk; Myanmar_Ext_B ; Myanmar_Extended_B blk; Nabataean ; Nabataean +blk; Nag_Mundari ; Nag_Mundari blk; Nandinagari ; Nandinagari blk; NB ; No_Block blk; New_Tai_Lue ; New_Tai_Lue @@ -663,7 +670,6 @@ EPres; Y ; Yes ; T # Equivalent_Unified_Ideograph (EqUIdeo) -# @missing: 0000..10FFFF; Equivalent_Unified_Ideograph; # Expands_On_NFC (XO_NFC) @@ -1143,7 +1149,6 @@ NFD_QC; Y ; Yes # NFKC_Casefold (NFKC_CF) -# @missing: 0000..10FFFF; NFKC_Casefold; # NFKC_Quick_Check (NFKC_QC) @@ -1313,6 +1318,7 @@ sc ; Ital ; Old_Italic sc ; Java ; Javanese sc ; Kali ; Kayah_Li sc ; Kana ; Katakana +sc ; Kawi ; Kawi sc ; Khar ; Kharoshthi sc ; Khmr ; Khmer sc ; Khoj ; Khojki @@ -1345,6 +1351,7 @@ sc ; Mroo ; Mro sc ; Mtei ; Meetei_Mayek sc ; Mult ; Multani sc ; Mymr ; Myanmar +sc ; Nagm ; Nag_Mundari sc ; Nand ; Nandinagari sc ; Narb ; Old_North_Arabian sc ; Nbat ; Nabataean @@ -1418,7 +1425,6 @@ sc ; Zzzz ; Unknown # Script_Extensions (scx) -# @missing: 0000..10FFFF; Script_Extensions;