Skip to content
Permalink
Browse files
8268081: Upgrade Unicode Data Files to 14.0.0
Reviewed-by: joehw, iris, lancea
  • Loading branch information
naotoj committed Jan 12, 2022
1 parent ddddec7 commit 0a094d7c286ed0b5a35c517391e48c603cb43a68
Show file tree
Hide file tree
Showing 38 changed files with 3,342 additions and 1,090 deletions.
@@ -1,6 +1,6 @@
# Blocks-13.0.0.txt
# Date: 2019-07-10, 19:06:00 GMT [KW]
# Copyright (c) 2019 Unicode, Inc.
# Blocks-14.0.0.txt
# Date: 2021-01-22, 23:29:00 GMT [KW]
# Copyright (c) 2021 Unicode, Inc.
# For terms of use, see http://www.unicode.org/terms_of_use.html
#
# Unicode Character Database
@@ -52,6 +52,7 @@
0800..083F; Samaritan
0840..085F; Mandaic
0860..086F; Syriac Supplement
0870..089F; Arabic Extended-B
08A0..08FF; Arabic Extended-A
0900..097F; Devanagari
0980..09FF; Bengali
@@ -215,7 +216,9 @@ FFF0..FFFF; Specials
104B0..104FF; Osage
10500..1052F; Elbasan
10530..1056F; Caucasian Albanian
10570..105BF; Vithkuqi
10600..1077F; Linear A
10780..107BF; Latin Extended-F
10800..1083F; Cypriot Syllabary
10840..1085F; Imperial Aramaic
10860..1087F; Palmyrene
@@ -240,6 +243,7 @@ FFF0..FFFF; Specials
10E80..10EBF; Yezidi
10F00..10F2F; Old Sogdian
10F30..10F6F; Sogdian
10F70..10FAF; Old Uyghur
10FB0..10FDF; Chorasmian
10FE0..10FFF; Elymaic
11000..1107F; Brahmi
@@ -259,13 +263,14 @@ FFF0..FFFF; Specials
11600..1165F; Modi
11660..1167F; Mongolian Supplement
11680..116CF; Takri
11700..1173F; Ahom
11700..1174F; Ahom
11800..1184F; Dogra
118A0..118FF; Warang Citi
11900..1195F; Dives Akuru
119A0..119FF; Nandinagari
11A00..11A4F; Zanabazar Square
11A50..11AAF; Soyombo
11AB0..11ABF; Unified Canadian Aboriginal Syllabics Extended-A
11AC0..11AFF; Pau Cin Hau
11C00..11C6F; Bhaiksuki
11C70..11CBF; Marchen
@@ -277,11 +282,13 @@ FFF0..FFFF; Specials
12000..123FF; Cuneiform
12400..1247F; Cuneiform Numbers and Punctuation
12480..1254F; Early Dynastic Cuneiform
12F90..12FFF; Cypro-Minoan
13000..1342F; Egyptian Hieroglyphs
13430..1343F; Egyptian Hieroglyph Format Controls
14400..1467F; Anatolian Hieroglyphs
16800..16A3F; Bamum Supplement
16A40..16A6F; Mro
16A70..16ACF; Tangsa
16AD0..16AFF; Bassa Vah
16B00..16B8F; Pahawh Hmong
16E40..16E9F; Medefaidrin
@@ -290,13 +297,15 @@ FFF0..FFFF; Specials
17000..187FF; Tangut
18800..18AFF; Tangut Components
18B00..18CFF; Khitan Small Script
18D00..18D8F; Tangut Supplement
18D00..18D7F; Tangut Supplement
1AFF0..1AFFF; Kana Extended-B
1B000..1B0FF; Kana Supplement
1B100..1B12F; Kana Extended-A
1B130..1B16F; Small Kana Extension
1B170..1B2FF; Nushu
1BC00..1BC9F; Duployan
1BCA0..1BCAF; Shorthand Format Controls
1CF00..1CFCF; Znamenny Musical Notation
1D000..1D0FF; Byzantine Musical Symbols
1D100..1D1FF; Musical Symbols
1D200..1D24F; Ancient Greek Musical Notation
@@ -305,9 +314,12 @@ FFF0..FFFF; Specials
1D360..1D37F; Counting Rod Numerals
1D400..1D7FF; Mathematical Alphanumeric Symbols
1D800..1DAAF; Sutton SignWriting
1DF00..1DFFF; Latin Extended-G
1E000..1E02F; Glagolitic Supplement
1E100..1E14F; Nyiakeng Puachue Hmong
1E290..1E2BF; Toto
1E2C0..1E2FF; Wancho
1E7E0..1E7FF; Ethiopic Extended-B
1E800..1E8DF; Mende Kikakui
1E900..1E95F; Adlam
1EC70..1ECBF; Indic Siyaq Numbers

Large diffs are not rendered by default.

Large diffs are not rendered by default.

Large diffs are not rendered by default.

@@ -1,6 +1,6 @@
# PropertyValueAliases-13.0.0.txt
# Date: 2019-11-13, 21:52:10 GMT
# Copyright (c) 2019 Unicode, Inc.
# PropertyValueAliases-14.0.0.txt
# Date: 2021-05-10, 21:08:53 GMT
# Copyright (c) 2021 Unicode, Inc.
# Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries.
# For terms of use, see http://www.unicode.org/terms_of_use.html
#
@@ -89,6 +89,7 @@ age; 11.0 ; V11_0
age; 12.0 ; V12_0
age; 12.1 ; V12_1
age; 13.0 ; V13_0
age; 14.0 ; V14_0
age; NA ; Unassigned

# Alphabetic (Alpha)
@@ -160,6 +161,7 @@ blk; Ancient_Greek_Numbers ; Ancient_Greek_Numbers
blk; Ancient_Symbols ; Ancient_Symbols
blk; Arabic ; Arabic
blk; Arabic_Ext_A ; Arabic_Extended_A
blk; Arabic_Ext_B ; Arabic_Extended_B
blk; Arabic_Math ; Arabic_Mathematical_Alphabetic_Symbols
blk; Arabic_PF_A ; Arabic_Presentation_Forms_A ; Arabic_Presentation_Forms-A
blk; Arabic_PF_B ; Arabic_Presentation_Forms_B
@@ -216,6 +218,7 @@ blk; Cuneiform ; Cuneiform
blk; Cuneiform_Numbers ; Cuneiform_Numbers_And_Punctuation
blk; Currency_Symbols ; Currency_Symbols
blk; Cypriot_Syllabary ; Cypriot_Syllabary
blk; Cypro_Minoan ; Cypro_Minoan
blk; Cyrillic ; Cyrillic
blk; Cyrillic_Ext_A ; Cyrillic_Extended_A
blk; Cyrillic_Ext_B ; Cyrillic_Extended_B
@@ -246,6 +249,7 @@ blk; Enclosed_Ideographic_Sup ; Enclosed_Ideographic_Supplement
blk; Ethiopic ; Ethiopic
blk; Ethiopic_Ext ; Ethiopic_Extended
blk; Ethiopic_Ext_A ; Ethiopic_Extended_A
blk; Ethiopic_Ext_B ; Ethiopic_Extended_B
blk; Ethiopic_Sup ; Ethiopic_Supplement
blk; Geometric_Shapes ; Geometric_Shapes
blk; Geometric_Shapes_Ext ; Geometric_Shapes_Extended
@@ -285,6 +289,7 @@ blk; Jamo_Ext_B ; Hangul_Jamo_Extended_B
blk; Javanese ; Javanese
blk; Kaithi ; Kaithi
blk; Kana_Ext_A ; Kana_Extended_A
blk; Kana_Ext_B ; Kana_Extended_B
blk; Kana_Sup ; Kana_Supplement
blk; Kanbun ; Kanbun
blk; Kangxi ; Kangxi_Radicals
@@ -306,6 +311,8 @@ blk; Latin_Ext_B ; Latin_Extended_B
blk; Latin_Ext_C ; Latin_Extended_C
blk; Latin_Ext_D ; Latin_Extended_D
blk; Latin_Ext_E ; Latin_Extended_E
blk; Latin_Ext_F ; Latin_Extended_F
blk; Latin_Ext_G ; Latin_Extended_G
blk; Lepcha ; Lepcha
blk; Letterlike_Symbols ; Letterlike_Symbols
blk; Limbu ; Limbu
@@ -372,6 +379,7 @@ blk; Old_Persian ; Old_Persian
blk; Old_Sogdian ; Old_Sogdian
blk; Old_South_Arabian ; Old_South_Arabian
blk; Old_Turkic ; Old_Turkic
blk; Old_Uyghur ; Old_Uyghur
blk; Oriya ; Oriya
blk; Ornamental_Dingbats ; Ornamental_Dingbats
blk; Osage ; Osage
@@ -433,6 +441,7 @@ blk; Tai_Xuan_Jing ; Tai_Xuan_Jing_Symbols
blk; Takri ; Takri
blk; Tamil ; Tamil
blk; Tamil_Sup ; Tamil_Supplement
blk; Tangsa ; Tangsa
blk; Tangut ; Tangut
blk; Tangut_Components ; Tangut_Components
blk; Tangut_Sup ; Tangut_Supplement
@@ -442,13 +451,16 @@ blk; Thai ; Thai
blk; Tibetan ; Tibetan
blk; Tifinagh ; Tifinagh
blk; Tirhuta ; Tirhuta
blk; Toto ; Toto
blk; Transport_And_Map ; Transport_And_Map_Symbols
blk; UCAS ; Unified_Canadian_Aboriginal_Syllabics; Canadian_Syllabics
blk; UCAS_Ext ; Unified_Canadian_Aboriginal_Syllabics_Extended
blk; UCAS_Ext_A ; Unified_Canadian_Aboriginal_Syllabics_Extended_A
blk; Ugaritic ; Ugaritic
blk; Vai ; Vai
blk; Vedic_Ext ; Vedic_Extensions
blk; Vertical_Forms ; Vertical_Forms
blk; Vithkuqi ; Vithkuqi
blk; VS ; Variation_Selectors
blk; VS_Sup ; Variation_Selectors_Supplement
blk; Wancho ; Wancho
@@ -458,6 +470,7 @@ blk; Yi_Radicals ; Yi_Radicals
blk; Yi_Syllables ; Yi_Syllables
blk; Yijing ; Yijing_Hexagram_Symbols
blk; Zanabazar_Square ; Zanabazar_Square
blk; Znamenny_Music ; Znamenny_Musical_Notation

# Canonical_Combining_Class (ccc)

@@ -1032,6 +1045,8 @@ jg ; Taw ; Taw
jg ; Teh_Marbuta ; Teh_Marbuta
jg ; Teh_Marbuta_Goal ; Hamza_On_Heh_Goal
jg ; Teth ; Teth
jg ; Thin_Yeh ; Thin_Yeh
jg ; Vertical_Tail ; Vertical_Tail
jg ; Waw ; Waw
jg ; Yeh ; Yeh
jg ; Yeh_Barree ; Yeh_Barree
@@ -1262,6 +1277,7 @@ sc ; Cham ; Cham
sc ; Cher ; Cherokee
sc ; Chrs ; Chorasmian
sc ; Copt ; Coptic ; Qaac
sc ; Cpmn ; Cypro_Minoan
sc ; Cprt ; Cypriot
sc ; Cyrl ; Cyrillic
sc ; Deva ; Devanagari
@@ -1341,6 +1357,7 @@ sc ; Orkh ; Old_Turkic
sc ; Orya ; Oriya
sc ; Osge ; Osage
sc ; Osma ; Osmanya
sc ; Ougr ; Old_Uyghur
sc ; Palm ; Palmyrene
sc ; Pauc ; Pau_Cin_Hau
sc ; Perm ; Old_Permic
@@ -1383,8 +1400,11 @@ sc ; Thaa ; Thaana
sc ; Thai ; Thai
sc ; Tibt ; Tibetan
sc ; Tirh ; Tirhuta
sc ; Tnsa ; Tangsa
sc ; Toto ; Toto
sc ; Ugar ; Ugaritic
sc ; Vaii ; Vai
sc ; Vith ; Vithkuqi
sc ; Wara ; Warang_Citi
sc ; Wcho ; Wancho
sc ; Xpeo ; Old_Persian
@@ -0,0 +1,16 @@
# Unicode Character Database
# Date: 2021-09-10, 17:22:00 GMT [KW]
# Copyright (c) 2021 Unicode, Inc.
# Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries.
# For terms of use, see https://www.unicode.org/terms_of_use.html
#
# For documentation, see the following:
# NamesList.html
# UAX #38, "Unicode Han Database (Unihan)"
# UAX #44, "Unicode Character Database"
# UTS #51, "Unicode Emoji"
#
# The UAXes and UTS #51 can be accessed at https://www.unicode.org/versions/Unicode14.0.0/

This directory contains the final data files
for the Unicode Character Database, for Version 14.0.0 of the Unicode Standard.

1 comment on commit 0a094d7

@openjdk-notifier
Copy link

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Please sign in to comment.