mirror of
https://github.com/neovim/neovim.git
synced 2025-09-06 19:38:20 +00:00
feat: update unicode tables (#27317)
This commit is contained in:
9
src/unicode/CaseFolding.txt
vendored
9
src/unicode/CaseFolding.txt
vendored
@@ -1,6 +1,6 @@
|
||||
# CaseFolding-15.0.0.txt
|
||||
# Date: 2022-02-02, 23:35:35 GMT
|
||||
# © 2022 Unicode®, Inc.
|
||||
# CaseFolding-15.1.0.txt
|
||||
# Date: 2023-05-12, 21:53:10 GMT
|
||||
# © 2023 Unicode®, Inc.
|
||||
# Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries.
|
||||
# For terms of use, see https://www.unicode.org/terms_of_use.html
|
||||
#
|
||||
@@ -929,6 +929,7 @@
|
||||
1FCC; S; 1FC3; # GREEK CAPITAL LETTER ETA WITH PROSGEGRAMMENI
|
||||
1FD2; F; 03B9 0308 0300; # GREEK SMALL LETTER IOTA WITH DIALYTIKA AND VARIA
|
||||
1FD3; F; 03B9 0308 0301; # GREEK SMALL LETTER IOTA WITH DIALYTIKA AND OXIA
|
||||
1FD3; S; 0390; # GREEK SMALL LETTER IOTA WITH DIALYTIKA AND OXIA
|
||||
1FD6; F; 03B9 0342; # GREEK SMALL LETTER IOTA WITH PERISPOMENI
|
||||
1FD7; F; 03B9 0308 0342; # GREEK SMALL LETTER IOTA WITH DIALYTIKA AND PERISPOMENI
|
||||
1FD8; C; 1FD0; # GREEK CAPITAL LETTER IOTA WITH VRACHY
|
||||
@@ -937,6 +938,7 @@
|
||||
1FDB; C; 1F77; # GREEK CAPITAL LETTER IOTA WITH OXIA
|
||||
1FE2; F; 03C5 0308 0300; # GREEK SMALL LETTER UPSILON WITH DIALYTIKA AND VARIA
|
||||
1FE3; F; 03C5 0308 0301; # GREEK SMALL LETTER UPSILON WITH DIALYTIKA AND OXIA
|
||||
1FE3; S; 03B0; # GREEK SMALL LETTER UPSILON WITH DIALYTIKA AND OXIA
|
||||
1FE4; F; 03C1 0313; # GREEK SMALL LETTER RHO WITH PSILI
|
||||
1FE6; F; 03C5 0342; # GREEK SMALL LETTER UPSILON WITH PERISPOMENI
|
||||
1FE7; F; 03C5 0308 0342; # GREEK SMALL LETTER UPSILON WITH DIALYTIKA AND PERISPOMENI
|
||||
@@ -1328,6 +1330,7 @@ FB02; F; 0066 006C; # LATIN SMALL LIGATURE FL
|
||||
FB03; F; 0066 0066 0069; # LATIN SMALL LIGATURE FFI
|
||||
FB04; F; 0066 0066 006C; # LATIN SMALL LIGATURE FFL
|
||||
FB05; F; 0073 0074; # LATIN SMALL LIGATURE LONG S T
|
||||
FB05; S; FB06; # LATIN SMALL LIGATURE LONG S T
|
||||
FB06; F; 0073 0074; # LATIN SMALL LIGATURE ST
|
||||
FB13; F; 0574 0576; # ARMENIAN SMALL LIGATURE MEN NOW
|
||||
FB14; F; 0574 0565; # ARMENIAN SMALL LIGATURE MEN ECH
|
||||
|
22
src/unicode/EastAsianWidth.txt
vendored
22
src/unicode/EastAsianWidth.txt
vendored
@@ -1,6 +1,6 @@
|
||||
# EastAsianWidth-15.0.0.txt
|
||||
# Date: 2022-05-24, 17:40:20 GMT [KW, LI]
|
||||
# © 2022 Unicode®, Inc.
|
||||
# EastAsianWidth-15.1.0.txt
|
||||
# Date: 2023-07-28, 23:34:08 GMT
|
||||
# © 2023 Unicode®, Inc.
|
||||
# Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries.
|
||||
# For terms of use, see https://www.unicode.org/terms_of_use.html
|
||||
#
|
||||
@@ -30,11 +30,10 @@
|
||||
# Character ranges are specified as for other property files in the
|
||||
# Unicode Character Database.
|
||||
#
|
||||
# For legacy reasons, there are no spaces before or after the semicolon
|
||||
# which separates the two fields. The comments following the number sign
|
||||
# "#" list the General_Category property value or the L& alias of the
|
||||
# derived value LC, the Unicode character name or names, and, in lines
|
||||
# with ranges of code points, the code point count in square brackets.
|
||||
# The comments following the number sign "#" list the General_Category
|
||||
# property value or the L& alias of the derived value LC, the Unicode
|
||||
# character name or names, and, in lines with ranges of code points,
|
||||
# the code point count in square brackets.
|
||||
#
|
||||
# For more information, see UAX #11: East Asian Width,
|
||||
# at https://www.unicode.org/reports/tr11/
|
||||
@@ -1430,7 +1429,7 @@
|
||||
2E80..2E99 ; W # So [26] CJK RADICAL REPEAT..CJK RADICAL RAP
|
||||
2E9B..2EF3 ; W # So [89] CJK RADICAL CHOKE..CJK RADICAL C-SIMPLIFIED TURTLE
|
||||
2F00..2FD5 ; W # So [214] KANGXI RADICAL ONE..KANGXI RADICAL FLUTE
|
||||
2FF0..2FFB;W # So [12] IDEOGRAPHIC DESCRIPTION CHARACTER LEFT TO RIGHT..IDEOGRAPHIC DESCRIPTION CHARACTER OVERLAID
|
||||
2FF0..2FFF ; W # So [16] IDEOGRAPHIC DESCRIPTION CHARACTER LEFT TO RIGHT..IDEOGRAPHIC DESCRIPTION CHARACTER ROTATION
|
||||
3000 ; F # Zs IDEOGRAPHIC SPACE
|
||||
3001..3003 ; W # Po [3] IDEOGRAPHIC COMMA..DITTO MARK
|
||||
3004 ; W # So JAPANESE INDUSTRIAL STANDARD SYMBOL
|
||||
@@ -1489,6 +1488,7 @@
|
||||
3196..319F ; W # So [10] IDEOGRAPHIC ANNOTATION TOP MARK..IDEOGRAPHIC ANNOTATION MAN MARK
|
||||
31A0..31BF ; W # Lo [32] BOPOMOFO LETTER BU..BOPOMOFO LETTER AH
|
||||
31C0..31E3 ; W # So [36] CJK STROKE T..CJK STROKE Q
|
||||
31EF ; W # So IDEOGRAPHIC DESCRIPTION CHARACTER SUBTRACTION
|
||||
31F0..31FF ; W # Lo [16] KATAKANA LETTER SMALL KU..KATAKANA LETTER SMALL RO
|
||||
3200..321E ; W # So [31] PARENTHESIZED HANGUL KIYEOK..PARENTHESIZED KOREAN CHARACTER O HU
|
||||
3220..3229 ; W # No [10] PARENTHESIZED IDEOGRAPH ONE..PARENTHESIZED IDEOGRAPH TEN
|
||||
@@ -2602,7 +2602,9 @@ FFFD;A # So REPLACEMENT CHARACTER
|
||||
2B820..2CEA1 ; W # Lo [5762] CJK UNIFIED IDEOGRAPH-2B820..CJK UNIFIED IDEOGRAPH-2CEA1
|
||||
2CEA2..2CEAF ; W # Cn [14] <reserved-2CEA2>..<reserved-2CEAF>
|
||||
2CEB0..2EBE0 ; W # Lo [7473] CJK UNIFIED IDEOGRAPH-2CEB0..CJK UNIFIED IDEOGRAPH-2EBE0
|
||||
2EBE1..2F7FF;W # Cn [3103] <reserved-2EBE1>..<reserved-2F7FF>
|
||||
2EBE1..2EBEF ; W # Cn [15] <reserved-2EBE1>..<reserved-2EBEF>
|
||||
2EBF0..2EE5D ; W # Lo [622] CJK UNIFIED IDEOGRAPH-2EBF0..CJK UNIFIED IDEOGRAPH-2EE5D
|
||||
2EE5E..2F7FF ; W # Cn [2466] <reserved-2EE5E>..<reserved-2F7FF>
|
||||
2F800..2FA1D ; W # Lo [542] CJK COMPATIBILITY IDEOGRAPH-2F800..CJK COMPATIBILITY IDEOGRAPH-2FA1D
|
||||
2FA1E..2FA1F ; W # Cn [2] <reserved-2FA1E>..<reserved-2FA1F>
|
||||
2FA20..2FFFD ; W # Cn [1502] <reserved-2FA20>..<reserved-2FFFD>
|
||||
|
7
src/unicode/UnicodeData.txt
vendored
7
src/unicode/UnicodeData.txt
vendored
@@ -11231,6 +11231,10 @@
|
||||
2FF9;IDEOGRAPHIC DESCRIPTION CHARACTER SURROUND FROM UPPER RIGHT;So;0;ON;;;;;N;;;;;
|
||||
2FFA;IDEOGRAPHIC DESCRIPTION CHARACTER SURROUND FROM LOWER LEFT;So;0;ON;;;;;N;;;;;
|
||||
2FFB;IDEOGRAPHIC DESCRIPTION CHARACTER OVERLAID;So;0;ON;;;;;N;;;;;
|
||||
2FFC;IDEOGRAPHIC DESCRIPTION CHARACTER SURROUND FROM RIGHT;So;0;ON;;;;;N;;;;;
|
||||
2FFD;IDEOGRAPHIC DESCRIPTION CHARACTER SURROUND FROM LOWER RIGHT;So;0;ON;;;;;N;;;;;
|
||||
2FFE;IDEOGRAPHIC DESCRIPTION CHARACTER HORIZONTAL REFLECTION;So;0;ON;;;;;N;;;;;
|
||||
2FFF;IDEOGRAPHIC DESCRIPTION CHARACTER ROTATION;So;0;ON;;;;;N;;;;;
|
||||
3000;IDEOGRAPHIC SPACE;Zs;0;WS;<wide> 0020;;;;N;;;;;
|
||||
3001;IDEOGRAPHIC COMMA;Po;0;ON;;;;;N;;;;;
|
||||
3002;IDEOGRAPHIC FULL STOP;Po;0;ON;;;;;N;IDEOGRAPHIC PERIOD;;;;
|
||||
@@ -11705,6 +11709,7 @@
|
||||
31E1;CJK STROKE HZZZG;So;0;ON;;;;;N;;;;;
|
||||
31E2;CJK STROKE PG;So;0;ON;;;;;N;;;;;
|
||||
31E3;CJK STROKE Q;So;0;ON;;;;;N;;;;;
|
||||
31EF;IDEOGRAPHIC DESCRIPTION CHARACTER SUBTRACTION;So;0;ON;;;;;N;;;;;
|
||||
31F0;KATAKANA LETTER SMALL KU;Lo;0;L;;;;;N;;;;;
|
||||
31F1;KATAKANA LETTER SMALL SI;Lo;0;L;;;;;N;;;;;
|
||||
31F2;KATAKANA LETTER SMALL SU;Lo;0;L;;;;;N;;;;;
|
||||
@@ -34035,6 +34040,8 @@ FFFD;REPLACEMENT CHARACTER;So;0;ON;;;;;N;;;;;
|
||||
2CEA1;<CJK Ideograph Extension E, Last>;Lo;0;L;;;;;N;;;;;
|
||||
2CEB0;<CJK Ideograph Extension F, First>;Lo;0;L;;;;;N;;;;;
|
||||
2EBE0;<CJK Ideograph Extension F, Last>;Lo;0;L;;;;;N;;;;;
|
||||
2EBF0;<CJK Ideograph Extension I, First>;Lo;0;L;;;;;N;;;;;
|
||||
2EE5D;<CJK Ideograph Extension I, Last>;Lo;0;L;;;;;N;;;;;
|
||||
2F800;CJK COMPATIBILITY IDEOGRAPH-2F800;Lo;0;L;4E3D;;;;N;;;;;
|
||||
2F801;CJK COMPATIBILITY IDEOGRAPH-2F801;Lo;0;L;4E38;;;;N;;;;;
|
||||
2F802;CJK COMPATIBILITY IDEOGRAPH-2F802;Lo;0;L;4E41;;;;N;;;;;
|
||||
|
6
src/unicode/emoji-data.txt
vendored
6
src/unicode/emoji-data.txt
vendored
@@ -1,11 +1,11 @@
|
||||
# emoji-data.txt
|
||||
# Date: 2022-08-02, 00:26:10 GMT
|
||||
# © 2022 Unicode®, Inc.
|
||||
# Date: 2023-02-01, 02:22:54 GMT
|
||||
# © 2023 Unicode®, Inc.
|
||||
# Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries.
|
||||
# For terms of use, see https://www.unicode.org/terms_of_use.html
|
||||
#
|
||||
# Emoji Data for UTS #51
|
||||
# Used with Emoji Version 15.0 and subsequent minor revisions (if any)
|
||||
# Used with Emoji Version 15.1 and subsequent minor revisions (if any)
|
||||
#
|
||||
# For documentation and usage, see https://www.unicode.org/reports/tr51
|
||||
#
|
||||
|
Reference in New Issue
Block a user