Skip to content

Commit 94e0151

Browse files
committed
Merge remote-tracking branch 'la-vache/main' into linkification-in-MakeUnicodeFiles
2 parents 4be4bb4 + 9880b1c commit 94e0151

File tree

15 files changed

+74
-30
lines changed

15 files changed

+74
-30
lines changed

unicodetools/data/linkification/dev/LinkTerm.txt

Lines changed: 3 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,5 @@
11
# LinkTerm.txt
2-
# Date: 2026-02-03, 13:35:49 GMT
2+
# Date: 2026-02-03, 19:23:30 GMT
33
# © 2025 Unicode®, Inc.
44
# Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries.
55
# For terms of use and license, see https://www.unicode.org/terms_of_use.html
@@ -1804,6 +1804,7 @@ FFFD ; Include # 1.1 (�) REPLACEMENT CHARACTER
18041804
1CCFA..1CCFC ; Include # 17.0 [3] (𜳺..𜳼) SNAKE SYMBOL..NOSE SYMBOL
18051805
1CD00..1CEB3 ; Include # 16.0 [436] (𜴀..𜺳) BLOCK OCTANT-3..BLACK RIGHT TRIANGLE CARET
18061806
1CEBA..1CED0 ; Include # 17.0 [23] (𜺺..𜻐) FRAGILE SYMBOL..LEUKOTHEA
1807+
1CED2..1CED4 ; Include # 18.0 [3] (U+1CED2..U+1CED4) ALCHEMICAL SYMBOL FOR OIL INVERTED..ALCHEMICAL SYMBOL FOR SALT OF TARTAR
18071808
1CEDD..1CEDF ; Include # 18.0 [3] (U+1CEDD..U+1CEDF) SQUARE ROOT OF SQUARE ROOT..SQUARE ROOT OF SQUARE ROOT OF SQUARE ROOT OF SQUARE ROOT
18081809
1CEE0..1CEF0 ; Include # 17.0 [17] (𜻠..𜻰) GEOMANTIC FIGURE POPULUS..MEDIUM SMALL WHITE CIRCLE WITH HORIZONTAL BAR
18091810
1CEF1..1CEFD ; Include # 18.0 [13] (U+1CEF1..U+1CEFD) LEIBNIZIAN DIVISION SIGN..HYPERBOLA
@@ -2208,5 +2209,5 @@ FFFD ; Include # 1.1 (�) REPLACEMENT CHARACTER
22082209
E0020..E007F ; Include # 3.1 [96] (U+E0020..U+E007F) TAG SPACE..CANCEL TAG
22092210
E0100..E01EF ; Include # 4.0 [240] (U+E0100..U+E01EF) VARIATION SELECTOR-17..VARIATION SELECTOR-256
22102211

2211-
# Total code points: 172350
2212+
# Total code points: 172353
22122213

unicodetools/data/ucd/dev/DerivedAge.txt

Lines changed: 3 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,5 @@
11
# DerivedAge-18.0.0.txt
2-
# Date: 2026-02-03, 11:13:44 GMT
2+
# Date: 2026-02-03, 12:08:03 GMT
33
# © 2025 Unicode®, Inc.
44
# Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries.
55
# For terms of use and license, see https://www.unicode.org/terms_of_use.html
@@ -2154,6 +2154,7 @@ AB6C..AB6D ; 18.0 # [2] LATIN CAPITAL LETTER SCRIPT R..LATIN CAPITAL LETTER
21542154
191A0..191D2 ; 18.0 # [51] JURCHEN RADICAL-01..JURCHEN RADICAL-51
21552155
1B123..1B128 ; 18.0 # [6] HIRAGANA DIGRAPH KOTO..KATAKANA LETTER ALTERNATE WI
21562156
1B168 ; 18.0 # KATAKANA LETTER SMALL ARCHAIC YE
2157+
1CED2..1CED4 ; 18.0 # [3] ALCHEMICAL SYMBOL FOR OIL INVERTED..ALCHEMICAL SYMBOL FOR SALT OF TARTAR
21572158
1CEDD..1CEDF ; 18.0 # [3] SQUARE ROOT OF SQUARE ROOT..SQUARE ROOT OF SQUARE ROOT OF SQUARE ROOT OF SQUARE ROOT
21582159
1CEF1..1CEFD ; 18.0 # [13] LEIBNIZIAN DIVISION SIGN..HYPERBOLA
21592160
1D127..1D128 ; 18.0 # [2] MUSICAL SYMBOL COMBINING STRESS..MUSICAL SYMBOL COMBINING UNSTRESS
@@ -2177,6 +2178,6 @@ AB6C..AB6D ; 18.0 # [2] LATIN CAPITAL LETTER SCRIPT R..LATIN CAPITAL LETTER
21772178
2B81E ; 18.0 # CJK UNIFIED IDEOGRAPH-2B81E
21782179
3D000..3FC3F ; 18.0 # [11328] SEAL CHARACTER-3D000..SEAL CHARACTER-3FC3F
21792180

2180-
# Total code points: 13045
2181+
# Total code points: 13048
21812182

21822183
# EOF

unicodetools/data/ucd/dev/DerivedCoreProperties.txt

Lines changed: 3 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,5 @@
11
# DerivedCoreProperties-18.0.0.txt
2-
# Date: 2026-02-03, 11:13:48 GMT
2+
# Date: 2026-02-03, 12:08:07 GMT
33
# © 2025 Unicode®, Inc.
44
# Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries.
55
# For terms of use and license, see https://www.unicode.org/terms_of_use.html
@@ -13053,6 +13053,7 @@ FFFC..FFFD ; Grapheme_Base # So [2] OBJECT REPLACEMENT CHARACTER..REPLACEME
1305313053
1CCFA..1CCFC ; Grapheme_Base # So [3] SNAKE SYMBOL..NOSE SYMBOL
1305413054
1CD00..1CEB3 ; Grapheme_Base # So [436] BLOCK OCTANT-3..BLACK RIGHT TRIANGLE CARET
1305513055
1CEBA..1CED0 ; Grapheme_Base # So [23] FRAGILE SYMBOL..LEUKOTHEA
13056+
1CED2..1CED4 ; Grapheme_Base # So [3] ALCHEMICAL SYMBOL FOR OIL INVERTED..ALCHEMICAL SYMBOL FOR SALT OF TARTAR
1305613057
1CEDD..1CEDF ; Grapheme_Base # Sm [3] SQUARE ROOT OF SQUARE ROOT..SQUARE ROOT OF SQUARE ROOT OF SQUARE ROOT OF SQUARE ROOT
1305713058
1CEE0..1CEEF ; Grapheme_Base # So [16] GEOMANTIC FIGURE POPULUS..GEOMANTIC FIGURE VIA
1305813059
1CEF0..1CEFD ; Grapheme_Base # Sm [14] MEDIUM SMALL WHITE CIRCLE WITH HORIZONTAL BAR..HYPERBOLA
@@ -13252,7 +13253,7 @@ FFFC..FFFD ; Grapheme_Base # So [2] OBJECT REPLACEMENT CHARACTER..REPLACEME
1325213253
31350..33479 ; Grapheme_Base # Lo [8490] CJK UNIFIED IDEOGRAPH-31350..CJK UNIFIED IDEOGRAPH-33479
1325313254
3D000..3FC3F ; Grapheme_Base # Lo [11328] SEAL CHARACTER-3D000..SEAL CHARACTER-3FC3F
1325413255

13255-
# Total code points: 170500
13256+
# Total code points: 170503
1325613257

1325713258
# ================================================
1325813259

unicodetools/data/ucd/dev/EastAsianWidth.txt

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,5 @@
11
# EastAsianWidth-18.0.0.txt
2-
# Date: 2026-02-03, 11:13:54 GMT
2+
# Date: 2026-02-03, 12:08:13 GMT
33
# © 2025 Unicode®, Inc.
44
# Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries.
55
# For terms of use and license, see https://www.unicode.org/terms_of_use.html
@@ -2428,6 +2428,7 @@ FFFD ; A # So REPLACEMENT CHARACTER
24282428
1CD00..1CEB3 ; N # So [436] BLOCK OCTANT-3..BLACK RIGHT TRIANGLE CARET
24292429
1CEBA..1CEBF ; N # So [6] FRAGILE SYMBOL..STRAWBERRY SYMBOL
24302430
1CEC0..1CED0 ; N # So [17] HEBE..LEUKOTHEA
2431+
1CED2..1CED4 ; N # So [3] ALCHEMICAL SYMBOL FOR OIL INVERTED..ALCHEMICAL SYMBOL FOR SALT OF TARTAR
24312432
1CEDD..1CEDF ; N # Sm [3] SQUARE ROOT OF SQUARE ROOT..SQUARE ROOT OF SQUARE ROOT OF SQUARE ROOT OF SQUARE ROOT
24322433
1CEE0..1CEEF ; N # So [16] GEOMANTIC FIGURE POPULUS..GEOMANTIC FIGURE VIA
24332434
1CEF0..1CEFD ; N # Sm [14] MEDIUM SMALL WHITE CIRCLE WITH HORIZONTAL BAR..HYPERBOLA

unicodetools/data/ucd/dev/LineBreak.txt

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,5 @@
11
# LineBreak-18.0.0.txt
2-
# Date: 2026-02-03, 11:13:55 GMT
2+
# Date: 2026-02-03, 12:08:14 GMT
33
# © 2025 Unicode®, Inc.
44
# Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries.
55
# For terms of use and license, see https://www.unicode.org/terms_of_use.html
@@ -3341,6 +3341,7 @@ FFFD ; AI # So REPLACEMENT CHARACTER
33413341
1CD00..1CEB3 ; AL # So [436] BLOCK OCTANT-3..BLACK RIGHT TRIANGLE CARET
33423342
1CEBA..1CEBF ; AL # So [6] FRAGILE SYMBOL..STRAWBERRY SYMBOL
33433343
1CEC0..1CED0 ; AL # So [17] HEBE..LEUKOTHEA
3344+
1CED2..1CED4 ; AL # So [3] ALCHEMICAL SYMBOL FOR OIL INVERTED..ALCHEMICAL SYMBOL FOR SALT OF TARTAR
33443345
1CEDD..1CEDF ; AL # Sm [3] SQUARE ROOT OF SQUARE ROOT..SQUARE ROOT OF SQUARE ROOT OF SQUARE ROOT OF SQUARE ROOT
33453346
1CEE0..1CEEF ; AL # So [16] GEOMANTIC FIGURE POPULUS..GEOMANTIC FIGURE VIA
33463347
1CEF0..1CEFD ; AL # Sm [14] MEDIUM SMALL WHITE CIRCLE WITH HORIZONTAL BAR..HYPERBOLA

unicodetools/data/ucd/dev/Scripts.txt

Lines changed: 3 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,5 @@
11
# Scripts-18.0.0.txt
2-
# Date: 2026-02-03, 11:14:21 GMT
2+
# Date: 2026-02-03, 12:08:41 GMT
33
# © 2025 Unicode®, Inc.
44
# Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries.
55
# For terms of use and license, see https://www.unicode.org/terms_of_use.html
@@ -530,6 +530,7 @@ FFFC..FFFD ; Common # So [2] OBJECT REPLACEMENT CHARACTER..REPLACEMENT CHAR
530530
1CCFA..1CCFC ; Common # So [3] SNAKE SYMBOL..NOSE SYMBOL
531531
1CD00..1CEB3 ; Common # So [436] BLOCK OCTANT-3..BLACK RIGHT TRIANGLE CARET
532532
1CEBA..1CED0 ; Common # So [23] FRAGILE SYMBOL..LEUKOTHEA
533+
1CED2..1CED4 ; Common # So [3] ALCHEMICAL SYMBOL FOR OIL INVERTED..ALCHEMICAL SYMBOL FOR SALT OF TARTAR
533534
1CEDD..1CEDF ; Common # Sm [3] SQUARE ROOT OF SQUARE ROOT..SQUARE ROOT OF SQUARE ROOT OF SQUARE ROOT OF SQUARE ROOT
534535
1CEE0..1CEEF ; Common # So [16] GEOMANTIC FIGURE POPULUS..GEOMANTIC FIGURE VIA
535536
1CEF0..1CEFD ; Common # Sm [14] MEDIUM SMALL WHITE CIRCLE WITH HORIZONTAL BAR..HYPERBOLA
@@ -648,7 +649,7 @@ FFFC..FFFD ; Common # So [2] OBJECT REPLACEMENT CHARACTER..REPLACEMENT CHAR
648649
E0001 ; Common # Cf LANGUAGE TAG
649650
E0020..E007F ; Common # Cf [96] TAG SPACE..CANCEL TAG
650651

651-
# Total code points: 9273
652+
# Total code points: 9276
652653

653654
# ================================================
654655

unicodetools/data/ucd/dev/UnicodeData.txt

Lines changed: 3 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -33930,6 +33930,9 @@ FFFD;REPLACEMENT CHARACTER;So;0;ON;;;;;N;;;;;
3393033930
1CECE;BELLONA;So;0;ON;;;;;N;;;;;
3393133931
1CECF;AMPHITRITE;So;0;ON;;;;;N;;;;;
3393233932
1CED0;LEUKOTHEA;So;0;ON;;;;;N;;;;;
33933+
1CED2;ALCHEMICAL SYMBOL FOR OIL INVERTED;So;0;ON;;;;;N;;;;;
33934+
1CED3;ALCHEMICAL SYMBOL FOR MOON-JUPITER;So;0;ON;;;;;N;;;;;
33935+
1CED4;ALCHEMICAL SYMBOL FOR SALT OF TARTAR;So;0;ON;;;;;N;;;;;
3393333936
1CEDD;SQUARE ROOT OF SQUARE ROOT;Sm;0;ON;;;;;Y;;;;;
3393433937
1CEDE;SQUARE ROOT OF SQUARE ROOT OF SQUARE ROOT;Sm;0;ON;;;;;Y;;;;;
3393533938
1CEDF;SQUARE ROOT OF SQUARE ROOT OF SQUARE ROOT OF SQUARE ROOT;Sm;0;ON;;;;;Y;;;;;

unicodetools/data/ucd/dev/VerticalOrientation.txt

Lines changed: 4 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,5 @@
11
# VerticalOrientation-18.0.0.txt
2-
# Date: 2026-02-03, 11:14:24 GMT
2+
# Date: 2026-02-03, 12:08:44 GMT
33
# © 2025 Unicode®, Inc.
44
# Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries.
55
# For terms of use and license, see https://www.unicode.org/terms_of_use.html
@@ -2281,7 +2281,9 @@ FFFC..FFFD ; U # So [2] OBJECT REPLACEMENT CHARACTER..REPLACEMENT CHARA
22812281
1CD00..1CEB3 ; R # So [436] BLOCK OCTANT-3..BLACK RIGHT TRIANGLE CARET
22822282
1CEBA..1CEBF ; R # So [6] FRAGILE SYMBOL..STRAWBERRY SYMBOL
22832283
1CEC0..1CED0 ; U # So [17] HEBE..LEUKOTHEA
2284-
1CED1..1CEDC ; U # Cn [12] <reserved-1CED1>..<reserved-1CEDC>
2284+
1CED1 ; U # Cn <reserved-1CED1>
2285+
1CED2..1CED4 ; U # So [3] ALCHEMICAL SYMBOL FOR OIL INVERTED..ALCHEMICAL SYMBOL FOR SALT OF TARTAR
2286+
1CED5..1CEDC ; U # Cn [8] <reserved-1CED5>..<reserved-1CEDC>
22852287
1CEDD..1CEDF ; R # Sm [3] SQUARE ROOT OF SQUARE ROOT..SQUARE ROOT OF SQUARE ROOT OF SQUARE ROOT OF SQUARE ROOT
22862288
1CEE0..1CEEF ; U # So [16] GEOMANTIC FIGURE POPULUS..GEOMANTIC FIGURE VIA
22872289
1CEF0 ; U # Sm MEDIUM SMALL WHITE CIRCLE WITH HORIZONTAL BAR

unicodetools/data/ucd/dev/extracted/DerivedBidiClass.txt

Lines changed: 5 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,5 @@
11
# DerivedBidiClass-18.0.0.txt
2-
# Date: 2026-02-03, 11:13:46 GMT
2+
# Date: 2026-02-03, 12:08:05 GMT
33
# © 2025 Unicode®, Inc.
44
# Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries.
55
# For terms of use and license, see https://www.unicode.org/terms_of_use.html
@@ -1253,8 +1253,8 @@ FFDA..FFDC ; L # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGUL LETTER
12531253
F0000..FFFFD ; L # Co [65534] <private-use-F0000>..<private-use-FFFFD>
12541254
100000..10FFFD; L # Co [65534] <private-use-100000>..<private-use-10FFFD>
12551255

1256-
# The above property value applies to 797614 code points not listed here.
1257-
# Total code points: 1095316
1256+
# The above property value applies to 797611 code points not listed here.
1257+
# Total code points: 1095313
12581258

12591259
# ================================================
12601260

@@ -1992,6 +1992,7 @@ FFFC..FFFD ; ON # So [2] OBJECT REPLACEMENT CHARACTER..REPLACEMENT CHARACTE
19921992
1CCFA..1CCFC ; ON # So [3] SNAKE SYMBOL..NOSE SYMBOL
19931993
1CD00..1CEB3 ; ON # So [436] BLOCK OCTANT-3..BLACK RIGHT TRIANGLE CARET
19941994
1CEBA..1CED0 ; ON # So [23] FRAGILE SYMBOL..LEUKOTHEA
1995+
1CED2..1CED4 ; ON # So [3] ALCHEMICAL SYMBOL FOR OIL INVERTED..ALCHEMICAL SYMBOL FOR SALT OF TARTAR
19951996
1CEDD..1CEDF ; ON # Sm [3] SQUARE ROOT OF SQUARE ROOT..SQUARE ROOT OF SQUARE ROOT OF SQUARE ROOT OF SQUARE ROOT
19961997
1CEE0..1CEEF ; ON # So [16] GEOMANTIC FIGURE POPULUS..GEOMANTIC FIGURE VIA
19971998
1CEF0..1CEFD ; ON # Sm [14] MEDIUM SMALL WHITE CIRCLE WITH HORIZONTAL BAR..HYPERBOLA
@@ -2051,7 +2052,7 @@ FFFC..FFFD ; ON # So [2] OBJECT REPLACEMENT CHARACTER..REPLACEMENT CHARACTE
20512052
1FB94..1FBEF ; ON # So [92] LEFT HALF INVERSE MEDIUM SHADE AND RIGHT HALF BLOCK..TOP LEFT JUSTIFIED LOWER RIGHT QUARTER BLACK CIRCLE
20522053
1FBFA ; ON # So ALARM BELL SYMBOL
20532054

2054-
# Total code points: 6929
2055+
# Total code points: 6932
20552056

20562057
# ================================================
20572058

unicodetools/data/ucd/dev/extracted/DerivedCombiningClass.txt

Lines changed: 3 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,5 @@
11
# DerivedCombiningClass-18.0.0.txt
2-
# Date: 2026-02-03, 11:13:47 GMT
2+
# Date: 2026-02-03, 12:08:06 GMT
33
# © 2025 Unicode®, Inc.
44
# Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries.
55
# For terms of use and license, see https://www.unicode.org/terms_of_use.html
@@ -1900,6 +1900,7 @@ FFFC..FFFD ; 0 # So [2] OBJECT REPLACEMENT CHARACTER..REPLACEMENT CHARACTER
19001900
1CCFA..1CCFC ; 0 # So [3] SNAKE SYMBOL..NOSE SYMBOL
19011901
1CD00..1CEB3 ; 0 # So [436] BLOCK OCTANT-3..BLACK RIGHT TRIANGLE CARET
19021902
1CEBA..1CED0 ; 0 # So [23] FRAGILE SYMBOL..LEUKOTHEA
1903+
1CED2..1CED4 ; 0 # So [3] ALCHEMICAL SYMBOL FOR OIL INVERTED..ALCHEMICAL SYMBOL FOR SALT OF TARTAR
19031904
1CEDD..1CEDF ; 0 # Sm [3] SQUARE ROOT OF SQUARE ROOT..SQUARE ROOT OF SQUARE ROOT OF SQUARE ROOT OF SQUARE ROOT
19041905
1CEE0..1CEEF ; 0 # So [16] GEOMANTIC FIGURE POPULUS..GEOMANTIC FIGURE VIA
19051906
1CEF0..1CEFD ; 0 # Sm [14] MEDIUM SMALL WHITE CIRCLE WITH HORIZONTAL BAR..HYPERBOLA
@@ -2113,7 +2114,7 @@ E0100..E01EF ; 0 # Mn [240] VARIATION SELECTOR-17..VARIATION SELECTOR-256
21132114
F0000..FFFFD ; 0 # Co [65534] <private-use-F0000>..<private-use-FFFFD>
21142115
100000..10FFFD; 0 # Co [65534] <private-use-100000>..<private-use-10FFFD>
21152116

2116-
# The above property value applies to 803733 code points not listed here.
2117+
# The above property value applies to 803730 code points not listed here.
21172118
# Total code points: 1113109
21182119

21192120
# ================================================

0 commit comments

Comments
 (0)