Skip to content

Commit 8bcdbe3

Browse files
committed
data: update to UCD 16
1 parent d3d3ff7 commit 8bcdbe3

File tree

12 files changed

+2064
-595
lines changed

12 files changed

+2064
-595
lines changed

regex-automata/src/util/unicode_data/perl_word.rs

Lines changed: 45 additions & 20 deletions
Original file line numberDiff line numberDiff line change
@@ -1,10 +1,10 @@
11
// DO NOT EDIT THIS FILE. IT WAS AUTOMATICALLY GENERATED BY:
22
//
3-
// ucd-generate perl-word tmp/ucd-15.0.0/ --chars
3+
// ucd-generate perl-word ucd-16.0.0 --chars
44
//
5-
// Unicode version: 15.0.0.
5+
// Unicode version: 16.0.0.
66
//
7-
// ucd-generate 0.2.15 is available on crates.io.
7+
// ucd-generate 0.3.1 is available on crates.io.
88

99
pub const PERL_WORD: &'static [(char, char)] = &[
1010
('0', '9'),
@@ -59,7 +59,7 @@ pub const PERL_WORD: &'static [(char, char)] = &[
5959
('ࡠ', 'ࡪ'),
6060
('ࡰ', 'ࢇ'),
6161
('ࢉ', 'ࢎ'),
62-
('\u{898}', '\u{8e1}'),
62+
('\u{897}', '\u{8e1}'),
6363
('\u{8e3}', '\u{963}'),
6464
('०', '९'),
6565
('ॱ', 'ঃ'),
@@ -158,8 +158,8 @@ pub const PERL_WORD: &'static [(char, char)] = &[
158158
('ಪ', 'ಳ'),
159159
('ವ', 'ಹ'),
160160
('\u{cbc}', 'ೄ'),
161-
('\u{cc6}', ''),
162-
('', '\u{ccd}'),
161+
('\u{cc6}', '\u{cc8}'),
162+
('\u{cca}', '\u{ccd}'),
163163
('\u{cd5}', '\u{cd6}'),
164164
('ೝ', 'ೞ'),
165165
('ೠ', '\u{ce3}'),
@@ -243,8 +243,8 @@ pub const PERL_WORD: &'static [(char, char)] = &[
243243
('ᚁ', 'ᚚ'),
244244
('ᚠ', 'ᛪ'),
245245
('ᛮ', 'ᛸ'),
246-
('ᜀ', ''),
247-
('ᜟ', ''),
246+
('ᜀ', '\u{1715}'),
247+
('ᜟ', '\u{1734}'),
248248
('ᝀ', '\u{1753}'),
249249
('ᝠ', 'ᝬ'),
250250
('ᝮ', 'ᝰ'),
@@ -276,11 +276,11 @@ pub const PERL_WORD: &'static [(char, char)] = &[
276276
('\u{1b00}', 'ᭌ'),
277277
('᭐', '᭙'),
278278
('\u{1b6b}', '\u{1b73}'),
279-
('\u{1b80}', ''),
279+
('\u{1b80}', '\u{1bf3}'),
280280
('ᰀ', '\u{1c37}'),
281281
('᱀', '᱉'),
282282
('ᱍ', 'ᱽ'),
283-
('ᲀ', ''),
283+
('ᲀ', ''),
284284
('Ა', 'Ჺ'),
285285
('Ჽ', 'Ჿ'),
286286
('\u{1cd0}', '\u{1cd2}'),
@@ -367,10 +367,10 @@ pub const PERL_WORD: &'static [(char, char)] = &[
367367
('ꙿ', '\u{a6f1}'),
368368
('ꜗ', 'ꜟ'),
369369
('Ꜣ', 'ꞈ'),
370-
('Ꞌ', ''),
370+
('Ꞌ', ''),
371371
('Ꟑ', 'ꟑ'),
372372
('ꟓ', 'ꟓ'),
373-
('ꟕ', ''),
373+
('ꟕ', ''),
374374
('ꟲ', 'ꠧ'),
375375
('\u{a82c}', '\u{a82c}'),
376376
('ꡀ', 'ꡳ'),
@@ -379,9 +379,9 @@ pub const PERL_WORD: &'static [(char, char)] = &[
379379
('\u{a8e0}', 'ꣷ'),
380380
('ꣻ', 'ꣻ'),
381381
('ꣽ', '\u{a92d}'),
382-
('ꤰ', ''),
382+
('ꤰ', '\u{a953}'),
383383
('ꥠ', 'ꥼ'),
384-
('\u{a980}', ''),
384+
('\u{a980}', '\u{a9c0}'),
385385
('ꧏ', '꧙'),
386386
('ꧠ', 'ꧾ'),
387387
('ꨀ', '\u{aa36}'),
@@ -468,6 +468,7 @@ pub const PERL_WORD: &'static [(char, char)] = &[
468468
('𐖣', '𐖱'),
469469
('𐖳', '𐖹'),
470470
('𐖻', '𐖼'),
471+
('𐗀', '𐗳'),
471472
('𐘀', '𐜶'),
472473
('𐝀', '𐝕'),
473474
('𐝠', '𐝧'),
@@ -508,10 +509,14 @@ pub const PERL_WORD: &'static [(char, char)] = &[
508509
('𐳀', '𐳲'),
509510
('𐴀', '\u{10d27}'),
510511
('𐴰', '𐴹'),
512+
('𐵀', '𐵥'),
513+
('\u{10d69}', '\u{10d6d}'),
514+
('𐵯', '𐶅'),
511515
('𐺀', '𐺩'),
512516
('\u{10eab}', '\u{10eac}'),
513517
('𐺰', '𐺱'),
514-
('\u{10efd}', '𐼜'),
518+
('𐻂', '𐻄'),
519+
('\u{10efc}', '𐼜'),
515520
('𐼧', '𐼧'),
516521
('𐼰', '\u{10f50}'),
517522
('𐽰', '\u{10f85}'),
@@ -551,12 +556,22 @@ pub const PERL_WORD: &'static [(char, char)] = &[
551556
('𑌵', '𑌹'),
552557
('\u{1133b}', '𑍄'),
553558
('𑍇', '𑍈'),
554-
('𑍋', '𑍍'),
559+
('𑍋', '\u{1134d}'),
555560
('𑍐', '𑍐'),
556561
('\u{11357}', '\u{11357}'),
557562
('𑍝', '𑍣'),
558563
('\u{11366}', '\u{1136c}'),
559564
('\u{11370}', '\u{11374}'),
565+
('𑎀', '𑎉'),
566+
('𑎋', '𑎋'),
567+
('𑎎', '𑎎'),
568+
('𑎐', '𑎵'),
569+
('𑎷', '\u{113c0}'),
570+
('\u{113c2}', '\u{113c2}'),
571+
('\u{113c5}', '\u{113c5}'),
572+
('\u{113c7}', '𑏊'),
573+
('𑏌', '𑏓'),
574+
('\u{113e1}', '\u{113e2}'),
560575
('𑐀', '𑑊'),
561576
('𑑐', '𑑙'),
562577
('\u{1145e}', '𑑡'),
@@ -571,6 +586,7 @@ pub const PERL_WORD: &'static [(char, char)] = &[
571586
('𑙐', '𑙙'),
572587
('𑚀', '𑚸'),
573588
('𑛀', '𑛉'),
589+
('𑛐', '𑛣'),
574590
('𑜀', '𑜚'),
575591
('\u{1171d}', '\u{1172b}'),
576592
('𑜰', '𑜹'),
@@ -594,6 +610,8 @@ pub const PERL_WORD: &'static [(char, char)] = &[
594610
('𑩐', '\u{11a99}'),
595611
('𑪝', '𑪝'),
596612
('𑪰', '𑫸'),
613+
('𑯀', '𑯠'),
614+
('𑯰', '𑯹'),
597615
('𑰀', '𑰈'),
598616
('𑰊', '\u{11c36}'),
599617
('\u{11c38}', '𑱀'),
@@ -618,15 +636,17 @@ pub const PERL_WORD: &'static [(char, char)] = &[
618636
('\u{11f00}', '𑼐'),
619637
('𑼒', '\u{11f3a}'),
620638
('𑼾', '\u{11f42}'),
621-
('𑽐', '𑽙'),
639+
('𑽐', '\u{11f5a}'),
622640
('𑾰', '𑾰'),
623641
('𒀀', '𒎙'),
624642
('𒐀', '𒑮'),
625643
('𒒀', '𒕃'),
626644
('𒾐', '𒿰'),
627645
('𓀀', '𓐯'),
628646
('\u{13440}', '\u{13455}'),
647+
('𓑠', '𔏺'),
629648
('𔐀', '𔙆'),
649+
('𖄀', '𖄹'),
630650
('𖠀', '𖨸'),
631651
('𖩀', '𖩞'),
632652
('𖩠', '𖩩'),
@@ -639,16 +659,18 @@ pub const PERL_WORD: &'static [(char, char)] = &[
639659
('𖭐', '𖭙'),
640660
('𖭣', '𖭷'),
641661
('𖭽', '𖮏'),
662+
('𖵀', '𖵬'),
663+
('𖵰', '𖵹'),
642664
('𖹀', '𖹿'),
643665
('𖼀', '𖽊'),
644666
('\u{16f4f}', '𖾇'),
645667
('\u{16f8f}', '𖾟'),
646668
('𖿠', '𖿡'),
647669
('𖿣', '\u{16fe4}'),
648-
('𖿰', '𖿱'),
670+
('\u{16ff0}', '\u{16ff1}'),
649671
('𗀀', '𘟷'),
650672
('𘠀', '𘳕'),
651-
('𘴀', '𘴈'),
673+
('𘳿', '𘴈'),
652674
('𚿰', '𚿳'),
653675
('𚿵', '𚿻'),
654676
('𚿽', '𚿾'),
@@ -663,10 +685,11 @@ pub const PERL_WORD: &'static [(char, char)] = &[
663685
('𛲀', '𛲈'),
664686
('𛲐', '𛲙'),
665687
('\u{1bc9d}', '\u{1bc9e}'),
688+
('𜳰', '𜳹'),
666689
('\u{1cf00}', '\u{1cf2d}'),
667690
('\u{1cf30}', '\u{1cf46}'),
668691
('\u{1d165}', '\u{1d169}'),
669-
('𝅭', '\u{1d172}'),
692+
('\u{1d16d}', '\u{1d172}'),
670693
('\u{1d17b}', '\u{1d182}'),
671694
('\u{1d185}', '\u{1d18b}'),
672695
('\u{1d1aa}', '\u{1d1ad}'),
@@ -724,6 +747,7 @@ pub const PERL_WORD: &'static [(char, char)] = &[
724747
('𞊐', '\u{1e2ae}'),
725748
('𞋀', '𞋹'),
726749
('𞓐', '𞓹'),
750+
('𞗐', '𞗺'),
727751
('𞟠', '𞟦'),
728752
('𞟨', '𞟫'),
729753
('𞟭', '𞟮'),
@@ -774,6 +798,7 @@ pub const PERL_WORD: &'static [(char, char)] = &[
774798
('𫝀', '𫠝'),
775799
('𫠠', '𬺡'),
776800
('𬺰', '𮯠'),
801+
('𮯰', '𮹝'),
777802
('丽', '𪘀'),
778803
('𰀀', '𱍊'),
779804
('𱍐', '𲎯'),

regex-syntax/src/unicode_tables/age.rs

Lines changed: 66 additions & 11 deletions
Original file line numberDiff line numberDiff line change
@@ -1,10 +1,10 @@
11
// DO NOT EDIT THIS FILE. IT WAS AUTOMATICALLY GENERATED BY:
22
//
3-
// ucd-generate age ucd-15.0.0 --chars
3+
// ucd-generate age ucd-16.0.0 --chars
44
//
5-
// Unicode version: 15.0.0.
5+
// Unicode version: 16.0.0.
66
//
7-
// ucd-generate 0.2.14 is available on crates.io.
7+
// ucd-generate 0.3.1 is available on crates.io.
88

99
pub const BY_NAME: &'static [(&'static str, &'static [(char, char)])] = &[
1010
("V10_0", V10_0),
@@ -14,6 +14,8 @@ pub const BY_NAME: &'static [(&'static str, &'static [(char, char)])] = &[
1414
("V13_0", V13_0),
1515
("V14_0", V14_0),
1616
("V15_0", V15_0),
17+
("V15_1", V15_1),
18+
("V16_0", V16_0),
1719
("V1_1", V1_1),
1820
("V2_0", V2_0),
1921
("V2_1", V2_1),
@@ -238,7 +240,7 @@ pub const V13_0: &'static [(char, char)] = &[
238240
('𑥐', '𑥙'),
239241
('𑾰', '𑾰'),
240242
('\u{16fe4}', '\u{16fe4}'),
241-
('𖿰', '𖿱'),
243+
('\u{16ff0}', '\u{16ff1}'),
242244
('𘫳', '𘳕'),
243245
('𘴀', '𘴈'),
244246
('🄍', '🄏'),
@@ -277,7 +279,7 @@ pub const V14_0: &'static [(char, char)] = &[
277279
('ౝ', 'ౝ'),
278280
('ೝ', 'ೝ'),
279281
('ᜍ', 'ᜍ'),
280-
('', ''),
282+
('\u{1715}', '\u{1715}'),
281283
('ᜟ', 'ᜟ'),
282284
('\u{180f}', '\u{180f}'),
283285
('\u{1ac1}', '\u{1ace}'),
@@ -382,6 +384,59 @@ pub const V15_0: &'static [(char, char)] = &[
382384
('𱍐', '𲎯'),
383385
];
384386

387+
pub const V15_1: &'static [(char, char)] =
388+
&[('⿼', '⿿'), ('㇯', '㇯'), ('𮯰', '𮹝')];
389+
390+
pub const V16_0: &'static [(char, char)] = &[
391+
('\u{897}', '\u{897}'),
392+
('᭎', '᭏'),
393+
('᭿', '᭿'),
394+
('Ᲊ', 'ᲊ'),
395+
('␧', '␩'),
396+
('㇤', '㇥'),
397+
('Ɤ', 'ꟍ'),
398+
('Ꟛ', 'Ƛ'),
399+
('𐗀', '𐗳'),
400+
('𐵀', '𐵥'),
401+
('\u{10d69}', '𐶅'),
402+
('𐶎', '𐶏'),
403+
('𐻂', '𐻄'),
404+
('\u{10efc}', '\u{10efc}'),
405+
('𑎀', '𑎉'),
406+
('𑎋', '𑎋'),
407+
('𑎎', '𑎎'),
408+
('𑎐', '𑎵'),
409+
('𑎷', '\u{113c0}'),
410+
('\u{113c2}', '\u{113c2}'),
411+
('\u{113c5}', '\u{113c5}'),
412+
('\u{113c7}', '𑏊'),
413+
('𑏌', '𑏕'),
414+
('𑏗', '𑏘'),
415+
('\u{113e1}', '\u{113e2}'),
416+
('𑛐', '𑛣'),
417+
('𑯀', '𑯡'),
418+
('𑯰', '𑯹'),
419+
('\u{11f5a}', '\u{11f5a}'),
420+
('𓑠', '𔏺'),
421+
('𖄀', '𖄹'),
422+
('𖵀', '𖵹'),
423+
('𘳿', '𘳿'),
424+
('𜰀', '𜳹'),
425+
('𜴀', '𜺳'),
426+
('𞗐', '𞗺'),
427+
('𞗿', '𞗿'),
428+
('🢲', '🢻'),
429+
('🣀', '🣁'),
430+
('🪉', '🪉'),
431+
('🪏', '🪏'),
432+
('🪾', '🪾'),
433+
('🫆', '🫆'),
434+
('🫜', '🫜'),
435+
('🫟', '🫟'),
436+
('🫩', '🫩'),
437+
('🯋', '🯯'),
438+
];
439+
385440
pub const V1_1: &'static [(char, char)] = &[
386441
('\0', 'ǵ'),
387442
('Ǻ', 'ȗ'),
@@ -530,8 +585,8 @@ pub const V1_1: &'static [(char, char)] = &[
530585
('ಪ', 'ಳ'),
531586
('ವ', 'ಹ'),
532587
('ಾ', 'ೄ'),
533-
('\u{cc6}', ''),
534-
('', '\u{ccd}'),
588+
('\u{cc6}', '\u{cc8}'),
589+
('\u{cca}', '\u{ccd}'),
535590
('\u{cd5}', '\u{cd6}'),
536591
('ೞ', 'ೞ'),
537592
('ೠ', 'ೡ'),
@@ -1174,7 +1229,7 @@ pub const V5_1: &'static [(char, char)] = &[
11741229
('ၚ', '႙'),
11751230
('႞', '႟'),
11761231
('ᢪ', 'ᢪ'),
1177-
('\u{1b80}', ''),
1232+
('\u{1b80}', '\u{1baa}'),
11781233
('ᮮ', '᮹'),
11791234
('ᰀ', '\u{1c37}'),
11801235
('᰻', '᱉'),
@@ -1212,7 +1267,7 @@ pub const V5_1: &'static [(char, char)] = &[
12121267
('ꟻ', 'ꟿ'),
12131268
('ꢀ', '\u{a8c4}'),
12141269
('꣎', '꣙'),
1215-
('꤀', ''),
1270+
('꤀', '\u{a953}'),
12161271
('꥟', '꥟'),
12171272
('ꨀ', '\u{aa36}'),
12181273
('ꩀ', 'ꩍ'),
@@ -1340,7 +1395,7 @@ pub const V6_0: &'static [(char, char)] = &[
13401395
('ྌ', '\u{f8f}'),
13411396
('࿙', '࿚'),
13421397
('\u{135d}', '\u{135e}'),
1343-
('ᯀ', ''),
1398+
('ᯀ', '\u{1bf3}'),
13441399
('᯼', '᯿'),
13451400
('\u{1dfc}', '\u{1dfc}'),
13461401
('ₕ', 'ₜ'),
@@ -1606,7 +1661,7 @@ pub const V7_0: &'static [(char, char)] = &[
16061661
('𑌵', '𑌹'),
16071662
('\u{1133c}', '𑍄'),
16081663
('𑍇', '𑍈'),
1609-
('𑍋', '𑍍'),
1664+
('𑍋', '\u{1134d}'),
16101665
('\u{11357}', '\u{11357}'),
16111666
('𑍝', '𑍣'),
16121667
('\u{11366}', '\u{1136c}'),

0 commit comments

Comments
 (0)