|
1 | 1 | # unidata-16.0.0.txt |
2 | | -# Date: 2023-10-07, 00:00:00 GMT [KW] |
| 2 | +# Date: 2023-10-08, 00:00:00 GMT [KW] |
3 | 3 | # © 2023 Unicode®, Inc. |
4 | 4 | # For terms of use, see https://www.unicode.org/terms_of_use.html |
5 | 5 | # |
|
9 | 9 | # Default Unicode Collation Element Table (DUCET) for |
10 | 10 | # the Unicode Collation Algorithm. |
11 | 11 | # |
12 | | -# Version 16.0.0 draft 5 (Unicode Version: 16.0.0) |
| 12 | +# Version 16.0.0 draft 6 (Unicode Version: 16.0.0) |
13 | 13 | # based on Unicode data file UnicodeData-16.0.0d7.txt |
14 | 14 | # Ordering for Unicode 16.0 |
15 | 15 | # |
@@ -21399,16 +21399,16 @@ DEFAULT |
21399 | 21399 |
|
21400 | 21400 | # Kannada two-part vowels collate as units, not |
21401 | 21401 | # by their decompositions. |
21402 | | -# Added a second decomposition for 0CCB, to deal with |
21403 | | -# the canonical equivalence of 0CCA --> 0CC6 0CC2 |
21404 | 21402 |
|
21405 | 21403 | CONTRACTION |
21406 | 21404 |
|
21407 | 21405 | 0CC7;KANNADA VOWEL SIGN EE;Mc;0CC6 0CD5;;;;; |
21408 | 21406 | 0CC8;KANNADA VOWEL SIGN AI;Mc;0CC6 0CD6;;;;; |
21409 | 21407 | 0CCA;KANNADA VOWEL SIGN O;Mc;0CC6 0CC2;;;;; |
21410 | | -#0CCB;KANNADA VOWEL SIGN OO;Mc;0CC6 0CC2 0CD5;;;;; |
21411 | | -0CCB;KANNADA VOWEL SIGN OO;Mc;0CC6 0CC2 0CD5, 0CCA 0CD5;;;;; |
| 21408 | +# Added a second decomposition for 0CCB, to deal with |
| 21409 | +# the canonical equivalence of 0CCA --> 0CC6 0CC2 |
| 21410 | +#0CCB;KANNADA VOWEL SIGN OO;Mc;0CCA 0CD5;;;;; |
| 21411 | +0CCB;KANNADA VOWEL SIGN OO;Mc;0CCA 0CD5, 0CC6 0CC2 0CD5;;;;; |
21412 | 21412 |
|
21413 | 21413 | DEFAULT |
21414 | 21414 |
|
@@ -21636,14 +21636,15 @@ DEFAULT |
21636 | 21636 |
|
21637 | 21637 | # Sinhala two-part vowels collate as units, not |
21638 | 21638 | # by their decompositions. |
21639 | | -# |
21640 | | -# A second decomposition is added for 0DDD, to deal |
21641 | | -# with the canonical equivalence of 0DDC -> 0DD9 0DCF |
21642 | 21639 |
|
21643 | 21640 | CONTRACTION |
21644 | 21641 |
|
21645 | 21642 | 0DDC;SINHALA VOWEL SIGN KOMBUVA HAA AELA-PILLA;Mc;0DD9 0DCF;;;;; |
21646 | | -0DDD;SINHALA VOWEL SIGN KOMBUVA HAA DIGA AELA-PILLA;Mc;0DD9 0DCF 0DCA, 0DDC 0DCA;;;;; |
| 21643 | +# A second decomposition is added for 0DDD, to deal |
| 21644 | +# with the canonical equivalence of 0DDC -> 0DD9 0DCF |
| 21645 | +# in order to maintain canonical closure. |
| 21646 | +# 0DDD;SINHALA VOWEL SIGN KOMBUVA HAA DIGA AELA-PILLA;Mc;0DDC 0DCA;;;;; |
| 21647 | +0DDD;SINHALA VOWEL SIGN KOMBUVA HAA DIGA AELA-PILLA;Mc;0DDC 0DCA, 0DD9 0DCF 0DCA;;;;; |
21647 | 21648 | 0DDE;SINHALA VOWEL SIGN KOMBUVA HAA GAYANUKITTA;Mc;0DD9 0DDF;;;;; |
21648 | 21649 |
|
21649 | 21650 | DEFAULT |
@@ -33774,6 +33775,66 @@ A4F7;LISU LETTER OE;Lo;;;;;; |
33774 | 33775 | 16ABD;TANGSA LETTER CHA;Lo;;;;;; |
33775 | 33776 | 16ABE;TANGSA LETTER ZA;Lo;;;;;; |
33776 | 33777 |
|
| 33778 | +# Kirat Rai script starts here |
| 33779 | + |
| 33780 | +16D40;KIRAT RAI SIGN ANUSVARA;Lm;;;;;; |
| 33781 | +16D41;KIRAT RAI SIGN TONPI;Lm;;;;;; |
| 33782 | +16D42;KIRAT RAI SIGN VISARGA;Lm;;;;;; |
| 33783 | +16D43;KIRAT RAI LETTER A;Lo;;;;;; |
| 33784 | +16D44;KIRAT RAI LETTER KA;Lo;;;;;; |
| 33785 | +16D45;KIRAT RAI LETTER KHA;Lo;;;;;; |
| 33786 | +16D46;KIRAT RAI LETTER GA;Lo;;;;;; |
| 33787 | +16D47;KIRAT RAI LETTER GHA;Lo;;;;;; |
| 33788 | +16D48;KIRAT RAI LETTER NGA;Lo;;;;;; |
| 33789 | +16D49;KIRAT RAI LETTER CA;Lo;;;;;; |
| 33790 | +16D4A;KIRAT RAI LETTER CHA;Lo;;;;;; |
| 33791 | +16D4B;KIRAT RAI LETTER JA;Lo;;;;;; |
| 33792 | +16D4C;KIRAT RAI LETTER JHA;Lo;;;;;; |
| 33793 | +16D4D;KIRAT RAI LETTER NYA;Lo;;;;;; |
| 33794 | +16D4E;KIRAT RAI LETTER TTA;Lo;;;;;; |
| 33795 | +16D4F;KIRAT RAI LETTER TTHA;Lo;;;;;; |
| 33796 | +16D50;KIRAT RAI LETTER DDA;Lo;;;;;; |
| 33797 | +16D51;KIRAT RAI LETTER DDHA;Lo;;;;;; |
| 33798 | +16D52;KIRAT RAI LETTER TA;Lo;;;;;; |
| 33799 | +16D53;KIRAT RAI LETTER THA;Lo;;;;;; |
| 33800 | +16D54;KIRAT RAI LETTER DA;Lo;;;;;; |
| 33801 | +16D55;KIRAT RAI LETTER DHA;Lo;;;;;; |
| 33802 | +16D56;KIRAT RAI LETTER NA;Lo;;;;;; |
| 33803 | +16D57;KIRAT RAI LETTER PA;Lo;;;;;; |
| 33804 | +16D58;KIRAT RAI LETTER PHA;Lo;;;;;; |
| 33805 | +16D59;KIRAT RAI LETTER BA;Lo;;;;;; |
| 33806 | +16D5A;KIRAT RAI LETTER BHA;Lo;;;;;; |
| 33807 | +16D5B;KIRAT RAI LETTER MA;Lo;;;;;; |
| 33808 | +16D5C;KIRAT RAI LETTER YA;Lo;;;;;; |
| 33809 | +16D5D;KIRAT RAI LETTER RA;Lo;;;;;; |
| 33810 | +16D5E;KIRAT RAI LETTER LA;Lo;;;;;; |
| 33811 | +16D5F;KIRAT RAI LETTER VA;Lo;;;;;; |
| 33812 | +16D60;KIRAT RAI LETTER SA;Lo;;;;;; |
| 33813 | +16D61;KIRAT RAI LETTER SHA;Lo;;;;;; |
| 33814 | +16D62;KIRAT RAI LETTER HA;Lo;;;;;; |
| 33815 | +16D63;KIRAT RAI VOWEL SIGN AA;Lo;;;;;; |
| 33816 | +16D64;KIRAT RAI VOWEL SIGN I;Lo;;;;;; |
| 33817 | +16D65;KIRAT RAI VOWEL SIGN U;Lo;;;;;; |
| 33818 | +16D66;KIRAT RAI VOWEL SIGN UE;Lo;;;;;; |
| 33819 | +16D67;KIRAT RAI VOWEL SIGN E;Lo;;;;;; |
| 33820 | + |
| 33821 | +# Kirat Rai two-part and three-part vowels collate as units, not |
| 33822 | +# by their decompositions. |
| 33823 | + |
| 33824 | +CONTRACTION |
| 33825 | + |
| 33826 | +16D68;KIRAT RAI VOWEL SIGN AI;Lo;16D67 16D67;;;;; |
| 33827 | +16D69;KIRAT RAI VOWEL SIGN O;Lo;16D63 16D67;;;;; |
| 33828 | +# The vowel sign AU decomposes recursively (16D69 is itself 16D63 16D67). |
| 33829 | +# Add a secondary decomposition to 16D6A for canonical closure. |
| 33830 | +# 16D6A;KIRAT RAI VOWEL SIGN AU;Lo;16D69 16D67;;;;; |
| 33831 | +16D6A;KIRAT RAI VOWEL SIGN AU;Lo;16D69 16D67, 16D63 16D67 16D67;;;;; |
| 33832 | + |
| 33833 | +DEFAULT |
| 33834 | + |
| 33835 | +16D6B;KIRAT RAI SIGN VIRAMA;Lm;;;;;; |
| 33836 | +16D6C;KIRAT RAI SIGN SAAT;Lm;;;;;; |
| 33837 | + |
33777 | 33838 | # Aegean syllabic scripts start here |
33778 | 33839 |
|
33779 | 33840 | # Linear B script starts here |
|
0 commit comments