Skip to content

Commit c1dd3ea

Browse files
committed
New confusables data based on L2/22-108: generated data
1 parent fe8a53a commit c1dd3ea

File tree

2 files changed

+43
-10
lines changed

2 files changed

+43
-10
lines changed

unicodetools/data/security/dev/data/confusablesSummaryIdentifier.txt

Lines changed: 32 additions & 9 deletions
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,5 @@
11
# confusablesSummaryIdentifier.txt
2-
# Date: 2025-07-13, 16:46:41 GMT
2+
# Date: 2025-07-20, 15:54:57 GMT
33
# © 2025 Unicode®, Inc.
44
# Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries.
55
# For terms of use and license, see https://www.unicode.org/terms_of_use.html
@@ -489,9 +489,10 @@
489489
(‎ ́ ‎) 0301 COMBINING ACUTE ACCENT
490490
← (‎ َ ‎) 064E ARABIC FATHA
491491

492-
# ̆ ̌
492+
# ̆ ̌
493493
(‎ ̆ ‎) 0306 COMBINING BREVE
494494
← (‎ ̌ ‎) 030C COMBINING CARON
495+
← (‎ ॅ ‎) 0945 DEVANAGARI VOWEL SIGN CANDRA E
495496

496497
# ̆̇ ँ ঁ ଁ
497498
(‎ ̆̇ ‎) 0306 0307 COMBINING BREVE, COMBINING DOT ABOVE
@@ -743,10 +744,21 @@
743744
(‎ ݧ ‎) 0767 ARABIC LETTER NOON WITH TWO DOTS BELOW
744745
← (‎ ࢩ ‎) 08A9 ARABIC LETTER YEH WITH TWO DOTS BELOW AND DOT ABOVE # →‎ݔ‎→
745746

747+
# अ̆ अॅ ॲ
748+
(‎ अ̆ ‎) 0905 0306 DEVANAGARI LETTER A, COMBINING BREVE
749+
← (‎ अॅ ‎) 0905 0945 DEVANAGARI LETTER A, DEVANAGARI VOWEL SIGN CANDRA E
750+
← (‎ ॲ ‎) 0972 DEVANAGARI LETTER CANDRA A # →अॅ→
751+
746752
# अा आ
747753
(‎ अा ‎) 0905 093E DEVANAGARI LETTER A, DEVANAGARI VOWEL SIGN AA
748754
← (‎ आ ‎) 0906 DEVANAGARI LETTER AA
749755

756+
# अा̆ अाॅ अॉ ऑ
757+
(‎ अा̆ ‎) 0905 093E 0306 DEVANAGARI LETTER A, DEVANAGARI VOWEL SIGN AA, COMBINING BREVE
758+
← (‎ अाॅ ‎) 0905 093E 0945 DEVANAGARI LETTER A, DEVANAGARI VOWEL SIGN AA, DEVANAGARI VOWEL SIGN CANDRA E # →अॉ→
759+
← (‎ अॉ ‎) 0905 0949 DEVANAGARI LETTER A, DEVANAGARI VOWEL SIGN CANDRA O
760+
← (‎ ऑ ‎) 0911 DEVANAGARI LETTER CANDRA O # →अॉ→
761+
750762
# अाॆ अॊ आॆ ऒ
751763
(‎ अाॆ ‎) 0905 093E 0946 DEVANAGARI LETTER A, DEVANAGARI VOWEL SIGN AA, DEVANAGARI VOWEL SIGN SHORT E
752764
← (‎ अॊ ‎) 0905 094A DEVANAGARI LETTER A, DEVANAGARI VOWEL SIGN SHORT O # →आॆ→
@@ -765,17 +777,14 @@
765777
← (‎ आै ‎) 0906 0948 DEVANAGARI LETTER AA, DEVANAGARI VOWEL SIGN AI
766778
← (‎ औ ‎) 0914 DEVANAGARI LETTER AU # →अौ→→आै→
767779

768-
# अॉ ऑ
769-
(‎ अॉ ‎) 0905 0949 DEVANAGARI LETTER A, DEVANAGARI VOWEL SIGN CANDRA O
770-
← (‎ ऑ ‎) 0911 DEVANAGARI LETTER CANDRA O
771-
772780
# र्इ ई
773781
(‎ ई ‎) 0908 DEVANAGARI LETTER II
774782
← (‎ र्इ ‎) 0930 094D 0907 DEVANAGARI LETTER RA, DEVANAGARI SIGN VIRAMA, DEVANAGARI LETTER I
775783

776-
# एॅ ऍ
784+
# एॅ ए̆
777785
(‎ ऍ ‎) 090D DEVANAGARI LETTER CANDRA E
778786
← (‎ एॅ ‎) 090F 0945 DEVANAGARI LETTER E, DEVANAGARI VOWEL SIGN CANDRA E
787+
← (‎ ए̆ ‎) 090F 0306 DEVANAGARI LETTER E, COMBINING BREVE # →एॅ→
779788

780789
# एॆ ऎ
781790
(‎ ऎ ‎) 090E DEVANAGARI LETTER SHORT E
@@ -785,6 +794,11 @@
785794
(‎ एे ‎) 090F 0947 DEVANAGARI LETTER E, DEVANAGARI VOWEL SIGN E
786795
← (‎ ऐ ‎) 0910 DEVANAGARI LETTER AI
787796

797+
# ा̆ ाॅ ॉ
798+
(‎ ा̆ ‎) 093E 0306 DEVANAGARI VOWEL SIGN AA, COMBINING BREVE
799+
← (‎ ाॅ ‎) 093E 0945 DEVANAGARI VOWEL SIGN AA, DEVANAGARI VOWEL SIGN CANDRA E
800+
← (‎ ॉ ‎) 0949 DEVANAGARI VOWEL SIGN CANDRA O # →ाॅ→
801+
788802
# ु ુ
789803
(‎ ु ‎) 0941 DEVANAGARI VOWEL SIGN U
790804
← (‎ ુ ‎) 0AC1 GUJARATI VOWEL SIGN U
@@ -915,8 +929,9 @@
915929
(‎ ழ ‎) 0BB4 TAMIL LETTER LLLA
916930
← (‎ ഴ ‎) 0D34 MALAYALAM LETTER LLLA
917931

918-
# ஶ ശ
932+
# ஶ
919933
(‎ ஶ ‎) 0BB6 TAMIL LETTER SHA
934+
← (‎ ஸ ‎) 0BB8 TAMIL LETTER SA
920935
← (‎ ശ ‎) 0D36 MALAYALAM LETTER SHA
921936

922937
# ி ി ീ
@@ -1176,6 +1191,10 @@
11761191
(‎ ဂှ ‎) 1002 103E MYANMAR LETTER GA, MYANMAR CONSONANT SIGN MEDIAL HA
11771192
← (‎ ႁ ‎) 1081 MYANMAR LETTER SHAN HA
11781193

1194+
# င ၚ
1195+
(‎ င ‎) 1004 MYANMAR LETTER NGA
1196+
← (‎ ၚ ‎) 105A MYANMAR LETTER MON NGA
1197+
11791198
# ပာ ဟ
11801199
(‎ ပာ ‎) 1015 102C MYANMAR LETTER PA, MYANMAR VOWEL SIGN AA
11811200
← (‎ ဟ ‎) 101F MYANMAR LETTER HA
@@ -1193,9 +1212,13 @@
11931212
(‎ ၽှ ‎) 107D 103E MYANMAR LETTER SHAN PHA, MYANMAR CONSONANT SIGN MEDIAL HA
11941213
← (‎ ၾ ‎) 107E MYANMAR LETTER SHAN FA
11951214

1215+
# ដ ត
1216+
(‎ ដ ‎) 178A KHMER LETTER DA
1217+
← (‎ ត ‎) 178F KHMER LETTER TA
1218+
11961219
# へ ヘ
11971220
(‎ へ ‎) 3078 HIRAGANA LETTER HE
11981221
← (‎ ヘ ‎) 30D8 KATAKANA LETTER HE
11991222

1200-
# total : 425
1223+
# total : 436
12011224

unicodetools/data/security/dev/data/source/formatted-source.txt

Lines changed: 11 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,5 @@
11
# formatted-source.txt
2-
# Date: 2025-07-13, 16:46:40 GMT
2+
# Date: 2025-07-20, 15:54:56 GMT
33
# © 2025 Unicode®, Inc.
44
# Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries.
55
# For terms of use and license, see https://www.unicode.org/terms_of_use.html
@@ -1145,6 +1145,7 @@
11451145
0304 0304 ; 1AE8 # ( ̄̄ ~ ᫨ ) COMBINING MACRON, COMBINING MACRON ~ COMBINING EQUALS SIGN ABOVE
11461146

11471147
0306 ; 030C # ( ̆ ~ ̌ ) COMBINING BREVE ~ COMBINING CARON
1148+
0306 ; 0945 # ( ̆ ~ ॅ ) COMBINING BREVE ~ DEVANAGARI VOWEL SIGN CANDRA E
11481149
0306 ; 0658 # ( ̆ ~ ٘ ) COMBINING BREVE ~ ARABIC MARK NOON GHUNNA
11491150
0306 ; A67C # ( ̆ ~ ꙼ ) COMBINING BREVE ~ COMBINING CYRILLIC KAVYKA
11501151

@@ -1870,6 +1871,8 @@
18701871

18711872
0905 093E ; 0906 # ( अा ~ आ ) DEVANAGARI LETTER A, DEVANAGARI VOWEL SIGN AA ~ DEVANAGARI LETTER AA
18721873

1874+
0905 0945 ; 0972 # ( अॅ ~ ॲ ) DEVANAGARI LETTER A, DEVANAGARI VOWEL SIGN CANDRA E ~ DEVANAGARI LETTER CANDRA A
1875+
18731876
0905 0946 ; 0904 # ( अॆ ~ ऄ ) DEVANAGARI LETTER A, DEVANAGARI VOWEL SIGN SHORT E ~ DEVANAGARI LETTER SHORT A
18741877

18751878
0905 0949 ; 0911 # ( अॉ ~ ऑ ) DEVANAGARI LETTER A, DEVANAGARI VOWEL SIGN CANDRA O ~ DEVANAGARI LETTER CANDRA O
@@ -1899,6 +1902,8 @@
18991902

19001903
093D ; 0ABD # ( ऽ ~ ઽ ) DEVANAGARI SIGN AVAGRAHA ~ GUJARATI SIGN AVAGRAHA
19011904

1905+
093E 0945 ; 0949 # ( ाॅ ~ ॉ ) DEVANAGARI VOWEL SIGN AA, DEVANAGARI VOWEL SIGN CANDRA E ~ DEVANAGARI VOWEL SIGN CANDRA O
1906+
19021907
0941 ; 0AC1 # ( ु ~ ુ ) DEVANAGARI VOWEL SIGN U ~ GUJARATI VOWEL SIGN U
19031908

19041909
0942 ; 0AC2 # ( ू ~ ૂ ) DEVANAGARI VOWEL SIGN UU ~ GUJARATI VOWEL SIGN UU
@@ -2099,6 +2104,7 @@
20992104

21002105
0BB4 ; 0D34 # ( ழ ~ ഴ ) TAMIL LETTER LLLA ~ MALAYALAM LETTER LLLA
21012106

2107+
0BB6 ; 0BB8 # ( ஶ ~ ஸ ) TAMIL LETTER SHA ~ TAMIL LETTER SA
21022108
0BB6 ; 0D36 # ( ஶ ~ ശ ) TAMIL LETTER SHA ~ MALAYALAM LETTER SHA
21032109

21042110
0BB7 ; 0BF8 # ( ஷ ~ ௸ ) TAMIL LETTER SSA ~ TAMIL AS ABOVE SIGN
@@ -2344,6 +2350,8 @@
23442350

23452351
1003 103E ; 1070 # ( ဃှ ~ ၰ ) MYANMAR LETTER GHA, MYANMAR CONSONANT SIGN MEDIAL HA ~ MYANMAR LETTER EASTERN PWO KAREN GHWA
23462352

2353+
1004 ; 105A # ( င ~ ၚ ) MYANMAR LETTER NGA ~ MYANMAR LETTER MON NGA
2354+
23472355
1015 102C ; 101F # ( ပာ ~ ဟ ) MYANMAR LETTER PA, MYANMAR VOWEL SIGN AA ~ MYANMAR LETTER HA
23482356

23492357
1015 103E ; 1066 # ( ပှ ~ ၦ ) MYANMAR LETTER PA, MYANMAR CONSONANT SIGN MEDIAL HA ~ MYANMAR LETTER WESTERN PWO KAREN PWA
@@ -3643,6 +3651,8 @@
36433651

36443652
1715 ; 1734 # ( ᜕ ~ ᜴ ) TAGALOG SIGN PAMUDPOD ~ HANUNOO SIGN PAMUDPOD
36453653

3654+
178A ; 178F # ( ដ ~ ត ) KHMER LETTER DA ~ KHMER LETTER TA
3655+
36463656
17A2 ; 17A3 # ( អ ~ ឣ ) KHMER LETTER QA ~ KHMER INDEPENDENT VOWEL QAQ
36473657

36483658
185C ; 1896 # ( ᡜ ~ ᢖ ) MONGOLIAN LETTER TODO DZA ~ MONGOLIAN LETTER ALI GALI ZA

0 commit comments

Comments
 (0)