diff --git a/unicodetools/data/security/dev/IdentifierType.txt b/unicodetools/data/security/dev/IdentifierType.txt index 8e2805ff4..2ed700406 100644 --- a/unicodetools/data/security/dev/IdentifierType.txt +++ b/unicodetools/data/security/dev/IdentifierType.txt @@ -1,5 +1,5 @@ # IdentifierType.txt -# Date: 2025-09-12, 03:24:49 GMT +# Date: 2025-10-09, 03:26:38 GMT # © 2025 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. # For terms of use and license, see https://www.unicode.org/terms_of_use.html @@ -4492,6 +4492,7 @@ A8F8..A8FA ; Obsolete Not_XID # 5.2 [3] DEVANAGARI SIGN PUSH 20BF ; Not_XID # 10.0 BITCOIN SIGN 20C0 ; Not_XID # 14.0 SOM SIGN 20C1 ; Not_XID # 17.0 SAUDI RIYAL SIGN +20C3 ; Not_XID # 18.0 UAE DIRHAM SIGN 2104 ; Not_XID # 1.1 CENTRE LINE SYMBOL 2108 ; Not_XID # 1.1 SCRUPLE 2114 ; Not_XID # 1.1 L B BAR SYMBOL @@ -4814,8 +4815,10 @@ FFFD ; Not_XID # 1.1 REPLACEMENT CHARACTE 1F780..1F7D4 ; Not_XID # 7.0 [85] BLACK LEFT-POINTING ISOSCELES RIGHT TRIANGLE..HEAVY TWELVE POINTED PINWHEEL STAR 1F7D5..1F7D8 ; Not_XID # 11.0 [4] CIRCLED TRIANGLE..NEGATIVE CIRCLED SQUARE 1F7D9 ; Not_XID # 15.0 NINE POINTED WHITE STAR +1F7DB ; Not_XID # 18.0 BULLET IN DOUBLE CIRCLE 1F7E0..1F7EB ; Not_XID # 12.0 [12] LARGE ORANGE CIRCLE..LARGE BROWN SQUARE 1F7F0 ; Not_XID # 14.0 HEAVY EQUALS SIGN +1F7F1..1F7FF ; Not_XID # 18.0 [15] CIRCLE WITH DOUBLE VERTICAL AND HORIZONTAL LINE..RHOMBUS 1F800..1F80B ; Not_XID # 7.0 [12] LEFTWARDS ARROW WITH SMALL TRIANGLE ARROWHEAD..DOWNWARDS ARROW WITH LARGE TRIANGLE ARROWHEAD 1F810..1F847 ; Not_XID # 7.0 [56] LEFTWARDS ARROW WITH SMALL EQUILATERAL ARROWHEAD..DOWNWARDS HEAVY ARROW 1F850..1F859 ; Not_XID # 7.0 [10] LEFTWARDS SANS-SERIF ARROW..UP DOWN SANS-SERIF ARROW @@ -4916,7 +4919,7 @@ FFFD ; Not_XID # 1.1 REPLACEMENT CHARACTE 1FBCB..1FBEF ; Not_XID # 16.0 [37] WHITE CROSS MARK..TOP LEFT JUSTIFIED LOWER RIGHT QUARTER BLACK CIRCLE 1FBFA ; Not_XID # 17.0 ALARM BELL SYMBOL -# Total code points: 6487 +# Total code points: 6504 # Identifier_Type: Not_NFKC diff --git a/unicodetools/data/security/dev/confusables.txt b/unicodetools/data/security/dev/confusables.txt index bccab9562..e71b276ba 100644 --- a/unicodetools/data/security/dev/confusables.txt +++ b/unicodetools/data/security/dev/confusables.txt @@ -1,5 +1,5 @@ # confusables.txt -# Date: 2025-09-12, 03:24:49 GMT +# Date: 2025-10-09, 03:26:38 GMT # © 2025 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. # For terms of use and license, see https://www.unicode.org/terms_of_use.html @@ -110,11 +110,11 @@ A6F0 ; 0302 ; MA # ( ꛰ → ̂ ) BAMUM COMBINING MARK KOQNDON → COMBINING CIR 0345 ; 0328 ; MA # ( ͅ → ̨ ) COMBINING GREEK YPOGEGRAMMENI → COMBINING OGONEK # 1CD2 ; 0304 ; MA # ( ᳒ → ̄ ) VEDIC TONE PRENKHA → COMBINING MACRON # +1AE2 ; 0304 ; MA # ( ᫢ → ̄ ) COMBINING MINUS SIGN ABOVE → COMBINING MACRON # 0305 ; 0304 ; MA # ( ̅ → ̄ ) COMBINING OVERLINE → COMBINING MACRON # 0659 ; 0304 ; MA # ( ٙ → ̄ ) ARABIC ZWARAKAY → COMBINING MACRON # 07EB ; 0304 ; MA # ( ߫ → ̄ ) NKO COMBINING SHORT HIGH TONE → COMBINING MACRON # A6F1 ; 0304 ; MA # ( ꛱ → ̄ ) BAMUM COMBINING MARK TUKWENTIS → COMBINING MACRON # -1AE2 ; 0304 ; MA # ( ᫢ → ̄ ) COMBINING MINUS SIGN ABOVE → COMBINING MACRON # 1AE8 ; 0304 0304 ; MA # ( ᫨ → ̄̄ ) COMBINING EQUALS SIGN ABOVE → COMBINING MACRON, COMBINING MACRON # @@ -132,6 +132,14 @@ A6F1 ; 0304 ; MA # ( ꛱ → ̄ ) BAMUM COMBINING MARK TUKWENTIS → COMBINING M 1E6EE ; 1AC8 ; MA # ( 𞛮 → ᫈ ) TAI YO SIGN AY → COMBINING PLUS SIGN ABOVE # +1DE8 ; 1ADA ; MA # ( ᷨ → ᫚ ) COMBINING LATIN SMALL LETTER B → COMBINING FLAT SIGN # + +2DEE ; 1ADB ; MA # ( ⷮ → ᫛ ) COMBINING CYRILLIC LETTER TE → COMBINING DOWN TACK ABOVE # + +1AE7 ; 1AE5 ; MA # ( ᫧ → ᫥ ) COMBINING DOUBLE ARCH ABOVE → COMBINING SEAGULL ABOVE # + +031A ; 1AE9 ; MA # ( ̚ → ᫩ ) COMBINING LEFT ANGLE ABOVE → COMBINING LEFT ANGLE CENTRED ABOVE # + 1CED ; 0316 ; MA # ( ᳭ → ̖ ) VEDIC SIGN TIRYAK → COMBINING GRAVE ACCENT BELOW # 1CDC ; 0329 ; MA # ( ᳜ → ̩ ) VEDIC TONE KATHAKA ANUDATTA → COMBINING VERTICAL LINE BELOW # @@ -179,8 +187,6 @@ A6F1 ; 0304 ; MA # ( ꛱ → ̄ ) BAMUM COMBINING MARK TUKWENTIS → COMBINING M 1CD9 ; 032D ; MA # ( ᳙ → ̭ ) VEDIC TONE YAJURVEDIC KATHAKA INDEPENDENT SVARITA SCHROEDER → COMBINING CIRCUMFLEX ACCENT BELOW # -1CD8 ; 032E ; MA # ( ᳘ → ̮ ) VEDIC TONE CANDRA BELOW → COMBINING BREVE BELOW # - 0952 ; 0331 ; MA # ( ॒ → ̱ ) DEVANAGARI STRESS SIGN ANUDATTA → COMBINING MACRON BELOW # 0320 ; 0331 ; MA # ( ̠ → ̱ ) COMBINING MINUS SIGN BELOW → COMBINING MACRON BELOW # @@ -215,6 +221,8 @@ FC63 ; FE7C 0670 ; MA #* ( ‎ﱣ‎ → ‎ﹼٰ‎ ) ARABIC LIGATURE SHADDA WI 030D ; 0670 ; MA # ( ̍ → ٰ ) COMBINING VERTICAL LINE ABOVE → ARABIC LETTER SUPERSCRIPT ALEF # +0348 ; 10EFA ; MA # ( ͈ → 𐻺 ) COMBINING DOUBLE VERTICAL LINE BELOW → ARABIC DOUBLE VERTICAL BAR BELOW # + 0742 ; 073C ; MA # ( ݂ → ܼ ) SYRIAC RUKKAKHA → SYRIAC HBASA-ESASA DOTTED # 0A03 ; 0983 ; MA # ( ਃ → ঃ ) GURMUKHI SIGN VISARGA → BENGALI SIGN VISARGA # @@ -316,8 +324,8 @@ FE30 ; 003A ; MA #* ( ︰ → : ) PRESENTATION FORM FOR VERTICAL TWO DOT LEADER A789 ; 003A ; MA #* ( ꞉ → : ) MODIFIER LETTER COLON → COLON # 2236 ; 003A ; MA #* ( ∶ → : ) RATIO → COLON # 02D0 ; 003A ; MA # ( ː → : ) MODIFIER LETTER TRIANGULAR COLON → COLON # -A4FD ; 003A ; MA # ( ꓽ → : ) LISU LETTER TONE MYA JEU → COLON # 11DD9 ; 003A ; MA # ( 𑷙 → : ) TOLONG SIKI SIGN SELA → COLON # +A4FD ; 003A ; MA # ( ꓽ → : ) LISU LETTER TONE MYA JEU → COLON # 2A74 ; 003A 003A 003D ; MA #* ( ⩴ → ::= ) DOUBLE COLON EQUAL → COLON, COLON, EQUALS SIGN # @@ -1085,8 +1093,8 @@ A714 ; 02EB ; MA #* ( ꜔ → ˫ ) MODIFIER LETTER MID LEFT-STEM TONE BAR → MO 25CB ; 00B0 ; MA #* ( ○ → ° ) WHITE CIRCLE → DEGREE SIGN # →◦→→∘→ 25E6 ; 00B0 ; MA #* ( ◦ → ° ) WHITE BULLET → DEGREE SIGN # →∘→ -235C ; 00B0 0332 ; MA #* ( ⍜ → °̲ ) APL FUNCTIONAL SYMBOL CIRCLE UNDERBAR → DEGREE SIGN, COMBINING LOW LINE # →○̲→ 10ED0 ; 00B0 0332 ; MA #* ( 𐻐 → °̲ ) ARABIC BIBLICAL END OF VERSE → DEGREE SIGN, COMBINING LOW LINE # →⍜→→○̲→ +235C ; 00B0 0332 ; MA #* ( ⍜ → °̲ ) APL FUNCTIONAL SYMBOL CIRCLE UNDERBAR → DEGREE SIGN, COMBINING LOW LINE # →○̲→ 2364 ; 00B0 0308 ; MA #* ( ⍤ → °̈ ) APL FUNCTIONAL SYMBOL JOT DIAERESIS → DEGREE SIGN, COMBINING DIAERESIS # →◦̈→→∘̈→ @@ -1156,8 +1164,8 @@ A714 ; 02EB ; MA #* ( ꜔ → ˫ ) MODIFIER LETTER MID LEFT-STEM TONE BAR → MO 16ED ; 002B ; MA #* ( ᛭ → + ) RUNIC CROSS PUNCTUATION → PLUS SIGN # 2795 ; 002B ; MA #* ( ➕ → + ) HEAVY PLUS SIGN → PLUS SIGN # -1029B ; 002B ; MA # ( 𐊛 → + ) LYCIAN LETTER H → PLUS SIGN # 1E6E9 ; 002B ; MA # ( 𞛩 → + ) TAI YO LETTER IA → PLUS SIGN # +1029B ; 002B ; MA # ( 𐊛 → + ) LYCIAN LETTER H → PLUS SIGN # 2A23 ; 002B 0302 ; MA #* ( ⨣ → +̂ ) PLUS SIGN WITH CIRCUMFLEX ACCENT ABOVE → PLUS SIGN, COMBINING CIRCUMFLEX ACCENT # @@ -1356,6 +1364,29 @@ FFED ; 25AA ; MA #* ( ■ → ▪ ) HALFWIDTH BLACK SQUARE → BLACK SMALL SQUAR 25B8 ; 25B6 ; MA #* ( ▸ → ▶ ) BLACK RIGHT-POINTING SMALL TRIANGLE → BLACK RIGHT-POINTING TRIANGLE # →►→ 25BA ; 25B6 ; MA #* ( ► → ▶ ) BLACK RIGHT-POINTING POINTER → BLACK RIGHT-POINTING TRIANGLE # +1F40D ; 1CCFA ; MA #* ( 🐍 → 𜳺 ) SNAKE → SNAKE SYMBOL # + +1F443 ; 1CCFC ; MA #* ( 👃 → 𜳼 ) NOSE → NOSE SYMBOL # + +1F377 ; 1CEBA ; MA #* ( 🍷 → 𜺺 ) WINE GLASS → FRAGILE SYMBOL # + +1F3E2 ; 1CEBB ; MA #* ( 🏢 → 𜺻 ) OFFICE BUILDING → OFFICE BUILDING SYMBOL # + +1F333 ; 1CEBC ; MA #* ( 🌳 → 𜺼 ) DECIDUOUS TREE → TREE SYMBOL # + +1F34E ; 1CEBD ; MA #* ( 🍎 → 𜺽 ) RED APPLE → APPLE SYMBOL # +1F34F ; 1CEBD ; MA #* ( 🍏 → 𜺽 ) GREEN APPLE → APPLE SYMBOL # + +1F352 ; 1CEBE ; MA #* ( 🍒 → 𜺾 ) CHERRIES → CHERRY SYMBOL # + +1F353 ; 1CEBF ; MA #* ( 🍓 → 𜺿 ) STRAWBERRY → STRAWBERRY SYMBOL # + +28FF ; 1CEE0 ; MA #* ( ⣿ → 𜻠 ) BRAILLE PATTERN DOTS-12345678 → GEOMANTIC FIGURE POPULUS # + +29B5 ; 1CEF0 ; MA #* ( ⦵ → 𜻰 ) CIRCLE WITH HORIZONTAL BAR → MEDIUM SMALL WHITE CIRCLE WITH HORIZONTAL BAR # + +1F514 ; 1FBFA ; MA #* ( 🔔 → 🯺 ) BELL → ALARM BELL SYMBOL # + 2CE9 ; 2627 ; MA #* ( ⳩ → ☧ ) COPTIC SYMBOL KHI RO → CHI RHO # 1F70A ; 2629 ; MA #* ( 🜊 → ☩ ) ALCHEMICAL SYMBOL FOR VINEGAR → CROSS OF JERUSALEM # @@ -1376,12 +1407,20 @@ FFED ; 25AA ; MA #* ( ■ → ▪ ) HALFWIDTH BLACK SQUARE → BLACK SMALL SQUAR 266A ; 1D158 1D165 1D16E ; MA #* ( ♪ → 𝅘𝅥𝅮 ) EIGHTH NOTE → MUSICAL SYMBOL NOTEHEAD BLACK, MUSICAL SYMBOL COMBINING STEM, MUSICAL SYMBOL COMBINING FLAG-1 # +2657 ; 1FA55 ; MA #* ( ♗ → 🩕 ) WHITE CHESS BISHOP → WHITE CHESS ALFIL # + +265D ; 1FA57 ; MA #* ( ♝ → 🩗 ) BLACK CHESS BISHOP → BLACK CHESS ALFIL # + 24EA ; 1F10D ; MA #* ( ⓪ → 🄍 ) CIRCLED DIGIT ZERO → CIRCLED ZERO WITH SLASH # 21BA ; 1F10E ; MA #* ( ↺ → 🄎 ) ANTICLOCKWISE OPEN CIRCLE ARROW → CIRCLED ANTICLOCKWISE ARROW # 1CCFB ; 1F6F8 ; MA #* ( 𜳻 → 🛸 ) FLYING SAUCER SYMBOL → FLYING SAUCER # +21C4 ; 1F8D0 ; MA #* ( ⇄ → 🣐 ) RIGHTWARDS ARROW OVER LEFTWARDS ARROW → LONG RIGHTWARDS ARROW OVER LONG LEFTWARDS ARROW # + +21CC ; 1F8D1 ; MA #* ( ⇌ → 🣑 ) RIGHTWARDS HARPOON OVER LEFTWARDS HARPOON → LONG RIGHTWARDS HARPOON OVER LONG LEFTWARDS HARPOON # + 02D9 ; 0971 ; MA #* ( ˙ → ॱ ) DOT ABOVE → DEVANAGARI SIGN HIGH SPACING DOT # 0D4E ; 0971 ; MA # ( ൎ → ॱ ) MALAYALAM LETTER DOT REPH → DEVANAGARI SIGN HIGH SPACING DOT # →˙→ @@ -2594,6 +2633,7 @@ FFE8 ; 006C ; MA #* ( │ → l ) HALFWIDTH FORMS LIGHT VERTICAL → LATIN SMALL 0661 ; 006C ; MA # ( ‎١‎ → l ) ARABIC-INDIC DIGIT ONE → LATIN SMALL LETTER L # →1→ 06F1 ; 006C ; MA # ( ۱ → l ) EXTENDED ARABIC-INDIC DIGIT ONE → LATIN SMALL LETTER L # →1→ 10320 ; 006C ; MA #* ( 𐌠 → l ) OLD ITALIC NUMERAL ONE → LATIN SMALL LETTER L # →𐌉→→I→ +11DE1 ; 006C ; MA # ( 𑷡 → l ) TOLONG SIKI DIGIT ONE → LATIN SMALL LETTER L # →|→ 1E8C7 ; 006C ; MA #* ( ‎𞣇‎ → l ) MENDE KIKAKUI DIGIT ONE → LATIN SMALL LETTER L # 1CCF1 ; 006C ; MA # ( 𜳱 → l ) OUTLINED DIGIT ONE → LATIN SMALL LETTER L # →1→ 1D7CF ; 006C ; MA # ( 𝟏 → l ) MATHEMATICAL BOLD DIGIT ONE → LATIN SMALL LETTER L # →1→ @@ -2656,14 +2696,13 @@ FE8E ; 006C ; MA # ( ‎ﺎ‎ → l ) ARABIC LETTER ALEF FINAL FORM → LATIN S FE8D ; 006C ; MA # ( ‎ﺍ‎ → l ) ARABIC LETTER ALEF ISOLATED FORM → LATIN SMALL LETTER L # →‎ا‎→→1→ 07CA ; 006C ; MA # ( ‎ߊ‎ → l ) NKO LETTER A → LATIN SMALL LETTER L # →∣→→ǀ→ 2D4F ; 006C ; MA # ( ⵏ → l ) TIFINAGH LETTER YAN → LATIN SMALL LETTER L # →Ӏ→ +11DDA ; 006C ; MA # ( 𑷚 → l ) TOLONG SIKI SIGN HECAKA → LATIN SMALL LETTER L # →|→ 16C1 ; 006C ; MA # ( ᛁ → l ) RUNIC LETTER ISAZ IS ISS I → LATIN SMALL LETTER L # →I→ +16EAA ; 006C ; MA # ( 𖺪 → l ) BERIA ERFE CAPITAL LETTER LAKKO → LATIN SMALL LETTER L # →I→ A4F2 ; 006C ; MA # ( ꓲ → l ) LISU LETTER I → LATIN SMALL LETTER L # →I→ 16F28 ; 006C ; MA # ( 𖼨 → l ) MIAO LETTER GHA → LATIN SMALL LETTER L # →I→ 1028A ; 006C ; MA # ( 𐊊 → l ) LYCIAN LETTER J → LATIN SMALL LETTER L # →I→ 10309 ; 006C ; MA # ( 𐌉 → l ) OLD ITALIC LETTER I → LATIN SMALL LETTER L # →I→ -11DDA ; 006C ; MA # ( 𑷚 → l ) TOLONG SIKI SIGN HECAKA → LATIN SMALL LETTER L # →|→ -11DE1 ; 006C ; MA # ( 𑷡 → l ) TOLONG SIKI DIGIT ONE → LATIN SMALL LETTER L # →|→ -16EAA ; 006C ; MA # ( 𖺪 → l ) BERIA ERFE CAPITAL LETTER LAKKO → LATIN SMALL LETTER L # →I→ 1D22A ; 004C ; MA #* ( 𝈪 → L ) GREEK INSTRUMENTAL NOTATION SYMBOL-23 → LATIN CAPITAL LETTER L # 216C ; 004C ; MA # ( Ⅼ → L ) ROMAN NUMERAL FIFTY → LATIN CAPITAL LETTER L # @@ -3041,6 +3080,7 @@ FBA6 ; 006F ; MA # ( ‎ﮦ‎ → o ) ARABIC LETTER HEH GOAL ISOLATED FORM → 0CE6 ; 004F ; MA # ( ೦ → O ) KANNADA DIGIT ZERO → LATIN CAPITAL LETTER O # 3007 ; 004F ; MA # ( 〇 → O ) IDEOGRAPHIC NUMBER ZERO → LATIN CAPITAL LETTER O # 118E0 ; 004F ; MA # ( 𑣠 → O ) WARANG CITI DIGIT ZERO → LATIN CAPITAL LETTER O # →0→ +11DE0 ; 004F ; MA # ( 𑷠 → O ) TOLONG SIKI DIGIT ZERO → LATIN CAPITAL LETTER O # →0→ 1CCF0 ; 004F ; MA # ( 𜳰 → O ) OUTLINED DIGIT ZERO → LATIN CAPITAL LETTER O # →0→ 1D7CE ; 004F ; MA # ( 𝟎 → O ) MATHEMATICAL BOLD DIGIT ZERO → LATIN CAPITAL LETTER O # →0→ 1D7D8 ; 004F ; MA # ( 𝟘 → O ) MATHEMATICAL DOUBLE-STRUCK DIGIT ZERO → LATIN CAPITAL LETTER O # →0→ @@ -3082,7 +3122,6 @@ A4F3 ; 004F ; MA # ( ꓳ → O ) LISU LETTER O → LATIN CAPITAL LETTER O # 102AB ; 004F ; MA # ( 𐊫 → O ) CARIAN LETTER O → LATIN CAPITAL LETTER O # 10404 ; 004F ; MA # ( 𐐄 → O ) DESERET CAPITAL LETTER LONG O → LATIN CAPITAL LETTER O # 10516 ; 004F ; MA # ( 𐔖 → O ) ELBASAN LETTER O → LATIN CAPITAL LETTER O # -11DE0 ; 004F ; MA # ( 𑷠 → O ) TOLONG SIKI DIGIT ZERO → LATIN CAPITAL LETTER O # →0→ 2070 ; 00BA ; MA #* ( ⁰ → º ) SUPERSCRIPT ZERO → MASCULINE ORDINAL INDICATOR # 1D52 ; 00BA ; MA # ( ᵒ → º ) MODIFIER LETTER SMALL O → MASCULINE ORDINAL INDICATOR # →⁰→ @@ -4140,6 +4179,9 @@ AB9F ; 0185 ; MA # ( ꮟ → ƅ ) CHEROKEE SMALL LETTER SI → LATIN SMALL LETTE AB7E ; 0242 ; MA # ( ꭾ → ɂ ) CHEROKEE SMALL LETTER HE → LATIN SMALL LETTER GLOTTAL STOP # +0295 ; A7CE ; MA # ( ʕ → ꟎ ) LATIN LETTER PHARYNGEAL VOICED FRICATIVE → LATIN CAPITAL LETTER PHARYNGEAL VOICED FRICATIVE # +A7CF ; A7CE ; MA # ( ꟏ → ꟎ ) LATIN SMALL LETTER PHARYNGEAL VOICED FRICATIVE → LATIN CAPITAL LETTER PHARYNGEAL VOICED FRICATIVE # →ʕ→ + 02E4 ; 02C1 ; MA # ( ˤ → ˁ ) MODIFIER LETTER SMALL REVERSED GLOTTAL STOP → MODIFIER LETTER REVERSED GLOTTAL STOP # A6CD ; 02A1 ; MA # ( ꛍ → ʡ ) BAMUM LETTER LU → LATIN LETTER GLOTTAL STOP WITH STROKE # @@ -4806,8 +4848,8 @@ FC5C ; 0631 0670 ; MA # ( ‎ﱜ‎ → ‎رٰ‎ ) ARABIC LIGATURE REH WITH SU FDF6 ; 0631 0633 0648 0644 ; MA # ( ‎ﷶ‎ → ‎رسول‎ ) ARABIC LIGATURE RASOUL ISOLATED FORM → ARABIC LETTER REH, ARABIC LETTER SEEN, ARABIC LETTER WAW, ARABIC LETTER LAM # -FDFC ; 0631 0649 006C 0644 ; MA #* ( ‎﷼‎ → ‎رىlل‎ ) RIAL SIGN → ARABIC LETTER REH, ARABIC LETTER ALEF MAKSURA, LATIN SMALL LETTER L, ARABIC LETTER LAM # →‎ریال‎→ 20C1 ; 0631 0649 006C 0644 ; MA #* ( ⃁ → ‎رىlل‎ ) SAUDI RIYAL SIGN → ARABIC LETTER REH, ARABIC LETTER ALEF MAKSURA, LATIN SMALL LETTER L, ARABIC LETTER LAM # →‎﷼‎→→‎ریال‎→ +FDFC ; 0631 0649 006C 0644 ; MA #* ( ‎﷼‎ → ‎رىlل‎ ) RIAL SIGN → ARABIC LETTER REH, ARABIC LETTER ALEF MAKSURA, LATIN SMALL LETTER L, ARABIC LETTER LAM # →‎ریال‎→ 1EE06 ; 0632 ; MA # ( ‎𞸆‎ → ‎ز‎ ) ARABIC MATHEMATICAL ZAIN → ARABIC LETTER ZAIN # 1EE86 ; 0632 ; MA # ( ‎𞺆‎ → ‎ز‎ ) ARABIC MATHEMATICAL LOOPED ZAIN → ARABIC LETTER ZAIN # @@ -5363,6 +5405,8 @@ FEE1 ; 0645 ; MA # ( ‎ﻡ‎ → ‎م‎ ) ARABIC LETTER MEEM ISOLATED FORM 08A7 ; 0645 06DB ; MA # ( ‎ࢧ‎ → ‎مۛ‎ ) ARABIC LETTER MEEM WITH THREE DOTS ABOVE → ARABIC LETTER MEEM, ARABIC SMALL HIGH THREE DOTS # +06FE ; 0645 10EFA ; MA #* ( ‎۾‎ → ‎م𐻺‎ ) ARABIC SIGN SINDHI POSTPOSITION MEN → ARABIC LETTER MEEM, ARABIC DOUBLE VERTICAL BAR BELOW # + FC88 ; 0645 006C ; MA # ( ‎ﲈ‎ → ‎مl‎ ) ARABIC LIGATURE MEEM WITH ALEF FINAL FORM → ARABIC LETTER MEEM, LATIN SMALL LETTER L # →‎ما‎→ FCCE ; 0645 062C ; MA # ( ‎ﳎ‎ → ‎مج‎ ) ARABIC LIGATURE MEEM WITH JEEM INITIAL FORM → ARABIC LETTER MEEM, ARABIC LETTER JEEM # @@ -5405,8 +5449,6 @@ FDB1 ; 0645 0645 0649 ; MA # ( ‎ﶱ‎ → ‎ممى‎ ) ARABIC LIGATURE MEEM FC49 ; 0645 0649 ; MA # ( ‎ﱉ‎ → ‎مى‎ ) ARABIC LIGATURE MEEM WITH ALEF MAKSURA ISOLATED FORM → ARABIC LETTER MEEM, ARABIC LETTER ALEF MAKSURA # FC4A ; 0645 0649 ; MA # ( ‎ﱊ‎ → ‎مى‎ ) ARABIC LIGATURE MEEM WITH YEH ISOLATED FORM → ARABIC LETTER MEEM, ARABIC LETTER ALEF MAKSURA # →‎مي‎→ -06FE ; 0645 10EFA ; MA #* ( ‎۾‎ → ‎م𐻺‎ ) ARABIC SIGN SINDHI POSTPOSITION MEN → ARABIC LETTER MEEM, ARABIC DOUBLE VERTICAL BAR BELOW # - 1EE0D ; 0646 ; MA # ( ‎𞸍‎ → ‎ن‎ ) ARABIC MATHEMATICAL NOON → ARABIC LETTER NOON # 1EE2D ; 0646 ; MA # ( ‎𞸭‎ → ‎ن‎ ) ARABIC MATHEMATICAL INITIAL NOON → ARABIC LETTER NOON # 1EE4D ; 0646 ; MA # ( ‎𞹍‎ → ‎ن‎ ) ARABIC MATHEMATICAL TAILED NOON → ARABIC LETTER NOON # @@ -5710,8 +5752,8 @@ FC04 ; 0649 0654 0649 ; MA # ( ‎ﰄ‎ → ‎ىٔى‎ ) ARABIC LIGATURE YEH 205E ; 2D42 ; MA #* ( ⁞ → ⵂ ) VERTICAL FOUR DOTS → TIFINAGH LETTER TUAREG YAH # 2E3D ; 2D42 ; MA #* ( ⸽ → ⵂ ) VERTICAL SIX DOTS → TIFINAGH LETTER TUAREG YAH # →⁞→ -2999 ; 2D42 ; MA #* ( ⦙ → ⵂ ) DOTTED FENCE → TIFINAGH LETTER TUAREG YAH # →⁞→ 1CEEF ; 2D42 ; MA #* ( 𜻯 → ⵂ ) GEOMANTIC FIGURE VIA → TIFINAGH LETTER TUAREG YAH # →⁞→ +2999 ; 2D42 ; MA #* ( ⦙ → ⵂ ) DOTTED FENCE → TIFINAGH LETTER TUAREG YAH # →⁞→ FE19 ; 2D57 ; MA #* ( ︙ → ⵗ ) PRESENTATION FORM FOR VERTICAL HORIZONTAL ELLIPSIS → TIFINAGH LETTER TUAREG YAGH # →⁝→ 205D ; 2D57 ; MA #* ( ⁝ → ⵗ ) TRICOLON → TIFINAGH LETTER TUAREG YAGH # @@ -5869,7 +5911,7 @@ FE19 ; 2D57 ; MA #* ( ︙ → ⵗ ) PRESENTATION FORM FOR VERTICAL HORIZONTAL EL 0A09 ; 0A73 11B62 ; MA # ( ਉ → ੳ𑭢 ) GURMUKHI LETTER U → GURMUKHI URA, SHARADA VOWEL SIGN UE # →ੳੁ→ -0A0A ; 0A73 11B63 ; MA # ( ਊ → ੳ𑭣 ) GURMUKHI LETTER UU → GURMUKHI URA, SHARADA VOWEL SIGN UUE # →ੳੂ→ +0A0A ; 0A73 11B62 11B62 ; MA # ( ਊ → ੳ𑭢𑭢 ) GURMUKHI LETTER UU → GURMUKHI URA, SHARADA VOWEL SIGN UE, SHARADA VOWEL SIGN UE # →ੳੂ→ 0A10 ; 0A05 0948 ; MA # ( ਐ → ਅै ) GURMUKHI LETTER AI → GURMUKHI LETTER A, DEVANAGARI VOWEL SIGN AI # →ਅੈ→ @@ -6028,6 +6070,8 @@ FE19 ; 2D57 ; MA #* ( ︙ → ⵗ ) PRESENTATION FORM FOR VERTICAL HORIZONTAL EL 0C2E ; 0C35 0C41 ; MA # ( మ → వు ) TELUGU LETTER MA → TELUGU LETTER VA, TELUGU VOWEL SIGN U # +0CDC ; 0C5C ; MA # ( ೜ → ౜ ) KANNADA ARCHAIC SHRII → TELUGU ARCHAIC SHRII # + 0CB3 ; 0C33 ; MA # ( ಳ → ళ ) KANNADA LETTER LLA → TELUGU LETTER LLA # 0CBF ; 0C3F ; MA # ( ಿ → ి ) KANNADA VOWEL SIGN I → TELUGU VOWEL SIGN I # @@ -6109,6 +6153,18 @@ FE19 ; 2D57 ; MA #* ( ︙ → ⵗ ) PRESENTATION FORM FOR VERTICAL HORIZONTAL EL 0D8D ; 0DC3 0DD8 ; MA # ( ඍ → සෘ ) SINHALA LETTER IRUYANNA → SINHALA LETTER DANTAJA SAYANNA, SINHALA VOWEL SIGN GAETTA-PILLA # +1CD8 ; 11B62 ; MA # ( ᳘ → 𑭢 ) VEDIC TONE CANDRA BELOW → SHARADA VOWEL SIGN UE # →̮→→ॖ→ +032E ; 11B62 ; MA # ( ̮ → 𑭢 ) COMBINING BREVE BELOW → SHARADA VOWEL SIGN UE # →ॖ→ +0956 ; 11B62 ; MA # ( ॖ → 𑭢 ) DEVANAGARI VOWEL SIGN UE → SHARADA VOWEL SIGN UE # +0A41 ; 11B62 ; MA # ( ੁ → 𑭢 ) GURMUKHI VOWEL SIGN U → SHARADA VOWEL SIGN UE # →ॖ→ + +0957 ; 11B62 11B62 ; MA # ( ॗ → 𑭢𑭢 ) DEVANAGARI VOWEL SIGN UUE → SHARADA VOWEL SIGN UE, SHARADA VOWEL SIGN UE # →̮̮→ +0A42 ; 11B62 11B62 ; MA # ( ੂ → 𑭢𑭢 ) GURMUKHI VOWEL SIGN UU → SHARADA VOWEL SIGN UE, SHARADA VOWEL SIGN UE # →ॗ→→̮̮→ +11B63 ; 11B62 11B62 ; MA # ( 𑭣 → 𑭢𑭢 ) SHARADA VOWEL SIGN UUE → SHARADA VOWEL SIGN UE, SHARADA VOWEL SIGN UE # →ॗ→→̮̮→ + +0947 ; 11B64 ; MA # ( े → 𑭤 ) DEVANAGARI VOWEL SIGN E → SHARADA VOWEL SIGN SHORT E # +0A47 ; 11B64 ; MA # ( ੇ → 𑭤 ) GURMUKHI VOWEL SIGN EE → SHARADA VOWEL SIGN SHORT E # →े→ + 11413 ; 11434 11442 11412 ; MA # ( 𑐓 → 𑐴𑑂𑐒 ) NEWA LETTER NGHA → NEWA LETTER HA, NEWA SIGN VIRAMA, NEWA LETTER NGA # 11419 ; 11434 11442 11418 ; MA # ( 𑐙 → 𑐴𑑂𑐘 ) NEWA LETTER NYHA → NEWA LETTER HA, NEWA SIGN VIRAMA, NEWA LETTER NYA # @@ -6533,8 +6589,8 @@ A4ED ; 1660 ; MA # ( ꓭ → ᙠ ) LISU LETTER GHA → CANADIAN SYLLABICS CARRIE 02B3 ; 18F4 ; MA # ( ʳ → ᣴ ) MODIFIER LETTER SMALL R → CANADIAN SYLLABICS BEAVER DENE R # 02E2 ; 18F5 ; MA # ( ˢ → ᣵ ) MODIFIER LETTER SMALL S → CANADIAN SYLLABICS CARRIER DENTAL S # -18DB ; 18F5 ; MA # ( ᣛ → ᣵ ) CANADIAN SYLLABICS OJIBWAY SH → CANADIAN SYLLABICS CARRIER DENTAL S # →ˢ→ A7F1 ; 18F5 ; MA # ( ꟱ → ᣵ ) MODIFIER LETTER CAPITAL S → CANADIAN SYLLABICS CARRIER DENTAL S # →ˢ→ +18DB ; 18F5 ; MA # ( ᣛ → ᣵ ) CANADIAN SYLLABICS OJIBWAY SH → CANADIAN SYLLABICS CARRIER DENTAL S # →ˢ→ A6B0 ; 16B9 ; MA # ( ꚰ → ᚹ ) BAMUM LETTER TAA → RUNIC LETTER WUNJO WYNN W # @@ -7478,6 +7534,8 @@ FA74 ; 5145 ; MA # ( 充 → 充 ) CJK COMPATIBILITY IDEOGRAPH-FA74 → CJK UNIF FA32 ; 514D ; MA # ( 免 → 免 ) CJK COMPATIBILITY IDEOGRAPH-FA32 → CJK UNIFIED IDEOGRAPH-514D # 2F80E ; 514D ; MA # ( 免 → 免 ) CJK COMPATIBILITY IDEOGRAPH-2F80E → CJK UNIFIED IDEOGRAPH-514D # +5152 ; 16FF3 ; MA # ( 兒 → 𖿳 ) CJK UNIFIED IDEOGRAPH-5152 → CHINESE SMALL TRADITIONAL ER # + 2F80F ; 5154 ; MA # ( 兔 → 兔 ) CJK COMPATIBILITY IDEOGRAPH-2F80F → CJK UNIFIED IDEOGRAPH-5154 # 2F810 ; 5164 ; MA # ( 兤 → 兤 ) CJK COMPATIBILITY IDEOGRAPH-2F810 → CJK UNIFIED IDEOGRAPH-5164 # @@ -8096,6 +8154,8 @@ FA88 ; 6108 ; MA # ( 愈 → 愈 ) CJK COMPATIBILITY IDEOGRAPH-FA88 → CJK UNIF FA3E ; 6168 ; MA # ( 慨 → 慨 ) CJK COMPATIBILITY IDEOGRAPH-FA3E → CJK UNIFIED IDEOGRAPH-6168 # +6138 ; 2B73F ; MA # ( 愸 → 𫜿 ) CJK UNIFIED IDEOGRAPH-6138 → CJK UNIFIED IDEOGRAPH-2B73F # + F9D9 ; 6144 ; MA # ( 慄 → 慄 ) CJK COMPATIBILITY IDEOGRAPH-F9D9 → CJK UNIFIED IDEOGRAPH-6144 # 2F8A6 ; 6148 ; MA # ( 慈 → 慈 ) CJK COMPATIBILITY IDEOGRAPH-2F8A6 → CJK UNIFIED IDEOGRAPH-6148 # @@ -9929,64 +9989,5 @@ FACE ; 9F9C ; MA # ( 龜 → 龜 ) CJK COMPATIBILITY IDEOGRAPH-FACE → CJK UNIF 2FD5 ; 9FA0 ; MA #* ( ⿕ → 龠 ) KANGXI RADICAL FLUTE → CJK UNIFIED IDEOGRAPH-9FA0 # -0CDC ; 0C5C ; MA # ( ೜ → ౜ ) KANNADA ARCHAIC SHRII → TELUGU ARCHAIC SHRII # - -1DE8 ; 1ADA ; MA # ( ᷨ → ᫚ ) COMBINING LATIN SMALL LETTER B → COMBINING FLAT SIGN # - -2DEE ; 1ADB ; MA # ( ⷮ → ᫛ ) COMBINING CYRILLIC LETTER TE → COMBINING DOWN TACK ABOVE # - -1AE7 ; 1AE5 ; MA # ( ᫧ → ᫥ ) COMBINING DOUBLE ARCH ABOVE → COMBINING SEAGULL ABOVE # - -031A ; 1AE9 ; MA # ( ̚ → ᫩ ) COMBINING LEFT ANGLE ABOVE → COMBINING LEFT ANGLE CENTRED ABOVE # - -0295 ; A7CE ; MA # ( ʕ → ꟎ ) LATIN LETTER PHARYNGEAL VOICED FRICATIVE → LATIN CAPITAL LETTER PHARYNGEAL VOICED FRICATIVE # -A7CF ; A7CE ; MA # ( ꟏ → ꟎ ) LATIN SMALL LETTER PHARYNGEAL VOICED FRICATIVE → LATIN CAPITAL LETTER PHARYNGEAL VOICED FRICATIVE # →ʕ→ - -0348 ; 10EFA ; MA # ( ͈ → 𐻺 ) COMBINING DOUBLE VERTICAL LINE BELOW → ARABIC DOUBLE VERTICAL BAR BELOW # - -0956 ; 11B62 ; MA # ( ॖ → 𑭢 ) DEVANAGARI VOWEL SIGN UE → SHARADA VOWEL SIGN UE # -0A41 ; 11B62 ; MA # ( ੁ → 𑭢 ) GURMUKHI VOWEL SIGN U → SHARADA VOWEL SIGN UE # →ॖ→ - -0957 ; 11B63 ; MA # ( ॗ → 𑭣 ) DEVANAGARI VOWEL SIGN UUE → SHARADA VOWEL SIGN UUE # -0A42 ; 11B63 ; MA # ( ੂ → 𑭣 ) GURMUKHI VOWEL SIGN UU → SHARADA VOWEL SIGN UUE # →ॗ→ - -0947 ; 11B64 ; MA # ( े → 𑭤 ) DEVANAGARI VOWEL SIGN E → SHARADA VOWEL SIGN SHORT E # -0A47 ; 11B64 ; MA # ( ੇ → 𑭤 ) GURMUKHI VOWEL SIGN EE → SHARADA VOWEL SIGN SHORT E # →े→ - -5152 ; 16FF3 ; MA # ( 兒 → 𖿳 ) CJK UNIFIED IDEOGRAPH-5152 → CHINESE SMALL TRADITIONAL ER # - -1F40D ; 1CCFA ; MA #* ( 🐍 → 𜳺 ) SNAKE → SNAKE SYMBOL # - -1F443 ; 1CCFC ; MA #* ( 👃 → 𜳼 ) NOSE → NOSE SYMBOL # - -1F377 ; 1CEBA ; MA #* ( 🍷 → 𜺺 ) WINE GLASS → FRAGILE SYMBOL # - -1F3E2 ; 1CEBB ; MA #* ( 🏢 → 𜺻 ) OFFICE BUILDING → OFFICE BUILDING SYMBOL # - -1F333 ; 1CEBC ; MA #* ( 🌳 → 𜺼 ) DECIDUOUS TREE → TREE SYMBOL # - -1F34E ; 1CEBD ; MA #* ( 🍎 → 𜺽 ) RED APPLE → APPLE SYMBOL # -1F34F ; 1CEBD ; MA #* ( 🍏 → 𜺽 ) GREEN APPLE → APPLE SYMBOL # - -1F352 ; 1CEBE ; MA #* ( 🍒 → 𜺾 ) CHERRIES → CHERRY SYMBOL # - -1F353 ; 1CEBF ; MA #* ( 🍓 → 𜺿 ) STRAWBERRY → STRAWBERRY SYMBOL # - -28FF ; 1CEE0 ; MA #* ( ⣿ → 𜻠 ) BRAILLE PATTERN DOTS-12345678 → GEOMANTIC FIGURE POPULUS # - -29B5 ; 1CEF0 ; MA #* ( ⦵ → 𜻰 ) CIRCLE WITH HORIZONTAL BAR → MEDIUM SMALL WHITE CIRCLE WITH HORIZONTAL BAR # - -21C4 ; 1F8D0 ; MA #* ( ⇄ → 🣐 ) RIGHTWARDS ARROW OVER LEFTWARDS ARROW → LONG RIGHTWARDS ARROW OVER LONG LEFTWARDS ARROW # - -21CC ; 1F8D1 ; MA #* ( ⇌ → 🣑 ) RIGHTWARDS HARPOON OVER LEFTWARDS HARPOON → LONG RIGHTWARDS HARPOON OVER LONG LEFTWARDS HARPOON # - -2657 ; 1FA55 ; MA #* ( ♗ → 🩕 ) WHITE CHESS BISHOP → WHITE CHESS ALFIL # - -265D ; 1FA57 ; MA #* ( ♝ → 🩗 ) BLACK CHESS BISHOP → BLACK CHESS ALFIL # - -1F514 ; 1FBFA ; MA #* ( 🔔 → 🯺 ) BELL → ALARM BELL SYMBOL # - -6138 ; 2B73F ; MA # ( 愸 → 𫜿 ) CJK UNIFIED IDEOGRAPH-6138 → CJK UNIFIED IDEOGRAPH-2B73F # - -# total: 6565 +# total: 6567 diff --git a/unicodetools/data/security/dev/confusablesSummary.txt b/unicodetools/data/security/dev/confusablesSummary.txt index f51842740..b618de435 100644 --- a/unicodetools/data/security/dev/confusablesSummary.txt +++ b/unicodetools/data/security/dev/confusablesSummary.txt @@ -1,5 +1,5 @@ # confusablesSummary.txt -# Date: 2025-09-12, 03:24:49 GMT +# Date: 2025-10-09, 03:26:38 GMT # © 2025 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. # For terms of use and license, see https://www.unicode.org/terms_of_use.html @@ -5778,10 +5778,20 @@ (‎ ̭ ‎) 032D COMBINING CIRCUMFLEX ACCENT BELOW ← (‎ ᳙ ‎) 1CD9 VEDIC TONE YAJURVEDIC KATHAKA INDEPENDENT SVARITA SCHROEDER -# ̮ ᳘ +# 𑭢 ̮ ॖ ੁ ᳘ (‎ ̮ ‎) 032E COMBINING BREVE BELOW +← (‎ 𑭢 ‎) 11B62 SHARADA VOWEL SIGN UE # →ॖ→ +← (‎ ॖ ‎) 0956 DEVANAGARI VOWEL SIGN UE +← (‎ ੁ ‎) 0A41 GURMUKHI VOWEL SIGN U # →ॖ→ ← (‎ ᳘ ‎) 1CD8 VEDIC TONE CANDRA BELOW +# 𑭢𑭢 ̮̮ 𑭣 ॗ ੂ + (‎ ̮̮ ‎) 032E 032E COMBINING BREVE BELOW, COMBINING BREVE BELOW +← (‎ 𑭢𑭢 ‎) 11B62 11B62 SHARADA VOWEL SIGN UE, SHARADA VOWEL SIGN UE +← (‎ 𑭣 ‎) 11B63 SHARADA VOWEL SIGN UUE # →ॗ→ +← (‎ ॗ ‎) 0957 DEVANAGARI VOWEL SIGN UUE +← (‎ ੂ ‎) 0A42 GURMUKHI VOWEL SIGN UU # →ॗ→ + # ̳ ͇ (‎ ̳ ‎) 0333 COMBINING DOUBLE LOW LINE ← (‎ ͇ ‎) 0347 COMBINING EQUALS SIGN BELOW @@ -8688,16 +8698,6 @@ ← (‎ ੍ ‎) 0A4D GURMUKHI SIGN VIRAMA ← (‎ ્ ‎) 0ACD GUJARATI SIGN VIRAMA -# 𑭢 ॖ ੁ - (‎ ॖ ‎) 0956 DEVANAGARI VOWEL SIGN UE -← (‎ 𑭢 ‎) 11B62 SHARADA VOWEL SIGN UE -← (‎ ੁ ‎) 0A41 GURMUKHI VOWEL SIGN U - -# 𑭣 ॗ ੂ - (‎ ॗ ‎) 0957 DEVANAGARI VOWEL SIGN UUE -← (‎ 𑭣 ‎) 11B63 SHARADA VOWEL SIGN UUE -← (‎ ੂ ‎) 0A42 GURMUKHI VOWEL SIGN UU - # । ꠰ (‎ । ‎) 0964 DEVANAGARI DANDA ← (‎ ꠰ ‎) A830 NORTH INDIC FRACTION ONE QUARTER @@ -8885,9 +8885,9 @@ ← (‎ ੳ𑭢 ‎) 0A73 11B62 GURMUKHI URA, SHARADA VOWEL SIGN UE # →ੳੁ→ ← (‎ ੳੁ ‎) 0A73 0A41 GURMUKHI URA, GURMUKHI VOWEL SIGN U -# ੳ𑭣 ੳੂ ਊ +# ੳ𑭢𑭢 ੳੂ ਊ (‎ ਊ ‎) 0A0A GURMUKHI LETTER UU -← (‎ ੳ𑭣 ‎) 0A73 11B63 GURMUKHI URA, SHARADA VOWEL SIGN UUE # →ੳੂ→ +← (‎ ੳ𑭢𑭢 ‎) 0A73 11B62 11B62 GURMUKHI URA, SHARADA VOWEL SIGN UE, SHARADA VOWEL SIGN UE # →ੳੂ→ ← (‎ ੳੂ ‎) 0A73 0A42 GURMUKHI URA, GURMUKHI VOWEL SIGN UU # અા આ @@ -17834,5 +17834,5 @@ (‎ 𪘀 ‎) 2A600 CJK UNIFIED IDEOGRAPH-2A600 ← (‎ 𪘀 ‎) 2FA1D CJK COMPATIBILITY IDEOGRAPH-2FA1D -# total : 7579 +# total : 7582 diff --git a/unicodetools/data/security/dev/data/confusablesSummaryIdentifier.txt b/unicodetools/data/security/dev/data/confusablesSummaryIdentifier.txt index c1d2cbdcf..3f16b3c45 100644 --- a/unicodetools/data/security/dev/data/confusablesSummaryIdentifier.txt +++ b/unicodetools/data/security/dev/data/confusablesSummaryIdentifier.txt @@ -1,5 +1,5 @@ # confusablesSummaryIdentifier.txt -# Date: 2025-09-12, 03:24:49 GMT +# Date: 2025-10-09, 03:26:38 GMT # © 2025 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. # For terms of use and license, see https://www.unicode.org/terms_of_use.html @@ -556,6 +556,14 @@ ← (‎ ઼ ‎) 0ABC GUJARATI SIGN NUKTA ← (‎ ଼ ‎) 0B3C ORIYA SIGN NUKTA +# ॖ ੁ + (‎ ॖ ‎) 0956 DEVANAGARI VOWEL SIGN UE +← (‎ ੁ ‎) 0A41 GURMUKHI VOWEL SIGN U + +# ॗ ੂ + (‎ ॗ ‎) 0957 DEVANAGARI VOWEL SIGN UUE +← (‎ ੂ ‎) 0A42 GURMUKHI VOWEL SIGN UU + # Γ Г (‎ Γ ‎) 0393 GREEK CAPITAL LETTER GAMMA ← (‎ Г ‎) 0413 CYRILLIC CAPITAL LETTER GHE @@ -925,14 +933,6 @@ ← (‎ ੍ ‎) 0A4D GURMUKHI SIGN VIRAMA ← (‎ ્ ‎) 0ACD GUJARATI SIGN VIRAMA -# ॖ ੁ - (‎ ॖ ‎) 0956 DEVANAGARI VOWEL SIGN UE -← (‎ ੁ ‎) 0A41 GURMUKHI VOWEL SIGN U - -# ॗ ੂ - (‎ ॗ ‎) 0957 DEVANAGARI VOWEL SIGN UUE -← (‎ ੂ ‎) 0A42 GURMUKHI VOWEL SIGN UU - # २ ર ૨ (‎ २ ‎) 0968 DEVANAGARI DIGIT TWO ← (‎ ર ‎) 0AB0 GUJARATI LETTER RA # →૨→ diff --git a/unicodetools/data/security/dev/data/draft-restrictions.txt b/unicodetools/data/security/dev/data/draft-restrictions.txt index 2d3429eed..3157df9ec 100644 --- a/unicodetools/data/security/dev/data/draft-restrictions.txt +++ b/unicodetools/data/security/dev/data/draft-restrictions.txt @@ -59697,6 +59697,7 @@ E0100..E01EF ; Allowed ; Recommended # [240] (U+E0100..U+E01EF) VARIATION SELE 2074..208E ; ~Unicode Identifier # [27] (⁴..₎) SUPERSCRIPT FOUR..SUBSCRIPT RIGHT PARENTHESIS 2090..209C ; ~Unicode Identifier # [13] (ₐ..ₜ) LATIN SUBSCRIPT SMALL LETTER A..LATIN SUBSCRIPT SMALL LETTER T 20A0..20C1 ; ~Unicode Identifier # [34] (₠..⃁) EURO-CURRENCY SIGN..SAUDI RIYAL SIGN +20C3 ; ~Unicode Identifier # (⃃) UAE DIRHAM SIGN 20DD..20E0 ; ~Unicode Identifier # [4] (⃝..⃠) COMBINING ENCLOSING CIRCLE..COMBINING ENCLOSING CIRCLE BACKSLASH 20E2..20E4 ; ~Unicode Identifier # [3] (⃢..⃤) COMBINING ENCLOSING SCREEN..COMBINING ENCLOSING UPWARD POINTING TRIANGLE 2100..2117 ; ~Unicode Identifier # [24] (℀..℗) ACCOUNT OF..SOUND RECORDING COPYRIGHT @@ -59998,9 +59999,9 @@ FFF9..FFFD ; ~Unicode Identifier # [5] (U+FFF9..�) INTERLINEAR ANNOTATION 1F6DC..1F6EC ; ~Unicode Identifier # [17] (🛜..🛬) WIRELESS..AIRPLANE ARRIVING 1F6F0..1F6FC ; ~Unicode Identifier # [13] (🛰..🛼) SATELLITE..ROLLER SKATE 1F700..1F7D9 ; ~Unicode Identifier # [218] (🜀..🟙) ALCHEMICAL SYMBOL FOR QUINTESSENCE..NINE POINTED WHITE STAR +1F7DB ; ~Unicode Identifier # (🟛) BULLET IN DOUBLE CIRCLE 1F7E0..1F7EB ; ~Unicode Identifier # [12] (🟠..🟫) LARGE ORANGE CIRCLE..LARGE BROWN SQUARE -1F7F0 ; ~Unicode Identifier # (🟰) HEAVY EQUALS SIGN -1F800..1F80B ; ~Unicode Identifier # [12] (🠀..🠋) LEFTWARDS ARROW WITH SMALL TRIANGLE ARROWHEAD..DOWNWARDS ARROW WITH LARGE TRIANGLE ARROWHEAD +1F7F0..1F80B ; ~Unicode Identifier # [28] (🟰..🠋) HEAVY EQUALS SIGN..DOWNWARDS ARROW WITH LARGE TRIANGLE ARROWHEAD 1F810..1F847 ; ~Unicode Identifier # [56] (🠐..🡇) LEFTWARDS ARROW WITH SMALL EQUILATERAL ARROWHEAD..DOWNWARDS HEAVY ARROW 1F850..1F859 ; ~Unicode Identifier # [10] (🡐..🡙) LEFTWARDS SANS-SERIF ARROW..UP DOWN SANS-SERIF ARROW 1F860..1F887 ; ~Unicode Identifier # [40] (🡠..🢇) WIDE-HEADED LEFTWARDS LIGHT BARB ARROW..WIDE-HEADED SOUTH WEST VERY HEAVY BARB ARROW @@ -60023,4 +60024,4 @@ FFF9..FFFD ; ~Unicode Identifier # [5] (U+FFF9..�) INTERLINEAR ANNOTATION E0001 ; ~Unicode Identifier # (U+E0001) LANGUAGE TAG E0020..E007F ; ~Unicode Identifier # [96] (U+E0020..U+E007F) TAG SPACE..CANCEL TAG -# Total code points: 14287 +# Total code points: 14304 diff --git a/unicodetools/data/security/dev/data/review.txt b/unicodetools/data/security/dev/data/review.txt index 4e3641157..3692a9c95 100644 --- a/unicodetools/data/security/dev/data/review.txt +++ b/unicodetools/data/security/dev/data/review.txt @@ -1,5 +1,5 @@ # review.txt -# Date: 2025-09-12, 03:25:00 GMT +# Date: 2025-10-09, 03:27:02 GMT # © 2025 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. # For terms of use and license, see https://www.unicode.org/terms_of_use.html @@ -71181,6 +71181,7 @@ E0100..E01EF ; Restricted ; output-disallowed # [240] (U+E0100..U+E01EF) VARIA 2029 ; Restricted ; not in XID+ # (U+2029) PARAGRAPH SEPARATOR 202A..202E ; Restricted ; not in XID+ # [5] (U+202A..U+202E) LEFT-TO-RIGHT EMBEDDING..RIGHT-TO-LEFT OVERRIDE 2066..2069 ; Restricted ; not in XID+ # [4] (U+2066..U+2069) LEFT-TO-RIGHT ISOLATE..POP DIRECTIONAL ISOLATE +20C3 ; Restricted ; not in XID+ # (⃃) UAE DIRHAM SIGN 2488..249B ; Restricted ; not in XID+ # [20] (⒈..⒛) DIGIT ONE FULL STOP..NUMBER TWENTY FULL STOP 2FF0 ; Restricted ; not in XID+ # (⿰) IDEOGRAPHIC DESCRIPTION CHARACTER LEFT TO RIGHT 2FF1 ; Restricted ; not in XID+ # (⿱) IDEOGRAPHIC DESCRIPTION CHARACTER ABOVE TO BELOW @@ -71230,7 +71231,23 @@ FFFD ; Restricted ; not in XID+ # (�) REPLACEMENT CHARACTER 1343E ; Restricted ; not in XID+ # (U+1343E) EGYPTIAN HIEROGLYPH BEGIN WALLED ENCLOSURE 1343F ; Restricted ; not in XID+ # (U+1343F) EGYPTIAN HIEROGLYPH END WALLED ENCLOSURE 1F100 ; Restricted ; not in XID+ # (🄀) DIGIT ZERO FULL STOP +1F7DB ; Restricted ; not in XID+ # (🟛) BULLET IN DOUBLE CIRCLE +1F7F1 ; Restricted ; not in XID+ # (🟱) CIRCLE WITH DOUBLE VERTICAL AND HORIZONTAL LINE +1F7F2 ; Restricted ; not in XID+ # (🟲) DOUBLE CIRCLE WITH DOUBLE HORIZONTAL LINE +1F7F3 ; Restricted ; not in XID+ # (🟳) CIRCLED BOTTOM RIGHT OBLIQUE HALF BLACK CIRCLE +1F7F4 ; Restricted ; not in XID+ # (🟴) LEFT HALF WHITE CIRCLE +1F7F5 ; Restricted ; not in XID+ # (🟵) RIGHT HALF WHITE CIRCLE +1F7F6 ; Restricted ; not in XID+ # (🟶) TRANSPARENT CUBE +1F7F7 ; Restricted ; not in XID+ # (🟷) WHITE CUBE +1F7F8 ; Restricted ; not in XID+ # (🟸) HORIZONTAL DOUBLE WHITE SMALL SQUARE +1F7F9 ; Restricted ; not in XID+ # (🟹) VERTICAL DOUBLE WHITE SMALL SQUARE +1F7FA ; Restricted ; not in XID+ # (🟺) WHITE SQUARE WITH BOTTOM HALF BISECTED +1F7FB ; Restricted ; not in XID+ # (🟻) WHITE SQUARE WITH TOP HALF BISECTED +1F7FC ; Restricted ; not in XID+ # (🟼) WHITE SQUARE WITH HORIZONTAL AND VERTICAL BISECTING LINES +1F7FD ; Restricted ; not in XID+ # (🟽) LOWER LEFT FLATTENED RIGHT TRIANGLE +1F7FE ; Restricted ; not in XID+ # (🟾) LOWER RIGHT FLATTENED RIGHT TRIANGLE +1F7FF ; Restricted ; not in XID+ # (🟿) RHOMBUS E0001 ; Restricted ; not in XID+ # (U+E0001) LANGUAGE TAG E0020..E007F ; Restricted ; not in XID+ # [96] (U+E0020..U+E007F) TAG SPACE..CANCEL TAG -# Total code points: 226 +# Total code points: 243 diff --git a/unicodetools/data/security/dev/data/source/confusables-source.txt b/unicodetools/data/security/dev/data/source/confusables-source.txt index 5c8008495..db5d217fa 100644 --- a/unicodetools/data/security/dev/data/source/confusables-source.txt +++ b/unicodetools/data/security/dev/data/source/confusables-source.txt @@ -5724,3 +5724,7 @@ A7F1 ; 02E2 # ( ꟱ → ˢ ) MODIFIER LETTER CAPITAL S → MODIFIER LETTER SMAL # Confusable Katakana-Han pair (PAG ref #442) 1B122 ; 4E8E + +# Confusables for Devanagari UE and UUE (PAG ref #449) +0956 ; 032E +0957 ; 032E 032E diff --git a/unicodetools/data/security/dev/data/source/formatted-source.txt b/unicodetools/data/security/dev/data/source/formatted-source.txt index b2c747838..da9adfdc4 100644 --- a/unicodetools/data/security/dev/data/source/formatted-source.txt +++ b/unicodetools/data/security/dev/data/source/formatted-source.txt @@ -1,5 +1,5 @@ # formatted-source.txt -# Date: 2025-09-12, 03:24:47 GMT +# Date: 2025-10-09, 03:26:35 GMT # © 2025 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. # For terms of use and license, see https://www.unicode.org/terms_of_use.html @@ -1265,8 +1265,11 @@ 032D ; 1CD9 # ( ̭ ~ ᳙ ) COMBINING CIRCUMFLEX ACCENT BELOW ~ VEDIC TONE YAJURVEDIC KATHAKA INDEPENDENT SVARITA SCHROEDER +032E ; 0956 # ( ̮ ~ ॖ ) COMBINING BREVE BELOW ~ DEVANAGARI VOWEL SIGN UE 032E ; 1CD8 # ( ̮ ~ ᳘ ) COMBINING BREVE BELOW ~ VEDIC TONE CANDRA BELOW +032E 032E ; 0957 # ( ̮̮ ~ ॗ ) COMBINING BREVE BELOW, COMBINING BREVE BELOW ~ DEVANAGARI VOWEL SIGN UUE + 0331 ; 0320 # ( ̱ ~ ̠ ) COMBINING MACRON BELOW ~ COMBINING MINUS SIGN BELOW 0331 ; 0952 # ( ̱ ~ ॒ ) COMBINING MACRON BELOW ~ DEVANAGARI STRESS SIGN ANUDATTA