import re
# Matches exactly one punctuation character (the set enumerated in `test_str`).
#
# The pattern was originally expressed with UTF-16 surrogate pairs for every
# character above U+FFFF.  Python `str` objects are sequences of code points,
# not UTF-16 code units, so a character such as U+10100 is a single element
# and the surrogate-pair alternatives could never match it.  The
# supplementary-plane characters are therefore listed as \UXXXXXXXX escapes
# inside the main character class; each value was obtained by decoding the
# original pair: 0x10000 + ((hi - 0xD800) << 10) + (lo - 0xDC00).
regex = re.compile(
    r"(?:["
    # --- Basic Multilingual Plane (unchanged from the original class) ---
    r"!-#%-\*,-\/:;\?@\[-\]_\{\}\xA1\xA7\xAB\xB6\xB7\xBB\xBF"
    r"\u037E\u0387\u055A-\u055F\u0589\u058A\u05BE\u05C0\u05C3\u05C6\u05F3\u05F4"
    r"\u0609\u060A\u060C\u060D\u061B\u061E\u061F\u066A-\u066D\u06D4\u0700-\u070D\u07F7-\u07F9"
    r"\u0830-\u083E\u085E\u0964\u0965\u0970\u09FD\u0A76\u0AF0\u0C84\u0DF4\u0E4F\u0E5A\u0E5B"
    r"\u0F04-\u0F12\u0F14\u0F3A-\u0F3D\u0F85\u0FD0-\u0FD4\u0FD9\u0FDA\u104A-\u104F\u10FB"
    r"\u1360-\u1368\u1400\u166D\u166E\u169B\u169C\u16EB-\u16ED\u1735\u1736"
    r"\u17D4-\u17D6\u17D8-\u17DA\u1800-\u180A\u1944\u1945\u1A1E\u1A1F\u1AA0-\u1AA6\u1AA8-\u1AAD"
    r"\u1B5A-\u1B60\u1BFC-\u1BFF\u1C3B-\u1C3F\u1C7E\u1C7F\u1CC0-\u1CC7\u1CD3"
    r"\u2010-\u2027\u2030-\u2043\u2045-\u2051\u2053-\u205E\u207D\u207E\u208D\u208E"
    r"\u2308-\u230B\u2329\u232A\u2768-\u2775\u27C5\u27C6\u27E6-\u27EF\u2983-\u2998\u29D8-\u29DB\u29FC\u29FD"
    r"\u2CF9-\u2CFC\u2CFE\u2CFF\u2D70\u2E00-\u2E2E\u2E30-\u2E4E"
    r"\u3001-\u3003\u3008-\u3011\u3014-\u301F\u3030\u303D\u30A0\u30FB"
    r"\uA4FE\uA4FF\uA60D-\uA60F\uA673\uA67E\uA6F2-\uA6F7\uA874-\uA877\uA8CE\uA8CF\uA8F8-\uA8FA\uA8FC"
    r"\uA92E\uA92F\uA95F\uA9C1-\uA9CD\uA9DE\uA9DF\uAA5C-\uAA5F\uAADE\uAADF\uAAF0\uAAF1\uABEB"
    r"\uFD3E\uFD3F\uFE10-\uFE19\uFE30-\uFE52\uFE54-\uFE61\uFE63\uFE68\uFE6A\uFE6B"
    r"\uFF01-\uFF03\uFF05-\uFF0A\uFF0C-\uFF0F\uFF1A\uFF1B\uFF1F\uFF20\uFF3B-\uFF3D\uFF3F\uFF5B\uFF5D\uFF5F-\uFF65"
    # --- Supplementary planes, as real code points ---
    # was \uD800[...] and \uD801\uDD6F
    r"\U00010100-\U00010102\U0001039F\U000103D0\U0001056F"
    # was \uD802[...]
    r"\U00010857\U0001091F\U0001093F\U00010A50-\U00010A58\U00010A7F"
    r"\U00010AF0-\U00010AF6\U00010B39-\U00010B3F\U00010B99-\U00010B9C"
    # was \uD803[...]
    r"\U00010F55-\U00010F59"
    # was \uD804[...]
    r"\U00011047-\U0001104D\U000110BB\U000110BC\U000110BE-\U000110C1\U00011140-\U00011143"
    r"\U00011174\U00011175\U000111C5-\U000111C8\U000111CD\U000111DB\U000111DD-\U000111DF"
    r"\U00011238-\U0001123D\U000112A9"
    # was \uD805[...]
    r"\U0001144B-\U0001144F\U0001145B\U0001145D\U000114C6\U000115C1-\U000115D7"
    r"\U00011641-\U00011643\U00011660-\U0001166C\U0001173C-\U0001173E"
    # was \uD806[...]
    r"\U0001183B\U00011A3F-\U00011A46\U00011A9A-\U00011A9C\U00011A9E-\U00011AA2"
    # was \uD807[...]
    r"\U00011C41-\U00011C45\U00011C70\U00011C71\U00011EF7\U00011EF8"
    # was \uD809[...]
    r"\U00012470-\U00012474"
    # was \uD81A[...] and \uD81B[...]
    r"\U00016A6E\U00016A6F\U00016AF5\U00016B37-\U00016B3B\U00016B44"
    r"\U00016E97-\U00016E9A"
    # was \uD82F\uDC9F, \uD836[...] and \uD83A[...]
    r"\U0001BC9F\U0001DA87-\U0001DA8B\U0001E95E\U0001E95F"
    r"]"
    # --- Original surrogate-pair alternation, kept for backward compatibility ---
    # These only match when the input itself carries surrogate code points as
    # separate elements (e.g. text decoded with errors="surrogatepass").
    r"|\uD800[\uDD00-\uDD02\uDF9F\uDFD0]"
    r"|\uD801\uDD6F"
    r"|\uD802[\uDC57\uDD1F\uDD3F\uDE50-\uDE58\uDE7F\uDEF0-\uDEF6\uDF39-\uDF3F\uDF99-\uDF9C]"
    r"|\uD803[\uDF55-\uDF59]"
    r"|\uD804[\uDC47-\uDC4D\uDCBB\uDCBC\uDCBE-\uDCC1\uDD40-\uDD43\uDD74\uDD75\uDDC5-\uDDC8\uDDCD\uDDDB\uDDDD-\uDDDF\uDE38-\uDE3D\uDEA9]"
    r"|\uD805[\uDC4B-\uDC4F\uDC5B\uDC5D\uDCC6\uDDC1-\uDDD7\uDE41-\uDE43\uDE60-\uDE6C\uDF3C-\uDF3E]"
    r"|\uD806[\uDC3B\uDE3F-\uDE46\uDE9A-\uDE9C\uDE9E-\uDEA2]"
    r"|\uD807[\uDC41-\uDC45\uDC70\uDC71\uDEF7\uDEF8]"
    r"|\uD809[\uDC70-\uDC74]"
    r"|\uD81A[\uDE6E\uDE6F\uDEF5\uDF37-\uDF3B\uDF44]"
    r"|\uD81B[\uDE97-\uDE9A]"
    r"|\uD82F\uDC9F"
    r"|\uD836[\uDE87-\uDE8B]"
    r"|\uD83A[\uDD5E\uDD5F]"
    r")"
)
test_str = ("\n"
"Basic Latin — ASCII punctuation and symbols items: 23\n"
" ! U+0021 EXCLAMATION MARK\n"
" \" U+0022 QUOTATION MARK\n"
" # U+0023 NUMBER SIGN\n"
" % U+0025 PERCENT SIGN\n"
" & U+0026 AMPERSAND\n"
" ' U+0027 APOSTROPHE\n"
" ( U+0028 LEFT PARENTHESIS\n"
" ) U+0029 RIGHT PARENTHESIS\n"
" * U+002A ASTERISK\n"
" , U+002C COMMA\n"
" - U+002D HYPHEN-MINUS\n"
" . U+002E FULL STOP\n"
" / U+002F SOLIDUS\n"
" : U+003A COLON\n"
" ; U+003B SEMICOLON\n"
" ? U+003F QUESTION MARK\n"
" @ U+0040 COMMERCIAL AT\n"
" [ U+005B LEFT SQUARE BRACKET\n"
" \\ U+005C REVERSE SOLIDUS\n"
" ] U+005D RIGHT SQUARE BRACKET\n"
" _ U+005F LOW LINE\n"
" { U+007B LEFT CURLY BRACKET\n"
" } U+007D RIGHT CURLY BRACKET\n"
"Latin 1 Supplement — Latin-1 punctuation and symbols items: 6\n"
" ¡ U+00A1 INVERTED EXCLAMATION MARK\n"
" § U+00A7 SECTION SIGN\n"
" « U+00AB LEFT-POINTING DOUBLE ANGLE QUOTATION MARK\n"
" ¶ U+00B6 PILCROW SIGN\n"
" · U+00B7 MIDDLE DOT\n"
" » U+00BB RIGHT-POINTING DOUBLE ANGLE QUOTATION MARK\n"
"Latin 1 Supplement — Punctuation items: 1\n"
" ¿ U+00BF INVERTED QUESTION MARK\n"
"Greek And Coptic — Punctuation items: 2\n"
" ; U+037E GREEK QUESTION MARK\n"
" · U+0387 GREEK ANO TELEIA\n"
"Armenian — Modifier letter items: 6\n"
" ՚ U+055A ARMENIAN APOSTROPHE\n"
" ՛ U+055B ARMENIAN EMPHASIS MARK\n"
" ՜ U+055C ARMENIAN EXCLAMATION MARK\n"
" ՝ U+055D ARMENIAN COMMA\n"
" ՞ U+055E ARMENIAN QUESTION MARK\n"
" ՟ U+055F ARMENIAN ABBREVIATION MARK\n"
"Armenian — Punctuation items: 2\n"
" ։ U+0589 ARMENIAN FULL STOP\n"
" ֊ U+058A ARMENIAN HYPHEN\n"
"Hebrew — Points and punctuation items: 4\n"
" ־ U+05BE HEBREW PUNCTUATION MAQAF\n"
" ׀ U+05C0 HEBREW PUNCTUATION PASEQ\n"
" ׃ U+05C3 HEBREW PUNCTUATION SOF PASUQ\n"
" ׆ U+05C6 HEBREW PUNCTUATION NUN HAFUKHA\n"
"Hebrew — Punctuation items: 2\n"
" ׳ U+05F3 HEBREW PUNCTUATION GERESH\n"
" ״ U+05F4 HEBREW PUNCTUATION GERSHAYIM\n"
"Arabic — Punctuation items: 12\n"
" ؉ U+0609 ARABIC-INDIC PER MILLE SIGN\n"
" ؊ U+060A ARABIC-INDIC PER TEN THOUSAND SIGN\n"
" ، U+060C ARABIC COMMA\n"
" ؍ U+060D ARABIC DATE SEPARATOR\n"
" ؛ U+061B ARABIC SEMICOLON\n"
" ؞ U+061E ARABIC TRIPLE DOT PUNCTUATION MARK\n"
" ؟ U+061F ARABIC QUESTION MARK\n"
" ٪ U+066A ARABIC PERCENT SIGN\n"
" ٫ U+066B ARABIC DECIMAL SEPARATOR\n"
" ٬ U+066C ARABIC THOUSANDS SEPARATOR\n"
" ٭ U+066D ARABIC FIVE POINTED STAR\n"
" ۔ U+06D4 ARABIC FULL STOP\n"
"Syriac — Syriac punctuation and signs items: 14\n"
" ܀ U+0700 SYRIAC END OF PARAGRAPH\n"
" ܁ U+0701 SYRIAC SUPRALINEAR FULL STOP\n"
" ܂ U+0702 SYRIAC SUBLINEAR FULL STOP\n"
" ܃ U+0703 SYRIAC SUPRALINEAR COLON\n"
" ܄ U+0704 SYRIAC SUBLINEAR COLON\n"
" ܅ U+0705 SYRIAC HORIZONTAL COLON\n"
" ܆ U+0706 SYRIAC COLON SKEWED LEFT\n"
" ܇ U+0707 SYRIAC COLON SKEWED RIGHT\n"
" ܈ U+0708 SYRIAC SUPRALINEAR COLON SKEWED LEFT\n"
" ܉ U+0709 SYRIAC SUBLINEAR COLON SKEWED RIGHT\n"
" ܊ U+070A SYRIAC CONTRACTION\n"
" ܋ U+070B SYRIAC HARKLEAN OBELUS\n"
" ܌ U+070C SYRIAC HARKLEAN METOBELUS\n"
" ܍ U+070D SYRIAC HARKLEAN ASTERISCUS\n"
"NKo — Punctuation items: 3\n"
" ߷ U+07F7 NKO SYMBOL GBAKURUNEN\n"
" ߸ U+07F8 NKO COMMA\n"
" ߹ U+07F9 NKO EXCLAMATION MARK\n"
"Samaritan — Punctuation items: 15\n"
" ࠰ U+0830 SAMARITAN PUNCTUATION NEQUDAA\n"
" ࠱ U+0831 SAMARITAN PUNCTUATION AFSAAQ\n"
" ࠲ U+0832 SAMARITAN PUNCTUATION ANGED\n"
" ࠳ U+0833 SAMARITAN PUNCTUATION BAU\n"
" ࠴ U+0834 SAMARITAN PUNCTUATION ATMAAU\n"
" ࠵ U+0835 SAMARITAN PUNCTUATION SHIYYAALAA\n"
" ࠶ U+0836 SAMARITAN ABBREVIATION MARK\n"
" ࠷ U+0837 SAMARITAN PUNCTUATION MELODIC QITSA\n"
" ࠸ U+0838 SAMARITAN PUNCTUATION ZIQAA\n"
" ࠹ U+0839 SAMARITAN PUNCTUATION QITSA\n"
" ࠺ U+083A SAMARITAN PUNCTUATION ZAEF\n"
" ࠻ U+083B SAMARITAN PUNCTUATION TURU\n"
" ࠼ U+083C SAMARITAN PUNCTUATION ARKAANU\n"
" ࠽ U+083D SAMARITAN PUNCTUATION SOF MASHFAAT\n"
" ࠾ U+083E SAMARITAN PUNCTUATION ANNAAU\n"
"Mandaic — Punctuation items: 1\n"
" ࡞ U+085E MANDAIC PUNCTUATION\n"
"Devanagari — Generic punctuation for scripts of India items: 2\n"
" । U+0964 DEVANAGARI DANDA\n"
" ॥ U+0965 DEVANAGARI DOUBLE DANDA\n"
"Devanagari — Abbreviation mark items: 1\n"
" ॰ U+0970 DEVANAGARI ABBREVIATION SIGN\n"
"Bengali — Sign items: 1\n"
" ৽ U+09FD BENGALI ABBREVIATION SIGN\n"
"Gurmukhi — Sign items: 1\n"
" ੶ U+0A76 GURMUKHI ABBREVIATION SIGN\n"
"Gujarati — Abbreviation mark items: 1\n"
" ૰ U+0AF0 GUJARATI ABBREVIATION SIGN\n"
"Kannada — Various signs items: 1\n"
" ಄ U+0C84 KANNADA SIGN SIDDHAM\n"
"Sinhala — Punctuation items: 1\n"
" ෴ U+0DF4 SINHALA PUNCTUATION KUNDDALIYA\n"
"Thai — Sign items: 3\n"
" ๏ U+0E4F THAI CHARACTER FONGMAN\n"
" ๚ U+0E5A THAI CHARACTER ANGKHANKHU\n"
" ๛ U+0E5B THAI CHARACTER KHOMUT\n"
"Tibetan — Head mark items: 6\n"
" ༄ U+0F04 TIBETAN MARK INITIAL YIG MGO MDUN MA\n"
" ༅ U+0F05 TIBETAN MARK CLOSING YIG MGO SGAB MA\n"
" ༆ U+0F06 TIBETAN MARK CARET YIG MGO PHUR SHAD MA\n"
" ༇ U+0F07 TIBETAN MARK YIG MGO TSHEG SHAD MA\n"
" ࿓ U+0FD3 TIBETAN MARK INITIAL BRDA RNYING YIG MGO MDUN MA\n"
" ࿔ U+0FD4 TIBETAN MARK CLOSING BRDA RNYING YIG MGO SGAB MA\n"
"Tibetan — Sign items: 16\n"
" ༈ U+0F08 TIBETAN MARK SBRUL SHAD\n"
" ༉ U+0F09 TIBETAN MARK BSKUR YIG MGO\n"
" ༊ U+0F0A TIBETAN MARK BKA- SHOG YIG MGO\n"
" ་ U+0F0B TIBETAN MARK INTERSYLLABIC TSHEG\n"
" ༌ U+0F0C TIBETAN MARK DELIMITER TSHEG BSTAR\n"
" ། U+0F0D TIBETAN MARK SHAD\n"
" ༎ U+0F0E TIBETAN MARK NYIS SHAD\n"
" ༏ U+0F0F TIBETAN MARK TSHEG SHAD\n"
" ༐ U+0F10 TIBETAN MARK NYIS TSHEG SHAD\n"
" ༑ U+0F11 TIBETAN MARK RIN CHEN SPUNGS SHAD\n"
" ༒ U+0F12 TIBETAN MARK RGYA GRAM SHAD\n"
" ༔ U+0F14 TIBETAN MARK GTER TSHEG\n"
" ྅ U+0F85 TIBETAN MARK PALUTA\n"
" ࿐ U+0FD0 TIBETAN MARK BSKA- SHOG GI MGO RGYAN\n"
" ࿑ U+0FD1 TIBETAN MARK MNYAM YIG GI MGO RGYAN\n"
" ࿒ U+0FD2 TIBETAN MARK NYIS TSHEG\n"
"Tibetan — Paired punctuation items: 4\n"
" ༺ U+0F3A TIBETAN MARK GUG RTAGS GYON\n"
" ༻ U+0F3B TIBETAN MARK GUG RTAGS GYAS\n"
" ༼ U+0F3C TIBETAN MARK ANG KHANG GYON\n"
" ༽ U+0F3D TIBETAN MARK ANG KHANG GYAS\n"
"Tibetan — Annotation marks items: 2\n"
" ࿙ U+0FD9 TIBETAN MARK LEADING MCHAN RTAGS\n"
" ࿚ U+0FDA TIBETAN MARK TRAILING MCHAN RTAGS\n"
"Myanmar — Punctuation items: 2\n"
" ၊ U+104A MYANMAR SIGN LITTLE SECTION\n"
" ။ U+104B MYANMAR SIGN SECTION\n"
"Myanmar — Various signs items: 4\n"
" ၌ U+104C MYANMAR SYMBOL LOCATIVE\n"
" ၍ U+104D MYANMAR SYMBOL COMPLETED\n"
" ၎ U+104E MYANMAR SYMBOL AFOREMENTIONED\n"
" ၏ U+104F MYANMAR SYMBOL GENITIVE\n"
"Georgian — Punctuation items: 1\n"
" ჻ U+10FB GEORGIAN PARAGRAPH SEPARATOR\n"
"Ethiopic — Punctuation items: 9\n"
" ፠ U+1360 ETHIOPIC SECTION MARK\n"
" ፡ U+1361 ETHIOPIC WORDSPACE\n"
" ። U+1362 ETHIOPIC FULL STOP\n"
" ፣ U+1363 ETHIOPIC COMMA\n"
" ፤ U+1364 ETHIOPIC SEMICOLON\n"
" ፥ U+1365 ETHIOPIC COLON\n"
" ፦ U+1366 ETHIOPIC PREFACE COLON\n"
" ፧ U+1367 ETHIOPIC QUESTION MARK\n"
" ፨ U+1368 ETHIOPIC PARAGRAPH SEPARATOR\n"
"Unified Canadian Aboriginal Syllabics — Punctuation items: 2\n"
" ᐀ U+1400 CANADIAN SYLLABICS HYPHEN\n"
" ᙮ U+166E CANADIAN SYLLABICS FULL STOP\n"
"Unified Canadian Aboriginal Syllabics — Sign items: 1\n"
" ᙭ U+166D CANADIAN SYLLABICS CHI SIGN\n"
"Ogham — Punctuation items: 2\n"
" ᚛ U+169B OGHAM FEATHER MARK\n"
" ᚜ U+169C OGHAM REVERSED FEATHER MARK\n"
"Runic — Punctuation items: 3\n"
" ᛫ U+16EB RUNIC SINGLE PUNCTUATION\n"
" ᛬ U+16EC RUNIC MULTIPLE PUNCTUATION\n"
" ᛭ U+16ED RUNIC CROSS PUNCTUATION\n"
"Hanunoo — Generic punctuation for Philippine scripts items: 2\n"
" ᜵ U+1735 PHILIPPINE SINGLE PUNCTUATION\n"
" ᜶ U+1736 PHILIPPINE DOUBLE PUNCTUATION\n"
"Khmer — Various signs items: 6\n"
" ។ U+17D4 KHMER SIGN KHAN\n"
" ៕ U+17D5 KHMER SIGN BARIYOOSAN\n"
" ៖ U+17D6 KHMER SIGN CAMNUC PII KUUH\n"
" ៘ U+17D8 KHMER SIGN BEYYAL\n"
" ៙ U+17D9 KHMER SIGN PHNAEK MUAN\n"
" ៚ U+17DA KHMER SIGN KOOMUUT\n"
"Mongolian — Punctuation items: 11\n"
" ᠀ U+1800 MONGOLIAN BIRGA\n"
" ᠁ U+1801 MONGOLIAN ELLIPSIS\n"
" ᠂ U+1802 MONGOLIAN COMMA\n"
" ᠃ U+1803 MONGOLIAN FULL STOP\n"
" ᠄ U+1804 MONGOLIAN COLON\n"
" ᠅ U+1805 MONGOLIAN FOUR DOTS\n"
" ᠆ U+1806 MONGOLIAN TODO SOFT HYPHEN\n"
" ᠇ U+1807 MONGOLIAN SIBE SYLLABLE BOUNDARY MARKER\n"
" ᠈ U+1808 MONGOLIAN MANCHU COMMA\n"
" ᠉ U+1809 MONGOLIAN MANCHU FULL STOP\n"
" ᠊ U+180A MONGOLIAN NIRUGU\n"
"Limbu — Various signs items: 2\n"
" ᥄ U+1944 LIMBU EXCLAMATION MARK\n"
" ᥅ U+1945 LIMBU QUESTION MARK\n"
"Buginese — Various signs items: 2\n"
" ᨞ U+1A1E BUGINESE PALLAWA\n"
" ᨟ U+1A1F BUGINESE END OF SECTION\n"
"Tai Tham — Logographs items: 3\n"
" ᪠ U+1AA0 TAI THAM SIGN WIANG\n"
" ᪡ U+1AA1 TAI THAM SIGN WIANGWAAK\n"
" ᪢ U+1AA2 TAI THAM SIGN SAWAN\n"
"Tai Tham — Punctuation items: 10\n"
" ᪣ U+1AA3 TAI THAM SIGN KEOW\n"
" ᪤ U+1AA4 TAI THAM SIGN HOY\n"
" ᪥ U+1AA5 TAI THAM SIGN DOKMAI\n"
" ᪦ U+1AA6 TAI THAM SIGN REVERSED ROTATED RANA\n"
" ᪨ U+1AA8 TAI THAM SIGN KAAN\n"
" ᪩ U+1AA9 TAI THAM SIGN KAANKUU\n"
" ᪪ U+1AAA TAI THAM SIGN SATKAAN\n"
" ᪫ U+1AAB TAI THAM SIGN SATKAANKUU\n"
" ᪬ U+1AAC TAI THAM SIGN HANG\n"
" ᪭ U+1AAD TAI THAM SIGN CAANG\n"
"Balinese — Punctuation items: 7\n"
" ᭚ U+1B5A BALINESE PANTI\n"
" ᭛ U+1B5B BALINESE PAMADA\n"
" ᭜ U+1B5C BALINESE WINDU\n"
" ᭝ U+1B5D BALINESE CARIK PAMUNGKAH\n"
" ᭞ U+1B5E BALINESE CARIK SIKI\n"
" ᭟ U+1B5F BALINESE CARIK PAREREN\n"
" ᭠ U+1B60 BALINESE PAMENENG\n"
"Batak — Punctuation items: 4\n"
" ᯼ U+1BFC BATAK SYMBOL BINDU NA METEK\n"
" ᯽ U+1BFD BATAK SYMBOL BINDU PINARBORAS\n"
" ᯾ U+1BFE BATAK SYMBOL BINDU JUDUL\n"
" ᯿ U+1BFF BATAK SYMBOL BINDU PANGOLAT\n"
"Lepcha — Punctuation items: 5\n"
" ᰻ U+1C3B LEPCHA PUNCTUATION TA-ROL\n"
" ᰼ U+1C3C LEPCHA PUNCTUATION NYET THYOOM TA-ROL\n"
" ᰽ U+1C3D LEPCHA PUNCTUATION CER-WA\n"
" ᰾ U+1C3E LEPCHA PUNCTUATION TSHOOK CER-WA\n"
" ᰿ U+1C3F LEPCHA PUNCTUATION TSHOOK\n"
"Ol Chiki — Punctuation items: 2\n"
" ᱾ U+1C7E OL CHIKI PUNCTUATION MUCAAD\n"
" ᱿ U+1C7F OL CHIKI PUNCTUATION DOUBLE MUCAAD\n"
"Sundanese Supplement — Punctuation items: 8\n"
" ᳀ U+1CC0 SUNDANESE PUNCTUATION BINDU SURYA\n"
" ᳁ U+1CC1 SUNDANESE PUNCTUATION BINDU PANGLONG\n"
" ᳂ U+1CC2 SUNDANESE PUNCTUATION BINDU PURNAMA\n"
" ᳃ U+1CC3 SUNDANESE PUNCTUATION BINDU CAKRA\n"
" ᳄ U+1CC4 SUNDANESE PUNCTUATION BINDU LEU SATANGA\n"
" ᳅ U+1CC5 SUNDANESE PUNCTUATION BINDU KA SATANGA\n"
" ᳆ U+1CC6 SUNDANESE PUNCTUATION BINDU DA SATANGA\n"
" ᳇ U+1CC7 SUNDANESE PUNCTUATION BINDU BA SATANGA\n"
"Vedic Extensions — Breathing mark for the Samaveda items: 1\n"
" ᳓ U+1CD3 VEDIC SIGN NIHSHVASA\n"
"General Punctuation — Dashes items: 6\n"
" ‐ U+2010 HYPHEN\n"
" ‑ U+2011 NON-BREAKING HYPHEN\n"
" ‒ U+2012 FIGURE DASH\n"
" – U+2013 EN DASH\n"
" — U+2014 EM DASH\n"
" ― U+2015 HORIZONTAL BAR\n"
"General Punctuation — General punctuation items: 39\n"
" ‖ U+2016 DOUBLE VERTICAL LINE\n"
" ‗ U+2017 DOUBLE LOW LINE\n"
" † U+2020 DAGGER\n"
" ‡ U+2021 DOUBLE DAGGER\n"
" • U+2022 BULLET\n"
" ‣ U+2023 TRIANGULAR BULLET\n"
" ․ U+2024 ONE DOT LEADER\n"
" ‥ U+2025 TWO DOT LEADER\n"
" … U+2026 HORIZONTAL ELLIPSIS\n"
" ‧ U+2027 HYPHENATION POINT\n"
" ‰ U+2030 PER MILLE SIGN\n"
" ‱ U+2031 PER TEN THOUSAND SIGN\n"
" ′ U+2032 PRIME\n"
" ″ U+2033 DOUBLE PRIME\n"
" ‴ U+2034 TRIPLE PRIME\n"
" ‵ U+2035 REVERSED PRIME\n"
" ‶ U+2036 REVERSED DOUBLE PRIME\n"
" ‷ U+2037 REVERSED TRIPLE PRIME\n"
" ‸ U+2038 CARET\n"
" ※ U+203B REFERENCE MARK\n"
" ‽ U+203D INTERROBANG\n"
" ‾ U+203E OVERLINE\n"
" ‿ U+203F UNDERTIE\n"
" ⁀ U+2040 CHARACTER TIE\n"
" ⁁ U+2041 CARET INSERTION POINT\n"
" ⁂ U+2042 ASTERISM\n"
" ⁃ U+2043 HYPHEN BULLET\n"
" ⁊ U+204A TIRONIAN SIGN ET\n"
" ⁋ U+204B REVERSED PILCROW SIGN\n"
" ⁌ U+204C BLACK LEFTWARDS BULLET\n"
" ⁍ U+204D BLACK RIGHTWARDS BULLET\n"
" ⁎ U+204E LOW ASTERISK\n"
" ⁏ U+204F REVERSED SEMICOLON\n"
" ⁐ U+2050 CLOSE UP\n"
" ⁑ U+2051 TWO ASTERISKS ALIGNED VERTICALLY\n"
" ⁓ U+2053 SWUNG DASH\n"
" ⁔ U+2054 INVERTED UNDERTIE\n"
" ⁕ U+2055 FLOWER PUNCTUATION MARK\n"
" ⁗ U+2057 QUADRUPLE PRIME\n"
"General Punctuation — Quotation marks and apostrophe items: 8\n"
" ‘ U+2018 LEFT SINGLE QUOTATION MARK\n"
" ’ U+2019 RIGHT SINGLE QUOTATION MARK\n"
" ‚ U+201A SINGLE LOW-9 QUOTATION MARK\n"
" ‛ U+201B SINGLE HIGH-REVERSED-9 QUOTATION MARK\n"
" “ U+201C LEFT DOUBLE QUOTATION MARK\n"
" ” U+201D RIGHT DOUBLE QUOTATION MARK\n"
" „ U+201E DOUBLE LOW-9 QUOTATION MARK\n"
" ‟ U+201F DOUBLE HIGH-REVERSED-9 QUOTATION MARK\n"
"General Punctuation — Quotation marks items: 2\n"
" ‹ U+2039 SINGLE LEFT-POINTING ANGLE QUOTATION MARK\n"
" › U+203A SINGLE RIGHT-POINTING ANGLE QUOTATION MARK\n"
"General Punctuation — Double punctuation for vertical text items: 4\n"
" ‼️ U+203C DOUBLE EXCLAMATION MARK\n"
" ⁇ U+2047 DOUBLE QUESTION MARK\n"
" ⁈ U+2048 QUESTION EXCLAMATION MARK\n"
" ⁉️ U+2049 EXCLAMATION QUESTION MARK\n"
"General Punctuation — Brackets items: 2\n"
" ⁅ U+2045 LEFT SQUARE BRACKET WITH QUILL\n"
" ⁆ U+2046 RIGHT SQUARE BRACKET WITH QUILL\n"
"General Punctuation — Archaic punctuation items: 8\n"
" ⁖ U+2056 THREE DOT PUNCTUATION\n"
" ⁘ U+2058 FOUR DOT PUNCTUATION\n"
" ⁙ U+2059 FIVE DOT PUNCTUATION\n"
" ⁚ U+205A TWO DOT PUNCTUATION\n"
" ⁛ U+205B FOUR DOT MARK\n"
" ⁜ U+205C DOTTED CROSS\n"
" ⁝ U+205D TRICOLON\n"
" ⁞ U+205E VERTICAL FOUR DOTS\n"
"Superscripts And Subscripts — Superscripts items: 2\n"
" ⁽ U+207D SUPERSCRIPT LEFT PARENTHESIS\n"
" ⁾ U+207E SUPERSCRIPT RIGHT PARENTHESIS\n"
"Superscripts And Subscripts — Subscripts items: 2\n"
" ₍ U+208D SUBSCRIPT LEFT PARENTHESIS\n"
" ₎ U+208E SUBSCRIPT RIGHT PARENTHESIS\n"
"Miscellaneous Technical — Ceilings and floors items: 4\n"
" ⌈ U+2308 LEFT CEILING\n"
" ⌉ U+2309 RIGHT CEILING\n"
" ⌊ U+230A LEFT FLOOR\n"
" ⌋ U+230B RIGHT FLOOR\n"
"Miscellaneous Technical — Deprecated angle brackets items: 2\n"
" 〈 U+2329 LEFT-POINTING ANGLE BRACKET\n"
" 〉 U+232A RIGHT-POINTING ANGLE BRACKET\n"
"Dingbats — Ornamental brackets items: 14\n"
" ❨ U+2768 MEDIUM LEFT PARENTHESIS ORNAMENT\n"
" ❩ U+2769 MEDIUM RIGHT PARENTHESIS ORNAMENT\n"
" ❪ U+276A MEDIUM FLATTENED LEFT PARENTHESIS ORNAMENT\n"
" ❫ U+276B MEDIUM FLATTENED RIGHT PARENTHESIS ORNAMENT\n"
" ❬ U+276C MEDIUM LEFT-POINTING ANGLE BRACKET ORNAMENT\n"
" ❭ U+276D MEDIUM RIGHT-POINTING ANGLE BRACKET ORNAMENT\n"
" ❮ U+276E HEAVY LEFT-POINTING ANGLE QUOTATION MARK ORNAMENT\n"
" ❯ U+276F HEAVY RIGHT-POINTING ANGLE QUOTATION MARK ORNAMENT\n"
" ❰ U+2770 HEAVY LEFT-POINTING ANGLE BRACKET ORNAMENT\n"
" ❱ U+2771 HEAVY RIGHT-POINTING ANGLE BRACKET ORNAMENT\n"
" ❲ U+2772 LIGHT LEFT TORTOISE SHELL BRACKET ORNAMENT\n"
" ❳ U+2773 LIGHT RIGHT TORTOISE SHELL BRACKET ORNAMENT\n"
" ❴ U+2774 MEDIUM LEFT CURLY BRACKET ORNAMENT\n"
" ❵ U+2775 MEDIUM RIGHT CURLY BRACKET ORNAMENT\n"
"Miscellaneous Mathematical Symbols A — Paired punctuation items: 2\n"
" ⟅ U+27C5 LEFT S-SHAPED BAG DELIMITER\n"
" ⟆ U+27C6 RIGHT S-SHAPED BAG DELIMITER\n"
"Miscellaneous Mathematical Symbols A — Mathematical brackets items: 10\n"
" ⟦ U+27E6 MATHEMATICAL LEFT WHITE SQUARE BRACKET\n"
" ⟧ U+27E7 MATHEMATICAL RIGHT WHITE SQUARE BRACKET\n"
" ⟨ U+27E8 MATHEMATICAL LEFT ANGLE BRACKET\n"
" ⟩ U+27E9 MATHEMATICAL RIGHT ANGLE BRACKET\n"
" ⟪ U+27EA MATHEMATICAL LEFT DOUBLE ANGLE BRACKET\n"
" ⟫ U+27EB MATHEMATICAL RIGHT DOUBLE ANGLE BRACKET\n"
" ⟬ U+27EC MATHEMATICAL LEFT WHITE TORTOISE SHELL BRACKET\n"
" ⟭ U+27ED MATHEMATICAL RIGHT WHITE TORTOISE SHELL BRACKET\n"
" ⟮ U+27EE MATHEMATICAL LEFT FLATTENED PARENTHESIS\n"
" ⟯ U+27EF MATHEMATICAL RIGHT FLATTENED PARENTHESIS\n"
"Miscellaneous Mathematical Symbols B — Brackets items: 20\n"
" ⦃ U+2983 LEFT WHITE CURLY BRACKET\n"
" ⦄ U+2984 RIGHT WHITE CURLY BRACKET\n"
" ⦅ U+2985 LEFT WHITE PARENTHESIS\n"
" ⦆ U+2986 RIGHT WHITE PARENTHESIS\n"
" ⦇ U+2987 Z NOTATION LEFT IMAGE BRACKET\n"
" ⦈ U+2988 Z NOTATION RIGHT IMAGE BRACKET\n"
" ⦉ U+2989 Z NOTATION LEFT BINDING BRACKET\n"
" ⦊ U+298A Z NOTATION RIGHT BINDING BRACKET\n"
" ⦋ U+298B LEFT SQUARE BRACKET WITH UNDERBAR\n"
" ⦌ U+298C RIGHT SQUARE BRACKET WITH UNDERBAR\n"
" ⦑ U+2991 LEFT ANGLE BRACKET WITH DOT\n"
" ⦒ U+2992 RIGHT ANGLE BRACKET WITH DOT\n"
" ⦓ U+2993 LEFT ARC LESS-THAN BRACKET\n"
" ⦔ U+2994 RIGHT ARC GREATER-THAN BRACKET\n"
" ⦕ U+2995 DOUBLE LEFT ARC GREATER-THAN BRACKET\n"
" ⦖ U+2996 DOUBLE RIGHT ARC LESS-THAN BRACKET\n"
" ⦗ U+2997 LEFT BLACK TORTOISE SHELL BRACKET\n"
" ⦘ U+2998 RIGHT BLACK TORTOISE SHELL BRACKET\n"
" ⧼ U+29FC LEFT-POINTING CURVED ANGLE BRACKET\n"
" ⧽ U+29FD RIGHT-POINTING CURVED ANGLE BRACKET\n"
"Miscellaneous Mathematical Symbols B — Brackets with ticks items: 4\n"
" ⦍ U+298D LEFT SQUARE BRACKET WITH TICK IN TOP CORNER\n"
" ⦎ U+298E RIGHT SQUARE BRACKET WITH TICK IN BOTTOM CORNER\n"
" ⦏ U+298F LEFT SQUARE BRACKET WITH TICK IN BOTTOM CORNER\n"
" ⦐ U+2990 RIGHT SQUARE BRACKET WITH TICK IN TOP CORNER\n"
"Miscellaneous Mathematical Symbols B — Fences items: 4\n"
" ⧘ U+29D8 LEFT WIGGLY FENCE\n"
" ⧙ U+29D9 RIGHT WIGGLY FENCE\n"
" ⧚ U+29DA LEFT DOUBLE WIGGLY FENCE\n"
" ⧛ U+29DB RIGHT DOUBLE WIGGLY FENCE\n"
"Coptic — Old Nubian punctuation items: 4\n"
" ⳹ U+2CF9 COPTIC OLD NUBIAN FULL STOP\n"
" ⳺ U+2CFA COPTIC OLD NUBIAN DIRECT QUESTION MARK\n"
" ⳻ U+2CFB COPTIC OLD NUBIAN INDIRECT QUESTION MARK\n"
" ⳼ U+2CFC COPTIC OLD NUBIAN VERSE DIVIDER\n"
"Coptic — Punctuation items: 2\n"
" ⳾ U+2CFE COPTIC FULL STOP\n"
" ⳿ U+2CFF COPTIC MORPHOLOGICAL DIVIDER\n"
"Tifinagh — Punctuation items: 1\n"
" ⵰ U+2D70 TIFINAGH SEPARATOR MARK\n"
"Supplemental Punctuation — New Testament editorial symbols items: 14\n"
" ⸀ U+2E00 RIGHT ANGLE SUBSTITUTION MARKER\n"
" ⸁ U+2E01 RIGHT ANGLE DOTTED SUBSTITUTION MARKER\n"
" ⸂ U+2E02 LEFT SUBSTITUTION BRACKET\n"
" ⸃ U+2E03 RIGHT SUBSTITUTION BRACKET\n"
" ⸄ U+2E04 LEFT DOTTED SUBSTITUTION BRACKET\n"
" ⸅ U+2E05 RIGHT DOTTED SUBSTITUTION BRACKET\n"
" ⸆ U+2E06 RAISED INTERPOLATION MARKER\n"
" ⸇ U+2E07 RAISED DOTTED INTERPOLATION MARKER\n"
" ⸈ U+2E08 DOTTED TRANSPOSITION MARKER\n"
" ⸉ U+2E09 LEFT TRANSPOSITION BRACKET\n"
" ⸊ U+2E0A RIGHT TRANSPOSITION BRACKET\n"
" ⸋ U+2E0B RAISED SQUARE\n"
" ⸌ U+2E0C LEFT RAISED OMISSION BRACKET\n"
" ⸍ U+2E0D RIGHT RAISED OMISSION BRACKET\n"
"Supplemental Punctuation — Ancient Greek textual symbols items: 9\n"
" ⸎ U+2E0E EDITORIAL CORONIS\n"
" ⸏ U+2E0F PARAGRAPHOS\n"
" ⸐ U+2E10 FORKED PARAGRAPHOS\n"
" ⸑ U+2E11 REVERSED FORKED PARAGRAPHOS\n"
" ⸒ U+2E12 HYPODIASTOLE\n"
" ⸓ U+2E13 DOTTED OBELOS\n"
" ⸔ U+2E14 DOWNWARDS ANCORA\n"
" ⸕ U+2E15 UPWARDS ANCORA\n"
" ⸖ U+2E16 DOTTED RIGHT-POINTING ANGLE\n"
"Supplemental Punctuation — Ancient Near-Eastern linguistic symbol items: 1\n"
" ⸗ U+2E17 DOUBLE OBLIQUE HYPHEN\n"
"Supplemental Punctuation — General punctuation items: 2\n"
" ⸘ U+2E18 INVERTED INTERROBANG\n"
" ⸙ U+2E19 PALM BRANCH\n"
"Supplemental Punctuation — Dictionary punctuation items: 4\n"
" ⸚ U+2E1A HYPHEN WITH DIAERESIS\n"
" ⸛ U+2E1B TILDE WITH RING ABOVE\n"
" ⸞ U+2E1E TILDE WITH DOT ABOVE\n"
" ⸟ U+2E1F TILDE WITH DOT BELOW\n"
"Supplemental Punctuation — Brackets items: 8\n"
" ⸜ U+2E1C LEFT LOW PARAPHRASE BRACKET\n"
" ⸝ U+2E1D RIGHT LOW PARAPHRASE BRACKET\n"
" ⸠ U+2E20 LEFT VERTICAL BAR WITH QUILL\n"
" ⸡ U+2E21 RIGHT VERTICAL BAR WITH QUILL\n"
" ⸦ U+2E26 LEFT SIDEWAYS U BRACKET\n"
" ⸧ U+2E27 RIGHT SIDEWAYS U BRACKET\n"
" ⸨ U+2E28 LEFT DOUBLE PARENTHESIS\n"
" ⸩ U+2E29 RIGHT DOUBLE PARENTHESIS\n"
"Supplemental Punctuation — Half brackets items: 4\n"
" ⸢ U+2E22 TOP LEFT HALF BRACKET\n"
" ⸣ U+2E23 TOP RIGHT HALF BRACKET\n"
" ⸤ U+2E24 BOTTOM LEFT HALF BRACKET\n"
" ⸥ U+2E25 BOTTOM RIGHT HALF BRACKET\n"
"Supplemental Punctuation — Archaic punctuation items: 15\n"
" ⸪ U+2E2A TWO DOTS OVER ONE DOT PUNCTUATION\n"
" ⸫ U+2E2B ONE DOT OVER TWO DOTS PUNCTUATION\n"
" ⸬ U+2E2C SQUARED FOUR DOT PUNCTUATION\n"
" ⸭ U+2E2D FIVE DOT MARK\n"
" ⸮ U+2E2E REVERSED QUESTION MARK\n"
" ⸰ U+2E30 RING POINT\n"
" ⸱ U+2E31 WORD SEPARATOR MIDDLE DOT\n"
" ⸳ U+2E33 RAISED DOT\n"
" ⸴ U+2E34 RAISED COMMA\n"
" ⸿ U+2E3F CAPITULUM\n"
" ⹊ U+2E4A DOTTED SOLIDUS\n"
" ⹋ U+2E4B TRIPLE DAGGER\n"
" ⹌ U+2E4C MEDIEVAL COMMA\n"
" ⹍ U+2E4D PARAGRAPHUS MARK\n"
" ⹎ U+2E4E PUNCTUS ELEVATUS MARK\n"
"Supplemental Punctuation — Palaeotype transliteration symbol items: 6\n"
" ⸲ U+2E32 TURNED COMMA\n"
" ⸵ U+2E35 TURNED SEMICOLON\n"
" ⸶ U+2E36 DAGGER WITH LEFT GUARD\n"
" ⸷ U+2E37 DAGGER WITH RIGHT GUARD\n"
" ⸸ U+2E38 TURNED DAGGER\n"
" ⸹ U+2E39 TOP HALF SECTION SIGN\n"
"Supplemental Punctuation — Dashes items: 2\n"
" ⸺ U+2E3A TWO-EM DASH\n"
" ⸻ U+2E3B THREE-EM DASH\n"
"Supplemental Punctuation — Alternate forms of punctuation items: 3\n"
" ⸼ U+2E3C STENOGRAPHIC FULL STOP\n"
" ⸽ U+2E3D VERTICAL SIX DOTS\n"
" ⸾ U+2E3E WIGGLY VERTICAL LINE\n"
"Supplemental Punctuation — Double hyphen items: 1\n"
" ⹀ U+2E40 DOUBLE HYPHEN\n"
"Supplemental Punctuation — Reversed punctuation items: 2\n"
" ⹁ U+2E41 REVERSED COMMA\n"
" ⹂ U+2E42 DOUBLE LOW-REVERSED-9 QUOTATION MARK\n"
"Supplemental Punctuation — Miscellaneous punctuation items: 2\n"
" ⹃ U+2E43 DASH WITH LEFT UPTURN\n"
" ⹄ U+2E44 DOUBLE SUSPENSION MARK\n"
"Supplemental Punctuation — Typicon punctuation items: 5\n"
" ⹅ U+2E45 INVERTED LOW KAVYKA\n"
" ⹆ U+2E46 INVERTED LOW KAVYKA WITH KAVYKA ABOVE\n"
" ⹇ U+2E47 LOW KAVYKA\n"
" ⹈ U+2E48 LOW KAVYKA WITH DOT\n"
" ⹉ U+2E49 DOUBLE STACKED COMMA\n"
"CJK Symbols And Punctuation — CJK symbols and punctuation items: 3\n"
" 、 U+3001 IDEOGRAPHIC COMMA\n"
" 。 U+3002 IDEOGRAPHIC FULL STOP\n"
" 〃 U+3003 DITTO MARK\n"
"CJK Symbols And Punctuation — CJK angle brackets items: 4\n"
" 〈 U+3008 LEFT ANGLE BRACKET\n"
" 〉 U+3009 RIGHT ANGLE BRACKET\n"
" 《 U+300A LEFT DOUBLE ANGLE BRACKET\n"
" 》 U+300B RIGHT DOUBLE ANGLE BRACKET\n"
"CJK Symbols And Punctuation — CJK corner brackets items: 4\n"
" 「 U+300C LEFT CORNER BRACKET\n"
" 」 U+300D RIGHT CORNER BRACKET\n"
" 『 U+300E LEFT WHITE CORNER BRACKET\n"
" 』 U+300F RIGHT WHITE CORNER BRACKET\n"
"CJK Symbols And Punctuation — CJK brackets items: 10\n"
" 【 U+3010 LEFT BLACK LENTICULAR BRACKET\n"
" 】 U+3011 RIGHT BLACK LENTICULAR BRACKET\n"
" 〔 U+3014 LEFT TORTOISE SHELL BRACKET\n"
" 〕 U+3015 RIGHT TORTOISE SHELL BRACKET\n"
" 〖 U+3016 LEFT WHITE LENTICULAR BRACKET\n"
" 〗 U+3017 RIGHT WHITE LENTICULAR BRACKET\n"
" 〘 U+3018 LEFT WHITE TORTOISE SHELL BRACKET\n"
" 〙 U+3019 RIGHT WHITE TORTOISE SHELL BRACKET\n"
" 〚 U+301A LEFT WHITE SQUARE BRACKET\n"
" 〛 U+301B RIGHT WHITE SQUARE BRACKET\n"
"CJK Symbols And Punctuation — CJK punctuation items: 6\n"
" 〜 U+301C WAVE DASH\n"
" 〝 U+301D REVERSED DOUBLE PRIME QUOTATION MARK\n"
" 〞 U+301E DOUBLE PRIME QUOTATION MARK\n"
" 〟 U+301F LOW DOUBLE PRIME QUOTATION MARK\n"
" 〰️ U+3030 WAVY DASH\n"
" 〽️ U+303D PART ALTERNATION MARK\n"
"Katakana — Katakana punctuation items: 1\n"
" ゠ U+30A0 KATAKANA-HIRAGANA DOUBLE HYPHEN\n"
"Katakana — Conjunction and length marks items: 1\n"
" ・ U+30FB KATAKANA MIDDLE DOT\n"
"Lisu — Punctuation items: 2\n"
" ꓾ U+A4FE LISU PUNCTUATION COMMA\n"
" ꓿ U+A4FF LISU PUNCTUATION FULL STOP\n"
"Vai — Punctuation items: 3\n"
" ꘍ U+A60D VAI COMMA\n"
" ꘎ U+A60E VAI FULL STOP\n"
" ꘏ U+A60F VAI QUESTION MARK\n"
"Cyrillic Extended B — Punctuation mark items: 2\n"
" ꙳ U+A673 SLAVONIC ASTERISK\n"
" ꙾ U+A67E CYRILLIC KAVYKA\n"
"Bamum — Punctuation items: 6\n"
" ꛲ U+A6F2 BAMUM NJAEMLI\n"
" ꛳ U+A6F3 BAMUM FULL STOP\n"
" ꛴ U+A6F4 BAMUM COLON\n"
" ꛵ U+A6F5 BAMUM COMMA\n"
" ꛶ U+A6F6 BAMUM SEMICOLON\n"
" ꛷ U+A6F7 BAMUM QUESTION MARK\n"
"Phags Pa — Head marks for Tibetan items: 2\n"
" ꡴ U+A874 PHAGS-PA SINGLE HEAD MARK\n"
" ꡵ U+A875 PHAGS-PA DOUBLE HEAD MARK\n"
"Phags Pa — Punctuation for Tibetan items: 2\n"
" ꡶ U+A876 PHAGS-PA MARK SHAD\n"
" ꡷ U+A877 PHAGS-PA MARK DOUBLE SHAD\n"
"Saurashtra — Punctuation items: 2\n"
" ꣎ U+A8CE SAURASHTRA DANDA\n"
" ꣏ U+A8CF SAURASHTRA DOUBLE DANDA\n"
"Devanagari Extended — Editorial marks items: 3\n"
" ꣸ U+A8F8 DEVANAGARI SIGN PUSHPIKA\n"
" ꣹ U+A8F9 DEVANAGARI GAP FILLER\n"
" ꣺ U+A8FA DEVANAGARI CARET\n"
"Devanagari Extended — Sign items: 1\n"
" ꣼ U+A8FC DEVANAGARI SIGN SIDDHAM\n"
"Kayah Li — Punctuation items: 2\n"
" ꤮ U+A92E KAYAH LI SIGN CWI\n"
" ꤯ U+A92F KAYAH LI SIGN SHYA\n"
"Rejang — Punctuation items: 1\n"
" ꥟ U+A95F REJANG SECTION MARK\n"
"Javanese — Punctuation items: 13\n"
" ꧁ U+A9C1 JAVANESE LEFT RERENGGAN\n"
" ꧂ U+A9C2 JAVANESE RIGHT RERENGGAN\n"
" ꧃ U+A9C3 JAVANESE PADA ANDAP\n"
" ꧄ U+A9C4 JAVANESE PADA MADYA\n"
" ꧅ U+A9C5 JAVANESE PADA LUHUR\n"
" ꧆ U+A9C6 JAVANESE PADA WINDU\n"
" ꧇ U+A9C7 JAVANESE PADA PANGKAT\n"
" ꧈ U+A9C8 JAVANESE PADA LINGSA\n"
" ꧉ U+A9C9 JAVANESE PADA LUNGSI\n"
" ꧊ U+A9CA JAVANESE PADA ADEG\n"
" ꧋ U+A9CB JAVANESE PADA ADEG ADEG\n"
" ꧌ U+A9CC JAVANESE PADA PISELEH\n"
" ꧍ U+A9CD JAVANESE TURNED PADA PISELEH\n"
"Javanese — Ellipsis marks items: 2\n"
" ꧞ U+A9DE JAVANESE PADA TIRTA TUMETES\n"
" ꧟ U+A9DF JAVANESE PADA ISEN-ISEN\n"
"Cham — Punctuation items: 4\n"
" ꩜ U+AA5C CHAM PUNCTUATION SPIRAL\n"
" ꩝ U+AA5D CHAM PUNCTUATION DANDA\n"
" ꩞ U+AA5E CHAM PUNCTUATION DOUBLE DANDA\n"
" ꩟ U+AA5F CHAM PUNCTUATION TRIPLE DANDA\n"
"Tai Viet — Punctuation items: 2\n"
" ꫞ U+AADE TAI VIET SYMBOL HO HOI\n"
" ꫟ U+AADF TAI VIET SYMBOL KOI KOI\n"
"Meetei Mayek Extensions — Punctuation items: 2\n"
" ꫰ U+AAF0 MEETEI MAYEK CHEIKHAN\n"
" ꫱ U+AAF1 MEETEI MAYEK AHANG KHUDAM\n"
"Meetei Mayek — Punctuation items: 1\n"
" ꯫ U+ABEB MEETEI MAYEK CHEIKHEI\n"
"Arabic Presentation Forms A — Punctuation items: 2\n"
" ﴾ U+FD3E ORNATE LEFT PARENTHESIS\n"
" ﴿ U+FD3F ORNATE RIGHT PARENTHESIS\n"
"Vertical Forms — Glyphs for vertical variants items: 10\n"
" ︐ U+FE10 PRESENTATION FORM FOR VERTICAL COMMA\n"
" ︑ U+FE11 PRESENTATION FORM FOR VERTICAL IDEOGRAPHIC COMMA\n"
" ︒ U+FE12 PRESENTATION FORM FOR VERTICAL IDEOGRAPHIC FULL STOP\n"
" ︓ U+FE13 PRESENTATION FORM FOR VERTICAL COLON\n"
" ︔ U+FE14 PRESENTATION FORM FOR VERTICAL SEMICOLON\n"
" ︕ U+FE15 PRESENTATION FORM FOR VERTICAL EXCLAMATION MARK\n"
" ︖ U+FE16 PRESENTATION FORM FOR VERTICAL QUESTION MARK\n"
" ︗ U+FE17 PRESENTATION FORM FOR VERTICAL LEFT WHITE LENTICULAR BRACKET\n"
" ︘ U+FE18 PRESENTATION FORM FOR VERTICAL RIGHT WHITE LENTICULAR BRAKCET\n"
" ︙ U+FE19 PRESENTATION FORM FOR VERTICAL HORIZONTAL ELLIPSIS\n"
"CJK Compatibility Forms — Glyphs for vertical variants items: 23\n"
" ︰ U+FE30 PRESENTATION FORM FOR VERTICAL TWO DOT LEADER\n"
" ︱ U+FE31 PRESENTATION FORM FOR VERTICAL EM DASH\n"
" ︲ U+FE32 PRESENTATION FORM FOR VERTICAL EN DASH\n"
" ︳ U+FE33 PRESENTATION FORM FOR VERTICAL LOW LINE\n"
" ︴ U+FE34 PRESENTATION FORM FOR VERTICAL WAVY LOW LINE\n"
" ︵ U+FE35 PRESENTATION FORM FOR VERTICAL LEFT PARENTHESIS\n"
" ︶ U+FE36 PRESENTATION FORM FOR VERTICAL RIGHT PARENTHESIS\n"
" ︷ U+FE37 PRESENTATION FORM FOR VERTICAL LEFT CURLY BRACKET\n"
" ︸ U+FE38 PRESENTATION FORM FOR VERTICAL RIGHT CURLY BRACKET\n"
" ︹ U+FE39 PRESENTATION FORM FOR VERTICAL LEFT TORTOISE SHELL BRACKET\n"
" ︺ U+FE3A PRESENTATION FORM FOR VERTICAL RIGHT TORTOISE SHELL BRACKET\n"
" ︻ U+FE3B PRESENTATION FORM FOR VERTICAL LEFT BLACK LENTICULAR BRACKET\n"
" ︼ U+FE3C PRESENTATION FORM FOR VERTICAL RIGHT BLACK LENTICULAR BRACKET\n"
" ︽ U+FE3D PRESENTATION FORM FOR VERTICAL LEFT DOUBLE ANGLE BRACKET\n"
" ︾ U+FE3E PRESENTATION FORM FOR VERTICAL RIGHT DOUBLE ANGLE BRACKET\n"
" ︿ U+FE3F PRESENTATION FORM FOR VERTICAL LEFT ANGLE BRACKET\n"
" ﹀ U+FE40 PRESENTATION FORM FOR VERTICAL RIGHT ANGLE BRACKET\n"
" ﹁ U+FE41 PRESENTATION FORM FOR VERTICAL LEFT CORNER BRACKET\n"
" ﹂ U+FE42 PRESENTATION FORM FOR VERTICAL RIGHT CORNER BRACKET\n"
" ﹃ U+FE43 PRESENTATION FORM FOR VERTICAL LEFT WHITE CORNER BRACKET\n"
" ﹄ U+FE44 PRESENTATION FORM FOR VERTICAL RIGHT WHITE CORNER BRACKET\n"
" ﹇ U+FE47 PRESENTATION FORM FOR VERTICAL LEFT SQUARE BRACKET\n"
" ﹈ U+FE48 PRESENTATION FORM FOR VERTICAL RIGHT SQUARE BRACKET\n"
"CJK Compatibility Forms — Sidelining emphasis marks items: 2\n"
" ﹅ U+FE45 SESAME DOT\n"
" ﹆ U+FE46 WHITE SESAME DOT\n"
"CJK Compatibility Forms — Overscores and underscores items: 7\n"
" ﹉ U+FE49 DASHED OVERLINE\n"
" ﹊ U+FE4A CENTRELINE OVERLINE\n"
" ﹋ U+FE4B WAVY OVERLINE\n"
" ﹌ U+FE4C DOUBLE WAVY OVERLINE\n"
" ﹍ U+FE4D DASHED LOW LINE\n"
" ﹎ U+FE4E CENTRELINE LOW LINE\n"
" ﹏ U+FE4F WAVY LOW LINE\n"
"Small Form Variants — Small form variants items: 21\n"
" ﹐ U+FE50 SMALL COMMA\n"
" ﹑ U+FE51 SMALL IDEOGRAPHIC COMMA\n"
" ﹒ U+FE52 SMALL FULL STOP\n"
" ﹔ U+FE54 SMALL SEMICOLON\n"
" ﹕ U+FE55 SMALL COLON\n"
" ﹖ U+FE56 SMALL QUESTION MARK\n"
" ﹗ U+FE57 SMALL EXCLAMATION MARK\n"
" ﹘ U+FE58 SMALL EM DASH\n"
" ﹙ U+FE59 SMALL LEFT PARENTHESIS\n"
" ﹚ U+FE5A SMALL RIGHT PARENTHESIS\n"
" ﹛ U+FE5B SMALL LEFT CURLY BRACKET\n"
" ﹜ U+FE5C SMALL RIGHT CURLY BRACKET\n"
" ﹝ U+FE5D SMALL LEFT TORTOISE SHELL BRACKET\n"
" ﹞ U+FE5E SMALL RIGHT TORTOISE SHELL BRACKET\n"
" ﹟ U+FE5F SMALL NUMBER SIGN\n"
" ﹠ U+FE60 SMALL AMPERSAND\n"
" ﹡ U+FE61 SMALL ASTERISK\n"
" ﹣ U+FE63 SMALL HYPHEN-MINUS\n"
" ﹨ U+FE68 SMALL REVERSE SOLIDUS\n"
" ﹪ U+FE6A SMALL PERCENT SIGN\n"
" ﹫ U+FE6B SMALL COMMERCIAL AT\n"
"Halfwidth And Fullwidth Forms — Fullwidth ASCII variants items: 23\n"
" ! U+FF01 FULLWIDTH EXCLAMATION MARK\n"
" " U+FF02 FULLWIDTH QUOTATION MARK\n"
" # U+FF03 FULLWIDTH NUMBER SIGN\n"
" % U+FF05 FULLWIDTH PERCENT SIGN\n"
" & U+FF06 FULLWIDTH AMPERSAND\n"
" ' U+FF07 FULLWIDTH APOSTROPHE\n"
" ( U+FF08 FULLWIDTH LEFT PARENTHESIS\n"
" ) U+FF09 FULLWIDTH RIGHT PARENTHESIS\n"
" * U+FF0A FULLWIDTH ASTERISK\n"
" , U+FF0C FULLWIDTH COMMA\n"
" - U+FF0D FULLWIDTH HYPHEN-MINUS\n"
" . U+FF0E FULLWIDTH FULL STOP\n"
" / U+FF0F FULLWIDTH SOLIDUS\n"
" : U+FF1A FULLWIDTH COLON\n"
" ; U+FF1B FULLWIDTH SEMICOLON\n"
" ? U+FF1F FULLWIDTH QUESTION MARK\n"
" @ U+FF20 FULLWIDTH COMMERCIAL AT\n"
" [ U+FF3B FULLWIDTH LEFT SQUARE BRACKET\n"
" \ U+FF3C FULLWIDTH REVERSE SOLIDUS\n"
" ] U+FF3D FULLWIDTH RIGHT SQUARE BRACKET\n"
" _ U+FF3F FULLWIDTH LOW LINE\n"
" { U+FF5B FULLWIDTH LEFT CURLY BRACKET\n"
" } U+FF5D FULLWIDTH RIGHT CURLY BRACKET\n"
"Halfwidth And Fullwidth Forms — Fullwidth brackets items: 2\n"
" ⦅ U+FF5F FULLWIDTH LEFT WHITE PARENTHESIS\n"
" ⦆ U+FF60 FULLWIDTH RIGHT WHITE PARENTHESIS\n"
"Halfwidth And Fullwidth Forms — Halfwidth CJK punctuation items: 4\n"
" 。 U+FF61 HALFWIDTH IDEOGRAPHIC FULL STOP\n"
" 「 U+FF62 HALFWIDTH LEFT CORNER BRACKET\n"
" 」 U+FF63 HALFWIDTH RIGHT CORNER BRACKET\n"
" 、 U+FF64 HALFWIDTH IDEOGRAPHIC COMMA\n"
"Halfwidth And Fullwidth Forms — Halfwidth Katakana variants items: 1\n"
" ・ U+FF65 HALFWIDTH KATAKANA MIDDLE DOT\n"
"Aegean Numbers — Punctuation items: 3\n"
" 𐄀 U+10100 AEGEAN WORD SEPARATOR LINE\n"
" 𐄁 U+10101 AEGEAN WORD SEPARATOR DOT\n"
" 𐄂 U+10102 AEGEAN CHECK MARK\n"
"Ugaritic — Punctuation items: 1\n"
" 𐎟 U+1039F UGARITIC WORD DIVIDER\n"
"Old Persian — Punctuation items: 1\n"
" 𐏐 U+103D0 OLD PERSIAN WORD DIVIDER\n"
"Caucasian Albanian — Punctuation items: 1\n"
" 𐕯 U+1056F CAUCASIAN ALBANIAN CITATION MARK\n"
"Imperial Aramaic — Punctuation items: 1\n"
" 𐡗 U+10857 IMPERIAL ARAMAIC SECTION SIGN\n"
"Phoenician — Punctuation items: 1\n"
" 𐤟 U+1091F PHOENICIAN WORD SEPARATOR\n"
"Lydian — Punctuation items: 1\n"
" 𐤿 U+1093F LYDIAN TRIANGULAR MARK\n"
"Kharoshthi — Punctuation items: 9\n"
" 𐩐 U+10A50 KHAROSHTHI PUNCTUATION DOT\n"
" 𐩑 U+10A51 KHAROSHTHI PUNCTUATION SMALL CIRCLE\n"
" 𐩒 U+10A52 KHAROSHTHI PUNCTUATION CIRCLE\n"
" 𐩓 U+10A53 KHAROSHTHI PUNCTUATION CRESCENT BAR\n"
" 𐩔 U+10A54 KHAROSHTHI PUNCTUATION MANGALAM\n"
" 𐩕 U+10A55 KHAROSHTHI PUNCTUATION LOTUS\n"
" 𐩖 U+10A56 KHAROSHTHI PUNCTUATION DANDA\n"
" 𐩗 U+10A57 KHAROSHTHI PUNCTUATION DOUBLE DANDA\n"
" 𐩘 U+10A58 KHAROSHTHI PUNCTUATION LINES\n"
"Old South Arabian — Numbers items: 1\n"
" 𐩿 U+10A7F OLD SOUTH ARABIAN NUMERIC INDICATOR\n"
"Manichaean — Punctuation items: 7\n"
" 𐫰 U+10AF0 MANICHAEAN PUNCTUATION STAR\n"
" 𐫱 U+10AF1 MANICHAEAN PUNCTUATION FLEURON\n"
" 𐫲 U+10AF2 MANICHAEAN PUNCTUATION DOUBLE DOT WITHIN DOT\n"
" 𐫳 U+10AF3 MANICHAEAN PUNCTUATION DOT WITHIN DOT\n"
" 𐫴 U+10AF4 MANICHAEAN PUNCTUATION DOT\n"
" 𐫵 U+10AF5 MANICHAEAN PUNCTUATION TWO DOTS\n"
" 𐫶 U+10AF6 MANICHAEAN PUNCTUATION LINE FILLER\n"
"Avestan — Punctuation items: 7\n"
" 𐬹 U+10B39 AVESTAN ABBREVIATION MARK\n"
" 𐬺 U+10B3A TINY TWO DOTS OVER ONE DOT PUNCTUATION\n"
" 𐬻 U+10B3B SMALL TWO DOTS OVER ONE DOT PUNCTUATION\n"
" 𐬼 U+10B3C LARGE TWO DOTS OVER ONE DOT PUNCTUATION\n"
" 𐬽 U+10B3D LARGE ONE DOT OVER TWO DOTS PUNCTUATION\n"
" 𐬾 U+10B3E LARGE TWO RINGS OVER ONE RING PUNCTUATION\n"
" 𐬿 U+10B3F LARGE ONE RING OVER TWO RINGS PUNCTUATION\n"
"Psalter Pahlavi — Punctuation items: 4\n"
" 𐮙 U+10B99 PSALTER PAHLAVI SECTION MARK\n"
" 𐮚 U+10B9A PSALTER PAHLAVI TURNED SECTION MARK\n"
" 𐮛 U+10B9B PSALTER PAHLAVI FOUR DOTS WITH CROSS\n"
" 𐮜 U+10B9C PSALTER PAHLAVI FOUR DOTS WITH DOT\n"
"Sogdian — Punctuation items: 5\n"
" 𐽕 U+10F55 SOGDIAN PUNCTUATION TWO VERTICAL BARS\n"
" 𐽖 U+10F56 SOGDIAN PUNCTUATION TWO VERTICAL BARS WITH DOTS\n"
" 𐽗 U+10F57 SOGDIAN PUNCTUATION CIRCLE WITH DOT\n"
" 𐽘 U+10F58 SOGDIAN PUNCTUATION TWO CIRCLES WITH DOTS\n"
" 𐽙 U+10F59 SOGDIAN PUNCTUATION HALF CIRCLE WITH DOT\n"
"Brahmi — Punctuation items: 7\n"
" 𑁇 U+11047 BRAHMI DANDA\n"
" 𑁈 U+11048 BRAHMI DOUBLE DANDA\n"
" 𑁉 U+11049 BRAHMI PUNCTUATION DOT\n"
" 𑁊 U+1104A BRAHMI PUNCTUATION DOUBLE DOT\n"
" 𑁋 U+1104B BRAHMI PUNCTUATION LINE\n"
" 𑁌 U+1104C BRAHMI PUNCTUATION CRESCENT BAR\n"
" 𑁍 U+1104D BRAHMI PUNCTUATION LOTUS\n"
"Kaithi — Various signs items: 2\n"
" 𑂻 U+110BB KAITHI ABBREVIATION SIGN\n"
" 𑂼 U+110BC KAITHI ENUMERATION SIGN\n"
"Kaithi — Punctuation items: 4\n"
" 𑂾 U+110BE KAITHI SECTION MARK\n"
" 𑂿 U+110BF KAITHI DOUBLE SECTION MARK\n"
" 𑃀 U+110C0 KAITHI DANDA\n"
" 𑃁 U+110C1 KAITHI DOUBLE DANDA\n"
"Chakma — Punctuation items: 4\n"
" 𑅀 U+11140 CHAKMA SECTION MARK\n"
" 𑅁 U+11141 CHAKMA DANDA\n"
" 𑅂 U+11142 CHAKMA DOUBLE DANDA\n"
" 𑅃 U+11143 CHAKMA QUESTION MARK\n"
"Mahajani — Punctuation items: 2\n"
" 𑅴 U+11174 MAHAJANI ABBREVIATION SIGN\n"
" 𑅵 U+11175 MAHAJANI SECTION MARK\n"
"Sharada — Punctuation items: 7\n"
" 𑇅 U+111C5 SHARADA DANDA\n"
" 𑇆 U+111C6 SHARADA DOUBLE DANDA\n"
" 𑇇 U+111C7 SHARADA ABBREVIATION SIGN\n"
" 𑇈 U+111C8 SHARADA SEPARATOR\n"
" 𑇍 U+111CD SHARADA SUTRA MARK\n"
" 𑇛 U+111DB SHARADA SIGN SIDDHAM\n"
" 𑇝 U+111DD SHARADA CONTINUATION SIGN\n"
"Sharada — Section marks items: 2\n"
" 𑇞 U+111DE SHARADA SECTION MARK-1\n"
" 𑇟 U+111DF SHARADA SECTION MARK-2\n"
"Khojki — Punctuation items: 6\n"
" 𑈸 U+11238 KHOJKI DANDA\n"
" 𑈹 U+11239 KHOJKI DOUBLE DANDA\n"
" 𑈺 U+1123A KHOJKI WORD SEPARATOR\n"
" 𑈻 U+1123B KHOJKI SECTION MARK\n"
" 𑈼 U+1123C KHOJKI DOUBLE SECTION MARK\n"
" 𑈽 U+1123D KHOJKI ABBREVIATION SIGN\n"
"Multani — Punctuation items: 1\n"
" 𑊩 U+112A9 MULTANI SECTION MARK\n"
"Newa — Punctuation items: 5\n"
" 𑑋 U+1144B NEWA DANDA\n"
" 𑑌 U+1144C NEWA DOUBLE DANDA\n"
" 𑑍 U+1144D NEWA COMMA\n"
" 𑑎 U+1144E NEWA GAP FILLER\n"
" 𑑏 U+1144F NEWA ABBREVIATION SIGN\n"
"Newa — Various signs items: 2\n"
" 𑑛 U+1145B NEWA PLACEHOLDER MARK\n"
" 𑑝 U+1145D NEWA INSERTION SIGN\n"
"Tirhuta — Various signs items: 1\n"
" 𑓆 U+114C6 TIRHUTA ABBREVIATION SIGN\n"
"Siddham — Head mark items: 1\n"
" 𑗁 U+115C1 SIDDHAM SIGN SIDDHAM\n"
"Siddham — Punctuation items: 4\n"
" 𑗂 U+115C2 SIDDHAM DANDA\n"
" 𑗃 U+115C3 SIDDHAM DOUBLE DANDA\n"
" 𑗄 U+115C4 SIDDHAM SEPARATOR DOT\n"
" 𑗅 U+115C5 SIDDHAM SEPARATOR BAR\n"
"Siddham — Repetition mark items: 3\n"
" 𑗆 U+115C6 SIDDHAM REPETITION MARK-1\n"
" 𑗇 U+115C7 SIDDHAM REPETITION MARK-2\n"
" 𑗈 U+115C8 SIDDHAM REPETITION MARK-3\n"
"Siddham — Terminal mark items: 1\n"
" 𑗉 U+115C9 SIDDHAM END OF TEXT MARK\n"
"Siddham — Section marks items: 14\n"
" 𑗊 U+115CA SIDDHAM SECTION MARK WITH TRIDENT AND U-SHAPED ORNAMENTS\n"
" 𑗋 U+115CB SIDDHAM SECTION MARK WITH TRIDENT AND DOTTED CRESCENTS\n"
" 𑗌 U+115CC SIDDHAM SECTION MARK WITH RAYS AND DOTTED CRESCENTS\n"
" 𑗍 U+115CD SIDDHAM SECTION MARK WITH RAYS AND DOTTED DOUBLE CRESCENTS\n"
" 𑗎 U+115CE SIDDHAM SECTION MARK WITH RAYS AND DOTTED TRIPLE CRESCENTS\n"
" 𑗏 U+115CF SIDDHAM SECTION MARK DOUBLE RING\n"
" 𑗐 U+115D0 SIDDHAM SECTION MARK DOUBLE RING WITH RAYS\n"
" 𑗑 U+115D1 SIDDHAM SECTION MARK WITH DOUBLE CRESCENTS\n"
" 𑗒 U+115D2 SIDDHAM SECTION MARK WITH TRIPLE CRESCENTS\n"
" 𑗓 U+115D3 SIDDHAM SECTION MARK WITH QUADRUPLE CRESCENTS\n"
" 𑗔 U+115D4 SIDDHAM SECTION MARK WITH SEPTUPLE CRESCENTS\n"
" 𑗕 U+115D5 SIDDHAM SECTION MARK WITH CIRCLES AND RAYS\n"
" 𑗖 U+115D6 SIDDHAM SECTION MARK WITH CIRCLES AND TWO ENCLOSURES\n"
" 𑗗 U+115D7 SIDDHAM SECTION MARK WITH CIRCLES AND FOUR ENCLOSURES\n"
"Modi — Punctuation items: 3\n"
" 𑙁 U+11641 MODI DANDA\n"
" 𑙂 U+11642 MODI DOUBLE DANDA\n"
" 𑙃 U+11643 MODI ABBREVIATION SIGN\n"
"Mongolian Supplement — Punctuation items: 13\n"
" 𑙠 U+11660 MONGOLIAN BIRGA WITH ORNAMENT\n"
" 𑙡 U+11661 MONGOLIAN ROTATED BIRGA\n"
" 𑙢 U+11662 MONGOLIAN DOUBLE BIRGA WITH ORNAMENT\n"
" 𑙣 U+11663 MONGOLIAN TRIPLE BIRGA WITH ORNAMENT\n"
" 𑙤 U+11664 MONGOLIAN BIRGA WITH DOUBLE ORNAMENT\n"
" 𑙥 U+11665 MONGOLIAN ROTATED BIRGA WITH ORNAMENT\n"
" 𑙦 U+11666 MONGOLIAN ROTATED BIRGA WITH DOUBLE ORNAMENT\n"
" 𑙧 U+11667 MONGOLIAN INVERTED BIRGA\n"
" 𑙨 U+11668 MONGOLIAN INVERTED BIRGA WITH DOUBLE ORNAMENT\n"
" 𑙩 U+11669 MONGOLIAN SWIRL BIRGA\n"
" 𑙪 U+1166A MONGOLIAN SWIRL BIRGA WITH ORNAMENT\n"
" 𑙫 U+1166B MONGOLIAN SWIRL BIRGA WITH DOUBLE ORNAMENT\n"
" 𑙬 U+1166C MONGOLIAN TURNED SWIRL BIRGA WITH DOUBLE ORNAMENT\n"
"Ahom — Punctuation items: 3\n"
" 𑜼 U+1173C AHOM SIGN SMALL SECTION\n"
" 𑜽 U+1173D AHOM SIGN SECTION\n"
" 𑜾 U+1173E AHOM SIGN RULAI\n"
"Dogra — Punctuation items: 1\n"
" 𑠻 U+1183B DOGRA ABBREVIATION SIGN\n"
"Zanabazar Square — Head mark items: 4\n"
" 𑨿 U+11A3F ZANABAZAR SQUARE INITIAL HEAD MARK\n"
" 𑩀 U+11A40 ZANABAZAR SQUARE CLOSING HEAD MARK\n"
" 𑩅 U+11A45 ZANABAZAR SQUARE INITIAL DOUBLE-LINED HEAD MARK\n"
" 𑩆 U+11A46 ZANABAZAR SQUARE CLOSING DOUBLE-LINED HEAD MARK\n"
"Zanabazar Square — Punctuation items: 4\n"
" 𑩁 U+11A41 ZANABAZAR SQUARE MARK TSHEG\n"
" 𑩂 U+11A42 ZANABAZAR SQUARE MARK SHAD\n"
" 𑩃 U+11A43 ZANABAZAR SQUARE MARK DOUBLE SHAD\n"
" 𑩄 U+11A44 ZANABAZAR SQUARE MARK LONG TSHEG\n"
"Soyombo — Punctuation items: 3\n"
" 𑪚 U+11A9A SOYOMBO MARK TSHEG\n"
" 𑪛 U+11A9B SOYOMBO MARK SHAD\n"
" 𑪜 U+11A9C SOYOMBO MARK DOUBLE SHAD\n"
"Soyombo — Head mark items: 3\n"
" 𑪞 U+11A9E SOYOMBO HEAD MARK WITH MOON AND SUN AND TRIPLE FLAME\n"
" 𑪟 U+11A9F SOYOMBO HEAD MARK WITH MOON AND SUN AND FLAME\n"
" 𑪠 U+11AA0 SOYOMBO HEAD MARK WITH MOON AND SUN\n"
"Soyombo — Terminal mark items: 2\n"
" 𑪡 U+11AA1 SOYOMBO TERMINAL MARK-1\n"
" 𑪢 U+11AA2 SOYOMBO TERMINAL MARK-2\n"
"Bhaiksuki — Punctuation items: 3\n"
" 𑱁 U+11C41 BHAIKSUKI DANDA\n"
" 𑱂 U+11C42 BHAIKSUKI DOUBLE DANDA\n"
" 𑱃 U+11C43 BHAIKSUKI WORD SEPARATOR\n"
"Bhaiksuki — Gap fillers items: 2\n"
" 𑱄 U+11C44 BHAIKSUKI GAP FILLER-1\n"
" 𑱅 U+11C45 BHAIKSUKI GAP FILLER-2\n"
"Marchen — Punctuation items: 2\n"
" 𑱰 U+11C70 MARCHEN HEAD MARK\n"
" 𑱱 U+11C71 MARCHEN MARK SHAD\n"
"Makasar — Punctuation items: 2\n"
" 𑻷 U+11EF7 MAKASAR PASSIMBANG\n"
" 𑻸 U+11EF8 MAKASAR END OF SECTION\n"
"Cuneiform Numbers And Punctuation — Punctuation items: 5\n"
" 𒑰 U+12470 CUNEIFORM PUNCTUATION SIGN OLD ASSYRIAN WORD DIVIDER\n"
" 𒑱 U+12471 CUNEIFORM PUNCTUATION SIGN VERTICAL COLON\n"
" 𒑲 U+12472 CUNEIFORM PUNCTUATION SIGN DIAGONAL COLON\n"
" 𒑳 U+12473 CUNEIFORM PUNCTUATION SIGN DIAGONAL TRICOLON\n"
" 𒑴 U+12474 CUNEIFORM PUNCTUATION SIGN DIAGONAL QUADCOLON\n"
"Mro — Punctuation items: 2\n"
" 𖩮 U+16A6E MRO DANDA\n"
" 𖩯 U+16A6F MRO DOUBLE DANDA\n"
"Bassa Vah — Punctuation items: 1\n"
" 𖫵 U+16AF5 BASSA VAH FULL STOP\n"
"Pahawh Hmong — Punctuation items: 6\n"
" 𖬷 U+16B37 PAHAWH HMONG SIGN VOS THOM\n"
" 𖬸 U+16B38 PAHAWH HMONG SIGN VOS TSHAB CEEB\n"
" 𖬹 U+16B39 PAHAWH HMONG SIGN CIM CHEEM\n"
" 𖬺 U+16B3A PAHAWH HMONG SIGN VOS THIAB\n"
" 𖬻 U+16B3B PAHAWH HMONG SIGN VOS FEEM\n"
" 𖭄 U+16B44 PAHAWH HMONG SIGN XAUS\n"
"Medefaidrin — Punctuation items: 2\n"
" 𖺗 U+16E97 MEDEFAIDRIN COMMA\n"
" 𖺘 U+16E98 MEDEFAIDRIN FULL STOP\n"
"Medefaidrin — Sign items: 2\n"
" 𖺙 U+16E99 MEDEFAIDRIN SYMBOL AIVA\n"
" 𖺚 U+16E9A MEDEFAIDRIN EXCLAMATION OH\n"
"Duployan — Chinook punctuation items: 1\n"
" 𛲟 U+1BC9F DUPLOYAN PUNCTUATION CHINOOK FULL STOP\n"
"Sutton SignWriting — Punctuation items: 5\n"
" 𝪇 U+1DA87 SIGNWRITING COMMA\n"
" 𝪈 U+1DA88 SIGNWRITING FULL STOP\n"
" 𝪉 U+1DA89 SIGNWRITING SEMICOLON\n"
" 𝪊 U+1DA8A SIGNWRITING COLON\n"
" 𝪋 U+1DA8B SIGNWRITING PARENTHESIS\n"
"Adlam — Punctuation items: 2\n"
" 𞥞 U+1E95E ADLAM INITIAL EXCLAMATION MARK\n"
" 𞥟 U+1E95F ADLAM INITIAL QUESTION MARK")
# Scan the sample text and report every place the compiled pattern matches.
# finditer() returns a lazy iterator of non-overlapping Match objects, in
# left-to-right order.
# NOTE(review): the pattern writes supplementary-plane characters as UTF-16
# surrogate pairs (\uD800[...], \uD801..., etc.); Python str is indexed by
# code point, so those alternatives probably never match the astral sample
# characters in test_str -- confirm before relying on the output.
matches = regex.finditer(test_str)

for match_num, match in enumerate(matches, start=1):
    # start()/end() are offsets into test_str (end is exclusive).
    print(f"Match {match_num} was found at {match.start()}-{match.end()}: {match.group()}")

    # Report every capturing group of this match with its own span.
    # groups() is an empty tuple when the pattern has no capturing groups,
    # in which case this inner loop prints nothing.
    for group_num, group in enumerate(match.groups(), start=1):
        print(f"Group {group_num} found at {match.start(group_num)}-{match.end(group_num)}: {group}")
# Note: these code samples are generated automatically and are not guaranteed
# to work. If you find any syntax errors, feel free to submit a bug report.
# For a full regex reference for Python, see:
# https://docs.python.org/3/library/re.html