# coding=utf8
# the above tag defines encoding for this document and is for Python 2.x compatibility
import re
# Pattern matching exactly one punctuation character from an explicit,
# enumerated list of code points (the same characters listed in test_str).
# NOTE(review): the list looks like a generated snapshot of Unicode general
# category "P" -- confirm against the Unicode version you target.
#
# Supplementary-plane characters (above U+FFFF) are written as \UXXXXXXXX
# escapes.  A Python 3 str is a sequence of code points, so the UTF-16
# surrogate-pair spelling (e.g. \uD800[\uDD00-\uDD02]) would never match a real
# character such as U+10100; each pair has been converted to its code point.
#
# The value stays a plain (uncompiled) pattern string so that callers can still
# pass it to re.finditer()/re.search() together with flags.
regex = (
    r"["
    # Basic Latin and Latin-1 Supplement
    r"!-#%-\*,-\/:;\?@\[-\]_\{\}\xA1\xA7\xAB\xB6\xB7\xBB\xBF"
    # U+0370..U+08FF
    r"\u037E\u0387\u055A-\u055F\u0589\u058A\u05BE\u05C0\u05C3\u05C6\u05F3\u05F4"
    r"\u0609\u060A\u060C\u060D\u061B\u061E\u061F\u066A-\u066D\u06D4\u0700-\u070D"
    r"\u07F7-\u07F9\u0830-\u083E\u085E"
    # U+0900..U+10FF
    r"\u0964\u0965\u0970\u09FD\u0A76\u0AF0\u0C84\u0DF4\u0E4F\u0E5A\u0E5B"
    r"\u0F04-\u0F12\u0F14\u0F3A-\u0F3D\u0F85\u0FD0-\u0FD4\u0FD9\u0FDA"
    r"\u104A-\u104F\u10FB"
    # U+1300..U+1CFF
    r"\u1360-\u1368\u1400\u166D\u166E\u169B\u169C\u16EB-\u16ED\u1735\u1736"
    r"\u17D4-\u17D6\u17D8-\u17DA\u1800-\u180A\u1944\u1945\u1A1E\u1A1F"
    r"\u1AA0-\u1AA6\u1AA8-\u1AAD\u1B5A-\u1B60\u1BFC-\u1BFF\u1C3B-\u1C3F"
    r"\u1C7E\u1C7F\u1CC0-\u1CC7\u1CD3"
    # U+2000..U+2FFF
    r"\u2010-\u2027\u2030-\u2043\u2045-\u2051\u2053-\u205E\u207D\u207E"
    r"\u208D\u208E\u2308-\u230B\u2329\u232A\u2768-\u2775\u27C5\u27C6"
    r"\u27E6-\u27EF\u2983-\u2998\u29D8-\u29DB\u29FC\u29FD\u2CF9-\u2CFC"
    r"\u2CFE\u2CFF\u2D70\u2E00-\u2E2E\u2E30-\u2E4E"
    # U+3000..U+30FF
    r"\u3001-\u3003\u3008-\u3011\u3014-\u301F\u3030\u303D\u30A0\u30FB"
    # U+A000..U+ABFF
    r"\uA4FE\uA4FF\uA60D-\uA60F\uA673\uA67E\uA6F2-\uA6F7\uA874-\uA877"
    r"\uA8CE\uA8CF\uA8F8-\uA8FA\uA8FC\uA92E\uA92F\uA95F\uA9C1-\uA9CD"
    r"\uA9DE\uA9DF\uAA5C-\uAA5F\uAADE\uAADF\uAAF0\uAAF1\uABEB"
    # U+FD00..U+FFFF
    r"\uFD3E\uFD3F\uFE10-\uFE19\uFE30-\uFE52\uFE54-\uFE61\uFE63\uFE68"
    r"\uFE6A\uFE6B\uFF01-\uFF03\uFF05-\uFF0A\uFF0C-\uFF0F\uFF1A\uFF1B"
    r"\uFF1F\uFF20\uFF3B-\uFF3D\uFF3F\uFF5B\uFF5D\uFF5F-\uFF65"
    # U+10000..U+10FFF (formerly the \uD800..\uD803 surrogate-pair branches)
    r"\U00010100-\U00010102\U0001039F\U000103D0\U0001056F\U00010857"
    r"\U0001091F\U0001093F\U00010A50-\U00010A58\U00010A7F"
    r"\U00010AF0-\U00010AF6\U00010B39-\U00010B3F\U00010B99-\U00010B9C"
    r"\U00010F55-\U00010F59"
    # U+11000..U+11FFF (formerly the \uD804..\uD807 branches)
    r"\U00011047-\U0001104D\U000110BB\U000110BC\U000110BE-\U000110C1"
    r"\U00011140-\U00011143\U00011174\U00011175\U000111C5-\U000111C8"
    r"\U000111CD\U000111DB\U000111DD-\U000111DF\U00011238-\U0001123D"
    r"\U000112A9"
    r"\U0001144B-\U0001144F\U0001145B\U0001145D\U000114C6"
    r"\U000115C1-\U000115D7\U00011641-\U00011643\U00011660-\U0001166C"
    r"\U0001173C-\U0001173E"
    r"\U0001183B\U00011A3F-\U00011A46\U00011A9A-\U00011A9C"
    r"\U00011A9E-\U00011AA2"
    r"\U00011C41-\U00011C45\U00011C70\U00011C71\U00011EF7\U00011EF8"
    # U+12000 and above (formerly \uD809, \uD81A, \uD81B, \uD82F, \uD836, \uD83A)
    r"\U00012470-\U00012474"
    r"\U00016A6E\U00016A6F\U00016AF5\U00016B37-\U00016B3B\U00016B44"
    r"\U00016E97-\U00016E9A"
    r"\U0001BC9F"
    r"\U0001DA87-\U0001DA8B"
    r"\U0001E95E\U0001E95F"
    r"]"
)
test_str = ("\n"
"Basic Latin — ASCII punctuation and symbols items: 23\n"
" ! U+0021 EXCLAMATION MARK\n"
" \" U+0022 QUOTATION MARK\n"
" # U+0023 NUMBER SIGN\n"
" % U+0025 PERCENT SIGN\n"
" & U+0026 AMPERSAND\n"
" ' U+0027 APOSTROPHE\n"
" ( U+0028 LEFT PARENTHESIS\n"
" ) U+0029 RIGHT PARENTHESIS\n"
" * U+002A ASTERISK\n"
" , U+002C COMMA\n"
" - U+002D HYPHEN-MINUS\n"
" . U+002E FULL STOP\n"
" / U+002F SOLIDUS\n"
" : U+003A COLON\n"
" ; U+003B SEMICOLON\n"
" ? U+003F QUESTION MARK\n"
" @ U+0040 COMMERCIAL AT\n"
" [ U+005B LEFT SQUARE BRACKET\n"
" \\ U+005C REVERSE SOLIDUS\n"
" ] U+005D RIGHT SQUARE BRACKET\n"
" _ U+005F LOW LINE\n"
" { U+007B LEFT CURLY BRACKET\n"
" } U+007D RIGHT CURLY BRACKET\n"
"Latin 1 Supplement — Latin-1 punctuation and symbols items: 6\n"
" ¡ U+00A1 INVERTED EXCLAMATION MARK\n"
" § U+00A7 SECTION SIGN\n"
" « U+00AB LEFT-POINTING DOUBLE ANGLE QUOTATION MARK\n"
" ¶ U+00B6 PILCROW SIGN\n"
" · U+00B7 MIDDLE DOT\n"
" » U+00BB RIGHT-POINTING DOUBLE ANGLE QUOTATION MARK\n"
"Latin 1 Supplement — Punctuation items: 1\n"
" ¿ U+00BF INVERTED QUESTION MARK\n"
"Greek And Coptic — Punctuation items: 2\n"
" ; U+037E GREEK QUESTION MARK\n"
" · U+0387 GREEK ANO TELEIA\n"
"Armenian — Modifier letter items: 6\n"
" ՚ U+055A ARMENIAN APOSTROPHE\n"
" ՛ U+055B ARMENIAN EMPHASIS MARK\n"
" ՜ U+055C ARMENIAN EXCLAMATION MARK\n"
" ՝ U+055D ARMENIAN COMMA\n"
" ՞ U+055E ARMENIAN QUESTION MARK\n"
" ՟ U+055F ARMENIAN ABBREVIATION MARK\n"
"Armenian — Punctuation items: 2\n"
" ։ U+0589 ARMENIAN FULL STOP\n"
" ֊ U+058A ARMENIAN HYPHEN\n"
"Hebrew — Points and punctuation items: 4\n"
" ־ U+05BE HEBREW PUNCTUATION MAQAF\n"
" ׀ U+05C0 HEBREW PUNCTUATION PASEQ\n"
" ׃ U+05C3 HEBREW PUNCTUATION SOF PASUQ\n"
" ׆ U+05C6 HEBREW PUNCTUATION NUN HAFUKHA\n"
"Hebrew — Punctuation items: 2\n"
" ׳ U+05F3 HEBREW PUNCTUATION GERESH\n"
" ״ U+05F4 HEBREW PUNCTUATION GERSHAYIM\n"
"Arabic — Punctuation items: 12\n"
" ؉ U+0609 ARABIC-INDIC PER MILLE SIGN\n"
" ؊ U+060A ARABIC-INDIC PER TEN THOUSAND SIGN\n"
" ، U+060C ARABIC COMMA\n"
" ؍ U+060D ARABIC DATE SEPARATOR\n"
" ؛ U+061B ARABIC SEMICOLON\n"
" ؞ U+061E ARABIC TRIPLE DOT PUNCTUATION MARK\n"
" ؟ U+061F ARABIC QUESTION MARK\n"
" ٪ U+066A ARABIC PERCENT SIGN\n"
" ٫ U+066B ARABIC DECIMAL SEPARATOR\n"
" ٬ U+066C ARABIC THOUSANDS SEPARATOR\n"
" ٭ U+066D ARABIC FIVE POINTED STAR\n"
" ۔ U+06D4 ARABIC FULL STOP\n"
"Syriac — Syriac punctuation and signs items: 14\n"
" ܀ U+0700 SYRIAC END OF PARAGRAPH\n"
" ܁ U+0701 SYRIAC SUPRALINEAR FULL STOP\n"
" ܂ U+0702 SYRIAC SUBLINEAR FULL STOP\n"
" ܃ U+0703 SYRIAC SUPRALINEAR COLON\n"
" ܄ U+0704 SYRIAC SUBLINEAR COLON\n"
" ܅ U+0705 SYRIAC HORIZONTAL COLON\n"
" ܆ U+0706 SYRIAC COLON SKEWED LEFT\n"
" ܇ U+0707 SYRIAC COLON SKEWED RIGHT\n"
" ܈ U+0708 SYRIAC SUPRALINEAR COLON SKEWED LEFT\n"
" ܉ U+0709 SYRIAC SUBLINEAR COLON SKEWED RIGHT\n"
" ܊ U+070A SYRIAC CONTRACTION\n"
" ܋ U+070B SYRIAC HARKLEAN OBELUS\n"
" ܌ U+070C SYRIAC HARKLEAN METOBELUS\n"
" ܍ U+070D SYRIAC HARKLEAN ASTERISCUS\n"
"NKo — Punctuation items: 3\n"
" ߷ U+07F7 NKO SYMBOL GBAKURUNEN\n"
" ߸ U+07F8 NKO COMMA\n"
" ߹ U+07F9 NKO EXCLAMATION MARK\n"
"Samaritan — Punctuation items: 15\n"
" ࠰ U+0830 SAMARITAN PUNCTUATION NEQUDAA\n"
" ࠱ U+0831 SAMARITAN PUNCTUATION AFSAAQ\n"
" ࠲ U+0832 SAMARITAN PUNCTUATION ANGED\n"
" ࠳ U+0833 SAMARITAN PUNCTUATION BAU\n"
" ࠴ U+0834 SAMARITAN PUNCTUATION ATMAAU\n"
" ࠵ U+0835 SAMARITAN PUNCTUATION SHIYYAALAA\n"
" ࠶ U+0836 SAMARITAN ABBREVIATION MARK\n"
" ࠷ U+0837 SAMARITAN PUNCTUATION MELODIC QITSA\n"
" ࠸ U+0838 SAMARITAN PUNCTUATION ZIQAA\n"
" ࠹ U+0839 SAMARITAN PUNCTUATION QITSA\n"
" ࠺ U+083A SAMARITAN PUNCTUATION ZAEF\n"
" ࠻ U+083B SAMARITAN PUNCTUATION TURU\n"
" ࠼ U+083C SAMARITAN PUNCTUATION ARKAANU\n"
" ࠽ U+083D SAMARITAN PUNCTUATION SOF MASHFAAT\n"
" ࠾ U+083E SAMARITAN PUNCTUATION ANNAAU\n"
"Mandaic — Punctuation items: 1\n"
" ࡞ U+085E MANDAIC PUNCTUATION\n"
"Devanagari — Generic punctuation for scripts of India items: 2\n"
" । U+0964 DEVANAGARI DANDA\n"
" ॥ U+0965 DEVANAGARI DOUBLE DANDA\n"
"Devanagari — Abbreviation mark items: 1\n"
" ॰ U+0970 DEVANAGARI ABBREVIATION SIGN\n"
"Bengali — Sign items: 1\n"
" ৽ U+09FD BENGALI ABBREVIATION SIGN\n"
"Gurmukhi — Sign items: 1\n"
" ੶ U+0A76 GURMUKHI ABBREVIATION SIGN\n"
"Gujarati — Abbreviation mark items: 1\n"
" ૰ U+0AF0 GUJARATI ABBREVIATION SIGN\n"
"Kannada — Various signs items: 1\n"
" ಄ U+0C84 KANNADA SIGN SIDDHAM\n"
"Sinhala — Punctuation items: 1\n"
" ෴ U+0DF4 SINHALA PUNCTUATION KUNDDALIYA\n"
"Thai — Sign items: 3\n"
" ๏ U+0E4F THAI CHARACTER FONGMAN\n"
" ๚ U+0E5A THAI CHARACTER ANGKHANKHU\n"
" ๛ U+0E5B THAI CHARACTER KHOMUT\n"
"Tibetan — Head mark items: 6\n"
" ༄ U+0F04 TIBETAN MARK INITIAL YIG MGO MDUN MA\n"
" ༅ U+0F05 TIBETAN MARK CLOSING YIG MGO SGAB MA\n"
" ༆ U+0F06 TIBETAN MARK CARET YIG MGO PHUR SHAD MA\n"
" ༇ U+0F07 TIBETAN MARK YIG MGO TSHEG SHAD MA\n"
" ࿓ U+0FD3 TIBETAN MARK INITIAL BRDA RNYING YIG MGO MDUN MA\n"
" ࿔ U+0FD4 TIBETAN MARK CLOSING BRDA RNYING YIG MGO SGAB MA\n"
"Tibetan — Sign items: 16\n"
" ༈ U+0F08 TIBETAN MARK SBRUL SHAD\n"
" ༉ U+0F09 TIBETAN MARK BSKUR YIG MGO\n"
" ༊ U+0F0A TIBETAN MARK BKA- SHOG YIG MGO\n"
" ་ U+0F0B TIBETAN MARK INTERSYLLABIC TSHEG\n"
" ༌ U+0F0C TIBETAN MARK DELIMITER TSHEG BSTAR\n"
" ། U+0F0D TIBETAN MARK SHAD\n"
" ༎ U+0F0E TIBETAN MARK NYIS SHAD\n"
" ༏ U+0F0F TIBETAN MARK TSHEG SHAD\n"
" ༐ U+0F10 TIBETAN MARK NYIS TSHEG SHAD\n"
" ༑ U+0F11 TIBETAN MARK RIN CHEN SPUNGS SHAD\n"
" ༒ U+0F12 TIBETAN MARK RGYA GRAM SHAD\n"
" ༔ U+0F14 TIBETAN MARK GTER TSHEG\n"
" ྅ U+0F85 TIBETAN MARK PALUTA\n"
" ࿐ U+0FD0 TIBETAN MARK BSKA- SHOG GI MGO RGYAN\n"
" ࿑ U+0FD1 TIBETAN MARK MNYAM YIG GI MGO RGYAN\n"
" ࿒ U+0FD2 TIBETAN MARK NYIS TSHEG\n"
"Tibetan — Paired punctuation items: 4\n"
" ༺ U+0F3A TIBETAN MARK GUG RTAGS GYON\n"
" ༻ U+0F3B TIBETAN MARK GUG RTAGS GYAS\n"
" ༼ U+0F3C TIBETAN MARK ANG KHANG GYON\n"
" ༽ U+0F3D TIBETAN MARK ANG KHANG GYAS\n"
"Tibetan — Annotation marks items: 2\n"
" ࿙ U+0FD9 TIBETAN MARK LEADING MCHAN RTAGS\n"
" ࿚ U+0FDA TIBETAN MARK TRAILING MCHAN RTAGS\n"
"Myanmar — Punctuation items: 2\n"
" ၊ U+104A MYANMAR SIGN LITTLE SECTION\n"
" ။ U+104B MYANMAR SIGN SECTION\n"
"Myanmar — Various signs items: 4\n"
" ၌ U+104C MYANMAR SYMBOL LOCATIVE\n"
" ၍ U+104D MYANMAR SYMBOL COMPLETED\n"
" ၎ U+104E MYANMAR SYMBOL AFOREMENTIONED\n"
" ၏ U+104F MYANMAR SYMBOL GENITIVE\n"
"Georgian — Punctuation items: 1\n"
" ჻ U+10FB GEORGIAN PARAGRAPH SEPARATOR\n"
"Ethiopic — Punctuation items: 9\n"
" ፠ U+1360 ETHIOPIC SECTION MARK\n"
" ፡ U+1361 ETHIOPIC WORDSPACE\n"
" ። U+1362 ETHIOPIC FULL STOP\n"
" ፣ U+1363 ETHIOPIC COMMA\n"
" ፤ U+1364 ETHIOPIC SEMICOLON\n"
" ፥ U+1365 ETHIOPIC COLON\n"
" ፦ U+1366 ETHIOPIC PREFACE COLON\n"
" ፧ U+1367 ETHIOPIC QUESTION MARK\n"
" ፨ U+1368 ETHIOPIC PARAGRAPH SEPARATOR\n"
"Unified Canadian Aboriginal Syllabics — Punctuation items: 2\n"
" ᐀ U+1400 CANADIAN SYLLABICS HYPHEN\n"
" ᙮ U+166E CANADIAN SYLLABICS FULL STOP\n"
"Unified Canadian Aboriginal Syllabics — Sign items: 1\n"
" ᙭ U+166D CANADIAN SYLLABICS CHI SIGN\n"
"Ogham — Punctuation items: 2\n"
" ᚛ U+169B OGHAM FEATHER MARK\n"
" ᚜ U+169C OGHAM REVERSED FEATHER MARK\n"
"Runic — Punctuation items: 3\n"
" ᛫ U+16EB RUNIC SINGLE PUNCTUATION\n"
" ᛬ U+16EC RUNIC MULTIPLE PUNCTUATION\n"
" ᛭ U+16ED RUNIC CROSS PUNCTUATION\n"
"Hanunoo — Generic punctuation for Philippine scripts items: 2\n"
" ᜵ U+1735 PHILIPPINE SINGLE PUNCTUATION\n"
" ᜶ U+1736 PHILIPPINE DOUBLE PUNCTUATION\n"
"Khmer — Various signs items: 6\n"
" ។ U+17D4 KHMER SIGN KHAN\n"
" ៕ U+17D5 KHMER SIGN BARIYOOSAN\n"
" ៖ U+17D6 KHMER SIGN CAMNUC PII KUUH\n"
" ៘ U+17D8 KHMER SIGN BEYYAL\n"
" ៙ U+17D9 KHMER SIGN PHNAEK MUAN\n"
" ៚ U+17DA KHMER SIGN KOOMUUT\n"
"Mongolian — Punctuation items: 11\n"
" ᠀ U+1800 MONGOLIAN BIRGA\n"
" ᠁ U+1801 MONGOLIAN ELLIPSIS\n"
" ᠂ U+1802 MONGOLIAN COMMA\n"
" ᠃ U+1803 MONGOLIAN FULL STOP\n"
" ᠄ U+1804 MONGOLIAN COLON\n"
" ᠅ U+1805 MONGOLIAN FOUR DOTS\n"
" ᠆ U+1806 MONGOLIAN TODO SOFT HYPHEN\n"
" ᠇ U+1807 MONGOLIAN SIBE SYLLABLE BOUNDARY MARKER\n"
" ᠈ U+1808 MONGOLIAN MANCHU COMMA\n"
" ᠉ U+1809 MONGOLIAN MANCHU FULL STOP\n"
" ᠊ U+180A MONGOLIAN NIRUGU\n"
"Limbu — Various signs items: 2\n"
" ᥄ U+1944 LIMBU EXCLAMATION MARK\n"
" ᥅ U+1945 LIMBU QUESTION MARK\n"
"Buginese — Various signs items: 2\n"
" ᨞ U+1A1E BUGINESE PALLAWA\n"
" ᨟ U+1A1F BUGINESE END OF SECTION\n"
"Tai Tham — Logographs items: 3\n"
" ᪠ U+1AA0 TAI THAM SIGN WIANG\n"
" ᪡ U+1AA1 TAI THAM SIGN WIANGWAAK\n"
" ᪢ U+1AA2 TAI THAM SIGN SAWAN\n"
"Tai Tham — Punctuation items: 10\n"
" ᪣ U+1AA3 TAI THAM SIGN KEOW\n"
" ᪤ U+1AA4 TAI THAM SIGN HOY\n"
" ᪥ U+1AA5 TAI THAM SIGN DOKMAI\n"
" ᪦ U+1AA6 TAI THAM SIGN REVERSED ROTATED RANA\n"
" ᪨ U+1AA8 TAI THAM SIGN KAAN\n"
" ᪩ U+1AA9 TAI THAM SIGN KAANKUU\n"
" ᪪ U+1AAA TAI THAM SIGN SATKAAN\n"
" ᪫ U+1AAB TAI THAM SIGN SATKAANKUU\n"
" ᪬ U+1AAC TAI THAM SIGN HANG\n"
" ᪭ U+1AAD TAI THAM SIGN CAANG\n"
"Balinese — Punctuation items: 7\n"
" ᭚ U+1B5A BALINESE PANTI\n"
" ᭛ U+1B5B BALINESE PAMADA\n"
" ᭜ U+1B5C BALINESE WINDU\n"
" ᭝ U+1B5D BALINESE CARIK PAMUNGKAH\n"
" ᭞ U+1B5E BALINESE CARIK SIKI\n"
" ᭟ U+1B5F BALINESE CARIK PAREREN\n"
" ᭠ U+1B60 BALINESE PAMENENG\n"
"Batak — Punctuation items: 4\n"
" ᯼ U+1BFC BATAK SYMBOL BINDU NA METEK\n"
" ᯽ U+1BFD BATAK SYMBOL BINDU PINARBORAS\n"
" ᯾ U+1BFE BATAK SYMBOL BINDU JUDUL\n"
" ᯿ U+1BFF BATAK SYMBOL BINDU PANGOLAT\n"
"Lepcha — Punctuation items: 5\n"
" ᰻ U+1C3B LEPCHA PUNCTUATION TA-ROL\n"
" ᰼ U+1C3C LEPCHA PUNCTUATION NYET THYOOM TA-ROL\n"
" ᰽ U+1C3D LEPCHA PUNCTUATION CER-WA\n"
" ᰾ U+1C3E LEPCHA PUNCTUATION TSHOOK CER-WA\n"
" ᰿ U+1C3F LEPCHA PUNCTUATION TSHOOK\n"
"Ol Chiki — Punctuation items: 2\n"
" ᱾ U+1C7E OL CHIKI PUNCTUATION MUCAAD\n"
" ᱿ U+1C7F OL CHIKI PUNCTUATION DOUBLE MUCAAD\n"
"Sundanese Supplement — Punctuation items: 8\n"
" ᳀ U+1CC0 SUNDANESE PUNCTUATION BINDU SURYA\n"
" ᳁ U+1CC1 SUNDANESE PUNCTUATION BINDU PANGLONG\n"
" ᳂ U+1CC2 SUNDANESE PUNCTUATION BINDU PURNAMA\n"
" ᳃ U+1CC3 SUNDANESE PUNCTUATION BINDU CAKRA\n"
" ᳄ U+1CC4 SUNDANESE PUNCTUATION BINDU LEU SATANGA\n"
" ᳅ U+1CC5 SUNDANESE PUNCTUATION BINDU KA SATANGA\n"
" ᳆ U+1CC6 SUNDANESE PUNCTUATION BINDU DA SATANGA\n"
" ᳇ U+1CC7 SUNDANESE PUNCTUATION BINDU BA SATANGA\n"
"Vedic Extensions — Breathing mark for the Samaveda items: 1\n"
" ᳓ U+1CD3 VEDIC SIGN NIHSHVASA\n"
"General Punctuation — Dashes items: 6\n"
" ‐ U+2010 HYPHEN\n"
" ‑ U+2011 NON-BREAKING HYPHEN\n"
" ‒ U+2012 FIGURE DASH\n"
" – U+2013 EN DASH\n"
" — U+2014 EM DASH\n"
" ― U+2015 HORIZONTAL BAR\n"
"General Punctuation — General punctuation items: 39\n"
" ‖ U+2016 DOUBLE VERTICAL LINE\n"
" ‗ U+2017 DOUBLE LOW LINE\n"
" † U+2020 DAGGER\n"
" ‡ U+2021 DOUBLE DAGGER\n"
" • U+2022 BULLET\n"
" ‣ U+2023 TRIANGULAR BULLET\n"
" ․ U+2024 ONE DOT LEADER\n"
" ‥ U+2025 TWO DOT LEADER\n"
" … U+2026 HORIZONTAL ELLIPSIS\n"
" ‧ U+2027 HYPHENATION POINT\n"
" ‰ U+2030 PER MILLE SIGN\n"
" ‱ U+2031 PER TEN THOUSAND SIGN\n"
" ′ U+2032 PRIME\n"
" ″ U+2033 DOUBLE PRIME\n"
" ‴ U+2034 TRIPLE PRIME\n"
" ‵ U+2035 REVERSED PRIME\n"
" ‶ U+2036 REVERSED DOUBLE PRIME\n"
" ‷ U+2037 REVERSED TRIPLE PRIME\n"
" ‸ U+2038 CARET\n"
" ※ U+203B REFERENCE MARK\n"
" ‽ U+203D INTERROBANG\n"
" ‾ U+203E OVERLINE\n"
" ‿ U+203F UNDERTIE\n"
" ⁀ U+2040 CHARACTER TIE\n"
" ⁁ U+2041 CARET INSERTION POINT\n"
" ⁂ U+2042 ASTERISM\n"
" ⁃ U+2043 HYPHEN BULLET\n"
" ⁊ U+204A TIRONIAN SIGN ET\n"
" ⁋ U+204B REVERSED PILCROW SIGN\n"
" ⁌ U+204C BLACK LEFTWARDS BULLET\n"
" ⁍ U+204D BLACK RIGHTWARDS BULLET\n"
" ⁎ U+204E LOW ASTERISK\n"
" ⁏ U+204F REVERSED SEMICOLON\n"
" ⁐ U+2050 CLOSE UP\n"
" ⁑ U+2051 TWO ASTERISKS ALIGNED VERTICALLY\n"
" ⁓ U+2053 SWUNG DASH\n"
" ⁔ U+2054 INVERTED UNDERTIE\n"
" ⁕ U+2055 FLOWER PUNCTUATION MARK\n"
" ⁗ U+2057 QUADRUPLE PRIME\n"
"General Punctuation — Quotation marks and apostrophe items: 8\n"
" ‘ U+2018 LEFT SINGLE QUOTATION MARK\n"
" ’ U+2019 RIGHT SINGLE QUOTATION MARK\n"
" ‚ U+201A SINGLE LOW-9 QUOTATION MARK\n"
" ‛ U+201B SINGLE HIGH-REVERSED-9 QUOTATION MARK\n"
" “ U+201C LEFT DOUBLE QUOTATION MARK\n"
" ” U+201D RIGHT DOUBLE QUOTATION MARK\n"
" „ U+201E DOUBLE LOW-9 QUOTATION MARK\n"
" ‟ U+201F DOUBLE HIGH-REVERSED-9 QUOTATION MARK\n"
"General Punctuation — Quotation marks items: 2\n"
" ‹ U+2039 SINGLE LEFT-POINTING ANGLE QUOTATION MARK\n"
" › U+203A SINGLE RIGHT-POINTING ANGLE QUOTATION MARK\n"
"General Punctuation — Double punctuation for vertical text items: 4\n"
" ‼️ U+203C DOUBLE EXCLAMATION MARK\n"
" ⁇ U+2047 DOUBLE QUESTION MARK\n"
" ⁈ U+2048 QUESTION EXCLAMATION MARK\n"
" ⁉️ U+2049 EXCLAMATION QUESTION MARK\n"
"General Punctuation — Brackets items: 2\n"
" ⁅ U+2045 LEFT SQUARE BRACKET WITH QUILL\n"
" ⁆ U+2046 RIGHT SQUARE BRACKET WITH QUILL\n"
"General Punctuation — Archaic punctuation items: 8\n"
" ⁖ U+2056 THREE DOT PUNCTUATION\n"
" ⁘ U+2058 FOUR DOT PUNCTUATION\n"
" ⁙ U+2059 FIVE DOT PUNCTUATION\n"
" ⁚ U+205A TWO DOT PUNCTUATION\n"
" ⁛ U+205B FOUR DOT MARK\n"
" ⁜ U+205C DOTTED CROSS\n"
" ⁝ U+205D TRICOLON\n"
" ⁞ U+205E VERTICAL FOUR DOTS\n"
"Superscripts And Subscripts — Superscripts items: 2\n"
" ⁽ U+207D SUPERSCRIPT LEFT PARENTHESIS\n"
" ⁾ U+207E SUPERSCRIPT RIGHT PARENTHESIS\n"
"Superscripts And Subscripts — Subscripts items: 2\n"
" ₍ U+208D SUBSCRIPT LEFT PARENTHESIS\n"
" ₎ U+208E SUBSCRIPT RIGHT PARENTHESIS\n"
"Miscellaneous Technical — Ceilings and floors items: 4\n"
" ⌈ U+2308 LEFT CEILING\n"
" ⌉ U+2309 RIGHT CEILING\n"
" ⌊ U+230A LEFT FLOOR\n"
" ⌋ U+230B RIGHT FLOOR\n"
"Miscellaneous Technical — Deprecated angle brackets items: 2\n"
" 〈 U+2329 LEFT-POINTING ANGLE BRACKET\n"
" 〉 U+232A RIGHT-POINTING ANGLE BRACKET\n"
"Dingbats — Ornamental brackets items: 14\n"
" ❨ U+2768 MEDIUM LEFT PARENTHESIS ORNAMENT\n"
" ❩ U+2769 MEDIUM RIGHT PARENTHESIS ORNAMENT\n"
" ❪ U+276A MEDIUM FLATTENED LEFT PARENTHESIS ORNAMENT\n"
" ❫ U+276B MEDIUM FLATTENED RIGHT PARENTHESIS ORNAMENT\n"
" ❬ U+276C MEDIUM LEFT-POINTING ANGLE BRACKET ORNAMENT\n"
" ❭ U+276D MEDIUM RIGHT-POINTING ANGLE BRACKET ORNAMENT\n"
" ❮ U+276E HEAVY LEFT-POINTING ANGLE QUOTATION MARK ORNAMENT\n"
" ❯ U+276F HEAVY RIGHT-POINTING ANGLE QUOTATION MARK ORNAMENT\n"
" ❰ U+2770 HEAVY LEFT-POINTING ANGLE BRACKET ORNAMENT\n"
" ❱ U+2771 HEAVY RIGHT-POINTING ANGLE BRACKET ORNAMENT\n"
" ❲ U+2772 LIGHT LEFT TORTOISE SHELL BRACKET ORNAMENT\n"
" ❳ U+2773 LIGHT RIGHT TORTOISE SHELL BRACKET ORNAMENT\n"
" ❴ U+2774 MEDIUM LEFT CURLY BRACKET ORNAMENT\n"
" ❵ U+2775 MEDIUM RIGHT CURLY BRACKET ORNAMENT\n"
"Miscellaneous Mathematical Symbols A — Paired punctuation items: 2\n"
" ⟅ U+27C5 LEFT S-SHAPED BAG DELIMITER\n"
" ⟆ U+27C6 RIGHT S-SHAPED BAG DELIMITER\n"
"Miscellaneous Mathematical Symbols A — Mathematical brackets items: 10\n"
" ⟦ U+27E6 MATHEMATICAL LEFT WHITE SQUARE BRACKET\n"
" ⟧ U+27E7 MATHEMATICAL RIGHT WHITE SQUARE BRACKET\n"
" ⟨ U+27E8 MATHEMATICAL LEFT ANGLE BRACKET\n"
" ⟩ U+27E9 MATHEMATICAL RIGHT ANGLE BRACKET\n"
" ⟪ U+27EA MATHEMATICAL LEFT DOUBLE ANGLE BRACKET\n"
" ⟫ U+27EB MATHEMATICAL RIGHT DOUBLE ANGLE BRACKET\n"
" ⟬ U+27EC MATHEMATICAL LEFT WHITE TORTOISE SHELL BRACKET\n"
" ⟭ U+27ED MATHEMATICAL RIGHT WHITE TORTOISE SHELL BRACKET\n"
" ⟮ U+27EE MATHEMATICAL LEFT FLATTENED PARENTHESIS\n"
" ⟯ U+27EF MATHEMATICAL RIGHT FLATTENED PARENTHESIS\n"
"Miscellaneous Mathematical Symbols B — Brackets items: 20\n"
" ⦃ U+2983 LEFT WHITE CURLY BRACKET\n"
" ⦄ U+2984 RIGHT WHITE CURLY BRACKET\n"
" ⦅ U+2985 LEFT WHITE PARENTHESIS\n"
" ⦆ U+2986 RIGHT WHITE PARENTHESIS\n"
" ⦇ U+2987 Z NOTATION LEFT IMAGE BRACKET\n"
" ⦈ U+2988 Z NOTATION RIGHT IMAGE BRACKET\n"
" ⦉ U+2989 Z NOTATION LEFT BINDING BRACKET\n"
" ⦊ U+298A Z NOTATION RIGHT BINDING BRACKET\n"
" ⦋ U+298B LEFT SQUARE BRACKET WITH UNDERBAR\n"
" ⦌ U+298C RIGHT SQUARE BRACKET WITH UNDERBAR\n"
" ⦑ U+2991 LEFT ANGLE BRACKET WITH DOT\n"
" ⦒ U+2992 RIGHT ANGLE BRACKET WITH DOT\n"
" ⦓ U+2993 LEFT ARC LESS-THAN BRACKET\n"
" ⦔ U+2994 RIGHT ARC GREATER-THAN BRACKET\n"
" ⦕ U+2995 DOUBLE LEFT ARC GREATER-THAN BRACKET\n"
" ⦖ U+2996 DOUBLE RIGHT ARC LESS-THAN BRACKET\n"
" ⦗ U+2997 LEFT BLACK TORTOISE SHELL BRACKET\n"
" ⦘ U+2998 RIGHT BLACK TORTOISE SHELL BRACKET\n"
" ⧼ U+29FC LEFT-POINTING CURVED ANGLE BRACKET\n"
" ⧽ U+29FD RIGHT-POINTING CURVED ANGLE BRACKET\n"
"Miscellaneous Mathematical Symbols B — Brackets with ticks items: 4\n"
" ⦍ U+298D LEFT SQUARE BRACKET WITH TICK IN TOP CORNER\n"
" ⦎ U+298E RIGHT SQUARE BRACKET WITH TICK IN BOTTOM CORNER\n"
" ⦏ U+298F LEFT SQUARE BRACKET WITH TICK IN BOTTOM CORNER\n"
" ⦐ U+2990 RIGHT SQUARE BRACKET WITH TICK IN TOP CORNER\n"
"Miscellaneous Mathematical Symbols B — Fences items: 4\n"
" ⧘ U+29D8 LEFT WIGGLY FENCE\n"
" ⧙ U+29D9 RIGHT WIGGLY FENCE\n"
" ⧚ U+29DA LEFT DOUBLE WIGGLY FENCE\n"
" ⧛ U+29DB RIGHT DOUBLE WIGGLY FENCE\n"
"Coptic — Old Nubian punctuation items: 4\n"
" ⳹ U+2CF9 COPTIC OLD NUBIAN FULL STOP\n"
" ⳺ U+2CFA COPTIC OLD NUBIAN DIRECT QUESTION MARK\n"
" ⳻ U+2CFB COPTIC OLD NUBIAN INDIRECT QUESTION MARK\n"
" ⳼ U+2CFC COPTIC OLD NUBIAN VERSE DIVIDER\n"
"Coptic — Punctuation items: 2\n"
" ⳾ U+2CFE COPTIC FULL STOP\n"
" ⳿ U+2CFF COPTIC MORPHOLOGICAL DIVIDER\n"
"Tifinagh — Punctuation items: 1\n"
" ⵰ U+2D70 TIFINAGH SEPARATOR MARK\n"
"Supplemental Punctuation — New Testament editorial symbols items: 14\n"
" ⸀ U+2E00 RIGHT ANGLE SUBSTITUTION MARKER\n"
" ⸁ U+2E01 RIGHT ANGLE DOTTED SUBSTITUTION MARKER\n"
" ⸂ U+2E02 LEFT SUBSTITUTION BRACKET\n"
" ⸃ U+2E03 RIGHT SUBSTITUTION BRACKET\n"
" ⸄ U+2E04 LEFT DOTTED SUBSTITUTION BRACKET\n"
" ⸅ U+2E05 RIGHT DOTTED SUBSTITUTION BRACKET\n"
" ⸆ U+2E06 RAISED INTERPOLATION MARKER\n"
" ⸇ U+2E07 RAISED DOTTED INTERPOLATION MARKER\n"
" ⸈ U+2E08 DOTTED TRANSPOSITION MARKER\n"
" ⸉ U+2E09 LEFT TRANSPOSITION BRACKET\n"
" ⸊ U+2E0A RIGHT TRANSPOSITION BRACKET\n"
" ⸋ U+2E0B RAISED SQUARE\n"
" ⸌ U+2E0C LEFT RAISED OMISSION BRACKET\n"
" ⸍ U+2E0D RIGHT RAISED OMISSION BRACKET\n"
"Supplemental Punctuation — Ancient Greek textual symbols items: 9\n"
" ⸎ U+2E0E EDITORIAL CORONIS\n"
" ⸏ U+2E0F PARAGRAPHOS\n"
" ⸐ U+2E10 FORKED PARAGRAPHOS\n"
" ⸑ U+2E11 REVERSED FORKED PARAGRAPHOS\n"
" ⸒ U+2E12 HYPODIASTOLE\n"
" ⸓ U+2E13 DOTTED OBELOS\n"
" ⸔ U+2E14 DOWNWARDS ANCORA\n"
" ⸕ U+2E15 UPWARDS ANCORA\n"
" ⸖ U+2E16 DOTTED RIGHT-POINTING ANGLE\n"
"Supplemental Punctuation — Ancient Near-Eastern linguistic symbol items: 1\n"
" ⸗ U+2E17 DOUBLE OBLIQUE HYPHEN\n"
"Supplemental Punctuation — General punctuation items: 2\n"
" ⸘ U+2E18 INVERTED INTERROBANG\n"
" ⸙ U+2E19 PALM BRANCH\n"
"Supplemental Punctuation — Dictionary punctuation items: 4\n"
" ⸚ U+2E1A HYPHEN WITH DIAERESIS\n"
" ⸛ U+2E1B TILDE WITH RING ABOVE\n"
" ⸞ U+2E1E TILDE WITH DOT ABOVE\n"
" ⸟ U+2E1F TILDE WITH DOT BELOW\n"
"Supplemental Punctuation — Brackets items: 8\n"
" ⸜ U+2E1C LEFT LOW PARAPHRASE BRACKET\n"
" ⸝ U+2E1D RIGHT LOW PARAPHRASE BRACKET\n"
" ⸠ U+2E20 LEFT VERTICAL BAR WITH QUILL\n"
" ⸡ U+2E21 RIGHT VERTICAL BAR WITH QUILL\n"
" ⸦ U+2E26 LEFT SIDEWAYS U BRACKET\n"
" ⸧ U+2E27 RIGHT SIDEWAYS U BRACKET\n"
" ⸨ U+2E28 LEFT DOUBLE PARENTHESIS\n"
" ⸩ U+2E29 RIGHT DOUBLE PARENTHESIS\n"
"Supplemental Punctuation — Half brackets items: 4\n"
" ⸢ U+2E22 TOP LEFT HALF BRACKET\n"
" ⸣ U+2E23 TOP RIGHT HALF BRACKET\n"
" ⸤ U+2E24 BOTTOM LEFT HALF BRACKET\n"
" ⸥ U+2E25 BOTTOM RIGHT HALF BRACKET\n"
"Supplemental Punctuation — Archaic punctuation items: 15\n"
" ⸪ U+2E2A TWO DOTS OVER ONE DOT PUNCTUATION\n"
" ⸫ U+2E2B ONE DOT OVER TWO DOTS PUNCTUATION\n"
" ⸬ U+2E2C SQUARED FOUR DOT PUNCTUATION\n"
" ⸭ U+2E2D FIVE DOT MARK\n"
" ⸮ U+2E2E REVERSED QUESTION MARK\n"
" ⸰ U+2E30 RING POINT\n"
" ⸱ U+2E31 WORD SEPARATOR MIDDLE DOT\n"
" ⸳ U+2E33 RAISED DOT\n"
" ⸴ U+2E34 RAISED COMMA\n"
" ⸿ U+2E3F CAPITULUM\n"
" ⹊ U+2E4A DOTTED SOLIDUS\n"
" ⹋ U+2E4B TRIPLE DAGGER\n"
" ⹌ U+2E4C MEDIEVAL COMMA\n"
" ⹍ U+2E4D PARAGRAPHUS MARK\n"
" ⹎ U+2E4E PUNCTUS ELEVATUS MARK\n"
"Supplemental Punctuation — Palaeotype transliteration symbol items: 6\n"
" ⸲ U+2E32 TURNED COMMA\n"
" ⸵ U+2E35 TURNED SEMICOLON\n"
" ⸶ U+2E36 DAGGER WITH LEFT GUARD\n"
" ⸷ U+2E37 DAGGER WITH RIGHT GUARD\n"
" ⸸ U+2E38 TURNED DAGGER\n"
" ⸹ U+2E39 TOP HALF SECTION SIGN\n"
"Supplemental Punctuation — Dashes items: 2\n"
" ⸺ U+2E3A TWO-EM DASH\n"
" ⸻ U+2E3B THREE-EM DASH\n"
"Supplemental Punctuation — Alternate forms of punctuation items: 3\n"
" ⸼ U+2E3C STENOGRAPHIC FULL STOP\n"
" ⸽ U+2E3D VERTICAL SIX DOTS\n"
" ⸾ U+2E3E WIGGLY VERTICAL LINE\n"
"Supplemental Punctuation — Double hyphen items: 1\n"
" ⹀ U+2E40 DOUBLE HYPHEN\n"
"Supplemental Punctuation — Reversed punctuation items: 2\n"
" ⹁ U+2E41 REVERSED COMMA\n"
" ⹂ U+2E42 DOUBLE LOW-REVERSED-9 QUOTATION MARK\n"
"Supplemental Punctuation — Miscellaneous punctuation items: 2\n"
" ⹃ U+2E43 DASH WITH LEFT UPTURN\n"
" ⹄ U+2E44 DOUBLE SUSPENSION MARK\n"
"Supplemental Punctuation — Typicon punctuation items: 5\n"
" ⹅ U+2E45 INVERTED LOW KAVYKA\n"
" ⹆ U+2E46 INVERTED LOW KAVYKA WITH KAVYKA ABOVE\n"
" ⹇ U+2E47 LOW KAVYKA\n"
" ⹈ U+2E48 LOW KAVYKA WITH DOT\n"
" ⹉ U+2E49 DOUBLE STACKED COMMA\n"
"CJK Symbols And Punctuation — CJK symbols and punctuation items: 3\n"
" 、 U+3001 IDEOGRAPHIC COMMA\n"
" 。 U+3002 IDEOGRAPHIC FULL STOP\n"
" 〃 U+3003 DITTO MARK\n"
"CJK Symbols And Punctuation — CJK angle brackets items: 4\n"
" 〈 U+3008 LEFT ANGLE BRACKET\n"
" 〉 U+3009 RIGHT ANGLE BRACKET\n"
" 《 U+300A LEFT DOUBLE ANGLE BRACKET\n"
" 》 U+300B RIGHT DOUBLE ANGLE BRACKET\n"
"CJK Symbols And Punctuation — CJK corner brackets items: 4\n"
" 「 U+300C LEFT CORNER BRACKET\n"
" 」 U+300D RIGHT CORNER BRACKET\n"
" 『 U+300E LEFT WHITE CORNER BRACKET\n"
" 』 U+300F RIGHT WHITE CORNER BRACKET\n"
"CJK Symbols And Punctuation — CJK brackets items: 10\n"
" 【 U+3010 LEFT BLACK LENTICULAR BRACKET\n"
" 】 U+3011 RIGHT BLACK LENTICULAR BRACKET\n"
" 〔 U+3014 LEFT TORTOISE SHELL BRACKET\n"
" 〕 U+3015 RIGHT TORTOISE SHELL BRACKET\n"
" 〖 U+3016 LEFT WHITE LENTICULAR BRACKET\n"
" 〗 U+3017 RIGHT WHITE LENTICULAR BRACKET\n"
" 〘 U+3018 LEFT WHITE TORTOISE SHELL BRACKET\n"
" 〙 U+3019 RIGHT WHITE TORTOISE SHELL BRACKET\n"
" 〚 U+301A LEFT WHITE SQUARE BRACKET\n"
" 〛 U+301B RIGHT WHITE SQUARE BRACKET\n"
"CJK Symbols And Punctuation — CJK punctuation items: 6\n"
" 〜 U+301C WAVE DASH\n"
" 〝 U+301D REVERSED DOUBLE PRIME QUOTATION MARK\n"
" 〞 U+301E DOUBLE PRIME QUOTATION MARK\n"
" 〟 U+301F LOW DOUBLE PRIME QUOTATION MARK\n"
" 〰️ U+3030 WAVY DASH\n"
" 〽️ U+303D PART ALTERNATION MARK\n"
"Katakana — Katakana punctuation items: 1\n"
" ゠ U+30A0 KATAKANA-HIRAGANA DOUBLE HYPHEN\n"
"Katakana — Conjunction and length marks items: 1\n"
" ・ U+30FB KATAKANA MIDDLE DOT\n"
"Lisu — Punctuation items: 2\n"
" ꓾ U+A4FE LISU PUNCTUATION COMMA\n"
" ꓿ U+A4FF LISU PUNCTUATION FULL STOP\n"
"Vai — Punctuation items: 3\n"
" ꘍ U+A60D VAI COMMA\n"
" ꘎ U+A60E VAI FULL STOP\n"
" ꘏ U+A60F VAI QUESTION MARK\n"
"Cyrillic Extended B — Punctuation mark items: 2\n"
" ꙳ U+A673 SLAVONIC ASTERISK\n"
" ꙾ U+A67E CYRILLIC KAVYKA\n"
"Bamum — Punctuation items: 6\n"
" ꛲ U+A6F2 BAMUM NJAEMLI\n"
" ꛳ U+A6F3 BAMUM FULL STOP\n"
" ꛴ U+A6F4 BAMUM COLON\n"
" ꛵ U+A6F5 BAMUM COMMA\n"
" ꛶ U+A6F6 BAMUM SEMICOLON\n"
" ꛷ U+A6F7 BAMUM QUESTION MARK\n"
"Phags Pa — Head marks for Tibetan items: 2\n"
" ꡴ U+A874 PHAGS-PA SINGLE HEAD MARK\n"
" ꡵ U+A875 PHAGS-PA DOUBLE HEAD MARK\n"
"Phags Pa — Punctuation for Tibetan items: 2\n"
" ꡶ U+A876 PHAGS-PA MARK SHAD\n"
" ꡷ U+A877 PHAGS-PA MARK DOUBLE SHAD\n"
"Saurashtra — Punctuation items: 2\n"
" ꣎ U+A8CE SAURASHTRA DANDA\n"
" ꣏ U+A8CF SAURASHTRA DOUBLE DANDA\n"
"Devanagari Extended — Editorial marks items: 3\n"
" ꣸ U+A8F8 DEVANAGARI SIGN PUSHPIKA\n"
" ꣹ U+A8F9 DEVANAGARI GAP FILLER\n"
" ꣺ U+A8FA DEVANAGARI CARET\n"
"Devanagari Extended — Sign items: 1\n"
" ꣼ U+A8FC DEVANAGARI SIGN SIDDHAM\n"
"Kayah Li — Punctuation items: 2\n"
" ꤮ U+A92E KAYAH LI SIGN CWI\n"
" ꤯ U+A92F KAYAH LI SIGN SHYA\n"
"Rejang — Punctuation items: 1\n"
" ꥟ U+A95F REJANG SECTION MARK\n"
"Javanese — Punctuation items: 13\n"
" ꧁ U+A9C1 JAVANESE LEFT RERENGGAN\n"
" ꧂ U+A9C2 JAVANESE RIGHT RERENGGAN\n"
" ꧃ U+A9C3 JAVANESE PADA ANDAP\n"
" ꧄ U+A9C4 JAVANESE PADA MADYA\n"
" ꧅ U+A9C5 JAVANESE PADA LUHUR\n"
" ꧆ U+A9C6 JAVANESE PADA WINDU\n"
" ꧇ U+A9C7 JAVANESE PADA PANGKAT\n"
" ꧈ U+A9C8 JAVANESE PADA LINGSA\n"
" ꧉ U+A9C9 JAVANESE PADA LUNGSI\n"
" ꧊ U+A9CA JAVANESE PADA ADEG\n"
" ꧋ U+A9CB JAVANESE PADA ADEG ADEG\n"
" ꧌ U+A9CC JAVANESE PADA PISELEH\n"
" ꧍ U+A9CD JAVANESE TURNED PADA PISELEH\n"
"Javanese — Ellipsis marks items: 2\n"
" ꧞ U+A9DE JAVANESE PADA TIRTA TUMETES\n"
" ꧟ U+A9DF JAVANESE PADA ISEN-ISEN\n"
"Cham — Punctuation items: 4\n"
" ꩜ U+AA5C CHAM PUNCTUATION SPIRAL\n"
" ꩝ U+AA5D CHAM PUNCTUATION DANDA\n"
" ꩞ U+AA5E CHAM PUNCTUATION DOUBLE DANDA\n"
" ꩟ U+AA5F CHAM PUNCTUATION TRIPLE DANDA\n"
"Tai Viet — Punctuation items: 2\n"
" ꫞ U+AADE TAI VIET SYMBOL HO HOI\n"
" ꫟ U+AADF TAI VIET SYMBOL KOI KOI\n"
"Meetei Mayek Extensions — Punctuation items: 2\n"
" ꫰ U+AAF0 MEETEI MAYEK CHEIKHAN\n"
" ꫱ U+AAF1 MEETEI MAYEK AHANG KHUDAM\n"
"Meetei Mayek — Punctuation items: 1\n"
" ꯫ U+ABEB MEETEI MAYEK CHEIKHEI\n"
"Arabic Presentation Forms A — Punctuation items: 2\n"
" ﴾ U+FD3E ORNATE LEFT PARENTHESIS\n"
" ﴿ U+FD3F ORNATE RIGHT PARENTHESIS\n"
"Vertical Forms — Glyphs for vertical variants items: 10\n"
" ︐ U+FE10 PRESENTATION FORM FOR VERTICAL COMMA\n"
" ︑ U+FE11 PRESENTATION FORM FOR VERTICAL IDEOGRAPHIC COMMA\n"
" ︒ U+FE12 PRESENTATION FORM FOR VERTICAL IDEOGRAPHIC FULL STOP\n"
" ︓ U+FE13 PRESENTATION FORM FOR VERTICAL COLON\n"
" ︔ U+FE14 PRESENTATION FORM FOR VERTICAL SEMICOLON\n"
" ︕ U+FE15 PRESENTATION FORM FOR VERTICAL EXCLAMATION MARK\n"
" ︖ U+FE16 PRESENTATION FORM FOR VERTICAL QUESTION MARK\n"
" ︗ U+FE17 PRESENTATION FORM FOR VERTICAL LEFT WHITE LENTICULAR BRACKET\n"
" ︘ U+FE18 PRESENTATION FORM FOR VERTICAL RIGHT WHITE LENTICULAR BRAKCET\n"
" ︙ U+FE19 PRESENTATION FORM FOR VERTICAL HORIZONTAL ELLIPSIS\n"
"CJK Compatibility Forms — Glyphs for vertical variants items: 23\n"
" ︰ U+FE30 PRESENTATION FORM FOR VERTICAL TWO DOT LEADER\n"
" ︱ U+FE31 PRESENTATION FORM FOR VERTICAL EM DASH\n"
" ︲ U+FE32 PRESENTATION FORM FOR VERTICAL EN DASH\n"
" ︳ U+FE33 PRESENTATION FORM FOR VERTICAL LOW LINE\n"
" ︴ U+FE34 PRESENTATION FORM FOR VERTICAL WAVY LOW LINE\n"
" ︵ U+FE35 PRESENTATION FORM FOR VERTICAL LEFT PARENTHESIS\n"
" ︶ U+FE36 PRESENTATION FORM FOR VERTICAL RIGHT PARENTHESIS\n"
" ︷ U+FE37 PRESENTATION FORM FOR VERTICAL LEFT CURLY BRACKET\n"
" ︸ U+FE38 PRESENTATION FORM FOR VERTICAL RIGHT CURLY BRACKET\n"
" ︹ U+FE39 PRESENTATION FORM FOR VERTICAL LEFT TORTOISE SHELL BRACKET\n"
" ︺ U+FE3A PRESENTATION FORM FOR VERTICAL RIGHT TORTOISE SHELL BRACKET\n"
" ︻ U+FE3B PRESENTATION FORM FOR VERTICAL LEFT BLACK LENTICULAR BRACKET\n"
" ︼ U+FE3C PRESENTATION FORM FOR VERTICAL RIGHT BLACK LENTICULAR BRACKET\n"
" ︽ U+FE3D PRESENTATION FORM FOR VERTICAL LEFT DOUBLE ANGLE BRACKET\n"
" ︾ U+FE3E PRESENTATION FORM FOR VERTICAL RIGHT DOUBLE ANGLE BRACKET\n"
" ︿ U+FE3F PRESENTATION FORM FOR VERTICAL LEFT ANGLE BRACKET\n"
" ﹀ U+FE40 PRESENTATION FORM FOR VERTICAL RIGHT ANGLE BRACKET\n"
" ﹁ U+FE41 PRESENTATION FORM FOR VERTICAL LEFT CORNER BRACKET\n"
" ﹂ U+FE42 PRESENTATION FORM FOR VERTICAL RIGHT CORNER BRACKET\n"
" ﹃ U+FE43 PRESENTATION FORM FOR VERTICAL LEFT WHITE CORNER BRACKET\n"
" ﹄ U+FE44 PRESENTATION FORM FOR VERTICAL RIGHT WHITE CORNER BRACKET\n"
" ﹇ U+FE47 PRESENTATION FORM FOR VERTICAL LEFT SQUARE BRACKET\n"
" ﹈ U+FE48 PRESENTATION FORM FOR VERTICAL RIGHT SQUARE BRACKET\n"
"CJK Compatibility Forms — Sidelining emphasis marks items: 2\n"
" ﹅ U+FE45 SESAME DOT\n"
" ﹆ U+FE46 WHITE SESAME DOT\n"
"CJK Compatibility Forms — Overscores and underscores items: 7\n"
" ﹉ U+FE49 DASHED OVERLINE\n"
" ﹊ U+FE4A CENTRELINE OVERLINE\n"
" ﹋ U+FE4B WAVY OVERLINE\n"
" ﹌ U+FE4C DOUBLE WAVY OVERLINE\n"
" ﹍ U+FE4D DASHED LOW LINE\n"
" ﹎ U+FE4E CENTRELINE LOW LINE\n"
" ﹏ U+FE4F WAVY LOW LINE\n"
"Small Form Variants — Small form variants items: 21\n"
" ﹐ U+FE50 SMALL COMMA\n"
" ﹑ U+FE51 SMALL IDEOGRAPHIC COMMA\n"
" ﹒ U+FE52 SMALL FULL STOP\n"
" ﹔ U+FE54 SMALL SEMICOLON\n"
" ﹕ U+FE55 SMALL COLON\n"
" ﹖ U+FE56 SMALL QUESTION MARK\n"
" ﹗ U+FE57 SMALL EXCLAMATION MARK\n"
" ﹘ U+FE58 SMALL EM DASH\n"
" ﹙ U+FE59 SMALL LEFT PARENTHESIS\n"
" ﹚ U+FE5A SMALL RIGHT PARENTHESIS\n"
" ﹛ U+FE5B SMALL LEFT CURLY BRACKET\n"
" ﹜ U+FE5C SMALL RIGHT CURLY BRACKET\n"
" ﹝ U+FE5D SMALL LEFT TORTOISE SHELL BRACKET\n"
" ﹞ U+FE5E SMALL RIGHT TORTOISE SHELL BRACKET\n"
" ﹟ U+FE5F SMALL NUMBER SIGN\n"
" ﹠ U+FE60 SMALL AMPERSAND\n"
" ﹡ U+FE61 SMALL ASTERISK\n"
" ﹣ U+FE63 SMALL HYPHEN-MINUS\n"
" ﹨ U+FE68 SMALL REVERSE SOLIDUS\n"
" ﹪ U+FE6A SMALL PERCENT SIGN\n"
" ﹫ U+FE6B SMALL COMMERCIAL AT\n"
"Halfwidth And Fullwidth Forms — Fullwidth ASCII variants items: 23\n"
" ! U+FF01 FULLWIDTH EXCLAMATION MARK\n"
" " U+FF02 FULLWIDTH QUOTATION MARK\n"
" # U+FF03 FULLWIDTH NUMBER SIGN\n"
" % U+FF05 FULLWIDTH PERCENT SIGN\n"
" & U+FF06 FULLWIDTH AMPERSAND\n"
" ' U+FF07 FULLWIDTH APOSTROPHE\n"
" ( U+FF08 FULLWIDTH LEFT PARENTHESIS\n"
" ) U+FF09 FULLWIDTH RIGHT PARENTHESIS\n"
" * U+FF0A FULLWIDTH ASTERISK\n"
" , U+FF0C FULLWIDTH COMMA\n"
" - U+FF0D FULLWIDTH HYPHEN-MINUS\n"
" . U+FF0E FULLWIDTH FULL STOP\n"
" / U+FF0F FULLWIDTH SOLIDUS\n"
" : U+FF1A FULLWIDTH COLON\n"
" ; U+FF1B FULLWIDTH SEMICOLON\n"
" ? U+FF1F FULLWIDTH QUESTION MARK\n"
" @ U+FF20 FULLWIDTH COMMERCIAL AT\n"
" [ U+FF3B FULLWIDTH LEFT SQUARE BRACKET\n"
" \ U+FF3C FULLWIDTH REVERSE SOLIDUS\n"
" ] U+FF3D FULLWIDTH RIGHT SQUARE BRACKET\n"
" _ U+FF3F FULLWIDTH LOW LINE\n"
" { U+FF5B FULLWIDTH LEFT CURLY BRACKET\n"
" } U+FF5D FULLWIDTH RIGHT CURLY BRACKET\n"
"Halfwidth And Fullwidth Forms — Fullwidth brackets items: 2\n"
" ⦅ U+FF5F FULLWIDTH LEFT WHITE PARENTHESIS\n"
" ⦆ U+FF60 FULLWIDTH RIGHT WHITE PARENTHESIS\n"
"Halfwidth And Fullwidth Forms — Halfwidth CJK punctuation items: 4\n"
" 。 U+FF61 HALFWIDTH IDEOGRAPHIC FULL STOP\n"
" 「 U+FF62 HALFWIDTH LEFT CORNER BRACKET\n"
" 」 U+FF63 HALFWIDTH RIGHT CORNER BRACKET\n"
" 、 U+FF64 HALFWIDTH IDEOGRAPHIC COMMA\n"
"Halfwidth And Fullwidth Forms — Halfwidth Katakana variants items: 1\n"
" ・ U+FF65 HALFWIDTH KATAKANA MIDDLE DOT\n"
"Aegean Numbers — Punctuation items: 3\n"
" 𐄀 U+10100 AEGEAN WORD SEPARATOR LINE\n"
" 𐄁 U+10101 AEGEAN WORD SEPARATOR DOT\n"
" 𐄂 U+10102 AEGEAN CHECK MARK\n"
"Ugaritic — Punctuation items: 1\n"
" 𐎟 U+1039F UGARITIC WORD DIVIDER\n"
"Old Persian — Punctuation items: 1\n"
" 𐏐 U+103D0 OLD PERSIAN WORD DIVIDER\n"
"Caucasian Albanian — Punctuation items: 1\n"
" 𐕯 U+1056F CAUCASIAN ALBANIAN CITATION MARK\n"
"Imperial Aramaic — Punctuation items: 1\n"
" 𐡗 U+10857 IMPERIAL ARAMAIC SECTION SIGN\n"
"Phoenician — Punctuation items: 1\n"
" 𐤟 U+1091F PHOENICIAN WORD SEPARATOR\n"
"Lydian — Punctuation items: 1\n"
" 𐤿 U+1093F LYDIAN TRIANGULAR MARK\n"
"Kharoshthi — Punctuation items: 9\n"
" 𐩐 U+10A50 KHAROSHTHI PUNCTUATION DOT\n"
" 𐩑 U+10A51 KHAROSHTHI PUNCTUATION SMALL CIRCLE\n"
" 𐩒 U+10A52 KHAROSHTHI PUNCTUATION CIRCLE\n"
" 𐩓 U+10A53 KHAROSHTHI PUNCTUATION CRESCENT BAR\n"
" 𐩔 U+10A54 KHAROSHTHI PUNCTUATION MANGALAM\n"
" 𐩕 U+10A55 KHAROSHTHI PUNCTUATION LOTUS\n"
" 𐩖 U+10A56 KHAROSHTHI PUNCTUATION DANDA\n"
" 𐩗 U+10A57 KHAROSHTHI PUNCTUATION DOUBLE DANDA\n"
" 𐩘 U+10A58 KHAROSHTHI PUNCTUATION LINES\n"
"Old South Arabian — Numbers items: 1\n"
" 𐩿 U+10A7F OLD SOUTH ARABIAN NUMERIC INDICATOR\n"
"Manichaean — Punctuation items: 7\n"
" 𐫰 U+10AF0 MANICHAEAN PUNCTUATION STAR\n"
" 𐫱 U+10AF1 MANICHAEAN PUNCTUATION FLEURON\n"
" 𐫲 U+10AF2 MANICHAEAN PUNCTUATION DOUBLE DOT WITHIN DOT\n"
" 𐫳 U+10AF3 MANICHAEAN PUNCTUATION DOT WITHIN DOT\n"
" 𐫴 U+10AF4 MANICHAEAN PUNCTUATION DOT\n"
" 𐫵 U+10AF5 MANICHAEAN PUNCTUATION TWO DOTS\n"
" 𐫶 U+10AF6 MANICHAEAN PUNCTUATION LINE FILLER\n"
"Avestan — Punctuation items: 7\n"
" 𐬹 U+10B39 AVESTAN ABBREVIATION MARK\n"
" 𐬺 U+10B3A TINY TWO DOTS OVER ONE DOT PUNCTUATION\n"
" 𐬻 U+10B3B SMALL TWO DOTS OVER ONE DOT PUNCTUATION\n"
" 𐬼 U+10B3C LARGE TWO DOTS OVER ONE DOT PUNCTUATION\n"
" 𐬽 U+10B3D LARGE ONE DOT OVER TWO DOTS PUNCTUATION\n"
" 𐬾 U+10B3E LARGE TWO RINGS OVER ONE RING PUNCTUATION\n"
" 𐬿 U+10B3F LARGE ONE RING OVER TWO RINGS PUNCTUATION\n"
"Psalter Pahlavi — Punctuation items: 4\n"
" 𐮙 U+10B99 PSALTER PAHLAVI SECTION MARK\n"
" 𐮚 U+10B9A PSALTER PAHLAVI TURNED SECTION MARK\n"
" 𐮛 U+10B9B PSALTER PAHLAVI FOUR DOTS WITH CROSS\n"
" 𐮜 U+10B9C PSALTER PAHLAVI FOUR DOTS WITH DOT\n"
"Sogdian — Punctuation items: 5\n"
" 𐽕 U+10F55 SOGDIAN PUNCTUATION TWO VERTICAL BARS\n"
" 𐽖 U+10F56 SOGDIAN PUNCTUATION TWO VERTICAL BARS WITH DOTS\n"
" 𐽗 U+10F57 SOGDIAN PUNCTUATION CIRCLE WITH DOT\n"
" 𐽘 U+10F58 SOGDIAN PUNCTUATION TWO CIRCLES WITH DOTS\n"
" 𐽙 U+10F59 SOGDIAN PUNCTUATION HALF CIRCLE WITH DOT\n"
"Brahmi — Punctuation items: 7\n"
" 𑁇 U+11047 BRAHMI DANDA\n"
" 𑁈 U+11048 BRAHMI DOUBLE DANDA\n"
" 𑁉 U+11049 BRAHMI PUNCTUATION DOT\n"
" 𑁊 U+1104A BRAHMI PUNCTUATION DOUBLE DOT\n"
" 𑁋 U+1104B BRAHMI PUNCTUATION LINE\n"
" 𑁌 U+1104C BRAHMI PUNCTUATION CRESCENT BAR\n"
" 𑁍 U+1104D BRAHMI PUNCTUATION LOTUS\n"
"Kaithi — Various signs items: 2\n"
" 𑂻 U+110BB KAITHI ABBREVIATION SIGN\n"
" 𑂼 U+110BC KAITHI ENUMERATION SIGN\n"
"Kaithi — Punctuation items: 4\n"
" 𑂾 U+110BE KAITHI SECTION MARK\n"
" 𑂿 U+110BF KAITHI DOUBLE SECTION MARK\n"
" 𑃀 U+110C0 KAITHI DANDA\n"
" 𑃁 U+110C1 KAITHI DOUBLE DANDA\n"
"Chakma — Punctuation items: 4\n"
" 𑅀 U+11140 CHAKMA SECTION MARK\n"
" 𑅁 U+11141 CHAKMA DANDA\n"
" 𑅂 U+11142 CHAKMA DOUBLE DANDA\n"
" 𑅃 U+11143 CHAKMA QUESTION MARK\n"
"Mahajani — Punctuation items: 2\n"
" 𑅴 U+11174 MAHAJANI ABBREVIATION SIGN\n"
" 𑅵 U+11175 MAHAJANI SECTION MARK\n"
"Sharada — Punctuation items: 7\n"
" 𑇅 U+111C5 SHARADA DANDA\n"
" 𑇆 U+111C6 SHARADA DOUBLE DANDA\n"
" 𑇇 U+111C7 SHARADA ABBREVIATION SIGN\n"
" 𑇈 U+111C8 SHARADA SEPARATOR\n"
" 𑇍 U+111CD SHARADA SUTRA MARK\n"
" 𑇛 U+111DB SHARADA SIGN SIDDHAM\n"
" 𑇝 U+111DD SHARADA CONTINUATION SIGN\n"
"Sharada — Section marks items: 2\n"
" 𑇞 U+111DE SHARADA SECTION MARK-1\n"
" 𑇟 U+111DF SHARADA SECTION MARK-2\n"
"Khojki — Punctuation items: 6\n"
" 𑈸 U+11238 KHOJKI DANDA\n"
" 𑈹 U+11239 KHOJKI DOUBLE DANDA\n"
" 𑈺 U+1123A KHOJKI WORD SEPARATOR\n"
" 𑈻 U+1123B KHOJKI SECTION MARK\n"
" 𑈼 U+1123C KHOJKI DOUBLE SECTION MARK\n"
" 𑈽 U+1123D KHOJKI ABBREVIATION SIGN\n"
"Multani — Punctuation items: 1\n"
" 𑊩 U+112A9 MULTANI SECTION MARK\n"
"Newa — Punctuation items: 5\n"
" 𑑋 U+1144B NEWA DANDA\n"
" 𑑌 U+1144C NEWA DOUBLE DANDA\n"
" 𑑍 U+1144D NEWA COMMA\n"
" 𑑎 U+1144E NEWA GAP FILLER\n"
" 𑑏 U+1144F NEWA ABBREVIATION SIGN\n"
"Newa — Various signs items: 2\n"
" 𑑛 U+1145B NEWA PLACEHOLDER MARK\n"
" 𑑝 U+1145D NEWA INSERTION SIGN\n"
"Tirhuta — Various signs items: 1\n"
" 𑓆 U+114C6 TIRHUTA ABBREVIATION SIGN\n"
"Siddham — Head mark items: 1\n"
" 𑗁 U+115C1 SIDDHAM SIGN SIDDHAM\n"
"Siddham — Punctuation items: 4\n"
" 𑗂 U+115C2 SIDDHAM DANDA\n"
" 𑗃 U+115C3 SIDDHAM DOUBLE DANDA\n"
" 𑗄 U+115C4 SIDDHAM SEPARATOR DOT\n"
" 𑗅 U+115C5 SIDDHAM SEPARATOR BAR\n"
"Siddham — Repetition mark items: 3\n"
" 𑗆 U+115C6 SIDDHAM REPETITION MARK-1\n"
" 𑗇 U+115C7 SIDDHAM REPETITION MARK-2\n"
" 𑗈 U+115C8 SIDDHAM REPETITION MARK-3\n"
"Siddham — Terminal mark items: 1\n"
" 𑗉 U+115C9 SIDDHAM END OF TEXT MARK\n"
"Siddham — Section marks items: 14\n"
" 𑗊 U+115CA SIDDHAM SECTION MARK WITH TRIDENT AND U-SHAPED ORNAMENTS\n"
" 𑗋 U+115CB SIDDHAM SECTION MARK WITH TRIDENT AND DOTTED CRESCENTS\n"
" 𑗌 U+115CC SIDDHAM SECTION MARK WITH RAYS AND DOTTED CRESCENTS\n"
" 𑗍 U+115CD SIDDHAM SECTION MARK WITH RAYS AND DOTTED DOUBLE CRESCENTS\n"
" 𑗎 U+115CE SIDDHAM SECTION MARK WITH RAYS AND DOTTED TRIPLE CRESCENTS\n"
" 𑗏 U+115CF SIDDHAM SECTION MARK DOUBLE RING\n"
" 𑗐 U+115D0 SIDDHAM SECTION MARK DOUBLE RING WITH RAYS\n"
" 𑗑 U+115D1 SIDDHAM SECTION MARK WITH DOUBLE CRESCENTS\n"
" 𑗒 U+115D2 SIDDHAM SECTION MARK WITH TRIPLE CRESCENTS\n"
" 𑗓 U+115D3 SIDDHAM SECTION MARK WITH QUADRUPLE CRESCENTS\n"
" 𑗔 U+115D4 SIDDHAM SECTION MARK WITH SEPTUPLE CRESCENTS\n"
" 𑗕 U+115D5 SIDDHAM SECTION MARK WITH CIRCLES AND RAYS\n"
" 𑗖 U+115D6 SIDDHAM SECTION MARK WITH CIRCLES AND TWO ENCLOSURES\n"
" 𑗗 U+115D7 SIDDHAM SECTION MARK WITH CIRCLES AND FOUR ENCLOSURES\n"
"Modi — Punctuation items: 3\n"
" 𑙁 U+11641 MODI DANDA\n"
" 𑙂 U+11642 MODI DOUBLE DANDA\n"
" 𑙃 U+11643 MODI ABBREVIATION SIGN\n"
"Mongolian Supplement — Punctuation items: 13\n"
" 𑙠 U+11660 MONGOLIAN BIRGA WITH ORNAMENT\n"
" 𑙡 U+11661 MONGOLIAN ROTATED BIRGA\n"
" 𑙢 U+11662 MONGOLIAN DOUBLE BIRGA WITH ORNAMENT\n"
" 𑙣 U+11663 MONGOLIAN TRIPLE BIRGA WITH ORNAMENT\n"
" 𑙤 U+11664 MONGOLIAN BIRGA WITH DOUBLE ORNAMENT\n"
" 𑙥 U+11665 MONGOLIAN ROTATED BIRGA WITH ORNAMENT\n"
" 𑙦 U+11666 MONGOLIAN ROTATED BIRGA WITH DOUBLE ORNAMENT\n"
" 𑙧 U+11667 MONGOLIAN INVERTED BIRGA\n"
" 𑙨 U+11668 MONGOLIAN INVERTED BIRGA WITH DOUBLE ORNAMENT\n"
" 𑙩 U+11669 MONGOLIAN SWIRL BIRGA\n"
" 𑙪 U+1166A MONGOLIAN SWIRL BIRGA WITH ORNAMENT\n"
" 𑙫 U+1166B MONGOLIAN SWIRL BIRGA WITH DOUBLE ORNAMENT\n"
" 𑙬 U+1166C MONGOLIAN TURNED SWIRL BIRGA WITH DOUBLE ORNAMENT\n"
"Ahom — Punctuation items: 3\n"
" 𑜼 U+1173C AHOM SIGN SMALL SECTION\n"
" 𑜽 U+1173D AHOM SIGN SECTION\n"
" 𑜾 U+1173E AHOM SIGN RULAI\n"
"Dogra — Punctuation items: 1\n"
" 𑠻 U+1183B DOGRA ABBREVIATION SIGN\n"
"Zanabazar Square — Head mark items: 4\n"
" 𑨿 U+11A3F ZANABAZAR SQUARE INITIAL HEAD MARK\n"
" 𑩀 U+11A40 ZANABAZAR SQUARE CLOSING HEAD MARK\n"
" 𑩅 U+11A45 ZANABAZAR SQUARE INITIAL DOUBLE-LINED HEAD MARK\n"
" 𑩆 U+11A46 ZANABAZAR SQUARE CLOSING DOUBLE-LINED HEAD MARK\n"
"Zanabazar Square — Punctuation items: 4\n"
" 𑩁 U+11A41 ZANABAZAR SQUARE MARK TSHEG\n"
" 𑩂 U+11A42 ZANABAZAR SQUARE MARK SHAD\n"
" 𑩃 U+11A43 ZANABAZAR SQUARE MARK DOUBLE SHAD\n"
" 𑩄 U+11A44 ZANABAZAR SQUARE MARK LONG TSHEG\n"
"Soyombo — Punctuation items: 3\n"
" 𑪚 U+11A9A SOYOMBO MARK TSHEG\n"
" 𑪛 U+11A9B SOYOMBO MARK SHAD\n"
" 𑪜 U+11A9C SOYOMBO MARK DOUBLE SHAD\n"
"Soyombo — Head mark items: 3\n"
" 𑪞 U+11A9E SOYOMBO HEAD MARK WITH MOON AND SUN AND TRIPLE FLAME\n"
" 𑪟 U+11A9F SOYOMBO HEAD MARK WITH MOON AND SUN AND FLAME\n"
" 𑪠 U+11AA0 SOYOMBO HEAD MARK WITH MOON AND SUN\n"
"Soyombo — Terminal mark items: 2\n"
" 𑪡 U+11AA1 SOYOMBO TERMINAL MARK-1\n"
" 𑪢 U+11AA2 SOYOMBO TERMINAL MARK-2\n"
"Bhaiksuki — Punctuation items: 3\n"
" 𑱁 U+11C41 BHAIKSUKI DANDA\n"
" 𑱂 U+11C42 BHAIKSUKI DOUBLE DANDA\n"
" 𑱃 U+11C43 BHAIKSUKI WORD SEPARATOR\n"
"Bhaiksuki — Gap fillers items: 2\n"
" 𑱄 U+11C44 BHAIKSUKI GAP FILLER-1\n"
" 𑱅 U+11C45 BHAIKSUKI GAP FILLER-2\n"
"Marchen — Punctuation items: 2\n"
" 𑱰 U+11C70 MARCHEN HEAD MARK\n"
" 𑱱 U+11C71 MARCHEN MARK SHAD\n"
"Makasar — Punctuation items: 2\n"
" 𑻷 U+11EF7 MAKASAR PASSIMBANG\n"
" 𑻸 U+11EF8 MAKASAR END OF SECTION\n"
"Cuneiform Numbers And Punctuation — Punctuation items: 5\n"
" 𒑰 U+12470 CUNEIFORM PUNCTUATION SIGN OLD ASSYRIAN WORD DIVIDER\n"
" 𒑱 U+12471 CUNEIFORM PUNCTUATION SIGN VERTICAL COLON\n"
" 𒑲 U+12472 CUNEIFORM PUNCTUATION SIGN DIAGONAL COLON\n"
" 𒑳 U+12473 CUNEIFORM PUNCTUATION SIGN DIAGONAL TRICOLON\n"
" 𒑴 U+12474 CUNEIFORM PUNCTUATION SIGN DIAGONAL QUADCOLON\n"
"Mro — Punctuation items: 2\n"
" 𖩮 U+16A6E MRO DANDA\n"
" 𖩯 U+16A6F MRO DOUBLE DANDA\n"
"Bassa Vah — Punctuation items: 1\n"
" 𖫵 U+16AF5 BASSA VAH FULL STOP\n"
"Pahawh Hmong — Punctuation items: 6\n"
" 𖬷 U+16B37 PAHAWH HMONG SIGN VOS THOM\n"
" 𖬸 U+16B38 PAHAWH HMONG SIGN VOS TSHAB CEEB\n"
" 𖬹 U+16B39 PAHAWH HMONG SIGN CIM CHEEM\n"
" 𖬺 U+16B3A PAHAWH HMONG SIGN VOS THIAB\n"
" 𖬻 U+16B3B PAHAWH HMONG SIGN VOS FEEM\n"
" 𖭄 U+16B44 PAHAWH HMONG SIGN XAUS\n"
"Medefaidrin — Punctuation items: 2\n"
" 𖺗 U+16E97 MEDEFAIDRIN COMMA\n"
" 𖺘 U+16E98 MEDEFAIDRIN FULL STOP\n"
"Medefaidrin — Sign items: 2\n"
" 𖺙 U+16E99 MEDEFAIDRIN SYMBOL AIVA\n"
" 𖺚 U+16E9A MEDEFAIDRIN EXCLAMATION OH\n"
"Duployan — Chinook punctuation items: 1\n"
" 𛲟 U+1BC9F DUPLOYAN PUNCTUATION CHINOOK FULL STOP\n"
"Sutton SignWriting — Punctuation items: 5\n"
" 𝪇 U+1DA87 SIGNWRITING COMMA\n"
" 𝪈 U+1DA88 SIGNWRITING FULL STOP\n"
" 𝪉 U+1DA89 SIGNWRITING SEMICOLON\n"
" 𝪊 U+1DA8A SIGNWRITING COLON\n"
" 𝪋 U+1DA8B SIGNWRITING PARENTHESIS\n"
"Adlam — Punctuation items: 2\n"
" 𞥞 U+1E95E ADLAM INITIAL EXCLAMATION MARK\n"
" 𞥟 U+1E95F ADLAM INITIAL QUESTION MARK")
# Scan test_str for every occurrence of regex and report each match,
# followed by any capturing groups that match contains.
# NOTE(review): the pattern spells supplementary-plane characters as UTF-16
# surrogate pairs (\uD800[...], \uD801\uDD6F, ...). Python 3 strings are
# sequences of code points, so those alternatives presumably never match
# the U+1xxxx sample characters -- confirm on the target interpreter.
matches = re.finditer(regex, test_str)

for match_num, match in enumerate(matches, start=1):
    print("Match {matchNum} was found at {start}-{end}: {match}".format(
        matchNum=match_num,
        start=match.start(),
        end=match.end(),
        match=match.group(),
    ))

    # Group 0 is the whole match (already reported above), so capturing
    # groups are numbered from 1 through len(match.groups()).
    for group_num in range(1, len(match.groups()) + 1):
        print("Group {groupNum} found at {start}-{end}: {group}".format(
            groupNum=group_num,
            start=match.start(group_num),
            end=match.end(group_num),
            group=match.group(group_num),
        ))
# Note: for Python 2.7 compatibility, use ur"" to prefix the regex and u"" to prefix the test string and substitution.
# Please keep in mind that these code samples are automatically generated and
# are not guaranteed to work. If you find any syntax errors, feel free to
# submit a bug report. For a full regex reference for Python, please visit:
# https://docs.python.org/3/library/re.html