import java.util.regex.Matcher;
import java.util.regex.Pattern;
public class Example {
public static void main(String[] args) {
final String regex = "(?:[!-#%-\\*,-\\/:;\\?@\\[-\\]_\\{\\}\\xA1\\xA7\\xAB\\xB6\\xB7\\xBB\\xBF\\u037E\\u0387\\u055A-\\u055F\\u0589\\u058A\\u05BE\\u05C0\\u05C3\\u05C6\\u05F3\\u05F4\\u0609\\u060A\\u060C\\u060D\\u061B\\u061E\\u061F\\u066A-\\u066D\\u06D4\\u0700-\\u070D\\u07F7-\\u07F9\\u0830-\\u083E\\u085E\\u0964\\u0965\\u0970\\u09FD\\u0A76\\u0AF0\\u0C84\\u0DF4\\u0E4F\\u0E5A\\u0E5B\\u0F04-\\u0F12\\u0F14\\u0F3A-\\u0F3D\\u0F85\\u0FD0-\\u0FD4\\u0FD9\\u0FDA\\u104A-\\u104F\\u10FB\\u1360-\\u1368\\u1400\\u166D\\u166E\\u169B\\u169C\\u16EB-\\u16ED\\u1735\\u1736\\u17D4-\\u17D6\\u17D8-\\u17DA\\u1800-\\u180A\\u1944\\u1945\\u1A1E\\u1A1F\\u1AA0-\\u1AA6\\u1AA8-\\u1AAD\\u1B5A-\\u1B60\\u1BFC-\\u1BFF\\u1C3B-\\u1C3F\\u1C7E\\u1C7F\\u1CC0-\\u1CC7\\u1CD3\\u2010-\\u2027\\u2030-\\u2043\\u2045-\\u2051\\u2053-\\u205E\\u207D\\u207E\\u208D\\u208E\\u2308-\\u230B\\u2329\\u232A\\u2768-\\u2775\\u27C5\\u27C6\\u27E6-\\u27EF\\u2983-\\u2998\\u29D8-\\u29DB\\u29FC\\u29FD\\u2CF9-\\u2CFC\\u2CFE\\u2CFF\\u2D70\\u2E00-\\u2E2E\\u2E30-\\u2E4E\\u3001-\\u3003\\u3008-\\u3011\\u3014-\\u301F\\u3030\\u303D\\u30A0\\u30FB\\uA4FE\\uA4FF\\uA60D-\\uA60F\\uA673\\uA67E\\uA6F2-\\uA6F7\\uA874-\\uA877\\uA8CE\\uA8CF\\uA8F8-\\uA8FA\\uA8FC\\uA92E\\uA92F\\uA95F\\uA9C1-\\uA9CD\\uA9DE\\uA9DF\\uAA5C-\\uAA5F\\uAADE\\uAADF\\uAAF0\\uAAF1\\uABEB\\uFD3E\\uFD3F\\uFE10-\\uFE19\\uFE30-\\uFE52\\uFE54-\\uFE61\\uFE63\\uFE68\\uFE6A\\uFE6B\\uFF01-\\uFF03\\uFF05-\\uFF0A\\uFF0C-\\uFF0F\\uFF1A\\uFF1B\\uFF1F\\uFF20\\uFF3B-\\uFF3D\\uFF3F\\uFF5B\\uFF5D\\uFF5F-\\uFF65]|\\uD800[\\uDD00-\\uDD02\\uDF9F\\uDFD0]|\\uD801\\uDD6F|\\uD802[\\uDC57\\uDD1F\\uDD3F\\uDE50-\\uDE58\\uDE7F\\uDEF0-\\uDEF6\\uDF39-\\uDF3F\\uDF99-\\uDF9C]|\\uD803[\\uDF55-\\uDF59]|\\uD804[\\uDC47-\\uDC4D\\uDCBB\\uDCBC\\uDCBE-\\uDCC1\\uDD40-\\uDD43\\uDD74\\uDD75\\uDDC5-\\uDDC8\\uDDCD\\uDDDB\\uDDDD-\\uDDDF\\uDE38-\\uDE3D\\uDEA9]|\\uD805[\\uDC4B-\\uDC4F\\uDC5B\\uDC5D\\uDCC6\\uDDC1-\\uDDD7\\uDE41-\\uDE43\\uDE60-\\uDE6C\\uDF3C-\\uDF3E]|\\uD806[\\uDC3B\\uDE3F-\\uDE46\\uDE9A-\\uDE9C\\uDE9E-\\uDEA2]|\\uD807[\\uDC41-\\uDC45\\uDC70\\uDC71\\uDEF7\\uDEF8]|\\uD809[\\uDC70-\\uDC74]|\\uD81A[\\uDE6E\\uDE6F\\uDEF5\\uDF37-\\uDF3B\\uDF44]|\\uD81B[\\uDE97-\\uDE9A]|\\uD82F\\uDC9F|\\uD836[\\uDE87-\\uDE8B]|\\uD83A[\\uDD5E\\uDD5F])";
final String string = "\n"
+ "Basic Latin — ASCII punctuation and symbols items: 23\n"
+ " ! U+0021 EXCLAMATION MARK\n"
+ " \" U+0022 QUOTATION MARK\n"
+ " # U+0023 NUMBER SIGN\n"
+ " % U+0025 PERCENT SIGN\n"
+ " & U+0026 AMPERSAND\n"
+ " ' U+0027 APOSTROPHE\n"
+ " ( U+0028 LEFT PARENTHESIS\n"
+ " ) U+0029 RIGHT PARENTHESIS\n"
+ " * U+002A ASTERISK\n"
+ " , U+002C COMMA\n"
+ " - U+002D HYPHEN-MINUS\n"
+ " . U+002E FULL STOP\n"
+ " / U+002F SOLIDUS\n"
+ " : U+003A COLON\n"
+ " ; U+003B SEMICOLON\n"
+ " ? U+003F QUESTION MARK\n"
+ " @ U+0040 COMMERCIAL AT\n"
+ " [ U+005B LEFT SQUARE BRACKET\n"
+ " \\ U+005C REVERSE SOLIDUS\n"
+ " ] U+005D RIGHT SQUARE BRACKET\n"
+ " _ U+005F LOW LINE\n"
+ " { U+007B LEFT CURLY BRACKET\n"
+ " } U+007D RIGHT CURLY BRACKET\n"
+ "Latin 1 Supplement — Latin-1 punctuation and symbols items: 6\n"
+ " ¡ U+00A1 INVERTED EXCLAMATION MARK\n"
+ " § U+00A7 SECTION SIGN\n"
+ " « U+00AB LEFT-POINTING DOUBLE ANGLE QUOTATION MARK\n"
+ " ¶ U+00B6 PILCROW SIGN\n"
+ " · U+00B7 MIDDLE DOT\n"
+ " » U+00BB RIGHT-POINTING DOUBLE ANGLE QUOTATION MARK\n"
+ "Latin 1 Supplement — Punctuation items: 1\n"
+ " ¿ U+00BF INVERTED QUESTION MARK\n"
+ "Greek And Coptic — Punctuation items: 2\n"
+ " ; U+037E GREEK QUESTION MARK\n"
+ " · U+0387 GREEK ANO TELEIA\n"
+ "Armenian — Modifier letter items: 6\n"
+ " ՚ U+055A ARMENIAN APOSTROPHE\n"
+ " ՛ U+055B ARMENIAN EMPHASIS MARK\n"
+ " ՜ U+055C ARMENIAN EXCLAMATION MARK\n"
+ " ՝ U+055D ARMENIAN COMMA\n"
+ " ՞ U+055E ARMENIAN QUESTION MARK\n"
+ " ՟ U+055F ARMENIAN ABBREVIATION MARK\n"
+ "Armenian — Punctuation items: 2\n"
+ " ։ U+0589 ARMENIAN FULL STOP\n"
+ " ֊ U+058A ARMENIAN HYPHEN\n"
+ "Hebrew — Points and punctuation items: 4\n"
+ " ־ U+05BE HEBREW PUNCTUATION MAQAF\n"
+ " ׀ U+05C0 HEBREW PUNCTUATION PASEQ\n"
+ " ׃ U+05C3 HEBREW PUNCTUATION SOF PASUQ\n"
+ " ׆ U+05C6 HEBREW PUNCTUATION NUN HAFUKHA\n"
+ "Hebrew — Punctuation items: 2\n"
+ " ׳ U+05F3 HEBREW PUNCTUATION GERESH\n"
+ " ״ U+05F4 HEBREW PUNCTUATION GERSHAYIM\n"
+ "Arabic — Punctuation items: 12\n"
+ " ؉ U+0609 ARABIC-INDIC PER MILLE SIGN\n"
+ " ؊ U+060A ARABIC-INDIC PER TEN THOUSAND SIGN\n"
+ " ، U+060C ARABIC COMMA\n"
+ " ؍ U+060D ARABIC DATE SEPARATOR\n"
+ " ؛ U+061B ARABIC SEMICOLON\n"
+ " ؞ U+061E ARABIC TRIPLE DOT PUNCTUATION MARK\n"
+ " ؟ U+061F ARABIC QUESTION MARK\n"
+ " ٪ U+066A ARABIC PERCENT SIGN\n"
+ " ٫ U+066B ARABIC DECIMAL SEPARATOR\n"
+ " ٬ U+066C ARABIC THOUSANDS SEPARATOR\n"
+ " ٭ U+066D ARABIC FIVE POINTED STAR\n"
+ " ۔ U+06D4 ARABIC FULL STOP\n"
+ "Syriac — Syriac punctuation and signs items: 14\n"
+ " ܀ U+0700 SYRIAC END OF PARAGRAPH\n"
+ " ܁ U+0701 SYRIAC SUPRALINEAR FULL STOP\n"
+ " ܂ U+0702 SYRIAC SUBLINEAR FULL STOP\n"
+ " ܃ U+0703 SYRIAC SUPRALINEAR COLON\n"
+ " ܄ U+0704 SYRIAC SUBLINEAR COLON\n"
+ " ܅ U+0705 SYRIAC HORIZONTAL COLON\n"
+ " ܆ U+0706 SYRIAC COLON SKEWED LEFT\n"
+ " ܇ U+0707 SYRIAC COLON SKEWED RIGHT\n"
+ " ܈ U+0708 SYRIAC SUPRALINEAR COLON SKEWED LEFT\n"
+ " ܉ U+0709 SYRIAC SUBLINEAR COLON SKEWED RIGHT\n"
+ " ܊ U+070A SYRIAC CONTRACTION\n"
+ " ܋ U+070B SYRIAC HARKLEAN OBELUS\n"
+ " ܌ U+070C SYRIAC HARKLEAN METOBELUS\n"
+ " ܍ U+070D SYRIAC HARKLEAN ASTERISCUS\n"
+ "NKo — Punctuation items: 3\n"
+ " ߷ U+07F7 NKO SYMBOL GBAKURUNEN\n"
+ " ߸ U+07F8 NKO COMMA\n"
+ " ߹ U+07F9 NKO EXCLAMATION MARK\n"
+ "Samaritan — Punctuation items: 15\n"
+ " ࠰ U+0830 SAMARITAN PUNCTUATION NEQUDAA\n"
+ " ࠱ U+0831 SAMARITAN PUNCTUATION AFSAAQ\n"
+ " ࠲ U+0832 SAMARITAN PUNCTUATION ANGED\n"
+ " ࠳ U+0833 SAMARITAN PUNCTUATION BAU\n"
+ " ࠴ U+0834 SAMARITAN PUNCTUATION ATMAAU\n"
+ " ࠵ U+0835 SAMARITAN PUNCTUATION SHIYYAALAA\n"
+ " ࠶ U+0836 SAMARITAN ABBREVIATION MARK\n"
+ " ࠷ U+0837 SAMARITAN PUNCTUATION MELODIC QITSA\n"
+ " ࠸ U+0838 SAMARITAN PUNCTUATION ZIQAA\n"
+ " ࠹ U+0839 SAMARITAN PUNCTUATION QITSA\n"
+ " ࠺ U+083A SAMARITAN PUNCTUATION ZAEF\n"
+ " ࠻ U+083B SAMARITAN PUNCTUATION TURU\n"
+ " ࠼ U+083C SAMARITAN PUNCTUATION ARKAANU\n"
+ " ࠽ U+083D SAMARITAN PUNCTUATION SOF MASHFAAT\n"
+ " ࠾ U+083E SAMARITAN PUNCTUATION ANNAAU\n"
+ "Mandaic — Punctuation items: 1\n"
+ " ࡞ U+085E MANDAIC PUNCTUATION\n"
+ "Devanagari — Generic punctuation for scripts of India items: 2\n"
+ " । U+0964 DEVANAGARI DANDA\n"
+ " ॥ U+0965 DEVANAGARI DOUBLE DANDA\n"
+ "Devanagari — Abbreviation mark items: 1\n"
+ " ॰ U+0970 DEVANAGARI ABBREVIATION SIGN\n"
+ "Bengali — Sign items: 1\n"
+ " ৽ U+09FD BENGALI ABBREVIATION SIGN\n"
+ "Gurmukhi — Sign items: 1\n"
+ " ੶ U+0A76 GURMUKHI ABBREVIATION SIGN\n"
+ "Gujarati — Abbreviation mark items: 1\n"
+ " ૰ U+0AF0 GUJARATI ABBREVIATION SIGN\n"
+ "Kannada — Various signs items: 1\n"
+ " ಄ U+0C84 KANNADA SIGN SIDDHAM\n"
+ "Sinhala — Punctuation items: 1\n"
+ " ෴ U+0DF4 SINHALA PUNCTUATION KUNDDALIYA\n"
+ "Thai — Sign items: 3\n"
+ " ๏ U+0E4F THAI CHARACTER FONGMAN\n"
+ " ๚ U+0E5A THAI CHARACTER ANGKHANKHU\n"
+ " ๛ U+0E5B THAI CHARACTER KHOMUT\n"
+ "Tibetan — Head mark items: 6\n"
+ " ༄ U+0F04 TIBETAN MARK INITIAL YIG MGO MDUN MA\n"
+ " ༅ U+0F05 TIBETAN MARK CLOSING YIG MGO SGAB MA\n"
+ " ༆ U+0F06 TIBETAN MARK CARET YIG MGO PHUR SHAD MA\n"
+ " ༇ U+0F07 TIBETAN MARK YIG MGO TSHEG SHAD MA\n"
+ " ࿓ U+0FD3 TIBETAN MARK INITIAL BRDA RNYING YIG MGO MDUN MA\n"
+ " ࿔ U+0FD4 TIBETAN MARK CLOSING BRDA RNYING YIG MGO SGAB MA\n"
+ "Tibetan — Sign items: 16\n"
+ " ༈ U+0F08 TIBETAN MARK SBRUL SHAD\n"
+ " ༉ U+0F09 TIBETAN MARK BSKUR YIG MGO\n"
+ " ༊ U+0F0A TIBETAN MARK BKA- SHOG YIG MGO\n"
+ " ་ U+0F0B TIBETAN MARK INTERSYLLABIC TSHEG\n"
+ " ༌ U+0F0C TIBETAN MARK DELIMITER TSHEG BSTAR\n"
+ " ། U+0F0D TIBETAN MARK SHAD\n"
+ " ༎ U+0F0E TIBETAN MARK NYIS SHAD\n"
+ " ༏ U+0F0F TIBETAN MARK TSHEG SHAD\n"
+ " ༐ U+0F10 TIBETAN MARK NYIS TSHEG SHAD\n"
+ " ༑ U+0F11 TIBETAN MARK RIN CHEN SPUNGS SHAD\n"
+ " ༒ U+0F12 TIBETAN MARK RGYA GRAM SHAD\n"
+ " ༔ U+0F14 TIBETAN MARK GTER TSHEG\n"
+ " ྅ U+0F85 TIBETAN MARK PALUTA\n"
+ " ࿐ U+0FD0 TIBETAN MARK BSKA- SHOG GI MGO RGYAN\n"
+ " ࿑ U+0FD1 TIBETAN MARK MNYAM YIG GI MGO RGYAN\n"
+ " ࿒ U+0FD2 TIBETAN MARK NYIS TSHEG\n"
+ "Tibetan — Paired punctuation items: 4\n"
+ " ༺ U+0F3A TIBETAN MARK GUG RTAGS GYON\n"
+ " ༻ U+0F3B TIBETAN MARK GUG RTAGS GYAS\n"
+ " ༼ U+0F3C TIBETAN MARK ANG KHANG GYON\n"
+ " ༽ U+0F3D TIBETAN MARK ANG KHANG GYAS\n"
+ "Tibetan — Annotation marks items: 2\n"
+ " ࿙ U+0FD9 TIBETAN MARK LEADING MCHAN RTAGS\n"
+ " ࿚ U+0FDA TIBETAN MARK TRAILING MCHAN RTAGS\n"
+ "Myanmar — Punctuation items: 2\n"
+ " ၊ U+104A MYANMAR SIGN LITTLE SECTION\n"
+ " ။ U+104B MYANMAR SIGN SECTION\n"
+ "Myanmar — Various signs items: 4\n"
+ " ၌ U+104C MYANMAR SYMBOL LOCATIVE\n"
+ " ၍ U+104D MYANMAR SYMBOL COMPLETED\n"
+ " ၎ U+104E MYANMAR SYMBOL AFOREMENTIONED\n"
+ " ၏ U+104F MYANMAR SYMBOL GENITIVE\n"
+ "Georgian — Punctuation items: 1\n"
+ " ჻ U+10FB GEORGIAN PARAGRAPH SEPARATOR\n"
+ "Ethiopic — Punctuation items: 9\n"
+ " ፠ U+1360 ETHIOPIC SECTION MARK\n"
+ " ፡ U+1361 ETHIOPIC WORDSPACE\n"
+ " ። U+1362 ETHIOPIC FULL STOP\n"
+ " ፣ U+1363 ETHIOPIC COMMA\n"
+ " ፤ U+1364 ETHIOPIC SEMICOLON\n"
+ " ፥ U+1365 ETHIOPIC COLON\n"
+ " ፦ U+1366 ETHIOPIC PREFACE COLON\n"
+ " ፧ U+1367 ETHIOPIC QUESTION MARK\n"
+ " ፨ U+1368 ETHIOPIC PARAGRAPH SEPARATOR\n"
+ "Unified Canadian Aboriginal Syllabics — Punctuation items: 2\n"
+ " ᐀ U+1400 CANADIAN SYLLABICS HYPHEN\n"
+ " ᙮ U+166E CANADIAN SYLLABICS FULL STOP\n"
+ "Unified Canadian Aboriginal Syllabics — Sign items: 1\n"
+ " ᙭ U+166D CANADIAN SYLLABICS CHI SIGN\n"
+ "Ogham — Punctuation items: 2\n"
+ " ᚛ U+169B OGHAM FEATHER MARK\n"
+ " ᚜ U+169C OGHAM REVERSED FEATHER MARK\n"
+ "Runic — Punctuation items: 3\n"
+ " ᛫ U+16EB RUNIC SINGLE PUNCTUATION\n"
+ " ᛬ U+16EC RUNIC MULTIPLE PUNCTUATION\n"
+ " ᛭ U+16ED RUNIC CROSS PUNCTUATION\n"
+ "Hanunoo — Generic punctuation for Philippine scripts items: 2\n"
+ " ᜵ U+1735 PHILIPPINE SINGLE PUNCTUATION\n"
+ " ᜶ U+1736 PHILIPPINE DOUBLE PUNCTUATION\n"
+ "Khmer — Various signs items: 6\n"
+ " ។ U+17D4 KHMER SIGN KHAN\n"
+ " ៕ U+17D5 KHMER SIGN BARIYOOSAN\n"
+ " ៖ U+17D6 KHMER SIGN CAMNUC PII KUUH\n"
+ " ៘ U+17D8 KHMER SIGN BEYYAL\n"
+ " ៙ U+17D9 KHMER SIGN PHNAEK MUAN\n"
+ " ៚ U+17DA KHMER SIGN KOOMUUT\n"
+ "Mongolian — Punctuation items: 11\n"
+ " ᠀ U+1800 MONGOLIAN BIRGA\n"
+ " ᠁ U+1801 MONGOLIAN ELLIPSIS\n"
+ " ᠂ U+1802 MONGOLIAN COMMA\n"
+ " ᠃ U+1803 MONGOLIAN FULL STOP\n"
+ " ᠄ U+1804 MONGOLIAN COLON\n"
+ " ᠅ U+1805 MONGOLIAN FOUR DOTS\n"
+ " ᠆ U+1806 MONGOLIAN TODO SOFT HYPHEN\n"
+ " ᠇ U+1807 MONGOLIAN SIBE SYLLABLE BOUNDARY MARKER\n"
+ " ᠈ U+1808 MONGOLIAN MANCHU COMMA\n"
+ " ᠉ U+1809 MONGOLIAN MANCHU FULL STOP\n"
+ " ᠊ U+180A MONGOLIAN NIRUGU\n"
+ "Limbu — Various signs items: 2\n"
+ " ᥄ U+1944 LIMBU EXCLAMATION MARK\n"
+ " ᥅ U+1945 LIMBU QUESTION MARK\n"
+ "Buginese — Various signs items: 2\n"
+ " ᨞ U+1A1E BUGINESE PALLAWA\n"
+ " ᨟ U+1A1F BUGINESE END OF SECTION\n"
+ "Tai Tham — Logographs items: 3\n"
+ " ᪠ U+1AA0 TAI THAM SIGN WIANG\n"
+ " ᪡ U+1AA1 TAI THAM SIGN WIANGWAAK\n"
+ " ᪢ U+1AA2 TAI THAM SIGN SAWAN\n"
+ "Tai Tham — Punctuation items: 10\n"
+ " ᪣ U+1AA3 TAI THAM SIGN KEOW\n"
+ " ᪤ U+1AA4 TAI THAM SIGN HOY\n"
+ " ᪥ U+1AA5 TAI THAM SIGN DOKMAI\n"
+ " ᪦ U+1AA6 TAI THAM SIGN REVERSED ROTATED RANA\n"
+ " ᪨ U+1AA8 TAI THAM SIGN KAAN\n"
+ " ᪩ U+1AA9 TAI THAM SIGN KAANKUU\n"
+ " ᪪ U+1AAA TAI THAM SIGN SATKAAN\n"
+ " ᪫ U+1AAB TAI THAM SIGN SATKAANKUU\n"
+ " ᪬ U+1AAC TAI THAM SIGN HANG\n"
+ " ᪭ U+1AAD TAI THAM SIGN CAANG\n"
+ "Balinese — Punctuation items: 7\n"
+ " ᭚ U+1B5A BALINESE PANTI\n"
+ " ᭛ U+1B5B BALINESE PAMADA\n"
+ " ᭜ U+1B5C BALINESE WINDU\n"
+ " ᭝ U+1B5D BALINESE CARIK PAMUNGKAH\n"
+ " ᭞ U+1B5E BALINESE CARIK SIKI\n"
+ " ᭟ U+1B5F BALINESE CARIK PAREREN\n"
+ " ᭠ U+1B60 BALINESE PAMENENG\n"
+ "Batak — Punctuation items: 4\n"
+ " ᯼ U+1BFC BATAK SYMBOL BINDU NA METEK\n"
+ " ᯽ U+1BFD BATAK SYMBOL BINDU PINARBORAS\n"
+ " ᯾ U+1BFE BATAK SYMBOL BINDU JUDUL\n"
+ " ᯿ U+1BFF BATAK SYMBOL BINDU PANGOLAT\n"
+ "Lepcha — Punctuation items: 5\n"
+ " ᰻ U+1C3B LEPCHA PUNCTUATION TA-ROL\n"
+ " ᰼ U+1C3C LEPCHA PUNCTUATION NYET THYOOM TA-ROL\n"
+ " ᰽ U+1C3D LEPCHA PUNCTUATION CER-WA\n"
+ " ᰾ U+1C3E LEPCHA PUNCTUATION TSHOOK CER-WA\n"
+ " ᰿ U+1C3F LEPCHA PUNCTUATION TSHOOK\n"
+ "Ol Chiki — Punctuation items: 2\n"
+ " ᱾ U+1C7E OL CHIKI PUNCTUATION MUCAAD\n"
+ " ᱿ U+1C7F OL CHIKI PUNCTUATION DOUBLE MUCAAD\n"
+ "Sundanese Supplement — Punctuation items: 8\n"
+ " ᳀ U+1CC0 SUNDANESE PUNCTUATION BINDU SURYA\n"
+ " ᳁ U+1CC1 SUNDANESE PUNCTUATION BINDU PANGLONG\n"
+ " ᳂ U+1CC2 SUNDANESE PUNCTUATION BINDU PURNAMA\n"
+ " ᳃ U+1CC3 SUNDANESE PUNCTUATION BINDU CAKRA\n"
+ " ᳄ U+1CC4 SUNDANESE PUNCTUATION BINDU LEU SATANGA\n"
+ " ᳅ U+1CC5 SUNDANESE PUNCTUATION BINDU KA SATANGA\n"
+ " ᳆ U+1CC6 SUNDANESE PUNCTUATION BINDU DA SATANGA\n"
+ " ᳇ U+1CC7 SUNDANESE PUNCTUATION BINDU BA SATANGA\n"
+ "Vedic Extensions — Breathing mark for the Samaveda items: 1\n"
+ " ᳓ U+1CD3 VEDIC SIGN NIHSHVASA\n"
+ "General Punctuation — Dashes items: 6\n"
+ " ‐ U+2010 HYPHEN\n"
+ " ‑ U+2011 NON-BREAKING HYPHEN\n"
+ " ‒ U+2012 FIGURE DASH\n"
+ " – U+2013 EN DASH\n"
+ " — U+2014 EM DASH\n"
+ " ― U+2015 HORIZONTAL BAR\n"
+ "General Punctuation — General punctuation items: 39\n"
+ " ‖ U+2016 DOUBLE VERTICAL LINE\n"
+ " ‗ U+2017 DOUBLE LOW LINE\n"
+ " † U+2020 DAGGER\n"
+ " ‡ U+2021 DOUBLE DAGGER\n"
+ " • U+2022 BULLET\n"
+ " ‣ U+2023 TRIANGULAR BULLET\n"
+ " ․ U+2024 ONE DOT LEADER\n"
+ " ‥ U+2025 TWO DOT LEADER\n"
+ " … U+2026 HORIZONTAL ELLIPSIS\n"
+ " ‧ U+2027 HYPHENATION POINT\n"
+ " ‰ U+2030 PER MILLE SIGN\n"
+ " ‱ U+2031 PER TEN THOUSAND SIGN\n"
+ " ′ U+2032 PRIME\n"
+ " ″ U+2033 DOUBLE PRIME\n"
+ " ‴ U+2034 TRIPLE PRIME\n"
+ " ‵ U+2035 REVERSED PRIME\n"
+ " ‶ U+2036 REVERSED DOUBLE PRIME\n"
+ " ‷ U+2037 REVERSED TRIPLE PRIME\n"
+ " ‸ U+2038 CARET\n"
+ " ※ U+203B REFERENCE MARK\n"
+ " ‽ U+203D INTERROBANG\n"
+ " ‾ U+203E OVERLINE\n"
+ " ‿ U+203F UNDERTIE\n"
+ " ⁀ U+2040 CHARACTER TIE\n"
+ " ⁁ U+2041 CARET INSERTION POINT\n"
+ " ⁂ U+2042 ASTERISM\n"
+ " ⁃ U+2043 HYPHEN BULLET\n"
+ " ⁊ U+204A TIRONIAN SIGN ET\n"
+ " ⁋ U+204B REVERSED PILCROW SIGN\n"
+ " ⁌ U+204C BLACK LEFTWARDS BULLET\n"
+ " ⁍ U+204D BLACK RIGHTWARDS BULLET\n"
+ " ⁎ U+204E LOW ASTERISK\n"
+ " ⁏ U+204F REVERSED SEMICOLON\n"
+ " ⁐ U+2050 CLOSE UP\n"
+ " ⁑ U+2051 TWO ASTERISKS ALIGNED VERTICALLY\n"
+ " ⁓ U+2053 SWUNG DASH\n"
+ " ⁔ U+2054 INVERTED UNDERTIE\n"
+ " ⁕ U+2055 FLOWER PUNCTUATION MARK\n"
+ " ⁗ U+2057 QUADRUPLE PRIME\n"
+ "General Punctuation — Quotation marks and apostrophe items: 8\n"
+ " ‘ U+2018 LEFT SINGLE QUOTATION MARK\n"
+ " ’ U+2019 RIGHT SINGLE QUOTATION MARK\n"
+ " ‚ U+201A SINGLE LOW-9 QUOTATION MARK\n"
+ " ‛ U+201B SINGLE HIGH-REVERSED-9 QUOTATION MARK\n"
+ " “ U+201C LEFT DOUBLE QUOTATION MARK\n"
+ " ” U+201D RIGHT DOUBLE QUOTATION MARK\n"
+ " „ U+201E DOUBLE LOW-9 QUOTATION MARK\n"
+ " ‟ U+201F DOUBLE HIGH-REVERSED-9 QUOTATION MARK\n"
+ "General Punctuation — Quotation marks items: 2\n"
+ " ‹ U+2039 SINGLE LEFT-POINTING ANGLE QUOTATION MARK\n"
+ " › U+203A SINGLE RIGHT-POINTING ANGLE QUOTATION MARK\n"
+ "General Punctuation — Double punctuation for vertical text items: 4\n"
+ " ‼️ U+203C DOUBLE EXCLAMATION MARK\n"
+ " ⁇ U+2047 DOUBLE QUESTION MARK\n"
+ " ⁈ U+2048 QUESTION EXCLAMATION MARK\n"
+ " ⁉️ U+2049 EXCLAMATION QUESTION MARK\n"
+ "General Punctuation — Brackets items: 2\n"
+ " ⁅ U+2045 LEFT SQUARE BRACKET WITH QUILL\n"
+ " ⁆ U+2046 RIGHT SQUARE BRACKET WITH QUILL\n"
+ "General Punctuation — Archaic punctuation items: 8\n"
+ " ⁖ U+2056 THREE DOT PUNCTUATION\n"
+ " ⁘ U+2058 FOUR DOT PUNCTUATION\n"
+ " ⁙ U+2059 FIVE DOT PUNCTUATION\n"
+ " ⁚ U+205A TWO DOT PUNCTUATION\n"
+ " ⁛ U+205B FOUR DOT MARK\n"
+ " ⁜ U+205C DOTTED CROSS\n"
+ " ⁝ U+205D TRICOLON\n"
+ " ⁞ U+205E VERTICAL FOUR DOTS\n"
+ "Superscripts And Subscripts — Superscripts items: 2\n"
+ " ⁽ U+207D SUPERSCRIPT LEFT PARENTHESIS\n"
+ " ⁾ U+207E SUPERSCRIPT RIGHT PARENTHESIS\n"
+ "Superscripts And Subscripts — Subscripts items: 2\n"
+ " ₍ U+208D SUBSCRIPT LEFT PARENTHESIS\n"
+ " ₎ U+208E SUBSCRIPT RIGHT PARENTHESIS\n"
+ "Miscellaneous Technical — Ceilings and floors items: 4\n"
+ " ⌈ U+2308 LEFT CEILING\n"
+ " ⌉ U+2309 RIGHT CEILING\n"
+ " ⌊ U+230A LEFT FLOOR\n"
+ " ⌋ U+230B RIGHT FLOOR\n"
+ "Miscellaneous Technical — Deprecated angle brackets items: 2\n"
+ " 〈 U+2329 LEFT-POINTING ANGLE BRACKET\n"
+ " 〉 U+232A RIGHT-POINTING ANGLE BRACKET\n"
+ "Dingbats — Ornamental brackets items: 14\n"
+ " ❨ U+2768 MEDIUM LEFT PARENTHESIS ORNAMENT\n"
+ " ❩ U+2769 MEDIUM RIGHT PARENTHESIS ORNAMENT\n"
+ " ❪ U+276A MEDIUM FLATTENED LEFT PARENTHESIS ORNAMENT\n"
+ " ❫ U+276B MEDIUM FLATTENED RIGHT PARENTHESIS ORNAMENT\n"
+ " ❬ U+276C MEDIUM LEFT-POINTING ANGLE BRACKET ORNAMENT\n"
+ " ❭ U+276D MEDIUM RIGHT-POINTING ANGLE BRACKET ORNAMENT\n"
+ " ❮ U+276E HEAVY LEFT-POINTING ANGLE QUOTATION MARK ORNAMENT\n"
+ " ❯ U+276F HEAVY RIGHT-POINTING ANGLE QUOTATION MARK ORNAMENT\n"
+ " ❰ U+2770 HEAVY LEFT-POINTING ANGLE BRACKET ORNAMENT\n"
+ " ❱ U+2771 HEAVY RIGHT-POINTING ANGLE BRACKET ORNAMENT\n"
+ " ❲ U+2772 LIGHT LEFT TORTOISE SHELL BRACKET ORNAMENT\n"
+ " ❳ U+2773 LIGHT RIGHT TORTOISE SHELL BRACKET ORNAMENT\n"
+ " ❴ U+2774 MEDIUM LEFT CURLY BRACKET ORNAMENT\n"
+ " ❵ U+2775 MEDIUM RIGHT CURLY BRACKET ORNAMENT\n"
+ "Miscellaneous Mathematical Symbols A — Paired punctuation items: 2\n"
+ " ⟅ U+27C5 LEFT S-SHAPED BAG DELIMITER\n"
+ " ⟆ U+27C6 RIGHT S-SHAPED BAG DELIMITER\n"
+ "Miscellaneous Mathematical Symbols A — Mathematical brackets items: 10\n"
+ " ⟦ U+27E6 MATHEMATICAL LEFT WHITE SQUARE BRACKET\n"
+ " ⟧ U+27E7 MATHEMATICAL RIGHT WHITE SQUARE BRACKET\n"
+ " ⟨ U+27E8 MATHEMATICAL LEFT ANGLE BRACKET\n"
+ " ⟩ U+27E9 MATHEMATICAL RIGHT ANGLE BRACKET\n"
+ " ⟪ U+27EA MATHEMATICAL LEFT DOUBLE ANGLE BRACKET\n"
+ " ⟫ U+27EB MATHEMATICAL RIGHT DOUBLE ANGLE BRACKET\n"
+ " ⟬ U+27EC MATHEMATICAL LEFT WHITE TORTOISE SHELL BRACKET\n"
+ " ⟭ U+27ED MATHEMATICAL RIGHT WHITE TORTOISE SHELL BRACKET\n"
+ " ⟮ U+27EE MATHEMATICAL LEFT FLATTENED PARENTHESIS\n"
+ " ⟯ U+27EF MATHEMATICAL RIGHT FLATTENED PARENTHESIS\n"
+ "Miscellaneous Mathematical Symbols B — Brackets items: 20\n"
+ " ⦃ U+2983 LEFT WHITE CURLY BRACKET\n"
+ " ⦄ U+2984 RIGHT WHITE CURLY BRACKET\n"
+ " ⦅ U+2985 LEFT WHITE PARENTHESIS\n"
+ " ⦆ U+2986 RIGHT WHITE PARENTHESIS\n"
+ " ⦇ U+2987 Z NOTATION LEFT IMAGE BRACKET\n"
+ " ⦈ U+2988 Z NOTATION RIGHT IMAGE BRACKET\n"
+ " ⦉ U+2989 Z NOTATION LEFT BINDING BRACKET\n"
+ " ⦊ U+298A Z NOTATION RIGHT BINDING BRACKET\n"
+ " ⦋ U+298B LEFT SQUARE BRACKET WITH UNDERBAR\n"
+ " ⦌ U+298C RIGHT SQUARE BRACKET WITH UNDERBAR\n"
+ " ⦑ U+2991 LEFT ANGLE BRACKET WITH DOT\n"
+ " ⦒ U+2992 RIGHT ANGLE BRACKET WITH DOT\n"
+ " ⦓ U+2993 LEFT ARC LESS-THAN BRACKET\n"
+ " ⦔ U+2994 RIGHT ARC GREATER-THAN BRACKET\n"
+ " ⦕ U+2995 DOUBLE LEFT ARC GREATER-THAN BRACKET\n"
+ " ⦖ U+2996 DOUBLE RIGHT ARC LESS-THAN BRACKET\n"
+ " ⦗ U+2997 LEFT BLACK TORTOISE SHELL BRACKET\n"
+ " ⦘ U+2998 RIGHT BLACK TORTOISE SHELL BRACKET\n"
+ " ⧼ U+29FC LEFT-POINTING CURVED ANGLE BRACKET\n"
+ " ⧽ U+29FD RIGHT-POINTING CURVED ANGLE BRACKET\n"
+ "Miscellaneous Mathematical Symbols B — Brackets with ticks items: 4\n"
+ " ⦍ U+298D LEFT SQUARE BRACKET WITH TICK IN TOP CORNER\n"
+ " ⦎ U+298E RIGHT SQUARE BRACKET WITH TICK IN BOTTOM CORNER\n"
+ " ⦏ U+298F LEFT SQUARE BRACKET WITH TICK IN BOTTOM CORNER\n"
+ " ⦐ U+2990 RIGHT SQUARE BRACKET WITH TICK IN TOP CORNER\n"
+ "Miscellaneous Mathematical Symbols B — Fences items: 4\n"
+ " ⧘ U+29D8 LEFT WIGGLY FENCE\n"
+ " ⧙ U+29D9 RIGHT WIGGLY FENCE\n"
+ " ⧚ U+29DA LEFT DOUBLE WIGGLY FENCE\n"
+ " ⧛ U+29DB RIGHT DOUBLE WIGGLY FENCE\n"
+ "Coptic — Old Nubian punctuation items: 4\n"
+ " ⳹ U+2CF9 COPTIC OLD NUBIAN FULL STOP\n"
+ " ⳺ U+2CFA COPTIC OLD NUBIAN DIRECT QUESTION MARK\n"
+ " ⳻ U+2CFB COPTIC OLD NUBIAN INDIRECT QUESTION MARK\n"
+ " ⳼ U+2CFC COPTIC OLD NUBIAN VERSE DIVIDER\n"
+ "Coptic — Punctuation items: 2\n"
+ " ⳾ U+2CFE COPTIC FULL STOP\n"
+ " ⳿ U+2CFF COPTIC MORPHOLOGICAL DIVIDER\n"
+ "Tifinagh — Punctuation items: 1\n"
+ " ⵰ U+2D70 TIFINAGH SEPARATOR MARK\n"
+ "Supplemental Punctuation — New Testament editorial symbols items: 14\n"
+ " ⸀ U+2E00 RIGHT ANGLE SUBSTITUTION MARKER\n"
+ " ⸁ U+2E01 RIGHT ANGLE DOTTED SUBSTITUTION MARKER\n"
+ " ⸂ U+2E02 LEFT SUBSTITUTION BRACKET\n"
+ " ⸃ U+2E03 RIGHT SUBSTITUTION BRACKET\n"
+ " ⸄ U+2E04 LEFT DOTTED SUBSTITUTION BRACKET\n"
+ " ⸅ U+2E05 RIGHT DOTTED SUBSTITUTION BRACKET\n"
+ " ⸆ U+2E06 RAISED INTERPOLATION MARKER\n"
+ " ⸇ U+2E07 RAISED DOTTED INTERPOLATION MARKER\n"
+ " ⸈ U+2E08 DOTTED TRANSPOSITION MARKER\n"
+ " ⸉ U+2E09 LEFT TRANSPOSITION BRACKET\n"
+ " ⸊ U+2E0A RIGHT TRANSPOSITION BRACKET\n"
+ " ⸋ U+2E0B RAISED SQUARE\n"
+ " ⸌ U+2E0C LEFT RAISED OMISSION BRACKET\n"
+ " ⸍ U+2E0D RIGHT RAISED OMISSION BRACKET\n"
+ "Supplemental Punctuation — Ancient Greek textual symbols items: 9\n"
+ " ⸎ U+2E0E EDITORIAL CORONIS\n"
+ " ⸏ U+2E0F PARAGRAPHOS\n"
+ " ⸐ U+2E10 FORKED PARAGRAPHOS\n"
+ " ⸑ U+2E11 REVERSED FORKED PARAGRAPHOS\n"
+ " ⸒ U+2E12 HYPODIASTOLE\n"
+ " ⸓ U+2E13 DOTTED OBELOS\n"
+ " ⸔ U+2E14 DOWNWARDS ANCORA\n"
+ " ⸕ U+2E15 UPWARDS ANCORA\n"
+ " ⸖ U+2E16 DOTTED RIGHT-POINTING ANGLE\n"
+ "Supplemental Punctuation — Ancient Near-Eastern linguistic symbol items: 1\n"
+ " ⸗ U+2E17 DOUBLE OBLIQUE HYPHEN\n"
+ "Supplemental Punctuation — General punctuation items: 2\n"
+ " ⸘ U+2E18 INVERTED INTERROBANG\n"
+ " ⸙ U+2E19 PALM BRANCH\n"
+ "Supplemental Punctuation — Dictionary punctuation items: 4\n"
+ " ⸚ U+2E1A HYPHEN WITH DIAERESIS\n"
+ " ⸛ U+2E1B TILDE WITH RING ABOVE\n"
+ " ⸞ U+2E1E TILDE WITH DOT ABOVE\n"
+ " ⸟ U+2E1F TILDE WITH DOT BELOW\n"
+ "Supplemental Punctuation — Brackets items: 8\n"
+ " ⸜ U+2E1C LEFT LOW PARAPHRASE BRACKET\n"
+ " ⸝ U+2E1D RIGHT LOW PARAPHRASE BRACKET\n"
+ " ⸠ U+2E20 LEFT VERTICAL BAR WITH QUILL\n"
+ " ⸡ U+2E21 RIGHT VERTICAL BAR WITH QUILL\n"
+ " ⸦ U+2E26 LEFT SIDEWAYS U BRACKET\n"
+ " ⸧ U+2E27 RIGHT SIDEWAYS U BRACKET\n"
+ " ⸨ U+2E28 LEFT DOUBLE PARENTHESIS\n"
+ " ⸩ U+2E29 RIGHT DOUBLE PARENTHESIS\n"
+ "Supplemental Punctuation — Half brackets items: 4\n"
+ " ⸢ U+2E22 TOP LEFT HALF BRACKET\n"
+ " ⸣ U+2E23 TOP RIGHT HALF BRACKET\n"
+ " ⸤ U+2E24 BOTTOM LEFT HALF BRACKET\n"
+ " ⸥ U+2E25 BOTTOM RIGHT HALF BRACKET\n"
+ "Supplemental Punctuation — Archaic punctuation items: 15\n"
+ " ⸪ U+2E2A TWO DOTS OVER ONE DOT PUNCTUATION\n"
+ " ⸫ U+2E2B ONE DOT OVER TWO DOTS PUNCTUATION\n"
+ " ⸬ U+2E2C SQUARED FOUR DOT PUNCTUATION\n"
+ " ⸭ U+2E2D FIVE DOT MARK\n"
+ " ⸮ U+2E2E REVERSED QUESTION MARK\n"
+ " ⸰ U+2E30 RING POINT\n"
+ " ⸱ U+2E31 WORD SEPARATOR MIDDLE DOT\n"
+ " ⸳ U+2E33 RAISED DOT\n"
+ " ⸴ U+2E34 RAISED COMMA\n"
+ " ⸿ U+2E3F CAPITULUM\n"
+ " ⹊ U+2E4A DOTTED SOLIDUS\n"
+ " ⹋ U+2E4B TRIPLE DAGGER\n"
+ " ⹌ U+2E4C MEDIEVAL COMMA\n"
+ " ⹍ U+2E4D PARAGRAPHUS MARK\n"
+ " ⹎ U+2E4E PUNCTUS ELEVATUS MARK\n"
+ "Supplemental Punctuation — Palaeotype transliteration symbol items: 6\n"
+ " ⸲ U+2E32 TURNED COMMA\n"
+ " ⸵ U+2E35 TURNED SEMICOLON\n"
+ " ⸶ U+2E36 DAGGER WITH LEFT GUARD\n"
+ " ⸷ U+2E37 DAGGER WITH RIGHT GUARD\n"
+ " ⸸ U+2E38 TURNED DAGGER\n"
+ " ⸹ U+2E39 TOP HALF SECTION SIGN\n"
+ "Supplemental Punctuation — Dashes items: 2\n"
+ " ⸺ U+2E3A TWO-EM DASH\n"
+ " ⸻ U+2E3B THREE-EM DASH\n"
+ "Supplemental Punctuation — Alternate forms of punctuation items: 3\n"
+ " ⸼ U+2E3C STENOGRAPHIC FULL STOP\n"
+ " ⸽ U+2E3D VERTICAL SIX DOTS\n"
+ " ⸾ U+2E3E WIGGLY VERTICAL LINE\n"
+ "Supplemental Punctuation — Double hyphen items: 1\n"
+ " ⹀ U+2E40 DOUBLE HYPHEN\n"
+ "Supplemental Punctuation — Reversed punctuation items: 2\n"
+ " ⹁ U+2E41 REVERSED COMMA\n"
+ " ⹂ U+2E42 DOUBLE LOW-REVERSED-9 QUOTATION MARK\n"
+ "Supplemental Punctuation — Miscellaneous punctuation items: 2\n"
+ " ⹃ U+2E43 DASH WITH LEFT UPTURN\n"
+ " ⹄ U+2E44 DOUBLE SUSPENSION MARK\n"
+ "Supplemental Punctuation — Typicon punctuation items: 5\n"
+ " ⹅ U+2E45 INVERTED LOW KAVYKA\n"
+ " ⹆ U+2E46 INVERTED LOW KAVYKA WITH KAVYKA ABOVE\n"
+ " ⹇ U+2E47 LOW KAVYKA\n"
+ " ⹈ U+2E48 LOW KAVYKA WITH DOT\n"
+ " ⹉ U+2E49 DOUBLE STACKED COMMA\n"
+ "CJK Symbols And Punctuation — CJK symbols and punctuation items: 3\n"
+ " 、 U+3001 IDEOGRAPHIC COMMA\n"
+ " 。 U+3002 IDEOGRAPHIC FULL STOP\n"
+ " 〃 U+3003 DITTO MARK\n"
+ "CJK Symbols And Punctuation — CJK angle brackets items: 4\n"
+ " 〈 U+3008 LEFT ANGLE BRACKET\n"
+ " 〉 U+3009 RIGHT ANGLE BRACKET\n"
+ " 《 U+300A LEFT DOUBLE ANGLE BRACKET\n"
+ " 》 U+300B RIGHT DOUBLE ANGLE BRACKET\n"
+ "CJK Symbols And Punctuation — CJK corner brackets items: 4\n"
+ " 「 U+300C LEFT CORNER BRACKET\n"
+ " 」 U+300D RIGHT CORNER BRACKET\n"
+ " 『 U+300E LEFT WHITE CORNER BRACKET\n"
+ " 』 U+300F RIGHT WHITE CORNER BRACKET\n"
+ "CJK Symbols And Punctuation — CJK brackets items: 10\n"
+ " 【 U+3010 LEFT BLACK LENTICULAR BRACKET\n"
+ " 】 U+3011 RIGHT BLACK LENTICULAR BRACKET\n"
+ " 〔 U+3014 LEFT TORTOISE SHELL BRACKET\n"
+ " 〕 U+3015 RIGHT TORTOISE SHELL BRACKET\n"
+ " 〖 U+3016 LEFT WHITE LENTICULAR BRACKET\n"
+ " 〗 U+3017 RIGHT WHITE LENTICULAR BRACKET\n"
+ " 〘 U+3018 LEFT WHITE TORTOISE SHELL BRACKET\n"
+ " 〙 U+3019 RIGHT WHITE TORTOISE SHELL BRACKET\n"
+ " 〚 U+301A LEFT WHITE SQUARE BRACKET\n"
+ " 〛 U+301B RIGHT WHITE SQUARE BRACKET\n"
+ "CJK Symbols And Punctuation — CJK punctuation items: 6\n"
+ " 〜 U+301C WAVE DASH\n"
+ " 〝 U+301D REVERSED DOUBLE PRIME QUOTATION MARK\n"
+ " 〞 U+301E DOUBLE PRIME QUOTATION MARK\n"
+ " 〟 U+301F LOW DOUBLE PRIME QUOTATION MARK\n"
+ " 〰️ U+3030 WAVY DASH\n"
+ " 〽️ U+303D PART ALTERNATION MARK\n"
+ "Katakana — Katakana punctuation items: 1\n"
+ " ゠ U+30A0 KATAKANA-HIRAGANA DOUBLE HYPHEN\n"
+ "Katakana — Conjunction and length marks items: 1\n"
+ " ・ U+30FB KATAKANA MIDDLE DOT\n"
+ "Lisu — Punctuation items: 2\n"
+ " ꓾ U+A4FE LISU PUNCTUATION COMMA\n"
+ " ꓿ U+A4FF LISU PUNCTUATION FULL STOP\n"
+ "Vai — Punctuation items: 3\n"
+ " ꘍ U+A60D VAI COMMA\n"
+ " ꘎ U+A60E VAI FULL STOP\n"
+ " ꘏ U+A60F VAI QUESTION MARK\n"
+ "Cyrillic Extended B — Punctuation mark items: 2\n"
+ " ꙳ U+A673 SLAVONIC ASTERISK\n"
+ " ꙾ U+A67E CYRILLIC KAVYKA\n"
+ "Bamum — Punctuation items: 6\n"
+ " ꛲ U+A6F2 BAMUM NJAEMLI\n"
+ " ꛳ U+A6F3 BAMUM FULL STOP\n"
+ " ꛴ U+A6F4 BAMUM COLON\n"
+ " ꛵ U+A6F5 BAMUM COMMA\n"
+ " ꛶ U+A6F6 BAMUM SEMICOLON\n"
+ " ꛷ U+A6F7 BAMUM QUESTION MARK\n"
+ "Phags Pa — Head marks for Tibetan items: 2\n"
+ " ꡴ U+A874 PHAGS-PA SINGLE HEAD MARK\n"
+ " ꡵ U+A875 PHAGS-PA DOUBLE HEAD MARK\n"
+ "Phags Pa — Punctuation for Tibetan items: 2\n"
+ " ꡶ U+A876 PHAGS-PA MARK SHAD\n"
+ " ꡷ U+A877 PHAGS-PA MARK DOUBLE SHAD\n"
+ "Saurashtra — Punctuation items: 2\n"
+ " ꣎ U+A8CE SAURASHTRA DANDA\n"
+ " ꣏ U+A8CF SAURASHTRA DOUBLE DANDA\n"
+ "Devanagari Extended — Editorial marks items: 3\n"
+ " ꣸ U+A8F8 DEVANAGARI SIGN PUSHPIKA\n"
+ " ꣹ U+A8F9 DEVANAGARI GAP FILLER\n"
+ " ꣺ U+A8FA DEVANAGARI CARET\n"
+ "Devanagari Extended — Sign items: 1\n"
+ " ꣼ U+A8FC DEVANAGARI SIGN SIDDHAM\n"
+ "Kayah Li — Punctuation items: 2\n"
+ " ꤮ U+A92E KAYAH LI SIGN CWI\n"
+ " ꤯ U+A92F KAYAH LI SIGN SHYA\n"
+ "Rejang — Punctuation items: 1\n"
+ " ꥟ U+A95F REJANG SECTION MARK\n"
+ "Javanese — Punctuation items: 13\n"
+ " ꧁ U+A9C1 JAVANESE LEFT RERENGGAN\n"
+ " ꧂ U+A9C2 JAVANESE RIGHT RERENGGAN\n"
+ " ꧃ U+A9C3 JAVANESE PADA ANDAP\n"
+ " ꧄ U+A9C4 JAVANESE PADA MADYA\n"
+ " ꧅ U+A9C5 JAVANESE PADA LUHUR\n"
+ " ꧆ U+A9C6 JAVANESE PADA WINDU\n"
+ " ꧇ U+A9C7 JAVANESE PADA PANGKAT\n"
+ " ꧈ U+A9C8 JAVANESE PADA LINGSA\n"
+ " ꧉ U+A9C9 JAVANESE PADA LUNGSI\n"
+ " ꧊ U+A9CA JAVANESE PADA ADEG\n"
+ " ꧋ U+A9CB JAVANESE PADA ADEG ADEG\n"
+ " ꧌ U+A9CC JAVANESE PADA PISELEH\n"
+ " ꧍ U+A9CD JAVANESE TURNED PADA PISELEH\n"
+ "Javanese — Ellipsis marks items: 2\n"
+ " ꧞ U+A9DE JAVANESE PADA TIRTA TUMETES\n"
+ " ꧟ U+A9DF JAVANESE PADA ISEN-ISEN\n"
+ "Cham — Punctuation items: 4\n"
+ " ꩜ U+AA5C CHAM PUNCTUATION SPIRAL\n"
+ " ꩝ U+AA5D CHAM PUNCTUATION DANDA\n"
+ " ꩞ U+AA5E CHAM PUNCTUATION DOUBLE DANDA\n"
+ " ꩟ U+AA5F CHAM PUNCTUATION TRIPLE DANDA\n"
+ "Tai Viet — Punctuation items: 2\n"
+ " ꫞ U+AADE TAI VIET SYMBOL HO HOI\n"
+ " ꫟ U+AADF TAI VIET SYMBOL KOI KOI\n"
+ "Meetei Mayek Extensions — Punctuation items: 2\n"
+ " ꫰ U+AAF0 MEETEI MAYEK CHEIKHAN\n"
+ " ꫱ U+AAF1 MEETEI MAYEK AHANG KHUDAM\n"
+ "Meetei Mayek — Punctuation items: 1\n"
+ " ꯫ U+ABEB MEETEI MAYEK CHEIKHEI\n"
+ "Arabic Presentation Forms A — Punctuation items: 2\n"
+ " ﴾ U+FD3E ORNATE LEFT PARENTHESIS\n"
+ " ﴿ U+FD3F ORNATE RIGHT PARENTHESIS\n"
+ "Vertical Forms — Glyphs for vertical variants items: 10\n"
+ " ︐ U+FE10 PRESENTATION FORM FOR VERTICAL COMMA\n"
+ " ︑ U+FE11 PRESENTATION FORM FOR VERTICAL IDEOGRAPHIC COMMA\n"
+ " ︒ U+FE12 PRESENTATION FORM FOR VERTICAL IDEOGRAPHIC FULL STOP\n"
+ " ︓ U+FE13 PRESENTATION FORM FOR VERTICAL COLON\n"
+ " ︔ U+FE14 PRESENTATION FORM FOR VERTICAL SEMICOLON\n"
+ " ︕ U+FE15 PRESENTATION FORM FOR VERTICAL EXCLAMATION MARK\n"
+ " ︖ U+FE16 PRESENTATION FORM FOR VERTICAL QUESTION MARK\n"
+ " ︗ U+FE17 PRESENTATION FORM FOR VERTICAL LEFT WHITE LENTICULAR BRACKET\n"
+ " ︘ U+FE18 PRESENTATION FORM FOR VERTICAL RIGHT WHITE LENTICULAR BRAKCET\n"
+ " ︙ U+FE19 PRESENTATION FORM FOR VERTICAL HORIZONTAL ELLIPSIS\n"
+ "CJK Compatibility Forms — Glyphs for vertical variants items: 23\n"
+ " ︰ U+FE30 PRESENTATION FORM FOR VERTICAL TWO DOT LEADER\n"
+ " ︱ U+FE31 PRESENTATION FORM FOR VERTICAL EM DASH\n"
+ " ︲ U+FE32 PRESENTATION FORM FOR VERTICAL EN DASH\n"
+ " ︳ U+FE33 PRESENTATION FORM FOR VERTICAL LOW LINE\n"
+ " ︴ U+FE34 PRESENTATION FORM FOR VERTICAL WAVY LOW LINE\n"
+ " ︵ U+FE35 PRESENTATION FORM FOR VERTICAL LEFT PARENTHESIS\n"
+ " ︶ U+FE36 PRESENTATION FORM FOR VERTICAL RIGHT PARENTHESIS\n"
+ " ︷ U+FE37 PRESENTATION FORM FOR VERTICAL LEFT CURLY BRACKET\n"
+ " ︸ U+FE38 PRESENTATION FORM FOR VERTICAL RIGHT CURLY BRACKET\n"
+ " ︹ U+FE39 PRESENTATION FORM FOR VERTICAL LEFT TORTOISE SHELL BRACKET\n"
+ " ︺ U+FE3A PRESENTATION FORM FOR VERTICAL RIGHT TORTOISE SHELL BRACKET\n"
+ " ︻ U+FE3B PRESENTATION FORM FOR VERTICAL LEFT BLACK LENTICULAR BRACKET\n"
+ " ︼ U+FE3C PRESENTATION FORM FOR VERTICAL RIGHT BLACK LENTICULAR BRACKET\n"
+ " ︽ U+FE3D PRESENTATION FORM FOR VERTICAL LEFT DOUBLE ANGLE BRACKET\n"
+ " ︾ U+FE3E PRESENTATION FORM FOR VERTICAL RIGHT DOUBLE ANGLE BRACKET\n"
+ " ︿ U+FE3F PRESENTATION FORM FOR VERTICAL LEFT ANGLE BRACKET\n"
+ " ﹀ U+FE40 PRESENTATION FORM FOR VERTICAL RIGHT ANGLE BRACKET\n"
+ " ﹁ U+FE41 PRESENTATION FORM FOR VERTICAL LEFT CORNER BRACKET\n"
+ " ﹂ U+FE42 PRESENTATION FORM FOR VERTICAL RIGHT CORNER BRACKET\n"
+ " ﹃ U+FE43 PRESENTATION FORM FOR VERTICAL LEFT WHITE CORNER BRACKET\n"
+ " ﹄ U+FE44 PRESENTATION FORM FOR VERTICAL RIGHT WHITE CORNER BRACKET\n"
+ " ﹇ U+FE47 PRESENTATION FORM FOR VERTICAL LEFT SQUARE BRACKET\n"
+ " ﹈ U+FE48 PRESENTATION FORM FOR VERTICAL RIGHT SQUARE BRACKET\n"
+ "CJK Compatibility Forms — Sidelining emphasis marks items: 2\n"
+ " ﹅ U+FE45 SESAME DOT\n"
+ " ﹆ U+FE46 WHITE SESAME DOT\n"
+ "CJK Compatibility Forms — Overscores and underscores items: 7\n"
+ " ﹉ U+FE49 DASHED OVERLINE\n"
+ " ﹊ U+FE4A CENTRELINE OVERLINE\n"
+ " ﹋ U+FE4B WAVY OVERLINE\n"
+ " ﹌ U+FE4C DOUBLE WAVY OVERLINE\n"
+ " ﹍ U+FE4D DASHED LOW LINE\n"
+ " ﹎ U+FE4E CENTRELINE LOW LINE\n"
+ " ﹏ U+FE4F WAVY LOW LINE\n"
+ "Small Form Variants — Small form variants items: 21\n"
+ " ﹐ U+FE50 SMALL COMMA\n"
+ " ﹑ U+FE51 SMALL IDEOGRAPHIC COMMA\n"
+ " ﹒ U+FE52 SMALL FULL STOP\n"
+ " ﹔ U+FE54 SMALL SEMICOLON\n"
+ " ﹕ U+FE55 SMALL COLON\n"
+ " ﹖ U+FE56 SMALL QUESTION MARK\n"
+ " ﹗ U+FE57 SMALL EXCLAMATION MARK\n"
+ " ﹘ U+FE58 SMALL EM DASH\n"
+ " ﹙ U+FE59 SMALL LEFT PARENTHESIS\n"
+ " ﹚ U+FE5A SMALL RIGHT PARENTHESIS\n"
+ " ﹛ U+FE5B SMALL LEFT CURLY BRACKET\n"
+ " ﹜ U+FE5C SMALL RIGHT CURLY BRACKET\n"
+ " ﹝ U+FE5D SMALL LEFT TORTOISE SHELL BRACKET\n"
+ " ﹞ U+FE5E SMALL RIGHT TORTOISE SHELL BRACKET\n"
+ " ﹟ U+FE5F SMALL NUMBER SIGN\n"
+ " ﹠ U+FE60 SMALL AMPERSAND\n"
+ " ﹡ U+FE61 SMALL ASTERISK\n"
+ " ﹣ U+FE63 SMALL HYPHEN-MINUS\n"
+ " ﹨ U+FE68 SMALL REVERSE SOLIDUS\n"
+ " ﹪ U+FE6A SMALL PERCENT SIGN\n"
+ " ﹫ U+FE6B SMALL COMMERCIAL AT\n"
+ "Halfwidth And Fullwidth Forms — Fullwidth ASCII variants items: 23\n"
+ " ! U+FF01 FULLWIDTH EXCLAMATION MARK\n"
+ " " U+FF02 FULLWIDTH QUOTATION MARK\n"
+ " # U+FF03 FULLWIDTH NUMBER SIGN\n"
+ " % U+FF05 FULLWIDTH PERCENT SIGN\n"
+ " & U+FF06 FULLWIDTH AMPERSAND\n"
+ " ' U+FF07 FULLWIDTH APOSTROPHE\n"
+ " ( U+FF08 FULLWIDTH LEFT PARENTHESIS\n"
+ " ) U+FF09 FULLWIDTH RIGHT PARENTHESIS\n"
+ " * U+FF0A FULLWIDTH ASTERISK\n"
+ " , U+FF0C FULLWIDTH COMMA\n"
+ " - U+FF0D FULLWIDTH HYPHEN-MINUS\n"
+ " . U+FF0E FULLWIDTH FULL STOP\n"
+ " / U+FF0F FULLWIDTH SOLIDUS\n"
+ " : U+FF1A FULLWIDTH COLON\n"
+ " ; U+FF1B FULLWIDTH SEMICOLON\n"
+ " ? U+FF1F FULLWIDTH QUESTION MARK\n"
+ " @ U+FF20 FULLWIDTH COMMERCIAL AT\n"
+ " [ U+FF3B FULLWIDTH LEFT SQUARE BRACKET\n"
+ " \ U+FF3C FULLWIDTH REVERSE SOLIDUS\n"
+ " ] U+FF3D FULLWIDTH RIGHT SQUARE BRACKET\n"
+ " _ U+FF3F FULLWIDTH LOW LINE\n"
+ " { U+FF5B FULLWIDTH LEFT CURLY BRACKET\n"
+ " } U+FF5D FULLWIDTH RIGHT CURLY BRACKET\n"
+ "Halfwidth And Fullwidth Forms — Fullwidth brackets items: 2\n"
+ " ⦅ U+FF5F FULLWIDTH LEFT WHITE PARENTHESIS\n"
+ " ⦆ U+FF60 FULLWIDTH RIGHT WHITE PARENTHESIS\n"
+ "Halfwidth And Fullwidth Forms — Halfwidth CJK punctuation items: 4\n"
+ " 。 U+FF61 HALFWIDTH IDEOGRAPHIC FULL STOP\n"
+ " 「 U+FF62 HALFWIDTH LEFT CORNER BRACKET\n"
+ " 」 U+FF63 HALFWIDTH RIGHT CORNER BRACKET\n"
+ " 、 U+FF64 HALFWIDTH IDEOGRAPHIC COMMA\n"
+ "Halfwidth And Fullwidth Forms — Halfwidth Katakana variants items: 1\n"
+ " ・ U+FF65 HALFWIDTH KATAKANA MIDDLE DOT\n"
+ "Aegean Numbers — Punctuation items: 3\n"
+ " 𐄀 U+10100 AEGEAN WORD SEPARATOR LINE\n"
+ " 𐄁 U+10101 AEGEAN WORD SEPARATOR DOT\n"
+ " 𐄂 U+10102 AEGEAN CHECK MARK\n"
+ "Ugaritic — Punctuation items: 1\n"
+ " 𐎟 U+1039F UGARITIC WORD DIVIDER\n"
+ "Old Persian — Punctuation items: 1\n"
+ " 𐏐 U+103D0 OLD PERSIAN WORD DIVIDER\n"
+ "Caucasian Albanian — Punctuation items: 1\n"
+ " 𐕯 U+1056F CAUCASIAN ALBANIAN CITATION MARK\n"
+ "Imperial Aramaic — Punctuation items: 1\n"
+ " 𐡗 U+10857 IMPERIAL ARAMAIC SECTION SIGN\n"
+ "Phoenician — Punctuation items: 1\n"
+ " 𐤟 U+1091F PHOENICIAN WORD SEPARATOR\n"
+ "Lydian — Punctuation items: 1\n"
+ " 𐤿 U+1093F LYDIAN TRIANGULAR MARK\n"
+ "Kharoshthi — Punctuation items: 9\n"
+ " 𐩐 U+10A50 KHAROSHTHI PUNCTUATION DOT\n"
+ " 𐩑 U+10A51 KHAROSHTHI PUNCTUATION SMALL CIRCLE\n"
+ " 𐩒 U+10A52 KHAROSHTHI PUNCTUATION CIRCLE\n"
+ " 𐩓 U+10A53 KHAROSHTHI PUNCTUATION CRESCENT BAR\n"
+ " 𐩔 U+10A54 KHAROSHTHI PUNCTUATION MANGALAM\n"
+ " 𐩕 U+10A55 KHAROSHTHI PUNCTUATION LOTUS\n"
+ " 𐩖 U+10A56 KHAROSHTHI PUNCTUATION DANDA\n"
+ " 𐩗 U+10A57 KHAROSHTHI PUNCTUATION DOUBLE DANDA\n"
+ " 𐩘 U+10A58 KHAROSHTHI PUNCTUATION LINES\n"
+ "Old South Arabian — Numbers items: 1\n"
+ " 𐩿 U+10A7F OLD SOUTH ARABIAN NUMERIC INDICATOR\n"
+ "Manichaean — Punctuation items: 7\n"
+ " 𐫰 U+10AF0 MANICHAEAN PUNCTUATION STAR\n"
+ " 𐫱 U+10AF1 MANICHAEAN PUNCTUATION FLEURON\n"
+ " 𐫲 U+10AF2 MANICHAEAN PUNCTUATION DOUBLE DOT WITHIN DOT\n"
+ " 𐫳 U+10AF3 MANICHAEAN PUNCTUATION DOT WITHIN DOT\n"
+ " 𐫴 U+10AF4 MANICHAEAN PUNCTUATION DOT\n"
+ " 𐫵 U+10AF5 MANICHAEAN PUNCTUATION TWO DOTS\n"
+ " 𐫶 U+10AF6 MANICHAEAN PUNCTUATION LINE FILLER\n"
+ "Avestan — Punctuation items: 7\n"
+ " 𐬹 U+10B39 AVESTAN ABBREVIATION MARK\n"
+ " 𐬺 U+10B3A TINY TWO DOTS OVER ONE DOT PUNCTUATION\n"
+ " 𐬻 U+10B3B SMALL TWO DOTS OVER ONE DOT PUNCTUATION\n"
+ " 𐬼 U+10B3C LARGE TWO DOTS OVER ONE DOT PUNCTUATION\n"
+ " 𐬽 U+10B3D LARGE ONE DOT OVER TWO DOTS PUNCTUATION\n"
+ " 𐬾 U+10B3E LARGE TWO RINGS OVER ONE RING PUNCTUATION\n"
+ " 𐬿 U+10B3F LARGE ONE RING OVER TWO RINGS PUNCTUATION\n"
+ "Psalter Pahlavi — Punctuation items: 4\n"
+ " 𐮙 U+10B99 PSALTER PAHLAVI SECTION MARK\n"
+ " 𐮚 U+10B9A PSALTER PAHLAVI TURNED SECTION MARK\n"
+ " 𐮛 U+10B9B PSALTER PAHLAVI FOUR DOTS WITH CROSS\n"
+ " 𐮜 U+10B9C PSALTER PAHLAVI FOUR DOTS WITH DOT\n"
+ "Sogdian — Punctuation items: 5\n"
+ " 𐽕 U+10F55 SOGDIAN PUNCTUATION TWO VERTICAL BARS\n"
+ " 𐽖 U+10F56 SOGDIAN PUNCTUATION TWO VERTICAL BARS WITH DOTS\n"
+ " 𐽗 U+10F57 SOGDIAN PUNCTUATION CIRCLE WITH DOT\n"
+ " 𐽘 U+10F58 SOGDIAN PUNCTUATION TWO CIRCLES WITH DOTS\n"
+ " 𐽙 U+10F59 SOGDIAN PUNCTUATION HALF CIRCLE WITH DOT\n"
+ "Brahmi — Punctuation items: 7\n"
+ " 𑁇 U+11047 BRAHMI DANDA\n"
+ " 𑁈 U+11048 BRAHMI DOUBLE DANDA\n"
+ " 𑁉 U+11049 BRAHMI PUNCTUATION DOT\n"
+ " 𑁊 U+1104A BRAHMI PUNCTUATION DOUBLE DOT\n"
+ " 𑁋 U+1104B BRAHMI PUNCTUATION LINE\n"
+ " 𑁌 U+1104C BRAHMI PUNCTUATION CRESCENT BAR\n"
+ " 𑁍 U+1104D BRAHMI PUNCTUATION LOTUS\n"
+ "Kaithi — Various signs items: 2\n"
+ " 𑂻 U+110BB KAITHI ABBREVIATION SIGN\n"
+ " 𑂼 U+110BC KAITHI ENUMERATION SIGN\n"
+ "Kaithi — Punctuation items: 4\n"
+ " 𑂾 U+110BE KAITHI SECTION MARK\n"
+ " 𑂿 U+110BF KAITHI DOUBLE SECTION MARK\n"
+ " 𑃀 U+110C0 KAITHI DANDA\n"
+ " 𑃁 U+110C1 KAITHI DOUBLE DANDA\n"
+ "Chakma — Punctuation items: 4\n"
+ " 𑅀 U+11140 CHAKMA SECTION MARK\n"
+ " 𑅁 U+11141 CHAKMA DANDA\n"
+ " 𑅂 U+11142 CHAKMA DOUBLE DANDA\n"
+ " 𑅃 U+11143 CHAKMA QUESTION MARK\n"
+ "Mahajani — Punctuation items: 2\n"
+ " 𑅴 U+11174 MAHAJANI ABBREVIATION SIGN\n"
+ " 𑅵 U+11175 MAHAJANI SECTION MARK\n"
+ "Sharada — Punctuation items: 7\n"
+ " 𑇅 U+111C5 SHARADA DANDA\n"
+ " 𑇆 U+111C6 SHARADA DOUBLE DANDA\n"
+ " 𑇇 U+111C7 SHARADA ABBREVIATION SIGN\n"
+ " 𑇈 U+111C8 SHARADA SEPARATOR\n"
+ " 𑇍 U+111CD SHARADA SUTRA MARK\n"
+ " 𑇛 U+111DB SHARADA SIGN SIDDHAM\n"
+ " 𑇝 U+111DD SHARADA CONTINUATION SIGN\n"
+ "Sharada — Section marks items: 2\n"
+ " 𑇞 U+111DE SHARADA SECTION MARK-1\n"
+ " 𑇟 U+111DF SHARADA SECTION MARK-2\n"
+ "Khojki — Punctuation items: 6\n"
+ " 𑈸 U+11238 KHOJKI DANDA\n"
+ " 𑈹 U+11239 KHOJKI DOUBLE DANDA\n"
+ " 𑈺 U+1123A KHOJKI WORD SEPARATOR\n"
+ " 𑈻 U+1123B KHOJKI SECTION MARK\n"
+ " 𑈼 U+1123C KHOJKI DOUBLE SECTION MARK\n"
+ " 𑈽 U+1123D KHOJKI ABBREVIATION SIGN\n"
+ "Multani — Punctuation items: 1\n"
+ " 𑊩 U+112A9 MULTANI SECTION MARK\n"
+ "Newa — Punctuation items: 5\n"
+ " 𑑋 U+1144B NEWA DANDA\n"
+ " 𑑌 U+1144C NEWA DOUBLE DANDA\n"
+ " 𑑍 U+1144D NEWA COMMA\n"
+ " 𑑎 U+1144E NEWA GAP FILLER\n"
+ " 𑑏 U+1144F NEWA ABBREVIATION SIGN\n"
+ "Newa — Various signs items: 2\n"
+ " 𑑛 U+1145B NEWA PLACEHOLDER MARK\n"
+ " 𑑝 U+1145D NEWA INSERTION SIGN\n"
+ "Tirhuta — Various signs items: 1\n"
+ " 𑓆 U+114C6 TIRHUTA ABBREVIATION SIGN\n"
+ "Siddham — Head mark items: 1\n"
+ " 𑗁 U+115C1 SIDDHAM SIGN SIDDHAM\n"
+ "Siddham — Punctuation items: 4\n"
+ " 𑗂 U+115C2 SIDDHAM DANDA\n"
+ " 𑗃 U+115C3 SIDDHAM DOUBLE DANDA\n"
+ " 𑗄 U+115C4 SIDDHAM SEPARATOR DOT\n"
+ " 𑗅 U+115C5 SIDDHAM SEPARATOR BAR\n"
+ "Siddham — Repetition mark items: 3\n"
+ " 𑗆 U+115C6 SIDDHAM REPETITION MARK-1\n"
+ " 𑗇 U+115C7 SIDDHAM REPETITION MARK-2\n"
+ " 𑗈 U+115C8 SIDDHAM REPETITION MARK-3\n"
+ "Siddham — Terminal mark items: 1\n"
+ " 𑗉 U+115C9 SIDDHAM END OF TEXT MARK\n"
+ "Siddham — Section marks items: 14\n"
+ " 𑗊 U+115CA SIDDHAM SECTION MARK WITH TRIDENT AND U-SHAPED ORNAMENTS\n"
+ " 𑗋 U+115CB SIDDHAM SECTION MARK WITH TRIDENT AND DOTTED CRESCENTS\n"
+ " 𑗌 U+115CC SIDDHAM SECTION MARK WITH RAYS AND DOTTED CRESCENTS\n"
+ " 𑗍 U+115CD SIDDHAM SECTION MARK WITH RAYS AND DOTTED DOUBLE CRESCENTS\n"
+ " 𑗎 U+115CE SIDDHAM SECTION MARK WITH RAYS AND DOTTED TRIPLE CRESCENTS\n"
+ " 𑗏 U+115CF SIDDHAM SECTION MARK DOUBLE RING\n"
+ " 𑗐 U+115D0 SIDDHAM SECTION MARK DOUBLE RING WITH RAYS\n"
+ " 𑗑 U+115D1 SIDDHAM SECTION MARK WITH DOUBLE CRESCENTS\n"
+ " 𑗒 U+115D2 SIDDHAM SECTION MARK WITH TRIPLE CRESCENTS\n"
+ " 𑗓 U+115D3 SIDDHAM SECTION MARK WITH QUADRUPLE CRESCENTS\n"
+ " 𑗔 U+115D4 SIDDHAM SECTION MARK WITH SEPTUPLE CRESCENTS\n"
+ " 𑗕 U+115D5 SIDDHAM SECTION MARK WITH CIRCLES AND RAYS\n"
+ " 𑗖 U+115D6 SIDDHAM SECTION MARK WITH CIRCLES AND TWO ENCLOSURES\n"
+ " 𑗗 U+115D7 SIDDHAM SECTION MARK WITH CIRCLES AND FOUR ENCLOSURES\n"
+ "Modi — Punctuation items: 3\n"
+ " 𑙁 U+11641 MODI DANDA\n"
+ " 𑙂 U+11642 MODI DOUBLE DANDA\n"
+ " 𑙃 U+11643 MODI ABBREVIATION SIGN\n"
+ "Mongolian Supplement — Punctuation items: 13\n"
+ " 𑙠 U+11660 MONGOLIAN BIRGA WITH ORNAMENT\n"
+ " 𑙡 U+11661 MONGOLIAN ROTATED BIRGA\n"
+ " 𑙢 U+11662 MONGOLIAN DOUBLE BIRGA WITH ORNAMENT\n"
+ " 𑙣 U+11663 MONGOLIAN TRIPLE BIRGA WITH ORNAMENT\n"
+ " 𑙤 U+11664 MONGOLIAN BIRGA WITH DOUBLE ORNAMENT\n"
+ " 𑙥 U+11665 MONGOLIAN ROTATED BIRGA WITH ORNAMENT\n"
+ " 𑙦 U+11666 MONGOLIAN ROTATED BIRGA WITH DOUBLE ORNAMENT\n"
+ " 𑙧 U+11667 MONGOLIAN INVERTED BIRGA\n"
+ " 𑙨 U+11668 MONGOLIAN INVERTED BIRGA WITH DOUBLE ORNAMENT\n"
+ " 𑙩 U+11669 MONGOLIAN SWIRL BIRGA\n"
+ " 𑙪 U+1166A MONGOLIAN SWIRL BIRGA WITH ORNAMENT\n"
+ " 𑙫 U+1166B MONGOLIAN SWIRL BIRGA WITH DOUBLE ORNAMENT\n"
+ " 𑙬 U+1166C MONGOLIAN TURNED SWIRL BIRGA WITH DOUBLE ORNAMENT\n"
+ "Ahom — Punctuation items: 3\n"
+ " 𑜼 U+1173C AHOM SIGN SMALL SECTION\n"
+ " 𑜽 U+1173D AHOM SIGN SECTION\n"
+ " 𑜾 U+1173E AHOM SIGN RULAI\n"
+ "Dogra — Punctuation items: 1\n"
+ " 𑠻 U+1183B DOGRA ABBREVIATION SIGN\n"
+ "Zanabazar Square — Head mark items: 4\n"
+ " 𑨿 U+11A3F ZANABAZAR SQUARE INITIAL HEAD MARK\n"
+ " 𑩀 U+11A40 ZANABAZAR SQUARE CLOSING HEAD MARK\n"
+ " 𑩅 U+11A45 ZANABAZAR SQUARE INITIAL DOUBLE-LINED HEAD MARK\n"
+ " 𑩆 U+11A46 ZANABAZAR SQUARE CLOSING DOUBLE-LINED HEAD MARK\n"
+ "Zanabazar Square — Punctuation items: 4\n"
+ " 𑩁 U+11A41 ZANABAZAR SQUARE MARK TSHEG\n"
+ " 𑩂 U+11A42 ZANABAZAR SQUARE MARK SHAD\n"
+ " 𑩃 U+11A43 ZANABAZAR SQUARE MARK DOUBLE SHAD\n"
+ " 𑩄 U+11A44 ZANABAZAR SQUARE MARK LONG TSHEG\n"
+ "Soyombo — Punctuation items: 3\n"
+ " 𑪚 U+11A9A SOYOMBO MARK TSHEG\n"
+ " 𑪛 U+11A9B SOYOMBO MARK SHAD\n"
+ " 𑪜 U+11A9C SOYOMBO MARK DOUBLE SHAD\n"
+ "Soyombo — Head mark items: 3\n"
+ " 𑪞 U+11A9E SOYOMBO HEAD MARK WITH MOON AND SUN AND TRIPLE FLAME\n"
+ " 𑪟 U+11A9F SOYOMBO HEAD MARK WITH MOON AND SUN AND FLAME\n"
+ " 𑪠 U+11AA0 SOYOMBO HEAD MARK WITH MOON AND SUN\n"
+ "Soyombo — Terminal mark items: 2\n"
+ " 𑪡 U+11AA1 SOYOMBO TERMINAL MARK-1\n"
+ " 𑪢 U+11AA2 SOYOMBO TERMINAL MARK-2\n"
+ "Bhaiksuki — Punctuation items: 3\n"
+ " 𑱁 U+11C41 BHAIKSUKI DANDA\n"
+ " 𑱂 U+11C42 BHAIKSUKI DOUBLE DANDA\n"
+ " 𑱃 U+11C43 BHAIKSUKI WORD SEPARATOR\n"
+ "Bhaiksuki — Gap fillers items: 2\n"
+ " 𑱄 U+11C44 BHAIKSUKI GAP FILLER-1\n"
+ " 𑱅 U+11C45 BHAIKSUKI GAP FILLER-2\n"
+ "Marchen — Punctuation items: 2\n"
+ " 𑱰 U+11C70 MARCHEN HEAD MARK\n"
+ " 𑱱 U+11C71 MARCHEN MARK SHAD\n"
+ "Makasar — Punctuation items: 2\n"
+ " 𑻷 U+11EF7 MAKASAR PASSIMBANG\n"
+ " 𑻸 U+11EF8 MAKASAR END OF SECTION\n"
+ "Cuneiform Numbers And Punctuation — Punctuation items: 5\n"
+ " 𒑰 U+12470 CUNEIFORM PUNCTUATION SIGN OLD ASSYRIAN WORD DIVIDER\n"
+ " 𒑱 U+12471 CUNEIFORM PUNCTUATION SIGN VERTICAL COLON\n"
+ " 𒑲 U+12472 CUNEIFORM PUNCTUATION SIGN DIAGONAL COLON\n"
+ " 𒑳 U+12473 CUNEIFORM PUNCTUATION SIGN DIAGONAL TRICOLON\n"
+ " 𒑴 U+12474 CUNEIFORM PUNCTUATION SIGN DIAGONAL QUADCOLON\n"
+ "Mro — Punctuation items: 2\n"
+ " 𖩮 U+16A6E MRO DANDA\n"
+ " 𖩯 U+16A6F MRO DOUBLE DANDA\n"
+ "Bassa Vah — Punctuation items: 1\n"
+ " 𖫵 U+16AF5 BASSA VAH FULL STOP\n"
+ "Pahawh Hmong — Punctuation items: 6\n"
+ " 𖬷 U+16B37 PAHAWH HMONG SIGN VOS THOM\n"
+ " 𖬸 U+16B38 PAHAWH HMONG SIGN VOS TSHAB CEEB\n"
+ " 𖬹 U+16B39 PAHAWH HMONG SIGN CIM CHEEM\n"
+ " 𖬺 U+16B3A PAHAWH HMONG SIGN VOS THIAB\n"
+ " 𖬻 U+16B3B PAHAWH HMONG SIGN VOS FEEM\n"
+ " 𖭄 U+16B44 PAHAWH HMONG SIGN XAUS\n"
+ "Medefaidrin — Punctuation items: 2\n"
+ " 𖺗 U+16E97 MEDEFAIDRIN COMMA\n"
+ " 𖺘 U+16E98 MEDEFAIDRIN FULL STOP\n"
+ "Medefaidrin — Sign items: 2\n"
+ " 𖺙 U+16E99 MEDEFAIDRIN SYMBOL AIVA\n"
+ " 𖺚 U+16E9A MEDEFAIDRIN EXCLAMATION OH\n"
+ "Duployan — Chinook punctuation items: 1\n"
+ " 𛲟 U+1BC9F DUPLOYAN PUNCTUATION CHINOOK FULL STOP\n"
+ "Sutton SignWriting — Punctuation items: 5\n"
+ " 𝪇 U+1DA87 SIGNWRITING COMMA\n"
+ " 𝪈 U+1DA88 SIGNWRITING FULL STOP\n"
+ " 𝪉 U+1DA89 SIGNWRITING SEMICOLON\n"
+ " 𝪊 U+1DA8A SIGNWRITING COLON\n"
+ " 𝪋 U+1DA8B SIGNWRITING PARENTHESIS\n"
+ "Adlam — Punctuation items: 2\n"
+ " 𞥞 U+1E95E ADLAM INITIAL EXCLAMATION MARK\n"
+ " 𞥟 U+1E95F ADLAM INITIAL QUESTION MARK";
final Pattern pattern = Pattern.compile(regex);
final Matcher matcher = pattern.matcher(string);
while (matcher.find()) {
System.out.println("Full match: " + matcher.group(0));
for (int i = 1; i <= matcher.groupCount(); i++) {
System.out.println("Group " + i + ": " + matcher.group(i));
}
}
}
}
Please keep in mind that these code samples are automatically generated and are not guaranteed to work. If you find any syntax errors, feel free to submit a bug report. For a full regex reference for Java, please visit: https://docs.oracle.com/javase/7/docs/api/java/util/regex/Pattern.html