// Global (`g`) pattern that matches one punctuation character per match.
//  - The leading character class lists BMP code points: ASCII punctuation,
//    a few Latin-1 marks (\xA1 ...), and \uXXXX singles/ranges.
//  - The `\uD8xx[...]` alternatives spell out supplementary-plane characters
//    as UTF-16 surrogate pairs (one fixed high surrogate followed by a class
//    of low surrogates). The pattern has no `u` flag, so it matches by UTF-16
//    code unit and astral characters have to be written this way.
// NOTE(review): the ranges look like a generated expansion of the Unicode
// "Punctuation" general category (cf. the sample text in `str` below) —
// confirm the Unicode version it was generated from before extending it.
// Because of the `g` flag, `regex.lastIndex` is stateful across
// `test()` / `exec()` calls; reset it (or use `matchAll`) when reusing it.
const regex = /(?:[!-#%-\*,-\/:;\?@\[-\]_\{\}\xA1\xA7\xAB\xB6\xB7\xBB\xBF\u037E\u0387\u055A-\u055F\u0589\u058A\u05BE\u05C0\u05C3\u05C6\u05F3\u05F4\u0609\u060A\u060C\u060D\u061B\u061E\u061F\u066A-\u066D\u06D4\u0700-\u070D\u07F7-\u07F9\u0830-\u083E\u085E\u0964\u0965\u0970\u09FD\u0A76\u0AF0\u0C84\u0DF4\u0E4F\u0E5A\u0E5B\u0F04-\u0F12\u0F14\u0F3A-\u0F3D\u0F85\u0FD0-\u0FD4\u0FD9\u0FDA\u104A-\u104F\u10FB\u1360-\u1368\u1400\u166D\u166E\u169B\u169C\u16EB-\u16ED\u1735\u1736\u17D4-\u17D6\u17D8-\u17DA\u1800-\u180A\u1944\u1945\u1A1E\u1A1F\u1AA0-\u1AA6\u1AA8-\u1AAD\u1B5A-\u1B60\u1BFC-\u1BFF\u1C3B-\u1C3F\u1C7E\u1C7F\u1CC0-\u1CC7\u1CD3\u2010-\u2027\u2030-\u2043\u2045-\u2051\u2053-\u205E\u207D\u207E\u208D\u208E\u2308-\u230B\u2329\u232A\u2768-\u2775\u27C5\u27C6\u27E6-\u27EF\u2983-\u2998\u29D8-\u29DB\u29FC\u29FD\u2CF9-\u2CFC\u2CFE\u2CFF\u2D70\u2E00-\u2E2E\u2E30-\u2E4E\u3001-\u3003\u3008-\u3011\u3014-\u301F\u3030\u303D\u30A0\u30FB\uA4FE\uA4FF\uA60D-\uA60F\uA673\uA67E\uA6F2-\uA6F7\uA874-\uA877\uA8CE\uA8CF\uA8F8-\uA8FA\uA8FC\uA92E\uA92F\uA95F\uA9C1-\uA9CD\uA9DE\uA9DF\uAA5C-\uAA5F\uAADE\uAADF\uAAF0\uAAF1\uABEB\uFD3E\uFD3F\uFE10-\uFE19\uFE30-\uFE52\uFE54-\uFE61\uFE63\uFE68\uFE6A\uFE6B\uFF01-\uFF03\uFF05-\uFF0A\uFF0C-\uFF0F\uFF1A\uFF1B\uFF1F\uFF20\uFF3B-\uFF3D\uFF3F\uFF5B\uFF5D\uFF5F-\uFF65]|\uD800[\uDD00-\uDD02\uDF9F\uDFD0]|\uD801\uDD6F|\uD802[\uDC57\uDD1F\uDD3F\uDE50-\uDE58\uDE7F\uDEF0-\uDEF6\uDF39-\uDF3F\uDF99-\uDF9C]|\uD803[\uDF55-\uDF59]|\uD804[\uDC47-\uDC4D\uDCBB\uDCBC\uDCBE-\uDCC1\uDD40-\uDD43\uDD74\uDD75\uDDC5-\uDDC8\uDDCD\uDDDB\uDDDD-\uDDDF\uDE38-\uDE3D\uDEA9]|\uD805[\uDC4B-\uDC4F\uDC5B\uDC5D\uDCC6\uDDC1-\uDDD7\uDE41-\uDE43\uDE60-\uDE6C\uDF3C-\uDF3E]|\uD806[\uDC3B\uDE3F-\uDE46\uDE9A-\uDE9C\uDE9E-\uDEA2]|\uD807[\uDC41-\uDC45\uDC70\uDC71\uDEF7\uDEF8]|\uD809[\uDC70-\uDC74]|\uD81A[\uDE6E\uDE6F\uDEF5\uDF37-\uDF3B\uDF44]|\uD81B[\uDE97-\uDE9A]|\uD82F\uDC9F|\uD836[\uDE87-\uDE8B]|\uD83A[\uDD5E\uDD5F])/g;
// Alternative syntax using RegExp constructor
// const regex = new RegExp('(?:[!-#%-\\*,-\\\/:;\\?@\\[-\\]_\\{\\}\\xA1\\xA7\\xAB\\xB6\\xB7\\xBB\\xBF\\u037E\\u0387\\u055A-\\u055F\\u0589\\u058A\\u05BE\\u05C0\\u05C3\\u05C6\\u05F3\\u05F4\\u0609\\u060A\\u060C\\u060D\\u061B\\u061E\\u061F\\u066A-\\u066D\\u06D4\\u0700-\\u070D\\u07F7-\\u07F9\\u0830-\\u083E\\u085E\\u0964\\u0965\\u0970\\u09FD\\u0A76\\u0AF0\\u0C84\\u0DF4\\u0E4F\\u0E5A\\u0E5B\\u0F04-\\u0F12\\u0F14\\u0F3A-\\u0F3D\\u0F85\\u0FD0-\\u0FD4\\u0FD9\\u0FDA\\u104A-\\u104F\\u10FB\\u1360-\\u1368\\u1400\\u166D\\u166E\\u169B\\u169C\\u16EB-\\u16ED\\u1735\\u1736\\u17D4-\\u17D6\\u17D8-\\u17DA\\u1800-\\u180A\\u1944\\u1945\\u1A1E\\u1A1F\\u1AA0-\\u1AA6\\u1AA8-\\u1AAD\\u1B5A-\\u1B60\\u1BFC-\\u1BFF\\u1C3B-\\u1C3F\\u1C7E\\u1C7F\\u1CC0-\\u1CC7\\u1CD3\\u2010-\\u2027\\u2030-\\u2043\\u2045-\\u2051\\u2053-\\u205E\\u207D\\u207E\\u208D\\u208E\\u2308-\\u230B\\u2329\\u232A\\u2768-\\u2775\\u27C5\\u27C6\\u27E6-\\u27EF\\u2983-\\u2998\\u29D8-\\u29DB\\u29FC\\u29FD\\u2CF9-\\u2CFC\\u2CFE\\u2CFF\\u2D70\\u2E00-\\u2E2E\\u2E30-\\u2E4E\\u3001-\\u3003\\u3008-\\u3011\\u3014-\\u301F\\u3030\\u303D\\u30A0\\u30FB\\uA4FE\\uA4FF\\uA60D-\\uA60F\\uA673\\uA67E\\uA6F2-\\uA6F7\\uA874-\\uA877\\uA8CE\\uA8CF\\uA8F8-\\uA8FA\\uA8FC\\uA92E\\uA92F\\uA95F\\uA9C1-\\uA9CD\\uA9DE\\uA9DF\\uAA5C-\\uAA5F\\uAADE\\uAADF\\uAAF0\\uAAF1\\uABEB\\uFD3E\\uFD3F\\uFE10-\\uFE19\\uFE30-\\uFE52\\uFE54-\\uFE61\\uFE63\\uFE68\\uFE6A\\uFE6B\\uFF01-\\uFF03\\uFF05-\\uFF0A\\uFF0C-\\uFF0F\\uFF1A\\uFF1B\\uFF1F\\uFF20\\uFF3B-\\uFF3D\\uFF3F\\uFF5B\\uFF5D\\uFF5F-\\uFF65]|\\uD800[\\uDD00-\\uDD02\\uDF9F\\uDFD0]|\\uD801\\uDD6F|\\uD802[\\uDC57\\uDD1F\\uDD3F\\uDE50-\\uDE58\\uDE7F\\uDEF0-\\uDEF6\\uDF39-\\uDF3F\\uDF99-\\uDF9C]|\\uD803[\\uDF55-\\uDF59]|\\uD804[\\uDC47-\\uDC4D\\uDCBB\\uDCBC\\uDCBE-\\uDCC1\\uDD40-\\uDD43\\uDD74\\uDD75\\uDDC5-\\uDDC8\\uDDCD\\uDDDB\\uDDDD-\\uDDDF\\uDE38-\\uDE3D\\uDEA9]|\\uD805[\\uDC4B-\\uDC4F\\uDC5B\\uDC5D\\uDCC6\\uDDC1-\\uDDD7\\uDE41-\\uDE43\\uDE60-\\uDE6C\\uDF3C-\\uDF3E]|\\uD806[\\uDC3B\\uDE3F-\\uDE46\\uDE9A-\\uDE9C\\uDE9E-\\uDEA2]|\\uD807[\\uDC41-\\uDC45\\uDC70\\uDC71\\uDEF7\\uDEF8]|\\uD809[\\uDC70-\\uDC74]|\\uD81A[\\uDE6E\\uDE6F\\uDEF5\\uDF37-\\uDF3B\\uDF44]|\\uD81B[\\uDE97-\\uDE9A]|\\uD82F\\uDC9F|\\uD836[\\uDE87-\\uDE8B]|\\uD83A[\\uDD5E\\uDD5F])', 'g')
const str = `
Basic Latin — ASCII punctuation and symbols items: 23
! U+0021 EXCLAMATION MARK
" U+0022 QUOTATION MARK
# U+0023 NUMBER SIGN
% U+0025 PERCENT SIGN
& U+0026 AMPERSAND
' U+0027 APOSTROPHE
( U+0028 LEFT PARENTHESIS
) U+0029 RIGHT PARENTHESIS
* U+002A ASTERISK
, U+002C COMMA
- U+002D HYPHEN-MINUS
. U+002E FULL STOP
/ U+002F SOLIDUS
: U+003A COLON
; U+003B SEMICOLON
? U+003F QUESTION MARK
@ U+0040 COMMERCIAL AT
[ U+005B LEFT SQUARE BRACKET
\\ U+005C REVERSE SOLIDUS
] U+005D RIGHT SQUARE BRACKET
_ U+005F LOW LINE
{ U+007B LEFT CURLY BRACKET
} U+007D RIGHT CURLY BRACKET
Latin 1 Supplement — Latin-1 punctuation and symbols items: 6
¡ U+00A1 INVERTED EXCLAMATION MARK
§ U+00A7 SECTION SIGN
« U+00AB LEFT-POINTING DOUBLE ANGLE QUOTATION MARK
¶ U+00B6 PILCROW SIGN
· U+00B7 MIDDLE DOT
» U+00BB RIGHT-POINTING DOUBLE ANGLE QUOTATION MARK
Latin 1 Supplement — Punctuation items: 1
¿ U+00BF INVERTED QUESTION MARK
Greek And Coptic — Punctuation items: 2
; U+037E GREEK QUESTION MARK
· U+0387 GREEK ANO TELEIA
Armenian — Modifier letter items: 6
՚ U+055A ARMENIAN APOSTROPHE
՛ U+055B ARMENIAN EMPHASIS MARK
՜ U+055C ARMENIAN EXCLAMATION MARK
՝ U+055D ARMENIAN COMMA
՞ U+055E ARMENIAN QUESTION MARK
՟ U+055F ARMENIAN ABBREVIATION MARK
Armenian — Punctuation items: 2
։ U+0589 ARMENIAN FULL STOP
֊ U+058A ARMENIAN HYPHEN
Hebrew — Points and punctuation items: 4
־ U+05BE HEBREW PUNCTUATION MAQAF
׀ U+05C0 HEBREW PUNCTUATION PASEQ
׃ U+05C3 HEBREW PUNCTUATION SOF PASUQ
׆ U+05C6 HEBREW PUNCTUATION NUN HAFUKHA
Hebrew — Punctuation items: 2
׳ U+05F3 HEBREW PUNCTUATION GERESH
״ U+05F4 HEBREW PUNCTUATION GERSHAYIM
Arabic — Punctuation items: 12
؉ U+0609 ARABIC-INDIC PER MILLE SIGN
؊ U+060A ARABIC-INDIC PER TEN THOUSAND SIGN
، U+060C ARABIC COMMA
؍ U+060D ARABIC DATE SEPARATOR
؛ U+061B ARABIC SEMICOLON
؞ U+061E ARABIC TRIPLE DOT PUNCTUATION MARK
؟ U+061F ARABIC QUESTION MARK
٪ U+066A ARABIC PERCENT SIGN
٫ U+066B ARABIC DECIMAL SEPARATOR
٬ U+066C ARABIC THOUSANDS SEPARATOR
٭ U+066D ARABIC FIVE POINTED STAR
۔ U+06D4 ARABIC FULL STOP
Syriac — Syriac punctuation and signs items: 14
܀ U+0700 SYRIAC END OF PARAGRAPH
܁ U+0701 SYRIAC SUPRALINEAR FULL STOP
܂ U+0702 SYRIAC SUBLINEAR FULL STOP
܃ U+0703 SYRIAC SUPRALINEAR COLON
܄ U+0704 SYRIAC SUBLINEAR COLON
܅ U+0705 SYRIAC HORIZONTAL COLON
܆ U+0706 SYRIAC COLON SKEWED LEFT
܇ U+0707 SYRIAC COLON SKEWED RIGHT
܈ U+0708 SYRIAC SUPRALINEAR COLON SKEWED LEFT
܉ U+0709 SYRIAC SUBLINEAR COLON SKEWED RIGHT
܊ U+070A SYRIAC CONTRACTION
܋ U+070B SYRIAC HARKLEAN OBELUS
܌ U+070C SYRIAC HARKLEAN METOBELUS
܍ U+070D SYRIAC HARKLEAN ASTERISCUS
NKo — Punctuation items: 3
߷ U+07F7 NKO SYMBOL GBAKURUNEN
߸ U+07F8 NKO COMMA
߹ U+07F9 NKO EXCLAMATION MARK
Samaritan — Punctuation items: 15
࠰ U+0830 SAMARITAN PUNCTUATION NEQUDAA
࠱ U+0831 SAMARITAN PUNCTUATION AFSAAQ
࠲ U+0832 SAMARITAN PUNCTUATION ANGED
࠳ U+0833 SAMARITAN PUNCTUATION BAU
࠴ U+0834 SAMARITAN PUNCTUATION ATMAAU
࠵ U+0835 SAMARITAN PUNCTUATION SHIYYAALAA
࠶ U+0836 SAMARITAN ABBREVIATION MARK
࠷ U+0837 SAMARITAN PUNCTUATION MELODIC QITSA
࠸ U+0838 SAMARITAN PUNCTUATION ZIQAA
࠹ U+0839 SAMARITAN PUNCTUATION QITSA
࠺ U+083A SAMARITAN PUNCTUATION ZAEF
࠻ U+083B SAMARITAN PUNCTUATION TURU
࠼ U+083C SAMARITAN PUNCTUATION ARKAANU
࠽ U+083D SAMARITAN PUNCTUATION SOF MASHFAAT
࠾ U+083E SAMARITAN PUNCTUATION ANNAAU
Mandaic — Punctuation items: 1
࡞ U+085E MANDAIC PUNCTUATION
Devanagari — Generic punctuation for scripts of India items: 2
। U+0964 DEVANAGARI DANDA
॥ U+0965 DEVANAGARI DOUBLE DANDA
Devanagari — Abbreviation mark items: 1
॰ U+0970 DEVANAGARI ABBREVIATION SIGN
Bengali — Sign items: 1
৽ U+09FD BENGALI ABBREVIATION SIGN
Gurmukhi — Sign items: 1
੶ U+0A76 GURMUKHI ABBREVIATION SIGN
Gujarati — Abbreviation mark items: 1
૰ U+0AF0 GUJARATI ABBREVIATION SIGN
Kannada — Various signs items: 1
಄ U+0C84 KANNADA SIGN SIDDHAM
Sinhala — Punctuation items: 1
෴ U+0DF4 SINHALA PUNCTUATION KUNDDALIYA
Thai — Sign items: 3
๏ U+0E4F THAI CHARACTER FONGMAN
๚ U+0E5A THAI CHARACTER ANGKHANKHU
๛ U+0E5B THAI CHARACTER KHOMUT
Tibetan — Head mark items: 6
༄ U+0F04 TIBETAN MARK INITIAL YIG MGO MDUN MA
༅ U+0F05 TIBETAN MARK CLOSING YIG MGO SGAB MA
༆ U+0F06 TIBETAN MARK CARET YIG MGO PHUR SHAD MA
༇ U+0F07 TIBETAN MARK YIG MGO TSHEG SHAD MA
࿓ U+0FD3 TIBETAN MARK INITIAL BRDA RNYING YIG MGO MDUN MA
࿔ U+0FD4 TIBETAN MARK CLOSING BRDA RNYING YIG MGO SGAB MA
Tibetan — Sign items: 16
༈ U+0F08 TIBETAN MARK SBRUL SHAD
༉ U+0F09 TIBETAN MARK BSKUR YIG MGO
༊ U+0F0A TIBETAN MARK BKA- SHOG YIG MGO
་ U+0F0B TIBETAN MARK INTERSYLLABIC TSHEG
༌ U+0F0C TIBETAN MARK DELIMITER TSHEG BSTAR
། U+0F0D TIBETAN MARK SHAD
༎ U+0F0E TIBETAN MARK NYIS SHAD
༏ U+0F0F TIBETAN MARK TSHEG SHAD
༐ U+0F10 TIBETAN MARK NYIS TSHEG SHAD
༑ U+0F11 TIBETAN MARK RIN CHEN SPUNGS SHAD
༒ U+0F12 TIBETAN MARK RGYA GRAM SHAD
༔ U+0F14 TIBETAN MARK GTER TSHEG
྅ U+0F85 TIBETAN MARK PALUTA
࿐ U+0FD0 TIBETAN MARK BSKA- SHOG GI MGO RGYAN
࿑ U+0FD1 TIBETAN MARK MNYAM YIG GI MGO RGYAN
࿒ U+0FD2 TIBETAN MARK NYIS TSHEG
Tibetan — Paired punctuation items: 4
༺ U+0F3A TIBETAN MARK GUG RTAGS GYON
༻ U+0F3B TIBETAN MARK GUG RTAGS GYAS
༼ U+0F3C TIBETAN MARK ANG KHANG GYON
༽ U+0F3D TIBETAN MARK ANG KHANG GYAS
Tibetan — Annotation marks items: 2
࿙ U+0FD9 TIBETAN MARK LEADING MCHAN RTAGS
࿚ U+0FDA TIBETAN MARK TRAILING MCHAN RTAGS
Myanmar — Punctuation items: 2
၊ U+104A MYANMAR SIGN LITTLE SECTION
။ U+104B MYANMAR SIGN SECTION
Myanmar — Various signs items: 4
၌ U+104C MYANMAR SYMBOL LOCATIVE
၍ U+104D MYANMAR SYMBOL COMPLETED
၎ U+104E MYANMAR SYMBOL AFOREMENTIONED
၏ U+104F MYANMAR SYMBOL GENITIVE
Georgian — Punctuation items: 1
჻ U+10FB GEORGIAN PARAGRAPH SEPARATOR
Ethiopic — Punctuation items: 9
፠ U+1360 ETHIOPIC SECTION MARK
፡ U+1361 ETHIOPIC WORDSPACE
። U+1362 ETHIOPIC FULL STOP
፣ U+1363 ETHIOPIC COMMA
፤ U+1364 ETHIOPIC SEMICOLON
፥ U+1365 ETHIOPIC COLON
፦ U+1366 ETHIOPIC PREFACE COLON
፧ U+1367 ETHIOPIC QUESTION MARK
፨ U+1368 ETHIOPIC PARAGRAPH SEPARATOR
Unified Canadian Aboriginal Syllabics — Punctuation items: 2
᐀ U+1400 CANADIAN SYLLABICS HYPHEN
᙮ U+166E CANADIAN SYLLABICS FULL STOP
Unified Canadian Aboriginal Syllabics — Sign items: 1
᙭ U+166D CANADIAN SYLLABICS CHI SIGN
Ogham — Punctuation items: 2
᚛ U+169B OGHAM FEATHER MARK
᚜ U+169C OGHAM REVERSED FEATHER MARK
Runic — Punctuation items: 3
᛫ U+16EB RUNIC SINGLE PUNCTUATION
᛬ U+16EC RUNIC MULTIPLE PUNCTUATION
᛭ U+16ED RUNIC CROSS PUNCTUATION
Hanunoo — Generic punctuation for Philippine scripts items: 2
᜵ U+1735 PHILIPPINE SINGLE PUNCTUATION
᜶ U+1736 PHILIPPINE DOUBLE PUNCTUATION
Khmer — Various signs items: 6
។ U+17D4 KHMER SIGN KHAN
៕ U+17D5 KHMER SIGN BARIYOOSAN
៖ U+17D6 KHMER SIGN CAMNUC PII KUUH
៘ U+17D8 KHMER SIGN BEYYAL
៙ U+17D9 KHMER SIGN PHNAEK MUAN
៚ U+17DA KHMER SIGN KOOMUUT
Mongolian — Punctuation items: 11
᠀ U+1800 MONGOLIAN BIRGA
᠁ U+1801 MONGOLIAN ELLIPSIS
᠂ U+1802 MONGOLIAN COMMA
᠃ U+1803 MONGOLIAN FULL STOP
᠄ U+1804 MONGOLIAN COLON
᠅ U+1805 MONGOLIAN FOUR DOTS
᠆ U+1806 MONGOLIAN TODO SOFT HYPHEN
᠇ U+1807 MONGOLIAN SIBE SYLLABLE BOUNDARY MARKER
᠈ U+1808 MONGOLIAN MANCHU COMMA
᠉ U+1809 MONGOLIAN MANCHU FULL STOP
᠊ U+180A MONGOLIAN NIRUGU
Limbu — Various signs items: 2
᥄ U+1944 LIMBU EXCLAMATION MARK
᥅ U+1945 LIMBU QUESTION MARK
Buginese — Various signs items: 2
᨞ U+1A1E BUGINESE PALLAWA
᨟ U+1A1F BUGINESE END OF SECTION
Tai Tham — Logographs items: 3
᪠ U+1AA0 TAI THAM SIGN WIANG
᪡ U+1AA1 TAI THAM SIGN WIANGWAAK
᪢ U+1AA2 TAI THAM SIGN SAWAN
Tai Tham — Punctuation items: 10
᪣ U+1AA3 TAI THAM SIGN KEOW
᪤ U+1AA4 TAI THAM SIGN HOY
᪥ U+1AA5 TAI THAM SIGN DOKMAI
᪦ U+1AA6 TAI THAM SIGN REVERSED ROTATED RANA
᪨ U+1AA8 TAI THAM SIGN KAAN
᪩ U+1AA9 TAI THAM SIGN KAANKUU
᪪ U+1AAA TAI THAM SIGN SATKAAN
᪫ U+1AAB TAI THAM SIGN SATKAANKUU
᪬ U+1AAC TAI THAM SIGN HANG
᪭ U+1AAD TAI THAM SIGN CAANG
Balinese — Punctuation items: 7
᭚ U+1B5A BALINESE PANTI
᭛ U+1B5B BALINESE PAMADA
᭜ U+1B5C BALINESE WINDU
᭝ U+1B5D BALINESE CARIK PAMUNGKAH
᭞ U+1B5E BALINESE CARIK SIKI
᭟ U+1B5F BALINESE CARIK PAREREN
᭠ U+1B60 BALINESE PAMENENG
Batak — Punctuation items: 4
᯼ U+1BFC BATAK SYMBOL BINDU NA METEK
᯽ U+1BFD BATAK SYMBOL BINDU PINARBORAS
᯾ U+1BFE BATAK SYMBOL BINDU JUDUL
᯿ U+1BFF BATAK SYMBOL BINDU PANGOLAT
Lepcha — Punctuation items: 5
᰻ U+1C3B LEPCHA PUNCTUATION TA-ROL
᰼ U+1C3C LEPCHA PUNCTUATION NYET THYOOM TA-ROL
᰽ U+1C3D LEPCHA PUNCTUATION CER-WA
᰾ U+1C3E LEPCHA PUNCTUATION TSHOOK CER-WA
᰿ U+1C3F LEPCHA PUNCTUATION TSHOOK
Ol Chiki — Punctuation items: 2
᱾ U+1C7E OL CHIKI PUNCTUATION MUCAAD
᱿ U+1C7F OL CHIKI PUNCTUATION DOUBLE MUCAAD
Sundanese Supplement — Punctuation items: 8
᳀ U+1CC0 SUNDANESE PUNCTUATION BINDU SURYA
᳁ U+1CC1 SUNDANESE PUNCTUATION BINDU PANGLONG
᳂ U+1CC2 SUNDANESE PUNCTUATION BINDU PURNAMA
᳃ U+1CC3 SUNDANESE PUNCTUATION BINDU CAKRA
᳄ U+1CC4 SUNDANESE PUNCTUATION BINDU LEU SATANGA
᳅ U+1CC5 SUNDANESE PUNCTUATION BINDU KA SATANGA
᳆ U+1CC6 SUNDANESE PUNCTUATION BINDU DA SATANGA
᳇ U+1CC7 SUNDANESE PUNCTUATION BINDU BA SATANGA
Vedic Extensions — Breathing mark for the Samaveda items: 1
᳓ U+1CD3 VEDIC SIGN NIHSHVASA
General Punctuation — Dashes items: 6
‐ U+2010 HYPHEN
‑ U+2011 NON-BREAKING HYPHEN
‒ U+2012 FIGURE DASH
– U+2013 EN DASH
— U+2014 EM DASH
― U+2015 HORIZONTAL BAR
General Punctuation — General punctuation items: 39
‖ U+2016 DOUBLE VERTICAL LINE
‗ U+2017 DOUBLE LOW LINE
† U+2020 DAGGER
‡ U+2021 DOUBLE DAGGER
• U+2022 BULLET
‣ U+2023 TRIANGULAR BULLET
․ U+2024 ONE DOT LEADER
‥ U+2025 TWO DOT LEADER
… U+2026 HORIZONTAL ELLIPSIS
‧ U+2027 HYPHENATION POINT
‰ U+2030 PER MILLE SIGN
‱ U+2031 PER TEN THOUSAND SIGN
′ U+2032 PRIME
″ U+2033 DOUBLE PRIME
‴ U+2034 TRIPLE PRIME
‵ U+2035 REVERSED PRIME
‶ U+2036 REVERSED DOUBLE PRIME
‷ U+2037 REVERSED TRIPLE PRIME
‸ U+2038 CARET
※ U+203B REFERENCE MARK
‽ U+203D INTERROBANG
‾ U+203E OVERLINE
‿ U+203F UNDERTIE
⁀ U+2040 CHARACTER TIE
⁁ U+2041 CARET INSERTION POINT
⁂ U+2042 ASTERISM
⁃ U+2043 HYPHEN BULLET
⁊ U+204A TIRONIAN SIGN ET
⁋ U+204B REVERSED PILCROW SIGN
⁌ U+204C BLACK LEFTWARDS BULLET
⁍ U+204D BLACK RIGHTWARDS BULLET
⁎ U+204E LOW ASTERISK
⁏ U+204F REVERSED SEMICOLON
⁐ U+2050 CLOSE UP
⁑ U+2051 TWO ASTERISKS ALIGNED VERTICALLY
⁓ U+2053 SWUNG DASH
⁔ U+2054 INVERTED UNDERTIE
⁕ U+2055 FLOWER PUNCTUATION MARK
⁗ U+2057 QUADRUPLE PRIME
General Punctuation — Quotation marks and apostrophe items: 8
‘ U+2018 LEFT SINGLE QUOTATION MARK
’ U+2019 RIGHT SINGLE QUOTATION MARK
‚ U+201A SINGLE LOW-9 QUOTATION MARK
‛ U+201B SINGLE HIGH-REVERSED-9 QUOTATION MARK
“ U+201C LEFT DOUBLE QUOTATION MARK
” U+201D RIGHT DOUBLE QUOTATION MARK
„ U+201E DOUBLE LOW-9 QUOTATION MARK
‟ U+201F DOUBLE HIGH-REVERSED-9 QUOTATION MARK
General Punctuation — Quotation marks items: 2
‹ U+2039 SINGLE LEFT-POINTING ANGLE QUOTATION MARK
› U+203A SINGLE RIGHT-POINTING ANGLE QUOTATION MARK
General Punctuation — Double punctuation for vertical text items: 4
‼️ U+203C DOUBLE EXCLAMATION MARK
⁇ U+2047 DOUBLE QUESTION MARK
⁈ U+2048 QUESTION EXCLAMATION MARK
⁉️ U+2049 EXCLAMATION QUESTION MARK
General Punctuation — Brackets items: 2
⁅ U+2045 LEFT SQUARE BRACKET WITH QUILL
⁆ U+2046 RIGHT SQUARE BRACKET WITH QUILL
General Punctuation — Archaic punctuation items: 8
⁖ U+2056 THREE DOT PUNCTUATION
⁘ U+2058 FOUR DOT PUNCTUATION
⁙ U+2059 FIVE DOT PUNCTUATION
⁚ U+205A TWO DOT PUNCTUATION
⁛ U+205B FOUR DOT MARK
⁜ U+205C DOTTED CROSS
⁝ U+205D TRICOLON
⁞ U+205E VERTICAL FOUR DOTS
Superscripts And Subscripts — Superscripts items: 2
⁽ U+207D SUPERSCRIPT LEFT PARENTHESIS
⁾ U+207E SUPERSCRIPT RIGHT PARENTHESIS
Superscripts And Subscripts — Subscripts items: 2
₍ U+208D SUBSCRIPT LEFT PARENTHESIS
₎ U+208E SUBSCRIPT RIGHT PARENTHESIS
Miscellaneous Technical — Ceilings and floors items: 4
⌈ U+2308 LEFT CEILING
⌉ U+2309 RIGHT CEILING
⌊ U+230A LEFT FLOOR
⌋ U+230B RIGHT FLOOR
Miscellaneous Technical — Deprecated angle brackets items: 2
〈 U+2329 LEFT-POINTING ANGLE BRACKET
〉 U+232A RIGHT-POINTING ANGLE BRACKET
Dingbats — Ornamental brackets items: 14
❨ U+2768 MEDIUM LEFT PARENTHESIS ORNAMENT
❩ U+2769 MEDIUM RIGHT PARENTHESIS ORNAMENT
❪ U+276A MEDIUM FLATTENED LEFT PARENTHESIS ORNAMENT
❫ U+276B MEDIUM FLATTENED RIGHT PARENTHESIS ORNAMENT
❬ U+276C MEDIUM LEFT-POINTING ANGLE BRACKET ORNAMENT
❭ U+276D MEDIUM RIGHT-POINTING ANGLE BRACKET ORNAMENT
❮ U+276E HEAVY LEFT-POINTING ANGLE QUOTATION MARK ORNAMENT
❯ U+276F HEAVY RIGHT-POINTING ANGLE QUOTATION MARK ORNAMENT
❰ U+2770 HEAVY LEFT-POINTING ANGLE BRACKET ORNAMENT
❱ U+2771 HEAVY RIGHT-POINTING ANGLE BRACKET ORNAMENT
❲ U+2772 LIGHT LEFT TORTOISE SHELL BRACKET ORNAMENT
❳ U+2773 LIGHT RIGHT TORTOISE SHELL BRACKET ORNAMENT
❴ U+2774 MEDIUM LEFT CURLY BRACKET ORNAMENT
❵ U+2775 MEDIUM RIGHT CURLY BRACKET ORNAMENT
Miscellaneous Mathematical Symbols A — Paired punctuation items: 2
⟅ U+27C5 LEFT S-SHAPED BAG DELIMITER
⟆ U+27C6 RIGHT S-SHAPED BAG DELIMITER
Miscellaneous Mathematical Symbols A — Mathematical brackets items: 10
⟦ U+27E6 MATHEMATICAL LEFT WHITE SQUARE BRACKET
⟧ U+27E7 MATHEMATICAL RIGHT WHITE SQUARE BRACKET
⟨ U+27E8 MATHEMATICAL LEFT ANGLE BRACKET
⟩ U+27E9 MATHEMATICAL RIGHT ANGLE BRACKET
⟪ U+27EA MATHEMATICAL LEFT DOUBLE ANGLE BRACKET
⟫ U+27EB MATHEMATICAL RIGHT DOUBLE ANGLE BRACKET
⟬ U+27EC MATHEMATICAL LEFT WHITE TORTOISE SHELL BRACKET
⟭ U+27ED MATHEMATICAL RIGHT WHITE TORTOISE SHELL BRACKET
⟮ U+27EE MATHEMATICAL LEFT FLATTENED PARENTHESIS
⟯ U+27EF MATHEMATICAL RIGHT FLATTENED PARENTHESIS
Miscellaneous Mathematical Symbols B — Brackets items: 20
⦃ U+2983 LEFT WHITE CURLY BRACKET
⦄ U+2984 RIGHT WHITE CURLY BRACKET
⦅ U+2985 LEFT WHITE PARENTHESIS
⦆ U+2986 RIGHT WHITE PARENTHESIS
⦇ U+2987 Z NOTATION LEFT IMAGE BRACKET
⦈ U+2988 Z NOTATION RIGHT IMAGE BRACKET
⦉ U+2989 Z NOTATION LEFT BINDING BRACKET
⦊ U+298A Z NOTATION RIGHT BINDING BRACKET
⦋ U+298B LEFT SQUARE BRACKET WITH UNDERBAR
⦌ U+298C RIGHT SQUARE BRACKET WITH UNDERBAR
⦑ U+2991 LEFT ANGLE BRACKET WITH DOT
⦒ U+2992 RIGHT ANGLE BRACKET WITH DOT
⦓ U+2993 LEFT ARC LESS-THAN BRACKET
⦔ U+2994 RIGHT ARC GREATER-THAN BRACKET
⦕ U+2995 DOUBLE LEFT ARC GREATER-THAN BRACKET
⦖ U+2996 DOUBLE RIGHT ARC LESS-THAN BRACKET
⦗ U+2997 LEFT BLACK TORTOISE SHELL BRACKET
⦘ U+2998 RIGHT BLACK TORTOISE SHELL BRACKET
⧼ U+29FC LEFT-POINTING CURVED ANGLE BRACKET
⧽ U+29FD RIGHT-POINTING CURVED ANGLE BRACKET
Miscellaneous Mathematical Symbols B — Brackets with ticks items: 4
⦍ U+298D LEFT SQUARE BRACKET WITH TICK IN TOP CORNER
⦎ U+298E RIGHT SQUARE BRACKET WITH TICK IN BOTTOM CORNER
⦏ U+298F LEFT SQUARE BRACKET WITH TICK IN BOTTOM CORNER
⦐ U+2990 RIGHT SQUARE BRACKET WITH TICK IN TOP CORNER
Miscellaneous Mathematical Symbols B — Fences items: 4
⧘ U+29D8 LEFT WIGGLY FENCE
⧙ U+29D9 RIGHT WIGGLY FENCE
⧚ U+29DA LEFT DOUBLE WIGGLY FENCE
⧛ U+29DB RIGHT DOUBLE WIGGLY FENCE
Coptic — Old Nubian punctuation items: 4
⳹ U+2CF9 COPTIC OLD NUBIAN FULL STOP
⳺ U+2CFA COPTIC OLD NUBIAN DIRECT QUESTION MARK
⳻ U+2CFB COPTIC OLD NUBIAN INDIRECT QUESTION MARK
⳼ U+2CFC COPTIC OLD NUBIAN VERSE DIVIDER
Coptic — Punctuation items: 2
⳾ U+2CFE COPTIC FULL STOP
⳿ U+2CFF COPTIC MORPHOLOGICAL DIVIDER
Tifinagh — Punctuation items: 1
⵰ U+2D70 TIFINAGH SEPARATOR MARK
Supplemental Punctuation — New Testament editorial symbols items: 14
⸀ U+2E00 RIGHT ANGLE SUBSTITUTION MARKER
⸁ U+2E01 RIGHT ANGLE DOTTED SUBSTITUTION MARKER
⸂ U+2E02 LEFT SUBSTITUTION BRACKET
⸃ U+2E03 RIGHT SUBSTITUTION BRACKET
⸄ U+2E04 LEFT DOTTED SUBSTITUTION BRACKET
⸅ U+2E05 RIGHT DOTTED SUBSTITUTION BRACKET
⸆ U+2E06 RAISED INTERPOLATION MARKER
⸇ U+2E07 RAISED DOTTED INTERPOLATION MARKER
⸈ U+2E08 DOTTED TRANSPOSITION MARKER
⸉ U+2E09 LEFT TRANSPOSITION BRACKET
⸊ U+2E0A RIGHT TRANSPOSITION BRACKET
⸋ U+2E0B RAISED SQUARE
⸌ U+2E0C LEFT RAISED OMISSION BRACKET
⸍ U+2E0D RIGHT RAISED OMISSION BRACKET
Supplemental Punctuation — Ancient Greek textual symbols items: 9
⸎ U+2E0E EDITORIAL CORONIS
⸏ U+2E0F PARAGRAPHOS
⸐ U+2E10 FORKED PARAGRAPHOS
⸑ U+2E11 REVERSED FORKED PARAGRAPHOS
⸒ U+2E12 HYPODIASTOLE
⸓ U+2E13 DOTTED OBELOS
⸔ U+2E14 DOWNWARDS ANCORA
⸕ U+2E15 UPWARDS ANCORA
⸖ U+2E16 DOTTED RIGHT-POINTING ANGLE
Supplemental Punctuation — Ancient Near-Eastern linguistic symbol items: 1
⸗ U+2E17 DOUBLE OBLIQUE HYPHEN
Supplemental Punctuation — General punctuation items: 2
⸘ U+2E18 INVERTED INTERROBANG
⸙ U+2E19 PALM BRANCH
Supplemental Punctuation — Dictionary punctuation items: 4
⸚ U+2E1A HYPHEN WITH DIAERESIS
⸛ U+2E1B TILDE WITH RING ABOVE
⸞ U+2E1E TILDE WITH DOT ABOVE
⸟ U+2E1F TILDE WITH DOT BELOW
Supplemental Punctuation — Brackets items: 8
⸜ U+2E1C LEFT LOW PARAPHRASE BRACKET
⸝ U+2E1D RIGHT LOW PARAPHRASE BRACKET
⸠ U+2E20 LEFT VERTICAL BAR WITH QUILL
⸡ U+2E21 RIGHT VERTICAL BAR WITH QUILL
⸦ U+2E26 LEFT SIDEWAYS U BRACKET
⸧ U+2E27 RIGHT SIDEWAYS U BRACKET
⸨ U+2E28 LEFT DOUBLE PARENTHESIS
⸩ U+2E29 RIGHT DOUBLE PARENTHESIS
Supplemental Punctuation — Half brackets items: 4
⸢ U+2E22 TOP LEFT HALF BRACKET
⸣ U+2E23 TOP RIGHT HALF BRACKET
⸤ U+2E24 BOTTOM LEFT HALF BRACKET
⸥ U+2E25 BOTTOM RIGHT HALF BRACKET
Supplemental Punctuation — Archaic punctuation items: 15
⸪ U+2E2A TWO DOTS OVER ONE DOT PUNCTUATION
⸫ U+2E2B ONE DOT OVER TWO DOTS PUNCTUATION
⸬ U+2E2C SQUARED FOUR DOT PUNCTUATION
⸭ U+2E2D FIVE DOT MARK
⸮ U+2E2E REVERSED QUESTION MARK
⸰ U+2E30 RING POINT
⸱ U+2E31 WORD SEPARATOR MIDDLE DOT
⸳ U+2E33 RAISED DOT
⸴ U+2E34 RAISED COMMA
⸿ U+2E3F CAPITULUM
⹊ U+2E4A DOTTED SOLIDUS
⹋ U+2E4B TRIPLE DAGGER
⹌ U+2E4C MEDIEVAL COMMA
⹍ U+2E4D PARAGRAPHUS MARK
⹎ U+2E4E PUNCTUS ELEVATUS MARK
Supplemental Punctuation — Palaeotype transliteration symbol items: 6
⸲ U+2E32 TURNED COMMA
⸵ U+2E35 TURNED SEMICOLON
⸶ U+2E36 DAGGER WITH LEFT GUARD
⸷ U+2E37 DAGGER WITH RIGHT GUARD
⸸ U+2E38 TURNED DAGGER
⸹ U+2E39 TOP HALF SECTION SIGN
Supplemental Punctuation — Dashes items: 2
⸺ U+2E3A TWO-EM DASH
⸻ U+2E3B THREE-EM DASH
Supplemental Punctuation — Alternate forms of punctuation items: 3
⸼ U+2E3C STENOGRAPHIC FULL STOP
⸽ U+2E3D VERTICAL SIX DOTS
⸾ U+2E3E WIGGLY VERTICAL LINE
Supplemental Punctuation — Double hyphen items: 1
⹀ U+2E40 DOUBLE HYPHEN
Supplemental Punctuation — Reversed punctuation items: 2
⹁ U+2E41 REVERSED COMMA
⹂ U+2E42 DOUBLE LOW-REVERSED-9 QUOTATION MARK
Supplemental Punctuation — Miscellaneous punctuation items: 2
⹃ U+2E43 DASH WITH LEFT UPTURN
⹄ U+2E44 DOUBLE SUSPENSION MARK
Supplemental Punctuation — Typicon punctuation items: 5
⹅ U+2E45 INVERTED LOW KAVYKA
⹆ U+2E46 INVERTED LOW KAVYKA WITH KAVYKA ABOVE
⹇ U+2E47 LOW KAVYKA
⹈ U+2E48 LOW KAVYKA WITH DOT
⹉ U+2E49 DOUBLE STACKED COMMA
CJK Symbols And Punctuation — CJK symbols and punctuation items: 3
、 U+3001 IDEOGRAPHIC COMMA
。 U+3002 IDEOGRAPHIC FULL STOP
〃 U+3003 DITTO MARK
CJK Symbols And Punctuation — CJK angle brackets items: 4
〈 U+3008 LEFT ANGLE BRACKET
〉 U+3009 RIGHT ANGLE BRACKET
《 U+300A LEFT DOUBLE ANGLE BRACKET
》 U+300B RIGHT DOUBLE ANGLE BRACKET
CJK Symbols And Punctuation — CJK corner brackets items: 4
「 U+300C LEFT CORNER BRACKET
」 U+300D RIGHT CORNER BRACKET
『 U+300E LEFT WHITE CORNER BRACKET
』 U+300F RIGHT WHITE CORNER BRACKET
CJK Symbols And Punctuation — CJK brackets items: 10
【 U+3010 LEFT BLACK LENTICULAR BRACKET
】 U+3011 RIGHT BLACK LENTICULAR BRACKET
〔 U+3014 LEFT TORTOISE SHELL BRACKET
〕 U+3015 RIGHT TORTOISE SHELL BRACKET
〖 U+3016 LEFT WHITE LENTICULAR BRACKET
〗 U+3017 RIGHT WHITE LENTICULAR BRACKET
〘 U+3018 LEFT WHITE TORTOISE SHELL BRACKET
〙 U+3019 RIGHT WHITE TORTOISE SHELL BRACKET
〚 U+301A LEFT WHITE SQUARE BRACKET
〛 U+301B RIGHT WHITE SQUARE BRACKET
CJK Symbols And Punctuation — CJK punctuation items: 6
〜 U+301C WAVE DASH
〝 U+301D REVERSED DOUBLE PRIME QUOTATION MARK
〞 U+301E DOUBLE PRIME QUOTATION MARK
〟 U+301F LOW DOUBLE PRIME QUOTATION MARK
〰️ U+3030 WAVY DASH
〽️ U+303D PART ALTERNATION MARK
Katakana — Katakana punctuation items: 1
゠ U+30A0 KATAKANA-HIRAGANA DOUBLE HYPHEN
Katakana — Conjunction and length marks items: 1
・ U+30FB KATAKANA MIDDLE DOT
Lisu — Punctuation items: 2
꓾ U+A4FE LISU PUNCTUATION COMMA
꓿ U+A4FF LISU PUNCTUATION FULL STOP
Vai — Punctuation items: 3
꘍ U+A60D VAI COMMA
꘎ U+A60E VAI FULL STOP
꘏ U+A60F VAI QUESTION MARK
Cyrillic Extended B — Punctuation mark items: 2
꙳ U+A673 SLAVONIC ASTERISK
꙾ U+A67E CYRILLIC KAVYKA
Bamum — Punctuation items: 6
꛲ U+A6F2 BAMUM NJAEMLI
꛳ U+A6F3 BAMUM FULL STOP
꛴ U+A6F4 BAMUM COLON
꛵ U+A6F5 BAMUM COMMA
꛶ U+A6F6 BAMUM SEMICOLON
꛷ U+A6F7 BAMUM QUESTION MARK
Phags Pa — Head marks for Tibetan items: 2
꡴ U+A874 PHAGS-PA SINGLE HEAD MARK
꡵ U+A875 PHAGS-PA DOUBLE HEAD MARK
Phags Pa — Punctuation for Tibetan items: 2
꡶ U+A876 PHAGS-PA MARK SHAD
꡷ U+A877 PHAGS-PA MARK DOUBLE SHAD
Saurashtra — Punctuation items: 2
꣎ U+A8CE SAURASHTRA DANDA
꣏ U+A8CF SAURASHTRA DOUBLE DANDA
Devanagari Extended — Editorial marks items: 3
꣸ U+A8F8 DEVANAGARI SIGN PUSHPIKA
꣹ U+A8F9 DEVANAGARI GAP FILLER
꣺ U+A8FA DEVANAGARI CARET
Devanagari Extended — Sign items: 1
꣼ U+A8FC DEVANAGARI SIGN SIDDHAM
Kayah Li — Punctuation items: 2
꤮ U+A92E KAYAH LI SIGN CWI
꤯ U+A92F KAYAH LI SIGN SHYA
Rejang — Punctuation items: 1
꥟ U+A95F REJANG SECTION MARK
Javanese — Punctuation items: 13
꧁ U+A9C1 JAVANESE LEFT RERENGGAN
꧂ U+A9C2 JAVANESE RIGHT RERENGGAN
꧃ U+A9C3 JAVANESE PADA ANDAP
꧄ U+A9C4 JAVANESE PADA MADYA
꧅ U+A9C5 JAVANESE PADA LUHUR
꧆ U+A9C6 JAVANESE PADA WINDU
꧇ U+A9C7 JAVANESE PADA PANGKAT
꧈ U+A9C8 JAVANESE PADA LINGSA
꧉ U+A9C9 JAVANESE PADA LUNGSI
꧊ U+A9CA JAVANESE PADA ADEG
꧋ U+A9CB JAVANESE PADA ADEG ADEG
꧌ U+A9CC JAVANESE PADA PISELEH
꧍ U+A9CD JAVANESE TURNED PADA PISELEH
Javanese — Ellipsis marks items: 2
꧞ U+A9DE JAVANESE PADA TIRTA TUMETES
꧟ U+A9DF JAVANESE PADA ISEN-ISEN
Cham — Punctuation items: 4
꩜ U+AA5C CHAM PUNCTUATION SPIRAL
꩝ U+AA5D CHAM PUNCTUATION DANDA
꩞ U+AA5E CHAM PUNCTUATION DOUBLE DANDA
꩟ U+AA5F CHAM PUNCTUATION TRIPLE DANDA
Tai Viet — Punctuation items: 2
꫞ U+AADE TAI VIET SYMBOL HO HOI
꫟ U+AADF TAI VIET SYMBOL KOI KOI
Meetei Mayek Extensions — Punctuation items: 2
꫰ U+AAF0 MEETEI MAYEK CHEIKHAN
꫱ U+AAF1 MEETEI MAYEK AHANG KHUDAM
Meetei Mayek — Punctuation items: 1
꯫ U+ABEB MEETEI MAYEK CHEIKHEI
Arabic Presentation Forms A — Punctuation items: 2
﴾ U+FD3E ORNATE LEFT PARENTHESIS
﴿ U+FD3F ORNATE RIGHT PARENTHESIS
Vertical Forms — Glyphs for vertical variants items: 10
︐ U+FE10 PRESENTATION FORM FOR VERTICAL COMMA
︑ U+FE11 PRESENTATION FORM FOR VERTICAL IDEOGRAPHIC COMMA
︒ U+FE12 PRESENTATION FORM FOR VERTICAL IDEOGRAPHIC FULL STOP
︓ U+FE13 PRESENTATION FORM FOR VERTICAL COLON
︔ U+FE14 PRESENTATION FORM FOR VERTICAL SEMICOLON
︕ U+FE15 PRESENTATION FORM FOR VERTICAL EXCLAMATION MARK
︖ U+FE16 PRESENTATION FORM FOR VERTICAL QUESTION MARK
︗ U+FE17 PRESENTATION FORM FOR VERTICAL LEFT WHITE LENTICULAR BRACKET
︘ U+FE18 PRESENTATION FORM FOR VERTICAL RIGHT WHITE LENTICULAR BRAKCET
︙ U+FE19 PRESENTATION FORM FOR VERTICAL HORIZONTAL ELLIPSIS
CJK Compatibility Forms — Glyphs for vertical variants items: 23
︰ U+FE30 PRESENTATION FORM FOR VERTICAL TWO DOT LEADER
︱ U+FE31 PRESENTATION FORM FOR VERTICAL EM DASH
︲ U+FE32 PRESENTATION FORM FOR VERTICAL EN DASH
︳ U+FE33 PRESENTATION FORM FOR VERTICAL LOW LINE
︴ U+FE34 PRESENTATION FORM FOR VERTICAL WAVY LOW LINE
︵ U+FE35 PRESENTATION FORM FOR VERTICAL LEFT PARENTHESIS
︶ U+FE36 PRESENTATION FORM FOR VERTICAL RIGHT PARENTHESIS
︷ U+FE37 PRESENTATION FORM FOR VERTICAL LEFT CURLY BRACKET
︸ U+FE38 PRESENTATION FORM FOR VERTICAL RIGHT CURLY BRACKET
︹ U+FE39 PRESENTATION FORM FOR VERTICAL LEFT TORTOISE SHELL BRACKET
︺ U+FE3A PRESENTATION FORM FOR VERTICAL RIGHT TORTOISE SHELL BRACKET
︻ U+FE3B PRESENTATION FORM FOR VERTICAL LEFT BLACK LENTICULAR BRACKET
︼ U+FE3C PRESENTATION FORM FOR VERTICAL RIGHT BLACK LENTICULAR BRACKET
︽ U+FE3D PRESENTATION FORM FOR VERTICAL LEFT DOUBLE ANGLE BRACKET
︾ U+FE3E PRESENTATION FORM FOR VERTICAL RIGHT DOUBLE ANGLE BRACKET
︿ U+FE3F PRESENTATION FORM FOR VERTICAL LEFT ANGLE BRACKET
﹀ U+FE40 PRESENTATION FORM FOR VERTICAL RIGHT ANGLE BRACKET
﹁ U+FE41 PRESENTATION FORM FOR VERTICAL LEFT CORNER BRACKET
﹂ U+FE42 PRESENTATION FORM FOR VERTICAL RIGHT CORNER BRACKET
﹃ U+FE43 PRESENTATION FORM FOR VERTICAL LEFT WHITE CORNER BRACKET
﹄ U+FE44 PRESENTATION FORM FOR VERTICAL RIGHT WHITE CORNER BRACKET
﹇ U+FE47 PRESENTATION FORM FOR VERTICAL LEFT SQUARE BRACKET
﹈ U+FE48 PRESENTATION FORM FOR VERTICAL RIGHT SQUARE BRACKET
CJK Compatibility Forms — Sidelining emphasis marks items: 2
﹅ U+FE45 SESAME DOT
﹆ U+FE46 WHITE SESAME DOT
CJK Compatibility Forms — Overscores and underscores items: 7
﹉ U+FE49 DASHED OVERLINE
﹊ U+FE4A CENTRELINE OVERLINE
﹋ U+FE4B WAVY OVERLINE
﹌ U+FE4C DOUBLE WAVY OVERLINE
﹍ U+FE4D DASHED LOW LINE
﹎ U+FE4E CENTRELINE LOW LINE
﹏ U+FE4F WAVY LOW LINE
Small Form Variants — Small form variants items: 21
﹐ U+FE50 SMALL COMMA
﹑ U+FE51 SMALL IDEOGRAPHIC COMMA
﹒ U+FE52 SMALL FULL STOP
﹔ U+FE54 SMALL SEMICOLON
﹕ U+FE55 SMALL COLON
﹖ U+FE56 SMALL QUESTION MARK
﹗ U+FE57 SMALL EXCLAMATION MARK
﹘ U+FE58 SMALL EM DASH
﹙ U+FE59 SMALL LEFT PARENTHESIS
﹚ U+FE5A SMALL RIGHT PARENTHESIS
﹛ U+FE5B SMALL LEFT CURLY BRACKET
﹜ U+FE5C SMALL RIGHT CURLY BRACKET
﹝ U+FE5D SMALL LEFT TORTOISE SHELL BRACKET
﹞ U+FE5E SMALL RIGHT TORTOISE SHELL BRACKET
﹟ U+FE5F SMALL NUMBER SIGN
﹠ U+FE60 SMALL AMPERSAND
﹡ U+FE61 SMALL ASTERISK
﹣ U+FE63 SMALL HYPHEN-MINUS
﹨ U+FE68 SMALL REVERSE SOLIDUS
﹪ U+FE6A SMALL PERCENT SIGN
﹫ U+FE6B SMALL COMMERCIAL AT
Halfwidth And Fullwidth Forms — Fullwidth ASCII variants items: 23
! U+FF01 FULLWIDTH EXCLAMATION MARK
" U+FF02 FULLWIDTH QUOTATION MARK
# U+FF03 FULLWIDTH NUMBER SIGN
% U+FF05 FULLWIDTH PERCENT SIGN
& U+FF06 FULLWIDTH AMPERSAND
' U+FF07 FULLWIDTH APOSTROPHE
( U+FF08 FULLWIDTH LEFT PARENTHESIS
) U+FF09 FULLWIDTH RIGHT PARENTHESIS
* U+FF0A FULLWIDTH ASTERISK
, U+FF0C FULLWIDTH COMMA
- U+FF0D FULLWIDTH HYPHEN-MINUS
. U+FF0E FULLWIDTH FULL STOP
/ U+FF0F FULLWIDTH SOLIDUS
: U+FF1A FULLWIDTH COLON
; U+FF1B FULLWIDTH SEMICOLON
? U+FF1F FULLWIDTH QUESTION MARK
@ U+FF20 FULLWIDTH COMMERCIAL AT
[ U+FF3B FULLWIDTH LEFT SQUARE BRACKET
\ U+FF3C FULLWIDTH REVERSE SOLIDUS
] U+FF3D FULLWIDTH RIGHT SQUARE BRACKET
_ U+FF3F FULLWIDTH LOW LINE
{ U+FF5B FULLWIDTH LEFT CURLY BRACKET
} U+FF5D FULLWIDTH RIGHT CURLY BRACKET
Halfwidth And Fullwidth Forms — Fullwidth brackets items: 2
⦅ U+FF5F FULLWIDTH LEFT WHITE PARENTHESIS
⦆ U+FF60 FULLWIDTH RIGHT WHITE PARENTHESIS
Halfwidth And Fullwidth Forms — Halfwidth CJK punctuation items: 4
。 U+FF61 HALFWIDTH IDEOGRAPHIC FULL STOP
「 U+FF62 HALFWIDTH LEFT CORNER BRACKET
」 U+FF63 HALFWIDTH RIGHT CORNER BRACKET
、 U+FF64 HALFWIDTH IDEOGRAPHIC COMMA
Halfwidth And Fullwidth Forms — Halfwidth Katakana variants items: 1
・ U+FF65 HALFWIDTH KATAKANA MIDDLE DOT
Aegean Numbers — Punctuation items: 3
𐄀 U+10100 AEGEAN WORD SEPARATOR LINE
𐄁 U+10101 AEGEAN WORD SEPARATOR DOT
𐄂 U+10102 AEGEAN CHECK MARK
Ugaritic — Punctuation items: 1
𐎟 U+1039F UGARITIC WORD DIVIDER
Old Persian — Punctuation items: 1
𐏐 U+103D0 OLD PERSIAN WORD DIVIDER
Caucasian Albanian — Punctuation items: 1
𐕯 U+1056F CAUCASIAN ALBANIAN CITATION MARK
Imperial Aramaic — Punctuation items: 1
𐡗 U+10857 IMPERIAL ARAMAIC SECTION SIGN
Phoenician — Punctuation items: 1
𐤟 U+1091F PHOENICIAN WORD SEPARATOR
Lydian — Punctuation items: 1
𐤿 U+1093F LYDIAN TRIANGULAR MARK
Kharoshthi — Punctuation items: 9
𐩐 U+10A50 KHAROSHTHI PUNCTUATION DOT
𐩑 U+10A51 KHAROSHTHI PUNCTUATION SMALL CIRCLE
𐩒 U+10A52 KHAROSHTHI PUNCTUATION CIRCLE
𐩓 U+10A53 KHAROSHTHI PUNCTUATION CRESCENT BAR
𐩔 U+10A54 KHAROSHTHI PUNCTUATION MANGALAM
𐩕 U+10A55 KHAROSHTHI PUNCTUATION LOTUS
𐩖 U+10A56 KHAROSHTHI PUNCTUATION DANDA
𐩗 U+10A57 KHAROSHTHI PUNCTUATION DOUBLE DANDA
𐩘 U+10A58 KHAROSHTHI PUNCTUATION LINES
Old South Arabian — Numbers items: 1
𐩿 U+10A7F OLD SOUTH ARABIAN NUMERIC INDICATOR
Manichaean — Punctuation items: 7
𐫰 U+10AF0 MANICHAEAN PUNCTUATION STAR
𐫱 U+10AF1 MANICHAEAN PUNCTUATION FLEURON
𐫲 U+10AF2 MANICHAEAN PUNCTUATION DOUBLE DOT WITHIN DOT
𐫳 U+10AF3 MANICHAEAN PUNCTUATION DOT WITHIN DOT
𐫴 U+10AF4 MANICHAEAN PUNCTUATION DOT
𐫵 U+10AF5 MANICHAEAN PUNCTUATION TWO DOTS
𐫶 U+10AF6 MANICHAEAN PUNCTUATION LINE FILLER
Avestan — Punctuation items: 7
𐬹 U+10B39 AVESTAN ABBREVIATION MARK
𐬺 U+10B3A TINY TWO DOTS OVER ONE DOT PUNCTUATION
𐬻 U+10B3B SMALL TWO DOTS OVER ONE DOT PUNCTUATION
𐬼 U+10B3C LARGE TWO DOTS OVER ONE DOT PUNCTUATION
𐬽 U+10B3D LARGE ONE DOT OVER TWO DOTS PUNCTUATION
𐬾 U+10B3E LARGE TWO RINGS OVER ONE RING PUNCTUATION
𐬿 U+10B3F LARGE ONE RING OVER TWO RINGS PUNCTUATION
Psalter Pahlavi — Punctuation items: 4
𐮙 U+10B99 PSALTER PAHLAVI SECTION MARK
𐮚 U+10B9A PSALTER PAHLAVI TURNED SECTION MARK
𐮛 U+10B9B PSALTER PAHLAVI FOUR DOTS WITH CROSS
𐮜 U+10B9C PSALTER PAHLAVI FOUR DOTS WITH DOT
Sogdian — Punctuation items: 5
𐽕 U+10F55 SOGDIAN PUNCTUATION TWO VERTICAL BARS
𐽖 U+10F56 SOGDIAN PUNCTUATION TWO VERTICAL BARS WITH DOTS
𐽗 U+10F57 SOGDIAN PUNCTUATION CIRCLE WITH DOT
𐽘 U+10F58 SOGDIAN PUNCTUATION TWO CIRCLES WITH DOTS
𐽙 U+10F59 SOGDIAN PUNCTUATION HALF CIRCLE WITH DOT
Brahmi — Punctuation items: 7
𑁇 U+11047 BRAHMI DANDA
𑁈 U+11048 BRAHMI DOUBLE DANDA
𑁉 U+11049 BRAHMI PUNCTUATION DOT
𑁊 U+1104A BRAHMI PUNCTUATION DOUBLE DOT
𑁋 U+1104B BRAHMI PUNCTUATION LINE
𑁌 U+1104C BRAHMI PUNCTUATION CRESCENT BAR
𑁍 U+1104D BRAHMI PUNCTUATION LOTUS
Kaithi — Various signs items: 2
𑂻 U+110BB KAITHI ABBREVIATION SIGN
𑂼 U+110BC KAITHI ENUMERATION SIGN
Kaithi — Punctuation items: 4
𑂾 U+110BE KAITHI SECTION MARK
𑂿 U+110BF KAITHI DOUBLE SECTION MARK
𑃀 U+110C0 KAITHI DANDA
𑃁 U+110C1 KAITHI DOUBLE DANDA
Chakma — Punctuation items: 4
𑅀 U+11140 CHAKMA SECTION MARK
𑅁 U+11141 CHAKMA DANDA
𑅂 U+11142 CHAKMA DOUBLE DANDA
𑅃 U+11143 CHAKMA QUESTION MARK
Mahajani — Punctuation items: 2
𑅴 U+11174 MAHAJANI ABBREVIATION SIGN
𑅵 U+11175 MAHAJANI SECTION MARK
Sharada — Punctuation items: 7
𑇅 U+111C5 SHARADA DANDA
𑇆 U+111C6 SHARADA DOUBLE DANDA
𑇇 U+111C7 SHARADA ABBREVIATION SIGN
𑇈 U+111C8 SHARADA SEPARATOR
𑇍 U+111CD SHARADA SUTRA MARK
𑇛 U+111DB SHARADA SIGN SIDDHAM
𑇝 U+111DD SHARADA CONTINUATION SIGN
Sharada — Section marks items: 2
𑇞 U+111DE SHARADA SECTION MARK-1
𑇟 U+111DF SHARADA SECTION MARK-2
Khojki — Punctuation items: 6
𑈸 U+11238 KHOJKI DANDA
𑈹 U+11239 KHOJKI DOUBLE DANDA
𑈺 U+1123A KHOJKI WORD SEPARATOR
𑈻 U+1123B KHOJKI SECTION MARK
𑈼 U+1123C KHOJKI DOUBLE SECTION MARK
𑈽 U+1123D KHOJKI ABBREVIATION SIGN
Multani — Punctuation items: 1
𑊩 U+112A9 MULTANI SECTION MARK
Newa — Punctuation items: 5
𑑋 U+1144B NEWA DANDA
𑑌 U+1144C NEWA DOUBLE DANDA
𑑍 U+1144D NEWA COMMA
𑑎 U+1144E NEWA GAP FILLER
𑑏 U+1144F NEWA ABBREVIATION SIGN
Newa — Various signs items: 2
𑑛 U+1145B NEWA PLACEHOLDER MARK
𑑝 U+1145D NEWA INSERTION SIGN
Tirhuta — Various signs items: 1
𑓆 U+114C6 TIRHUTA ABBREVIATION SIGN
Siddham — Head mark items: 1
𑗁 U+115C1 SIDDHAM SIGN SIDDHAM
Siddham — Punctuation items: 4
𑗂 U+115C2 SIDDHAM DANDA
𑗃 U+115C3 SIDDHAM DOUBLE DANDA
𑗄 U+115C4 SIDDHAM SEPARATOR DOT
𑗅 U+115C5 SIDDHAM SEPARATOR BAR
Siddham — Repetition mark items: 3
𑗆 U+115C6 SIDDHAM REPETITION MARK-1
𑗇 U+115C7 SIDDHAM REPETITION MARK-2
𑗈 U+115C8 SIDDHAM REPETITION MARK-3
Siddham — Terminal mark items: 1
𑗉 U+115C9 SIDDHAM END OF TEXT MARK
Siddham — Section marks items: 14
𑗊 U+115CA SIDDHAM SECTION MARK WITH TRIDENT AND U-SHAPED ORNAMENTS
𑗋 U+115CB SIDDHAM SECTION MARK WITH TRIDENT AND DOTTED CRESCENTS
𑗌 U+115CC SIDDHAM SECTION MARK WITH RAYS AND DOTTED CRESCENTS
𑗍 U+115CD SIDDHAM SECTION MARK WITH RAYS AND DOTTED DOUBLE CRESCENTS
𑗎 U+115CE SIDDHAM SECTION MARK WITH RAYS AND DOTTED TRIPLE CRESCENTS
𑗏 U+115CF SIDDHAM SECTION MARK DOUBLE RING
𑗐 U+115D0 SIDDHAM SECTION MARK DOUBLE RING WITH RAYS
𑗑 U+115D1 SIDDHAM SECTION MARK WITH DOUBLE CRESCENTS
𑗒 U+115D2 SIDDHAM SECTION MARK WITH TRIPLE CRESCENTS
𑗓 U+115D3 SIDDHAM SECTION MARK WITH QUADRUPLE CRESCENTS
𑗔 U+115D4 SIDDHAM SECTION MARK WITH SEPTUPLE CRESCENTS
𑗕 U+115D5 SIDDHAM SECTION MARK WITH CIRCLES AND RAYS
𑗖 U+115D6 SIDDHAM SECTION MARK WITH CIRCLES AND TWO ENCLOSURES
𑗗 U+115D7 SIDDHAM SECTION MARK WITH CIRCLES AND FOUR ENCLOSURES
Modi — Punctuation items: 3
𑙁 U+11641 MODI DANDA
𑙂 U+11642 MODI DOUBLE DANDA
𑙃 U+11643 MODI ABBREVIATION SIGN
Mongolian Supplement — Punctuation items: 13
𑙠 U+11660 MONGOLIAN BIRGA WITH ORNAMENT
𑙡 U+11661 MONGOLIAN ROTATED BIRGA
𑙢 U+11662 MONGOLIAN DOUBLE BIRGA WITH ORNAMENT
𑙣 U+11663 MONGOLIAN TRIPLE BIRGA WITH ORNAMENT
𑙤 U+11664 MONGOLIAN BIRGA WITH DOUBLE ORNAMENT
𑙥 U+11665 MONGOLIAN ROTATED BIRGA WITH ORNAMENT
𑙦 U+11666 MONGOLIAN ROTATED BIRGA WITH DOUBLE ORNAMENT
𑙧 U+11667 MONGOLIAN INVERTED BIRGA
𑙨 U+11668 MONGOLIAN INVERTED BIRGA WITH DOUBLE ORNAMENT
𑙩 U+11669 MONGOLIAN SWIRL BIRGA
𑙪 U+1166A MONGOLIAN SWIRL BIRGA WITH ORNAMENT
𑙫 U+1166B MONGOLIAN SWIRL BIRGA WITH DOUBLE ORNAMENT
𑙬 U+1166C MONGOLIAN TURNED SWIRL BIRGA WITH DOUBLE ORNAMENT
Ahom — Punctuation items: 3
𑜼 U+1173C AHOM SIGN SMALL SECTION
𑜽 U+1173D AHOM SIGN SECTION
𑜾 U+1173E AHOM SIGN RULAI
Dogra — Punctuation items: 1
𑠻 U+1183B DOGRA ABBREVIATION SIGN
Zanabazar Square — Head mark items: 4
𑨿 U+11A3F ZANABAZAR SQUARE INITIAL HEAD MARK
𑩀 U+11A40 ZANABAZAR SQUARE CLOSING HEAD MARK
𑩅 U+11A45 ZANABAZAR SQUARE INITIAL DOUBLE-LINED HEAD MARK
𑩆 U+11A46 ZANABAZAR SQUARE CLOSING DOUBLE-LINED HEAD MARK
Zanabazar Square — Punctuation items: 4
𑩁 U+11A41 ZANABAZAR SQUARE MARK TSHEG
𑩂 U+11A42 ZANABAZAR SQUARE MARK SHAD
𑩃 U+11A43 ZANABAZAR SQUARE MARK DOUBLE SHAD
𑩄 U+11A44 ZANABAZAR SQUARE MARK LONG TSHEG
Soyombo — Punctuation items: 3
𑪚 U+11A9A SOYOMBO MARK TSHEG
𑪛 U+11A9B SOYOMBO MARK SHAD
𑪜 U+11A9C SOYOMBO MARK DOUBLE SHAD
Soyombo — Head mark items: 3
𑪞 U+11A9E SOYOMBO HEAD MARK WITH MOON AND SUN AND TRIPLE FLAME
𑪟 U+11A9F SOYOMBO HEAD MARK WITH MOON AND SUN AND FLAME
𑪠 U+11AA0 SOYOMBO HEAD MARK WITH MOON AND SUN
Soyombo — Terminal mark items: 2
𑪡 U+11AA1 SOYOMBO TERMINAL MARK-1
𑪢 U+11AA2 SOYOMBO TERMINAL MARK-2
Bhaiksuki — Punctuation items: 3
𑱁 U+11C41 BHAIKSUKI DANDA
𑱂 U+11C42 BHAIKSUKI DOUBLE DANDA
𑱃 U+11C43 BHAIKSUKI WORD SEPARATOR
Bhaiksuki — Gap fillers items: 2
𑱄 U+11C44 BHAIKSUKI GAP FILLER-1
𑱅 U+11C45 BHAIKSUKI GAP FILLER-2
Marchen — Punctuation items: 2
𑱰 U+11C70 MARCHEN HEAD MARK
𑱱 U+11C71 MARCHEN MARK SHAD
Makasar — Punctuation items: 2
𑻷 U+11EF7 MAKASAR PASSIMBANG
𑻸 U+11EF8 MAKASAR END OF SECTION
Cuneiform Numbers And Punctuation — Punctuation items: 5
𒑰 U+12470 CUNEIFORM PUNCTUATION SIGN OLD ASSYRIAN WORD DIVIDER
𒑱 U+12471 CUNEIFORM PUNCTUATION SIGN VERTICAL COLON
𒑲 U+12472 CUNEIFORM PUNCTUATION SIGN DIAGONAL COLON
𒑳 U+12473 CUNEIFORM PUNCTUATION SIGN DIAGONAL TRICOLON
𒑴 U+12474 CUNEIFORM PUNCTUATION SIGN DIAGONAL QUADCOLON
Mro — Punctuation items: 2
𖩮 U+16A6E MRO DANDA
𖩯 U+16A6F MRO DOUBLE DANDA
Bassa Vah — Punctuation items: 1
𖫵 U+16AF5 BASSA VAH FULL STOP
Pahawh Hmong — Punctuation items: 6
𖬷 U+16B37 PAHAWH HMONG SIGN VOS THOM
𖬸 U+16B38 PAHAWH HMONG SIGN VOS TSHAB CEEB
𖬹 U+16B39 PAHAWH HMONG SIGN CIM CHEEM
𖬺 U+16B3A PAHAWH HMONG SIGN VOS THIAB
𖬻 U+16B3B PAHAWH HMONG SIGN VOS FEEM
𖭄 U+16B44 PAHAWH HMONG SIGN XAUS
Medefaidrin — Punctuation items: 2
𖺗 U+16E97 MEDEFAIDRIN COMMA
𖺘 U+16E98 MEDEFAIDRIN FULL STOP
Medefaidrin — Sign items: 2
𖺙 U+16E99 MEDEFAIDRIN SYMBOL AIVA
𖺚 U+16E9A MEDEFAIDRIN EXCLAMATION OH
Duployan — Chinook punctuation items: 1
𛲟 U+1BC9F DUPLOYAN PUNCTUATION CHINOOK FULL STOP
Sutton SignWriting — Punctuation items: 5
𝪇 U+1DA87 SIGNWRITING COMMA
𝪈 U+1DA88 SIGNWRITING FULL STOP
𝪉 U+1DA89 SIGNWRITING SEMICOLON
𝪊 U+1DA8A SIGNWRITING COLON
𝪋 U+1DA8B SIGNWRITING PARENTHESIS
Adlam — Punctuation items: 2
𞥞 U+1E95E ADLAM INITIAL EXCLAMATION MARK
𞥟 U+1E95F ADLAM INITIAL QUESTION MARK`;
// `regex` is global-flagged, so it keeps its scan position between calls.
// When the regex is defined globally, rewind it before scanning:
// regex.lastIndex = 0;
let m = regex.exec(str);
while (m !== null) {
  // A zero-width match leaves `lastIndex` at the match start; step it forward
  // by one so the next `exec` call cannot return the same empty match forever.
  if (regex.lastIndex === m.index) {
    regex.lastIndex += 1;
  }

  // `m` is the current result array: entry 0 is the full match and any
  // further entries are the capture groups, in order.
  for (const [groupIndex, match] of m.entries()) {
    console.log(`Found match, group ${groupIndex}: ${match}`);
  }

  // Fetch the next match (or `null` once the input is exhausted).
  m = regex.exec(str);
}
Please keep in mind that these code samples are automatically generated and are not guaranteed to work. If you find any syntax errors, feel free to submit a bug report. For a full regex reference for JavaScript, please visit: https://developer.mozilla.org/en/docs/Web/JavaScript/Guide/Regular_Expressions