# coding=utf8
# the above tag defines encoding for this document and is for Python 2.x compatibility
import re
# Demo script: find a reply header line, a blank line, and the run of
# ">"-quoted lines that follows it, then print every match and its groups.
#
# Pattern structure:
#   group 1 - the whole hit: one header line, an empty line, the quoted run
#   group 2 - one repetition of "quoted line(s) plus optional newline"
#   group 3 - a single quoted line: one or more ">", one whitespace char,
#             then the rest of that line
# NOTE: "\s" also matches "\n", so a bare ">" line is consumed together with
# the line that follows it in a single repetition of group 3.
# NOTE: groups 2 and 3 are repeated, so after a match they hold only the
# text of their final repetition.
regex = r"(.*\n\n((^>+\s{1}.*$)+\n?)+)"

# Sample input: a plain-text e-mail reply containing two levels of quoting.
test_str = ("and again\n\n"
    "2016-05-06 14:27 GMT+03:00 serg radzishevsky :\n\n"
    "> ok cool comment #2\n"
    ">\n"
    "> 2016-05-06 14:24 GMT+03:00 Sergey Radzishevsky :\n"
    ">\n"
    ">> first comment\n"
    ">>\n"
    ">> *Lorem Ipsum* is simply dummy text of the printing and typesetting\n"
    ">> industry. Lorem Ipsum has been the industry's standard dummy text ever\n"
    ">> since the 1500s, when an unknown printer took a galley of type and\n"
    ">> scrambled it to make a type specimen book. It has survived not only five\n"
    ">> centuries, but also the leap into electronic typesetting, remaining\n"
    ">> essentially unchanged. It was popularised in the 1960s with the release of\n"
    ">> Letraset sheets containing Lorem Ipsum passages, and more recently with\n"
    ">> desktop publishing software like Aldus PageMaker including versions of\n"
    ">> Lorem Ipsum\n"
    ">>\n"
    ">> --\n"
    ">> *Sergey Radzishevsky*\n"
    ">> \n"
    ">> [image: Facebook page] [image:\n"
    ">> Twitter account] [image: Dribbble\n"
    ">> account] [image: Github repository]\n"
    ">> [image: Linkedin account]\n"
    ">> \n"
    ">>\n"
    ">> *Skype*: * radzserg*\n"
    ">>\n"
    ">>\n"
    ">\n"
    ">\n"
    "> --\n"
    "> Best Regards\n"
    ">\n"
    "> Radzishevsky Sergey\n"
    ">\n"
    "> *Skype: radzserg*\n"
    ">\n")

# MULTILINE makes "^" and "$" anchor at every line boundary, which the
# per-line part of the pattern relies on. IGNORECASE is kept from the
# original call; the pattern contains no literal letters.
matches = re.finditer(regex, test_str, re.MULTILINE | re.IGNORECASE)

for matchNum, match in enumerate(matches, start=1):
    print ("Match {matchNum} was found at {start}-{end}: {match}".format(matchNum = matchNum, start = match.start(), end = match.end(), match = match.group()))

    # Capture groups are numbered from 1; group 0 (the whole match) was
    # already reported above.
    for groupNum, group in enumerate(match.groups(), start=1):
        print ("Group {groupNum} found at {start}-{end}: {group}".format(groupNum = groupNum, start = match.start(groupNum), end = match.end(groupNum), group = group))
# Note: for Python 2.7 compatibility, use ur"" to prefix the regex and u"" to prefix the test string and substitution.
# Please keep in mind that these code samples are automatically generated and
# are not guaranteed to work. If you find any syntax errors, feel free to
# submit a bug report. For a full regex reference for Python, please visit:
# https://docs.python.org/3/library/re.html