import re
# Demo script: find every HTML-style tag in a sample navigation-menu snippet
# and print where each one was found.

# Matches one tag: "<", then any run of characters other than ">", then ">".
# NOTE: re.MULTILINE only changes the meaning of "^" and "$"; this pattern
# uses neither, so the flag has no effect on what is matched here.
regex = re.compile(r"<[^>]*>", flags=re.MULTILINE)

# Sample input: a list of <li><a href=...>label</a></li> menu entries, each
# separated by a whitespace-only line.
test_str = (" <li id=\"ctl00_LeftNavigation1_LeftMenu_ctl00_ListItem1\" class=\"starLink\"><a href='/CheatSheet.aspx'>Regex Cheat Sheet</a></li>\n"
" \n"
" <li id=\"ctl00_LeftNavigation1_LeftMenu_ctl02_ListItem1\"><a href='/Search.aspx'>Search</a></li>\n"
" \n"
" <li id=\"ctl00_LeftNavigation1_LeftMenu_ctl03_ListItem1\"><a href='/RETester.aspx'>Regex Tester</a></li>\n"
" \n"
" <li id=\"ctl00_LeftNavigation1_LeftMenu_ctl04_ListItem1\"><a href='/DisplayPatterns.aspx'>Browse Expressions</a></li>\n"
" \n"
" <li id=\"ctl00_LeftNavigation1_LeftMenu_ctl05_ListItem1\"><a href='/Add.aspx'>Add Regex</a></li>\n"
" \n"
" <li id=\"ctl00_LeftNavigation1_LeftMenu_ctl06_ListItem1\"><a href='/UserPatterns.aspx'>Manage My Expressions</a></li>\n"
" \n"
" <li id=\"ctl00_LeftNavigation1_LeftMenu_ctl07_ListItem1\"><a href='/Contributors.aspx'>Contributors</a></li>\n"
" \n"
" <li id=\"ctl00_LeftNavigation1_LeftMenu_ctl11_ListItem1\"><a href='/Resources.aspx'>Regex Resources</a></li>\n"
" \n"
" <li id=\"ctl00_LeftNavigation1_LeftMenu_ctl12_ListItem1\"><a href='/WebServices.asmx'>Web Services</a></li>\n"
" \n"
" <li id=\"ctl00_LeftNavigation1_LeftMenu_ctl13_ListItem1\"><a href='http://lakequincy.com/advertisers/publisherinfo/regExLib.aspx'>Advertise</a></li>\n"
" \n"
" <li id=\"ctl00_LeftNavigation1_LeftMenu_ctl14_ListItem1\"><a href='/Contact.aspx'>Contact Us</a></li>\n"
" \n"
" <li id=\"ctl00_LeftNavigation1_LeftMenu_ctl15_ListItem1\"><a href='/Register.aspx'>Register</a></li>\n"
" \n"
" <li id=\"ctl00_LeftNavigation1_LeftMenu_ctl16_ListItem1\" class=\"rssLink\"><a href='http://feeds.feedburner.com/Regexlibcom-RecentPatterns'>Recent Expressions</a></li>\n"
" \n"
" <li id=\"ctl00_LeftNavigation1_LeftMenu_ctl17_ListItem1\" class=\"rssLink\"><a href='http://feeds.feedburner.com/Regexlibcom-RecentComments'>Recent Comments</a></li>")

# finditer yields match objects lazily, in left-to-right order.
matches = regex.finditer(test_str)

# Report every match, numbered from 1, with its [start, end) offsets.
for match_num, match in enumerate(matches, start=1):
    print(f"Match {match_num} was found at {match.start()}-{match.end()}: {match.group()}")

    # Report each capture group of the current match. The pattern above
    # defines no capture groups, so match.groups() is empty and this loop
    # prints nothing; it only takes effect if groups are added to the pattern.
    for group_num, group in enumerate(match.groups(), start=1):
        print(f"Group {group_num} found at {match.start(group_num)}-{match.end(group_num)}: {group}")
# Please keep in mind that these code samples are automatically generated and
# are not guaranteed to work. If you find any syntax errors, feel free to
# submit a bug report. For a full regex reference for Python, please visit:
# https://docs.python.org/3/library/re.html