import re
# Pattern for an opening (or self-closing) HTML-like tag. Capture groups:
#   1: last whitespace character between "<" and the tag name (if any)
#   2: tag name (lowercase ASCII letters and digits only)
#   3: last whitespace character after the tag name (if any)
#   4: attribute text (possibly empty)
#   5: last ">" or "/>" terminator consumed (if any)
#   6: last whitespace character directly before "/>" (if any)
# A closing tag such as "</div>" never matches because "/" cannot start the
# tag name.
# NOTE: re.MULTILINE only changes the meaning of "^" and "$"; the pattern uses
# neither as an anchor, so the flag has no effect here.
# NOTE(review): the "A-z" range in group 4 also spans the ASCII characters
# between "Z" and "a" ("[", "\", "]", "^", "_", "`"). It is probably a typo for
# "A-Z", but it is kept as-is so matching behavior does not change.
regex = re.compile(r"<(\s)*([a-z0-9]+)(\s)*([a-zA-z0-9%,;()=\"'?\.\-:_\[\]&{}\/\s]*)(>|(\s)*\/>)*", flags=re.MULTILINE)

# Sample HTML fragment the pattern is exercised against.
test_str = ("<div class=\"portal\" role=\"navigation\" id='p-tb'>\n"
"<h3>Toolbox</h3>\n"
"<div class=\"body\">\n"
"<ul>\n"
"<li id=\"t-whatlinkshere\"><a href=\"/wiki/Special:WhatLinksHere/Human_trafficking_in_Canada\" title=\"List of all English Wikipedia pages containing links to this page [j]\" accesskey=\"j\">What links here</a></li>\n"
"<li id=\"t-recentchangeslinked\"><a href=\"/wiki/Special:RecentChangesLinked/Human_trafficking_in_Canada\" title=\"Recent changes in pages linked from this page [k]\" accesskey=\"k\">Related changes</a></li>\n"
"<li id=\"t-upload\"><a href=\"/wiki/Wikipedia:File_Upload_Wizard\" title=\"Upload files [u]\" accesskey=\"u\">Upload file</a></li>\n"
"<li id=\"t-specialpages\"><a href=\"/wiki/Special:SpecialPages\" title=\"A list of all special pages [q]\" accesskey=\"q\">Special pages</a></li>\n"
"<li id=\"t-permalink\"><a href=\"/w/index.php?title=Human_trafficking_in_Canada&oldid=560794473\" title=\"Permanent link to this revision of the page\">Permanent link</a></li>\n"
"<li id=\"t-info\"><a href=\"/w/index.php?title=Human_trafficking_in_Canada&action=info\">Page information</a></li>\n"
"<li id=\"t-cite\"><a href=\"/w/index.php?title=Special:Cite&page=Human_trafficking_in_Canada&id=560794473\" title=\"Information on how to cite this page\">Cite this page</a></li> </ul>\n"
"</div>\n"
"</div>")

# finditer() yields non-overlapping matches lazily, in left-to-right order.
matches = regex.finditer(test_str)

# Report every match, then each of its capture groups (both numbered from 1).
for match_num, match in enumerate(matches, start=1):
    print(f"Match {match_num} was found at {match.start()}-{match.end()}: {match.group()}")
    # A group that did not take part in the match is reported as None with
    # start/end positions of -1.
    for group_num, group in enumerate(match.groups(), start=1):
        print(f"Group {group_num} found at {match.start(group_num)}-{match.end(group_num)}: {group}")
# Please keep in mind that these code samples are automatically generated and
# are not guaranteed to work. If you find any syntax errors, feel free to
# submit a bug report. For a full regex reference for Python, please visit:
# https://docs.python.org/3/library/re.html