import re
regex = re.compile(r"(1(\s|-)?)?(\+\d{1,3}\s?)?((\(\d{3}\)\s?)|(\d{3})(\s|-?))(\d{3}(\s|-?))(\d{4})(\s?(([E|e]xt[:|.|]?)|x|X)(\s?\d+))?", flags=re.MULTILINE)
test_str = ("/* Regular local phone number (XXX) XXX-XXXX */\n"
"1231231231\n"
"123-1231231\n"
"123123-1231\n"
"123-123 1231\n"
"123 123-1231\n"
"123-123-1231\n"
"(123)123-1231\n"
"(123)123 1231\n"
"(123) 123-1231\n"
"(123) 123 1231\n"
"1(212)2231141\n"
"1 232 442 1123\n"
"1-233-223-4433\n"
"12232234433\n"
"1(732) 1131131\n\n"
"/* International codes +XXX (XXX) XXX-XXXX */\n"
"+99 1234567890\n"
"+991234567890\n\n"
"/* Extensions (XXX) XXX-XXXX Ext. XXX... */\n"
"1234567890 Ext 1123123\n"
"1234567890Ext 1123123\n"
"1234567890 Ext1123123\n"
"1234567890Ext1123123\n\n"
"1234567890 Ext: 1123123\n"
"1234567890Ext: 1123123\n"
"1234567890 Ext:1123123\n"
"1234567890Ext:1123123\n\n"
"1234567890 Ext. 1123123\n"
"1234567890Ext. 1123123\n"
"1234567890 Ext.1123123\n"
"1234567890Ext.1123123\n\n"
"1234567890 ext 1123123\n"
"1234567890ext 1123123\n"
"1234567890 ext1123123\n"
"1234567890ext1123123\n\n"
"1234567890 ext: 1123123\n"
"1234567890ext: 1123123\n"
"1234567890 ext:1123123\n"
"1234567890ext:1123123\n\n"
"1234567890 X 1123123\n"
"1234567890X1123123\n"
"1234567890X 1123123\n"
"1234567890 X1123123\n"
"1234567890 x 1123123\n"
"1234567890x1123123\n"
"1234567890 x1123123\n"
"1234567890x 1123123")
matches = regex.finditer(test_str)
for match_num, match in enumerate(matches, start=1):
print(f"Match {match_num} was found at {match.start()}-{match.end()}: {match.group()}")
for group_num, group in enumerate(match.groups(), start=1):
print(f"Group {group_num} found at {match.start(group_num)}-{match.end(group_num)}: {group}")
Please keep in mind that these code samples are automatically generated and are not guaranteed to work. If you find any syntax errors, feel free to submit a bug report. For a full regex reference for Python, please visit: https://docs.python.org/3/library/re.html