import re
# Splits folded "Received:" header text into clauses. Each match yields:
#   group 1 - the literal "Received:" when the clause opens a header, else None
#   group 2 - the clause keyword (from/by/with/id/via/for) or ";"
#   group 3 - the clause value, running up to the next keyword, ";",
#             "Received:" or the end of the input
#
# The pattern was originally written for PCRE with `\G` (continue where the
# previous match ended) and `\z` (end of input). `re` rejects `\G`, and `\Z`
# is the portable spelling of `\z`. Because every match ends directly in front
# of the next keyword (see the lookahead), `finditer` resumes exactly where a
# `\G` anchor would, so making "Received:" optional preserves the chaining.
# Without the `\G` anchor a keyword could otherwise be picked up in the middle
# of a word, hence the `\b` guards around the alphabetic keywords.
regex = re.compile(
    r"(Received:)?\s*"
    r"(\b(?:from|by|with|id|via|for)\b|;)\s*"
    # Lazy on purpose: stop at the first position where the lookahead holds.
    r"(\S+?(?:\s+\S+?)*?)\s*"
    r"(?=Received:|\b(?:by|with|id|via|for)\b|;|\Z)",
    # MULTILINE has no effect (the pattern has no ^ or $); kept so the
    # compiled object's flags stay as before.
    flags=re.MULTILINE,
)
# Sample input: ten folded "Received:" headers, one string per header below.
# Continuation lines start with a single space and headers are separated by a
# blank line, which the join supplies.
test_str = "\n\n".join((
    "Received: from VE1PR01MB5599.eurprd01.prod.exchangelabs.com\n"
    " (2603:10a6:7:7c::43) by HE1PR0102MB2714.eurprd01.prod.exchangelabs.com with\n"
    " HTTPS via HE1PR0402CA0054.EURPRD04.PROD.OUTLOOK.COM; Thu, 9 Jan 2020 16:34:13\n"
    " +0000",

    "Received: from VI1PR0102CA0029.eurprd01.prod.exchangelabs.com\n"
    " (2603:10a6:802::42) by VE1PR01MB5599.eurprd01.prod.exchangelabs.com\n"
    " (2603:10a6:803:11f::30) with Microsoft SMTP Server (version=TLS1_2,\n"
    " cipher=TLS_ECDHE_RSA_WITH_AES_256_GCM_SHA384) id 15.20.2602.12; Thu, 9 Jan\n"
    " 2020 16:34:13 +0000",

    "Received: from DB5EUR01FT034.eop-EUR01.prod.protection.outlook.com\n"
    " (2a01:111:f400:7e02::203) by VI1PR0102CA0029.outlook.office365.com\n"
    " (2603:10a6:802::42) with Microsoft SMTP Server (version=TLS1_2,\n"
    " cipher=TLS_ECDHE_RSA_WITH_AES_256_GCM_SHA384) id 15.20.2623.9 via Frontend\n"
    " Transport; Thu, 9 Jan 2020 16:34:13 +0000",

    "Received: from relay-out.ohc.cu (200.55.138.44) by\n"
    " DB5EUR01FT034.mail.protection.outlook.com (10.152.4.246) with Microsoft SMTP\n"
    " Server (version=TLS1_2, cipher=TLS_ECDHE_RSA_WITH_AES_256_GCM_SHA384) id\n"
    " 15.20.2623.9 via Frontend Transport; Thu, 9 Jan 2020 16:34:12 +0000",

    "Received: from relay-in.ohc.cu (relay-in.ohc.cu [127.0.0.1])\n"
    " by relay-out.ohc.cu (Postfix) with ESMTP id 69EA722DD\n"
    " for <some.email@some.domain>; Thu, 9 Jan 2020 11:29:43 -0500 (CST)",

    "Received: from relay-out.ohc.cu ([127.0.0.1])\n"
    " by relay-in.ohc.cu (relay-in.ohc.cu [127.0.0.1]) (amavisd-new, port 10024)\n"
    " with ESMTP id 7CZku5Y59vGC for <some.email@some.domain>;\n"
    " Thu, 9 Jan 2020 11:29:38 -0500 (CST)",

    "Received: from correo.patrimonio.ohc.cu (unknown [192.168.229.20])\n"
    " by relay-out.ohc.cu (Postfix) with ESMTP id B83BA22F5\n"
    " for <some.email@some.domain>; Thu, 9 Jan 2020 11:29:36 -0500 (CST)",

    "Received: from localhost (localhost.localdomain [127.0.0.1])\n"
    " by correo.patrimonio.ohc.cu (Postfix) with ESMTP id 65413232A001\n"
    " for <some.email@some.domain>; Thu, 9 Jan 2020 11:40:05 -0500 (CST)",

    "Received: from correo.patrimonio.ohc.cu ([127.0.0.1])\n"
    " by localhost (correo.patrimonio.ohc.cu [127.0.0.1]) (amavisd-new, port 10024)\n"
    " with ESMTP id hNMp-6lHHtzH for <some.email@some.domain>;\n"
    " Thu, 9 Jan 2020 11:40:05 -0500 (CST)",

    "Received: from correoweb.patrimonio.ohc.cu (unknown [192.168.229.23])\n"
    " by correo.patrimonio.ohc.cu (Postfix) with ESMTPA id EC62A232A00A;\n"
    " Thu, 9 Jan 2020 11:39:53 -0500 (CST)",
))
# Report every clause the pattern finds in the sample text: first the span and
# text of the whole match, then the span and text of each capture group.
matches = regex.finditer(test_str)
for match_num, match in enumerate(matches, start=1):
    print(f"Match {match_num} was found at {match.start()}-{match.end()}: {match.group()}")
    # Groups are numbered from 1; a group that took no part in the match is
    # reported by `re` as None with start/end of -1.
    for group_num, group in enumerate(match.groups(), start=1):
        print(f"Group {group_num} found at {match.start(group_num)}-{match.end(group_num)}: {group}")
# Note: these code samples are automatically generated and are not guaranteed to work. If you find any syntax errors, feel free to submit a bug report. For a full regex reference for Python, see https://docs.python.org/3/library/re.html