import re
# Replace every <img ...> tag that carries a non-empty alt="..." attribute
# with the text of that attribute, leaving the rest of the markup untouched.
#
# Pattern breakdown:
#   <img[^>]*      the tag opener plus any attributes before alt (stays
#                  inside the tag because it cannot cross a '>')
#   alt=\"([^\"]+)\"   the alt attribute; group 1 captures its value
#   [^>]*>         any remaining attributes up to the closing '>'
#
# NOTE: re.MULTILINE only affects the '^' and '$' anchors; this pattern uses
# neither, so the flag has no effect on matching and is kept unchanged.
regex = re.compile(r"<img[^>]*alt=\"([^\"]+)\"[^>]*>", flags=re.MULTILINE)

# Sample input: HTML comment fragments, some containing emoticon <img> tags.
test_str = ("<span itemprop=\"description\"> <img src=\"//res.smzdm.com/images/emotions/30.png\" alt=\"[小怒]\" class=\"wp-smiley\"> <img src=\"//res.smzdm.com/images/emotions/30.png\" alt=\"[小怒]\" class=\"wp-smiley\"> <img src=\"//res.smzdm.com/images/emotions/30.png\" alt=\"[小怒]\" class=\"wp-smiley\"> 这文章百度哪里搬来的 </span>\n\n"
    "<span itemprop=\"description\"> <img src=\"//res.smzdm.com/images/emotions/36.png\" alt=\"[喜极而泣]\" class=\"wp-smiley\"> 年少无知看了那篇文章好奇买了4瓶 喝了一口差点吐出来 </span>\n\n"
    "<span itemprop=\"description\">国内咋就没厂商做点纯气泡水呢,成本应该不高吧,钱都让屈臣氏巴黎水赚去了 <img src=\"//res.smzdm.com/images/emotions/23.png\" alt=\"[皱眉]\" class=\"wp-smiley\"> </span>\n\n"
    "<span itemprop=\"description\">小时候就经常煲来喝,利尿排毒 <img src=\"//res.smzdm.com/images/emotions/45.png\" alt=\"[抽烟]\" class=\"wp-smiley\"> </span>\n\n"
    "<p class=\"p_content_166651051\"><span itemprop=\"description\">我喜欢香草味的,滑滑的感觉 </span></p>\n\n"
    "<p class=\"p_content_166650868\"><span itemprop=\"description\">我喝过好几箱,后来还回购了,再后来就喝不起了,太贵[皱眉] </span></p>")

# Replacement template: \g<1> inserts the captured alt text (group 1).
subst = r"\g<1>"

# Substitute every match in the sample; non-matching text passes through as-is.
result = regex.sub(subst, test_str)

# Only print when the substitution produced a non-empty string.
if result:
    print(result)
# Note: Please keep in mind that these code samples are automatically
# generated and are not guaranteed to work. If you find any syntax errors,
# feel free to submit a bug report. For a full regex reference for Python,
# please visit: https://docs.python.org/3/library/re.html