# coding=utf8
# the above tag defines encoding for this document and is for Python 2.x compatibility
import re
# Pattern flagging "junk" search terms. A line is matched when it:
#   - contains a run of 5+ digits,
#   - starts with a punctuation character (, . \ ' - ? * ( @ ^ = / % "),
#   - contains < > [ ] or ;,
#   - contains ".html" or ".php",
#   - starts with a "d.d" decimal, a backslash, or is wrapped in %...%,
#   - contains dimension-like numbers ("25x25", "123.456", "123. 456", "123 456"),
#   - ends with "x", starts with "0" followed by letters, or is 50+ chars long.
#
# NOTE: Python's `re` has no POSIX bracket classes. `[[:space:]]` is parsed as
# the character set "[:space" followed by a literal "]" (and raises a
# FutureWarning about nested sets), so it never matches whitespace. `\s` is
# the equivalent whitespace class in Python.
regex = r"(.*\d{5,}.*)|(^(\,|\.|\\|\'|\-|\?|\*|\(|\@|\^|\=|\/|\%|\").*)|(.*(\<|\>|\[|\]|\;).*)|(.*(\.html|\.php).*)|^(\d\.\d)|(^\\.*)|(^\%.*\%)|(\d{1,3}(((x|\.|\.\s){1,2})|\s)\d{1,3})|.*x$|^0[a-z]*|.{50,}"

# Sample input: one candidate term per line (matched with re.MULTILINE below).
test_str = ("<script>alert('hai');</script>\n"
            "0.8 \n"
            "003902\n"
            ",eja kerja\n"
            ".akeup\n"
            "081320266690\n"
            "1 set meja kursi\n"
            "0elan\n"
            "meja makan\n"
            "100 meja\n"
            "12 cm\n"
            "10023995\n"
            "]\n"
            "\"abcd\"\n"
            "\\yj magnolia\n"
            "%m087%\n"
            "'t. shower set kris prem rev wht ptss-0211-5w \n"
            "-tangga/kamar-mandi/1kvigy-jual-title-deck-karpet-anti-licin-bath-mat-anti-slip\n"
            "? sarapan✅ lunch crew✅ snack crew✅ video on process undangan ? roundown ✅ backdrops✅ photo booth✅ documentation ✅ rooms hotel ? catering ? panggung ? opening speech ? flag dance ✅ door prizes? seragam ? cue card ?. d . ,\n"
            "?meja?\n"
            "'merlott mylo set meja makan\n"
            "*\"tangga\"*\n"
            "@meja\n"
            "(u/6)\n"
            "*晶杯子\n"
            "/*meja*/\n"
            "/%meja\n"
            "====\n"
            "^meja^\n"
            "14 pcs radiator cup tester ( top quality ) alat tes kebocoran radiator \n"
            "120x200x35 cm jty202 ubah lokasi produk hanya bisa di ambil di lippo plaza kupang (informa) verified brand linotela dikirim oleh ruparupa detail produk\n"
            "640 × 640gambar mungkin memiliki hak cipta. pelajari lebih lanjut kuncibengkel\n"
            "%meja\n"
            "%mp18.html\n"
            "100x\n"
            "25x25\n"
            "250x250\n"
            "123. 456\n"
            "123.456\n"
            "123 456")

# MULTILINE makes ^ and $ anchor at every line boundary, so each sample line
# is evaluated independently.
matches = re.finditer(regex, test_str, re.MULTILINE)

for matchNum, match in enumerate(matches, start=1):
    print ("Match {matchNum} was found at {start}-{end}: {match}".format(matchNum = matchNum, start = match.start(), end = match.end(), match = match.group()))

    # Group 0 is the whole match (printed above); capture groups are 1-based.
    # Groups that did not participate report position -1 and value None.
    for groupNum in range(1, len(match.groups()) + 1):
        print ("Group {groupNum} found at {start}-{end}: {group}".format(groupNum = groupNum, start = match.start(groupNum), end = match.end(groupNum), group = match.group(groupNum)))
# Note: for Python 2.7 compatibility, use ur"" to prefix the regex and u"" to prefix the test string and substitution.
# Please keep in mind that these code samples are automatically generated and are not guaranteed to work. If you find any syntax errors, feel free to submit a bug report. For a full regex reference for Python, please visit: https://docs.python.org/3/library/re.html