import re
def tst():
text = '''
<script>
'''
if proxi := re.findall(r"(?:<td\s[^>]*?><font\sclass\=spy14>(.*?)<script.*?\"\+(.*?)\)<\/script)", text):
for proxy, port in proxi:
yield f"{proxy}:{''.join(port)}"
if dtt := re.findall(r"<td colspan=1><font class\=spy1><font class\=spy14>(.*?)</font> (\d+[:]\d+) <font class\=spy5>([(]\d+ \w+ \w+[)])", text):
for date, time, taken in dtt:
yield f"{date} {' '.join([time, taken])}"
return None
return None
for proxy in tst():
print(proxy)
output that i get
51.155.10.0:8000
178.128.96.80:7497
98.162.96.41:4145
27-oct-2022 11:05 (49 mins ago)
27-oct-2022 11:04 (50 mins ago)
27-oct-2022 11:03 (51 mins ago)
so i use this regex below to capture group from output
(\w+[.]\w+[.]\w+[.]\w+[:]\w+)|(\w+.*)
i want the result like this, how to combine it from output?
157.245.247.84:7497 - 27-oct-2022 11:05 (49 mins ago)
184.190.137.213:8111 - 27-oct-2022 11:04 (50 mins ago)
202.149.89.67:7999 - 27-oct-2022 11:03 (51 mins ago)