import re
# Pattern used to drop the leading label of a host name: it finds a dot,
# captures the text up to the next dot, then captures the remainder, e.g.
# "www.example.com" -> ("example", "com"). Written as a raw string so that
# "\." is not treated as an (invalid) string escape, and compiled once so the
# loop does not repeat the pattern lookup.
_PREFIX_RE = re.compile(r'\.(.+?)\.(.+)')

for domain in all_data:
    # Extract the host part: remove the scheme, then cut at the first "/".
    # Both calls leave the string unchanged when the substring is absent,
    # so no membership checks are needed beforehand.
    domain = domain.replace('https://', '').replace('http://', '')
    domain = domain.split('/')[0]
    # Strip the prefix (e.g. "www."). Hosts that do not contain the
    # dot-text-dot shape, such as "example.com", do not match and are
    # printed unchanged.
    match = _PREFIX_RE.search(domain)
    if match:
        domain = '.'.join(match.groups())
    print(domain)
For further actions, you may consider blocking this person and/or reporting abuse
Top comments (0)