ppf: strip extracted uris

This commit is contained in:
Mickaël Serneels
2019-05-13 23:31:35 +02:00
parent 225b76462c
commit e2122a27d9

1
ppf.py
View File

@@ -82,6 +82,7 @@ def extract_urls(html, url):
for a in soup.find_all('a', href=True):
item = a['href'].encode('utf-8') if isinstance(a['href'], unicode) else a['href']
item = item.strip()
if is_bad_url(item):
continue