From e2122a27d9d97a8bca1363da00fefd20986706f8 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Micka=C3=ABl=20Serneels?= Date: Mon, 13 May 2019 23:31:35 +0200 Subject: [PATCH] ppf: strip extracted uris --- ppf.py | 1 + 1 file changed, 1 insertion(+) diff --git a/ppf.py b/ppf.py index 999fa56..699c0c8 100755 --- a/ppf.py +++ b/ppf.py @@ -82,6 +82,7 @@ def extract_urls(html, url): for a in soup.find_all('a', href=True): item = a['href'].encode('utf-8') if isinstance(a['href'], unicode) else a['href'] + item = item.strip() if is_bad_url(item): continue