xpath engine: bug fix

This commit is contained in:
dalf 2013-12-30 22:34:35 +01:00
parent 9eddcdb8e4
commit 664c039b38

View File

@@ -28,7 +28,7 @@ def extract_url(xpath_results):
url = xpath_results[0].attrib.get('href') url = xpath_results[0].attrib.get('href')
else: else:
url = xpath_results.attrib.get('href') url = xpath_results.attrib.get('href')
if not url.startswith('http://') or not url.startswith('https://'): if not url.startswith('http://') and not url.startswith('https://'):
url = 'http://'+url url = 'http://'+url
parsed_url = urlparse(url) parsed_url = urlparse(url)
if not parsed_url.netloc: if not parsed_url.netloc: