|
|
|
|
53
|
# parse results
|
53
|
# parse results
|
54
|
for result in dom.xpath(results_xpath):
|
54
|
for result in dom.xpath(results_xpath):
|
55
|
url = result.xpath(url_xpath)[0].text
|
55
|
url = result.xpath(url_xpath)[0].text
|
|
|
56
|
+ if not url.startswith('http://') and not url.startswith('https://'):
|
|
|
57
|
+ url = 'http://' + url
|
56
|
title = result.xpath(title_xpath)[0].text
|
58
|
title = result.xpath(title_xpath)[0].text
|
57
|
content = escape(result.xpath(content_xpath)[0].text)
|
59
|
content = escape(result.xpath(content_xpath)[0].text)
|
58
|
|
60
|
|