|
@@ -1,5 +1,6 @@
|
1
|
1
|
from urllib import urlencode
|
2
|
2
|
from lxml import html
|
|
3
|
+from cgi import escape
|
3
|
4
|
|
4
|
5
|
base_url = None
|
5
|
6
|
search_url = None
|
|
@@ -35,11 +36,11 @@ def response(resp):
|
35
|
36
|
if url.startswith('http://www.google.')\
|
36
|
37
|
or url.startswith('https://www.google.'):
|
37
|
38
|
continue
|
38
|
|
- title = link.text_content()
|
|
39
|
+ title = escape(link.text_content())
|
39
|
40
|
|
40
|
41
|
content = ''
|
41
|
42
|
if result.xpath('./p[@class="desc"]'):
|
42
|
|
- content = result.xpath('./p[@class="desc"]')[0].text_content()
|
|
43
|
+ content = escape(result.xpath('./p[@class="desc"]')[0].text_content())
|
43
|
44
|
|
44
|
45
|
results.append({'url': url, 'title': title, 'content': content})
|
45
|
46
|
|