|
@@ -66,11 +66,14 @@ def response(resp):
|
66
|
66
|
|
67
|
67
|
# parse results
|
68
|
68
|
for result in dom.xpath('//div[@class="g"]|//div[@class="g _cy"]'):
|
69
|
|
- r = {
|
70
|
|
- 'url': result.xpath('.//div[@class="_cnc"]//a/@href')[0],
|
71
|
|
- 'title': ''.join(result.xpath('.//div[@class="_cnc"]//h3//text()')),
|
72
|
|
- 'content': ''.join(result.xpath('.//div[@class="st"]//text()')),
|
73
|
|
- }
|
|
69
|
+ try:
|
|
70
|
+ r = {
|
|
71
|
+ 'url': result.xpath('.//div[@class="_cnc"]//a/@href')[0],
|
|
72
|
+ 'title': ''.join(result.xpath('.//div[@class="_cnc"]//h3//text()')),
|
|
73
|
+ 'content': ''.join(result.xpath('.//div[@class="st"]//text()')),
|
|
74
|
+ }
|
|
75
|
+ except:
|
|
76
|
+ continue
|
74
|
77
|
|
75
|
78
|
imgs = result.xpath('.//img/@src')
|
76
|
79
|
if len(imgs) and not imgs[0].startswith('data'):
|