Przeglądaj źródła

[fix] skip non-complete google news results

Adam Tauber 8 lat temu
rodzic
commit
108392f8da
1 zmieniony plik z 8 dodaniami i 5 usunięciami
  1. 8
    5
      searx/engines/google_news.py

+ 8
- 5
searx/engines/google_news.py Wyświetl plik

66
 
66
 
67
     # parse results
67
     # parse results
68
     for result in dom.xpath('//div[@class="g"]|//div[@class="g _cy"]'):
68
     for result in dom.xpath('//div[@class="g"]|//div[@class="g _cy"]'):
69
-        r = {
70
-            'url': result.xpath('.//div[@class="_cnc"]//a/@href')[0],
71
-            'title': ''.join(result.xpath('.//div[@class="_cnc"]//h3//text()')),
72
-            'content': ''.join(result.xpath('.//div[@class="st"]//text()')),
73
-        }
69
+        try:
70
+            r = {
71
+                'url': result.xpath('.//div[@class="_cnc"]//a/@href')[0],
72
+                'title': ''.join(result.xpath('.//div[@class="_cnc"]//h3//text()')),
73
+                'content': ''.join(result.xpath('.//div[@class="st"]//text()')),
74
+            }
75
+        except:
76
+            continue
74
 
77
 
75
         imgs = result.xpath('.//img/@src')
78
         imgs = result.xpath('.//img/@src')
76
         if len(imgs) and not imgs[0].startswith('data'):
79
         if len(imgs) and not imgs[0].startswith('data'):