瀏覽代碼

Merge pull request #780 from kvch/google-play-movies-fix

XPATH engines: Google Play Music, Habrahabr, Yandex
Adam Tauber 8 年之前
父節點
當前提交
75c58fd008
共有 2 個檔案被更改，包括 7 行新增、6 行刪除
  1. 2
    2
      searx/engines/yandex.py
  2. 5
    4
      searx/settings.yml

+ 2
- 2
searx/engines/yandex.py 查看文件

29
 base_url = 'https://yandex.{tld}/'
29
 base_url = 'https://yandex.{tld}/'
30
 search_url = 'search/?{query}&p={page}'
30
 search_url = 'search/?{query}&p={page}'
31
 
31
 
32
-results_xpath = '//div[@class="serp-item serp-item_plain_yes clearfix i-bem"]'
32
+results_xpath = '//li[@class="serp-item"]'
33
 url_xpath = './/h2/a/@href'
33
 url_xpath = './/h2/a/@href'
34
 title_xpath = './/h2/a//text()'
34
 title_xpath = './/h2/a//text()'
35
-content_xpath = './/div[@class="serp-item__text"]//text()'
35
+content_xpath = './/div[@class="text-container typo typo_text_m typo_line_m organic__text"]//text()'
36
 
36
 
37
 
37
 
38
 def request(query, params):
38
 def request(query, params):

+ 5
- 4
searx/settings.yml 查看文件

192
   - name : gigablast
192
   - name : gigablast
193
     engine : gigablast
193
     engine : gigablast
194
     shortcut : gb
194
     shortcut : gb
195
+    timeout : 3.0
195
     disabled: True
196
     disabled: True
196
 
197
 
197
   - name : gitlab
198
   - name : gitlab
250
     engine        : xpath
251
     engine        : xpath
251
     search_url    : https://play.google.com/store/search?q={query}&c=movies
252
     search_url    : https://play.google.com/store/search?q={query}&c=movies
252
     url_xpath     : //a[@class="title"]/@href
253
     url_xpath     : //a[@class="title"]/@href
253
-    title_xpath   : //a[@class="title"]
254
-    content_xpath : //a[@class="subtitle"]
254
+    title_xpath   : //a[@class="title"]/@title
255
+    content_xpath : //a[contains(@class, "subtitle")]
255
     categories : videos
256
     categories : videos
256
     shortcut : gpm
257
     shortcut : gpm
257
     disabled : True
258
     disabled : True
282
     engine : xpath
283
     engine : xpath
283
     paging : True
284
     paging : True
284
     search_url : https://habrahabr.ru/search/page{pageno}/?q={query}
285
     search_url : https://habrahabr.ru/search/page{pageno}/?q={query}
285
-    url_xpath : //div[@class="search_results"]//a[@class="post_title"]/@href
286
-    title_xpath : //div[@class="search_results"]//a[@class="post_title"]
286
+    url_xpath : //div[@class="search_results"]//a[contains(@class, "post__title_link")]/@href
287
+    title_xpath : //div[@class="search_results"]//a[contains(@class, "post__title_link")]
287
     content_xpath : //div[@class="search_results"]//div[contains(@class, "content")]
288
     content_xpath : //div[@class="search_results"]//div[contains(@class, "content")]
288
     categories : it
289
     categories : it
289
     timeout : 4.0
290
     timeout : 4.0