Ver código fonte

[fix] yahoo engine url extraction

Adam Tauber 11 anos atrás
pai
commit
ee1ffbc87f
2 arquivos alterados com 2 adições e 2 exclusões
  1. 1
    1
      searx/engines/yahoo.py
  2. 1
    1
      searx/engines/yahoo_news.py

+ 1
- 1
searx/engines/yahoo.py Ver arquivo

@@ -35,7 +35,7 @@ def response(resp):
 
     for result in dom.xpath(results_xpath):
         url_string = extract_url(result.xpath(url_xpath), search_url)
-        start = url_string.find('/RU=')+4
+        start = url_string.find('http', url_string.find('/RU=')+1)
         end = url_string.rfind('/RS')
         url = unquote(url_string[start:end])
         title = extract_text(result.xpath(title_xpath)[0])

+ 1
- 1
searx/engines/yahoo_news.py Ver arquivo

@@ -35,7 +35,7 @@ def response(resp):
 
     for result in dom.xpath(results_xpath):
         url_string = extract_url(result.xpath(url_xpath), search_url)
-        start = url_string.find('/RU=')+4
+        start = url_string.find('http', url_string.find('/RU=')+1)
         end = url_string.rfind('/RS')
         url = unquote(url_string[start:end])
         title = extract_text(result.xpath(title_xpath)[0])