Parcourir la source

[fix] remove html tags from qwant results

Adam Tauber il y a 8 ans
Parent
révision
c3dcebb778
1 fichier modifié avec 6 ajouts et 4 suppressions
  1. 6
    4
      searx/engines/qwant.py

+ 6
- 4
searx/engines/qwant.py Voir le fichier

10
  @parse       url, title, content
10
  @parse       url, title, content
11
 """
11
 """
12
 
12
 
13
-from urllib import urlencode
14
-from json import loads
15
 from datetime import datetime
13
 from datetime import datetime
14
+from json import loads
15
+from urllib import urlencode
16
+
17
+from searx.utils import html_to_text
16
 
18
 
17
 # engine dependent config
19
 # engine dependent config
18
 categories = None
20
 categories = None
66
     # parse results
68
     # parse results
67
     for result in res.get('items', {}):
69
     for result in res.get('items', {}):
68
 
70
 
69
-        title = result['title']
71
+        title = html_to_text(result['title'])
70
         res_url = result['url']
72
         res_url = result['url']
71
-        content = result['desc']
73
+        content = html_to_text(result['desc'])
72
 
74
 
73
         if category_to_keyword.get(categories[0], '') == 'web':
75
         if category_to_keyword.get(categories[0], '') == 'web':
74
             results.append({'title': title,
76
             results.append({'title': title,