search.py 4.1KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114
  1. from searx.engines import (
  2. categories, engines, engine_shortcuts
  3. )
  4. from searx.languages import language_codes
  5. class Search(object):
  6. """Search information container"""
  7. def __init__(self, request):
  8. super(Search, self).__init__()
  9. self.query = None
  10. self.engines = []
  11. self.categories = []
  12. self.paging = False
  13. self.pageno = 1
  14. self.lang = 'all'
  15. if request.cookies.get('blocked_engines'):
  16. self.blocked_engines = request.cookies['blocked_engines'].split(',') # noqa
  17. else:
  18. self.blocked_engines = []
  19. self.results = []
  20. self.suggestions = []
  21. self.request_data = {}
  22. if request.cookies.get('language')\
  23. and request.cookies['language'] in (x[0] for x in language_codes):
  24. self.lang = request.cookies['language']
  25. if request.method == 'POST':
  26. self.request_data = request.form
  27. else:
  28. self.request_data = request.args
  29. # TODO better exceptions
  30. if not self.request_data.get('q'):
  31. raise Exception('noquery')
  32. self.query = self.request_data['q']
  33. pageno_param = self.request_data.get('pageno', '1')
  34. if not pageno_param.isdigit() or int(pageno_param) < 1:
  35. raise Exception('wrong pagenumber')
  36. self.pageno = int(pageno_param)
  37. self.parse_query()
  38. self.categories = []
  39. if self.engines:
  40. self.categories = list(set(engine['category']
  41. for engine in self.engines))
  42. else:
  43. for pd_name, pd in self.request_data.items():
  44. if pd_name.startswith('category_'):
  45. category = pd_name[9:]
  46. if not category in categories:
  47. continue
  48. self.categories.append(category)
  49. if not self.categories:
  50. cookie_categories = request.cookies.get('categories', '')
  51. cookie_categories = cookie_categories.split(',')
  52. for ccateg in cookie_categories:
  53. if ccateg in categories:
  54. self.categories.append(ccateg)
  55. if not self.categories:
  56. self.categories = ['general']
  57. for categ in self.categories:
  58. self.engines.extend({'category': categ,
  59. 'name': x.name}
  60. for x in categories[categ]
  61. if not x.name in self.blocked_engines)
  62. def parse_query(self):
  63. query_parts = self.query.split()
  64. modified = False
  65. if query_parts[0].startswith(':'):
  66. lang = query_parts[0][1:].lower()
  67. for lc in language_codes:
  68. lang_id, lang_name, country = map(str.lower, lc)
  69. if lang == lang_id\
  70. or lang_id.startswith(lang)\
  71. or lang == lang_name\
  72. or lang == country:
  73. self.lang = lang
  74. modified = True
  75. break
  76. elif query_parts[0].startswith('!'):
  77. prefix = query_parts[0][1:].replace('_', ' ')
  78. if prefix in engine_shortcuts\
  79. and not engine_shortcuts[prefix] in self.blocked_engines:
  80. modified = True
  81. self.engines.append({'category': 'none',
  82. 'name': engine_shortcuts[prefix]})
  83. elif prefix in engines\
  84. and not prefix in self.blocked_engines:
  85. modified = True
  86. self.engines.append({'category': 'none',
  87. 'name': prefix})
  88. elif prefix in categories:
  89. modified = True
  90. self.engines.extend({'category': prefix,
  91. 'name': engine.name}
  92. for engine in categories[prefix]
  93. if not engine in self.blocked_engines)
  94. if modified:
  95. self.query = self.query.replace(query_parts[0], '', 1).strip()
  96. self.parse_query()