12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667 |
- ## general mediawiki-engine (Web)
- #
- # @website websites built on mediawiki (https://www.mediawiki.org)
- # @provide-api yes (http://www.mediawiki.org/wiki/API:Search)
- #
- # @using-api yes
- # @results JSON
- # @stable yes
- # @parse url, title
- #
- # @todo content
-
- from json import loads
- from urllib import urlencode, quote
-
- # engine dependent config
- categories = ['general']
- language_support = True
- paging = True
- number_of_results = 1
-
- # search-url
- base_url = 'https://{language}.wikipedia.org/'
- search_url = base_url + 'w/api.php?action=query&list=search&{query}&srprop=timestamp&format=json&sroffset={offset}&srlimit={limit}' # noqa
-
-
- # do search-request
- def request(query, params):
- offset = (params['pageno'] - 1) * number_of_results
-
- if params['language'] == 'all':
- language = 'en'
- else:
- language = params['language'].split('_')[0]
-
- # write search-language back to params, required in response
- params['language'] = language
-
- params['url'] = search_url.format(query=urlencode({'srsearch': query}),
- offset=offset,
- limit=number_of_results,
- language=language)
-
- return params
-
-
- # get response from search-request
- def response(resp):
- results = []
-
- search_results = loads(resp.text)
-
- # return empty array if there are no results
- if not search_results.get('query', {}).get('search'):
- return []
-
- # parse results
- for result in search_results['query']['search']:
- url = base_url.format(language=resp.search_params['language']) + 'wiki/' + quote(result['title'].replace(' ', '_').encode('utf-8'))
-
- # append result
- results.append({'url': url,
- 'title': result['title'],
- 'content': ''})
-
- # return results
- return results
|