123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384 |
- """
- general mediawiki-engine (Web)
- @website websites built on mediawiki (https://www.mediawiki.org)
- @provide-api yes (http://www.mediawiki.org/wiki/API:Search)
- @using-api yes
- @results JSON
- @stable yes
- @parse url, title
- @todo content
- """
- from json import loads
- from string import Formatter
- from urllib import urlencode, quote
- # engine dependent config
- categories = ['general']
- language_support = True
- paging = True
- number_of_results = 1
- # search-url
- base_url = 'https://{language}.wikipedia.org/'
- search_url = base_url + 'w/api.php?action=query'\
- '&list=search'\
- '&{query}'\
- '&srprop=timestamp'\
- '&format=json'\
- '&sroffset={offset}'\
- '&srlimit={limit}' # noqa
- # do search-request
- def request(query, params):
- offset = (params['pageno'] - 1) * number_of_results
- string_args = dict(query=urlencode({'srsearch': query}),
- offset=offset,
- limit=number_of_results)
- format_strings = list(Formatter().parse(base_url))
- if params['language'] == 'all':
- language = 'en'
- else:
- language = params['language'].split('_')[0]
- if len(format_strings) > 1:
- string_args['language'] = language
- # write search-language back to params, required in response
- params['language'] = language
- params['url'] = search_url.format(**string_args)
- return params
- # get response from search-request
- def response(resp):
- results = []
- search_results = loads(resp.text)
- # return empty array if there are no results
- if not search_results.get('query', {}).get('search'):
- return []
- # parse results
- for result in search_results['query']['search']:
- url = base_url.format(language=resp.search_params['language']) +\
- 'wiki/' + quote(result['title'].replace(' ', '_').encode('utf-8'))
- # append result
- results.append({'url': url,
- 'title': result['title'],
- 'content': ''})
- # return results
- return results
|