mirror of https://github.com/searx/searx
[fix] restrict Wikipedia queries to titles to avoid irrelevant results
This commit is contained in:
parent
909424e1e5
commit
b5061b5f0f
|
@@ -27,10 +27,10 @@ base_url = 'https://{language}.wikipedia.org/'
|
||||||
search_postfix = 'w/api.php?action=query'\
|
search_postfix = 'w/api.php?action=query'\
|
||||||
'&list=search'\
|
'&list=search'\
|
||||||
'&{query}'\
|
'&{query}'\
|
||||||
'&srprop=timestamp'\
|
|
||||||
'&format=json'\
|
'&format=json'\
|
||||||
'&sroffset={offset}'\
|
'&sroffset={offset}'\
|
||||||
'&srlimit={limit}'
|
'&srlimit={limit}'\
|
||||||
|
'&srwhat=nearmatch' # search for a near match in the title
|
||||||
|
|
||||||
|
|
||||||
# do search-request
|
# do search-request
|
||||||
|
@@ -74,6 +74,8 @@ def response(resp):
|
||||||
|
|
||||||
# parse results
|
# parse results
|
||||||
for result in search_results['query']['search']:
|
for result in search_results['query']['search']:
|
||||||
|
if result.get('snippet', '').startswith('#REDIRECT'):
|
||||||
|
continue
|
||||||
url = base_url.format(language=resp.search_params['language']) +\
|
url = base_url.format(language=resp.search_params['language']) +\
|
||||||
'wiki/' + quote(result['title'].replace(' ', '_').encode('utf-8'))
|
'wiki/' + quote(result['title'].replace(' ', '_').encode('utf-8'))
|
||||||
|
|
||||||
|
|
Loading…
Reference in New Issue