From b5061b5f0fd2e3058af60038a47676ad26c671e6 Mon Sep 17 00:00:00 2001
From: Adam Tauber
Date: Tue, 9 Feb 2016 21:21:59 +0100
Subject: [PATCH] [fix] restrict wikipedia queries to the titles to avoid irrelevant results

---
 searx/engines/mediawiki.py | 6 ++++--
 1 file changed, 4 insertions(+), 2 deletions(-)

diff --git a/searx/engines/mediawiki.py b/searx/engines/mediawiki.py
index ff3fad2d7..26d3720d9 100644
--- a/searx/engines/mediawiki.py
+++ b/searx/engines/mediawiki.py
@@ -27,10 +27,10 @@ base_url = 'https://{language}.wikipedia.org/'
 search_postfix = 'w/api.php?action=query'\
     '&list=search'\
     '&{query}'\
-    '&srprop=timestamp'\
     '&format=json'\
     '&sroffset={offset}'\
-    '&srlimit={limit}'
+    '&srlimit={limit}'\
+    '&srwhat=nearmatch'  # search for a near match in the title
 
 
 # do search-request
@@ -74,6 +74,8 @@ def response(resp):
 
     # parse results
     for result in search_results['query']['search']:
+        if result.get('snippet', '').startswith('#REDIRECT'):
+            continue
         url = base_url.format(language=resp.search_params['language']) +\
             'wiki/' + quote(result['title'].replace(' ', '_').encode('utf-8'))
 