mirror of https://github.com/searx/searx
Merge pull request #783 from kvch/time-range-search-year
add year support to engines which support it
This commit is contained in:
commit
e58949b76f
|
@ -33,7 +33,8 @@ time_range_string = '&qft=+filterui:age-lt{interval}'
|
||||||
thumb_url = "https://www.bing.com/th?id={ihk}"
|
thumb_url = "https://www.bing.com/th?id={ihk}"
|
||||||
time_range_dict = {'day': '1440',
|
time_range_dict = {'day': '1440',
|
||||||
'week': '10080',
|
'week': '10080',
|
||||||
'month': '43200'}
|
'month': '43200',
|
||||||
|
'year': '525600'}
|
||||||
|
|
||||||
# safesearch definitions
|
# safesearch definitions
|
||||||
safesearch_types = {2: 'STRICT',
|
safesearch_types = {2: 'STRICT',
|
||||||
|
|
|
@ -66,6 +66,9 @@ def _get_url(query, language, offset, time_range):
|
||||||
|
|
||||||
# do search-request
|
# do search-request
|
||||||
def request(query, params):
|
def request(query, params):
|
||||||
|
if params['time_range'] and params['time_range'] not in time_range_dict:
|
||||||
|
return params
|
||||||
|
|
||||||
offset = (params['pageno'] - 1) * 10 + 1
|
offset = (params['pageno'] - 1) * 10 + 1
|
||||||
|
|
||||||
if params['language'] == 'all':
|
if params['language'] == 'all':
|
||||||
|
|
|
@ -34,6 +34,9 @@ time_range_dict = {'day': 11,
|
||||||
|
|
||||||
# do search-request
|
# do search-request
|
||||||
def request(query, params):
|
def request(query, params):
|
||||||
|
if params['time_range'] and params['time_range'] not in time_range_dict:
|
||||||
|
return params
|
||||||
|
|
||||||
offset = (params['pageno'] - 1) * 24
|
offset = (params['pageno'] - 1) * 24
|
||||||
|
|
||||||
params['url'] = search_url.format(offset=offset,
|
params['url'] = search_url.format(offset=offset,
|
||||||
|
|
|
@ -41,6 +41,9 @@ content_xpath = './/a[@class="result__snippet"]'
|
||||||
|
|
||||||
# do search-request
|
# do search-request
|
||||||
def request(query, params):
|
def request(query, params):
|
||||||
|
if params['time_range'] and params['time_range'] not in time_range_dict:
|
||||||
|
return params
|
||||||
|
|
||||||
offset = (params['pageno'] - 1) * 30
|
offset = (params['pageno'] - 1) * 30
|
||||||
|
|
||||||
if params['language'] == 'all':
|
if params['language'] == 'all':
|
||||||
|
|
|
@ -34,7 +34,8 @@ paging = True
|
||||||
time_range_support = True
|
time_range_support = True
|
||||||
time_range_dict = {'day': 60 * 60 * 24,
|
time_range_dict = {'day': 60 * 60 * 24,
|
||||||
'week': 60 * 60 * 24 * 7,
|
'week': 60 * 60 * 24 * 7,
|
||||||
'month': 60 * 60 * 24 * 7 * 4}
|
'month': 60 * 60 * 24 * 7 * 4,
|
||||||
|
'year': 60 * 60 * 24 * 7 * 52}
|
||||||
|
|
||||||
|
|
||||||
def build_flickr_url(user_id, photo_id):
|
def build_flickr_url(user_id, photo_id):
|
||||||
|
|
|
@ -95,7 +95,8 @@ search_url = ('https://{hostname}' +
|
||||||
time_range_search = "&tbs=qdr:{range}"
|
time_range_search = "&tbs=qdr:{range}"
|
||||||
time_range_dict = {'day': 'd',
|
time_range_dict = {'day': 'd',
|
||||||
'week': 'w',
|
'week': 'w',
|
||||||
'month': 'm'}
|
'month': 'm',
|
||||||
|
'year': 'y'}
|
||||||
|
|
||||||
# other URLs
|
# other URLs
|
||||||
map_hostname_start = 'maps.google.'
|
map_hostname_start = 'maps.google.'
|
||||||
|
|
|
@ -10,10 +10,12 @@
|
||||||
@parse url, title, img_src
|
@parse url, title, img_src
|
||||||
"""
|
"""
|
||||||
|
|
||||||
|
from datetime import date, timedelta
|
||||||
from urllib import urlencode
|
from urllib import urlencode
|
||||||
from json import loads
|
from json import loads
|
||||||
from lxml import html
|
from lxml import html
|
||||||
|
|
||||||
|
|
||||||
# engine dependent config
|
# engine dependent config
|
||||||
categories = ['images']
|
categories = ['images']
|
||||||
paging = True
|
paging = True
|
||||||
|
@ -29,6 +31,7 @@ search_url = 'https://www.google.com/search'\
|
||||||
'&yv=2'\
|
'&yv=2'\
|
||||||
'&{search_options}'
|
'&{search_options}'
|
||||||
time_range_attr = "qdr:{range}"
|
time_range_attr = "qdr:{range}"
|
||||||
|
# Custom date-range value for the ``tbs`` search option, used when the
# requested range has no ``qdr`` shortcut in time_range_dict (i.e. 'year').
# Every field is a ``key:value`` pair, so ``cd_max`` needs its colon just
# like ``cd_min``; without it the end date is fused onto the key name.
time_range_custom_attr = "cdr:1,cd_min:{start},cd_max:{end}"
|
||||||
time_range_dict = {'day': 'd',
|
time_range_dict = {'day': 'd',
|
||||||
'week': 'w',
|
'week': 'w',
|
||||||
'month': 'm'}
|
'month': 'm'}
|
||||||
|
@ -36,7 +39,6 @@ time_range_dict = {'day': 'd',
|
||||||
|
|
||||||
# do search-request
|
# do search-request
|
||||||
def request(query, params):
|
def request(query, params):
|
||||||
|
|
||||||
search_options = {
|
search_options = {
|
||||||
'ijn': params['pageno'] - 1,
|
'ijn': params['pageno'] - 1,
|
||||||
'start': (params['pageno'] - 1) * number_of_results
|
'start': (params['pageno'] - 1) * number_of_results
|
||||||
|
@ -44,6 +46,12 @@ def request(query, params):
|
||||||
|
|
||||||
if params['time_range'] in time_range_dict:
|
if params['time_range'] in time_range_dict:
|
||||||
search_options['tbs'] = time_range_attr.format(range=time_range_dict[params['time_range']])
|
search_options['tbs'] = time_range_attr.format(range=time_range_dict[params['time_range']])
|
||||||
|
elif params['time_range'] == 'year':
|
||||||
|
now = date.today()
|
||||||
|
then = now - timedelta(days=365)
|
||||||
|
start = then.strftime('%m/%d/%Y')
|
||||||
|
end = now.strftime('%m/%d/%Y')
|
||||||
|
search_options['tbs'] = time_range_custom_attr.format(start=start, end=end)
|
||||||
|
|
||||||
if safesearch and params['safesearch']:
|
if safesearch and params['safesearch']:
|
||||||
search_options['safe'] = 'on'
|
search_options['safe'] = 'on'
|
||||||
|
|
|
@ -29,7 +29,8 @@ search_url = 'https://www.google.com/search'\
|
||||||
time_range_attr = "qdr:{range}"
|
time_range_attr = "qdr:{range}"
|
||||||
time_range_dict = {'day': 'd',
|
time_range_dict = {'day': 'd',
|
||||||
'week': 'w',
|
'week': 'w',
|
||||||
'month': 'm'}
|
'month': 'm',
|
||||||
|
'year': 'y'}
|
||||||
|
|
||||||
|
|
||||||
# do search-request
|
# do search-request
|
||||||
|
|
|
@ -77,6 +77,9 @@ def _get_language(params):
|
||||||
|
|
||||||
# do search-request
|
# do search-request
|
||||||
def request(query, params):
|
def request(query, params):
|
||||||
|
if params['time_range'] and params['time_range'] not in time_range_dict:
|
||||||
|
return params
|
||||||
|
|
||||||
offset = (params['pageno'] - 1) * 10 + 1
|
offset = (params['pageno'] - 1) * 10 + 1
|
||||||
language = _get_language(params)
|
language = _get_language(params)
|
||||||
|
|
||||||
|
|
|
@ -25,7 +25,8 @@ search_url = base_url + '?search_query={query}&page={page}'
|
||||||
time_range_url = '&sp=EgII{time_range}%253D%253D'
|
time_range_url = '&sp=EgII{time_range}%253D%253D'
|
||||||
time_range_dict = {'day': 'Ag',
|
time_range_dict = {'day': 'Ag',
|
||||||
'week': 'Aw',
|
'week': 'Aw',
|
||||||
'month': 'BA'}
|
'month': 'BA',
|
||||||
|
'year': 'BQ'}
|
||||||
|
|
||||||
embedded_url = '<iframe width="540" height="304" ' +\
|
embedded_url = '<iframe width="540" height="304" ' +\
|
||||||
'data-src="//www.youtube-nocookie.com/embed/{videoid}" ' +\
|
'data-src="//www.youtube-nocookie.com/embed/{videoid}" ' +\
|
||||||
|
|
|
@ -11,4 +11,7 @@
|
||||||
<option id="time-range-month" value="month" {{ "selected" if time_range=="month" else ""}}>
|
<option id="time-range-month" value="month" {{ "selected" if time_range=="month" else ""}}>
|
||||||
{{ _('Last month') }}
|
{{ _('Last month') }}
|
||||||
</option>
|
</option>
|
||||||
|
<option id="time-range-year" value="year" {{ "selected" if time_range=="year" else ""}}>
|
||||||
|
{{ _('Last year') }}
|
||||||
|
</option>
|
||||||
</select>
|
</select>
|
||||||
|
|
|
@ -23,6 +23,13 @@ class TestBingNewsEngine(SearxTestCase):
|
||||||
params = bing_news.request(query, dicto)
|
params = bing_news.request(query, dicto)
|
||||||
self.assertIn('en', params['url'])
|
self.assertIn('en', params['url'])
|
||||||
|
|
||||||
|
def test_no_url_in_request_year_time_range(self):
|
||||||
|
dicto = defaultdict(dict)
|
||||||
|
query = 'test_query'
|
||||||
|
dicto['time_range'] = 'year'
|
||||||
|
params = bing_news.request(query, dicto)
|
||||||
|
self.assertEqual({}, params['url'])
|
||||||
|
|
||||||
def test_response(self):
|
def test_response(self):
|
||||||
self.assertRaises(AttributeError, bing_news.response, None)
|
self.assertRaises(AttributeError, bing_news.response, None)
|
||||||
self.assertRaises(AttributeError, bing_news.response, [])
|
self.assertRaises(AttributeError, bing_news.response, [])
|
||||||
|
|
|
@ -7,8 +7,8 @@ from searx.testing import SearxTestCase
|
||||||
class TestDeviantartEngine(SearxTestCase):
|
class TestDeviantartEngine(SearxTestCase):
|
||||||
|
|
||||||
def test_request(self):
|
def test_request(self):
|
||||||
query = 'test_query'
|
|
||||||
dicto = defaultdict(dict)
|
dicto = defaultdict(dict)
|
||||||
|
query = 'test_query'
|
||||||
dicto['pageno'] = 0
|
dicto['pageno'] = 0
|
||||||
dicto['time_range'] = ''
|
dicto['time_range'] = ''
|
||||||
params = deviantart.request(query, dicto)
|
params = deviantart.request(query, dicto)
|
||||||
|
@ -16,6 +16,13 @@ class TestDeviantartEngine(SearxTestCase):
|
||||||
self.assertTrue(query in params['url'])
|
self.assertTrue(query in params['url'])
|
||||||
self.assertTrue('deviantart.com' in params['url'])
|
self.assertTrue('deviantart.com' in params['url'])
|
||||||
|
|
||||||
|
def test_no_url_in_request_year_time_range(self):
|
||||||
|
dicto = defaultdict(dict)
|
||||||
|
query = 'test_query'
|
||||||
|
dicto['time_range'] = 'year'
|
||||||
|
params = deviantart.request(query, dicto)
|
||||||
|
self.assertEqual({}, params['url'])
|
||||||
|
|
||||||
def test_response(self):
|
def test_response(self):
|
||||||
self.assertRaises(AttributeError, deviantart.response, None)
|
self.assertRaises(AttributeError, deviantart.response, None)
|
||||||
self.assertRaises(AttributeError, deviantart.response, [])
|
self.assertRaises(AttributeError, deviantart.response, [])
|
||||||
|
|
|
@ -19,6 +19,13 @@ class TestDuckduckgoEngine(SearxTestCase):
|
||||||
self.assertIn('duckduckgo.com', params['url'])
|
self.assertIn('duckduckgo.com', params['url'])
|
||||||
self.assertIn('ch-de', params['url'])
|
self.assertIn('ch-de', params['url'])
|
||||||
|
|
||||||
|
def test_no_url_in_request_year_time_range(self):
|
||||||
|
dicto = defaultdict(dict)
|
||||||
|
query = 'test_query'
|
||||||
|
dicto['time_range'] = 'year'
|
||||||
|
params = duckduckgo.request(query, dicto)
|
||||||
|
self.assertEqual({}, params['url'])
|
||||||
|
|
||||||
def test_response(self):
|
def test_response(self):
|
||||||
self.assertRaises(AttributeError, duckduckgo.response, None)
|
self.assertRaises(AttributeError, duckduckgo.response, None)
|
||||||
self.assertRaises(AttributeError, duckduckgo.response, [])
|
self.assertRaises(AttributeError, duckduckgo.response, [])
|
||||||
|
|
|
@ -46,6 +46,13 @@ class TestYahooEngine(SearxTestCase):
|
||||||
self.assertIn('en', params['cookies']['sB'])
|
self.assertIn('en', params['cookies']['sB'])
|
||||||
self.assertIn('en', params['url'])
|
self.assertIn('en', params['url'])
|
||||||
|
|
||||||
|
def test_no_url_in_request_year_time_range(self):
|
||||||
|
dicto = defaultdict(dict)
|
||||||
|
query = 'test_query'
|
||||||
|
dicto['time_range'] = 'year'
|
||||||
|
params = yahoo.request(query, dicto)
|
||||||
|
self.assertEqual({}, params['url'])
|
||||||
|
|
||||||
def test_response(self):
|
def test_response(self):
|
||||||
self.assertRaises(AttributeError, yahoo.response, None)
|
self.assertRaises(AttributeError, yahoo.response, None)
|
||||||
self.assertRaises(AttributeError, yahoo.response, [])
|
self.assertRaises(AttributeError, yahoo.response, [])
|
||||||
|
|
|
@ -17,6 +17,25 @@ class TestYoutubeNoAPIEngine(SearxTestCase):
|
||||||
self.assertIn(query, params['url'])
|
self.assertIn(query, params['url'])
|
||||||
self.assertIn('youtube.com', params['url'])
|
self.assertIn('youtube.com', params['url'])
|
||||||
|
|
||||||
|
def test_time_range_search(self):
|
||||||
|
dicto = defaultdict(dict)
|
||||||
|
query = 'test_query'
|
||||||
|
dicto['time_range'] = 'year'
|
||||||
|
params = youtube_noapi.request(query, dicto)
|
||||||
|
self.assertIn('&sp=EgIIBQ%253D%253D', params['url'])
|
||||||
|
|
||||||
|
dicto['time_range'] = 'month'
|
||||||
|
params = youtube_noapi.request(query, dicto)
|
||||||
|
self.assertIn('&sp=EgIIBA%253D%253D', params['url'])
|
||||||
|
|
||||||
|
dicto['time_range'] = 'week'
|
||||||
|
params = youtube_noapi.request(query, dicto)
|
||||||
|
self.assertIn('&sp=EgIIAw%253D%253D', params['url'])
|
||||||
|
|
||||||
|
dicto['time_range'] = 'day'
|
||||||
|
params = youtube_noapi.request(query, dicto)
|
||||||
|
self.assertIn('&sp=EgIIAg%253D%253D', params['url'])
|
||||||
|
|
||||||
def test_response(self):
|
def test_response(self):
|
||||||
self.assertRaises(AttributeError, youtube_noapi.response, None)
|
self.assertRaises(AttributeError, youtube_noapi.response, None)
|
||||||
self.assertRaises(AttributeError, youtube_noapi.response, [])
|
self.assertRaises(AttributeError, youtube_noapi.response, [])
|
||||||
|
|
Loading…
Reference in New Issue