From 210e59c68c4817e2734e7db4a87a5bb6212150b2 Mon Sep 17 00:00:00 2001
From: james-still <107592590+james-still@users.noreply.github.com>
Date: Thu, 28 Jul 2022 20:45:07 +0100
Subject: [PATCH] Add engine for Emojipedia (#3278)

---
 searx/engines/emojipedia.py | 78 +++++++++++++++++++++++++++++++++++++
 searx/settings.yml          |  6 +++
 2 files changed, 84 insertions(+)
 create mode 100644 searx/engines/emojipedia.py

diff --git a/searx/engines/emojipedia.py b/searx/engines/emojipedia.py
new file mode 100644
index 00000000..5a26ca2c
--- /dev/null
+++ b/searx/engines/emojipedia.py
@@ -0,0 +1,78 @@
+# SPDX-License-Identifier: AGPL-3.0-or-later
+"""
+ Emojipedia
+
+ Scrapes the HTML search results page of https://emojipedia.org.
+"""
+
+from urllib.parse import urlencode, urljoin
+from lxml import html
+
+from searx import logger
+from searx.utils import (
+    eval_xpath_list,
+    eval_xpath_getindex,
+    extract_text,
+)
+
+logger = logger.getChild('Emojipedia engine')
+
+about = {
+    "website": 'https://emojipedia.org',
+    "wikidata_id": None,
+    "official_api_documentation": None,
+    "use_official_api": False,
+    "require_api_key": False,
+    "results": 'HTML',
+}
+
+categories = []
+paging = False
+time_range_support = False
+
+base_url = 'https://emojipedia.org'
+search_url = base_url + '/search/?{query}'
+
+
+def request(query, params):
+    """Store the Emojipedia search URL for ``query`` in ``params['url']``.
+
+    Returns the same ``params`` dict.
+    """
+    params['url'] = search_url.format(
+        query=urlencode({'q': query}),
+    )
+    return params
+
+
+def response(resp):
+    """Parse the search page in ``resp.text`` into a list of result dicts.
+
+    Each result has the keys ``url``, ``title`` and ``content``.
+    """
+    results = []
+
+    dom = html.fromstring(resp.text)
+
+    for result in eval_xpath_list(dom, "//ol[@class='search-results']/li"):
+
+        extracted_desc = extract_text(eval_xpath_getindex(result, './/p', 0))
+
+        # Stop as soon as the 'no results' placeholder text shows up.
+        if 'No results found.' in extracted_desc:
+            break
+
+        link = eval_xpath_getindex(result, './/h2/a', 0)
+
+        href = link.attrib.get('href')
+        if not href:
+            # Without an href there is nothing to link to; skip the entry.
+            continue
+
+        results.append({
+            'url': urljoin(base_url, href),
+            'title': extract_text(link),
+            'content': extracted_desc,
+        })
+
+    return results
diff --git a/searx/settings.yml b/searx/settings.yml
index cc955311..5560eb7e 100644
--- a/searx/settings.yml
+++ b/searx/settings.yml
@@ -378,6 +378,12 @@ engines:
       require_api_key: false
       results: HTML
 
+  - name: emojipedia
+    engine: emojipedia
+    timeout: 4.0
+    shortcut: em
+    disabled: True
+
 #  - name : elasticsearch
 #    shortcut : es
 #    engine : elasticsearch