diff options
author | Alexandre Flament <alex@al-f.net> | 2021-02-21 14:08:02 +0100 |
---|---|---|
committer | GitHub <noreply@github.com> | 2021-02-21 14:08:02 +0100 |
commit | 9ace31c829daa545b7316db5ff9adf2c11ffa5cb (patch) | |
tree | 2a7247823a266aa97cc711bd52bdf54e18fc3278 /searx | |
parent | 640d6ce77877551361b0acd116a9cd7faf47c611 (diff) | |
parent | 1d0a32a2c536e05fb0a09d49f39359b2646b9b5f (diff) | |
download | searxng-9ace31c829daa545b7316db5ff9adf2c11ffa5cb.tar.gz searxng-9ace31c829daa545b7316db5ff9adf2c11ffa5cb.zip |
Merge pull request #2588 from datagram1/master
Added rumble.com video search engine.
Diffstat (limited to 'searx')
-rw-r--r-- | searx/engines/rumble.py | 81 | ||||
-rw-r--r-- | searx/settings.yml | 8 |
2 files changed, 89 insertions, 0 deletions
diff --git a/searx/engines/rumble.py b/searx/engines/rumble.py new file mode 100644 index 000000000..fc9e29d90 --- /dev/null +++ b/searx/engines/rumble.py @@ -0,0 +1,81 @@ +# SPDX-License-Identifier: AGPL-3.0-or-later +""" + Wikipedia (Web +""" +from urllib.parse import urlencode +from lxml import html +from datetime import datetime + +# about +from searx.utils import extract_text + +about = { + "website": 'https://rumble.com/', + "wikidata_id": 'Q104765127', + "official_api_documentation": 'https://help.rumble.com/', + "use_official_api": False, + "require_api_key": False, + "results": 'HTML', +} + +# engine dependent config +categories = ['videos'] +paging = True + +# search-url +base_url = 'https://rumble.com' +# https://rumble.com/search/video?q=searx&page=3 +search_url = base_url + '/search/video?{query}&page={pageno}' + +url_xpath = './/a[@class="video-item--a"]/@href' +thumbnail_xpath = './/img[@class="video-item--img"]/@src' +title_xpath = './/h3[@class="video-item--title"]' +published_date = './/time[@class="video-item--meta video-item--time"]/@datetime' +earned_xpath = './/span[@class="video-item--meta video-item--earned"]/@data-value' +views_xpath = './/span[@class="video-item--meta video-item--views"]/@data-value' +rumbles_xpath = './/span[@class="video-item--meta video-item--rumbles"]/@data-value' +author_xpath = './/div[@class="ellipsis-1"]' +length_xpath = './/span[@class="video-item--duration"]/@data-value' + + +def request(query, params): + params['url'] = search_url.format(pageno=params['pageno'], query=urlencode({'q': query})) + return params + + +def response(resp): + results = [] + dom = html.fromstring(resp.text) + results_dom = dom.xpath('//li[contains(@class, "video-listing-entry")]') + + if not results_dom: + return [] + + for result_dom in results_dom: + url = base_url + extract_text(result_dom.xpath(url_xpath)) + thumbnail = extract_text(result_dom.xpath(thumbnail_xpath)) + title = extract_text(result_dom.xpath(title_xpath)) + p_date = extract_text(result_dom.xpath(published_date)) + # fix offset date for line 644 webapp.py check + fixed_date = datetime.strptime(p_date, '%Y-%m-%dT%H:%M:%S%z') + earned = extract_text(result_dom.xpath(earned_xpath)) + views = extract_text(result_dom.xpath(views_xpath)) + rumbles = extract_text(result_dom.xpath(rumbles_xpath)) + author = extract_text(result_dom.xpath(author_xpath)) + length = extract_text(result_dom.xpath(length_xpath)) + if earned: + content = f"{views} views - {rumbles} rumbles - ${earned}" + else: + content = f"{views} views - {rumbles} rumbles" + + results.append({ + 'url': url, + 'title': title, + 'content': content, + 'author': author, + 'length': length, + 'template': 'videos.html', + 'publishedDate': fixed_date, + 'thumbnail': thumbnail, + }) + return results diff --git a/searx/settings.yml b/searx/settings.yml index b3a71e6a7..88ea27c75 100644 --- a/searx/settings.yml +++ b/searx/settings.yml @@ -1251,6 +1251,14 @@ engines: # number_of_results : 5 # timeout : 3.0 + - name : rumble + engine : rumble + shortcut : ru + base_url : https://rumble.com/ + paging : True + categories: videos + disabled : True + # Doku engine lets you access to any Doku wiki instance: # A public one or a privete/corporate one. # - name : ubuntuwiki |