searxng/searx/engines/rumble.py

# SPDX-License-Identifier: AGPL-3.0-or-later
"""Rumble (Videos)

"""

from datetime import datetime
from urllib.parse import urlencode, urljoin

from lxml import html

from searx.utils import extract_text

# about

# Engine metadata.  The values below declare that results are obtained from
# the site's HTML pages, without the official API and without an API key.
about = {
    "website": 'https://rumble.com/',
    "wikidata_id": 'Q104765127',
    "official_api_documentation": 'https://help.rumble.com/',
    "use_official_api": False,
    "require_api_key": False,
    "results": 'HTML',
}

# engine dependent config
categories = ['videos']
# request() reads params["pageno"] and adds a ``page`` argument for pages > 1
paging = True

# search-url
# Site root (with trailing slash); request() appends the search path to it and
# response() uses it as the prefix of each result link.
base_url = 'https://rumble.com/'

# XPath expressions used by response().  Each one is evaluated relative to a
# single result node, hence the leading ".//".
# NOTE(review): the ``@class="..."`` tests are exact string matches on the
# whole class attribute, so any change in class order or extra classes in the
# site markup will make them stop matching.
url_xpath = './/a[@class="video-item--a"]/@href'
thumbnail_xpath = './/img[@class="video-item--img"]/@src'
title_xpath = './/h3[@class="video-item--title"]'
# NOTE(review): unlike its siblings this name has no ``_xpath`` suffix.
published_date = './/time[@class="video-item--meta video-item--time"]/@datetime'
earned_xpath = './/span[@class="video-item--meta video-item--earned"]/@data-value'
views_xpath = './/span[@class="video-item--meta video-item--views"]/@data-value'
rumbles_xpath = './/span[@class="video-item--meta video-item--rumbles"]/@data-value'
author_xpath = './/div[@class="ellipsis-1"]'
length_xpath = './/span[@class="video-item--duration"]/@data-value'


def request(query, params):
    """Store the Rumble video search URL for *query* in ``params['url']``.

    The ``page`` query argument is only sent when ``params["pageno"]`` is
    greater than 1.  The (mutated) ``params`` dict is returned.
    """
    page_number = params["pageno"]
    query_args = {"q": query, "page": page_number} if page_number > 1 else {"q": query}
    params['url'] = '{}search/video?{}'.format(base_url, urlencode(query_args))
    return params


def response(resp):
    """Parse a Rumble search page into a list of video result dicts.

    Every ``<li>`` whose class contains ``video-listing-entry`` yields one
    result rendered with the ``videos.html`` template.  An empty list is
    returned when the page contains no such entries.

    ``publishedDate`` is a ``datetime`` parsed from the entry's ``datetime``
    attribute, or ``None`` when that attribute is missing or not in the
    expected ``%Y-%m-%dT%H:%M:%S%z`` form, so that one odd entry does not
    discard all other results of the page.
    """
    results = []
    dom = html.fromstring(resp.text)

    for result_dom in dom.xpath('//li[contains(@class, "video-listing-entry")]'):
        # base_url already ends with "/", so plain concatenation with a
        # root-relative href ("/v123.html") would produce "//"; urljoin()
        # resolves relative and absolute hrefs alike.
        url = urljoin(base_url, extract_text(result_dom.xpath(url_xpath)) or '')
        thumbnail = extract_text(result_dom.xpath(thumbnail_xpath))
        title = extract_text(result_dom.xpath(title_xpath))

        p_date = extract_text(result_dom.xpath(published_date))
        try:
            # %z keeps the UTC offset, giving a timezone-aware datetime
            fixed_date = datetime.strptime(p_date, '%Y-%m-%dT%H:%M:%S%z')
        except (TypeError, ValueError):
            # no <time> element, or an unexpected timestamp format
            fixed_date = None

        earned = extract_text(result_dom.xpath(earned_xpath))
        views = extract_text(result_dom.xpath(views_xpath))
        rumbles = extract_text(result_dom.xpath(rumbles_xpath))
        author = extract_text(result_dom.xpath(author_xpath))
        length = extract_text(result_dom.xpath(length_xpath))

        # the earnings figure is only shown when the entry carries one
        content = f"{views} views - {rumbles} rumbles"
        if earned:
            content = f"{content} - ${earned}"

        results.append(
            {
                'url': url,
                'title': title,
                'content': content,
                'author': author,
                'length': length,
                'template': 'videos.html',
                'publishedDate': fixed_date,
                'thumbnail': thumbnail,
            }
        )
    return results
Added rumble.com video search engine. TODO video embedding. Update rumble.py some lines too long. Disable Rumble engine disabled : True PEP8 fix change line spacing 2021-02-19 16:25:24 +01:00			`# SPDX-License-Identifier: AGPL-3.0-or-later`
[mod] pylint all engines without PYLINT_SEARXNG_DISABLE_OPTION Signed-off-by: Markus Heiser <markus.heiser@darmarit.de> 2024-03-11 07:45:08 +01:00			`"""Rumble (Videos)`

Added rumble.com video search engine. TODO video embedding. Update rumble.py some lines too long. Disable Rumble engine disabled : True PEP8 fix change line spacing 2021-02-19 16:25:24 +01:00			`"""`
[mod] pylint all engines without PYLINT_SEARXNG_DISABLE_OPTION Signed-off-by: Markus Heiser <markus.heiser@darmarit.de> 2024-03-11 07:45:08 +01:00
			`from datetime import datetime`

Added rumble.com video search engine. TODO video embedding. Update rumble.py some lines too long. Disable Rumble engine disabled : True PEP8 fix change line spacing 2021-02-19 16:25:24 +01:00			`from urllib.parse import urlencode`
			`from lxml import html`

			`# about`
			`from searx.utils import extract_text`

			`about = {`
			`"website": 'https://rumble.com/',`
			`"wikidata_id": 'Q104765127',`
			`"official_api_documentation": 'https://help.rumble.com/',`
			`"use_official_api": False,`
			`"require_api_key": False,`
			`"results": 'HTML',`
			`}`

			`# engine dependent config`
			`categories = ['videos']`
			`paging = True`

			`# search-url`
[fix] rumble redirect 2023-09-14 12:08:38 +02:00			`base_url = 'https://rumble.com/'`
Added rumble.com video search engine. TODO video embedding. Update rumble.py some lines too long. Disable Rumble engine disabled : True PEP8 fix change line spacing 2021-02-19 16:25:24 +01:00
			`url_xpath = './/a[@class="video-item--a"]/@href'`
			`thumbnail_xpath = './/img[@class="video-item--img"]/@src'`
			`title_xpath = './/h3[@class="video-item--title"]'`
			`published_date = './/time[@class="video-item--meta video-item--time"]/@datetime'`
			`earned_xpath = './/span[@class="video-item--meta video-item--earned"]/@data-value'`
			`views_xpath = './/span[@class="video-item--meta video-item--views"]/@data-value'`
			`rumbles_xpath = './/span[@class="video-item--meta video-item--rumbles"]/@data-value'`
			`author_xpath = './/div[@class="ellipsis-1"]'`
			`length_xpath = './/span[@class="video-item--duration"]/@data-value'`


			`def request(query, params):`
[fix] rumble redirect 2023-09-14 12:08:38 +02:00			`args = {"q": query}`
			`if params["pageno"] > 1:`
			`args['page'] = params["pageno"]`
			`params['url'] = f'{base_url}search/video?{urlencode(args)}'`
Added rumble.com video search engine. TODO video embedding. Update rumble.py some lines too long. Disable Rumble engine disabled : True PEP8 fix change line spacing 2021-02-19 16:25:24 +01:00			`return params`


			`def response(resp):`
			`results = []`
			`dom = html.fromstring(resp.text)`
			`results_dom = dom.xpath('//li[contains(@class, "video-listing-entry")]')`

			`if not results_dom:`
			`return []`

			`for result_dom in results_dom:`
			`url = base_url + extract_text(result_dom.xpath(url_xpath))`
			`thumbnail = extract_text(result_dom.xpath(thumbnail_xpath))`
			`title = extract_text(result_dom.xpath(title_xpath))`
			`p_date = extract_text(result_dom.xpath(published_date))`
			`# fix offset date for line 644 webapp.py check`
			`fixed_date = datetime.strptime(p_date, '%Y-%m-%dT%H:%M:%S%z')`
			`earned = extract_text(result_dom.xpath(earned_xpath))`
			`views = extract_text(result_dom.xpath(views_xpath))`
			`rumbles = extract_text(result_dom.xpath(rumbles_xpath))`
			`author = extract_text(result_dom.xpath(author_xpath))`
			`length = extract_text(result_dom.xpath(length_xpath))`
			`if earned:`
			`content = f"{views} views - {rumbles} rumbles - ${earned}"`
			`else:`
			`content = f"{views} views - {rumbles} rumbles"`

[format.python] initial formatting of the python code This patch was generated by black [1]:: make format.python [1] https://github.com/psf/black Signed-off-by: Markus Heiser <markus.heiser@darmarit.de> 2021-12-27 09:26:22 +01:00			`results.append(`
			`{`
			`'url': url,`
			`'title': title,`
			`'content': content,`
			`'author': author,`
			`'length': length,`
			`'template': 'videos.html',`
			`'publishedDate': fixed_date,`
			`'thumbnail': thumbnail,`
			`}`
			`)`
Added rumble.com video search engine. TODO video embedding. Update rumble.py some lines too long. Disable Rumble engine disabled : True PEP8 fix change line spacing 2021-02-19 16:25:24 +01:00			`return results`