From d6dfada1a9c77cae13596c441f7d1cb1c2b30899 Mon Sep 17 00:00:00 2001
From: ta
Date: Sat, 13 Aug 2022 06:04:31 +0700
Subject: [PATCH] add neeva web engine

Neeva is "the world's first ad-free, private search engine" and uses data
from Apple, Bing, Yelp and "others". They claim to crawl "hundreds of
millions" of URLs a day
(https://twitter.com/Neeva/status/1536447373903335426).
---
 searx/settings.yml | 24 ++++++++++++++++++++++++
 1 file changed, 24 insertions(+)

diff --git a/searx/settings.yml b/searx/settings.yml
index ec03819a5..52b75082c 100644
--- a/searx/settings.yml
+++ b/searx/settings.yml
@@ -960,6 +960,30 @@ engines:
   #   collection: 'reviews'  # name of the db collection
   #   key: 'name'  # key in the collection to search for
 
+  - name: neeva
+    engine: xpath  # NOTE(review): selector class suffixes look build-generated - may go stale
+    shortcut: nv
+    search_url: https://neeva.com/search?q={query}&c=All&src=Pagination&page={pageno}{time_range}
+    results_xpath: //div[@class="web-index__component-2rKiM"] | //li[@class="web-rich-deep-links__deepLink-SIbD4"]
+    url_xpath: .//a[@class="lib-doc-title__link-1b9rC"]/@href | ./h2/a/@href
+    title_xpath: .//a[@class="lib-doc-title__link-1b9rC"] | ./h2/a  # same anchors as url_xpath, minus /@href
+    content_xpath: >
+      .//div[@class="lib-doc-snippet__component-3ewW6"]/text() |
+      .//div[@class="lib-doc-snippet__component-3ewW6"]/*[not(self::a)] |
+      ./p
+    content_html_to_text: true  # NOTE(review): confirm the xpath engine reads this key
+    suggestion_xpath: //span[@class="result-related-searches__link-2ho_u"]
+    paging: true  # search_url carries the page number as {pageno}
+    disabled: true
+    categories: [general, web]
+    timeout: 5.0
+    about:
+      website: https://neeva.com
+      official_api_documentation:  # empty value, loads as null
+      use_official_api: false
+      require_api_key: false
+      results: HTML
+
   - name: npm
     engine: json_engine
     paging: true