From f56649e3a9fd6f6b0dd4febe1d2fb377ad0bc528 Mon Sep 17 00:00:00 2001 From: asciimoo Date: Sun, 20 Oct 2013 11:12:10 +0200 Subject: [PATCH] [enh] deviantart engine added --- searx/engines/deviantart.py | 29 +++++++++++++++++++++++++++++ 1 file changed, 29 insertions(+) create mode 100644 searx/engines/deviantart.py diff --git a/searx/engines/deviantart.py b/searx/engines/deviantart.py new file mode 100644 index 000000000..c46a19a63 --- /dev/null +++ b/searx/engines/deviantart.py @@ -0,0 +1,29 @@ +from urllib import urlencode +from lxml import html +from urlparse import urljoin + +categories = ['images'] + +base_url = 'https://www.deviantart.com/' +search_url = base_url+'search?' + +def request(query, params): + global search_url + params['url'] = search_url + urlencode({'q': query}) + return params + + +def response(resp): + global base_url + results = [] + if resp.status_code == 302: + return results + dom = html.fromstring(resp.text) + for result in dom.xpath('//div[contains(@class, "tt-a tt-fh")]'): + link = result.xpath('.//a[contains(@class, "thumb")]')[0] + url = urljoin(base_url, link.attrib.get('href')) + title_links = result.xpath('.//span[@class="details"]//a[contains(@class, "t")]') + title = ''.join(title_links[0].xpath('.//text()')) + content = html.tostring(link)+'
'+link.attrib.get('title') + results.append({'url': url, 'title': title, 'content': content}) + return results