1
0
mirror of https://github.com/searxng/searxng.git synced 2024-11-22 12:10:11 +01:00

[fix] yahoo url mods

This commit is contained in:
Adam Tauber 2014-02-27 10:59:39 +01:00
parent 8c8d9d10cb
commit 4627788834

View File

@@ -1,6 +1,7 @@
#!/usr/bin/env python
from urllib import urlencode
+from urlparse import unquote
from lxml import html
from searx.engines.xpath import extract_text, extract_url
@@ -33,7 +34,10 @@ def response(resp):
dom = html.fromstring(resp.text)
for result in dom.xpath(results_xpath):
-url = extract_url(result.xpath(url_xpath), search_url)
+url_string = extract_url(result.xpath(url_xpath), search_url)
+start = url_string.find('/RU=')+4
+end = url_string.rfind('/RS')
+url = unquote(url_string[start:end])
title = extract_text(result.xpath(title_xpath)[0])
content = extract_text(result.xpath(content_xpath)[0])
results.append({'url': url, 'title': title, 'content': content})