1
0
mirror of https://github.com/searxng/searxng.git synced 2024-11-18 02:10:12 +01:00
searxng/searx/tests/engines/test_duckduckgo.py

92 lines
3.7 KiB
Python
Raw Normal View History

2015-09-07 23:13:04 +02:00
# -*- coding: utf-8 -*-
2015-02-02 17:55:39 +01:00
from collections import defaultdict
import mock
from searx.engines import duckduckgo
from searx.testing import SearxTestCase
class TestDuckduckgoEngine(SearxTestCase):
2015-02-02 17:55:39 +01:00
def test_request(self):
query = 'test_query'
dicto = defaultdict(dict)
dicto['pageno'] = 1
dicto['language'] = 'fr_FR'
params = duckduckgo.request(query, dicto)
self.assertIn('url', params)
self.assertIn(query, params['url'])
self.assertIn('duckduckgo.com', params['url'])
self.assertIn('fr-fr', params['url'])
dicto['language'] = 'all'
params = duckduckgo.request(query, dicto)
self.assertIn('en-us', params['url'])
def test_response(self):
self.assertRaises(AttributeError, duckduckgo.response, None)
self.assertRaises(AttributeError, duckduckgo.response, [])
self.assertRaises(AttributeError, duckduckgo.response, '')
self.assertRaises(AttributeError, duckduckgo.response, '[]')
response = mock.Mock(text='<html></html>')
self.assertEqual(duckduckgo.response(response), [])
2015-09-07 23:13:04 +02:00
html = u"""
2015-02-02 17:55:39 +01:00
<div class="results_links results_links_deep web-result">
<div class="icon_fav" style="display: block;">
<a rel="nofollow" href="https://www.test.com/">
<img width="16" height="16" alt=""
src="/i/www.test.com.ico" style="visibility: visible;" name="i15" />
</a>
</div>
<div class="links_main links_deep"> <!-- This is the visible part -->
2015-09-07 23:13:04 +02:00
<a rel="nofollow" class="large" href="http://this.should.be.the.link/ű">
2015-02-02 17:55:39 +01:00
This <b>is</b> <b>the</b> title
</a>
<div class="snippet"><b>This</b> should be the content.</div>
<div class="url">
http://this.should.be.the.link/
</div>
</div>
</div>
"""
response = mock.Mock(text=html)
results = duckduckgo.response(response)
self.assertEqual(type(results), list)
self.assertEqual(len(results), 1)
self.assertEqual(results[0]['title'], 'This is the title')
2015-09-07 23:13:04 +02:00
self.assertEqual(results[0]['url'], u'http://this.should.be.the.link/ű')
2015-02-02 17:55:39 +01:00
self.assertEqual(results[0]['content'], 'This should be the content.')
html = """
<div class="results_links results_links_deep web-result">
<div class="icon_fav" style="display: block;">
</div>
<div class="links_main links_deep"> <!-- This is the visible part -->
<div class="snippet"><b>This</b> should be the content.</div>
<div class="url">
http://this.should.be.the.link/
</div>
</div>
</div>
<div class="results_links results_links_deep web-result">
<div class="icon_fav" style="display: block;">
<img width="16" height="16" alt=""
src="/i/www.test.com.ico" style="visibility: visible;" name="i15" />
</div>
<div class="links_main links_deep"> <!-- This is the visible part -->
<a rel="nofollow" class="large" href="">
This <b>is</b> <b>the</b> title
</a>
<div class="snippet"><b>This</b> should be the content.</div>
<div class="url">
http://this.should.be.the.link/
</div>
</div>
</div>
"""
response = mock.Mock(text=html)
results = duckduckgo.response(response)
self.assertEqual(type(results), list)
self.assertEqual(len(results), 0)