mirror of
https://github.com/searxng/searxng.git
synced 2024-11-22 20:17:45 +01:00
11fc9913e9
use data from embedded JSON to improve results (e.g. real page title), add image format and source info (see PR #1567), improve paging logic (it now works)
133 lines
5.3 KiB
Python
133 lines
5.3 KiB
Python
# -*- coding: utf-8 -*-
|
|
from collections import defaultdict
|
|
import mock
|
|
from searx.engines import bing_images
|
|
from searx.testing import SearxTestCase
|
|
|
|
|
|
class TestBingImagesEngine(SearxTestCase):
    """Unit tests for the ``bing_images`` engine module.

    Covers the three entry points exercised below: ``request`` (outgoing
    URL and cookies), ``response`` (parsing of a result page) and
    ``_fetch_supported_languages`` (parsing of the market list).
    """

    def test_request(self):
        """Check the URL and cookies produced by ``bing_images.request``."""
        # NOTE: these are assigned on the engine module itself and are not
        # restored afterwards, so they stay in effect for later tests.
        bing_images.supported_languages = ['fr-FR', 'en-US']
        bing_images.language_aliases = {}

        query = 'test_query'
        dicto = defaultdict(dict)
        dicto['pageno'] = 1
        dicto['language'] = 'fr-FR'
        dicto['safesearch'] = 1
        dicto['time_range'] = ''

        # Exact locale match: 'fr-FR' is expected in the cookie as 'fr-fr'.
        params = bing_images.request(query, dicto)
        self.assertIn('url', params)
        self.assertIn(query, params['url'])
        self.assertIn('bing.com', params['url'])
        self.assertIn('SRCHHPGUSR', params['cookies'])
        self.assertIn('DEMOTE', params['cookies']['SRCHHPGUSR'])
        self.assertIn('_EDGE_S', params['cookies'])
        self.assertIn('fr-fr', params['cookies']['_EDGE_S'])

        # Bare language code: 'fr' is expected to yield the same 'fr-fr'.
        dicto['language'] = 'fr'
        params = bing_images.request(query, dicto)
        self.assertIn('_EDGE_S', params['cookies'])
        self.assertIn('fr-fr', params['cookies']['_EDGE_S'])

        # No language preference: 'all' is expected to yield 'en-us'.
        dicto['language'] = 'all'
        params = bing_images.request(query, dicto)
        self.assertIn('_EDGE_S', params['cookies'])
        self.assertIn('en-us', params['cookies']['_EDGE_S'])

    def test_response(self):
        """Check how ``bing_images.response`` handles bad, empty and real input."""
        # Arguments that are not response objects must raise AttributeError.
        self.assertRaises(AttributeError, bing_images.response, None)
        self.assertRaises(AttributeError, bing_images.response, [])
        self.assertRaises(AttributeError, bing_images.response, '')
        self.assertRaises(AttributeError, bing_images.response, '[]')

        # A document without any image markup yields no results.
        response = mock.Mock(text='<html></html>')
        self.assertEqual(bing_images.response(response), [])

        # Three "imgpt" entries spread over two lists; each one carries its
        # metadata as JSON in the anchor's "m" attribute plus an "img_info"
        # section with the format text and the source host.
        html = """
        <div id="mmComponent_images_1">
            <ul>
                <li>
                    <div>
                        <div class="imgpt">
                            <a m='{"purl":"page_url","murl":"img_url","turl":"thumb_url","t":"Page 1 title"}'>
                                <img src="" alt="alt text" />
                            </a>
                            <div class="img_info">
                                <span>1 x 1 - jpeg</span>
                                <a>1.example.org</a>
                            </div>
                        </div>
                        <div></div>
                    </div>
                    <div>
                        <div class="imgpt">
                            <a m='{"purl":"page_url2","murl":"img_url2","turl":"thumb_url2","t":"Page 2 title"}'>
                                <img src="" alt="alt text 2" />
                            </a>
                            <div class="img_info">
                                <span>2 x 2 - jpeg</span>
                                <a>2.example.org</a>
                            </div>
                        </div>
                    </div>
                </li>
            </ul>
            <ul>
                <li>
                    <div>
                        <div class="imgpt">
                            <a m='{"purl":"page_url3","murl":"img_url3","turl":"thumb_url3","t":"Page 3 title"}'>
                                <img src="" alt="alt text 3" />
                            </a>
                            <div class="img_info">
                                <span>3 x 3 - jpeg</span>
                                <a>3.example.org</a>
                            </div>
                        </div>
                    </div>
                </li>
            </ul>
        </div>
        """
        # The fixture is collapsed onto a single line before it is parsed.
        html = html.replace('\r\n', '').replace('\n', '').replace('\r', '')
        response = mock.Mock(text=html)
        results = bing_images.response(response)

        self.assertIsInstance(results, list)
        self.assertEqual(len(results), 3)

        # Only the first entry is checked field by field.
        self.assertEqual(results[0]['title'], 'Page 1 title')
        self.assertEqual(results[0]['url'], 'page_url')
        self.assertEqual(results[0]['content'], '')
        self.assertEqual(results[0]['thumbnail_src'], 'thumb_url')
        self.assertEqual(results[0]['img_src'], 'img_url')
        self.assertEqual(results[0]['img_format'], '1 x 1 - jpeg')
        self.assertEqual(results[0]['source'], '1.example.org')

    def test_fetch_supported_languages(self):
        """Check the locale codes read from the ``setmkt`` links of the region page."""
        html = """
        <div>
            <div id="region-section-content">
                <ul class="b_vList">
                    <li>
                        <a href="https://bing...&setmkt=de-DE&s...">Germany</a>
                        <a href="https://bing...&setmkt=nb-NO&s...">Norway</a>
                    </li>
                </ul>
                <ul class="b_vList">
                    <li>
                        <a href="https://bing...&setmkt=es-AR&s...">Argentina</a>
                    </li>
                </ul>
            </div>
        </div>
        """
        response = mock.Mock(text=html)
        languages = list(bing_images._fetch_supported_languages(response))

        self.assertEqual(len(languages), 3)
        self.assertIn('de-DE', languages)
        # The page advertises 'nb-NO'; the engine is expected to report it
        # as 'no-NO'.
        self.assertIn('no-NO', languages)
        self.assertIn('es-AR', languages)
|