commit: 4184cece4a0b2d04b45105e755492bfee5fa1a12
parent: 362c849797e2e6f0e232642c23744c47a75cdfd4
Author: Adam Tauber <asciimoo@gmail.com>
Date: Mon, 7 Sep 2015 23:13:04 +0200
[fix] duckduckgo unicode url - #419
Diffstat:
2 files changed, 5 insertions(+), 4 deletions(-)
diff --git a/searx/engines/duckduckgo.py b/searx/engines/duckduckgo.py
@@ -72,7 +72,7 @@ def response(resp):
# append result
results.append({'title': title,
'content': content,
- 'url': res_url.encode('utf8')})
+ 'url': res_url})
# return results
return results
diff --git a/searx/tests/engines/test_duckduckgo.py b/searx/tests/engines/test_duckduckgo.py
@@ -1,3 +1,4 @@
+# -*- coding: utf-8 -*-
from collections import defaultdict
import mock
from searx.engines import duckduckgo
@@ -30,7 +31,7 @@ class TestDuckduckgoEngine(SearxTestCase):
response = mock.Mock(text='<html></html>')
self.assertEqual(duckduckgo.response(response), [])
- html = """
+ html = u"""
<div class="results_links results_links_deep web-result">
<div class="icon_fav" style="display: block;">
<a rel="nofollow" href="https://www.test.com/">
@@ -39,7 +40,7 @@ class TestDuckduckgoEngine(SearxTestCase):
</a>
</div>
<div class="links_main links_deep"> <!-- This is the visible part -->
- <a rel="nofollow" class="large" href="http://this.should.be.the.link/">
+ <a rel="nofollow" class="large" href="http://this.should.be.the.link/ű">
This <b>is</b> <b>the</b> title
</a>
<div class="snippet"><b>This</b> should be the content.</div>
@@ -54,7 +55,7 @@ class TestDuckduckgoEngine(SearxTestCase):
self.assertEqual(type(results), list)
self.assertEqual(len(results), 1)
self.assertEqual(results[0]['title'], 'This is the title')
- self.assertEqual(results[0]['url'], 'http://this.should.be.the.link/')
+ self.assertEqual(results[0]['url'], u'http://this.should.be.the.link/ű')
self.assertEqual(results[0]['content'], 'This should be the content.')
html = """