commit: 5d49c15f791c3b9297bb890b28643e6c50406f35
parent: a59d171385a0bfbff1b5df675ec78a88a0323543
Author: Adam Tauber <asciimoo@gmail.com>
Date: Thu, 29 Oct 2015 12:47:12 +0100
[fix] google engine - ignore new useless result type
Diffstat:
1 file changed, 6 insertions(+), 2 deletions(-)
diff --git a/searx/engines/google.py b/searx/engines/google.py
@@ -12,9 +12,12 @@ import re
from cgi import escape
from urllib import urlencode
from urlparse import urlparse, parse_qsl
-from lxml import html
+from lxml import html, etree
from searx.poolrequests import get
from searx.engines.xpath import extract_text, extract_url
+from searx.search import logger
+
+logger = logger.getChild('google engine')
# engine dependent config
@@ -225,8 +228,8 @@ def response(resp):
# parse results
for result in dom.xpath(results_xpath):
- title = extract_text(result.xpath(title_xpath)[0])
try:
+ title = extract_text(result.xpath(title_xpath)[0])
url = parse_url(extract_url(result.xpath(url_xpath), google_url), google_hostname)
parsed_url = urlparse(url, google_hostname)
@@ -269,6 +272,7 @@ def response(resp):
'content': content
})
except:
+ logger.debug('result parse error in:\n%s', etree.tostring(result, pretty_print=True))
continue
# parse suggestion