logo

searx

My custom branch(es) on searx, a meta-search engine
commit: 5d49c15f791c3b9297bb890b28643e6c50406f35
parent: a59d171385a0bfbff1b5df675ec78a88a0323543
Author: Adam Tauber <asciimoo@gmail.com>
Date:   Thu, 29 Oct 2015 12:47:12 +0100

[fix] google engine - ignore new useless result type

Diffstat:

M searx/engines/google.py | 8 ++++++--
1 file changed, 6 insertions(+), 2 deletions(-)

diff --git a/searx/engines/google.py b/searx/engines/google.py
@@ -12,9 +12,12 @@ import re
 from cgi import escape
 from urllib import urlencode
 from urlparse import urlparse, parse_qsl
-from lxml import html
+from lxml import html, etree
 from searx.poolrequests import get
 from searx.engines.xpath import extract_text, extract_url
+from searx.search import logger
+
+logger = logger.getChild('google engine')
 
 # engine dependent config
@@ -225,8 +228,8 @@ def response(resp):
 
     # parse results
     for result in dom.xpath(results_xpath):
-        title = extract_text(result.xpath(title_xpath)[0])
         try:
+            title = extract_text(result.xpath(title_xpath)[0])
             url = parse_url(extract_url(result.xpath(url_xpath), google_url), google_hostname)
             parsed_url = urlparse(url, google_hostname)
 
@@ -269,6 +272,7 @@ def response(resp):
                                     'content': content
                                     })
         except:
+            logger.debug('result parse error in:\n%s', etree.tostring(result, pretty_print=True))
             continue
 
     # parse suggestion