logo

searx

My custom branch(es) of searx, a meta-search engine
commit: 28493d41a327128762c6286a625d219e4b0b4e2e
parent: c706bea788d46bae8cb5cd71bc57abf71f1cb998
Author: Adam Tauber <adam.tauber@balabit.com>
Date:   Tue, 25 Aug 2015 13:12:51 +0200

[fix] handle missing url in twitter results

Diffstat:

M searx/engines/twitter.py | 8 ++++++--
1 file changed, 6 insertions(+), 2 deletions(-)

diff --git a/searx/engines/twitter.py b/searx/engines/twitter.py
@@ -55,10 +55,14 @@ def response(resp):
 
     # parse results
     for tweet in dom.xpath(results_xpath):
-        link = tweet.xpath(link_xpath)[0]
+        try:
+            link = tweet.xpath(link_xpath)[0]
+            content = extract_text(tweet.xpath(content_xpath)[0])
+        except Exception:
+            continue
+
         url = urljoin(base_url, link.attrib.get('href'))
         title = extract_text(tweet.xpath(title_xpath))
-        content = extract_text(tweet.xpath(content_xpath)[0])
 
         pubdate = tweet.xpath(timestamp_xpath)
         if len(pubdate) > 0: