logo

searx

My custom branch(es) of searx, a meta-search engine.
git clone https://hacktivis.me/git/searx.git
commit: 576d37f256649b570a9c8591a795acd85ac499bc
parent 16d6e758d73ed5b369a4cf70830b5ebf0d0196ba
Author: a01200356 <a01200356@itesm.mx>
Date:   Sun,  3 Jan 2016 15:58:01 -0600

[fix] unescape htmlentities in wolframalpha_noapi's answer

Diffstat:

M searx/engines/wolframalpha_noapi.py | 7 ++++++-
M searx/settings.yml                  | 3 ++-
2 files changed, 8 insertions(+), 2 deletions(-)

diff --git a/searx/engines/wolframalpha_noapi.py b/searx/engines/wolframalpha_noapi.py
@@ -12,6 +12,7 @@ from re import search, sub
 from json import loads
 from urllib import urlencode
 from lxml import html
+import HTMLParser

 # search-url
 url = 'http://www.wolframalpha.com/'
@@ -62,7 +63,11 @@ def response(resp):
         # extract answer from json
         answer = line[line.find('{'):line.rfind('}')+1]
         answer = loads(answer.encode('unicode-escape'))
-        answer = answer['stringified'].decode('unicode-escape')
+        answer = answer['stringified']
+
+        # clean plaintext answer
+        h = HTMLParser.HTMLParser()
+        answer = h.unescape(answer.decode('unicode-escape'))
         answer = sub(r'\\', '', answer)

         results.append({'answer': answer})
diff --git a/searx/settings.yml b/searx/settings.yml
@@ -305,9 +305,10 @@ engines:
     # You can use the engine using the official stable API, but you need an API key
     # See : http://products.wolframalpha.com/api/
     #    engine : wolframalpha_api
-    #    api_key: '5952JX-X52L3VKWT8' # required!
+    #    api_key: '' # required!
     engine : wolframalpha_noapi
     timeout: 6.0
+    disabled : True

 #The blekko technology and team have joined IBM Watson! -> https://blekko.com/
 #  - name : blekko images