logo

searx

My custom branche(s) on searx, a meta-search engine
commit: e467a24843b62ff444b20e81a7b22b0cc5783a9e
parent: a0037313ea1a3810aea50c6597c8a36eaebdd259
Author: asciimoo <asciimoo@gmail.com>
Date:   Thu, 17 Oct 2013 00:27:25 +0200

[enh] stackoverflow added

Diffstat:

Asearx/engines/stackoverflow.py25+++++++++++++++++++++++++
1 file changed, 25 insertions(+), 0 deletions(-)

diff --git a/searx/engines/stackoverflow.py b/searx/engines/stackoverflow.py @@ -0,0 +1,25 @@ +from urllib import quote +from lxml import html +from urlparse import urljoin + +base_url = 'http://stackoverflow.com/' +search_url = base_url+'search?q=' + +def request(query, params): + global search_url + query = quote(query.replace(' ', '+'), safe='+') + params['url'] = search_url + query + return params + + +def response(resp): + global base_url + results = [] + dom = html.fromstring(resp.text) + for result in dom.xpath('//div[@class="question-summary search-result"]'): + link = result.xpath('.//div[@class="result-link"]//a')[0] + url = urljoin(base_url, link.attrib.get('href')) + title = ' '.join(link.xpath('.//text()')) + content = ' '.join(result.xpath('.//div[@class="excerpt"]//text()')) + results.append({'url': url, 'title': title, 'content': content}) + return results