commit: d0427d9baebc5abeb9f09bac54196026e56498b8
parent: ad7c83e3f61885a2919fbc274a3b06edb6feca83
Author: asciimoo <asciimoo@gmail.com>
Date: Mon, 18 Nov 2013 16:47:20 +0100
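[fix] html escape: handle_entityref now appends the raw entity name instead of looking it up in htmlentitydefs.name2codepoint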
Diffstat:
1 file changed, 4 insertions(+), 3 deletions(-)
diff --git a/searx/utils.py b/searx/utils.py
@@ -1,5 +1,5 @@
from HTMLParser import HTMLParser
-import htmlentitydefs
+#import htmlentitydefs
import csv
import codecs
import cStringIO
@@ -17,8 +17,9 @@ class HTMLTextExtractor(HTMLParser):
self.result.append(unichr(codepoint))
def handle_entityref(self, name):
- codepoint = htmlentitydefs.name2codepoint[name]
- self.result.append(unichr(codepoint))
+ #codepoint = htmlentitydefs.name2codepoint[name]
+ #self.result.append(unichr(codepoint))
+ self.result.append(name)
def get_text(self):
return u''.join(self.result)