changeset 2014 | e6d297dcf7aa |
parent 1990 | fea8bdb43992 |
child 2029 | 1f276091b42a |
--- a/app/soc/logic/cleaning.py Wed Mar 25 22:42:35 2009 +0000
+++ b/app/soc/logic/cleaning.py Thu Mar 26 12:19:33 2009 +0000
@@ -352,6 +352,7 @@
     sanitizer = feedparser._HTMLSanitizer('utf-8')
     sanitizer.feed(content)
     content = sanitizer.output()
+    content = content.decode('utf-8')
     content = content.strip().replace('\r\n', '\n')
 
     return content