X-Git-Url: https://git.sommitrealweird.co.uk/rss2maildir.git/blobdiff_plain/385c031fd3e0796988b35b1b09c9977f7b0ba04a..9337881574f8f9370fecabfeb9a52e4341568cd9:/rss2maildir.py?ds=inline

diff --git a/rss2maildir.py b/rss2maildir.py
index dd5b112..9473dd0 100755
--- a/rss2maildir.py
+++ b/rss2maildir.py
@@ -407,7 +407,7 @@ class HTML2Text(HTMLParser):
             quote = unicode( \
                 " ".join(self.curdata.encode("utf-8").strip().split()), \
                 "utf-8")
-            seperator = u'\n' + u' ' * self.indentlevel + u'> '
+            seperator = u'\n' + u' ' * self.indentlevel + u' '
             if len(self.text) > 0 and self.text[-1] != u'\n':
                 self.text = self.text + u'\n'
             self.text = self.text \
@@ -556,12 +556,23 @@ class HTML2Text(HTMLParser):
             self.opentags.append(u'p')
         self.curdata = self.curdata + data.decode("utf-8")
 
+    def handle_charref(self, name):
+        # HTMLParser strips the "&#" and ";" before calling us, so a decimal
+        # reference arrives as e.g. "62" and a hexadecimal one as "x3E".
+        try:
+            if name[:1] in ('x', 'X'):
+                entity = unichr(int(name[1:], 16))
+            else:
+                entity = unichr(int(name))
+        except (ValueError, OverflowError):
+            # Malformed or out-of-range reference: keep the literal text.
+            entity = u'&#' + name + u';'
+        self.curdata = self.curdata + entity
+
     def handle_entityref(self, name):
         entity = name
         if HTML2Text.entities.has_key(name):
             entity = HTML2Text.entities[name]
-        elif name[0] == "#":
-            entity = unichr(int(name[1:]))
         else:
             entity = "&" + name + ";"
 