1.1 --- a/parser.py Tue Dec 18 23:06:19 2012 +0100
1.2 +++ b/parser.py Wed Dec 19 00:15:50 2012 +0100
1.3 @@ -40,6 +40,7 @@
1.4 import re
1.5 import sys
1.6 import operator
1.7 +import htmlentitydefs
1.8
1.9 URL_SCHEMES = ("http", "https", "ftp", "mailto")
1.10
1.11 @@ -486,10 +487,9 @@
1.12 Parser.characters(self, content)
1.13
1.14 def skippedEntity(self, name):
1.15 - if name == "mdash":
1.16 - self.text[-1].append(u"\u2014")
1.17 - elif name == "ndash":
1.18 - self.text[-1].append(u"\u2013")
1.19 + ch = htmlentitydefs.name2codepoint.get(name)
1.20 + if ch:
1.21 + self.text[-1].append(unichr(ch))
1.22
1.23 # Parser-related methods.
1.24