TXT Input: Tweak Heuristic italicizing.

This commit is contained in:
John Schember 2011-01-08 13:53:32 -05:00
parent 843e1f2068
commit f593b21631

View File

@@ -21,15 +21,15 @@ class TXTHeuristicProcessor(object):
] ]
self.ITALICIZE_STYLE_PATS = [ self.ITALICIZE_STYLE_PATS = [
r'(?msu)_(?P<words>.+?)_', r'(?msu)_(?P<words>.+?)_',
r'(?msu)/(?P<words>.+?)/', r'(?msu)/(?P<words>[^<>]+?)/',
r'(?msu)~~(?P<words>.+?)~~', r'(?msu)~~(?P<words>.+?)~~',
r'(?msu)\*(?P<words>.+?)\*', r'(?msu)\*(?P<words>.+?)\*',
r'(?msu)~(?P<words>.+?)~', r'(?msu)~(?P<words>.+?)~',
r'(?msu)_/(?P<words>.+?)/_', r'(?msu)_/(?P<words>[^<>]+?)/_',
r'(?msu)_\*(?P<words>.+?)\*_', r'(?msu)_\*(?P<words>.+?)\*_',
r'(?msu)\*/(?P<words>.+?)/\*', r'(?msu)\*/(?P<words>[^<>]+?)/\*',
r'(?msu)_\*/(?P<words>.+?)/\*_', r'(?msu)_\*/(?P<words>[^<>]+?)/\*_',
r'(?msu)/:(?P<words>.+?):/', r'(?msu)/:(?P<words>[^<>]+?):/',
r'(?msu)\|:(?P<words>.+?):\|', r'(?msu)\|:(?P<words>.+?):\|',
] ]
@@ -84,5 +84,6 @@ class TXTHeuristicProcessor(object):
txt = u'\n'.join(processed) txt = u'\n'.join(processed)
txt = re.sub('[ ]{2,}', ' ', txt) txt = re.sub('[ ]{2,}', ' ', txt)
print txt
return HTML_TEMPLATE % (title, txt) return HTML_TEMPLATE % (title, txt)