This commit is contained in:
ldolse 2011-01-09 21:56:12 +08:00
parent 04bbda5e5a
commit 7008e9b64c

View File

@@ -72,8 +72,6 @@ class DocAnalysis(object):
def __init__(self, format='html', raw=''):
raw = raw.replace(' ', ' ')
#raw = raw.replace('\r\n', '\n')
#raw = raw.replace('\r', '\n')
if format == 'html':
linere = re.compile('(?<=<p)(?![^>]*>\s*</p>).*?(?=</p>)', re.DOTALL)
elif format == 'pdf':