From ac0af1b844293f9c5720f9783fac6342e324724d Mon Sep 17 00:00:00 2001 From: John Schember Date: Thu, 9 Apr 2009 19:16:49 -0400 Subject: [PATCH] pdftohtml processing: fix spaces rule --- src/calibre/ebooks/conversion/preprocess.py | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/src/calibre/ebooks/conversion/preprocess.py b/src/calibre/ebooks/conversion/preprocess.py index 3fbbb47d13..6b58d2d18d 100644 --- a/src/calibre/ebooks/conversion/preprocess.py +++ b/src/calibre/ebooks/conversion/preprocess.py @@ -72,11 +72,11 @@ class HTMLPreProcessor(object): # Have paragraphs show better (re.compile(r''), lambda match : '

'), - # Re wrap lines + # Un wrap lines (re.compile(r'(?<=\w)\s*\s*\s*\s*(?=\w)'), lambda match: ' '), (re.compile(r'(?<=\w)\s*\s*(?=\w)', re.UNICODE), lambda match: ' '), # Clean up spaces - (re.compile(ru'(?<=\.|,|:|;|\?|!|”|"|\')[\s^ ]*(?=<)'), lambda match: ' '), + (re.compile(u'(?<=\.|,|:|;|\?|!|”|"|\')[\s^ ]*(?=<)'), lambda match: ' '), ] # Fix Book Designer markup