pdftohtml processing: fix spaces rule

2025-07-07 10:14:46 -04:00 · 2009-04-09 19:16:49 -04:00 · 2009-04-09 19:16:49 -04:00 · ac0af1b844
commit ac0af1b844
parent f7ec532d57
1 changed file with 2 additions and 2 deletions
--- a/src/calibre/ebooks/conversion/preprocess.py
+++ b/src/calibre/ebooks/conversion/preprocess.py
@@ -72,11 +72,11 @@ class HTMLPreProcessor(object):
                  # Have paragraphs show better
                  (re.compile(r'<br.*?>'), lambda match : '<p>'),
                  
-                  # Re wrap lines
+                  # Un wrap lines
                  (re.compile(r'(?<=\w)\s*</i>\s*<p.*?>\s*<i>\s*(?=\w)'), lambda match: ' '),
                  (re.compile(r'(?<=\w)\s*<p.*?>\s*(?=\w)', re.UNICODE), lambda match: ' '),
                  # Clean up spaces
-                  (re.compile(ru'(?<=\.|,|:|;|\?|!|”|"|\')[\s^ ]*(?=<)'), lambda match: ' '),
+                  (re.compile(u'(?<=\.|,|:|;|\?|!|”|"|\')[\s^ ]*(?=<)'), lambda match: ' '),
                  ]

    # Fix Book Designer markup