diff --git a/src/calibre/ebooks/conversion/preprocess.py b/src/calibre/ebooks/conversion/preprocess.py index bb8ee90364..3fbbb47d13 100644 --- a/src/calibre/ebooks/conversion/preprocess.py +++ b/src/calibre/ebooks/conversion/preprocess.py @@ -48,6 +48,8 @@ class HTMLPreProcessor(object): # Fix pdftohtml markup PDFTOHTML = [ + # Remove page links + (re.compile(r'', re.IGNORECASE), lambda match: ''), # Remove
'), + + # Re wrap lines + (re.compile(r'(?<=\w)\s*\s*