diff --git a/src/calibre/ebooks/conversion/utils.py b/src/calibre/ebooks/conversion/utils.py index abfa43e7ed..ecf030b27d 100644 --- a/src/calibre/ebooks/conversion/utils.py +++ b/src/calibre/ebooks/conversion/utils.py @@ -111,7 +111,7 @@ class PreProcessor(object): html = add_markup.sub('

\n

', html) # detect chapters/sections to match xpath or splitting logic - heading = re.compile(']*>', re.IGNORECASE) + heading = re.compile(']*>', re.IGNORECASE) self.html_preprocess_sections = len(heading.findall(html)) self.log("found " + str(self.html_preprocess_sections) + " pre-existing headings") # @@ -134,7 +134,7 @@ class PreProcessor(object): self.log("Unwrapping Lines") # Some OCR sourced files have line breaks in the html using a combination of span & p tags # span are used for hard line breaks, p for new paragraphs. Determine which is used so - # that lines can be wrapped across page boundaries + # that lines can be un-wrapped across page boundaries paras_reg = re.compile(']*>', re.IGNORECASE) spans_reg = re.compile(']*>', re.IGNORECASE) paras = len(paras_reg.findall(html))