diff --git a/src/calibre/ebooks/conversion/utils.py b/src/calibre/ebooks/conversion/utils.py index eabeba7b4f..cbc8b41529 100644 --- a/src/calibre/ebooks/conversion/utils.py +++ b/src/calibre/ebooks/conversion/utils.py @@ -315,7 +315,7 @@ class HeuristicProcessor(object): supports a range of html markup and text files ''' # define the pieces of the regex - + lookahead = "(?<=.{"+str(length)+u"}([a-zäëïöüàèìòùáćéíĺóŕńśúýâêîôûçąężıãõñæøþðßěľščťžňďřů,:“”)\IA\u00DF]|(?]*>\s*\s*', '

', html) html = self.detect_whitespace(html) html = self.detect_soft_breaks(html)