diff --git a/src/calibre/ebooks/oeb/parse_utils.py b/src/calibre/ebooks/oeb/parse_utils.py index d262a6782c..a10d352d6d 100644 --- a/src/calibre/ebooks/oeb/parse_utils.py +++ b/src/calibre/ebooks/oeb/parse_utils.py @@ -80,6 +80,7 @@ def node_depth(node): def html5_parse(data, max_nesting_depth=100): import html5lib + data = re.sub(r'<\s*title\s*/\s*>', '', data) data = html5lib.parse(data, treebuilder='lxml').getroot() # Check that the asinine HTML 5 algorithm did not result in a tree with