Conversion: Improve detection of input documents that use uppercase tag/attribute names. Fixes #1622261 [Private bug](https://bugs.launchpad.net/calibre/+bug/1622261)

2025-07-09 03:04:10 -04:00 · 2016-09-13 08:27:38 +05:30 · 2016-09-13 08:27:38 +05:30 · b13b1ea5aa
commit b13b1ea5aa
parent df33ef6a3c
1 changed file with 1 addition and 1 deletion
--- a/src/calibre/ebooks/oeb/parse_utils.py
+++ b/src/calibre/ebooks/oeb/parse_utils.py
@@ -297,7 +297,7 @@ def parse_html(data, log=None, decoder=None, preprocessor=None,
                    'HTML 5 parsing failed, falling back to older parsers')
                data = _html4_parse(data)
-    if has_html4_doctype or data.tag == 'HTML':
+    if has_html4_doctype or data.tag == 'HTML' or (len(data) and (data[-1].get('LANG') or data[-1].get('DIR'))):
        # Lower case all tag and attribute names
        data.tag = data.tag.lower()
        for x in data.iterdescendants():