From b13b1ea5aa4e8b7d4bb51edd069d77ba742b4444 Mon Sep 17 00:00:00 2001
From: Kovid Goyal <kovid@kovidgoyal.net>
Date: Tue, 13 Sep 2016 08:27:38 +0530
Subject: [PATCH] Conversion: Improve detection of input documents that use
 uppercase tag/attribute names. Fixes #1622261 [Private
 bug](https://bugs.launchpad.net/calibre/+bug/1622261)

---
 src/calibre/ebooks/oeb/parse_utils.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/src/calibre/ebooks/oeb/parse_utils.py b/src/calibre/ebooks/oeb/parse_utils.py
index 61029741a4..4c3382e215 100644
--- a/src/calibre/ebooks/oeb/parse_utils.py
+++ b/src/calibre/ebooks/oeb/parse_utils.py
@@ -297,7 +297,7 @@ def parse_html(data, log=None, decoder=None, preprocessor=None,
                     'HTML 5 parsing failed, falling back to older parsers')
                 data = _html4_parse(data)
 
-    if has_html4_doctype or data.tag == 'HTML':
+    if has_html4_doctype or data.tag == 'HTML' or (len(data) and (data[-1].get('LANG') or data[-1].get('DIR'))):
         # Lower case all tag and attribute names
         data.tag = data.tag.lower()
         for x in data.iterdescendants():