diff --git a/src/calibre/ebooks/html/input.py b/src/calibre/ebooks/html/input.py
index 6d3f5cde85..92c2df9690 100644
--- a/src/calibre/ebooks/html/input.py
+++ b/src/calibre/ebooks/html/input.py
@@ -110,7 +110,7 @@ class HTMLFile(object):
raise IOError(msg)
raise IgnoreFile(msg, err.errno)
- self.is_binary = not bool(self.HTML_PAT.search(src[:1024]))
+ self.is_binary = not bool(self.HTML_PAT.search(src[:4096]))
if not self.is_binary:
if encoding is None:
encoding = xml_to_unicode(src[:4096], verbose=verbose)[-1]