From b71a2874ffb0f41730839b29a74cae0ca7deb909 Mon Sep 17 00:00:00 2001 From: ldolse Date: Mon, 22 Nov 2010 19:54:51 +0800 Subject: [PATCH] ... --- src/calibre/ebooks/mobi/reader.py | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/src/calibre/ebooks/mobi/reader.py b/src/calibre/ebooks/mobi/reader.py index 355fc87c0c..733f79ee65 100644 --- a/src/calibre/ebooks/mobi/reader.py +++ b/src/calibre/ebooks/mobi/reader.py @@ -476,7 +476,8 @@ class MobiReader(object): self.processed_html = self.processed_html.replace('> <', '>\n<') self.processed_html = self.processed_html.replace(']*>', '', self.processed_html) - # Rearrange various style tags & paragraph tags so that lxml and BeautifulSoup don't get upset + # Swap inline and block level elements, and order block level elements according to priority + # - lxml and beautifulsoup live in the modern world and expect/assume a specific order self.processed_html = re.sub(r'(?i)(?P(<(h\d+|i|b|u|em|small|big|strong|tt)>\s*){1,})(?P]*>)', '\g'+'\g', self.processed_html) self.processed_html = re.sub(r'(?i)(?P]*>)\s*(?P(\s*){1,})', '\g'+'\g', self.processed_html)