From 847030ea5b30364fca81fdfbf402ffc5260fc218 Mon Sep 17 00:00:00 2001 From: Kovid Goyal Date: Fri, 13 Jul 2007 23:21:29 +0000 Subject: [PATCH] Handle &nbsp; correctly --- src/libprs500/ebooks/lrf/html/convert_from.py | 6 ++++-- 1 file changed, 4 insertions(+), 2 deletions(-) diff --git a/src/libprs500/ebooks/lrf/html/convert_from.py b/src/libprs500/ebooks/lrf/html/convert_from.py index 8cba759448..36bf039343 100644 --- a/src/libprs500/ebooks/lrf/html/convert_from.py +++ b/src/libprs500/ebooks/lrf/html/convert_from.py @@ -223,7 +223,8 @@ class HTMLConverter(object): PAGE_BREAK_PAT = re.compile(r'page-break-(?:after|before)\s*:\s*(\w+)', re.IGNORECASE) IGNORED_TAGS = (Comment, Declaration, ProcessingInstruction) # Fix elements - MARKUP_MASSAGE = [(re.compile("(<\s*[aA]\s+.*\/)\s*>"), #Close tags + MARKUP_MASSAGE = [(re.compile('&nbsp;'), lambda match : ' '), # Convert &nbsp; into a normal space as the default conversion converts it into \xa0 which is not a space in LRF + (re.compile("(<\s*[aA]\s+.*\/)\s*>"), #Close tags lambda match: match.group(1)+">"), # Strip comments from