From 186530f941c939b119b2eb8dd0518635a18e2e66 Mon Sep 17 00:00:00 2001 From: Kovid Goyal Date: Thu, 7 Feb 2013 12:41:16 +0530 Subject: [PATCH] =?UTF-8?q?Conversion:=20When=20transliterating=20unicode?= =?UTF-8?q?=20characters,=20handle=20=C2=AB=20and=20=C2=BB=20correctly.=20?= =?UTF-8?q?Fixes=20#1117270=20(Private=20bug)?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- src/calibre/ebooks/conversion/preprocess.py | 3 +++ 1 file changed, 3 insertions(+) diff --git a/src/calibre/ebooks/conversion/preprocess.py b/src/calibre/ebooks/conversion/preprocess.py index 82cc4c0f4a..bbbc96a7a5 100644 --- a/src/calibre/ebooks/conversion/preprocess.py +++ b/src/calibre/ebooks/conversion/preprocess.py @@ -626,7 +626,10 @@ class HTMLPreProcessor(object): if getattr(self.extra_opts, 'asciiize', False): from calibre.utils.localization import get_udc + from calibre.utils.mreplace import MReplace unihandecoder = get_udc() + mr = MReplace(data={u'«':u'<'*3, u'»':u'>'*3}) + html = mr.mreplace(html) html = unihandecoder.decode(html) if getattr(self.extra_opts, 'enable_heuristics', False):