From 35320295f8c6ffbc7a430117696da434c8b3f2fc Mon Sep 17 00:00:00 2001 From: "Marshall T. Vandegrift" Date: Fri, 2 Jan 2009 09:27:47 -0500 Subject: [PATCH] Temporary (?) fix for multibyte char / record boundary issue. --- src/calibre/ebooks/mobi/writer.py | 5 +++-- 1 file changed, 3 insertions(+), 2 deletions(-) diff --git a/src/calibre/ebooks/mobi/writer.py b/src/calibre/ebooks/mobi/writer.py index 77b382e90a..fb5c1118a2 100644 --- a/src/calibre/ebooks/mobi/writer.py +++ b/src/calibre/ebooks/mobi/writer.py @@ -50,8 +50,9 @@ PALMDOC = 2 HUFFDIC = 17480 def encode(data): - #return data.encode('ascii', 'xmlcharrefreplace') - return data.encode('utf-8') + # Using UTF-8 means needing to worry about multibyte characters crossing + # record boundaries, so let's not for now. + return data.encode('ascii', 'xmlcharrefreplace') # Almost like the one for MS LIT, but not quite. def decint(value):