mirror of
https://github.com/kovidgoyal/calibre.git
synced 2025-07-09 03:04:10 -04:00
Add reference for claim that filenames in CHM PMGL blocks are UTF-8
This commit is contained in:
parent
1a5fa973ea
commit
52adf96211
@ -134,6 +134,8 @@ class CHMReader(CHMFile):
|
||||
return toc
|
||||
|
||||
def ResolveObject(self, path):
|
||||
# filenames are utf-8 encoded in the chm index as far as I can
|
||||
# determine, see https://tika.apache.org/1.11/api/org/apache/tika/parser/chm/accessor/ChmPmgiHeader.html
|
||||
if not isinstance(path, bytes):
|
||||
path = path.encode('utf-8')
|
||||
return CHMFile.ResolveObject(self, path)
|
||||
@ -318,6 +320,7 @@ class CHMReader(CHMFile):
|
||||
|
||||
def get_paths(chm, ui, ctx):
|
||||
# these are supposed to be UTF-8 in CHM as best as I can determine
|
||||
# see https://tika.apache.org/1.11/api/org/apache/tika/parser/chm/accessor/ChmPmgiHeader.html
|
||||
path = as_unicode(ui.path, 'utf-8')
|
||||
# skip directories
|
||||
# note this path refers to the internal CHM structure
|
||||
|
Loading…
x
Reference in New Issue
Block a user