mirror of
				https://github.com/kovidgoyal/calibre.git
				synced 2025-10-26 00:02:25 -04:00 
			
		
		
		
	
		
			
				
	
	
		
			326 lines
		
	
	
		
			12 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
			
		
		
	
	
			326 lines
		
	
	
		
			12 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
| #!/usr/bin/env python
 | |
| # vim:fileencoding=UTF-8:ts=4:sw=4:sta:et:sts=4:ai
 | |
| 
 | |
| 
 | |
| __license__   = 'GPL v3'
 | |
| __copyright__ = '2009, Kovid Goyal <kovid@kovidgoyal.net>'
 | |
| __docformat__ = 'restructuredtext en'
 | |
| 
 | |
| import os, re, shutil, zipfile, glob, json, errno
 | |
| from zlib import compress
 | |
| is_ci = os.environ.get('CI', '').lower() == 'true'
 | |
| 
 | |
| from setup import Command, basenames, __appname__, download_securely, dump_json
 | |
| from polyglot.builtins import codepoint_to_chr, itervalues, iteritems, only_unicode_recursive
 | |
| 
 | |
| 
 | |
| def get_opts_from_parser(parser):
 | |
|     def do_opt(opt):
 | |
|         for x in opt._long_opts:
 | |
|             yield x
 | |
|         for x in opt._short_opts:
 | |
|             yield x
 | |
|     for o in parser.option_list:
 | |
|         for x in do_opt(o):
 | |
|             yield x
 | |
|     for g in parser.option_groups:
 | |
|         for o in g.option_list:
 | |
|             for x in do_opt(o):
 | |
|                 yield x
 | |
| 
 | |
| 
 | |
| class Kakasi(Command):  # {{{
 | |
| 
 | |
|     description = 'Compile resources for unihandecode'
 | |
| 
 | |
|     KAKASI_PATH = os.path.join(Command.SRC,  __appname__,
 | |
|             'ebooks', 'unihandecode', 'pykakasi')
 | |
| 
 | |
|     def run(self, opts):
 | |
|         self.records = {}
 | |
|         src = self.j(self.KAKASI_PATH, 'kakasidict.utf8')
 | |
|         dest = self.j(self.RESOURCES, 'localization',
 | |
|                 'pykakasi','kanwadict2.calibre_msgpack')
 | |
|         base = os.path.dirname(dest)
 | |
|         if not os.path.exists(base):
 | |
|             os.makedirs(base)
 | |
| 
 | |
|         if self.newer(dest, src):
 | |
|             self.info('\tGenerating Kanwadict')
 | |
| 
 | |
|             for line in open(src, "rb"):
 | |
|                 self.parsekdict(line)
 | |
|             self.kanwaout(dest)
 | |
| 
 | |
|         src = self.j(self.KAKASI_PATH, 'itaijidict.utf8')
 | |
|         dest = self.j(self.RESOURCES, 'localization',
 | |
|                 'pykakasi','itaijidict2.calibre_msgpack')
 | |
| 
 | |
|         if self.newer(dest, src):
 | |
|             self.info('\tGenerating Itaijidict')
 | |
|             self.mkitaiji(src, dest)
 | |
| 
 | |
|         src = self.j(self.KAKASI_PATH, 'kanadict.utf8')
 | |
|         dest = self.j(self.RESOURCES, 'localization',
 | |
|                 'pykakasi','kanadict2.calibre_msgpack')
 | |
| 
 | |
|         if self.newer(dest, src):
 | |
|             self.info('\tGenerating kanadict')
 | |
|             self.mkkanadict(src, dest)
 | |
| 
 | |
|     def mkitaiji(self, src, dst):
 | |
|         dic = {}
 | |
|         for line in open(src, "rb"):
 | |
|             line = line.decode('utf-8').strip()
 | |
|             if line.startswith(';;'):  # skip comment
 | |
|                 continue
 | |
|             if re.match(r"^$",line):
 | |
|                 continue
 | |
|             pair = re.sub(r'\\u([0-9a-fA-F]{4})', lambda x:codepoint_to_chr(int(x.group(1),16)), line)
 | |
|             dic[pair[0]] = pair[1]
 | |
|         from calibre.utils.serialize import msgpack_dumps
 | |
|         with open(dst, 'wb') as f:
 | |
|             f.write(msgpack_dumps(dic))
 | |
| 
 | |
|     def mkkanadict(self, src, dst):
 | |
|         dic = {}
 | |
|         for line in open(src, "rb"):
 | |
|             line = line.decode('utf-8').strip()
 | |
|             if line.startswith(';;'):  # skip comment
 | |
|                 continue
 | |
|             if re.match(r"^$",line):
 | |
|                 continue
 | |
|             (alpha, kana) = line.split(' ')
 | |
|             dic[kana] = alpha
 | |
|         from calibre.utils.serialize import msgpack_dumps
 | |
|         with open(dst, 'wb') as f:
 | |
|             f.write(msgpack_dumps(dic))
 | |
| 
 | |
|     def parsekdict(self, line):
 | |
|         line = line.decode('utf-8').strip()
 | |
|         if line.startswith(';;'):  # skip comment
 | |
|             return
 | |
|         (yomi, kanji) = line.split(' ')
 | |
|         if ord(yomi[-1:]) <= ord('z'):
 | |
|             tail = yomi[-1:]
 | |
|             yomi = yomi[:-1]
 | |
|         else:
 | |
|             tail = ''
 | |
|         self.updaterec(kanji, yomi, tail)
 | |
| 
 | |
|     def updaterec(self, kanji, yomi, tail):
 | |
|         key = "%04x"%ord(kanji[0])
 | |
|         if key in self.records:
 | |
|             if kanji in self.records[key]:
 | |
|                 rec = self.records[key][kanji]
 | |
|                 rec.append((yomi,tail))
 | |
|                 self.records[key].update({kanji: rec})
 | |
|             else:
 | |
|                 self.records[key][kanji]=[(yomi, tail)]
 | |
|         else:
 | |
|             self.records[key] = {}
 | |
|             self.records[key][kanji]=[(yomi, tail)]
 | |
| 
 | |
|     def kanwaout(self, out):
 | |
|         from calibre.utils.serialize import msgpack_dumps
 | |
|         with open(out, 'wb') as f:
 | |
|             dic = {}
 | |
|             for k, v in iteritems(self.records):
 | |
|                 dic[k] = compress(msgpack_dumps(v))
 | |
|             f.write(msgpack_dumps(dic))
 | |
| 
 | |
|     def clean(self):
 | |
|         kakasi = self.j(self.RESOURCES, 'localization', 'pykakasi')
 | |
|         if os.path.exists(kakasi):
 | |
|             shutil.rmtree(kakasi)
 | |
| # }}}
 | |
| 
 | |
| 
 | |
| class CACerts(Command):  # {{{
 | |
| 
 | |
|     description = 'Get updated mozilla CA certificate bundle'
 | |
|     CA_PATH = os.path.join(Command.RESOURCES, 'mozilla-ca-certs.pem')
 | |
| 
 | |
|     def run(self, opts):
 | |
|         try:
 | |
|             with open(self.CA_PATH, 'rb') as f:
 | |
|                 raw = f.read()
 | |
|         except EnvironmentError as err:
 | |
|             if err.errno != errno.ENOENT:
 | |
|                 raise
 | |
|             raw = b''
 | |
|         nraw = download_securely('https://curl.haxx.se/ca/cacert.pem')
 | |
|         if not nraw:
 | |
|             raise RuntimeError('Failed to download CA cert bundle')
 | |
|         if nraw != raw:
 | |
|             self.info('Updating Mozilla CA certificates')
 | |
|             with open(self.CA_PATH, 'wb') as f:
 | |
|                 f.write(nraw)
 | |
|             self.verify_ca_certs()
 | |
| 
 | |
|     def verify_ca_certs(self):
 | |
|         from calibre.utils.https import get_https_resource_securely
 | |
|         get_https_resource_securely('https://calibre-ebook.com', cacerts=self.b(self.CA_PATH))
 | |
| # }}}
 | |
| 
 | |
| 
 | |
| class RecentUAs(Command):  # {{{
 | |
| 
 | |
|     description = 'Get updated list of common browser user agents'
 | |
|     UA_PATH = os.path.join(Command.RESOURCES, 'user-agent-data.json')
 | |
| 
 | |
|     def run(self, opts):
 | |
|         from setup.browser_data import get_data
 | |
|         data = get_data()
 | |
|         with open(self.UA_PATH, 'wb') as f:
 | |
|             f.write(json.dumps(data, indent=2, ensure_ascii=False, sort_keys=True).encode('utf-8'))
 | |
| # }}}
 | |
| 
 | |
| 
 | |
| class RapydScript(Command):  # {{{
 | |
| 
 | |
|     description = 'Compile RapydScript to JavaScript'
 | |
| 
 | |
|     def add_options(self, parser):
 | |
|         parser.add_option('--only-module', default=None,
 | |
|                 help='Only compile the specified module')
 | |
| 
 | |
|     def run(self, opts):
 | |
|         from calibre.utils.rapydscript import compile_srv, compile_editor, compile_viewer
 | |
|         if opts.only_module:
 | |
|             locals()['compile_' + opts.only_module]()
 | |
|         else:
 | |
|             compile_editor()
 | |
|             compile_viewer()
 | |
|             compile_srv()
 | |
| # }}}
 | |
| 
 | |
| 
 | |
| class Resources(Command):  # {{{
 | |
| 
 | |
|     description = 'Compile various needed calibre resources'
 | |
|     sub_commands = ['kakasi', 'mathjax', 'rapydscript', 'hyphenation']
 | |
| 
 | |
|     def run(self, opts):
 | |
|         from calibre.utils.serialize import msgpack_dumps
 | |
|         scripts = {}
 | |
|         for x in ('console', 'gui'):
 | |
|             for name in basenames[x]:
 | |
|                 if name in ('calibre-complete', 'calibre_postinstall'):
 | |
|                     continue
 | |
|                 scripts[name] = x
 | |
| 
 | |
|         dest = self.j(self.RESOURCES, 'scripts.calibre_msgpack')
 | |
|         if self.newer(dest, self.j(self.SRC, 'calibre', 'linux.py')):
 | |
|             self.info('\tCreating ' + self.b(dest))
 | |
|             with open(dest, 'wb') as f:
 | |
|                 f.write(msgpack_dumps(scripts))
 | |
| 
 | |
|         from calibre.web.feeds.recipes.collection import \
 | |
|                 serialize_builtin_recipes, iterate_over_builtin_recipe_files
 | |
| 
 | |
|         files = [x[1] for x in iterate_over_builtin_recipe_files()]
 | |
| 
 | |
|         dest = self.j(self.RESOURCES, 'builtin_recipes.xml')
 | |
|         if self.newer(dest, files):
 | |
|             self.info('\tCreating builtin_recipes.xml')
 | |
|             xml = serialize_builtin_recipes()
 | |
|             with open(dest, 'wb') as f:
 | |
|                 f.write(xml)
 | |
| 
 | |
|         recipe_icon_dir = self.a(self.j(self.RESOURCES, '..', 'recipes',
 | |
|             'icons'))
 | |
|         dest = os.path.splitext(dest)[0] + '.zip'
 | |
|         files += glob.glob(self.j(recipe_icon_dir, '*.png'))
 | |
|         if self.newer(dest, files):
 | |
|             self.info('\tCreating builtin_recipes.zip')
 | |
|             with zipfile.ZipFile(dest, 'w', zipfile.ZIP_STORED) as zf:
 | |
|                 for n in sorted(files, key=self.b):
 | |
|                     with open(n, 'rb') as f:
 | |
|                         zf.writestr(self.b(n), f.read())
 | |
| 
 | |
|         dest = self.j(self.RESOURCES, 'ebook-convert-complete.calibre_msgpack')
 | |
|         files = []
 | |
|         for x in os.walk(self.j(self.SRC, 'calibre')):
 | |
|             for f in x[-1]:
 | |
|                 if f.endswith('.py'):
 | |
|                     files.append(self.j(x[0], f))
 | |
|         if self.newer(dest, files):
 | |
|             self.info('\tCreating ' + self.b(dest))
 | |
|             complete = {}
 | |
|             from calibre.ebooks.conversion.plumber import supported_input_formats
 | |
|             complete['input_fmts'] = set(supported_input_formats())
 | |
|             from calibre.web.feeds.recipes.collection import get_builtin_recipe_titles
 | |
|             complete['input_recipes'] = [t+'.recipe ' for t in
 | |
|                     get_builtin_recipe_titles()]
 | |
|             from calibre.customize.ui import available_output_formats
 | |
|             complete['output'] = set(available_output_formats())
 | |
|             from calibre.ebooks.conversion.cli import create_option_parser
 | |
|             from calibre.utils.logging import Log
 | |
|             log = Log()
 | |
|             # log.outputs = []
 | |
|             for inf in supported_input_formats():
 | |
|                 if inf in ('zip', 'rar', 'oebzip'):
 | |
|                     continue
 | |
|                 for ouf in available_output_formats():
 | |
|                     of = ouf if ouf == 'oeb' else 'dummy.'+ouf
 | |
|                     p = create_option_parser(('ec', 'dummy1.'+inf, of, '-h'),
 | |
|                             log)[0]
 | |
|                     complete[(inf, ouf)] = [x+' 'for x in
 | |
|                             get_opts_from_parser(p)]
 | |
| 
 | |
|             with open(dest, 'wb') as f:
 | |
|                 f.write(msgpack_dumps(only_unicode_recursive(complete)))
 | |
| 
 | |
|         self.info('\tCreating template-functions.json')
 | |
|         dest = self.j(self.RESOURCES, 'template-functions.json')
 | |
|         function_dict = {}
 | |
|         import inspect
 | |
|         from calibre.utils.formatter_functions import formatter_functions
 | |
|         for obj in formatter_functions().get_builtins().values():
 | |
|             eval_func = inspect.getmembers(obj,
 | |
|                     lambda x: inspect.ismethod(x) and x.__name__ == 'evaluate')
 | |
|             try:
 | |
|                 lines = [l[4:] for l in inspect.getsourcelines(eval_func[0][1])[0]]
 | |
|             except:
 | |
|                 continue
 | |
|             lines = ''.join(lines)
 | |
|             function_dict[obj.name] = lines
 | |
|         dump_json(function_dict, dest)
 | |
| 
 | |
|         self.info('\tCreating editor-functions.json')
 | |
|         dest = self.j(self.RESOURCES, 'editor-functions.json')
 | |
|         function_dict = {}
 | |
|         from calibre.gui2.tweak_book.function_replace import builtin_functions
 | |
|         for func in builtin_functions():
 | |
|             try:
 | |
|                 src = ''.join(inspect.getsourcelines(func)[0][1:])
 | |
|             except Exception:
 | |
|                 continue
 | |
|             src = src.replace('def ' + func.__name__, 'def replace')
 | |
|             imports = ['from %s import %s' % (x.__module__, x.__name__) for x in func.imports]
 | |
|             if imports:
 | |
|                 src = '\n'.join(imports) + '\n\n' + src
 | |
|             function_dict[func.name] = src
 | |
|         dump_json(function_dict, dest)
 | |
|         self.info('\tCreating user-manual-translation-stats.json')
 | |
|         d = {}
 | |
|         for lc, stats in iteritems(json.load(open(self.j(self.d(self.SRC), 'manual', 'locale', 'completed.json')))):
 | |
|             total = sum(itervalues(stats))
 | |
|             d[lc] = stats['translated'] / float(total)
 | |
|         dump_json(d, self.j(self.RESOURCES, 'user-manual-translation-stats.json'))
 | |
| 
 | |
|     def clean(self):
 | |
|         for x in ('scripts', 'ebook-convert-complete'):
 | |
|             x = self.j(self.RESOURCES, x+'.pickle')
 | |
|             if os.path.exists(x):
 | |
|                 os.remove(x)
 | |
|         from setup.commands import kakasi
 | |
|         kakasi.clean()
 | |
|         for x in ('builtin_recipes.xml', 'builtin_recipes.zip',
 | |
|                 'template-functions.json', 'user-manual-translation-stats.json'):
 | |
|             x = self.j(self.RESOURCES, x)
 | |
|             if os.path.exists(x):
 | |
|                 os.remove(x)
 | |
| # }}}
 |