mirror of
				https://github.com/kovidgoyal/calibre.git
				synced 2025-10-25 15:52:25 -04:00 
			
		
		
		
	
		
			
				
	
	
		
			430 lines
		
	
	
		
			17 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
			
		
		
	
	
			430 lines
		
	
	
		
			17 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
| #!/usr/bin/env python2
 | |
| # vim:fileencoding=UTF-8:ts=4:sw=4:sta:et:sts=4:ai
 | |
| from __future__ import with_statement
 | |
| 
 | |
| __license__   = 'GPL v3'
 | |
| __copyright__ = '2009, Kovid Goyal <kovid@kovidgoyal.net>'
 | |
| __docformat__ = 'restructuredtext en'
 | |
| 
 | |
| import os, cPickle, re, shutil, marshal, zipfile, glob, time, sys, hashlib, json, errno, subprocess
 | |
| from zlib import compress
 | |
| from itertools import chain
 | |
| is_ci = os.environ.get('CI', '').lower() == 'true'
 | |
| 
 | |
| from setup import Command, basenames, __appname__
 | |
| 
 | |
| def get_opts_from_parser(parser):
 | |
|     def do_opt(opt):
 | |
|         for x in opt._long_opts:
 | |
|             yield x
 | |
|         for x in opt._short_opts:
 | |
|             yield x
 | |
|     for o in parser.option_list:
 | |
|         for x in do_opt(o):
 | |
|             yield x
 | |
|     for g in parser.option_groups:
 | |
|         for o in g.option_list:
 | |
|             for x in do_opt(o):
 | |
|                 yield x
 | |
| 
 | |
| def download_securely(url):
 | |
|     # We use curl here as on some OSes (OS X) when bootstrapping calibre,
 | |
|     # python will be unable to validate certificates until after cacerts is
 | |
|     # installed
 | |
|     return subprocess.check_output(['curl', '-fsSL', url])
 | |
| 
 | |
| class Coffee(Command):  # {{{
 | |
| 
 | |
|     description = 'Compile coffeescript files into javascript'
 | |
|     COFFEE_DIRS = ('ebooks/oeb/display', 'ebooks/oeb/polish')
 | |
| 
 | |
|     def add_options(self, parser):
 | |
|         parser.add_option('--watch', '-w', action='store_true', default=False,
 | |
|                 help='Autocompile when .coffee files are changed')
 | |
|         parser.add_option('--show-js', action='store_true', default=False,
 | |
|                 help='Display the generated javascript')
 | |
| 
 | |
|     def run(self, opts):
 | |
|         self.do_coffee_compile(opts)
 | |
|         if opts.watch:
 | |
|             try:
 | |
|                 while True:
 | |
|                     time.sleep(0.5)
 | |
|                     self.do_coffee_compile(opts, timestamp=True,
 | |
|                             ignore_errors=True)
 | |
|             except KeyboardInterrupt:
 | |
|                 pass
 | |
| 
 | |
|     def show_js(self, raw):
 | |
|         from pygments.lexers import JavascriptLexer
 | |
|         from pygments.formatters import TerminalFormatter
 | |
|         from pygments import highlight
 | |
|         print highlight(raw, JavascriptLexer(), TerminalFormatter())
 | |
| 
 | |
|     def do_coffee_compile(self, opts, timestamp=False, ignore_errors=False):
 | |
|         from calibre.utils.serve_coffee import compile_coffeescript
 | |
|         src_files = {}
 | |
|         for src in self.COFFEE_DIRS:
 | |
|             for f in glob.glob(self.j(self.SRC, __appname__, src,
 | |
|                 '*.coffee')):
 | |
|                 bn = os.path.basename(f).rpartition('.')[0]
 | |
|                 arcname = src.replace('/', '.') + '.' + bn + '.js'
 | |
|                 try:
 | |
|                     with open(f, 'rb') as fs:
 | |
|                         src_files[arcname] = (f, hashlib.sha1(fs.read()).hexdigest())
 | |
|                 except EnvironmentError:
 | |
|                     time.sleep(0.1)
 | |
|                     with open(f, 'rb') as fs:
 | |
|                         src_files[arcname] = (f, hashlib.sha1(fs.read()).hexdigest())
 | |
| 
 | |
|         existing = {}
 | |
|         dest = self.j(self.RESOURCES, 'compiled_coffeescript.zip')
 | |
|         if os.path.exists(dest):
 | |
|             with zipfile.ZipFile(dest, 'r') as zf:
 | |
|                 existing_hashes = {}
 | |
|                 raw = zf.comment
 | |
|                 if raw:
 | |
|                     existing_hashes = json.loads(raw)
 | |
|                 for info in zf.infolist():
 | |
|                     if info.filename in existing_hashes and src_files.get(info.filename, (None, None))[1] == existing_hashes[info.filename]:
 | |
|                         existing[info.filename] = (zf.read(info), info, existing_hashes[info.filename])
 | |
| 
 | |
|         todo = set(src_files) - set(existing)
 | |
|         updated = {}
 | |
|         for arcname in todo:
 | |
|             name = arcname.rpartition('.')[0]
 | |
|             print ('\t%sCompiling %s'%(time.strftime('[%H:%M:%S] ') if
 | |
|                         timestamp else '', name))
 | |
|             src, sig = src_files[arcname]
 | |
|             js, errors = compile_coffeescript(open(src, 'rb').read(), filename=src)
 | |
|             if errors:
 | |
|                 print ('\n\tCompilation of %s failed'%name)
 | |
|                 for line in errors:
 | |
|                     print >>sys.stderr, line
 | |
|                 if ignore_errors:
 | |
|                     js = u'# Compilation from coffeescript failed'
 | |
|                 else:
 | |
|                     raise SystemExit(1)
 | |
|             else:
 | |
|                 if opts.show_js:
 | |
|                     self.show_js(js)
 | |
|                     print ('#'*80)
 | |
|                     print ('#'*80)
 | |
|             zi = zipfile.ZipInfo()
 | |
|             zi.filename = arcname
 | |
|             zi.date_time = time.localtime()[:6]
 | |
|             updated[arcname] = (js.encode('utf-8'), zi, sig)
 | |
|         if updated:
 | |
|             hashes = {}
 | |
|             with zipfile.ZipFile(dest, 'w', zipfile.ZIP_STORED) as zf:
 | |
|                 for raw, zi, sig in sorted(chain(updated.itervalues(), existing.itervalues()), key=lambda x: x[1].filename):
 | |
|                     zf.writestr(zi, raw)
 | |
|                     hashes[zi.filename] = sig
 | |
|                 zf.comment = json.dumps(hashes)
 | |
| 
 | |
|     def clean(self):
 | |
|         x = self.j(self.RESOURCES, 'compiled_coffeescript.zip')
 | |
|         if os.path.exists(x):
 | |
|             os.remove(x)
 | |
| # }}}
 | |
| 
 | |
| class Kakasi(Command):  # {{{
 | |
| 
 | |
|     description = 'Compile resources for unihandecode'
 | |
| 
 | |
|     KAKASI_PATH = os.path.join(Command.SRC,  __appname__,
 | |
|             'ebooks', 'unihandecode', 'pykakasi')
 | |
| 
 | |
|     def run(self, opts):
 | |
|         self.records = {}
 | |
|         src = self.j(self.KAKASI_PATH, 'kakasidict.utf8')
 | |
|         dest = self.j(self.RESOURCES, 'localization',
 | |
|                 'pykakasi','kanwadict2.pickle')
 | |
|         base = os.path.dirname(dest)
 | |
|         if not os.path.exists(base):
 | |
|             os.makedirs(base)
 | |
| 
 | |
|         if self.newer(dest, src):
 | |
|             self.info('\tGenerating Kanwadict')
 | |
| 
 | |
|             for line in open(src, "r"):
 | |
|                 self.parsekdict(line)
 | |
|             self.kanwaout(dest)
 | |
| 
 | |
|         src = self.j(self.KAKASI_PATH, 'itaijidict.utf8')
 | |
|         dest = self.j(self.RESOURCES, 'localization',
 | |
|                 'pykakasi','itaijidict2.pickle')
 | |
| 
 | |
|         if self.newer(dest, src):
 | |
|             self.info('\tGenerating Itaijidict')
 | |
|             self.mkitaiji(src, dest)
 | |
| 
 | |
|         src = self.j(self.KAKASI_PATH, 'kanadict.utf8')
 | |
|         dest = self.j(self.RESOURCES, 'localization',
 | |
|                 'pykakasi','kanadict2.pickle')
 | |
| 
 | |
|         if self.newer(dest, src):
 | |
|             self.info('\tGenerating kanadict')
 | |
|             self.mkkanadict(src, dest)
 | |
| 
 | |
|     def mkitaiji(self, src, dst):
 | |
|         dic = {}
 | |
|         for line in open(src, "r"):
 | |
|             line = line.decode("utf-8").strip()
 | |
|             if line.startswith(';;'):  # skip comment
 | |
|                 continue
 | |
|             if re.match(r"^$",line):
 | |
|                 continue
 | |
|             pair = re.sub(r'\\u([0-9a-fA-F]{4})', lambda x:unichr(int(x.group(1),16)), line)
 | |
|             dic[pair[0]] = pair[1]
 | |
|         cPickle.dump(dic, open(dst, 'wb'), protocol=-1)  # pickle
 | |
| 
 | |
|     def mkkanadict(self, src, dst):
 | |
|         dic = {}
 | |
|         for line in open(src, "r"):
 | |
|             line = line.decode("utf-8").strip()
 | |
|             if line.startswith(';;'):  # skip comment
 | |
|                 continue
 | |
|             if re.match(r"^$",line):
 | |
|                 continue
 | |
|             (alpha, kana) = line.split(' ')
 | |
|             dic[kana] = alpha
 | |
|         cPickle.dump(dic, open(dst, 'wb'), protocol=-1)  # pickle
 | |
| 
 | |
|     def parsekdict(self, line):
 | |
|         line = line.decode("utf-8").strip()
 | |
|         if line.startswith(';;'):  # skip comment
 | |
|             return
 | |
|         (yomi, kanji) = line.split(' ')
 | |
|         if ord(yomi[-1:]) <= ord('z'):
 | |
|             tail = yomi[-1:]
 | |
|             yomi = yomi[:-1]
 | |
|         else:
 | |
|             tail = ''
 | |
|         self.updaterec(kanji, yomi, tail)
 | |
| 
 | |
|     def updaterec(self, kanji, yomi, tail):
 | |
|         key = "%04x"%ord(kanji[0])
 | |
|         if key in self.records:
 | |
|             if kanji in self.records[key]:
 | |
|                 rec = self.records[key][kanji]
 | |
|                 rec.append((yomi,tail))
 | |
|                 self.records[key].update({kanji: rec})
 | |
|             else:
 | |
|                 self.records[key][kanji]=[(yomi, tail)]
 | |
|         else:
 | |
|             self.records[key] = {}
 | |
|             self.records[key][kanji]=[(yomi, tail)]
 | |
| 
 | |
|     def kanwaout(self, out):
 | |
|         with open(out, 'wb') as f:
 | |
|             dic = {}
 | |
|             for k, v in self.records.iteritems():
 | |
|                 dic[k] = compress(marshal.dumps(v))
 | |
|             cPickle.dump(dic, f, -1)
 | |
| 
 | |
|     def clean(self):
 | |
|         kakasi = self.j(self.RESOURCES, 'localization', 'pykakasi')
 | |
|         if os.path.exists(kakasi):
 | |
|             shutil.rmtree(kakasi)
 | |
| # }}}
 | |
| 
 | |
| class CACerts(Command):  # {{{
 | |
| 
 | |
|     description = 'Get updated mozilla CA certificate bundle'
 | |
|     CA_PATH = os.path.join(Command.RESOURCES, 'mozilla-ca-certs.pem')
 | |
| 
 | |
|     def run(self, opts):
 | |
|         try:
 | |
|             with open(self.CA_PATH, 'rb') as f:
 | |
|                 raw = f.read()
 | |
|         except EnvironmentError as err:
 | |
|             if err.errno != errno.ENOENT:
 | |
|                 raise
 | |
|             raw = b''
 | |
|         nraw = download_securely('https://curl.haxx.se/ca/cacert.pem')
 | |
|         if not nraw:
 | |
|             raise RuntimeError('Failed to download CA cert bundle')
 | |
|         if nraw != raw:
 | |
|             self.info('Updating Mozilla CA certificates')
 | |
|             with open(self.CA_PATH, 'wb') as f:
 | |
|                 f.write(nraw)
 | |
|             self.verify_ca_certs()
 | |
| 
 | |
|     def verify_ca_certs(self):
 | |
|         from calibre.utils.https import get_https_resource_securely
 | |
|         get_https_resource_securely('https://calibre-ebook.com', cacerts=self.b(self.CA_PATH))
 | |
| # }}}
 | |
| 
 | |
| class RecentUAs(Command):
 | |
| 
 | |
|     description = 'Get updated list of recent browser user agents'
 | |
|     UA_PATH = os.path.join(Command.RESOURCES, 'common-user-agents.txt')
 | |
| 
 | |
|     def get_list(self):
 | |
|         if is_ci:
 | |
|             # Dont hammer the server from CI
 | |
|             return [
 | |
|                  # IE 11 - windows 10
 | |
|                  'Mozilla/5.0 (Windows NT 10.0; Trident/7.0; rv:11.0) like Gecko',
 | |
|                  # IE 11 - windows 8.1
 | |
|                  'Mozilla/5.0 (Windows NT 6.3; Trident/7.0; rv:11.0) like Gecko',
 | |
|                  # IE 11 - windows 8
 | |
|                  'Mozilla/5.0 (Windows NT 6.2; Trident/7.0; rv:11.0) like Gecko',
 | |
|                  # IE 11 - windows 7
 | |
|                  'Mozilla/5.0 (Windows NT 6.1; Trident/7.0; rv:11.0) like Gecko',
 | |
|                  # 32bit IE 11 on 64 bit win 10
 | |
|                  'Mozilla/5.0 (Windows NT 10.0; WOW64; Trident/7.0; rv:11.0) like Gecko',
 | |
|                  # 32bit IE 11 on 64 bit win 8.1
 | |
|                  'Mozilla/5.0 (Windows NT 6.3; WOW64; Trident/7.0; rv:11.0) like Gecko',
 | |
|                  # 32bit IE 11 on 64 bit win 7
 | |
|                  'Mozilla/5.0 (Windows NT 6.1; WOW64; Trident/7.0; rv:11.0) like Gecko',
 | |
|         ]
 | |
|         raw = download_securely('https://techblog.willshouse.com/2012/01/03/most-common-user-agents/').decode('utf-8')
 | |
|         lines = re.search(r'<textarea.+"get-the-list".+>([^<]+)</textarea>', raw).group(1).splitlines()
 | |
|         return [x.strip() for x in lines if x.strip()]
 | |
| 
 | |
|     def run(self, opts):
 | |
|         lines = self.get_list()[:10]
 | |
|         if not lines:
 | |
|             raise RuntimeError('Failed to download list of common user agents')
 | |
|         with open(self.UA_PATH, 'wb') as f:
 | |
|             f.write('\n'.join(lines).encode('ascii'))
 | |
| 
 | |
| class RapydScript(Command):  # {{{
 | |
| 
 | |
|     description = 'Compile RapydScript to JavaScript'
 | |
| 
 | |
|     def run(self, opts):
 | |
|         from calibre.utils.rapydscript import compile_srv
 | |
|         compile_srv()
 | |
| # }}}
 | |
| 
 | |
| class Resources(Command):  # {{{
 | |
| 
 | |
|     description = 'Compile various needed calibre resources'
 | |
|     sub_commands = ['kakasi', 'coffee', 'rapydscript']
 | |
| 
 | |
|     def run(self, opts):
 | |
|         scripts = {}
 | |
|         for x in ('console', 'gui'):
 | |
|             for name in basenames[x]:
 | |
|                 if name in ('calibre-complete', 'calibre_postinstall'):
 | |
|                     continue
 | |
|                 scripts[name] = x
 | |
| 
 | |
|         dest = self.j(self.RESOURCES, 'scripts.pickle')
 | |
|         if self.newer(dest, self.j(self.SRC, 'calibre', 'linux.py')):
 | |
|             self.info('\tCreating scripts.pickle')
 | |
|             f = open(dest, 'wb')
 | |
|             cPickle.dump(scripts, f, -1)
 | |
| 
 | |
|         from calibre.web.feeds.recipes.collection import \
 | |
|                 serialize_builtin_recipes, iterate_over_builtin_recipe_files
 | |
| 
 | |
|         files = [x[1] for x in iterate_over_builtin_recipe_files()]
 | |
| 
 | |
|         dest = self.j(self.RESOURCES, 'builtin_recipes.xml')
 | |
|         if self.newer(dest, files):
 | |
|             self.info('\tCreating builtin_recipes.xml')
 | |
|             xml = serialize_builtin_recipes()
 | |
|             with open(dest, 'wb') as f:
 | |
|                 f.write(xml)
 | |
| 
 | |
|         recipe_icon_dir = self.a(self.j(self.RESOURCES, '..', 'recipes',
 | |
|             'icons'))
 | |
|         dest = os.path.splitext(dest)[0] + '.zip'
 | |
|         files += glob.glob(self.j(recipe_icon_dir, '*.png'))
 | |
|         if self.newer(dest, files):
 | |
|             self.info('\tCreating builtin_recipes.zip')
 | |
|             with zipfile.ZipFile(dest, 'w', zipfile.ZIP_STORED) as zf:
 | |
|                 for n in sorted(files, key=self.b):
 | |
|                     with open(n, 'rb') as f:
 | |
|                         zf.writestr(os.path.basename(n), f.read())
 | |
| 
 | |
|         dest = self.j(self.RESOURCES, 'ebook-convert-complete.pickle')
 | |
|         files = []
 | |
|         for x in os.walk(self.j(self.SRC, 'calibre')):
 | |
|             for f in x[-1]:
 | |
|                 if f.endswith('.py'):
 | |
|                     files.append(self.j(x[0], f))
 | |
|         if self.newer(dest, files):
 | |
|             self.info('\tCreating ebook-convert-complete.pickle')
 | |
|             complete = {}
 | |
|             from calibre.ebooks.conversion.plumber import supported_input_formats
 | |
|             complete['input_fmts'] = set(supported_input_formats())
 | |
|             from calibre.web.feeds.recipes.collection import get_builtin_recipe_titles
 | |
|             complete['input_recipes'] = [t+'.recipe ' for t in
 | |
|                     get_builtin_recipe_titles()]
 | |
|             from calibre.customize.ui import available_output_formats
 | |
|             complete['output'] = set(available_output_formats())
 | |
|             from calibre.ebooks.conversion.cli import create_option_parser
 | |
|             from calibre.utils.logging import Log
 | |
|             log = Log()
 | |
|             # log.outputs = []
 | |
|             for inf in supported_input_formats():
 | |
|                 if inf in ('zip', 'rar', 'oebzip'):
 | |
|                     continue
 | |
|                 for ouf in available_output_formats():
 | |
|                     of = ouf if ouf == 'oeb' else 'dummy.'+ouf
 | |
|                     p = create_option_parser(('ec', 'dummy1.'+inf, of, '-h'),
 | |
|                             log)[0]
 | |
|                     complete[(inf, ouf)] = [x+' 'for x in
 | |
|                             get_opts_from_parser(p)]
 | |
| 
 | |
|             cPickle.dump(complete, open(dest, 'wb'), -1)
 | |
| 
 | |
|         self.info('\tCreating template-functions.json')
 | |
|         dest = self.j(self.RESOURCES, 'template-functions.json')
 | |
|         function_dict = {}
 | |
|         import inspect
 | |
|         from calibre.utils.formatter_functions import formatter_functions
 | |
|         for obj in formatter_functions().get_builtins().values():
 | |
|             eval_func = inspect.getmembers(obj,
 | |
|                     lambda x: inspect.ismethod(x) and x.__name__ == 'evaluate')
 | |
|             try:
 | |
|                 lines = [l[4:] for l in inspect.getsourcelines(eval_func[0][1])[0]]
 | |
|             except:
 | |
|                 continue
 | |
|             lines = ''.join(lines)
 | |
|             function_dict[obj.name] = lines
 | |
|         import json
 | |
|         json.dump(function_dict, open(dest, 'wb'), indent=4)
 | |
| 
 | |
|         self.info('\tCreating editor-functions.json')
 | |
|         dest = self.j(self.RESOURCES, 'editor-functions.json')
 | |
|         function_dict = {}
 | |
|         from calibre.gui2.tweak_book.function_replace import builtin_functions
 | |
|         for func in builtin_functions():
 | |
|             try:
 | |
|                 src = ''.join(inspect.getsourcelines(func)[0][1:])
 | |
|             except Exception:
 | |
|                 continue
 | |
|             src = src.replace('def ' + func.func_name, 'def replace')
 | |
|             imports = ['from %s import %s' % (x.__module__, x.__name__) for x in func.imports]
 | |
|             if imports:
 | |
|                 src = '\n'.join(imports) + '\n\n' + src
 | |
|             function_dict[func.name] = src
 | |
|         json.dump(function_dict, open(dest, 'wb'), indent=4)
 | |
|         self.info('\tCreating user-manual-translation-stats.json')
 | |
|         d = {}
 | |
|         for lc, stats in json.load(open(self.j(self.d(self.SRC), 'manual', 'locale', 'completed.json'))).iteritems():
 | |
|             total = sum(stats.itervalues())
 | |
|             d[lc] = stats['translated'] / float(total)
 | |
|         json.dump(d, open(self.j(self.RESOURCES, 'user-manual-translation-stats.json'), 'wb'), indent=4)
 | |
| 
 | |
|     def clean(self):
 | |
|         for x in ('scripts', 'ebook-convert-complete'):
 | |
|             x = self.j(self.RESOURCES, x+'.pickle')
 | |
|             if os.path.exists(x):
 | |
|                 os.remove(x)
 | |
|         from setup.commands import kakasi, coffee
 | |
|         kakasi.clean()
 | |
|         coffee.clean()
 | |
|         for x in ('builtin_recipes.xml', 'builtin_recipes.zip',
 | |
|                 'template-functions.json', 'user-manual-translation-stats.json'):
 | |
|             x = self.j(self.RESOURCES, x)
 | |
|             if os.path.exists(x):
 | |
|                 os.remove(x)
 | |
| # }}}
 |