Code to export all data in a calibre library

This commit is contained in:
Kovid Goyal 2015-12-13 13:19:57 +05:30
parent e665108b02
commit 0db0c10811
3 changed files with 70 additions and 7 deletions

View File

@ -1295,7 +1295,7 @@ class DB(object):
except EnvironmentError: except EnvironmentError:
pass # Cover doesn't exist pass # Cover doesn't exist
def copy_cover_to(self, path, dest, windows_atomic_move=None, use_hardlink=False): def copy_cover_to(self, path, dest, windows_atomic_move=None, use_hardlink=False, report_file_size=None):
path = os.path.abspath(os.path.join(self.library_path, path, 'cover.jpg')) path = os.path.abspath(os.path.join(self.library_path, path, 'cover.jpg'))
if windows_atomic_move is not None: if windows_atomic_move is not None:
if not isinstance(dest, basestring): if not isinstance(dest, basestring):
@ -1318,6 +1318,10 @@ class DB(object):
with f: with f:
if hasattr(dest, 'write'): if hasattr(dest, 'write'):
if report_file_size is not None:
f.seek(0, os.SEEK_END)
report_file_size(f.tell())
f.seek(0)
shutil.copyfileobj(f, dest) shutil.copyfileobj(f, dest)
if hasattr(dest, 'flush'): if hasattr(dest, 'flush'):
dest.flush() dest.flush()
@ -1375,7 +1379,7 @@ class DB(object):
save_cover_data_to(data, path) save_cover_data_to(data, path)
def copy_format_to(self, book_id, fmt, fname, path, dest, def copy_format_to(self, book_id, fmt, fname, path, dest,
windows_atomic_move=None, use_hardlink=False): windows_atomic_move=None, use_hardlink=False, report_file_size=None):
path = self.format_abspath(book_id, fmt, fname, path) path = self.format_abspath(book_id, fmt, fname, path)
if path is None: if path is None:
return False return False
@ -1396,6 +1400,10 @@ class DB(object):
else: else:
if hasattr(dest, 'write'): if hasattr(dest, 'write'):
with lopen(path, 'rb') as f: with lopen(path, 'rb') as f:
if report_file_size is not None:
f.seek(0, os.SEEK_END)
report_file_size(f.tell())
f.seek(0)
shutil.copyfileobj(f, dest) shutil.copyfileobj(f, dest)
if hasattr(dest, 'flush'): if hasattr(dest, 'flush'):
dest.flush() dest.flush()
@ -1723,4 +1731,17 @@ class DB(object):
self.execute('UPDATE books SET path=? WHERE id=?', (path.replace(os.sep, '/'), book_id)) self.execute('UPDATE books SET path=? WHERE id=?', (path.replace(os.sep, '/'), book_id))
vals = [(book_id, fmt, size, name) for fmt, size, name in formats] vals = [(book_id, fmt, size, name) for fmt, size, name in formats]
self.executemany('INSERT INTO data (book,format,uncompressed_size,name) VALUES (?,?,?,?)', vals) self.executemany('INSERT INTO data (book,format,uncompressed_size,name) VALUES (?,?,?,?)', vals)
def backup_database(self, path):
    '''
    Write a copy of the database at ``self.dbpath`` to ``path``.

    After the copy completes, all rows are deleted from the
    ``metadata_dirtied`` table of the copy and the copy is vacuumed.
    Both connections are closed even if the backup or the cleanup
    statement raises.

    :param path: Filesystem path of the database file to write the copy to.
    '''
    # We have to open a new connection to self.dbpath, until this issue is fixed:
    # https://github.com/rogerbinns/apsw/issues/199
    dest_db = apsw.Connection(path)
    try:
        source = apsw.Connection(self.dbpath)
        try:
            with dest_db.backup('main', source, 'main') as b:
                # Copy in increments of 100 pages rather than all at once
                while not b.done:
                    b.step(100)
        finally:
            source.close()
        dest_db.cursor().execute('DELETE FROM metadata_dirtied; VACUUM;')
    finally:
        dest_db.close()
# }}} # }}}

View File

@ -684,7 +684,7 @@ class Cache(object):
return self.backend.cover_last_modified(path) return self.backend.cover_last_modified(path)
@read_api @read_api
def copy_cover_to(self, book_id, dest, use_hardlink=False): def copy_cover_to(self, book_id, dest, use_hardlink=False, report_file_size=None):
''' '''
Copy the cover to the file like object ``dest``. Returns False Copy the cover to the file like object ``dest``. Returns False
if no cover exists or dest is the same file as the current cover. if no cover exists or dest is the same file as the current cover.
@ -697,11 +697,11 @@ class Cache(object):
except AttributeError: except AttributeError:
return False return False
return self.backend.copy_cover_to(path, dest, return self.backend.copy_cover_to(path, dest, use_hardlink=use_hardlink,
use_hardlink=use_hardlink) report_file_size=report_file_size)
@read_api @read_api
def copy_format_to(self, book_id, fmt, dest, use_hardlink=False): def copy_format_to(self, book_id, fmt, dest, use_hardlink=False, report_file_size=None):
''' '''
Copy the format ``fmt`` to the file like object ``dest``. If the Copy the format ``fmt`` to the file like object ``dest``. If the
specified format does not exist, raises :class:`NoSuchFormat` error. specified format does not exist, raises :class:`NoSuchFormat` error.
@ -717,7 +717,7 @@ class Cache(object):
raise NoSuchFormat('Record %d has no %s file'%(book_id, fmt)) raise NoSuchFormat('Record %d has no %s file'%(book_id, fmt))
return self.backend.copy_format_to(book_id, fmt, name, path, dest, return self.backend.copy_format_to(book_id, fmt, name, path, dest,
use_hardlink=use_hardlink) use_hardlink=use_hardlink, report_file_size=report_file_size)
@read_api @read_api
def format_abspath(self, book_id, fmt): def format_abspath(self, book_id, fmt):
@ -2096,4 +2096,37 @@ class Cache(object):
if report_progress is not None: if report_progress is not None:
report_progress(i+1, len(book_ids), mi) report_progress(i+1, len(book_ids), mi)
@read_api
def export_library(self, library_key, exporter, progress=None):
    '''
    Export the database and all book files of this library via ``exporter``.

    Every exported file is stored under a key that starts with the
    hex-encoded ``library_key``. A backup copy of the database is exported
    first, followed by every format and the cover of every book. Finally
    a metadata dict mapping ``'metadata.db'`` to the database key and
    ``'format_data'`` to ``{book_id: {fmt: key}}`` is registered with
    ``exporter.set_metadata(library_key, metadata)``. Cover keys are not
    recorded in that dict.

    :param library_key: Identifier for this library, passed to ``hexlify``
        to build the key prefix.
    :param exporter: Object providing ``add_file(fileobj, key)``,
        ``set_metadata(key, metadata)`` and ``start_file(key)``. The latter
        is used as a context manager yielding a writable object that has
        ``ensure_space`` and ``discard`` methods.
    :param progress: Optional callable invoked as
        ``progress(name, current, total)``.
    '''
    from binascii import hexlify
    key_prefix = hexlify(library_key)
    book_ids = self._all_book_ids()
    total = len(book_ids) + 1  # one extra step for metadata.db
    format_metadata = {}
    if progress is not None:
        progress('metadata.db', 0, total)
    dbkey = key_prefix + ':::' + 'metadata.db'
    pt = PersistentTemporaryFile('-export.db')
    pt.close()
    try:
        self.backend.backup_database(pt.name)
        with lopen(pt.name, 'rb') as f:
            exporter.add_file(f, dbkey)
    finally:
        # Do not leave the temporary database copy behind if the backup
        # or the export of it fails
        os.remove(pt.name)
    metadata = {'format_data':format_metadata, 'metadata.db':dbkey}
    for i, book_id in enumerate(book_ids):
        if progress is not None:
            progress(self._field_for('title', book_id), i + 1, total)
        book_formats = format_metadata[book_id] = {}
        for fmt in self._formats(book_id):
            key = '%s:%s:%s' % (key_prefix, book_id, fmt)
            book_formats[fmt] = key
            with exporter.start_file(key) as dest:
                self._copy_format_to(book_id, fmt, dest, report_file_size=dest.ensure_space)
        cover_key = '%s:%s:%s' % (key_prefix, book_id, '.cover')
        with exporter.start_file(cover_key) as dest:
            # NOTE(review): this uses the public copy_cover_to while formats
            # use the underscore-prefixed _copy_format_to -- confirm the
            # asymmetry is intended
            if not self.copy_cover_to(book_id, dest, report_file_size=dest.ensure_space):
                # copy_cover_to returned a false value, so drop the entry
                dest.discard()
    exporter.set_metadata(library_key, metadata)
    if progress is not None:
        progress(_('Completed'), total, total)
# }}} # }}}

View File

@ -12,6 +12,7 @@ from io import BytesIO
from calibre.constants import iswindows from calibre.constants import iswindows
from calibre.db.tests.base import BaseTest from calibre.db.tests.base import BaseTest
from calibre.ptempfile import TemporaryDirectory
class FilesystemTest(BaseTest): class FilesystemTest(BaseTest):
@ -142,3 +143,11 @@ class FilesystemTest(BaseTest):
cache.set_field('title', {3:title}) cache.set_field('title', {3:title})
fpath = cache.format_abspath(3, 'TXT') fpath = cache.format_abspath(3, 'TXT')
self.assertEqual(sorted([os.path.basename(fpath)]), sorted(os.listdir(os.path.dirname(fpath)))) self.assertEqual(sorted([os.path.basename(fpath)]), sorted(os.listdir(os.path.dirname(fpath))))
def test_export_import(self):
    # Export the test library once per part size, each time into a fresh
    # temporary directory
    from calibre.utils.exim import Exporter
    library = self.init_cache()
    part_sizes = (1024, 100, 1)
    for size in part_sizes:
        with TemporaryDirectory('export_lib') as export_dir:
            lib_exporter = Exporter(export_dir, part_size=size)
            library.export_library('l', lib_exporter)