Sync to pluginize

2025-07-09 03:04:10 -04:00 · 2009-04-27 18:48:55 -04:00 · 2009-04-27 18:48:55 -04:00 · 9a363a02cc
commit 9a363a02cc
parent a9a18aa565 dbc2d315ed
25 changed files with 750 additions and 722 deletions
--- a/src/calibre/customize/builtins.py
+++ b/src/calibre/customize/builtins.py
@ -286,6 +286,8 @@ from calibre.ebooks.fb2.input import FB2Input
 from calibre.ebooks.odt.input import ODTInput
 from calibre.ebooks.rtf.input import RTFInput
 from calibre.ebooks.html.input import HTMLInput
 from calibre.ebooks.comic.input import ComicInput
 from calibre.web.feeds.input import RecipeInput
 from calibre.ebooks.oeb.output import OEBOutput
 from calibre.ebooks.epub.output import EPUBOutput
 from calibre.ebooks.txt.output import TXTOutput
@ -294,8 +296,8 @@ from calibre.ebooks.pdb.ereader.output import EREADEROutput
 from calibre.customize.profiles import input_profiles, output_profiles
 plugins = [HTML2ZIP, EPUBInput, MOBIInput, PDBInput, PDFInput, HTMLInput,
-        TXTInput, OEBOutput, TXTOutput, PDFOutput, LITInput,
+        TXTInput, OEBOutput, TXTOutput, PDFOutput, LITInput, ComicInput,
-        FB2Input, ODTInput, RTFInput, EPUBOutput, EREADEROutput]
+        FB2Input, ODTInput, RTFInput, EPUBOutput, EREADEROutput, RecipeInput]
 plugins += [x for x in list(locals().values()) if isinstance(x, type) and \
                                        x.__name__.endswith('MetadataReader')]
 plugins += [x for x in list(locals().values()) if isinstance(x, type) and \
--- a/src/calibre/customize/conversion.py
+++ b/src/calibre/customize/conversion.py
@ -96,6 +96,11 @@ class InputFormatPlugin(Plugin):
    #: For example: ``set(['azw', 'mobi', 'prc'])``
    file_types     = set([])
    #: If True, this input plugin generates a collection of images,
    #: one per HTML file. You can obtain access to the images via the
    #: convenience method, :method:`get_images`.
    is_image_collection = False
    #: Options shared by all Input format plugins. Do not override
    #: in sub-classes. Use :member:`options` instead. Every option must be an
    #: instance of :class:`OptionRecommendation`.
@ -128,6 +133,14 @@ class InputFormatPlugin(Plugin):
    #: (option_name, recommended_value, recommendation_level)
    recommendations = set([])
    def get_images(self):
        '''
        Give access to the images of an image collection.

        Input plugins that represent an image collection are expected to
        return a list with the absolute path of every image, ordered the
        same way as the spine and the TOC. This base implementation has
        nothing to return and always raises :class:`NotImplementedError`.
        '''
        raise NotImplementedError()
    def convert(self, stream, options, file_ext, log, accelerators):
        '''
        This method must be implemented in sub-classes. It must return
--- a/src/calibre/customize/profiles.py
+++ b/src/calibre/customize/profiles.py
@ -148,6 +148,8 @@ class OutputProfile(Plugin):
    remove_special_chars      = re.compile(u'[\u200b\u00ad]')
    # ADE falls to the ground in a dead faint when it sees an <object>
    remove_object_tags        = True
    # The image size for comics
    comic_screen_size = (584, 754)
 class SonyReaderOutput(OutputProfile):
@ -162,6 +164,18 @@ class SonyReaderOutput(OutputProfile):
    fbase                     = 12
    fsizes                    = [7.5, 9, 10, 12, 15.5, 20, 22, 24]
 class SonyReaderLandscapeOutput(SonyReaderOutput):
    # Variant of the SONY Reader profile; everything that is not set here
    # is inherited from SonyReaderOutput.
    short_name  = 'sony-landscape'
    name        = 'Sony Reader Landscape'
    description = _('This profile is intended for the SONY PRS line. '
                    'The 500/505/700 etc, in landscape mode. Mainly useful '
                    'for comics.')
    # Regular content and comic pages are rendered for the same pixel size.
    comic_screen_size         = (784, 1012)
    screen_size               = (784, 1012)
 class MSReaderOutput(OutputProfile):
    name        = 'Microsoft Reader'
@ -223,4 +237,5 @@ class KindleOutput(OutputProfile):
    fsizes                    = [12, 12, 14, 16, 18, 20, 22, 24]
 output_profiles = [OutputProfile, SonyReaderOutput, MSReaderOutput,
-        MobipocketOutput, HanlinV3Output, CybookG3Output, KindleOutput]
+        MobipocketOutput, HanlinV3Output, CybookG3Output, KindleOutput,
        SonyReaderLandscapeOutput]
--- a/src/calibre/ebooks/lrf/comic/init.py
+++ b/src/calibre/ebooks/lrf/comic/init.py
--- a/src/calibre/ebooks/comic/input.py
+++ b/src/calibre/ebooks/comic/input.py
@ -0,0 +1,460 @@
 from __future__ import with_statement
 __license__   = 'GPL v3'
 __copyright__ = '2008, Kovid Goyal kovid@kovidgoyal.net'
 __docformat__ = 'restructuredtext en'
 '''
 Based on ideas from comiclrf created by FangornUK.
 '''
 import os, shutil, traceback, textwrap
 from calibre.customize.conversion import InputFormatPlugin, OptionRecommendation
 from calibre import extract, CurrentDir
 from calibre.ptempfile import PersistentTemporaryDirectory
 from calibre.parallel import Server, ParallelJob
 def extract_comic(path_to_comic_file):
    '''
    Unpack the comic archive at `path_to_comic_file` into a newly created
    persistent temporary directory and return that directory.
    '''
    destination = PersistentTemporaryDirectory(suffix='_comic_extract')
    extract(path_to_comic_file, destination)
    return destination
 def find_pages(dir, sort_on_mtime=False, verbose=False):
    '''
    Find valid comic pages in a previously un-archived comic.

    Every file below `dir` whose name ends in a known image extension
    (compared case-insensitively) counts as a page.

    :param dir: Directory in which extracted comic lives
    :param sort_on_mtime: If True sort pages based on their last modified time.
                          Otherwise, sort alphabetically by file name
                          (the directory part is ignored).
    :param verbose: If True print the file names of the pages that were found.
    :return: List of paths to the pages, in sorted order. Empty if nothing
             was found.
    '''
    extensions = ('.jpeg', '.jpg', '.gif', '.png')
    pages = []
    for dirpath, dirnames, filenames in os.walk(dir):
        for name in filenames:
            path = os.path.join(dirpath, name)
            # endswith() accepts a tuple and succeeds if any suffix matches
            if path.lower().endswith(extensions):
                pages.append(path)
    if sort_on_mtime:
        sort_key = lambda x: os.stat(x).st_mtime
    else:
        sort_key = os.path.basename
    # A key function is evaluated once per page, whereas a cmp function
    # would stat() both files again on every single comparison.
    pages.sort(key=sort_key)
    if verbose:
        print('Found comic pages...')
        print('\t'+'\n\t'.join([os.path.basename(p) for p in pages]))
    return pages
 class PageProcessor(list):
    '''
    Contains the actual image rendering logic. See :method:`render` and
    :method:`process_pages`.

    Creating an instance renders the page immediately. The instance itself
    is the list of paths of the images that were written to `dest` (one
    entry per output page; a wide source page may produce two).
    '''
    def __init__(self, path_to_page, dest, opts, num):
        '''
        :param path_to_page: Path of the source image to render.
        :param dest: Directory the rendered images are written to.
        :param opts: Conversion options. The attributes read here are
                     landscape, right2left, disable_trim, dont_normalize,
                     keep_aspect_ratio, wide, dont_sharpen, despeckle, colors
                     and output_profile.comic_screen_size.
        :param num: Index of the page; used in the output file names. Page 0
                    additionally gets a thumbnail.
        '''
        list.__init__(self)
        self.path_to_page = path_to_page
        self.opts         = opts
        self.num          = num
        self.dest         = dest
        self.rotate       = False
        self.render()
    def render(self):
        '''
        Load the source image, create the thumbnail (first page only), decide
        whether a wide page is rotated or split in two, then hand over to
        :method:`process_pages`.

        :raises RuntimeError: If a wand cannot be created.
        :raises IOError: If the source image cannot be read.
        '''
        import calibre.utils.PythonMagickWand as pw
        img = pw.NewMagickWand()
        if img < 0:
            raise RuntimeError('Cannot create wand.')
        if not pw.MagickReadImage(img, self.path_to_page):
            # Release the wand, nothing else will ever see it
            pw.DestroyMagickWand(img)
            raise IOError('Failed to read image from: %s'%self.path_to_page)
        width  = pw.MagickGetImageWidth(img)
        height = pw.MagickGetImageHeight(img)
        if self.num == 0: # First image so create a thumbnail from it
            thumb = pw.CloneMagickWand(img)
            if thumb < 0:
                raise RuntimeError('Cannot create wand.')
            pw.MagickThumbnailImage(thumb, 60, 80)
            pw.MagickWriteImage(thumb, os.path.join(self.dest, 'thumbnail.png'))
            pw.DestroyMagickWand(thumb)
        self.pages = [img]
        if width > height:
            if self.opts.landscape:
                # Keep the page whole, it is rotated in process_pages()
                self.rotate = True
            else:
                # Split the wide page into a left and a right half
                split1, split2 = map(pw.CloneMagickWand, (img, img))
                pw.DestroyMagickWand(img)
                if split1 < 0 or split2 < 0:
                    raise RuntimeError('Cannot create wand.')
                pw.MagickCropImage(split1, (width/2)-1, height, 0, 0)
                pw.MagickCropImage(split2, (width/2)-1, height, width/2, 0 )
                # For right-to-left publications the right half comes first
                self.pages = [split2, split1] if self.opts.right2left else [split1, split2]
        self.process_pages()
    def process_pages(self):
        '''
        Apply the enabled processing steps (rotate, trim, normalize, resize,
        sharpen, grayscale, despeckle, quantize) to every wand in
        `self.pages`, write the result to `<num>_<i>.png` inside `self.dest`
        and append that path to this list. All wands are destroyed afterwards,
        whether or not processing succeeded.
        '''
        import calibre.utils.PythonMagickWand as p
        for i, wand in enumerate(self.pages):
            pw = p.NewPixelWand()
            try:
                if pw < 0:
                    raise RuntimeError('Cannot create wand.')
                p.PixelSetColor(pw, 'white')
                p.MagickSetImageBorderColor(wand, pw)
                if self.rotate:
                    p.MagickRotateImage(wand, pw, -90)
                # 25 percent fuzzy trim?
                if not self.opts.disable_trim:
                    p.MagickTrimImage(wand, 25*65535/100)
                p.MagickSetImagePage(wand, 0,0,0,0)   #Clear page after trim, like a "+repage"
                # Do the Photoshop "Auto Levels" equivalent
                if not self.opts.dont_normalize:
                    p.MagickNormalizeImage(wand)
                sizex = p.MagickGetImageWidth(wand)
                sizey = p.MagickGetImageHeight(wand)
                SCRWIDTH, SCRHEIGHT = self.opts.output_profile.comic_screen_size
                if self.opts.keep_aspect_ratio:
                    # Preserve the aspect ratio by adding border
                    aspect = float(sizex) / float(sizey)
                    if aspect <= (float(SCRWIDTH) / float(SCRHEIGHT)):
                        newsizey = SCRHEIGHT
                        newsizex = int(newsizey * aspect)
                        deltax = (SCRWIDTH - newsizex) / 2
                        deltay = 0
                    else:
                        newsizex = SCRWIDTH
                        newsizey = int(newsizex / aspect)
                        deltax = 0
                        deltay = (SCRHEIGHT - newsizey) / 2
                    p.MagickResizeImage(wand, newsizex, newsizey, p.CatromFilter, 1.0)
                    p.MagickSetImageBorderColor(wand, pw)
                    p.MagickBorderImage(wand, pw, deltax, deltay)
                elif self.opts.wide:
                    # Keep aspect and Use device height as scaled image width so landscape mode is clean
                    aspect = float(sizex) / float(sizey)
                    screen_aspect = float(SCRWIDTH) / float(SCRHEIGHT)
                    # Get dimensions of the landscape mode screen
                    # Add 25px back to height for the battery bar.
                    wscreenx = SCRHEIGHT + 25
                    wscreeny = int(wscreenx / screen_aspect)
                    if aspect <= screen_aspect:
                        newsizey = wscreeny
                        newsizex = int(newsizey * aspect)
                        deltax = (wscreenx - newsizex) / 2
                        deltay = 0
                    else:
                        newsizex = wscreenx
                        newsizey = int(newsizex / aspect)
                        deltax = 0
                        deltay = (wscreeny - newsizey) / 2
                    p.MagickResizeImage(wand, newsizex, newsizey, p.CatromFilter, 1.0)
                    p.MagickSetImageBorderColor(wand, pw)
                    p.MagickBorderImage(wand, pw, deltax, deltay)
                else:
                    # Fill the screen, ignoring the aspect ratio
                    p.MagickResizeImage(wand, SCRWIDTH, SCRHEIGHT, p.CatromFilter, 1.0)
                if not self.opts.dont_sharpen:
                    p.MagickSharpenImage(wand, 0.0, 1.0)
                p.MagickSetImageType(wand, p.GrayscaleType)
                if self.opts.despeckle:
                    p.MagickDespeckleImage(wand)
                p.MagickQuantizeImage(wand, self.opts.colors, p.RGBColorspace, 0, 1, 0)
                dest = '%d_%d.png'%(self.num, i)
                dest = os.path.join(self.dest, dest)
                # The image is written as '<name>.png8' and then renamed.
                # NOTE(review): presumably the 'png8' suffix makes ImageMagick
                # emit an 8-bit PNG -- confirm.
                p.MagickWriteImage(wand, dest+'8')
                os.rename(dest+'8', dest)
                self.append(dest)
            finally:
                if pw > 0:
                    p.DestroyPixelWand(pw)
                p.DestroyMagickWand(wand)
 def render_pages(tasks, dest, opts, notification=None):
    '''
    Entry point for the job server.

    :param tasks: Iterable of `(num, path)` pairs, one per page to render.
    :param dest: Directory the rendered images are written to.
    :param opts: Conversion options, passed on to :class:`PageProcessor`.
                 `opts.verbose` adds the traceback to failure messages.
    :param notification: Optional callable invoked as
                         `notification(0.5, msg)` after every page.
    :return: `(pages, failures)`: the paths of all rendered images and the
             source paths of the pages that could not be rendered.
    '''
    failures, pages = [], []
    from calibre.utils.PythonMagickWand import ImageMagick
    with ImageMagick():
        for num, path in tasks:
            try:
                pages.extend(PageProcessor(path, dest, opts, num))
                msg = _('Rendered %s')
            except Exception:
                # A page that cannot be rendered is recorded and skipped.
                # KeyboardInterrupt/SystemExit are deliberately not caught
                # so the job can still be interrupted.
                failures.append(path)
                msg = _('Failed %s')
                if opts.verbose:
                    msg += '\n' + traceback.format_exc()
            msg = msg%path
            if notification is not None:
                notification(0.5, msg)
    return pages, failures
 class JobManager(object):
    '''
    Bare-bones job manager: it only counts finished jobs and reports the
    overall progress through the `update` callable.
    '''
    def __init__(self, total, update):
        # These hooks do nothing but hand back the job they receive
        for hook in ('add_job', 'output', 'start_work', 'job_done'):
            setattr(self, hook, lambda j: j)
        self.done   = 0
        self.total  = total
        self.update = update
    def status_update(self, job):
        '''
        Count one more finished job and call `update` with the fraction of
        jobs done so far and the message of `job`.
        '''
        self.done += 1
        fraction = float(self.done)/self.total
        self.update(fraction, job.msg)
 def process_pages(pages, opts, update, tdir):
    '''
    Render all identified comic pages.

    The pages are split into tasks by the job server and each task is run
    as a 'render_pages' job.

    :param pages: Paths of the source pages.
    :param opts: Conversion options, handed to every job.
    :param update: Progress callable, see :class:`JobManager`.
    :param tdir: Directory the rendered images are written to.
    :return: `(rendered, failures)` accumulated over all jobs.
    :raises Exception: If a job finished without a result.
    '''
    from calibre.utils.PythonMagickWand import ImageMagick
    # NOTE(review): ImageMagick is not used in this function; presumably the
    # import is here to fail early when it cannot be loaded -- confirm.
    ImageMagick
    job_manager = JobManager(len(pages), update)
    server = Server()
    jobs = []
    try:
        for task in server.split(pages):
            job = ParallelJob('render_pages', lambda s:s, job_manager=job_manager,
                              args=[task, tdir, opts])
            jobs.append(job)
            server.add_job(job)
        server.wait()
    finally:
        # Shut the server down even when queueing or waiting failed
        server.killall()
        server.close()
    ans, failures = [], []
    for job in jobs:
        if job.result is None:
            raise Exception(_('Failed to process comic: %s\n\n%s')%(job.exception, job.traceback))
        rendered, failed = job.result
        ans += rendered
        failures += failed
    return ans, failures
 class ComicInput(InputFormatPlugin):
    '''
    Input plugin for comic archives (.cbz, .cbr) and comic collections
    (.cbc). The pages are extracted, optionally processed for the screen of
    the output profile, and wrapped one per XHTML file; the result is
    described by an OPF and an NCX written to the current directory.
    '''
    name        = 'Comic Input'
    author      = 'Kovid Goyal'
    description = 'Optimize comic files (.cbz, .cbr, .cbc) for viewing on portable devices'
    file_types  = set(['cbz', 'cbr', 'cbc'])
    is_image_collection = True
    options = set([
        OptionRecommendation(name='colors', recommended_value=64,
            help=_('Number of colors for grayscale image conversion. Default: %default')),
        OptionRecommendation(name='dont_normalize', recommended_value=False,
            help=_('Disable normalize (improve contrast) color range '
            'for pictures. Default: False')),
        OptionRecommendation(name='keep_aspect_ratio', recommended_value=False,
            help=_('Maintain picture aspect ratio. Default is to fill the screen.')),
        OptionRecommendation(name='dont_sharpen', recommended_value=False,
            help=_('Disable sharpening.')),
        OptionRecommendation(name='disable_trim', recommended_value=False,
            help=_('Disable trimming of comic pages. For some comics, '
                     'trimming might remove content as well as borders.')),
        # The name has to match the attribute read by PageProcessor.render
        # (opts.landscape)
        OptionRecommendation(name='landscape', recommended_value=False,
            help=_("Don't split landscape images into two portrait images")),
        OptionRecommendation(name='wide', recommended_value=False,
            help=_("Keep aspect ratio and scale image using screen height as "
            "image width for viewing in landscape mode.")),
        OptionRecommendation(name='right2left', recommended_value=False,
              help=_('Used for right-to-left publications like manga. '
              'Causes landscape pages to be split into portrait pages '
              'from right to left.')),
        OptionRecommendation(name='despeckle', recommended_value=False,
              help=_('Enable Despeckle. Reduces speckle noise. '
              'May greatly increase processing time.')),
        OptionRecommendation(name='no_sort', recommended_value=False,
              help=_("Don't sort the files found in the comic "
              "alphabetically by name. Instead use the order they were "
              "added to the comic.")),
        OptionRecommendation(name='no_process', recommended_value=False,
              help=_("Apply no processing to the image")),
        ])
    recommendations = set([
        ('margin_left', 0, OptionRecommendation.HIGH),
        ('margin_top',  0, OptionRecommendation.HIGH),
        ('margin_right', 0, OptionRecommendation.HIGH),
        ('margin_bottom', 0, OptionRecommendation.HIGH),
        ('insert_blank_line', False, OptionRecommendation.HIGH),
        ('remove_paragraph_spacing',  False, OptionRecommendation.HIGH),
        ('dont_justify', True, OptionRecommendation.HIGH),
        ('dont_split_on_pagebreaks', True, OptionRecommendation.HIGH),
        ('chapter', None, OptionRecommendation.HIGH),
        ('page_breaks_before', None, OptionRecommendation.HIGH),
        ('use_auto_toc', False, OptionRecommendation.HIGH),
        ])
    def get_comics_from_collection(self, stream):
        '''
        Unzip a comic collection and read its `comics.txt` index.

        Every line of `comics.txt` has the form `path:title`; the title is
        optional and defaults to the file name without its extension.
        Entries whose file is not readable are skipped.

        :return: List of `[title, absolute path]` entries.
        :raises ValueError: If `comics.txt` is missing or no listed comic is
                            readable.
        '''
        from calibre.libunzip import extract as zipextract
        tdir = PersistentTemporaryDirectory('_comic_collection')
        zipextract(stream, tdir)
        comics = []
        with CurrentDir(tdir):
            if not os.path.exists('comics.txt'):
                raise ValueError('%s is not a valid comic collection'
                        %stream.name)
            with open('comics.txt', 'rb') as index:
                raw = index.read().decode('utf-8')
            for line in raw.splitlines():
                fname, sep, title = line.partition(':')
                fname = os.path.join(tdir, *fname.split('/'))
                if not title:
                    title = os.path.basename(fname).rpartition('.')[0]
                if os.access(fname, os.R_OK):
                    comics.append([title, fname])
        if not comics:
            raise ValueError('%s has no comics'%stream.name)
        return comics
    def get_pages(self, comic, tdir2):
        '''
        Extract `comic` and return the paths of its pages inside `tdir2`.

        With the `no_process` option the pages are copied unchanged,
        otherwise they are rendered by :func:`process_pages`. Pages that
        fail to render are reported through the log.

        :raises ValueError: If the comic contains no pages or none of them
                            could be rendered.
        '''
        tdir  = extract_comic(comic)
        new_pages = find_pages(tdir, sort_on_mtime=self.opts.no_sort,
                verbose=self.opts.verbose)
        thumbnail = None
        if not new_pages:
            raise ValueError('Could not find any pages in the comic: %s'
                    %comic)
        if self.opts.no_process:
            n2 = []
            for page in new_pages:
                n2.append(os.path.join(tdir2, os.path.basename(page)))
                shutil.copyfile(page, n2[-1])
            new_pages = n2
        else:
            new_pages, failures = process_pages(new_pages, self.opts,
                    self.progress, tdir2)
            if not new_pages:
                raise ValueError('Could not find any valid pages in comic: %s'
                        % comic)
            if failures:
                self.log.warning('Could not process the following pages '
                '(run with --verbose to see why):')
                for f in failures:
                    self.log.warning('\t', f)
            # NOTE: the thumbnail path is determined but not used yet
            thumbnail = os.path.join(tdir2, 'thumbnail.png')
            if not os.access(thumbnail, os.R_OK):
                thumbnail = None
        return new_pages
    def get_images(self):
        '''
        Return the page images of all comics handled by the last call to
        :method:`convert`, in spine order.
        '''
        return self._images
    def convert(self, stream, opts, file_ext, log, accelerators,
            progress=lambda p, m : m):
        '''
        Convert the comic (or comic collection, for `cbc`) in `stream`.

        Pages and their XHTML wrappers are created in the current directory
        (in `comic_<n>` sub-directories when there is more than one comic),
        together with `metadata.opf` and `toc.ncx`.

        :return: Absolute path to the generated `metadata.opf`.
        :raises ValueError: If no comic pages were found.
        '''
        from calibre.ebooks.metadata import MetaInformation
        from calibre.ebooks.metadata.opf2 import OPFCreator
        from calibre.ebooks.metadata.toc import TOC
        self.opts, self.log, self.progress = opts, log, progress
        if file_ext == 'cbc':
            comics_ = self.get_comics_from_collection(stream)
        else:
            comics_ = [['Comic', os.path.abspath(stream.name)]]
        stream.close()
        comics = []
        for i, x in enumerate(comics_):
            title, fname = x
            cdir = 'comic_%d'%(i+1) if len(comics_) > 1 else '.'
            cdir = os.path.abspath(cdir)
            if not os.path.exists(cdir):
                os.makedirs(cdir)
            pages = self.get_pages(fname, cdir)
            if not pages: continue
            wrappers = self.create_wrappers(pages)
            comics.append((title, pages, wrappers))
        if not comics:
            raise ValueError('No comic pages found in %s'%stream.name)
        mi  = MetaInformation(os.path.basename(stream.name).rpartition('.')[0],
            [_('Unknown')])
        opf = OPFCreator(os.path.abspath('.'), mi)
        entries = []
        def href(x):
            # A single comic lives in the current directory, several comics
            # each live in their own sub-directory
            if len(comics) == 1: return os.path.basename(x)
            return '/'.join(x.split(os.sep)[-2:])
        for comic in comics:
            pages, wrappers = comic[1:]
            entries += [(w, None) for w in map(href, wrappers)] + \
                    [(x, None) for x in map(href, pages)]
        opf.create_manifest(entries)
        spine = []
        for comic in comics:
            spine.extend(map(href, comic[2]))
        self._images = []
        for comic in comics:
            self._images.extend(comic[1])
        opf.create_spine(spine)
        toc = TOC()
        if len(comics) == 1:
            wrappers = comics[0][2]
            for i, x in enumerate(wrappers):
                toc.add_item(href(x), None, _('Page')+' %d'%(i+1),
                        play_order=i)
        else:
            po = 0
            for comic in comics:
                po += 1
                wrappers = comic[2]
                stoc = toc.add_item(href(wrappers[0]),
                        None, comic[0], play_order=po)
                for i, x in enumerate(wrappers):
                    stoc.add_item(href(x), None,
                            _('Page')+' %d'%(i+1), play_order=po)
                    po += 1
        opf.set_toc(toc)
        # Make sure both files are flushed and closed before returning
        with open('metadata.opf', 'wb') as m:
            with open('toc.ncx', 'wb') as n:
                opf.render(m, n, 'toc.ncx')
        return os.path.abspath('metadata.opf')
    def create_wrappers(self, pages):
        '''
        Write one XHTML wrapper (`page_<n>.xhtml`) per page image, next to
        the first page, and return the paths of the wrappers in page order.

        `pages` must not be empty.
        '''
        from calibre.ebooks.oeb.base import XHTML_NS
        wrappers = []
        WRAPPER = textwrap.dedent('''\
        <html xmlns="%s">
            <head>
                <title>Page #%d</title>
                <style type="text/css">
                    @page { margin:0pt; padding: 0pt}
                    body { margin: 0pt; padding: 0pt}
                    div { text-align: center }
                </style>
            </head>
            <body>
                <div>
                    <img src="%s" alt="comic page #%d" />
                </div>
            </body>
        </html>
        ''')
        base = os.path.dirname(pages[0])
        for i, page in enumerate(pages):
            wrapper = WRAPPER%(XHTML_NS, i+1, os.path.basename(page), i+1)
            page = os.path.join(base, 'page_%d.xhtml'%(i+1))
            with open(page, 'wb') as f:
                f.write(wrapper)
            wrappers.append(page)
        return wrappers
--- a/src/calibre/ebooks/conversion/cli.py
+++ b/src/calibre/ebooks/conversion/cli.py
@ -47,12 +47,12 @@ def print_help(parser, log):
 def check_command_line_options(parser, args, log):
    if len(args) < 3 or args[1].startswith('-') or args[2].startswith('-'):
-        print_help(parser)
+        print_help(parser, log)
        log.error('\n\nYou must specify the input AND output files')
        raise SystemExit(1)
    input = os.path.abspath(args[1])
-    if not os.access(input, os.R_OK):
+    if not input.endswith('.recipe') and not os.access(input, os.R_OK):
        log.error('Cannot read from', input)
        raise SystemExit(1)
@ -169,6 +169,9 @@ def add_pipeline_options(parser, plumber):
            if rec.level < rec.HIGH:
                option_recommendation_to_cli_option(add_option, rec)
    option_recommendation_to_cli_option(parser.add_option,
            plumber.get_option_by_name('list_recipes'))
 def option_parser():
    return OptionParser(usage=USAGE)
--- a/src/calibre/ebooks/conversion/plumber.py
+++ b/src/calibre/ebooks/conversion/plumber.py
@ -360,6 +360,10 @@ OptionRecommendation(name='book_producer',
 OptionRecommendation(name='language',
    recommended_value=None, level=OptionRecommendation.LOW,
    help=_('Set the language.')),
 OptionRecommendation(name='list_recipes',
    recommended_value=False, help=_('List available recipes.')),
 ]
        input_fmt = os.path.splitext(self.input)[1]
@ -525,6 +529,13 @@ OptionRecommendation(name='language',
        self.setup_options()
        if self.opts.verbose:
            self.log.filter_level = self.log.DEBUG
        if self.opts.list_recipes:
            from calibre.web.feeds.recipes import titles
            self.log('Available recipes:')
            for title in sorted(titles):
                self.log('\t'+title)
            self.log('%d recipes available'%len(titles))
            raise SystemExit(0)
        # Run any preprocess plugins
        from calibre.customize.ui import run_plugins_on_preprocess
@ -535,8 +546,13 @@ OptionRecommendation(name='language',
        accelerators = {}
        tdir = PersistentTemporaryDirectory('_plumber')
        stream = self.input if self.input_fmt == 'recipe' else \
                open(self.input, 'rb')
-        self.oeb = self.input_plugin(open(self.input, 'rb'), self.opts,
+        if hasattr(self.opts, 'lrf') and self.output_plugin.file_type == 'lrf':
            self.opts.lrf = True
        self.oeb = self.input_plugin(stream, self.opts,
                                    self.input_fmt, self.log,
                                    accelerators, tdir)
        if self.opts.debug_input is not None:
--- a/src/calibre/ebooks/lit/reader.py
+++ b/src/calibre/ebooks/lit/reader.py
@ -882,6 +882,9 @@ class LitContainer(object):
            unbin = UnBinary(raw, path, self._litfile.manifest, OPF_MAP)
        return str(unbin)
    def get_metadata(self):
        '''
        Return the result of :method:`_read_meta` for this container.
        '''
        metadata = self._read_meta()
        return metadata
 class LitReader(OEBReader):
    Container = LitContainer
--- a/src/calibre/ebooks/lrf/comic/convert_from.py
+++ b/src/calibre/ebooks/lrf/comic/convert_from.py
@ -1,562 +0,0 @@
 from __future__ import with_statement
 __license__   = 'GPL v3'
 __copyright__ = '2008, Kovid Goyal kovid@kovidgoyal.net'
 __docformat__ = 'restructuredtext en'
 '''
 Based on ideas from comiclrf created by FangornUK.
 '''
 import os, sys, shutil, traceback, textwrap, fnmatch
 from uuid import uuid4
 from calibre import extract, terminal_controller, __appname__, __version__
 from calibre.utils.config import Config, StringConfig
 from calibre.ptempfile import PersistentTemporaryDirectory
 from calibre.parallel import Server, ParallelJob
 from calibre.utils.terminfo import ProgressBar
 from calibre.ebooks.lrf.pylrs.pylrs import Book, BookSetting, ImageStream, ImageBlock
 from calibre.ebooks.metadata import MetaInformation
 from calibre.ebooks.metadata.opf import OPFCreator
 from calibre.ebooks.epub.from_html import config as html2epub_config, convert as html2epub
 from calibre.customize.ui import run_plugins_on_preprocess
 try:
    from calibre.utils.PythonMagickWand import \
            NewMagickWand, NewPixelWand, \
            MagickSetImageBorderColor, \
            MagickReadImage, MagickRotateImage, \
            MagickTrimImage, PixelSetColor,\
            MagickNormalizeImage, MagickGetImageWidth, \
            MagickGetImageHeight, \
            MagickResizeImage, MagickSetImageType, \
            GrayscaleType, CatromFilter,  MagickSetImagePage, \
            MagickBorderImage, MagickSharpenImage, MagickDespeckleImage, \
            MagickQuantizeImage, RGBColorspace, \
            MagickWriteImage, DestroyPixelWand, \
            DestroyMagickWand, CloneMagickWand, \
            MagickThumbnailImage, MagickCropImage, ImageMagick
    _imagemagick_loaded = True
 except:
    _imagemagick_loaded = False
 # Screen geometry of the supported output device profiles. The functions in
 # this module look the size up by profile name, e.g. PROFILES[opts.profile].
 PROFILES = {
            # Name : (width, height) in pixels
            'prs500':(584, 754),
            # SONY's LRF renderer (on the PRS500) only uses the first 800x600
            # block of the image
            'prs500-landscape': (784, 1012)
            }
 def extract_comic(path_to_comic_file):
    '''
    Unpack a comic archive into a newly created temporary directory.

    :param path_to_comic_file: Path of the comic archive to unpack.
    :return: The directory the archive was extracted into.
    '''
    destination = PersistentTemporaryDirectory(suffix='_comic_extract')
    extract(path_to_comic_file, destination)
    return destination
 def find_pages(dir, sort_on_mtime=False, verbose=False):
    '''
    Find valid comic pages in a previously un-archived comic.

    The directory is searched recursively; a file counts as a page when its
    name ends (case-insensitively) in ``.jpeg``, ``.jpg``, ``.gif`` or
    ``.png``.

    :param dir: Directory in which extracted comic lives
    :param sort_on_mtime: If True sort pages based on their last modified time.
                          Otherwise, sort alphabetically by file name.
    :param verbose: If True print the file names of the pages that were found.
    :return: List of the paths of all pages, sorted as requested.
    '''
    # str.endswith accepts a tuple, so one call tests every extension
    extensions = ('.jpeg', '.jpg', '.gif', '.png')
    pages = []
    for dirpath, _dirnames, filenames in os.walk(dir):
        for name in filenames:
            path = os.path.join(dirpath, name)
            if path.lower().endswith(extensions):
                pages.append(path)
    # A key function is evaluated once per page, whereas a cmp function
    # would stat() the same files again on every comparison. The sort is
    # stable either way, so ties keep their os.walk order.
    if sort_on_mtime:
        sort_key = lambda x: os.stat(x).st_mtime
    else:
        sort_key = os.path.basename
    pages.sort(key=sort_key)
    if verbose:
        # Single-argument prints behave the same as a statement or a function
        print('Found comic pages...')
        print('\t'+'\n\t'.join([os.path.basename(p) for p in pages]))
    return pages
 class PageProcessor(list):
    '''
    Contains the actual image rendering logic. See :method:`render` and
    :method:`process_pages`.

    Creating an instance renders the page immediately. Afterwards the
    instance is a list holding the paths of the image files written for the
    page: two when a landscape page was split, otherwise one.

    :param path_to_page: Path of the source image.
    :param dest: Directory the rendered images are written to.
    :param opts: Options object. The attributes read are ``landscape``,
                 ``right2left``, ``disable_trim``, ``dont_normalize``,
                 ``profile``, ``keep_aspect_ratio``, ``wide``,
                 ``dont_sharpen``, ``despeckle`` and ``colors``.
    :param num: Number of the page; page 0 additionally produces
                ``thumbnail.png`` in `dest`.
    '''

    def __init__(self, path_to_page, dest, opts, num):
        list.__init__(self)
        self.path_to_page = path_to_page
        self.opts         = opts
        self.num          = num
        self.dest         = dest
        self.rotate       = False
        self.render()

    def render(self):
        '''
        Read the source image, write the thumbnail if this is the first page
        and decide how a landscape page is handled: rotated when
        ``opts.landscape`` is set, otherwise split into two halves. The
        resulting wand(s) are then passed through :method:`process_pages`.

        :raises RuntimeError: If a wand cannot be created.
        :raises IOError: If the image cannot be read.
        '''
        img = NewMagickWand()
        if img < 0:
            raise RuntimeError('Cannot create wand.')
        if not MagickReadImage(img, self.path_to_page):
            # Nothing else holds a reference to the wand, release it here
            DestroyMagickWand(img)
            raise IOError('Failed to read image from: %s'%self.path_to_page)
        width  = MagickGetImageWidth(img)
        height = MagickGetImageHeight(img)
        if self.num == 0: # First image so create a thumbnail from it
            thumb = CloneMagickWand(img)
            if thumb < 0:
                raise RuntimeError('Cannot create wand.')
            MagickThumbnailImage(thumb, 60, 80)
            MagickWriteImage(thumb, os.path.join(self.dest, 'thumbnail.png'))
            DestroyMagickWand(thumb)
        self.pages = [img]
        if width > height:
            if self.opts.landscape:
                self.rotate = True
            else:
                split1, split2 = map(CloneMagickWand, (img, img))
                DestroyMagickWand(img)
                if split1 < 0 or split2 < 0:
                    raise RuntimeError('Cannot create wand.')
                # Left and right half of the double page
                MagickCropImage(split1, (width//2)-1, height, 0, 0)
                MagickCropImage(split2, (width//2)-1, height, width//2, 0 )
                self.pages = [split2, split1] if self.opts.right2left else [split1, split2]
        self.process_pages()

    @staticmethod
    def _fit_geometry(sizex, sizey, boxx, boxy, box_aspect):
        '''
        Scale an image of `sizex` x `sizey` pixels into a box of `boxx` x
        `boxy` pixels while keeping its aspect ratio.

        :param box_aspect: Aspect ratio the image is compared against to decide
                           whether the box height or the box width limits it.
        :return: ``(newsizex, newsizey, deltax, deltay)`` where the deltas are
                 the border widths that pad the scaled image to the box.
        '''
        aspect = float(sizex) / float(sizey)
        if aspect <= box_aspect:
            newsizey = boxy
            newsizex = int(newsizey * aspect)
            return newsizex, newsizey, (boxx - newsizex) // 2, 0
        newsizex = boxx
        newsizey = int(newsizex / aspect)
        return newsizex, newsizey, 0, (boxy - newsizey) // 2

    def process_pages(self):
        '''
        Apply the image processing pipeline (rotate, trim, normalize, resize,
        sharpen, grayscale, despeckle, quantize) to every wand in
        ``self.pages``, write each result to ``<num>_<i>.png`` in
        ``self.dest`` and append that path to this list. Every wand is
        destroyed once it has been handled.

        :raises RuntimeError: If a pixel wand cannot be created.
        '''
        for i, wand in enumerate(self.pages):
            pw = NewPixelWand()
            try:
                if pw < 0:
                    raise RuntimeError('Cannot create wand.')
                PixelSetColor(pw, 'white')

                MagickSetImageBorderColor(wand, pw)
                if self.rotate:
                    MagickRotateImage(wand, pw, -90)

                # 25 percent fuzzy trim?
                if not self.opts.disable_trim:
                    MagickTrimImage(wand, 25*65535//100)
                MagickSetImagePage(wand, 0,0,0,0)   #Clear page after trim, like a "+repage"
                # Do the Photoshop "Auto Levels" equivalent
                if not self.opts.dont_normalize:
                    MagickNormalizeImage(wand)
                sizex = MagickGetImageWidth(wand)
                sizey = MagickGetImageHeight(wand)

                SCRWIDTH, SCRHEIGHT = PROFILES[self.opts.profile]
                screen_aspect = float(SCRWIDTH) / float(SCRHEIGHT)

                if self.opts.keep_aspect_ratio or self.opts.wide:
                    if self.opts.keep_aspect_ratio:
                        # Preserve the aspect ratio by adding border
                        boxx, boxy = SCRWIDTH, SCRHEIGHT
                    else:
                        # Keep aspect and use device height as scaled image
                        # width so landscape mode is clean.
                        # Add 25px back to height for the battery bar.
                        boxx = SCRHEIGHT + 25
                        boxy = int(boxx / screen_aspect)
                    newsizex, newsizey, deltax, deltay = self._fit_geometry(
                            sizex, sizey, boxx, boxy, screen_aspect)
                    MagickResizeImage(wand, newsizex, newsizey, CatromFilter, 1.0)
                    MagickSetImageBorderColor(wand, pw)
                    MagickBorderImage(wand, pw, deltax, deltay)
                else:
                    # Fill the screen, ignoring the aspect ratio
                    MagickResizeImage(wand, SCRWIDTH, SCRHEIGHT, CatromFilter, 1.0)

                if not self.opts.dont_sharpen:
                    MagickSharpenImage(wand, 0.0, 1.0)

                MagickSetImageType(wand, GrayscaleType)

                if self.opts.despeckle:
                    MagickDespeckleImage(wand)

                MagickQuantizeImage(wand, self.opts.colors, RGBColorspace, 0, 1, 0)
                dest = '%d_%d.png'%(self.num, i)
                dest = os.path.join(self.dest, dest)
                # NOTE(review): the temporary '.png8' name presumably selects
                # ImageMagick's 8-bit PNG writer - confirm
                MagickWriteImage(wand, dest+'8')
                os.rename(dest+'8', dest)
                self.append(dest)
            finally:
                if pw > 0:
                    DestroyPixelWand(pw)
                DestroyMagickWand(wand)
 def render_pages(tasks, dest, opts, notification=None):
    '''
    Entry point for the job server.

    Renders every page in `tasks` with :class:`PageProcessor`. A page that
    fails to render is recorded and does not stop the remaining pages.

    :param tasks: Iterable of ``(num, path)`` pairs, the page number and the
                  path of the page image.
    :param dest: Directory the rendered images are written to.
    :param opts: Options object; ``opts.verbose`` adds the traceback to the
                 failure message.
    :param notification: Optional callable, invoked as
                         ``notification(0.5, msg)`` after every page.
    :return: ``(pages, failures)``: the paths of the rendered images and the
             paths of the source pages that could not be rendered.
    '''
    failures, pages = [], []
    with ImageMagick():
        for num, path in tasks:
            try:
                pages.extend(PageProcessor(path, dest, opts, num))
                msg = _('Rendered %s')
            except Exception:
                # Best effort: a bad page must not abort the batch. Unlike a
                # bare except this lets KeyboardInterrupt and SystemExit
                # through, so the worker can still be stopped.
                failures.append(path)
                msg = _('Failed %s')
                if opts.verbose:
                    msg += '\n' + traceback.format_exc()
            msg = msg%path
            if notification is not None:
                notification(0.5, msg)

    return pages, failures
 class JobManager(object):
    '''
    Minimal job manager: counts the jobs that have reported a status and
    forwards the overall progress to a callback.
    '''

    def __init__(self, total, update):
        # The remaining job manager hooks just hand their argument back
        for hook in ('add_job', 'output', 'start_work', 'job_done'):
            setattr(self, hook, lambda j: j)
        self.done   = 0
        self.update = update
        self.total  = total

    def status_update(self, job):
        '''
        Count `job` as done and call the update callback with the fraction
        of jobs done so far and ``job.msg``.
        '''
        self.done += 1
        fraction = float(self.done)/self.total
        self.update(fraction, job.msg)
 def process_pages(pages, opts, update):
    '''
    Render all identified comic pages via the parallel job server.

    :param pages: The pages to render; split into tasks by ``Server.split``.
    :param opts: Options object handed on to every ``render_pages`` job.
    :param update: Progress callback given to the :class:`JobManager`.
    :return: ``(rendered, failures, tdir)``: the combined results of all jobs
             and the temporary directory the jobs were told to write to.
    :raises RuntimeError: If ImageMagick could not be loaded.
    :raises Exception: If a job finished without a result.
    '''
    if not _imagemagick_loaded:
        raise RuntimeError('Failed to load ImageMagick')

    tdir = PersistentTemporaryDirectory('_comic2lrf_pp')
    job_manager = JobManager(len(pages), update)
    server = Server()
    jobs = []
    for task in server.split(pages):
        job = ParallelJob('render_pages', lambda s:s, job_manager=job_manager,
                          args=[task, tdir, opts])
        jobs.append(job)
        server.add_job(job)
    server.wait()
    server.killall()
    server.close()

    rendered, failed = [], []
    for job in jobs:
        if job.result is None:
            raise Exception(_('Failed to process comic: %s\n\n%s')%(job.exception, job.traceback))
        job_pages, job_failures = job.result
        rendered.extend(job_pages)
        failed.extend(job_failures)
    return rendered, failed, tdir
 def config(defaults=None,output_format='lrf'):
    '''
    Build the configuration object describing every comic conversion option.

    :param defaults: If None the options live in a ``Config`` named
                     ``comic``, otherwise in a ``StringConfig`` created from
                     `defaults`.
    :param output_format: The ``--no_process`` option is only added for
                          ``'pdf'``.
    :return: The configuration object with all options added.
    '''
    desc = _('Options to control the conversion of comics (CBR, CBZ) files into ebooks')
    conf = Config('comic', desc) if defaults is None else StringConfig(defaults, desc)
    add = conf.add_opt

    # Metadata and output location
    add('title', ['-t', '--title'],
        help=_('Title for generated ebook. Default is to use the filename.'))
    add('author', ['-a', '--author'],
        help=_('Set the author in the metadata of the generated ebook. Default is %default'),
        default=_('Unknown'))
    add('output', ['-o', '--output'],
        help=_('Path to output file. By default a file is created in the current directory.'))

    # Image processing
    add('colors', ['-c', '--colors'], type='int', default=64,
        help=_('Number of colors for grayscale image conversion. Default: %default'))
    add('dont_normalize', ['-n', '--disable-normalize'], default=False,
        help=_('Disable normalize (improve contrast) color range for pictures. Default: False'))
    add('keep_aspect_ratio', ['-r', '--keep-aspect-ratio'], default=False,
        help=_('Maintain picture aspect ratio. Default is to fill the screen.'))
    add('dont_sharpen', ['-s', '--disable-sharpen'], default=False,
        help=_('Disable sharpening.'))
    add('disable_trim', ['--disable-trim'], default=False,
        help=_('Disable trimming of comic pages. For some comics, '
               'trimming might remove content as well as borders.'))
    add('landscape', ['-l', '--landscape'], default=False,
        help=_("Don't split landscape images into two portrait images"))
    add('wide', ['-w', '--wide-aspect'], default=False,
        help=_("Keep aspect ratio and scale image using screen height as image width for viewing in landscape mode."))
    add('right2left', ['--right2left'], default=False, action='store_true',
        help=_('Used for right-to-left publications like manga. Causes landscape pages to be split into portrait pages from right to left.'))
    add('despeckle', ['-d', '--despeckle'], default=False,
        help=_('Enable Despeckle. Reduces speckle noise. May greatly increase processing time.'))

    # Page order and target device
    add('no_sort', ['--no-sort'], default=False,
        help=_("Don't sort the files found in the comic alphabetically by name. Instead use the order they were added to the comic."))
    add('profile', ['-p', '--profile'], default='prs500', choices=PROFILES.keys(),
        help=_('Choose a profile for the device you are generating this file for. The default is the SONY PRS-500 with a screen size of 584x754 pixels. This is suitable for any reader with the same screen size. Choices are %s')%PROFILES.keys())

    # Console output
    add('verbose', ['-v', '--verbose'], default=0, action='count',
        help=_('Be verbose, useful for debugging. Can be specified multiple times for greater verbosity.'))
    add('no_progress_bar', ['--no-progress-bar'], default=False,
        help=_("Don't show progress bar."))

    if output_format == 'pdf':
        add('no_process',['--no_process'], default=False,
            help=_("Apply no processing to the image"))
    return conf
 def option_parser(output_format='lrf'):
    '''
    Create the command line option parser of the comic converter.

    :param output_format: Passed on to :func:`config`.
    :return: The option parser built from that configuration.
    '''
    comic_config = config(output_format=output_format)
    usage = _('''\
 %prog [options] comic.cb[z|r]
 Convert a comic in a CBZ or CBR file to an ebook. 
 ''')
    return comic_config.option_parser(usage=usage)
 def create_epub(pages, profile, opts, thumbnail=None):
    '''
    Create an EPUB file from the rendered pages.

    One HTML wrapper is written next to the page images for every page, an
    OPF listing the wrappers is created in the same directory and that OPF
    is then converted with html2epub.

    :param pages: Paths of the rendered page images. Must not be empty; the
                  directory of the first page receives the generated files.
    :param profile: Unused.
    :param opts: Options object; ``title``, ``author`` and ``output`` are read.
    :param thumbnail: Unused.
    '''
    wrappers = []
    WRAPPER = textwrap.dedent('''\
    <html>
        <head>
            <title>Page #%d</title>
            <style type="text/css">@page {margin:0pt; padding: 0pt;}</style>
        </head>
        <body style="margin: 0pt; padding: 0pt">
            <div style="text-align:center">
                <img src="%s" alt="comic page #%d" />
            </div>
        </body>
    </html>        
    ''')
    base = os.path.dirname(pages[0])
    for i, page in enumerate(pages):
        wrapper = WRAPPER%(i+1, os.path.basename(page), i+1)
        page = os.path.join(base, 'page_%d.html'%(i+1))
        # Close every file explicitly: html2epub reads these files back, so
        # their content has to be on disk by then
        with open(page, 'wb') as f:
            f.write(wrapper)
        wrappers.append(page)
    mi  = MetaInformation(opts.title, [opts.author])
    opf = OPFCreator(base, mi)
    opf.create_manifest([(w, None) for w in wrappers])
    opf.create_spine(wrappers)
    metadata = os.path.join(base, 'metadata.opf')
    with open(metadata, 'wb') as f:
        opf.render(f)
    opts2 = html2epub_config('margin_left=0\nmargin_right=0\nmargin_top=0\nmargin_bottom=0').parse()
    opts2.output = opts.output
    html2epub(metadata, opts2)
 def create_lrf(pages, profile, opts, thumbnail=None):
    width, height = PROFILES[profile]
    ps = {}
    ps['topmargin']      = 0
    ps['evensidemargin'] = 0
    ps['oddsidemargin']  = 0
    ps['textwidth']      = width
    ps['textheight']     = height
    book = Book(title=opts.title, author=opts.author,
            bookid=uuid4().hex,
            publisher='%s %s'%(__appname__, __version__), thumbnail=thumbnail,
            category='Comic', pagestyledefault=ps, 
            booksetting=BookSetting(screenwidth=width, screenheight=height))
    for page in pages:
        imageStream = ImageStream(page)
        _page = book.create_page()
        _page.append(ImageBlock(refstream=imageStream, 
                    blockwidth=width, blockheight=height, xsize=width, 
                    ysize=height, x1=width, y1=height))
        book.append(_page)
    book.renderLrf(open(opts.output, 'wb'))
    print _('Output written to'), opts.output
 def create_pdf(pages, profile, opts, thumbnail=None,toc=None):
    '''
    Create a PDF file with one image per page and, when several comics were
    combined, an outline built from the paths of the source comics.

    :param pages: Paths of the page images, in output order.
    :param profile: Key into ``PROFILES`` giving the page size.
    :param opts: Options object; ``output``, ``author``, ``title`` and
                 ``keep_aspect_ratio`` are read.
    :param thumbnail: Unused.
    :param toc: Optional list of ``(path of source comic, index of its first
                page)`` tuples. No outline is written for fewer than two
                entries. The list itself is not modified.
    :raises RuntimeError: If a wand cannot be created.
    :raises IOError: If a page image cannot be read.
    '''
    width, height = PROFILES[profile]

    from reportlab.pdfgen import canvas

    cur_page = 0
    heading = []
    if toc is not None and len(toc) < 2:
        # An outline only makes sense for two or more comics
        toc = None
    if toc is not None:
        # rem is the position of the last path separator inside the part
        # that all comic paths have in common (0 if there is none); what
        # follows it distinguishes the comics.
        prefix = os.path.commonprefix([entry[0] for entry in toc])
        rem = max(prefix.rfind(os.sep), 0)
        toc_index = 0
        # Sentinel that never matches a page number, so toc[toc_index] stays
        # valid after the last real entry. Added to a copy to leave the
        # caller's list alone.
        toc = list(toc) + [("Not seen",-1)]

    pdf = canvas.Canvas(filename=opts.output, pagesize=(width,height+15))
    pdf.setAuthor(opts.author)
    pdf.setTitle(opts.title)

    for page in pages:
        if opts.keep_aspect_ratio:
            img = NewMagickWand()
            if img < 0:
                raise RuntimeError('Cannot create wand.')
            try:
                if not MagickReadImage(img, page):
                    raise IOError('Failed to read image from: %s'%page)
                sizex = MagickGetImageWidth(img)
                sizey = MagickGetImageHeight(img)
            finally:
                # The wand is only needed to measure the image
                DestroyMagickWand(img)
            # Preserve the aspect ratio by adding border
            aspect = float(sizex) / float(sizey)
            if aspect <= (float(width) / float(height)):
                newsizey = height
                newsizex = int(newsizey * aspect)
                deltax = (width - newsizex) // 2
                deltay = 0
            else:
                newsizex = width
                newsizey = int(newsizex / aspect)
                deltax = 0
                deltay = (height - newsizey) // 2
            pdf.drawImage(page, x=deltax,y=deltay,width=newsizex, height=newsizey)
        else:
            pdf.drawImage(page, x=0,y=0,width=width, height=height)
        if toc is not None:
            if toc[toc_index][1] == cur_page:
                # First page of the next comic: add one outline level per
                # path component after the common prefix, skipping levels
                # whose heading is unchanged. The last four characters of
                # the path are cut off as the file extension.
                tmp = toc[toc_index][0]
                toc_current = tmp[rem:len(tmp)-4]
                index = 0
                while True:
                    key = 'page%d-%d' % (cur_page, index)
                    pdf.bookmarkPage(key)
                    head, sep, rest = toc_current.partition(os.sep)
                    if index >= len(heading):
                        heading.append(head)
                        pdf.addOutlineEntry(title=head,key=key,level=index)
                    elif heading[index] != head:
                        heading[index] = head
                        pdf.addOutlineEntry(title=head,key=key,level=index)
                    index += 1
                    toc_current = rest
                    if sep == "":
                        break
                toc_index += 1
            cur_page += 1
        pdf.showPage()
    # Write the document to disk
    pdf.save()
 def do_convert(path_to_file, opts, notification=lambda m, p: p, output_format='lrf'):
    '''
    Convert a comic, or every comic found in a directory, into one ebook.

    :param path_to_file: Path of a comic file, or of a directory that is
                         searched recursively for ``*.cbr`` and ``*.cbz``
                         files. It is run through the preprocess plugins
                         first.
    :param opts: Options object. ``title`` and ``output`` are filled in from
                 the source name when they are empty.
    :param notification: Progress callback handed to :func:`process_pages`.
    :param output_format: ``'lrf'``, ``'epub'`` or ``'pdf'``.
    :raises ValueError: If no comic is found, or a comic has no (valid)
                        pages.
    '''
    path_to_file = run_plugins_on_preprocess(path_to_file)
    source = path_to_file
    to_delete = []
    toc = []
    pages = []
    # Bound up front so that it exists however the loop below goes
    thumbnail = None

    if not opts.title:
        opts.title = os.path.splitext(os.path.basename(source))[0]
    if not opts.output:
        opts.output = os.path.abspath(os.path.splitext(os.path.basename(source))[0]+'.'+output_format)

    if os.path.isdir(source):
        comics = list(all_files(source, '*.cbr|*.cbz'))
    else:
        comics = [os.path.abspath(source)]
    if not comics:
        raise ValueError('Could not find any comics in: %s'%source)

    for comic in comics:
        tdir  = extract_comic(comic)
        new_pages = find_pages(tdir, sort_on_mtime=opts.no_sort, verbose=opts.verbose)
        thumbnail = None
        if not new_pages:
            raise ValueError('Could not find any pages in the comic: %s'%comic)
        if not getattr(opts, 'no_process', False):
            new_pages, failures, tdir2 = process_pages(new_pages, opts, notification)
            # The rendered pages live in tdir2; remove it with the rest
            to_delete.append(tdir2)
            if not new_pages:
                raise ValueError('Could not find any valid pages in the comic: %s'%comic)
            if failures:
                print('Could not process the following pages (run with --verbose to see why):')
                for f in failures:
                    print('\t%s'%f)
            thumbnail = os.path.join(tdir2, 'thumbnail.png')
            if not os.access(thumbnail, os.R_OK):
                thumbnail = None
        # Remember at which page of the combined book this comic starts
        toc.append((comic,len(pages)))
        pages.extend(new_pages)
        to_delete.append(tdir)

    if output_format == 'lrf':
        create_lrf(pages, opts.profile, opts, thumbnail=thumbnail)
    if output_format == 'epub':
        create_epub(pages, opts.profile, opts, thumbnail=thumbnail)
    if output_format == 'pdf':
        create_pdf(pages, opts.profile, opts, thumbnail=thumbnail,toc=toc)
    for tdir in to_delete:
        shutil.rmtree(tdir)
 def all_files(root, patterns='*'):
    '''
    Walk `root` recursively and yield the path of every file whose name
    matches at least one pattern. Within a directory the files are yielded
    in sorted order.

    :param patterns: One or more ``fnmatch`` patterns separated by ``|``.
    '''
    wanted = patterns.split('|')
    for dirpath, subdirs, filenames in os.walk(root):
        for name in sorted(filenames):
            if any(fnmatch.fnmatch(name, pattern) for pattern in wanted):
                yield os.path.join(dirpath, name)
 def main(args=sys.argv, notification=None, output_format='lrf'):
    '''
    Command line entry point of the comic converter.

    :param args: Argument list; ``args[1]`` is the comic to convert.
    :param notification: Progress callback. When it is not callable a
                         ``ProgressBar`` is created and its ``update``
                         method is used.
    :param output_format: Format passed to the option parser and to
                          :func:`do_convert`.
    :return: 1 if no file was specified, otherwise 0.
    '''
    parser = option_parser(output_format=output_format)
    opts, args = parser.parse_args(args)
    if len(args) < 2:
        parser.print_help()
        print('\nYou must specify a file to convert')
        return 1

    if not callable(notification):
        hide_bar = opts.no_progress_bar or getattr(opts, 'no_process', False)
        progress = ProgressBar(terminal_controller, _('Rendering comic pages...'),
                               no_progress_bar=hide_bar)
        notification = progress.update

    comic = os.path.abspath(args[1])
    do_convert(comic, opts, notification, output_format=output_format)
    return 0
 if __name__ == '__main__':
    sys.exit(main())
--- a/src/calibre/ebooks/lrf/lrfparser.py
+++ b/src/calibre/ebooks/lrf/lrfparser.py
@ -5,16 +5,16 @@ __copyright__ = '2008, Kovid Goyal <kovid at kovidgoyal.net>'
 import sys, array, os, re, codecs, logging
 from calibre import setup_cli_handlers, sanitize_file_name
-from calibre.utils.config import OptionParser 
+from calibre.utils.config import OptionParser
 from calibre.ebooks.lrf.meta import LRFMetaFile
 from calibre.ebooks.lrf.objects import get_object, PageTree, StyleObject, \
                                         Font, Text, TOCObject, BookAttr, ruby_tags
-                                         
+
 class LRFDocument(LRFMetaFile):
-    
+
    class temp(object): pass
-    
+
    def __init__(self, stream):
        LRFMetaFile.__init__(self, stream)
        self.scramble_key = self.xor_key
@ -23,11 +23,11 @@ class LRFDocument(LRFMetaFile):
        self.image_map = {}
        self.toc = ''
        self.keep_parsing = True
-        
+
    def parse(self):
        self._parse_objects()
        self.metadata = LRFDocument.temp()
-        for a in ('title', 'title_reading', 'author', 'author_reading', 'book_id', 
+        for a in ('title', 'title_reading', 'author', 'author_reading', 'book_id',
                  'classification', 'free_text', 'publisher', 'label', 'category'):
            setattr(self.metadata, a, getattr(self, a))
        self.doc_info = LRFDocument.temp()
@ -37,7 +37,7 @@ class LRFDocument(LRFMetaFile):
        self.device_info = LRFDocument.temp()
        for a in ('dpi', 'width', 'height'):
            setattr(self.device_info, a, getattr(self, a))
-        
+
    def _parse_objects(self):
        self.objects = {}
        self._file.seek(self.object_index_offset)
@ -68,15 +68,15 @@ class LRFDocument(LRFMetaFile):
                attr = h[0]
                if hasattr(obj, attr):
                    self.ruby_tags[attr] = getattr(obj, attr)
-    
+
    def __iter__(self):
        for pt in self.page_trees:
            yield pt
-        
+
    def write_files(self):
        for obj in self.image_map.values() + self.font_map.values():
-            open(obj.file, 'wb').write(obj.stream)            
+            open(obj.file, 'wb').write(obj.stream)
-        
+
    def to_xml(self, write_files=True):
        bookinfo = u'<BookInformation>\n<Info version="1.1">\n<BookInfo>\n'
        bookinfo += u'<Title reading="%s">%s</Title>\n'%(self.metadata.title_reading, self.metadata.title)
@ -113,7 +113,7 @@ class LRFDocument(LRFMetaFile):
                pages += unicode(page)
            pages += close
        traversed_objects = [int(i) for i in re.findall(r'objid="(\w+)"', pages)] + [pt_id]
-        
+
        objects = u'\n<Objects>\n'
        styles  = u'\n<Style>\n'
        for obj in self.objects:
@ -131,16 +131,16 @@ class LRFDocument(LRFMetaFile):
        if write_files:
            self.write_files()
        return '<BBeBXylog version="1.0">\n' + bookinfo + pages + styles + objects + '</BBeBXylog>'
-        
+
 def option_parser():
    parser = OptionParser(usage=_('%prog book.lrf\nConvert an LRF file into an LRS (XML UTF-8 encoded) file'))
    parser.add_option('--output', '-o', default=None, help=_('Output LRS file'), dest='out')
-    parser.add_option('--dont-output-resources', default=True, action='store_false', 
+    parser.add_option('--dont-output-resources', default=True, action='store_false',
-                      help=_('Do not save embedded image and font files to disk'), 
+                      help=_('Do not save embedded image and font files to disk'),
                      dest='output_resources')
    parser.add_option('--verbose', default=False, action='store_true', dest='verbose')
    return parser
-    
+
 def main(args=sys.argv, logger=None):
    parser = option_parser()
    opts, args = parser.parse_args(args)
--- a/src/calibre/ebooks/lrf/objects.py
+++ b/src/calibre/ebooks/lrf/objects.py
@ -970,7 +970,12 @@ class Canvas(LRFStream):
        stream = cStringIO.StringIO(self.stream)
        while stream.tell() < len(self.stream):
            tag = Tag(stream)
-            self._contents.append(PutObj(self._document.objects, *struct.unpack("<HHI", tag.contents)))
+            try:
                self._contents.append(
                    PutObj(self._document.objects,
                        *struct.unpack("<HHI", tag.contents)))
            except struct.error:
                print 'Canvas object has errors, skipping.'
    def __unicode__(self):
        s = '\n<%s objid="%s" '%(self.__class__.__name__, self.id,)
--- a/src/calibre/ebooks/metadata/lit.py
+++ b/src/calibre/ebooks/metadata/lit.py
@ -4,15 +4,16 @@ __copyright__ = '2008, Kovid Goyal <kovid at kovidgoyal.net>'
 Support for reading the metadata from a LIT file.
 '''
-import sys, cStringIO, os
+import cStringIO, os
 from calibre.ebooks.metadata import MetaInformation
 from calibre.ebooks.metadata.opf2 import OPF
 from calibre.ebooks.lit.reader import LitReader
 def get_metadata(stream):
-    litfile = LitReader(stream)
+    from calibre.ebooks.lit.reader import LitContainer
-    src = litfile.meta.encode('utf-8')
+    litfile = LitContainer(stream)
    src = litfile.get_metadata().encode('utf-8')
    litfile = litfile._litfile
    opf = OPF(cStringIO.StringIO(src), os.getcwd())
    mi = MetaInformation(opf)
    covers = []
--- a/src/calibre/ebooks/mobi/reader.py
+++ b/src/calibre/ebooks/mobi/reader.py
@ -313,8 +313,10 @@ class MobiReader(object):
            self.read_embedded_metadata(root, metadata_elems[0], guide)
        for elem in guides + metadata_elems:
            elem.getparent().remove(elem)
        fname = self.name.encode('ascii', 'replace')
        fname = re.sub(r'[\x08\x15\0]+', '', fname)
        htmlfile = os.path.join(output_dir,
-                                sanitize_file_name(self.name)+'.html')
+                                sanitize_file_name(fname)+'.html')
        try:
            for ref in guide.xpath('descendant::reference'):
                if ref.attrib.has_key('href'):
@ -396,8 +398,8 @@ class MobiReader(object):
                    'xx-large' : '6',
                    }
        mobi_version = self.book_header.mobi_version
        style_map = {}
        for i, tag in enumerate(root.iter(etree.Element)):
            tag.attrib.pop('xmlns', '')
            if tag.tag in ('country-region', 'place', 'placetype', 'placename',
                           'state', 'city', 'street', 'address', 'content'):
                tag.tag = 'div' if tag.tag == 'content' else 'span'
--- a/src/calibre/ebooks/oeb/base.py
+++ b/src/calibre/ebooks/oeb/base.py
@ -1578,15 +1578,15 @@ class OEBBook(object):
                return data.decode('utf-16')
            except UnicodeDecodeError:
                pass
        try:
            return data.decode('utf-8')
        except UnicodeDecodeError:
            pass
        if self.encoding is not None:
            try:
                return data.decode(self.encoding)
            except UnicodeDecodeError:
                pass
        try:
            return data.decode('utf-8')
        except UnicodeDecodeError:
            pass
        data, _ = xml_to_unicode(data)
        data = data.replace('\r\n', '\n')
        data = data.replace('\r', '\n')
--- a/src/calibre/ebooks/oeb/iterator.py
+++ b/src/calibre/ebooks/oeb/iterator.py
@ -128,6 +128,8 @@ class EbookIterator(object):
        plumber.setup_options()
        if hasattr(plumber.opts, 'dont_package'):
            plumber.opts.dont_package = True
        if hasattr(plumber.opts, 'no_process'):
            plumber.opts.no_process = True
        self.pathtoopf = plumber.input_plugin(open(plumber.input, 'rb'),
                plumber.opts, plumber.input_fmt, self.log,
                {}, self.base)
--- a/src/calibre/ebooks/oeb/transforms/split.py
+++ b/src/calibre/ebooks/oeb/transforms/split.py
@ -59,6 +59,7 @@ class Split(object):
        self.fix_links()
    def split_item(self, item):
        page_breaks, page_break_ids = [], []
        if self.split_on_page_breaks:
            page_breaks, page_break_ids = self.find_page_breaks(item)
--- a/src/calibre/ebooks/pdf/output.py
+++ b/src/calibre/ebooks/pdf/output.py
@ -40,7 +40,7 @@ class PDFOutput(OutputFormatPlugin):
                    OptionRecommendation(name='margin_right', recommended_value='1',
                        level=OptionRecommendation.LOW,
                        help=_('The right margin around the document.')),
-                        
+
                    OptionRecommendation(name='unit', recommended_value='inch',
                        level=OptionRecommendation.LOW, short_switch='u', choices=UNITS.keys(),
                        help=_('The unit of measure. Default is inch. Choices '
@ -58,15 +58,18 @@ class PDFOutput(OutputFormatPlugin):
                        help=_('The orientation of the page. Default is portrait. Choices '
                        'are %s' % ORIENTATIONS.keys())),
                 ])
-                 
+
    def convert(self, oeb_book, output_path, input_plugin, opts, log):
        self.opts, self.log = opts, log
        if input_plugin.is_image_collection:
            self.convert_images(input_plugin.get_images())
        with TemporaryDirectory('_pdf_out') as oebdir:
            OEBOutput(None).convert(oeb_book, oebdir, input_plugin, opts, log)
            opf = glob.glob(os.path.join(oebdir, '*.opf'))[0]
            writer = PDFWriter(log, opts)
-        
+
            close = False
            if not hasattr(output_path, 'write'):
                close = True
@ -75,10 +78,10 @@ class PDFOutput(OutputFormatPlugin):
                out_stream = open(output_path, 'wb')
            else:
                out_stream = output_path
-            
+
            out_stream.seek(0)
            out_stream.truncate()
            writer.dump(opf, out_stream, PDFMetadata(oeb_book.metadata))
-            
+
            if close:
                out_stream.close()
--- a/src/calibre/ebooks/pdf/writer.py
+++ b/src/calibre/ebooks/pdf/writer.py
@ -9,12 +9,11 @@ __docformat__ = 'restructuredtext en'
 Write content to PDF.
 '''
-import os, shutil, sys
+import os, shutil
 from calibre.ptempfile import PersistentTemporaryDirectory
 from calibre.customize.profiles import OutputProfile
 from calibre.ebooks.pdf.pageoptions import unit, paper_size, \
-    orientation, size 
+    orientation, size
 from calibre.ebooks.metadata import authors_to_string
 from calibre.ebooks.metadata.opf2 import OPF
@ -24,12 +23,12 @@ from PyQt4.Qt import QUrl, QEventLoop, SIGNAL, QObject, \
 from PyQt4.QtWebKit import QWebView
 from pyPdf import PdfFileWriter, PdfFileReader
-        
+
 class PDFMetadata(object):
    def __init__(self, oeb_metadata=None):
        self.title = _('Unknown')
        self.author = _('Unknown')
-        
+
        if oeb_metadata != None:
            if len(oeb_metadata.title) >= 1:
                self.title = oeb_metadata.title[0].value
@ -42,16 +41,16 @@ class PDFWriter(QObject):
        if QApplication.instance() is None:
            QApplication([])
        QObject.__init__(self)
-        
+
        self.logger = log
-        
+
        self.loop = QEventLoop()
        self.view = QWebView()
        self.connect(self.view, SIGNAL('loadFinished(bool)'), self._render_html)
        self.render_queue = []
        self.combine_queue = []
        self.tmp_path = PersistentTemporaryDirectory('_pdf_output_parts')
-        
+
        self.custom_size = None
        if opts.custom_size != None:
            width, sep, height = opts.custom_size.partition('x')
@ -62,44 +61,44 @@ class PDFWriter(QObject):
                    self.custom_size = (width, height)
                except:
                    self.custom_size = None
-        
+
        self.opts = opts
-        
+
    def dump(self, opfpath, out_stream, pdf_metadata):
        self.metadata = pdf_metadata
        self._delete_tmpdir()
-        
+
        opf = OPF(opfpath, os.path.dirname(opfpath))
        self.render_queue = [i.path for i in opf.spine]
        self.combine_queue = []
        self.out_stream = out_stream
-        
+
        QMetaObject.invokeMethod(self, "_render_book", Qt.QueuedConnection)
        self.loop.exec_()
-        
+
    @QtCore.pyqtSignature('_render_book()')
    def _render_book(self):
        '''
        Advance the rendering pipeline by one step: render the next queued
        item if any remain, otherwise write out the final document.
        '''
        if self.render_queue:
            # Items are still waiting to be rendered
            self._render_next()
            return
        # Queue exhausted, nothing left to render
        self._write()
-            
+
    def _render_next(self):
        item = str(self.render_queue.pop(0))
        self.combine_queue.append(os.path.join(self.tmp_path, '%i.pdf' % (len(self.combine_queue) + 1)))
-        
+
        self.logger.info('Processing %s...' % item)
-    
+
        self.view.load(QUrl(item))
    def _render_html(self, ok):
        if ok:
            item_path = os.path.join(self.tmp_path, '%i.pdf' % len(self.combine_queue))
-            
+
            self.logger.debug('\tRendering item %s as %i' % (os.path.basename(str(self.view.url().toLocalFile())), len(self.combine_queue)))
-        
+
            printer = QPrinter(QPrinter.HighResolution)
-                        
+
            if self.opts.output_profile.short_name == 'default':
                if self.custom_size == None:
                    printer.setPaperSize(paper_size(self.opts.paper_size))
@ -107,7 +106,7 @@ class PDFWriter(QObject):
                    printer.setPaperSize(QSizeF(self.custom_size[0], self.custom_size[1]), unit(self.opts.unit))
            else:
                printer.setPaperSize(QSizeF(self.opts.output_profile.width / self.opts.output_profile.dpi, self.opts.output_profile.height / self.opts.output_profile.dpi), QPrinter.Inch)
-                        
+
            printer.setPageMargins(size(self.opts.margin_left), size(self.opts.margin_top), size(self.opts.margin_right), size(self.opts.margin_bottom), unit(self.opts.unit))
            printer.setOrientation(orientation(self.opts.orientation))
            printer.setOutputFormat(QPrinter.PdfFormat)
@ -122,7 +121,7 @@ class PDFWriter(QObject):
    def _write(self):
        self.logger.info('Combining individual PDF parts...')
-    
+
        try:
            outPDF = PdfFileWriter(title=self.metadata.title, author=self.metadata.author)
            for item in self.combine_queue:
--- a/src/calibre/libunzip.py
+++ b/src/calibre/libunzip.py
@ -3,19 +3,19 @@ __license__   = 'GPL v3'
 __copyright__ = '2008, Kovid Goyal kovid@kovidgoyal.net'
 __docformat__ = 'restructuredtext en'
-import os, re
+import re
 from calibre.utils import zipfile
 def update(pathtozip, patterns, filepaths, names, compression=zipfile.ZIP_DEFLATED, verbose=True):
    '''
-    Update files in the zip file at `pathtozip` matching the given 
+    Update files in the zip file at `pathtozip` matching the given
    `patterns` with the given `filepaths`. If more than
-    one file matches, all of the files are replaced. 
+    one file matches, all of the files are replaced.
-    
+
    :param patterns:    A list of compiled regular expressions
    :param filepaths:   A list of paths to the replacement files. Must have the
                        same length as `patterns`.
-    :param names:       A list of archive names for each file in filepaths. 
+    :param names:       A list of archive names for each file in filepaths.
                        A name can be `None` in which case the name of the existing
                        file in the archive is used.
    :param compression: The compression to use when replacing files. Can be
@ -48,4 +48,4 @@ def extract_member(filename, match=re.compile(r'\.(jpg|jpeg|gif|png)\s*$', re.I)
    names = zf.namelist()
    for name in names:
        if match.search(name):
-            return name, zf.read(name)
+            return name, zf.read(name)
--- a/src/calibre/parallel.py
+++ b/src/calibre/parallel.py
@ -43,7 +43,7 @@ PARALLEL_FUNCS = {
      'lrfviewer'    :
        ('calibre.gui2.lrf_renderer.main', 'main', {}, None),
-        
+
      'ebook-viewer'    :
        ('calibre.gui2.viewer.main', 'main', {}, None),
@ -52,34 +52,34 @@ PARALLEL_FUNCS = {
      'render_table' :
        ('calibre.ebooks.lrf.html.table_as_image', 'do_render', {}, None),
-        
+
      'render_pages' :
-        ('calibre.ebooks.lrf.comic.convert_from', 'render_pages', {}, 'notification'),
+        ('calibre.ebooks.comic.input', 'render_pages', {}, 'notification'),
      'comic2lrf'    :
        ('calibre.ebooks.lrf.comic.convert_from', 'do_convert', {}, 'notification'),
-        
+
      'any2epub'     :
        ('calibre.ebooks.epub.from_any', 'any2epub', {}, None),
-        
+
      'feeds2epub'   :
        ('calibre.ebooks.epub.from_feeds', 'main', {}, 'notification'),
-        
+
      'comic2epub'    :
        ('calibre.ebooks.epub.from_comic', 'convert', {}, 'notification'),
-        
+
      'any2mobi'     :
        ('calibre.ebooks.mobi.from_any', 'any2mobi', {}, None),
-        
+
      'any2pdf'     :
-        ('calibre.ebooks.pdf.from_any', 'any2pdf', {}, None),        
+        ('calibre.ebooks.pdf.from_any', 'any2pdf', {}, None),
-        
+
      'feeds2mobi'   :
        ('calibre.ebooks.mobi.from_feeds', 'main', {}, 'notification'),
-        
+
      'comic2mobi'    :
        ('calibre.ebooks.mobi.from_comic', 'convert', {}, 'notification'),
-        
+
      'ebook-convert'     :
        ('calibre.ebooks.conversion.cli', 'main', {}, None),
 }
@ -174,7 +174,7 @@ class WorkerMother(object):
                contents = os.path.join(contents, 'console.app', 'Contents')
                self.executable = os.path.join(contents, 'MacOS',
                                               os.path.basename(sys.executable))
-                
+
                resources = os.path.join(contents, 'Resources')
                fd = os.path.join(contents, 'Frameworks')
                sp = os.path.join(resources, 'lib', 'python'+sys.version[:3], 'site-packages.zip')
@ -198,7 +198,7 @@ class WorkerMother(object):
        for func in ('spawn_free_spirit', 'spawn_worker'):
            setattr(self, func, getattr(self, func+'_'+ext))
-    
+
    def cleanup_child_windows(self, child, name=None, fd=None):
        try:
            child.kill()
@ -526,8 +526,8 @@ class JobKilled(Exception):
    pass
 class Job(object):
-    
+
-    def __init__(self, job_done, job_manager=None, 
+    def __init__(self, job_done, job_manager=None,
                 args=[], kwargs={}, description=None):
        self.args            = args
        self.kwargs          = kwargs
@ -540,9 +540,9 @@ class Job(object):
        self.description     = description
        self.start_time      = None
        self.running_time    = None
-        
+
        self.result = self.exception = self.traceback = self.log = None
-    
+
    def __cmp__(self, other):
        sstatus, ostatus = self.status(), other.status()
        if sstatus == ostatus or (self.has_run and other.has_run):
@ -557,8 +557,8 @@ class Job(object):
            return -1
        if ostatus == 'WAITING':
            return 1
-        
+
-    
+
    def job_done(self):
        self.is_running, self.has_run = False, True
        self.running_time = (time.time() - self.start_time) if \
@ -566,14 +566,14 @@ class Job(object):
        if self.job_manager is not None:
            self.job_manager.job_done(self)
        self._job_done(self)
-        
+
    def start_work(self):
        '''
        Flag this job as running (and not yet finished), record the current
        time as its start time and, when a job manager is attached, notify
        it that work on this job has begun.
        '''
        self.is_running, self.has_run = True, False
        self.start_time = time.time()
        manager = self.job_manager
        if manager is not None:
            manager.start_work(self)
-    
+
    def update_status(self, percent, msg=None):
        self.percent = percent
        self.msg     = msg
@ -582,7 +582,7 @@ class Job(object):
                self.job_manager.status_update(self)
            except:
                traceback.print_exc()
-        
+
    def status(self):
        if self.is_running:
            return 'WORKING'
@ -592,7 +592,7 @@ class Job(object):
            if self.exception is None:
                return 'DONE'
            return 'ERROR'
-            
+
    def console_text(self):
        ans = [u'Job: ']
        if self.description:
@ -610,13 +610,13 @@ class Job(object):
            if self.traceback:
                ans.append(u'**Traceback**:')
                ans.extend(self.traceback.split('\n'))
-        
+
        if self.log:
            if isinstance(self.log, str):
                self.log = unicode(self.log, 'utf-8', 'replace')
            ans.append(self.log)
        return (u'\n'.join(ans)).encode('utf-8')
-    
+
    def gui_text(self):
        ans = [u'Job: ']
        if self.description:
@ -641,19 +641,19 @@ class Job(object):
            if isinstance(self.log, str):
                self.log = unicode(self.log, 'utf-8', 'replace')
            ans.extend(self.log.split('\n'))
-        
+
        ans = [x.decode(preferred_encoding, 'replace') if isinstance(x, str) else x for x in ans]
-        
+
        return u'<br>'.join(ans)
 class ParallelJob(Job):
-    
+
    def __init__(self, func, *args, **kwargs):
        '''
        :param func: Stored unchanged on the instance as ``self.func``.
        :param args: Positional arguments forwarded to ``Job.__init__``.
        :param kwargs: Keyword arguments forwarded to ``Job.__init__``.
        '''
        Job.__init__(self, *args, **kwargs)
        self.func = func
        # Expose the bound job_done method under the alias ``done``
        self.done = self.job_done
-        
+
    def output(self, msg):
        if not self.log:
            self.log = u''
@ -663,7 +663,7 @@ class ParallelJob(Job):
            self.log += msg
        if self.job_manager is not None:
            self.job_manager.output(self)
-    
+
 def remove_ipc_socket(path):
    os = __import__('os')
@ -702,7 +702,7 @@ class Server(Thread):
        self.result_lock = RLock()
        self.pool_lock = RLock()
        self.start()
-        
+
    def split(self, tasks):
        '''
        Split a list into a list of sub lists, with the number of sub lists being
@ -720,7 +720,7 @@ class Server(Thread):
            ans.append(section)
            pos += delta
        return ans
-        
+
    def close(self):
        try:
@ -733,7 +733,7 @@ class Server(Thread):
            self.jobs.append(job)
        if job.job_manager is not None:
            job.job_manager.add_job(job)
-            
+
    def poll(self):
        '''
        Return True if the server has either working or queued jobs
@ -741,14 +741,14 @@ class Server(Thread):
        with self.job_lock:
            with self.working_lock:
                return len(self.jobs) + len(self.working) > 0
-            
+
    def wait(self, sleep=1):
        '''
        Block until :meth:`poll` returns a false value, i.e. until the job
        queue is empty.

        :param sleep: Number of seconds to sleep between successive polls.
        '''
        while True:
            if not self.poll():
                break
            time.sleep(sleep)
-    
+
    def run(self):
        while True:
            job = None
@ -935,7 +935,7 @@ def work(client_socket, func, args, kwdargs):
                func(*args, **kwargs)
            except (Exception, SystemExit):
                continue
-                
+
        time.sleep(5) # Give any in progress BufferedSend time to complete
@ -948,7 +948,7 @@ def worker(host, port):
    if msg != 'OK':
        return 1
    write(client_socket, 'WAITING')
-    
+
    sys.stdout = BufferedSender(client_socket)
    sys.stderr = sys.stdout
--- a/src/calibre/utils/smtp.py
+++ b/src/calibre/utils/smtp.py
@ -81,7 +81,12 @@ def sendmail(msg, from_, to, localhost=None, verbose=0, timeout=30,
        for x in to:
            return sendmail_direct(from_, x, msg, timeout, localhost, verbose)
    import smtplib
-    cls = smtplib.SMTP if encryption == 'TLS' else smtplib.SMTP_SSL
+    class SMTP_SSL(smtplib.SMTP_SSL): # Workaround for bug in smtplib.py
        def _get_socket(self, host, port, timeout):
            smtplib.SMTP_SSL._get_socket(self, host, port, timeout)
            return self.sock
    cls = smtplib.SMTP if encryption == 'TLS' else SMTP_SSL
    timeout = None # Non-blocking sockets sometimes don't work
    port = int(port)
    s = cls(timeout=timeout, local_hostname=localhost)
@ -93,6 +98,8 @@ def sendmail(msg, from_, to, localhost=None, verbose=0, timeout=30,
        s.starttls()
        s.ehlo()
    if username is not None and password is not None:
        if encryption == 'SSL':
            s.sock = s.file.sslobj
        s.login(username, password)
    s.sendmail(from_, to, msg)
    return s.quit()
--- a/src/calibre/utils/terminfo.py
+++ b/src/calibre/utils/terminfo.py
@ -7,22 +7,22 @@ import sys, re, os
 class TerminalController:
    """
    A class that can be used to portably generate formatted output to
-    a terminal.  
+    a terminal.
-    
+
    `TerminalController` defines a set of instance variables whose
    values are initialized to the control sequence necessary to
    perform a given action.  These can be simply included in normal
    output to the terminal:
-    
+
    >>> term = TerminalController()
    >>> print 'This is '+term.GREEN+'green'+term.NORMAL
-    
+
    Alternatively, the `render()` method can be used, which replaces
    '${action}' with the string required to perform 'action':
-    
+
    >>> term = TerminalController()
    >>> print term.render('This is ${GREEN}green${NORMAL}')
-    
+
    If the terminal doesn't support a given action, then the value of
    the corresponding instance variable will be set to ''.  As a
    result, the above code will still work on terminals that do not
@ -30,11 +30,11 @@ class TerminalController:
    Also, this means that you can test whether the terminal supports a
    given action by simply testing the truth value of the
    corresponding instance variable:
-    
+
    >>> term = TerminalController()
    >>> if term.CLEAR_SCREEN:
    ...     print 'This terminal supports clearing the screen.'
-    
+
    Finally, if the width and height of the terminal are known, then
    they will be stored in the `COLS` and `LINES` attributes.
    """
@ -44,35 +44,35 @@ class TerminalController:
    DOWN = ''            #: Move the cursor down one line
    LEFT = ''            #: Move the cursor left one char
    RIGHT = ''           #: Move the cursor right one char
-    
+
    # Deletion:
    CLEAR_SCREEN = ''    #: Clear the screen and move to home position
    CLEAR_EOL = ''       #: Clear to the end of the line.
    CLEAR_BOL = ''       #: Clear to the beginning of the line.
    CLEAR_EOS = ''       #: Clear to the end of the screen
-    
+
    # Output modes:
    BOLD = ''            #: Turn on bold mode
    BLINK = ''           #: Turn on blink mode
    DIM = ''             #: Turn on half-bright mode
    REVERSE = ''         #: Turn on reverse-video mode
    NORMAL = ''          #: Turn off all modes
-    
+
    # Cursor display:
    HIDE_CURSOR = ''     #: Make the cursor invisible
    SHOW_CURSOR = ''     #: Make the cursor visible
-    
+
    # Terminal size:
    COLS = None          #: Width of the terminal (None for unknown)
    LINES = None         #: Height of the terminal (None for unknown)
-    
+
    # Foreground colors:
    BLACK = BLUE = GREEN = CYAN = RED = MAGENTA = YELLOW = WHITE = ''
-    
+
    # Background colors:
    BG_BLACK = BG_BLUE = BG_GREEN = BG_CYAN = ''
    BG_RED = BG_MAGENTA = BG_YELLOW = BG_WHITE = ''
-    
+
    _STRING_CAPABILITIES = """
    BOL=cr UP=cuu1 DOWN=cud1 LEFT=cub1 RIGHT=cuf1
    CLEAR_SCREEN=clear CLEAR_EOL=el CLEAR_BOL=el1 CLEAR_EOS=ed BOLD=bold
@ -80,7 +80,7 @@ class TerminalController:
    HIDE_CURSOR=cinvis SHOW_CURSOR=cnorm""".split()
    _COLORS = """BLACK BLUE GREEN CYAN RED MAGENTA YELLOW WHITE""".split()
    _ANSICOLORS = "BLACK RED GREEN YELLOW BLUE MAGENTA CYAN WHITE".split()
-    
+
    def __init__(self, term_stream=sys.stdout):
        """
        Create a `TerminalController` and initialize its attributes
@ -92,24 +92,24 @@ class TerminalController:
        # Curses isn't available on all platforms
        try: import curses
        except: return
-        
+
        # If the stream isn't a tty, then assume it has no capabilities.
        if os.environ.get('CALIBRE_WORKER', None) is not None or not hasattr(term_stream, 'isatty') or not term_stream.isatty(): return
-        
+
        # Check the terminal type.  If we fail, then assume that the
        # terminal has no capabilities.
        try: curses.setupterm()
        except: return
-        
+
        # Look up numeric capabilities.
        self.COLS = curses.tigetnum('cols')
        self.LINES = curses.tigetnum('lines')
-        
+
        # Look up string capabilities.
        for capability in self._STRING_CAPABILITIES:
            (attrib, cap_name) = capability.split('=')
            setattr(self, attrib, self._tigetstr(cap_name) or '')
-        
+
        # Colors
        set_fg = self._tigetstr('setf')
        if set_fg:
@ -127,7 +127,7 @@ class TerminalController:
        if set_bg_ansi:
            for i,color in zip(range(len(self._ANSICOLORS)), self._ANSICOLORS):
                setattr(self, 'BG_'+color, curses.tparm(set_bg_ansi, i) or '')
-    
+
    def _tigetstr(self, cap_name):
        # String capabilities can include "delays" of the form "$<2>".
        # For any modern terminal, we should be able to just ignore
@ -135,7 +135,7 @@ class TerminalController:
        import curses
        cap = curses.tigetstr(cap_name) or ''
        return re.sub(r'\$<\d+>[/*]?', '', cap)
-    
+
    def render(self, template):
        """
        Replace each $-substitution in the given template string with
@ -143,7 +143,7 @@ class TerminalController:
        '' (if it's not).
        """
        return re.sub(r'\$\$|\${\w+}', self._render_sub, template)
-    
+
    def _render_sub(self, match):
        s = match.group()
        if s == '$$': return s
@ -156,20 +156,20 @@ class TerminalController:
 class ProgressBar:
    """
    A 3-line progress bar, which looks like::
-    
+
    Header
    20% [===========----------------------------------]
    progress message
-    
+
    The progress bar is colored, if the terminal supports color
    output; and adjusts to the width of the terminal.
-    
+
    If the terminal doesn't have the required capabilities, it uses a
    simple progress bar.
    """
    BAR = '%3d%% ${GREEN}[${BOLD}%s%s${NORMAL}${GREEN}]${NORMAL}\n'
    HEADER = '${BOLD}${CYAN}%s${NORMAL}\n\n'
-    
+
    def __init__(self, term, header, no_progress_bar = False):
        self.term, self.no_progress_bar = term, no_progress_bar
        self.fancy = self.term.CLEAR_EOL and self.term.UP and self.term.BOL
@ -177,12 +177,14 @@ class ProgressBar:
            self.width = self.term.COLS or 75
            self.bar = term.render(self.BAR)
            self.header = self.term.render(self.HEADER % header.center(self.width))
            if isinstance(self.header, unicode):
                self.header = self.header.encode('utf-8')
            self.cleared = 1 #: true if we haven't drawn the bar yet.
-        
+
    def update(self, percent, message=''):
        if isinstance(message, unicode):
            message = message.encode('utf-8', 'replace')
-        
+
        if self.no_progress_bar:
            if message:
                print message
@ -203,8 +205,8 @@ class ProgressBar:
            else:
                print '%d%%'%(percent*100), message
            sys.stdout.flush()
-            
+
-    
+
    def clear(self):
        if self.fancy and not self.cleared:
            sys.stdout.write(self.term.BOL + self.term.CLEAR_EOL +
--- a/src/calibre/web/__init__.py
+++ b/src/calibre/web/__init__.py
@ -2,5 +2,6 @@ __license__   = 'GPL v3'
 __copyright__ = '2008, Kovid Goyal <kovid at kovidgoyal.net>'
 class Recipe(object):
    '''
    Empty marker class: it defines no attributes or methods of its own.
    '''
    pass
--- a/src/calibre/web/feeds/input.py
+++ b/src/calibre/web/feeds/input.py
@ -0,0 +1,65 @@
 #!/usr/bin/env python
 # vim:fileencoding=UTF-8:ts=4:sw=4:sta:et:sts=4:ai
 from __future__ import with_statement
 __license__   = 'GPL v3'
 __copyright__ = '2009, Kovid Goyal <kovid@kovidgoyal.net>'
 __docformat__ = 'restructuredtext en'
 import os
 from calibre.customize.conversion import InputFormatPlugin, OptionRecommendation
 class RecipeInput(InputFormatPlugin):
    '''
    Input plugin for ``.recipe`` files. The recipe is either compiled from
    a readable file on disk or looked up among the builtin recipes by
    title, then instantiated and asked to download its content.
    '''

    name        = 'Recipe Input'
    author      = 'Kovid Goyal'
    description = _('Download periodical content from the internet')
    file_types  = set(['recipe'])

    # (option name, recommended value, recommendation level) triples
    recommendations = set([
        ('chapter_mark', 'none', OptionRecommendation.HIGH),
        ('dont_split_on_page_breaks', True, OptionRecommendation.HIGH),
        ('use_auto_toc', False, OptionRecommendation.HIGH),
        ])

    # Options specific to this plugin
    options = set([
        OptionRecommendation(name='test', recommended_value=False,
            help=_('Useful for recipe development. Forces '
            'max_articles_per_feed to 2 and downloads at most 2 feeds.')),
        OptionRecommendation(name='username', recommended_value=None,
            help=_('Username for sites that require a login to access '
                'content.')),
        OptionRecommendation(name='password', recommended_value=None,
            help=_('Password for sites that require a login to access '
                'content.')),
        OptionRecommendation(name='lrf', recommended_value=False,
            help='Optimize fetching for subsequent conversion to LRF.'),
        ])

    def convert(self, recipe_or_file, opts, file_ext, log,
            accelerators, progress=lambda x, y: x):
        '''
        Run a recipe and return the path to the OPF file it produced.

        :param recipe_or_file: Path to a recipe file. If the path is not
            readable, its base name with the extension stripped is used as
            the title of a builtin recipe instead.
        :param opts: Conversion options; passed to the recipe constructor.
            ``opts.output_profile.flow_size`` is set to 0 after the download.
        :param file_ext: Not used by this method.
        :param log: Log object; passed to the recipe constructor.
        :param accelerators: Not used by this method.
        :param progress: Progress callable; passed to the recipe constructor.
        :return: Absolute path of the first ``.opf`` file found in the
            current working directory, or ``None`` if there is none.
        :raises ValueError: If no recipe could be obtained.
        '''
        from calibre.web.feeds.recipes import \
                get_builtin_recipe, compile_recipe
        if os.access(recipe_or_file, os.R_OK):
            # Use a context manager so the file handle is closed promptly
            # instead of being left for the garbage collector
            with open(recipe_or_file, 'rb') as stream:
                recipe = compile_recipe(stream.read())
        else:
            title = os.path.basename(recipe_or_file).rpartition('.')[0]
            recipe = get_builtin_recipe(title)
        if recipe is None:
            raise ValueError('%s is not a valid recipe file or builtin recipe' %
                    recipe_or_file)

        ro = recipe(opts, log, progress)
        ro.download()

        # NOTE(review): presumably disables size based splitting of the
        # downloaded content in later stages -- confirm against the
        # consumers of flow_size
        opts.output_profile.flow_size = 0

        # The OPF is looked for in the current working directory
        for f in os.listdir('.'):
            if f.endswith('.opf'):
                return os.path.abspath(f)
--- a/src/calibre/web/feeds/news.py
+++ b/src/calibre/web/feeds/news.py
@ -20,6 +20,7 @@ from calibre import browser, __appname__, iswindows, \
 from calibre.ebooks.BeautifulSoup import BeautifulSoup, NavigableString, CData, Tag
 from calibre.ebooks.metadata.opf2 import OPFCreator
 from calibre.ebooks.lrf import entity_to_unicode
 from calibre.web import Recipe
 from calibre.ebooks import render_html
 from calibre.ebooks.metadata.toc import TOC
 from calibre.ebooks.metadata import MetaInformation
@ -27,12 +28,11 @@ from calibre.web.feeds import feed_from_xml, templates, feeds_from_index, Feed
 from calibre.web.fetch.simple import option_parser as web2disk_option_parser
 from calibre.web.fetch.simple import RecursiveFetcher
 from calibre.utils.threadpool import WorkRequest, ThreadPool, NoResultsPending
 from calibre.utils.logging import Log
 from calibre.ptempfile import PersistentTemporaryFile, \
                              PersistentTemporaryDirectory
-class BasicNewsRecipe(object):
+class BasicNewsRecipe(Recipe):
    '''
    Abstract base class that contains logic needed in all feed fetchers.
    '''
@ -443,40 +443,34 @@ class BasicNewsRecipe(object):
        '''
        raise NotImplementedError
-    def __init__(self, options, parser, progress_reporter):
+    def __init__(self, options, log, progress_reporter):
        '''
        Initialize the recipe.
        :param options: Parsed commandline options
        :param parser:  Command line option parser. Used to intelligently merge options.
        :param progress_reporter: A Callable that takes two arguments: progress (a number between 0 and 1) and a string message. The message should be optional.
        '''
-        self.log = Log()
+        self.log = log
        if options.verbose:
            self.log.filter_level = self.log.DEBUG
        if not isinstance(self.title, unicode):
            self.title = unicode(self.title, 'utf-8', 'replace')
-        for attr in ('username', 'password', 'lrf', 'output_dir', 'verbose', 'debug', 'test'):
+        self.debug = options.verbose > 1
-            setattr(self, attr, getattr(options, attr))
+        self.output_dir = os.getcwd()
        self.verbose = options.verbose
        self.test = options.test
        self.username = options.username
        self.password = options.password
        self.lrf = options.lrf
        self.output_dir = os.path.abspath(self.output_dir)
        if options.test:
            self.max_articles_per_feed = 2
            self.simultaneous_downloads = min(4, self.simultaneous_downloads)
        if self.debug:
            self.verbose = True
        self.report_progress = progress_reporter
        self.username = self.password = None
        #: If True optimize downloading for eventual conversion to LRF
        self.lrf = False
        defaults = parser.get_default_values()
        for opt in options.__dict__.keys():
            if getattr(options, opt) != getattr(defaults, opt, None):
                setattr(self, opt, getattr(options, opt))
        if isinstance(self.feeds, basestring):
            self.feeds = eval(self.feeds)
            if isinstance(self.feeds, basestring):
@ -493,7 +487,6 @@ class BasicNewsRecipe(object):
            '--timeout', str(self.timeout),
            '--max-recursions', str(self.recursions),
            '--delay', str(self.delay),
            '--timeout', str(self.timeout),
            ]
        if self.encoding is not None:
            web2disk_cmdline.extend(['--encoding', self.encoding])
@ -520,9 +513,6 @@ class BasicNewsRecipe(object):
            self.simultaneous_downloads = 1
        self.navbar = templates.NavBarTemplate()
        self.html2lrf_options.extend(['--page-break-before', '$', '--use-spine', '--header', '--encoding', 'utf-8'])
        if '--base-font-size' not in self.html2lrf_options:
            self.html2lrf_options.extend(['--base-font-size', '12'])
        self.failed_downloads = []
        self.partial_failures = []
@ -557,7 +547,7 @@ class BasicNewsRecipe(object):
        return self.postprocess_html(soup, first_fetch)
-    def download(self, for_lrf=False):
+    def download(self):
        '''
        Download and pre-process all articles from the feeds in this recipe.
        This method should be called only once on a particular Recipe instance.