Merge from trunk

2025-08-30 23:00:21 -04:00 · 2010-10-01 18:21:58 +01:00 · 2010-10-01 18:21:58 +01:00 · a5977d49e4
commit a5977d49e4
parent bb60bba3a9 c3014e5920
11 changed files with 115 additions and 8 deletions
--- a/resources/images/news/science_news_recent_issues.png
+++ b/resources/images/news/science_news_recent_issues.png
--- a/resources/recipes/science_news_recent_issues.recipe
+++ b/resources/recipes/science_news_recent_issues.recipe
@ -0,0 +1,78 @@
 #!/usr/bin/env  python
 __license__   = 'GPL v3'
 '''
 sciencenews.org
 '''
 from calibre.web.feeds.news import BasicNewsRecipe
 class ScienceNewsIssue(BasicNewsRecipe):
    '''
    Recipe for the "Science News Recent Issues" feed of sciencenews.org.

    Articles come from the single RSS feed listed in ``feeds``. The cover
    is looked up on the site's home page by ``get_cover_url`` and every
    ``<span>`` is turned into a ``<div>`` by ``preprocess_html``.
    '''
    title                 = u'Science News Recent Issues'
    __author__            = u'Darko Miletic, Sujata Raman and Starson17'
    description           = u'''Science News is an award-winning weekly
    newsmagazine covering the most important research in all fields of science.
    Its 16 pages each week are packed with short, accurate articles that appeal
    to both general readers and scientists. Published since 1922, the magazine
    now reaches about 150,000 subscribers and more than 1 million readers.
    These are the latest News Items from Science News. This recipe downloads
    the last 30 days worth of articles.'''
    category              = u'Science, Technology, News'
    publisher             = u'Society for Science & the Public'
    # Matches the "last 30 days" promised in the description above.
    oldest_article        = 30
    language = 'en'
    max_articles_per_feed = 100
    no_stylesheets        = True
    use_embedded_content  = False
    timefmt               = ' [%A, %d %B, %Y]'
    # NOTE(review): presumably the link-following depth, with followed links
    # limited to match_regexps below -- confirm against the BasicNewsRecipe
    # documentation.
    recursions = 1
    remove_attributes = ['style']
    # Reuses the metadata attributes defined above so they stay in sync.
    conversion_options = {'linearize_tables'  : True
                        , 'comment'           : description
                        , 'tags'              : category
                        , 'publisher'         : publisher
                        , 'language'          : language
                        }
    extra_css = '''
                .content_description{font-family:georgia ;font-size:x-large; color:#646464 ; font-weight:bold;}
                .content_summary{font-family:georgia ;font-size:small ;color:#585858 ; font-weight:bold;}
                .content_authors{font-family:helvetica,arial ;font-size: xx-small ;color:#14487E ;}
                .content_edition{font-family:helvetica,arial ;font-size: xx-small ;}
                .exclusive{color:#FF0000 ;}
                .anonymous{color:#14487E ;}
                .content_content{font-family:helvetica,arial ;font-size: medium ; color:#000000;}
                .description{color:#585858;font-family:helvetica,arial ;font-size: large ;}
                .credit{color:#A6A6A6;font-family:helvetica,arial ;font-size: xx-small ;}
                '''
    keep_only_tags = [ dict(name='div', attrs={'id':'column_action'}) ]
    remove_tags_after = dict(name='ul', attrs={'id':'content_functions_bottom'})
    remove_tags = [
                     dict(name='ul', attrs={'id':'content_functions_bottom'})
                    ,dict(name='div', attrs={'id':['content_functions_top','breadcrumb_content']})
                    ,dict(name='img', attrs={'class':'icon'})
                    ,dict(name='div', attrs={'class': 'embiggen'})
                  ]
    feeds       = [(u"Science News Current Issues", u'http://www.sciencenews.org/view/feed/type/edition/name/issues.rss')]
    # The dots are escaped so they only match a literal '.'; unescaped, each
    # one would match any character in the host name.
    match_regexps = [
            r'www\.sciencenews\.org/view/feature/id/',
            r'www\.sciencenews\.org/view/generic/id'
            ]

    def get_cover_url(self):
        '''
        Return the cover image URL, or None if it cannot be found.

        Loads the site's home page, looks for an ``<img>`` whose ``alt``
        attribute is "issue", and builds the URL from the site root, the
        image's ``src`` attribute and a ``.jpg`` suffix.
        '''
        cover_url = None
        index = 'http://www.sciencenews.org/view/home'
        soup = self.index_to_soup(index)
        link_item = soup.find(name = 'img',alt = "issue")
        if link_item:
            cover_url = 'http://www.sciencenews.org' + link_item['src'] + '.jpg'
        return cover_url

    def preprocess_html(self, soup):
        '''
        Rename every ``<span>`` in ``soup`` to ``<div>`` and return ``soup``.
        '''
        for tag in soup.findAll(name=['span']):
            tag.name = 'div'
        return soup
--- a/src/calibre/customize/profiles.py
+++ b/src/calibre/customize/profiles.py
@ -255,6 +255,9 @@ class OutputProfile(Plugin):
    #: Unsupported unicode characters to be replaced during preprocessing
    unsupported_unicode_chars = []
    #: Number of ems that the left margin of a blockquote is rendered as
    mobi_ems_per_blockquote = 1.0
    @classmethod
    def tags_to_string(cls, tags):
        '''
        Return ``tags`` joined with ', ' and passed through ``escape``.

        ``escape`` is defined outside this block; presumably it escapes
        markup-special characters -- confirm against the module's imports.
        '''
        joined = ', '.join(tags)
        return escape(joined)
@ -564,6 +567,7 @@ class KindleOutput(OutputProfile):
    supports_mobi_indexing = True
    periodical_date_in_title = False
    ratings_char = u'\u2605'
    mobi_ems_per_blockquote = 2.0
    @classmethod
    def tags_to_string(cls, tags):
@ -582,6 +586,7 @@ class KindleDXOutput(OutputProfile):
    comic_screen_size         = (741, 1022)
    supports_mobi_indexing = True
    periodical_date_in_title = False
    mobi_ems_per_blockquote = 2.0
    @classmethod
    def tags_to_string(cls, tags):
--- a/src/calibre/ebooks/epub/input.py
+++ b/src/calibre/ebooks/epub/input.py
@ -117,7 +117,8 @@ class EPUBInput(InputFormatPlugin):
        encfile = os.path.abspath(os.path.join('META-INF', 'encryption.xml'))
        opf = None
        for f in walk(u'.'):
-            if f.lower().endswith('.opf') and '__MACOSX' not in f:
+            if f.lower().endswith('.opf') and '__MACOSX' not in f and \
                    not os.path.basename(f).startswith('.'):
                opf = os.path.abspath(f)
                break
        path = getattr(stream, 'name', 'stream')
--- a/src/calibre/ebooks/metadata/fb2.py
+++ b/src/calibre/ebooks/metadata/fb2.py
@ -33,7 +33,10 @@ def get_metadata(stream):
        le = XPath('descendant::fb2:last-name')(au)
        if le:
            lname = tostring(le[0])
-            author += ' '+lname
+            if author:
                author += ' '+lname
            else:
                author = lname
        if author:
            authors.append(author)
        if len(authors) == 1 and author is not None:
--- a/src/calibre/ebooks/mobi/mobiml.py
+++ b/src/calibre/ebooks/mobi/mobiml.py
@ -184,13 +184,14 @@ class MobiMLizer(object):
            elif tag in NESTABLE_TAGS and istate.rendered:
                para = wrapper = bstate.nested[-1]
            elif left > 0 and indent >= 0:
                ems = self.profile.mobi_ems_per_blockquote
                para = wrapper = etree.SubElement(parent, XHTML('blockquote'))
                para = wrapper
-                emleft = int(round(left / self.profile.fbase)) - 1
+                emleft = int(round(left / self.profile.fbase)) - ems
                emleft = min((emleft, 10))
                while emleft > 0:
                    para = etree.SubElement(para, XHTML('blockquote'))
-                    emleft -= 1
+                    emleft -= ems
            else:
                para = wrapper = etree.SubElement(parent, XHTML('p'))
            bstate.inline = bstate.para = para
--- a/src/calibre/ebooks/mobi/output.py
+++ b/src/calibre/ebooks/mobi/output.py
@ -41,6 +41,24 @@ class MOBIOutput(OutputFormatPlugin):
        ),
    ])
    def remove_image_transparencies(self):
        '''
        Re-encode every PNG and GIF image in the manifest to drop transparency.

        Each manifest item whose media type starts with ``image`` and whose
        subtype is ``png`` or ``gif`` has its data passed through
        ``save_cover_data_to``. On success the item's data is replaced and
        unloaded from memory. On failure the error is logged and the item is
        left unchanged, so one bad image does not abort the conversion.
        '''
        from calibre.utils.magick.draw import save_cover_data_to
        for item in self.oeb.manifest:
            if item.media_type.startswith('image'):
                raw = item.data
                ext = item.media_type.split('/')[-1].lower()
                # Only PNG and GIF are processed; empty data is skipped.
                if ext not in ('png', 'gif') or not raw:
                    continue
                try:
                    data = save_cover_data_to(raw, 'img.'+ext, return_data=True)
                except Exception:
                    # Best effort: log and keep the original image. Catching
                    # Exception rather than using a bare except lets
                    # KeyboardInterrupt and SystemExit propagate.
                    self.log.exception('Failed to remove transparency from',
                            item.href)
                    data = None
                if data is not None:
                    item.data = data
                    item.unload_data_from_memory()
    def check_for_periodical(self):
        if self.oeb.metadata.publication_type and \
            unicode(self.oeb.metadata.publication_type[0]).startswith('periodical:'):
@ -160,6 +178,7 @@ class MOBIOutput(OutputFormatPlugin):
        from calibre.ebooks.oeb.transforms.rasterize import SVGRasterizer, Unavailable
        from calibre.ebooks.oeb.transforms.htmltoc import HTMLTOCAdder
        from calibre.customize.ui import plugin_for_input_format
        self.remove_image_transparencies()
        imagemax = PALM_MAX_IMAGE_SIZE if opts.rescale_images else None
        if not opts.no_inline_toc:
            tocadder = HTMLTOCAdder(title=opts.toc_title)
--- a/src/calibre/ebooks/mobi/reader.py
+++ b/src/calibre/ebooks/mobi/reader.py
@ -234,7 +234,7 @@ class MobiReader(object):
        self.debug = debug
        self.embedded_mi = None
        self.base_css_rules = textwrap.dedent('''
-                blockquote { margin: 0em 0em 0em 1.25em; text-align: justify }
+                blockquote { margin: 0em 0em 0em 2em; text-align: justify }
                p { margin: 0em; text-align: justify }
--- a/src/calibre/ebooks/oeb/transforms/rescale.py
+++ b/src/calibre/ebooks/oeb/transforms/rescale.py
@ -39,7 +39,7 @@ class RescaleImages(object):
            if item.media_type.startswith('image'):
                ext = item.media_type.split('/')[-1].upper()
                if ext == 'JPG': ext = 'JPEG'
-                if ext not in ('PNG', 'JPEG'):
+                if ext not in ('PNG', 'JPEG', 'GIF'):
                    ext = 'JPEG'
                raw = item.data
--- a/src/calibre/gui2/dialogs/tweak_epub.ui
+++ b/src/calibre/gui2/dialogs/tweak_epub.ui
@ -10,7 +10,7 @@
    <x>0</x>
    <y>0</y>
    <width>382</width>
-    <height>242</height>
+    <height>265</height>
   </rect>
  </property>
  <property name="windowTitle">
--- a/src/calibre/gui2/preferences/plugboard.ui
+++ b/src/calibre/gui2/preferences/plugboard.ui
@ -19,7 +19,7 @@
     <property name="text">
      <string>Here you can change the metadata calibre uses to update a book when saving to disk or sending to device.
-Use this dialog to define a 'plugboard' for a format (or all formats) and a device (or all devices). The plugboard spefies what template is connected to what field. The template is used to compute a value, and that value is assigned to the connected field.
+Use this dialog to define a 'plugboard' for a format (or all formats) and a device (or all devices). The plugboard specifies what template is connected to what field. The template is used to compute a value, and that value is assigned to the connected field.
 Often templates will contain simple references to composite columns, but this is not necessary. You can use any template in a source box that you can use elsewhere in calibre.