mirror of
https://github.com/kovidgoyal/calibre.git
synced 2025-07-09 03:04:10 -04:00
Sync to trunk.
This commit is contained in:
commit
2e6baa0cd7
@ -10,9 +10,11 @@ for a particular device.
|
||||
import os
|
||||
import fnmatch
|
||||
import shutil
|
||||
from math import ceil
|
||||
from itertools import cycle
|
||||
|
||||
from calibre import sanitize_file_name as sanitize
|
||||
from calibre.constants import iswindows
|
||||
from calibre.ebooks.metadata import authors_to_string
|
||||
from calibre.devices.usbms.cli import CLI
|
||||
from calibre.devices.usbms.device import Device
|
||||
@ -127,6 +129,7 @@ class USBMS(CLI, Device):
|
||||
|
||||
for i, infile in enumerate(files):
|
||||
newpath = path
|
||||
resizable = []
|
||||
|
||||
if self.SUPPORTS_SUB_DIRS:
|
||||
mdata = metadata.next()
|
||||
@ -135,23 +138,54 @@ class USBMS(CLI, Device):
|
||||
for tag in mdata['tags']:
|
||||
if tag.startswith(_('News')):
|
||||
newpath = os.path.join(newpath, 'news')
|
||||
newpath = os.path.join(newpath, sanitize(mdata.get('title', '')))
|
||||
newpath = os.path.join(newpath, sanitize(mdata.get('timestamp', '')))
|
||||
c = sanitize(mdata.get('title', ''))
|
||||
if c:
|
||||
newpath = os.path.join(newpath, c)
|
||||
resizable.append(c)
|
||||
c = sanitize(mdata.get('timestamp', ''))
|
||||
if c:
|
||||
newpath = os.path.join(newpath, c)
|
||||
resizable.append(c)
|
||||
break
|
||||
elif tag.startswith('/'):
|
||||
newpath += tag
|
||||
newpath = os.path.normpath(newpath)
|
||||
for c in tag.split('/'):
|
||||
c = sanitize(c)
|
||||
if not c: continue
|
||||
newpath = os.path.join(newpath, c)
|
||||
resizable.append(c)
|
||||
break
|
||||
|
||||
if newpath == path:
|
||||
newpath = os.path.join(newpath,
|
||||
sanitize(mdata.get('authors', _('Unknown'))),
|
||||
sanitize(mdata.get('title', _('Unknown'))))
|
||||
c = sanitize(mdata.get('authors', _('Unknown')))
|
||||
if c:
|
||||
newpath = os.path.join(newpath, c)
|
||||
resizable.append(c)
|
||||
c = sanitize(mdata.get('title', _('Unknown')))
|
||||
if c:
|
||||
newpath = os.path.join(newpath, c)
|
||||
resizable.append(c)
|
||||
|
||||
newpath = os.path.abspath(newpath)
|
||||
fname = sanitize(names.next())
|
||||
resizable.append(fname)
|
||||
filepath = os.path.join(newpath, fname)
|
||||
|
||||
if iswindows and len(filepath) > 250:
|
||||
extra = len(filepath) - 250
|
||||
delta = int(ceil(extra/float(len(resizable))))
|
||||
for x in resizable:
|
||||
if delta > len(x):
|
||||
r = ''
|
||||
else:
|
||||
r = x[:-delta]
|
||||
filepath = filepath.replace(os.sep+x+os.sep, os.sep+r+os.sep)
|
||||
filepath = filepath.replace(os.sep+os.sep, os.sep)
|
||||
newpath = os.path.dirname(filepath)
|
||||
|
||||
|
||||
if not os.path.exists(newpath):
|
||||
os.makedirs(newpath)
|
||||
|
||||
filepath = os.path.join(newpath, sanitize(names.next()))
|
||||
paths.append(filepath)
|
||||
|
||||
if hasattr(infile, 'read'):
|
||||
|
@ -1957,6 +1957,17 @@ class MobiWriter(object):
|
||||
# Test to see if this child's offset is the same as the previous child's
|
||||
# offset, skip it
|
||||
h = child.href
|
||||
first = False
|
||||
|
||||
if h is None:
|
||||
self._oeb.logger.warn(' Ignoring TOC entry with no href:',
|
||||
child.title)
|
||||
continue
|
||||
if h not in self._id_offsets:
|
||||
self._oeb.logger.warn(' Ignoring missing TOC entry:',
|
||||
child)
|
||||
continue
|
||||
|
||||
currentOffset = self._id_offsets[h]
|
||||
# print "_generate_ctoc: child offset: 0x%X" % currentOffset
|
||||
|
||||
@ -1967,7 +1978,6 @@ class MobiWriter(object):
|
||||
else :
|
||||
self._oeb.logger.warn(" Ignoring redundant href: %s in '%s'" % (h, child.title))
|
||||
|
||||
first = False
|
||||
else :
|
||||
if self.opts.verbose > 2 :
|
||||
self._oeb.logger.info("skipping class: %s depth %d at position %d" % \
|
||||
|
@ -41,9 +41,12 @@ class SpineItem(unicode):
|
||||
|
||||
def __new__(cls, *args):
|
||||
args = list(args)
|
||||
args[0] = args[0].partition('#')[0]
|
||||
obj = super(SpineItem, cls).__new__(cls, *args)
|
||||
path = args[0]
|
||||
ppath = path.partition('#')[0]
|
||||
if not os.path.exists(path) and os.path.exists(ppath):
|
||||
path = ppath
|
||||
args[0] = path
|
||||
obj = super(SpineItem, cls).__new__(cls, *args)
|
||||
raw = open(path, 'rb').read()
|
||||
raw, obj.encoding = xml_to_unicode(raw)
|
||||
obj.character_count = character_count(raw)
|
||||
|
BIN
src/calibre/gui2/images/news/noaa.png
Normal file
BIN
src/calibre/gui2/images/news/noaa.png
Normal file
Binary file not shown.
After Width: | Height: | Size: 994 B |
@ -47,7 +47,7 @@ recipe_modules = ['recipe_' + r for r in (
|
||||
'climate_progress', 'carta', 'slashdot', 'publico',
|
||||
'the_budget_fashionista', 'elperiodico_catalan',
|
||||
'elperiodico_spanish', 'expansion_spanish', 'lavanguardia',
|
||||
'marca', 'kellog_faculty', 'kellog_insight',
|
||||
'marca', 'kellog_faculty', 'kellog_insight', 'noaa',
|
||||
'theeconomictimes_india', '7dias', 'buenosaireseconomico',
|
||||
'diagonales', 'miradasalsur', 'newsweek_argentina', 'veintitres',
|
||||
'gva_be', 'hln', 'tijd', 'degentenaar', 'inquirer_net', 'uncrate',
|
||||
|
41
src/calibre/web/feeds/recipes/recipe_noaa.py
Normal file
41
src/calibre/web/feeds/recipes/recipe_noaa.py
Normal file
@ -0,0 +1,41 @@
|
||||
#!/usr/bin/env python
|
||||
|
||||
__license__ = 'GPL v3'
|
||||
__copyright__ = '2009, Darko Miletic <darko.miletic at gmail.com>'
|
||||
'''
|
||||
noaa.com
|
||||
'''
|
||||
|
||||
from calibre.web.feeds.news import BasicNewsRecipe
|
||||
from calibre.ebooks.BeautifulSoup import Tag
|
||||
|
||||
class NOAA(BasicNewsRecipe):
    """Recipe that downloads NOAA articles from the noaa.gov RSS feed.

    Written by Darko Miletic; fetches up to 100 articles no older than
    15 days and keeps only the main article container of each page.
    """

    title                  = 'NOAA Online'
    __author__             = 'Darko Miletic'
    description            = 'NOAA'
    publisher              = 'NOAA'
    category               = 'news, science, US, ocean'
    oldest_article         = 15
    max_articles_per_feed  = 100
    no_stylesheets         = True
    use_embedded_content   = False
    simultaneous_downloads = 1
    encoding               = 'utf-8'
    lang                   = 'en-US'
    language               = _('English')

    # Drop multimedia embeds; keep only the article body container.
    remove_tags    = [dict(name=['embed', 'object'])]
    keep_only_tags = [dict(name='div', attrs={'id': 'contentArea'})]

    feeds = [(u'NOAA articles', u'http://www.rss.noaa.gov/noaarss.xml')]

    def preprocess_html(self, soup):
        # Stamp the document with its language and charset via attributes
        # and <meta> tags so downstream conversion handles it correctly,
        # then normalize the images for Adobe readers.
        soup.html['xml:lang'] = self.lang
        soup.html['lang'] = self.lang
        lang_meta = Tag(soup, 'meta',
                        [("http-equiv", "Content-Language"),
                         ("content", self.lang)])
        charset_meta = Tag(soup, 'meta',
                           [("http-equiv", "Content-Type"),
                            ("content", "text/html; charset=UTF-8")])
        soup.head.insert(0, lang_meta)
        soup.head.insert(1, charset_meta)
        return self.adeify_images(soup)
|
||||
|
Loading…
x
Reference in New Issue
Block a user