revisions for annotations

2025-07-09 03:04:10 -04:00 · 2010-03-05 10:48:49 -08:00 · 2010-03-05 10:48:49 -08:00 · b86b7a9a80
commit b86b7a9a80
parent a14fdbc543 8ba4e70997
24 changed files with 801 additions and 226 deletions
--- a/resources/recipes/apod.recipe
+++ b/resources/recipes/apod.recipe
@ -0,0 +1,37 @@
 from calibre.web.feeds.news import BasicNewsRecipe
 class APOD(BasicNewsRecipe):
    title          = u'Astronomy Picture of the Day'
    __author__  = 'Starson17'
    description = 'Astronomy Pictures'
    language = 'en'
    use_embedded_content    = False
    no_stylesheets        = True
    cover_url     = 'http://apod.nasa.gov/apod/image/1003/m78_torregrosa.jpg'
    remove_javascript = True
    recursions = 0
    oldest_article        = 14
    feeds = [
             (u'Astronomy Picture of the Day', u'http://apod.nasa.gov/apod.rss')
             ]
    extra_css = '''
                    h1{font-family:Arial,Helvetica,sans-serif; font-weight:bold;font-size:large;}
                    h2{font-family:Arial,Helvetica,sans-serif; font-weight:normal;font-size:small;}
                    p{font-family:Arial,Helvetica,sans-serif;font-size:small;}
                    body{font-family:Helvetica,Arial,sans-serif;font-size:small;}
 		'''
    def postprocess_html(self, soup, first_fetch):
        center_tags = soup.findAll(['center'])
        p_tags = soup.findAll(['p'])
        last_center = center_tags[-1:]
        last_center[0].extract()
        first_p = p_tags[:1]
        for tag in first_p:
            tag.extract()
        last2_p = p_tags[-2:]
        for tag in last2_p:
            tag.extract()
        return soup
--- a/resources/recipes/ars_technica.recipe
+++ b/resources/recipes/ars_technica.recipe
@ -5,6 +5,7 @@ __copyright__ = '2008-2010, Darko Miletic <darko.miletic at gmail.com>'
 arstechnica.com
 '''
 import re
 from calibre.web.feeds.news import BasicNewsRecipe
 from calibre.ebooks.BeautifulSoup import BeautifulSoup, Tag
@ -20,7 +21,7 @@ class ArsTechnica2(BasicNewsRecipe):
    no_stylesheets        = True
    encoding              = 'utf-8'
    use_embedded_content  = False
-    extra_css             = ' body {font-family: sans-serif} .byline{font-weight: bold; line-height: 1em; font-size: 0.625em; text-decoration: none} '
+    extra_css             = ' body {font-family: Arial,Helvetica,sans-serif} .title{text-align: left} .byline{font-weight: bold; line-height: 1em; font-size: 0.625em; text-decoration: none} '
    conversion_options = {
                             'comments'  : description
@ -30,6 +31,10 @@ class ArsTechnica2(BasicNewsRecipe):
                         }
    preprocess_regexps = [
                (re.compile(r'<div class="news-item-figure', re.DOTALL|re.IGNORECASE),lambda match: '<div class="news-item-figure"')
               ,(re.compile(r'</title>.*?</head>', re.DOTALL|re.IGNORECASE),lambda match: '</title></head>')
                         ]
    keep_only_tags = [dict(name='div', attrs={'id':['story','etc-story']})]
@ -37,7 +42,7 @@ class ArsTechnica2(BasicNewsRecipe):
                     dict(name=['object','link','embed'])
                    ,dict(name='div', attrs={'class':'read-more-link'})
                  ]
-
+    remove_attributes=['width','height']
    feeds = [
              (u'Infinite Loop (Apple content)'        , u'http://feeds.arstechnica.com/arstechnica/apple/'      )
@ -90,3 +95,5 @@ class ArsTechnica2(BasicNewsRecipe):
        return soup
    def get_article_url(self, article):
        return article.get('guid',  None).rpartition('?')[0]
--- a/resources/recipes/johm.recipe
+++ b/resources/recipes/johm.recipe
@ -0,0 +1,87 @@
 # -*- coding: utf-8 -*-
 from calibre.web.feeds.recipes import BasicNewsRecipe
 class JournalofHospitalMedicine(BasicNewsRecipe):
    title       = 'Journal of Hospital Medicine'
    __author__  = 'Krittika Goyal'
    description = 'Medical news'
    timefmt = ' [%d %b, %Y]'
    needs_subscription = True
    no_stylesheets = True
    #remove_tags_before = dict(name='div', attrs={'align':'center'})
    #remove_tags_after  = dict(name='ol', attrs={'compact':'COMPACT'})
    remove_tags = [
       dict(name='iframe'),
       dict(name='div', attrs={'class':'subContent'}),
       dict(name='div', attrs={'id':['contentFrame']}),
       #dict(name='form', attrs={'onsubmit':"return verifySearch(this.w,'Keyword, citation, or author')"}),
       #dict(name='table', attrs={'align':'RIGHT'}),
    ]
   # TO LOGIN
    def get_browser(self):
        br = BasicNewsRecipe.get_browser()
        br.open('http://www3.interscience.wiley.com/cgi-bin/home')
        br.select_form(name='siteLogin')
        br['LoginName'] = self.username
        br['Password'] = self.password
        response = br.submit()
        raw = response.read()
        if 'userName = ""' in raw:
            raise Exception('Login failed. Check your username and password')
        return br
    #TO GET ARTICLE TOC
    def johm_get_index(self):
            return self.index_to_soup('http://www3.interscience.wiley.com/journal/111081937/home')
    # To parse artice toc
    def parse_index(self):
            parse_soup = self.johm_get_index()
            div = parse_soup.find(id='contentCell')
            current_section = None
            current_articles = []
            feeds = []
            for x in div.findAll(True):
                if x.name == 'h4':
                    # Section heading found
                    if current_articles and current_section:
                        feeds.append((current_section, current_articles))
                    current_section = self.tag_to_string(x)
                    current_articles = []
                    self.log('\tFound section:', current_section)
                if current_section is not None and x.name == 'strong':
                    title = self.tag_to_string(x)
                    p = x.parent.parent.find('a', href=lambda x: x and '/HTMLSTART' in x)
                    if p is None:
                        continue
                    url = p.get('href', False)
                    if not url or not title:
                        continue
                    if url.startswith('/'):
                         url = 'http://www3.interscience.wiley.com'+url
                    url = url.replace('/HTMLSTART', '/main.html,ftx_abs')
                    self.log('\t\tFound article:', title)
                    self.log('\t\t\t', url)
                    #if url.startswith('/'):
                        #url = 'http://online.wsj.com'+url
                    current_articles.append({'title': title, 'url':url,
                        'description':'', 'date':''})
            if current_articles and current_section:
                feeds.append((current_section, current_articles))
            return feeds
    def preprocess_html(self, soup):
        for img in soup.findAll('img', src=True):
            img['src'] = img['src'].replace('tfig', 'nfig')
        return soup
--- a/resources/recipes/sfbg.recipe
+++ b/resources/recipes/sfbg.recipe
@ -0,0 +1,42 @@
 from calibre.web.feeds.news import BasicNewsRecipe
 from calibre.ebooks.BeautifulSoup import BeautifulSoup
 class SanFranciscoBayGuardian(BasicNewsRecipe):
    title          = u'San Francisco Bay Guardian'
    language       = 'en'
    __author__     = 'Krittika Goyal'
    oldest_article = 1 #days
    max_articles_per_feed = 25
    #encoding = 'latin1'
    no_stylesheets = True
    remove_tags_before = dict(name='div', attrs={'id':'story_header'})
    remove_tags_after  = dict(name='div', attrs={'id':'shirttail'})
    remove_tags = [
       dict(name='iframe'),
       #dict(name='div', attrs={'class':'related-articles'}),
        dict(name='div', attrs={'id':['story_tools', 'toolbox', 'shirttail', 'comment_widget']}),
       #dict(name='ul', attrs={'class':'article-tools'}),
       dict(name='ul', attrs={'id':'story_tabs'}),
    ]
    feeds = [
        ('Cover', 'http://www.newsobserver.com/100/index.rss'),
        ('News', 'http://www.newsobserver.com/102/index.rss'),
        ('Politics', 'http://www.newsobserver.com/105/index.rss'),
        ('Business', 'http://www.newsobserver.com/104/index.rss'),
        ('Sports', 'http://www.newsobserver.com/103/index.rss'),
        ('College Sports', 'http://www.newsobserver.com/119/index.rss'),
        ('Lifestyles', 'http://www.newsobserver.com/106/index.rss'),
        ('Editorials', 'http://www.newsobserver.com/158/index.rss')]
    def preprocess_html(self, soup):
        story = soup.find(name='div', attrs={'id':'story_body'})
        #td = heading.findParent(name='td')
        #td.extract()
        soup = BeautifulSoup('<html><head><title>t</title></head><body></body></html>')
        body = soup.find(name='body')
        body.insert(0, story)
        return soup
--- a/resources/recipes/smith.recipe
+++ b/resources/recipes/smith.recipe
@ -0,0 +1,52 @@
 from calibre.web.feeds.news import BasicNewsRecipe
 from calibre.ebooks.BeautifulSoup import BeautifulSoup
 class SmithsonianMagazine(BasicNewsRecipe):
    title          = u'Smithsonian Magazine'
    language       = 'en'
    __author__     = 'Krittika Goyal'
    oldest_article = 31#days
    max_articles_per_feed = 50
    #encoding = 'latin1'
    recursions = 1
    match_regexps = ['&page=[2-9]$']
    remove_stylesheets = True
    #remove_tags_before = dict(name='h1', attrs={'class':'heading'})
    remove_tags_after  = dict(name='p', attrs={'id':'articlePaginationWrapper'})
    remove_tags = [
       dict(name='iframe'),
       dict(name='div', attrs={'class':'article_sidebar_border'}),
       dict(name='div', attrs={'id':['article_sidebar_border', 'most-popular_large']}),
       #dict(name='ul', attrs={'class':'article-tools'}),
       dict(name='ul', attrs={'class':'cat-breadcrumb col three last'}),
    ]
    feeds          = [
 ('History and Archeology',
 'http://feeds.feedburner.com/smithsonianmag/history-archaeology'),
 ('People and Places',
 'http://feeds.feedburner.com/smithsonianmag/people-places'),
 ('Science and Nature',
 'http://feeds.feedburner.com/smithsonianmag/science-nature'),
 ('Arts and Culture',
 'http://feeds.feedburner.com/smithsonianmag/arts-culture'),
 ('Travel',
 'http://feeds.feedburner.com/smithsonianmag/travel'),
 ]
    def preprocess_html(self, soup):
        story = soup.find(name='div', attrs={'id':'article-left'})
        #td = heading.findParent(name='td')
        #td.extract()
        soup = BeautifulSoup('<html><head><title>t</title></head><body></body></html>')
        body = soup.find(name='body')
        body.insert(0, story)
        return soup
    def postprocess_html(self, soup, first):
        for p in soup.findAll(id='articlePaginationWrapper'): p.extract()
        if not first:
             for div in soup.findAll(id='article-head'): div.extract()
        return soup
--- a/setup/extensions.py
+++ b/setup/extensions.py
@ -143,7 +143,7 @@ extensions = [
 if iswindows:
    extensions.append(Extension('winutil',
                ['calibre/utils/windows/winutil.c'],
-                libraries=['shell32', 'setupapi'],
+                libraries=['shell32', 'setupapi', 'wininet'],
                cflags=['/X']
                ))
--- a/src/calibre/devices/interface.py
+++ b/src/calibre/devices/interface.py
@ -6,6 +6,7 @@ the GUI. A device backend must subclass the L{Device} class. See prs500.py for
 a backend that implement the Device interface for the SONY PRS500 Reader.
 """
 import os
 from collections import namedtuple
 from calibre.customize import Plugin
 from calibre.constants import iswindows
@ -43,6 +44,9 @@ class DevicePlugin(Plugin):
    #: Icon for this device
    icon = I('reader.svg')
    # Used by gui2.ui:annotations_fetched() and devices.kindle.driver:get_annotations()
    UserAnnotation = namedtuple('Annotation','type, bookmark')
    @classmethod
    def get_gui_name(cls):
        if hasattr(cls, 'gui_name'):
--- a/src/calibre/devices/kindle/driver.py
+++ b/src/calibre/devices/kindle/driver.py
@ -7,15 +7,12 @@ __docformat__ = 'restructuredtext en'
 '''
 Device driver for Amazon's Kindle
 '''
-
+import os, re, sys
 from cStringIO import StringIO
 import os
 import re
 from struct import unpack
 import sys
 from calibre.devices.usbms.driver import USBMS
-from calibre.ebooks.metadata.mobi import StreamSlicer
+from calibre.utils.logging import Log
 class KINDLE(USBMS):
@ -65,6 +62,16 @@ class KINDLE(USBMS):
        return mi
    def get_annotations(self, path_map):
        MBP_FORMATS = [u'azw', u'mobi', u'prc', u'txt']
        TAN_FORMATS = [u'tpz', u'azw1']
        mbp_formats = set()
        for fmt in MBP_FORMATS:
            mbp_formats.add(fmt)
        tan_formats = set()
        for fmt in TAN_FORMATS:
            tan_formats.add(fmt)
        def get_storage():
            storage = []
            if self._main_prefix:
@ -75,36 +82,49 @@ class KINDLE(USBMS):
                storage.append(os.path.join(self._card_b_prefix, self.EBOOK_DIR_CARD_B))
            return storage
-        def resolve_mbp_paths(storage, path_map):
+        def resolve_bookmark_paths(storage, path_map):
            pop_list = []
            book_ext = {}
            for id in path_map:
-                for vol in storage:
+                file_fmts = set()
-                    #print "path_map[id]: %s" % path_map[id]
+                for fmt in path_map[id]['fmts']:
-                    mbp_path = path_map[id].replace(os.path.abspath('/<storage>'),vol)
+                    file_fmts.add(fmt)
-                    #print "looking for mbp_path: %s" % mbp_path
+
-                    if os.path.exists(mbp_path):
+                bookmark_extension = None
-                        #print "mbp_path found"
+                if file_fmts.intersection(mbp_formats):
-                        path_map[id] = mbp_path
+                    book_extension = list(file_fmts.intersection(mbp_formats))[0]
-                        break
+                    bookmark_extension = 'mbp'
                elif file_fmts.intersection(tan_formats):
                    book_extension = list(file_fmts.intersection(tan_formats))[0]
                    bookmark_extension = 'tan'
                if bookmark_extension:
                    for vol in storage:
                        bkmk_path = path_map[id]['path'].replace(os.path.abspath('/<storage>'),vol)
                        bkmk_path = bkmk_path.replace('bookmark',bookmark_extension)
                        if os.path.exists(bkmk_path):
                            path_map[id] = bkmk_path
                            book_ext[id] = book_extension
                            break
                    else:
                        pop_list.append(id)
                else:
                    #print "mbp_path not found"
                    pop_list.append(id)
-            # Remove non-existent mbp files
+            # Remove non-existent bookmark templates
            for id in pop_list:
                path_map.pop(id)
-            return path_map
+            return path_map, book_ext
        log = Log()
        storage = get_storage()
-        path_map = resolve_mbp_paths(storage, path_map)
+        path_map, book_ext = resolve_bookmark_paths(storage, path_map)
        # path_map is now a mapping of valid mbp files
        # Not yet implemented - Topaz annotations
        bookmarked_books = {}
        MBP_FORMATS = ['azw', 'mobi', 'prc', 'txt']
        for id in path_map:
-            myBookmark = Bookmark(path_map[id], MBP_FORMATS, id)
+            bookmark_ext = path_map[id].rpartition('.')[2]
-            bookmarked_books[id] = self.UserAnnotation(type='mobi', bookmark=myBookmark)
+            myBookmark = Bookmark(path_map[id], id, book_ext[id], bookmark_ext)
            bookmarked_books[id] = self.UserAnnotation(type='kindle', bookmark=myBookmark)
        # This returns as job.result in gui2.ui.annotations_fetched(self,job)
        return bookmarked_books
@ -134,22 +154,25 @@ class Bookmark():
    A simple class fetching bookmark data
    Kindle-specific
    '''
-    def __init__(self, path, formats, id):
+    def __init__(self, path, id, book_format, bookmark_extension):
-        self.book_format = None
+        self.book_format = book_format
        self.bookmark_extension = bookmark_extension
        self.book_length = 0
        self.id = id
        self.last_read = 0
        self.last_read_location = 0
        self.timestamp = 0
        self.user_notes = None
        self.get_bookmark_data(path)
-        self.get_book_length(path, formats)
+        self.get_book_length(path)
        try:
-            self.percent_read = float(100*self.last_read_location / self.book_length)
+            self.percent_read = float(100*self.last_read / self.book_length)
        except:
            self.percent_read = 0
    def record(self, n):
        from calibre.ebooks.metadata.mobi import StreamSlicer
        if n >= self.nrecs:
            raise ValueError('non-existent record %r' % n)
        offoff = 78 + (8 * n)
@ -159,19 +182,22 @@ class Bookmark():
            stop, = unpack('>I', self.data[offoff + 8:offoff + 12])
        return StreamSlicer(self.stream, start, stop)
-    def get_bookmark_data(self, path, fetchUserNotes=True):
+    def get_bookmark_data(self, path):
        ''' Return the timestamp and last_read_location '''
-        with open(path,'rb') as f:
+        from calibre.ebooks.metadata.mobi import StreamSlicer
-            stream = StringIO(f.read())
+        user_notes = {}
-            data = StreamSlicer(stream)
+        if self.bookmark_extension == 'mbp':
-            self.timestamp, = unpack('>I', data[0x24:0x28])
+            with open(path,'rb') as f:
-            bpar_offset, = unpack('>I', data[0x4e:0x52])
+                stream = StringIO(f.read())
-            lrlo = bpar_offset + 0x0c
+                data = StreamSlicer(stream)
-            self.last_read_location = int(unpack('>I', data[lrlo:lrlo+4])[0])
+                self.timestamp, = unpack('>I', data[0x24:0x28])
-            entries, = unpack('>I', data[0x4a:0x4e])
+                bpar_offset, = unpack('>I', data[0x4e:0x52])
                lrlo = bpar_offset + 0x0c
                self.last_read = int(unpack('>I', data[lrlo:lrlo+4])[0])
                self.last_read_location = self.last_read/150 + 1
                entries, = unpack('>I', data[0x4a:0x4e])
-            # Store the annotations/locations
+                # Store the annotations/locations
            if fetchUserNotes:
                bpl = bpar_offset + 4
                bpar_len, = unpack('>I', data[bpl:bpl+4])
                bpar_len += 8
@ -184,7 +210,6 @@ class Bookmark():
                current_entry = 1
                sig = data[eo:eo+4]
                previous_block = None
                user_notes = {}
                while sig == 'DATA':
                    text = None
@ -206,8 +231,11 @@ class Bookmark():
                        text = data[eo+8:eo+8+rec_len].decode('utf-16-be')
                    if entry_type:
-                        user_notes[location] = dict(type=entry_type, id=self.id,
+                        displayed_location = location/150 + 1
-                                                    text=data[eo+8:eo+8+rec_len].decode('utf-16-be'))
+                        user_notes[location] = dict(id=self.id,
                                                    displayed_location=displayed_location,
                                                    type=entry_type,
                                                    text=text)
                        #print " %2d: %s %s" % (current_entry, entry_type,'at %d' % location if location else '')
                    #if current_block == 'text_block':
                        #self.textdump(text)
@ -229,38 +257,104 @@ class Bookmark():
                        # If a bookmark coincides with a user annotation, the locs could
                        # be the same - cheat by nudging -1
                        # Skip bookmark for last_read_location
-                        if end_loc != self.last_read_location:
+                        if end_loc != self.last_read:
-                            user_notes[end_loc - 1] = dict(type='Bookmark',id=self.id,text=None)
+                            displayed_location = end_loc/150 + 1
                            user_notes[end_loc - 1] = dict(id=self.id,
                                                           displayed_location=displayed_location,
                                                           type='Bookmark',
                                                           text=None)
                    rec_len, = unpack('>I', data[eo+4:eo+8])
                    eo += rec_len + 8
                    sig = data[eo:eo+4]
        elif self.bookmark_extension == 'tan':
            # TAN bookmarks
            self.timestamp = os.path.getmtime(path)
            with open(path,'rb') as f:
                stream = StringIO(f.read())
                data = StreamSlicer(stream)
                self.last_read = int(unpack('>I', data[5:9])[0])
                self.last_read_location = self.last_read/33
                entries, = unpack('>I', data[9:13])
                current_entry = 0
                e_base = 0x0d
                while current_entry < entries:
                    location, = unpack('>I', data[e_base+2:e_base+6])
                    text = None
                    text_len, = unpack('>I', data[e_base+0xA:e_base+0xE])
                    e_type, = unpack('>B', data[e_base+1])
                    if e_type == 0:
                        e_type = 'Bookmark'
                    elif e_type == 1:
                        e_type = 'Highlight'
                        text = "(Topaz highlights not yet supported)"
                    elif e_type == 2:
                        e_type = 'Note'
                        text = data[e_base+0x10:e_base+0x10+text_len]
                    else:
                        e_type = 'Unknown annotation type'
                    if self.book_format in ['tpz','azw1']:
                        # *** This needs fine-tuning
                        displayed_location = location/33
                    elif self.book_format == 'pdf':
                        # *** This needs testing
                        displayed_location = location
                    user_notes[location] = dict(id=self.id,
                                                displayed_location=displayed_location,
                                                type=e_type,
                                                text=text)
                    if text_len == 0xFFFFFFFF:
                        e_base = e_base + 14
                    else:
                        e_base = e_base + 14 + 2 + text_len
                    current_entry += 1
                for location in user_notes:
                    if location == self.last_read:
                        user_notes.pop(location)
                        break
        else:
            print "unsupported bookmark_extension: %s" % self.bookmark_extension
        self.user_notes = user_notes
        '''
        for location in sorted(user_notes):
-            print '  Location %d: %s\n%s' % self.magicKindleLocationCalculator(location),
+            print '  Location %d: %s\n%s' % (user_notes[location]['displayed_location'],
                                                     user_notes[location]['type'],
                                    '\n'.join(self.textdump(user_notes[location]['text'])))
        '''
        self.user_notes = user_notes
-    def get_book_length(self, path, formats):
+    def get_book_length(self, path):
-        # This assumes only one of the possible formats exists on the Kindle
+        from calibre.ebooks.metadata.mobi import StreamSlicer
-        book_fs = None
+        book_fs = path.replace('.%s' % self.bookmark_extension,'.%s' % self.book_format)
-        for format in formats:
+
-            fmt = format.rpartition('.')[2]
+        self.book_length = 0
-            book_fs = path.replace('.mbp','.%s' % fmt)
+        if self.bookmark_extension == 'mbp':
-            if os.path.exists(book_fs):
+            # Read the book len from the header
-                self.book_format = fmt
+            with open(book_fs,'rb') as f:
-                break
+                self.stream = StringIO(f.read())
                self.data = StreamSlicer(self.stream)
                self.nrecs, = unpack('>H', self.data[76:78])
                record0 = self.record(0)
                self.book_length = int(unpack('>I', record0[0x04:0x08])[0])
        elif self.bookmark_extension == 'tan':
            # Read bookLength from metadata
            with open(book_fs,'rb') as f:
                stream = StringIO(f.read())
                raw = stream.read(8*1024)
                if not raw.startswith('TPZ'):
                    raise ValueError('Not a Topaz file')
                first = raw.find('metadata')
                if first < 0:
                    raise ValueError('Invalid Topaz file')
                second = raw.find('metadata', first+10)
                if second < 0:
                    raise ValueError('Invalid Topaz file')
                raw = raw[second:second+1000]
                idx = raw.find('bookLength')
                if idx > -1:
                    length = ord(raw[idx+len('bookLength')])
                    self.book_length = int(raw[idx+len('bookLength')+1:idx+len('bookLength')+1+length])
        else:
-            #print "no files matching library formats exist on device"
+            print "unsupported bookmark_extension: %s" % bookmark_extension
            self.book_length = 0
            return
        # Read the book len from the header
        with open(book_fs,'rb') as f:
            self.stream = StringIO(f.read())
            self.data = StreamSlicer(self.stream)
            self.nrecs, = unpack('>H', self.data[76:78])
            record0 = self.record(0)
            self.book_length = int(unpack('>I', record0[0x04:0x08])[0])
--- a/src/calibre/devices/usbms/device.py
+++ b/src/calibre/devices/usbms/device.py
@ -18,7 +18,6 @@ import re
 import sys
 import glob
 from collections import namedtuple
 from itertools import repeat
 from calibre.devices.interface import DevicePlugin
@ -90,8 +89,6 @@ class Device(DeviceConfig, DevicePlugin):
    EBOOK_DIR_CARD_B = ''
    DELETE_EXTS = []
    # Used by gui2.ui:annotations_fetched() and devices.kindle.driver:get_annotations()
    UserAnnotation = namedtuple('Annotation','type, bookmark')
    def reset(self, key='-1', log_packets=False, report_progress=None,
            detected_device=None):
--- a/src/calibre/ebooks/chardet/init.py
+++ b/src/calibre/ebooks/chardet/init.py
@ -53,13 +53,15 @@ _CHARSET_ALIASES = { "macintosh" : "mac-roman",
                        "x-sjis" : "shift-jis" }
-def force_encoding(raw, verbose):
+def force_encoding(raw, verbose, assume_utf8=False):
    from calibre.constants import preferred_encoding
    try:
        chardet = detect(raw)
    except:
        chardet = {'encoding':preferred_encoding, 'confidence':0}
    encoding = chardet['encoding']
    if chardet['confidence'] < 1 and assume_utf8:
        encoding = 'utf-8'
    if chardet['confidence'] < 1 and verbose:
        print 'WARNING: Encoding detection confidence %d%%'%(chardet['confidence']*100)
    if not encoding:
@ -73,7 +75,7 @@ def force_encoding(raw, verbose):
 def xml_to_unicode(raw, verbose=False, strip_encoding_pats=False,
-                   resolve_entities=False):
+                   resolve_entities=False, assume_utf8=False):
    '''
    Force conversion of byte string to unicode. Tries to look for XML/HTML
    encoding declaration first, if not found uses the chardet library and
@ -95,7 +97,7 @@ def xml_to_unicode(raw, verbose=False, strip_encoding_pats=False,
                encoding = match.group(1)
                break
        if encoding is None:
-            encoding = force_encoding(raw, verbose)
+            encoding = force_encoding(raw, verbose, assume_utf8=assume_utf8)
        try:
            if encoding.lower().strip() == 'macintosh':
                encoding = 'mac-roman'
--- a/src/calibre/ebooks/epub/input.py
+++ b/src/calibre/ebooks/epub/input.py
@ -3,7 +3,7 @@ __license__ = 'GPL 3'
 __copyright__ = '2009, Kovid Goyal <kovid@kovidgoyal.net>'
 __docformat__ = 'restructuredtext en'
-import os, re, uuid
+import os, uuid
 from itertools import cycle
 from lxml import etree
@ -19,8 +19,7 @@ class EPUBInput(InputFormatPlugin):
    recommendations = set([('page_breaks_before', '/', OptionRecommendation.MED)])
-    @classmethod
+    def decrypt_font(self, key, path):
    def decrypt_font(cls, key, path):
        raw = open(path, 'rb').read()
        crypt = raw[:1024]
        key = cycle(iter(key))
@ -29,13 +28,18 @@ class EPUBInput(InputFormatPlugin):
            f.write(decrypt)
            f.write(raw[1024:])
-    @classmethod
+    def process_encryption(self, encfile, opf, log):
    def process_encryption(cls, encfile, opf, log):
        key = None
-        m = re.search(r'(?i)(urn:uuid:[0-9a-f-]+)', open(opf, 'rb').read())
+        for item in opf.identifier_iter():
-        if m:
+            scheme = None
-            key = m.group(1)
+            for key in item.attrib.keys():
-            key = list(map(ord, uuid.UUID(key).bytes))
+                if key.endswith('scheme'):
                    scheme = item.get(key)
            if (scheme and scheme.lower() == 'uuid') or \
                    (item.text and item.text.startswith('urn:uuid:')):
                key = str(item.text).rpartition(':')[-1]
                key = list(map(ord, uuid.UUID(key).bytes))
        try:
            root = etree.parse(encfile)
            for em in root.xpath('descendant::*[contains(name(), "EncryptionMethod")]'):
@ -46,7 +50,8 @@ class EPUBInput(InputFormatPlugin):
                uri = cr.get('URI')
                path = os.path.abspath(os.path.join(os.path.dirname(encfile), '..', *uri.split('/')))
                if os.path.exists(path):
-                    cls.decrypt_font(key, path)
+                    self._encrypted_font_uris.append(uri)
                    self.decrypt_font(key, path)
            return True
        except:
            import traceback
@ -115,14 +120,17 @@ class EPUBInput(InputFormatPlugin):
        if opf is None:
            raise ValueError('%s is not a valid EPUB file'%path)
        if os.path.exists(encfile):
            if not self.process_encryption(encfile, opf, log):
                raise DRMError(os.path.basename(path))
        opf = os.path.relpath(opf, os.getcwdu())
        parts = os.path.split(opf)
        opf = OPF(opf, os.path.dirname(os.path.abspath(opf)))
        self._encrypted_font_uris = []
        if os.path.exists(encfile):
            if not self.process_encryption(encfile, opf, log):
                raise DRMError(os.path.basename(path))
        self.encrypted_fonts = self._encrypted_font_uris
        if len(parts) > 1 and parts[0]:
            delta = '/'.join(parts[:-1])+'/'
            for elem in opf.itermanifest():
--- a/src/calibre/ebooks/epub/output.py
+++ b/src/calibre/ebooks/epub/output.py
@ -12,8 +12,9 @@ from urllib import unquote
 from calibre.customize.conversion import OutputFormatPlugin
 from calibre.ptempfile import TemporaryDirectory
 from calibre.constants import __appname__, __version__
-from calibre import strftime, guess_type, prepare_string_for_xml
+from calibre import strftime, guess_type, prepare_string_for_xml, CurrentDir
 from calibre.customize.conversion import OptionRecommendation
 from calibre.constants import filesystem_encoding
 from lxml import etree
@ -170,6 +171,19 @@ class EPUBOutput(OutputFormatPlugin):
        self.workaround_sony_quirks()
        from calibre.ebooks.oeb.base import OPF
        identifiers = oeb.metadata['identifier']
        uuid = None
        for x in identifiers:
            if x.get(OPF('scheme'), None).lower() == 'uuid' or unicode(x).startswith('urn:uuid:'):
                uuid = unicode(x).split(':')[-1]
                break
        if uuid is None:
            self.log.warn('No UUID identifier found')
            from uuid import uuid4
            uuid = str(uuid4())
            oeb.metadata.add('identifier', uuid, scheme='uuid', id=uuid)
        with TemporaryDirectory('_epub_output') as tdir:
            from calibre.customize.ui import plugin_for_output_format
            oeb_output = plugin_for_output_format('oeb')
@ -177,10 +191,16 @@ class EPUBOutput(OutputFormatPlugin):
            opf = [x for x in os.listdir(tdir) if x.endswith('.opf')][0]
            self.condense_ncx([os.path.join(tdir, x) for x in os.listdir(tdir)\
                    if x.endswith('.ncx')][0])
            encrypted_fonts = getattr(input_plugin, 'encrypted_fonts', [])
            encryption = None
            if encrypted_fonts:
                encryption = self.encrypt_fonts(encrypted_fonts, tdir, uuid)
            from calibre.ebooks.epub import initialize_container
            epub = initialize_container(output_path, os.path.basename(opf))
            epub.add_dir(tdir)
            if encryption is not None:
                epub.writestr('META-INF/encryption.xml', encryption)
            if opts.extract_to is not None:
                if os.path.exists(opts.extract_to):
                    shutil.rmtree(opts.extract_to)
@ -189,6 +209,52 @@ class EPUBOutput(OutputFormatPlugin):
                self.log.info('EPUB extracted to', opts.extract_to)
            epub.close()
    def encrypt_fonts(self, uris, tdir, uuid):
        from binascii import unhexlify
        key = re.sub(r'[^a-fA-F0-9]', '', uuid)
        if len(key) < 16:
            raise ValueError('UUID identifier %r is invalid'%uuid)
        key = unhexlify((key + key)[:32])
        key = tuple(map(ord, key))
        paths = []
        with CurrentDir(tdir):
            paths = [os.path.join(*x.split('/')) for x in uris]
            uris = dict(zip(uris, paths))
            fonts = []
            for uri in list(uris.keys()):
                path = uris[uri]
                if isinstance(path, unicode):
                    path = path.encode(filesystem_encoding)
                if not os.path.exists(path):
                    uris.pop(uri)
                    continue
                self.log.debug('Encrypting font:', uri)
                with open(path, 'r+b') as f:
                    data = f.read(1024)
                    f.seek(0)
                    for i in range(1024):
                        f.write(chr(ord(data[i]) ^ key[i%16]))
                if not isinstance(uri, unicode):
                    uri = uri.decode('utf-8')
                fonts.append(u'''
                <enc:EncryptedData>
                    <enc:EncryptionMethod Algorithm="http://ns.adobe.com/pdf/enc#RC"/>
                    <enc:CipherData>
                    <enc:CipherReference URI="%s"/>
                    </enc:CipherData>
                </enc:EncryptedData>
                '''%(uri.replace('"', '\\"')))
            if fonts:
                    ans = '''<encryption
                    xmlns="urn:oasis:names:tc:opendocument:xmlns:container"
                    xmlns:enc="http://www.w3.org/2001/04/xmlenc#"
                    xmlns:deenc="http://ns.adobe.com/digitaleditions/enc">
                    '''
                    ans += (u'\n'.join(fonts)).encode('utf-8')
                    ans += '\n</encryption>'
                    return ans
    def default_cover(self):
        '''
        Create a generic cover for books that dont have a cover
--- a/src/calibre/ebooks/metadata/opf2.py
+++ b/src/calibre/ebooks/metadata/opf2.py
@ -779,6 +779,9 @@ class OPF(object):
            self.set_text(matches[0], unicode(val))
        return property(fget=fget, fset=fset)
    def identifier_iter(self):
        for item in self.identifier_path(self.metadata):
            yield item
    def guess_cover(self):
        '''
--- a/src/calibre/ebooks/metadata/toc.py
+++ b/src/calibre/ebooks/metadata/toc.py
@ -149,7 +149,8 @@ class TOC(list):
    def read_ncx_toc(self, toc):
        self.base_path = os.path.dirname(toc)
-        soup = NCXSoup(xml_to_unicode(open(toc, 'rb').read())[0])
+        raw  = xml_to_unicode(open(toc, 'rb').read(), assume_utf8=True)[0]
        soup = NCXSoup(raw)
        def process_navpoint(np, dest):
            play_order = np.get('playOrder', None)
@ -160,7 +161,7 @@ class TOC(list):
            if nl is not None:
                text = u''
                for txt in nl.findAll(re.compile('text')):
-                    text += ''.join([unicode(s) for s in txt.findAll(text=True)])
+                    text += u''.join([unicode(s) for s in txt.findAll(text=True)])
                content = np.find(re.compile('content'))
                if content is None or not content.has_key('src') or not txt:
                    return
--- a/src/calibre/ebooks/oeb/iterator.py
+++ b/src/calibre/ebooks/oeb/iterator.py
@ -152,13 +152,17 @@ class EbookIterator(object):
                        prints('Substituting font family: %s -> %s'%(bad, good))
                        return match.group().replace(bad, '"%s"'%good)
            from calibre.ebooks.chardet import force_encoding
            for csspath in css_files:
                with open(csspath, 'r+b') as f:
                    css = f.read()
-                    css = font_family_pat.sub(prepend_embedded_font, css)
+                    enc = force_encoding(css, False)
-                    f.seek(0)
+                    css = css.decode(enc, 'replace')
-                    f.truncate()
+                    ncss = font_family_pat.sub(prepend_embedded_font, css)
-                    f.write(css)
+                    if ncss != css:
                        f.seek(0)
                        f.truncate()
                        f.write(ncss.encode(enc))
    def __enter__(self, processed=False):
        self.delete_on_exit = []
--- a/src/calibre/ebooks/oeb/reader.py
+++ b/src/calibre/ebooks/oeb/reader.py
@ -331,7 +331,10 @@ class OEBReader(object):
            id = child.get('id')
            klass = child.get('class', 'chapter')
-            po = int(child.get('playOrder', self.oeb.toc.next_play_order()))
+            try:
                po = int(child.get('playOrder', self.oeb.toc.next_play_order()))
            except:
                po = self.oeb.toc.next_play_order()
            authorElement = xpath(child,
                    'descendant::calibre:meta[@name = "author"]')
--- a/src/calibre/ebooks/pdb/pdf/reader.py
+++ b/src/calibre/ebooks/pdb/pdf/reader.py
@ -27,7 +27,7 @@ class Reader(FormatReader):
        self.log.info('Extracting PDF...')
        with TemporaryFile() as pdf_n:
-            pdf = open(pdf_n, 'rw+b')
+            pdf = open(pdf_n, 'rwb')
            for x in xrange(self.header.section_count()):
                pdf.write(self.header.section_data(x))
--- a/src/calibre/gui2/dialogs/scheduler.py
+++ b/src/calibre/gui2/dialogs/scheduler.py
@ -18,6 +18,7 @@ from calibre.gui2 import config as gconf, error_dialog
 from calibre.web.feeds.recipes.model import RecipeModel
 from calibre.ptempfile import PersistentTemporaryFile
 from calibre.utils.date import utcnow
 from calibre.utils.network import internet_connected
 class SchedulerDialog(QDialog, Ui_Dialog):
@ -304,6 +305,8 @@ class Scheduler(QObject):
            self.download(urn)
    def download(self, urn):
        if not internet_connected():
            return
        self.lock.lock()
        doit = urn not in self.download_queue
        self.lock.unlock()
--- a/src/calibre/gui2/ui.py
+++ b/src/calibre/gui2/ui.py
@ -10,7 +10,6 @@ __docformat__ = 'restructuredtext en'
 '''The main GUI'''
 import collections, datetime, os, shutil, sys, textwrap, time
 from collections import namedtuple
 from xml.parsers.expat import ExpatError
 from Queue import Queue, Empty
 from threading import Thread
@ -20,7 +19,7 @@ from PyQt4.Qt import Qt, SIGNAL, QObject, QCoreApplication, QUrl, QTimer, \
                     QToolButton, QDialog, QDesktopServices, QFileDialog, \
                     QSystemTrayIcon, QApplication, QKeySequence, QAction, \
                     QMessageBox, QStackedLayout, QHelpEvent, QInputDialog,\
-                     QThread
+                     QThread, pyqtSignal
 from PyQt4.QtSvg import QSvgRenderer
 from calibre import  prints, patheq, strftime
@ -31,7 +30,7 @@ from calibre.ptempfile import PersistentTemporaryFile
 from calibre.utils.config import prefs, dynamic
 from calibre.utils.ipc.server import Server
 from calibre.gui2 import warning_dialog, choose_files, error_dialog, \
-                            question_dialog,\
+                           question_dialog,\
                           pixmap_to_data, choose_dir, \
                           Dispatcher, gprefs, \
                           available_height, \
@ -57,7 +56,6 @@ from calibre.gui2.dialogs.choose_format import ChooseFormatDialog
 from calibre.gui2.dialogs.book_info import BookInfo
 from calibre.ebooks import BOOK_EXTENSIONS
 from calibre.ebooks.BeautifulSoup import BeautifulSoup, Tag, NavigableString
 from calibre.library.cli import send_message as calibre_send_message
 from calibre.library.database2 import LibraryDatabase2, CoverCache
 from calibre.gui2.dialogs.confirm_delete import confirm
@ -928,9 +926,7 @@ class Main(MainWindow, Ui_MainWindow, DeviceGUI):
    ######################### Fetch annotations ################################
    def fetch_annotations(self, *args):
-    	# Figure out a list of ids using the same logic as the catalog generation
+		# Generate a path_map from selected ids
    	# FUnction.  Use the currently connected device to map ids to paths
        def get_ids_from_selected_rows():
 			rows = self.library_view.selectionModel().selectedRows()
 			if not rows or len(rows) < 2:
@ -938,15 +934,22 @@ class Main(MainWindow, Ui_MainWindow, DeviceGUI):
 			ids = map(self.library_view.model().id, rows)
 			return ids
 		def get_formats(id):
 			book_data = db.get_data_as_dict(ids=[id])[0]
 			formats = book_data['formats']
 			fmts = []
 			for format in formats:
 				fmts.append(format.rpartition('.')[2])
 			return fmts
 		def generate_annotation_paths(ids, db, device):
-			# Generate a dict {1:'documents/documents/Asimov, Isaac/Foundation - Isaac Asimov.epub'}
+			# Generate path templates
-			# These are the not the absolute paths - individual storage mount points will need to be
+			# Individual storage mount points scanned/resolved in driver.get_annotations()
 			# prepended during the search
 			path_map = {}
 			for id in ids:
 				mi = db.get_metadata(id, index_is_id=True)
-				a_path = device.create_upload_path(os.path.abspath('/<storage>'), mi, 'x.mbp', create_dirs=False)
+				a_path = device.create_upload_path(os.path.abspath('/<storage>'), mi, 'x.bookmark', create_dirs=False)
-				path_map[id] = a_path
+				path_map[id] = dict(path=a_path, fmts=get_formats(id))
 			return path_map
 		device = self.device_manager.device
@ -976,16 +979,24 @@ class Main(MainWindow, Ui_MainWindow, DeviceGUI):
 		from calibre.gui2.dialogs.progress import ProgressDialog
 		class Updater(QThread):
-			def __init__(self, parent, db, annotation_map):
+
            update_progress = pyqtSignal(int)
            update_done     = pyqtSignal()
 			def __init__(self, parent, db, annotation_map, done_callback):
 				QThread.__init__(self, parent)
 				self.db = db
 				self.pd = ProgressDialog(_('Merging user annotations into database'), '',
-                			             0, len(job.result), parent=parent)
+                        0, len(job.result), parent=parent)
 				self.am = annotation_map
                self.done_callback = done_callback
 				self.connect(self.pd, SIGNAL('canceled()'), self.canceled)
 				self.pd.setModal(True)
 				self.pd.show()
                self.update_progress.connect(self.pd.set_value,
                        type=Qt.QueuedConnection)
                self.update_done.connect(self.pd.hide, type=Qt.QueuedConnection)
 			def generate_annotation_html(self, bookmark):
 				# Returns <div class="user_annotations"> ... </div>
@ -1003,8 +1014,7 @@ class Main(MainWindow, Ui_MainWindow, DeviceGUI):
 				spanTag['style'] = 'font-weight:bold'
 				spanTag.insert(0,NavigableString("%s<br />Last Page Read: Location %d (%d%%)" % \
 								(strftime(u'%x', timestamp.timetuple()),
-								 last_read_location/150 + 1,
+                                last_read_location, percent_read)))
 								 percent_read)))
 				divTag.insert(dtc, spanTag)
 				dtc += 1
@ -1020,15 +1030,15 @@ class Main(MainWindow, Ui_MainWindow, DeviceGUI):
 					for location in sorted(user_notes):
 						if user_notes[location]['text']:
 							annotations.append('<b>Location %d &bull; %s</b><br />%s<br />' % \
-												(location/150 + 1,
+												(user_notes[location]['displayed_location'],
 												 user_notes[location]['type'],
-												 user_notes[location]['text'] if \
+                                                 user_notes[location]['text'] if \
-													user_notes[location]['type'] == 'Note' else \
+												    user_notes[location]['type'] == 'Note' else \
 													'<i>%s</i>' % user_notes[location]['text']))
 						else:
 							annotations.append('<b>Location %d &bull; %s</b><br />' % \
-												(location/150 + 1,
+												(user_notes[location]['displayed_location'],
-												 user_notes[location]['type']))
+                                                 user_notes[location]['type']))
 					for annotation in annotations:
 						divTag.insert(dtc, annotation)
@ -1040,33 +1050,33 @@ class Main(MainWindow, Ui_MainWindow, DeviceGUI):
 			def canceled(self):
 				self.pd.hide()
-			def start(self):
+			def run(self):
 				QApplication.processEvents()
 				for (i, id) in enumerate(self.am):
 					bm = Device.UserAnnotation(self.am[id][0],self.am[id][1])
 					user_notes_soup = self.generate_annotation_html(bm.bookmark)
 					mi = self.db.get_metadata(id, index_is_id=True)
 					a_offset = mi.comments.find('<div class="user_annotations">')
 					ad_offset = mi.comments.find('<hr class="annotations_divider" />')
 					if a_offset >= 0:
 						mi.comments = mi.comments[:a_offset]
 					if ad_offset >= 0:
 						mi.comments = mi.comments[:ad_offset]
 					if mi.comments:
-						hrTag = Tag(user_notes_soup,'hr')
+						a_offset = mi.comments.find('<div class="user_annotations">')
-						hrTag['class'] = 'annotations_divider'
+						ad_offset = mi.comments.find('<hr class="annotations_divider" />')
 						user_notes_soup.insert(0,hrTag)
-					mi.comments += user_notes_soup.prettify()
+						if a_offset >= 0:
 							mi.comments = mi.comments[:a_offset]
 						if ad_offset >= 0:
 							mi.comments = mi.comments[:ad_offset]
 						if mi.comments:
 							hrTag = Tag(user_notes_soup,'hr')
 							hrTag['class'] = 'annotations_divider'
 							user_notes_soup.insert(0,hrTag)
 						mi.comments += user_notes_soup.prettify()
 					else:
 						mi.comments = unicode(user_notes_soup.prettify())
 					# Update library comments
 					self.db.set_comment(id, mi.comments)
-
+                    self.update_progress.emit(i)
-					self.pd.set_value(i)
+                self.update_done.emit()
-				self.pd.hide()
+                self.done_callback(self.am.keys())
 				calibre_send_message()
        if not job.result: return
@ -1076,9 +1086,9 @@ class Main(MainWindow, Ui_MainWindow, DeviceGUI):
                    show=True)
        db = self.library_view.model().db
-        self.__annotation_updater = Updater(self, db, job.result)
+        self.__annotation_updater = Updater(self, db, job.result,
                Dispatcher(self.library_view.model().refresh_ids))
        self.__annotation_updater.start()
        return
    ############################################################################
--- a/src/calibre/library/catalog.py
+++ b/src/calibre/library/catalog.py
@ -1175,14 +1175,18 @@ class EPUB_MOBI(CatalogPlugin):
            Preferences|Add/Save|Sending to device, not a customized one specified in
            the Kindle plugin
            '''
            from cStringIO import StringIO
            from struct import unpack
            from calibre.devices.usbms.device import Device
            from calibre.devices.kindle.driver import Bookmark
            from calibre.ebooks.metadata import MetaInformation
-            from calibre.ebooks.metadata.mobi import StreamSlicer
+
            MBP_FORMATS = [u'azw', u'mobi', u'prc', u'txt']
            TAN_FORMATS = [u'tpz', u'azw1']
            mbp_formats = set()
            for fmt in MBP_FORMATS:
                mbp_formats.add(fmt)
            tan_formats = set()
            for fmt in TAN_FORMATS:
                tan_formats.add(fmt)
            class BookmarkDevice(Device):
                def initialize(self, save_template):
@ -1191,6 +1195,40 @@ class EPUB_MOBI(CatalogPlugin):
                def save_template(self):
                    return self._save_template
            def resolve_bookmark_paths(storage, path_map):
                pop_list = []
                book_ext = {}
                for id in path_map:
                    file_fmts = set()
                    for fmt in path_map[id]['fmts']:
                        file_fmts.add(fmt)
                    bookmark_extension = None
                    if file_fmts.intersection(mbp_formats):
                        book_extension = list(file_fmts.intersection(mbp_formats))[0]
                        bookmark_extension = 'mbp'
                    elif file_fmts.intersection(tan_formats):
                        book_extension = list(file_fmts.intersection(tan_formats))[0]
                        bookmark_extension = 'tan'
                    if bookmark_extension:
                        for vol in storage:
                            bkmk_path = path_map[id]['path'].replace(os.path.abspath('/<storage>'),vol)
                            bkmk_path = bkmk_path.replace('bookmark',bookmark_extension)
                            print "looking for %s" % bkmk_path
                            if os.path.exists(bkmk_path):
                                path_map[id] = bkmk_path
                                book_ext[id] = book_extension
                                break
                        else:
                            pop_list.append(id)
                    else:
                        pop_list.append(id)
                # Remove non-existent bookmark templates
                for id in pop_list:
                    path_map.pop(id)
                return path_map, book_ext
            if self.generateRecentlyRead:
                self.opts.log.info("     Collecting Kindle bookmarks matching catalog entries")
@ -1199,26 +1237,32 @@ class EPUB_MOBI(CatalogPlugin):
                bookmarks = {}
                for book in self.booksByTitle:
-                    original_title = book['title'][book['title'].find(':') + 2:] if book['series'] \
+                    if 'formats' in book:
-                               else book['title']
+                        path_map = {}
-                    myMeta = MetaInformation(original_title,
+                        id = book['id']
-                                             authors=book['authors'])
+                        original_title = book['title'][book['title'].find(':') + 2:] if book['series'] \
-                    myMeta.author_sort = book['author_sort']
+                                   else book['title']
-                    bm_found = False
+                        myMeta = MetaInformation(original_title,
-                    for vol in self.opts.connected_device['storage']:
+                                                 authors=book['authors'])
-                        bm_path = d.create_upload_path(vol, myMeta, 'x.mbp', create_dirs=False)
+                        myMeta.author_sort = book['author_sort']
-                        if os.path.exists(bm_path):
+                        a_path = d.create_upload_path('/<storage>', myMeta, 'x.bookmark', create_dirs=False)
-                            myBookmark = Bookmark(bm_path, book['formats'], book['id'])
+                        path_map[id] = dict(path=a_path, fmts=[x.rpartition('.')[2] for x in book['formats']])
                        path_map, book_ext = resolve_bookmark_paths(self.opts.connected_device['storage'], path_map)
                        if path_map:
                            bookmark_ext = path_map[id].rpartition('.')[2]
                            myBookmark = Bookmark(path_map[id], id, book_ext[id], bookmark_ext)
                            print "book: %s\nlast_read_location: %d\nlength: %d" % (book['title'],
                                                                                    myBookmark.last_read_location,
                                                                                    myBookmark.book_length)
                            if myBookmark.book_length:
                                book['percent_read'] = float(100*myBookmark.last_read_location / myBookmark.book_length)
                                dots = int((book['percent_read'] + 5)/10)
                                dot_string = self.READ_PROGRESS_SYMBOL * dots
                                empty_dots = self.UNREAD_PROGRESS_SYMBOL * (10 - dots)
                                book['reading_progress'] = '%s%s' % (dot_string,empty_dots)
-                                bookmarks[book['id']] = ((myBookmark,book))
+                                bookmarks[id] = ((myBookmark,book))
-                                bm_found = True
+
                        if bm_found:
                            break
                self.bookmarked_books = bookmarks
            else:
                self.bookmarked_books = {}
--- a/src/calibre/library/server.py
+++ b/src/calibre/library/server.py
@ -20,10 +20,10 @@ try:
 except ImportError:
    import Image as PILImage
-from calibre.constants import __version__, __appname__
+from calibre.constants import __version__, __appname__, iswindows
 from calibre.utils.genshi.template import MarkupTemplate
 from calibre import fit_image, guess_type, prepare_string_for_xml, \
-        strftime as _strftime, prints
+        strftime as _strftime
 from calibre.library import server_config as config
 from calibre.library.database2 import LibraryDatabase2, FIELD_MAP
 from calibre.utils.config import config_dir
@ -423,10 +423,8 @@ class LibraryServer(object):
                             self.opts.port, {'path':'/stanza'})
            except:
                import traceback
-                print 'Failed to start BonJour:'
+                cherrypy.log.error('Failed to start BonJour:')
-                cherrypy.log('Failed to start BonJour:')
+                cherrypy.log.error(traceback.format_exc())
                cherrypy.log(traceback.format_exc())
                traceback.print_exc()
            cherrypy.engine.block()
        except Exception, e:
            self.exception = e
@ -436,10 +434,8 @@ class LibraryServer(object):
                stop_zeroconf()
            except:
                import traceback
-                print 'Failed to stop BonJour:'
+                cherrypy.log.error('Failed to stop BonJour:')
-                cherrypy.log('Failed to stop BonJour:')
+                cherrypy.log.error(traceback.format_exc())
                cherrypy.log(traceback.format_exc())
                traceback.print_exc()
    def exit(self):
        cherrypy.engine.exit()
@ -472,7 +468,8 @@ class LibraryServer(object):
            return of.getvalue()
        except Exception, err:
            import traceback
-            traceback.print_exc()
+            cherrypy.log.error('Failed to generate cover:')
            cherrypy.log.error(traceback.print_exc())
            raise cherrypy.HTTPError(404, 'Failed to generate cover: %s'%err)
    def get_format(self, id, format):
@ -813,7 +810,7 @@ class LibraryServer(object):
        # A better search would be great
        want_mobile = self.MOBILE_UA.search(ua) is not None
        if self.opts.develop and not want_mobile:
-            prints('User agent:', ua)
+            cherrypy.log('User agent: '+ua)
        if want_opds:
            return self.stanza(search=kwargs.get('search', None), sortby=kwargs.get('sortby',None), authorid=kwargs.get('authorid',None),
@ -882,12 +879,55 @@ def option_parser():
    parser = config().option_parser('%prog '+ _('[options]\n\nStart the calibre content server.'))
    parser.add_option('--with-library', default=None,
            help=_('Path to the library folder to serve with the content server'))
    parser.add_option('--pidfile', default=None,
            help=_('Write process PID to the specified file'))
    parser.add_option('--daemonize', default=False, action='store_true',
            help='Run process in background as a daemon. No effect on windows.')
    return parser
 def daemonize(stdin='/dev/null', stdout='/dev/null', stderr='/dev/null'):
    try:
        pid = os.fork()
        if pid > 0:
            # exit first parent
            sys.exit(0)
    except OSError, e:
        print >>sys.stderr, "fork #1 failed: %d (%s)" % (e.errno, e.strerror)
        sys.exit(1)
    # decouple from parent environment
    os.chdir("/")
    os.setsid()
    os.umask(0)
    # do second fork
    try:
        pid = os.fork()
        if pid > 0:
            # exit from second parent
            sys.exit(0)
    except OSError, e:
        print >>sys.stderr, "fork #2 failed: %d (%s)" % (e.errno, e.strerror)
        sys.exit(1)
    # Redirect standard file descriptors.
    si = file(stdin, 'r')
    so = file(stdout, 'a+')
    se = file(stderr, 'a+', 0)
    os.dup2(si.fileno(), sys.stdin.fileno())
    os.dup2(so.fileno(), sys.stdout.fileno())
    os.dup2(se.fileno(), sys.stderr.fileno())
 def main(args=sys.argv):
    parser = option_parser()
    opts, args = parser.parse_args(args)
    if opts.daemonize and not iswindows:
        daemonize()
    if opts.pidfile is not None:
        with open(opts.pidfile, 'wb') as f:
            f.write(str(os.getpid()))
    cherrypy.log.screen = True
    from calibre.utils.config import prefs
    if opts.with_library is None:
--- a/src/calibre/utils/network.py
+++ b/src/calibre/utils/network.py
@ -0,0 +1,54 @@
 #!/usr/bin/env python
 # vim:fileencoding=UTF-8:ts=4:sw=4:sta:et:sts=4:ai
 from __future__ import with_statement
 __license__   = 'GPL v3'
 __copyright__ = '2010, Kovid Goyal <kovid@kovidgoyal.net>'
 __docformat__ = 'restructuredtext en'
 from calibre.constants import iswindows, islinux, isfreebsd
 class LinuxNetworkStatus(object):
    def __init__(self):
        try:
            import dbus
            bus = dbus.SystemBus()
            proxy = bus.get_object("org.freedesktop.NetworkManager",
                        "/org/freedesktop/NetworkManager")
            self.manager = dbus.Interface(proxy, "org.freedesktop.DBus.Properties")
        except:
            self.manager = None
    def __call__(self):
        if self.manager is None:
            return True
        try:
            connections = self.manager.Get("org.freedesktop.NetworkManager",
                        "ActiveConnections")
            return len(connections) > 0
        except:
            return True
 class WindowsNetworkStatus(object):
    def __init__(self):
        from calibre.constants import plugins
        self.winutil = plugins['winutil'][0]
    def __call__(self):
        if self.winutil is None:
            return True
        return self.winutil.internet_connected()
 class DummyNetworkStatus(object):
    def __call__(self):
        return True
 _network_status = WindowsNetworkStatus() if iswindows else \
        LinuxNetworkStatus() if (islinux or isfreebsd) else \
        DummyNetworkStatus()
 def internet_connected():
    return _network_status()
--- a/src/calibre/utils/windows/winutil.c
+++ b/src/calibre/utils/windows/winutil.c
@ -51,11 +51,15 @@ wherever possible in this module.
    script being run. So to replace sys.argv, you should use
    `if len(sys.argv) > 1: sys.argv[1:] = winutil.argv()[1-len(sys.argv):]`
 .. function:: internet_connected() -> Return True if there is an active
   internet connection.
 */
 #define UNICODE
 #include <Windows.h>
 #include <Wininet.h>
 #include <Python.h>
 #include <structseq.h>
 #include <timefuncs.h>
@ -771,6 +775,15 @@ gettmarg(PyObject *args, struct tm *p)
 	return 1;
 }
 static PyObject *
 winutil_internet_connected(PyObject *self, PyObject *args) {
    DWORD flags;
    BOOL ans = InternetGetConnectedState(&flags, 0);
    if (ans) Py_RETURN_TRUE;
    Py_RETURN_FALSE;
 }
 static PyObject *
 winutil_strftime(PyObject *self, PyObject *args)
 {
@ -919,6 +932,10 @@ be a unicode string. Returns unicode strings."
 			"eject_drive(drive_letter)\n\nEject a drive. Raises an exception on failure."
 	},
    {"internet_connected", winutil_internet_connected, METH_VARARGS,
        "internet_connected()\n\nReturn True if there is an active internet connection"
    },
    {NULL, NULL, 0, NULL}
 };