merging 0.6.42

James Ralston 2010-02-21 10:37:59 -08:00
commit ba051d2480
47 changed files with 17448 additions and 7002 deletions

View File

@ -4,6 +4,80 @@
# for important features/bug fixes.
# Also, each release can have new and improved recipes.
- version: 0.6.42
date: 2010-02-20
bug fixes:
- title: "Fix regression that broke catalog generation from the Graphical User Interface in 0.6.41"
- title: "Fix right edge of comics like Dilbert and xkcd getting cut off on the SONY reader. More generally, take page margins into account when rescaling images to fit in the selected output profile."
- version: 0.6.41
date: 2010-02-19
new features:
- title: "Make calibre timezone aware. This required lots of internal changes, so I may have broken something"
type: major
- title: "Allow editing of metadata in DRMed MOBI files"
type: major
- title: "ebook-convert: Allow passing URLs as argument to --cover"
tickets: [4909]
- title: "OS X/linux driver for EB511"
- title: "ebook-meta: Allow changing of published date"
- title: "Make replacing of files in ZIP archives faster and (hopefully) more robust"
- title: "Speed optimization for viewing large EPUB files"
- title: "Speed up parsing of OPF files"
tickets: [4908]
bug fixes:
- title: "Fix drag and drop of multiple books to OS X dock icon"
tickets: [4849]
- title: "MOBI Output: Encode titles as UTF-8 in the PalmDoc header as well as the EXTH header, since there are apparently MOBI readers that use the title from the PalmDoc header in preference to the title from the EXTH header."
- title: "MOBI Output: Remove soft hyphens as the Kindle doesn't support them."
tickets: [4887]
- title: "Fix Boox main mem and SD card swapped on windows"
- title: "Fix sending large ebook fiels to devices"
tickets: [4896]
- title: "EPUB Output: Strip invalid anchors from NCX TOC as Adobe Digital Editions cries when it sees one"
tickets: [4907]
- title: "EPUB metadata: Don't set title_sort as a file_as attribute, as the brain-dead OPF spec doesn't allow this"
- title: "Make publishing the content server via mDNS a little more robust"
- title: "Content server: Use new exact matching for greater precision when generating OPDS catalogs. Also fix regression that broke rowsing by Tags on Stanza."
- title: "Proper fix for breakage in LRF viewer caused by API change in QGraphicsItem in Qt 4.6"
new recipes:
- title: Various Polish news sources
author: Tomasz Dlugosz
- title: Que Leer, Wired UK
author: Darko Miletic
- title: Kathimerini and Ta Nea
author: Pan
- title: Winter Olympics
author: Starson17
improved recipes:
- Wired Magazine
- version: 0.6.40
date: 2010-02-12

Binary file not shown (new image, 647 B).

View File

@ -0,0 +1,60 @@
#!/usr/bin/env python
__license__ = 'GPL v3'
__author__ = 'Mori'
__version__ = 'v. 0.5'
'''
di.com.pl
'''
from calibre.web.feeds.news import BasicNewsRecipe
import re
class DziennikInternautowRecipe(BasicNewsRecipe):
__author__ = 'Mori'
language = 'pl'
title = u'Dziennik Internautow'
publisher = u'Dziennik Internaut\xf3w Sp. z o.o.'
description = u'Internet w \u017cyciu i biznesie. Porady, wywiady, interwencje, bezpiecze\u0144stwo w Sieci, technologia.'
max_articles_per_feed = 100
oldest_article = 7
cover_url = 'http://di.com.pl/pic/logo_di_norm.gif'
no_stylesheets = True
remove_javascript = True
encoding = 'utf-8'
extra_css = '''
.fotodesc{font-size: 75%;}
.pub_data{font-size: 75%;}
.fotonews{clear: both; padding-top: 10px; padding-bottom: 10px;}
#pub_foto{font-size: 75%; float: left; padding-right: 10px;}
'''
feeds = [
(u'Dziennik Internautów', u'http://feeds.feedburner.com/glowny-di')
]
keep_only_tags = [
dict(name = 'div', attrs = {'id' : 'pub_head'}),
dict(name = 'div', attrs = {'id' : 'pub_content'})
]
remove_tags = [
dict(name = 'div', attrs = {'class' : 'poradniki_context'}),
dict(name = 'div', attrs = {'class' : 'uniBox'}),
dict(name = 'object', attrs = {}),
dict(name = 'h3', attrs = {})
]
preprocess_regexps = [
(re.compile(i[0], re.IGNORECASE | re.DOTALL), i[1]) for i in
[
(r', <a href="http://di.com.pl/komentarze,.*?</div>', lambda match: '</div>'),
(r'<div class="fotonews".*?">', lambda match: '<div class="fotonews">'),
(r'http://di.com.pl/pic/photo/mini/', lambda match: 'http://di.com.pl/pic/photo/oryginal/'),
(r'\s*</', lambda match: '</'),
]
]
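
The preprocess_regexps list above is the standard BasicNewsRecipe hook: each (compiled pattern, substitution callable) pair is applied to the downloaded page HTML before it is parsed. A minimal standalone sketch of that substitution step; the sample HTML and patterns below are illustrative, not taken from di.com.pl:

import re

# (compiled regex, callable) pairs in the same form the recipe above uses.
preprocess_regexps = [
    (re.compile(r'<div class="fotonews".*?">', re.IGNORECASE | re.DOTALL),
     lambda match: '<div class="fotonews">'),
    (re.compile(r'\s*</', re.IGNORECASE | re.DOTALL),
     lambda match: '</'),
]

def apply_preprocess_regexps(raw_html, regexps):
    # Each callable receives the match object and returns the replacement text.
    for pattern, repl in regexps:
        raw_html = pattern.sub(repl, raw_html)
    return raw_html

sample = '<div class="fotonews" style="width: 200px;">photo   </div>'
print(apply_preprocess_regexps(sample, preprocess_regexps))
# -> <div class="fotonews">photo</div>
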

View File

@ -0,0 +1,49 @@
#!/usr/bin/env python
__license__ = 'GPL v3'
__author__ = 'Mori'
__version__ = 'v. 0.1'
'''
blog.eclicto.pl
'''
from calibre.web.feeds.news import BasicNewsRecipe
import re
class BlogeClictoRecipe(BasicNewsRecipe):
__author__ = 'Mori'
language = 'pl'
title = u'Blog eClicto'
publisher = u'Blog eClicto'
description = u'Blog o e-papierze i e-bookach'
max_articles_per_feed = 100
cover_url = 'http://blog.eclicto.pl/wordpress/wp-content/themes/blog_eclicto/g/logo.gif'
no_stylesheets = True
remove_javascript = True
encoding = 'utf-8'
extra_css = '''
img{float: left; padding-right: 10px; padding-bottom: 5px;}
'''
feeds = [
(u'Blog eClicto', u'http://blog.eclicto.pl/feed/')
]
remove_tags = [
dict(name = 'span', attrs = {'id' : 'tags'})
]
remove_tags_after = [
dict(name = 'div', attrs = {'class' : 'post'})
]
preprocess_regexps = [
(re.compile(i[0], re.IGNORECASE | re.DOTALL), i[1]) for i in
[
(r'\s*</', lambda match: '</'),
]
]

View File

@ -1,6 +1,6 @@
#!/usr/bin/env python
__license__ = 'GPL v2'
__license__ = 'GPL v3'
__copyright__ = u'2010, Tomasz Dlugosz <tomek3d@gmail.com>'
'''
eksiazki.org
@ -10,17 +10,17 @@ from calibre.web.feeds.news import BasicNewsRecipe
class eksiazki(BasicNewsRecipe):
title = u'eksiazki.org'
desciption = u'Twoje centrum wiedzy o epapierze i ebookach'
title = u'eKsiazki.org'
description = u'Twoje centrum wiedzy o ePapierze i eBookach'
language = 'pl'
__author__ = u'Tomasz D\u0142ugosz'
no_stylesheets = True
remove_javascript = True
feeds = [(u'wpisy', u'http://www.eksiazki.org/feed/')]
feeds = [(u'eKsiazki.org', u'http://www.eksiazki.org/feed/')]
keep_only_tags = [dict(name='div', attrs={'id':'content-body'})]
remove_tags = [
dict(name='span', attrs={'class':'nr_comm'}),
dict(name='div', attrs={'id':'tabsContainer'}),
dict(name='span', attrs={'class':'nr_comm'}),
dict(name='div', attrs={'id':'tabsContainer'}),
dict(name='div', attrs={'class':'next_previous_links'})]

View File

@ -0,0 +1,38 @@
#!/usr/bin/env python
__license__ = 'GPL v3'
__copyright__ = u'2010, Tomasz Dlugosz <tomek3d@gmail.com>'
'''
fakty.interia.pl
'''
from calibre.web.feeds.news import BasicNewsRecipe
class InteriaFakty(BasicNewsRecipe):
title = u'Interia.pl - Fakty'
language = 'pl'
oldest_article = 7
__author__ = u'Tomasz D\u0142ugosz'
simultaneous_downloads = 2
no_stylesheets = True
remove_javascript = True
max_articles_per_feed = 100
feeds = [(u'Kraj', u'http://kanaly.rss.interia.pl/kraj.xml'),
(u'\u015awiat', u'http://kanaly.rss.interia.pl/swiat.xml'),
(u'Wiadomo\u015bci dnia', u'http://kanaly.rss.interia.pl/fakty.xml'),
(u'Przegl\u0105d prasy', u'http://kanaly.rss.interia.pl/przeglad_prasy.xml'),
(u'Wywiady', u'http://kanaly.rss.interia.pl/wywiady.xml'),
(u'Ciekawostki', u'http://kanaly.rss.interia.pl/ciekawostki.xml')]
keep_only_tags = [dict(name='div', attrs={'id':'article'})]
remove_tags = [
dict(name='div', attrs={'class':'box fontSizeSwitch'}),
dict(name='div', attrs={'class':'clear'}),
dict(name='div', attrs={'class':'embed embedLeft articleEmbedArticleList articleEmbedArticleListTitle'}),
dict(name='span', attrs={'class':'keywords'})]
extra_css = '''
h2 { font-size: 1.2em; }
'''

View File

@ -0,0 +1,71 @@
#!/usr/bin/env python
__license__ = 'GPL v3'
__copyright__ = u'2010, Tomasz Dlugosz <tomek3d@gmail.com>'
'''
sport.interia.pl
'''
import re
from calibre.web.feeds.news import BasicNewsRecipe
class InteriaSport(BasicNewsRecipe):
title = u'Interia.pl - Sport'
language = 'pl'
oldest_article = 7
__author__ = u'Tomasz D\u0142ugosz'
simultaneous_downloads = 3
no_stylesheets = True
remove_javascript = True
max_articles_per_feed = 100
feeds = [(u'Wydarzenia sportowe', u'http://kanaly.rss.interia.pl/sport.xml'),
(u'Pi\u0142ka no\u017cna', u'http://kanaly.rss.interia.pl/pilka_nozna.xml'),
(u'Siatk\xf3wka', u'http://kanaly.rss.interia.pl/siatkowka.xml'),
(u'Koszyk\xf3wka', u'http://kanaly.rss.interia.pl/koszykowka.xml'),
(u'NBA', u'http://kanaly.rss.interia.pl/nba.xml'),
(u'Kolarstwo', u'http://kanaly.rss.interia.pl/kolarstwo.xml'),
(u'\u017bu\u017cel', u'http://kanaly.rss.interia.pl/zuzel.xml'),
(u'Tenis', u'http://kanaly.rss.interia.pl/tenis.xml')]
keep_only_tags = [dict(name='div', attrs={'id':'article'})]
remove_tags = [dict(name='div', attrs={'class':'object gallery'})]
extra_css = '''
.articleDate {
font-size: 0.5em;
color: black;
}
.articleFoto {
display: block;
font-family: sans;
font-size: 0.5em;
text-indent: 0;
color: black;
}
.articleText {
display: block;
margin-bottom: 1em;
margin-left: 0;
margin-right: 0;
margin-top: 1em;
color: black;
}
.articleLead {
font-size: 1.2em;
}
'''
preprocess_regexps = [
(re.compile(i[0], re.IGNORECASE | re.DOTALL), i[1]) for i in
[
(r'<p><a href.*?</a></p>', lambda match: ''),
# FIXME
#(r'(<div id="newsAddContent">)(.*?)(<a href=".*">)(.*?)(</a>)', lambda match: '\1\2\4'),
(r'<p>(<i>)?<b>(ZOBACZ|CZYTAJ) T.*?</div>', lambda match: '</div>')
]
]

View File

@ -0,0 +1,43 @@
#!/usr/bin/env python
__license__ = 'GPL v3'
__author__ = 'Mori'
__version__ = 'v. 0.1'
'''
olgierd.bblog.pl
'''
from calibre.web.feeds.news import BasicNewsRecipe
class LegeArtisRecipe(BasicNewsRecipe):
__author__ = 'Mori'
language = 'pl'
title = u'Lege Artis'
publisher = u'Olgierd Rudak'
description = u'Wszystko, co chcieliby\u015bcie wiedzie\u0107 o prawie, ale wstydzicie si\u0119 zapyta\u0107'
max_articles_per_feed = 100
no_stylesheets = True
remove_javascript = True
extra_css = '''
img{clear: both;}
'''
feeds = [
(u'Lege Artis', u'http://olgierd.bblog.pl/rss/rss20.xml')
]
keep_only_tags = [
dict(name = 'div', attrs = {'class' : 'post_title'}),
dict(name = 'div', attrs = {'class' : 'post_date'}),
dict(name = 'div', attrs = {'class' : 'post_content'})
]
remove_tags = [
dict(name = 'div', attrs = {'id' : 'bb_tools'}),
dict(name = 'div', attrs = {'class' : 'post_comments'}),
dict(name = 'object', attrs = {})
]

View File

@ -0,0 +1,49 @@
#!/usr/bin/env python
__license__ = 'GPL v3'
__copyright__ = u'2010, Tomasz Dlugosz <tomek3d@gmail.com>'
'''
legitymizm.org
'''
from calibre.web.feeds.news import BasicNewsRecipe
class Legitymizm(BasicNewsRecipe):
title = u'Organizacja Monarchist\xf3w Polskich'
language = 'pl'
oldest_article = 7
__author__ = u'Tomasz D\u0142ugosz'
max_articles_per_feed = 100
cover_url = 'http://www.legitymizm.org/img_omp/logo.gif'
no_stylesheets = True
feeds = [(u'Aktualno\u015bci i publicystyka', u'http://www.legitymizm.org/rss.php')]
keep_only_tags = [dict(name='div', attrs={'id':'szeroka_kolumna'})]
remove_tags = [dict(name = 'div', attrs = {'class' : 'koniec_tresci_wlasciwej'}),
dict(name = 'div', attrs = {'class' : 'return'})]
extra_css = '''
body { font-family: Georgia, 'Times New Roman', Times, serif; }
h1 { color: #898981; font-weight: normal; font-size: 26px; letter-spacing: -1px; line-height: 23px; text-align: left; }
h2, h3 { font-weight: normal; font-size: 20px; line-height: 23px; letter-spacing: -1px; margin: 0 0 3px 0; text-align: left; }
#szeroka_kolumna { float: left; line-height: 20px; }
#szeroka_kolumna ul.wykaz { list-style-type: none; margin: 0 0 1.2em 0; padding: 0; }
#szeroka_kolumna ul.wykaz li.wykaz_2 { font-weight: bold; margin: 0.6em 0 0 0; }
#szeroka_kolumna ul.wykaz a { text-decoration: none; }
#szeroka_kolumna ul.wykaz li.wykaz_1, #szeroka_kolumna ul.wykaz li.wykaz_2 ul li { list-style-type: square; color: #898981; text-transform: none; font-weight: normal; padding: 0; }
#szeroka_kolumna ul.wykaz li.wykaz_1 { margin: 0 0 0 1.3em; }
#szeroka_kolumna ul.wykaz li.wykaz_2 ul { margin: 0; padding: 0 0 0 1.3em; }
#szeroka_kolumna h3.autor { background-color: #898981; color: #f9f9f8; margin: -25px 0px 30px 0; text-align: left; padding: 0 0 0 2px; }
.tresc_wlasciwa { border-top: 1px solid #898981; padding: 30px 0px 0px 0px; position: relative; }
#cytat { font-size: 11px; line-height: 19px; font-style: italic; text-align: justify; }
#cytat img { width: 100px; height: 105px; float: right; margin: 3px 0 0 10px; }
.duzy_cytat { padding: 20px 20px 10px 20px; margin: 0 0 1.2em 0; }
#szeroka_kolumna img, #szeroka_kolumna object { padding: 3px; border: 1px solid #898981; }
#szeroka_kolumna img.ilustracja { margin: 0px 10px 0 0; float: left; }
p { margin: 0 0 1.2em 0; }
#cytat p.sentencja { margin: 0; }
#cytat p.sentencja:first-letter { font-size: 44px; line-height: 33px; margin: 0 2px 0 0; font-style: normal; float: left; display: block; }
p.autor { text-transform: uppercase; color: #898981; font-style: normal; text-align: left; }
'''

View File

@ -0,0 +1,26 @@
#!/usr/bin/env python
__license__ = 'GPL v3'
__copyright__ = '2010, Tomasz Dlugosz <tomek3d@gmail.com>'
'''
michalkiewicz.pl
'''
from calibre.web.feeds.news import BasicNewsRecipe
#
class michalkiewicz(BasicNewsRecipe):
title = u'Stanis\u0142aw Michalkiewicz'
description = u'Strona autorska * felietony * artyku\u0142y * komentarze'
__author__ = u'Tomasz D\u0142ugosz'
language = 'pl'
oldest_article = 7
max_articles_per_feed = 100
no_stylesheets = True
keep_only_tags = [dict(name='div', attrs={'class':'modul_srodek'})]
remove_tags = [dict(name='ul', attrs={'class':'menu'})]
feeds = [(u'Teksty', u'http://www.michalkiewicz.pl/rss.xml')]

View File

@ -0,0 +1,35 @@
#!/usr/bin/env python
__license__ = 'GPL v3'
__copyright__ = '2010, Tomasz Dlugosz <tomek3d@gmail.com>'
'''
nczas.com
'''
from calibre.web.feeds.news import BasicNewsRecipe
#
class NCzas(BasicNewsRecipe):
title = u'Najwy\u017cszy Czas!'
description = u'Najwy\u017cszy Czas!\nwydanie internetowe'
__author__ = u'Tomasz D\u0142ugosz'
language = 'pl'
oldest_article = 7
max_articles_per_feed = 100
no_stylesheets = True
cover_url = 'http://nczas.com/wp-content/themes/default/grafika/logo.png'
keep_only_tags = [dict(name='div', attrs={'class':'trescartykulu'})]
feeds = [(u'Najwy\u017cszy Czas!', u'http://nczas.com/feed/')]
def postprocess_html(self, soup, first):
for tag in soup.findAll(name= 'img', alt=""):
tag.extract()
for item in soup.findAll(align = "right"):
del item['align']
return soup

View File

@ -0,0 +1,56 @@
__license__ = 'GPL v3'
__copyright__ = '2010, Darko Miletic <darko.miletic at gmail.com>'
'''
www.que-leer.com
'''
import re
from calibre.web.feeds.news import BasicNewsRecipe
class QueLeer(BasicNewsRecipe):
title = 'Que Leer'
__author__ = 'Darko Miletic'
description = 'Libros, Novedades en libros, Criticas, Noticias libro'
publisher = 'MC Ediciones, S.A.'
category = 'news, books, criticas, libros'
oldest_article = 7
max_articles_per_feed = 200
no_stylesheets = True
encoding = 'utf-8'
use_embedded_content = False
language = 'es'
remove_empty_feeds = True
masthead_url = 'http://www.que-leer.com/wp-content/themes/queleer/images/backgrounds/que-leer.jpg'
extra_css = ' body{font-family: Arial,sans-serif } img{margin-bottom: 0.4em} '
conversion_options = {
'comment' : description
, 'tags' : category
, 'publisher' : publisher
, 'language' : language
}
preprocess_regexps = [(re.compile(r'<h2 class="izq">.*?</body>', re.DOTALL|re.IGNORECASE),lambda match: '')]
remove_tags = [
dict(attrs={'class':['post-ratings','post-ratings-loading','sociable','toc-anchor']})
,dict(name=['object','embed','iframe','link'])
,dict(attrs={'id':'left'})
]
remove_tags_after = dict(attrs={'class':'sociable'})
remove_attributes = ['width','height']
keep_only_tags = [dict(attrs={'class':'post'})]
feeds = [(u'Articulos', u'http://www.que-leer.com/feed')]
def preprocess_html(self, soup):
for item in soup.findAll(style=True):
del item['style']
url = 'http://www.que-leer.com/comprar-libros-tienda-que-leer/libros-recomendados'
fitem = soup.find('a',href=url)
if fitem:
par = fitem.parent
par.extract()
return self.adeify_images(soup)

View File

@ -0,0 +1,74 @@
__license__ = 'GPL v3'
__copyright__ = '2010, Darko Miletic <darko.miletic at gmail.com>'
'''
www.wired.co.uk
'''
from calibre import strftime
from calibre.web.feeds.news import BasicNewsRecipe
class Wired_UK(BasicNewsRecipe):
title = 'Wired Magazine - UK edition'
__author__ = 'Darko Miletic'
description = 'Gaming news'
publisher = 'Conde Nast Digital'
category = 'news, games, IT, gadgets'
oldest_article = 32
max_articles_per_feed = 100
no_stylesheets = True
encoding = 'utf-8'
use_embedded_content = False
masthead_url = 'http://www.wired.co.uk/_/media/wired-logo_UK.gif'
language = 'en_GB'
extra_css = ' body{font-family: Palatino,"Palatino Linotype","Times New Roman",Times,serif} img{margin-bottom: 0.8em } .img-descr{font-family: Tahoma,Arial,Helvetica,sans-serif; font-size: 0.6875em; display: block} '
index = 'http://www.wired.co.uk/wired-magazine.aspx'
conversion_options = {
'comment' : description
, 'tags' : category
, 'publisher' : publisher
, 'language' : language
}
keep_only_tags = [dict(name='div', attrs={'class':'article-box'})]
remove_tags = [
dict(name=['object','embed','iframe','link'])
,dict(attrs={'class':['opts','comment','stories']})
]
remove_tags_after = dict(name='div',attrs={'class':'stories'})
remove_attributes = ['height','width']
def parse_index(self):
totalfeeds = []
soup = self.index_to_soup(self.index)
maincontent = soup.find('div',attrs={'class':'main-content'})
mfeed = []
if maincontent:
st = maincontent.find(attrs={'class':'most-wired-box'})
if st:
for itt in st.findAll('a',href=True):
url = 'http://www.wired.co.uk' + itt['href']
title = self.tag_to_string(itt)
description = ''
date = strftime(self.timefmt)
mfeed.append({
'title' :title
,'date' :date
,'url' :url
,'description':description
})
totalfeeds.append(('Articles', mfeed))
return totalfeeds
def get_cover_url(self):
cover_url = None
soup = self.index_to_soup(self.index)
cover_item = soup.find('span', attrs={'class':'cover'})
if cover_item:
cover_url = cover_item.img['src']
return cover_url
def print_version(self, url):
return url + '?page=all'
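
parse_index above bypasses RSS entirely and scrapes the magazine index page; calibre expects it to return a list of (section title, list of article dicts) pairs, each dict carrying at least title, url, date and description, exactly the structure built in mfeed. A small standalone sketch of that shape with placeholder values:

# Hypothetical scraped data; in the recipe above these values come from
# index_to_soup() and tag_to_string().
articles = [
    {'title': 'Sample article', 'date': '21 Feb 2010',
     'url': 'http://www.wired.co.uk/example', 'description': ''},
]
feeds = [('Articles', articles)]

# A custom parse_index() returns this structure instead of letting
# BasicNewsRecipe download RSS feeds.
for section, items in feeds:
    for art in items:
        print('%s: %s -> %s' % (section, art['title'], art['url']))
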

View File

@ -2,7 +2,7 @@ __license__ = 'GPL v3'
__copyright__ = '2008, Kovid Goyal kovid@kovidgoyal.net'
__docformat__ = 'restructuredtext en'
__appname__ = 'calibre'
__version__ = '0.6.40'
__version__ = '0.6.42'
__author__ = "Kovid Goyal <kovid@kovidgoyal.net>"
import re

View File

@ -139,12 +139,11 @@ class FileTypePlugin(Plugin):
#: to the database
on_import = False
#: If True, this plugin is run whenever an any2* tool
#: is used, on the file passed to the any2* tool.
#: If True, this plugin is run just before a conversion
on_preprocess = False
#: If True, this plugin is run after an any2* tool is
#: used, on the final file produced by the tool.
#: If True, this plugin is run after conversion
#: on the final file produced by the conversion output plugin.
on_postprocess = False
type = _('File type')
@ -249,6 +248,7 @@ class CatalogPlugin(Plugin):
#: dest = 'catalog_title',
#: help = (_('Title of generated catalog. \nDefault:') + " '" +
#: '%default' + "'"))]
#: cli_options parsed in library.cli:catalog_option_parser()
cli_options = []
@ -275,9 +275,10 @@ class CatalogPlugin(Plugin):
def get_output_fields(self, opts):
# Return a list of requested fields, with opts.sort_by first
all_fields = set(
['author_sort','authors','comments','cover','formats', 'id','isbn','pubdate','publisher','rating',
'series_index','series','size','tags','timestamp',
'title','uuid'])
['author_sort','authors','comments','cover','formats',
'id','isbn','pubdate','publisher','rating',
'series_index','series','size','tags','timestamp',
'title','uuid'])
fields = all_fields
if opts.fields != 'all':

View File

@ -4,27 +4,21 @@ __license__ = 'GPL v3'
__copyright__ = '2008, Kovid Goyal <kovid at kovidgoyal.net>,' \
' and Alex Bramley <a.bramley at gmail.com>.'
import sys, logging, os, re, shutil, subprocess, uuid
from shutil import rmtree
import os, shutil, uuid
from tempfile import mkdtemp
from mimetypes import guess_type as guess_mimetype
from htmlentitydefs import name2codepoint
from pprint import PrettyPrinter
from BeautifulSoup import BeautifulSoup, NavigableString
from lxml import html, etree
from BeautifulSoup import BeautifulSoup
from lxml import html
from pychm.chm import CHMFile
from pychm.chmlib import (
CHM_RESOLVE_SUCCESS, CHM_ENUMERATE_NORMAL,
chm_enumerate, chm_retrieve_object,
chm_enumerate,
)
from calibre.customize.conversion import InputFormatPlugin, OptionRecommendation
from calibre.utils.config import OptionParser
from calibre.ebooks.metadata import MetaInformation
from calibre.ebooks.metadata.opf2 import OPFCreator, Guide
from calibre.ebooks.metadata.toc import TOC
from calibre.ebooks.lrf.html.convert_from import process_file as html_process_file
from calibre.utils.localization import get_lang
from calibre.utils.filenames import ascii_filename
@ -35,17 +29,6 @@ def match_string(s1, s2_already_lowered):
return True
return False
def check_all_prev_empty(tag):
if tag is None:
return True
if tag.__class__ == NavigableString and not check_empty(tag):
return False
return check_all_prev_empty(tag.previousSibling)
def check_empty(s, rex = re.compile(r'\S')):
return rex.search(s) is None
def option_parser():
parser = OptionParser(usage=_('%prog [options] mybook.chm'))
parser.add_option('--output-dir', '-d', default='.', help=_('Output directory. Defaults to current directory'), dest='output')
@ -150,18 +133,18 @@ class CHMReader(CHMFile):
def _reformat(self, data):
try:
html = BeautifulSoup(data)
soup = BeautifulSoup(data)
except UnicodeEncodeError:
# hit some strange encoding problems...
print "Unable to parse html for cleaning, leaving it :("
return data
# nuke javascript...
[s.extract() for s in html('script')]
[s.extract() for s in soup('script')]
# remove forward and back nav bars from the top/bottom of each page
# cos they really fuck with the flow of things and generally waste space
# since we can't use [a,b] syntax to select arbitrary items from a list
# we'll have to do this manually...
t = html('table')
t = soup('table')
if t:
if (t[0].previousSibling is None
or t[0].previousSibling.previousSibling is None):
@ -171,15 +154,9 @@ class CHMReader(CHMFile):
t[-1].extract()
# for some very odd reason each page's content appears to be in a table
# too. and this table has sub-tables for random asides... grr.
# remove br at top of page if present after nav bars removed
br = html('br')
if br:
if check_all_prev_empty(br[0].previousSibling):
br[0].extract()
# some images seem to be broken in some chm's :/
for img in html('img'):
for img in soup('img'):
try:
# some are supposedly "relative"... lies.
while img['src'].startswith('../'): img['src'] = img['src'][3:]
@ -189,7 +166,7 @@ class CHMReader(CHMFile):
# and some don't even have a src= ?!
pass
# now give back some pretty html.
return html.prettify()
return soup.prettify()
def Contents(self):
if self._contents is not None:
@ -247,7 +224,7 @@ class CHMInput(InputFormatPlugin):
no_images = False #options.no_images
chm_name = stream.name
#chm_data = stream.read()
#closing stream so CHM can be opened by external library
stream.close()
log.debug('tdir=%s' % tdir)
@ -257,7 +234,6 @@ class CHMInput(InputFormatPlugin):
metadata = get_metadata_(tdir)
cwd = os.getcwdu()
odi = options.debug_pipeline
options.debug_pipeline = None
# try a custom conversion:
@ -277,15 +253,11 @@ class CHMInput(InputFormatPlugin):
htmlinput = HTMLInput(None)
oeb = htmlinput.create_oebbook(htmlpath, basedir, opts, log, mi)
return oeb
def _create_oebbook(self, hhcpath, basedir, opts, log, mi):
from calibre.ebooks.conversion.plumber import create_oebbook
from calibre.ebooks.oeb.base import DirContainer, \
rewrite_links, urlnormalize, urldefrag, BINARY_MIME, OEB_STYLES, \
xpath
from calibre import guess_type
import cssutils
from calibre.ebooks.oeb.base import DirContainer
oeb = create_oebbook(log, None, opts, self,
encoding=opts.input_encoding, populate=False)
self.oeb = oeb
@ -305,10 +277,10 @@ class CHMInput(InputFormatPlugin):
metadata.add('language', get_lang())
if not metadata.creator:
oeb.logger.warn('Creator not specified')
metadata.add('creator', self.oeb.translate(__('Unknown')))
metadata.add('creator', _('Unknown'))
if not metadata.title:
oeb.logger.warn('Title not specified')
metadata.add('title', self.oeb.translate(__('Unknown')))
metadata.add('title', _('Unknown'))
bookid = str(uuid.uuid4())
metadata.add('identifier', bookid, id='uuid_id', scheme='uuid')
@ -325,7 +297,7 @@ class CHMInput(InputFormatPlugin):
#print etree.tostring(hhcroot, pretty_print=True)
#print "============================="
log.debug('Found %d section nodes' % len(chapters))
if len(chapters) > 0:
path0 = chapters[0][1]
subpath = os.path.dirname(path0)

View File

@ -233,14 +233,18 @@ def create_option_parser(args, log):
return parser, plumber
def abspath(x):
if x.startswith('http:') or x.startswith('https:'):
return x
return os.path.abspath(os.path.expanduser(x))
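
The new abspath() helper exists because --cover (and --read-metadata-from-opf) may now be handed a URL: running os.path.expanduser/abspath over 'http://...' would mangle it into a filesystem path, so URLs are passed through untouched. The same check in a self-contained form, with example paths:

import os

def abspath(x):
    # Leave URLs alone; only expand and absolutize real filesystem paths.
    if x.startswith('http:') or x.startswith('https:'):
        return x
    return os.path.abspath(os.path.expanduser(x))

print(abspath('http://example.com/cover.jpg'))   # returned unchanged
print(abspath('~/covers/book.jpg'))              # expanded to an absolute path
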
def main(args=sys.argv):
log = Log()
parser, plumber = create_option_parser(args, log)
opts = parser.parse_args(args)[0]
y = lambda q : os.path.abspath(os.path.expanduser(q))
for x in ('read_metadata_from_opf', 'cover'):
if getattr(opts, x, None) is not None:
setattr(opts, x, y(getattr(opts, x)))
setattr(opts, x, abspath(getattr(opts, x)))
recommendations = [(n.dest, getattr(opts, n.dest),
OptionRecommendation.HIGH) \
for n in parser.options_iter()

View File

@ -424,7 +424,7 @@ OptionRecommendation(name='author_sort',
OptionRecommendation(name='cover',
recommended_value=None, level=OptionRecommendation.LOW,
help=_('Set the cover to the specified file.')),
help=_('Set the cover to the specified file or URL')),
OptionRecommendation(name='comments',
recommended_value=None, level=OptionRecommendation.LOW,
@ -638,6 +638,20 @@ OptionRecommendation(name='timestamp',
continue
setattr(mi, x, val)
def download_cover(self, url):
from calibre import browser
from PIL import Image
from cStringIO import StringIO
from calibre.ptempfile import PersistentTemporaryFile
self.log('Downloading cover from %r'%url)
br = browser()
raw = br.open_novisit(url).read()
buf = StringIO(raw)
pt = PersistentTemporaryFile('.jpg')
pt.close()
img = Image.open(buf)
img.convert('RGB').save(pt.name)
return pt.name
def read_user_metadata(self):
'''
@ -655,6 +669,8 @@ OptionRecommendation(name='timestamp',
mi = MetaInformation(opf)
self.opts_to_mi(mi)
if mi.cover:
if mi.cover.startswith('http:') or mi.cover.startswith('https:'):
mi.cover = self.download_cover(mi.cover)
mi.cover_data = ('', open(mi.cover, 'rb').read())
mi.cover = None
self.user_metadata = mi
@ -770,6 +786,7 @@ OptionRecommendation(name='timestamp',
self.oeb = create_oebbook(self.log, self.oeb, self.opts,
self.input_plugin)
self.input_plugin.postprocess_book(self.oeb, self.opts, self.log)
self.opts.is_image_collection = self.input_plugin.is_image_collection
pr = CompositeProgressReporter(0.34, 0.67, self.ui_reporter)
self.flush()
if self.opts.debug_pipeline is not None:

View File

@ -85,6 +85,8 @@ class StreamSlicer(object):
self._stream.truncate(value)
class MetadataUpdater(object):
DRM_KEY_SIZE = 48
def __init__(self, stream):
self.stream = stream
data = self.data = StreamSlicer(stream)
@ -105,6 +107,13 @@ class MetadataUpdater(object):
self.timestamp = None
self.pdbrecords = self.get_pdbrecords()
self.drm_block = None
if self.encryption_type != 0:
if self.have_exth:
self.drm_block = self.fetchDRMdata()
else:
raise MobiError('Unable to set metadata on DRM file without EXTH header')
self.original_exth_records = {}
if not have_exth:
self.create_exth()
@ -112,6 +121,16 @@ class MetadataUpdater(object):
# Fetch timestamp, cover_record, thumbnail_record
self.fetchEXTHFields()
def fetchDRMdata(self):
''' Fetch the DRM keys '''
drm_offset = int(unpack('>I', self.record0[0xa8:0xac])[0])
self.drm_key_count = int(unpack('>I', self.record0[0xac:0xb0])[0])
drm_keys = ''
for x in range(self.drm_key_count):
base_addr = drm_offset + (x * self.DRM_KEY_SIZE)
drm_keys += self.record0[base_addr:base_addr + self.DRM_KEY_SIZE]
return drm_keys
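
fetchDRMdata reads the DRM offset and key count straight out of the MOBI record-0 header with struct.unpack('>I', ...), i.e. big-endian unsigned 32-bit integers at the fixed offsets 0xa8 and 0xac, and each key occupies DRM_KEY_SIZE (48) bytes from that offset. A tiny self-contained illustration of the unpacking; the header bytes below are fabricated, not a real MOBI record:

from struct import pack, unpack

# Fake 4-byte big-endian fields standing in for record0[0xa8:0xac] and
# record0[0xac:0xb0] in the updater above.
fake_drm_offset = pack('>I', 0x0f10)
fake_drm_count = pack('>I', 2)

drm_offset = unpack('>I', fake_drm_offset)[0]
drm_key_count = unpack('>I', fake_drm_count)[0]
print('offset=%d keys=%d' % (drm_offset, drm_key_count))   # offset=3856 keys=2

# Key x then lives at drm_offset + x * 48 within record 0, which is what
# the loop in fetchDRMdata concatenates into drm_block.
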
def fetchEXTHFields(self):
stream = self.stream
record0 = self.record0
@ -186,7 +205,8 @@ class MetadataUpdater(object):
def create_exth(self, new_title=None, exth=None):
# Add an EXTH block to record 0, rewrite the stream
# self.hexdump(self.record0)
if isinstance(new_title, unicode):
new_title = new_title.encode(self.codec, 'replace')
# Fetch the existing title
title_offset, = unpack('>L', self.record0[0x54:0x58])
@ -210,8 +230,14 @@ class MetadataUpdater(object):
exth = ['EXTH', pack('>II', 12, 0), pad]
exth = ''.join(exth)
# Update title_offset, title_len if new_title
self.record0[0x54:0x58] = pack('>L', 0x10 + mobi_header_length + len(exth))
# Update drm_offset(0xa8), title_offset(0x54)
if self.encryption_type != 0:
self.record0[0xa8:0xac] = pack('>L', 0x10 + mobi_header_length + len(exth))
self.record0[0xb0:0xb4] = pack('>L', len(self.drm_block))
self.record0[0x54:0x58] = pack('>L', 0x10 + mobi_header_length + len(exth) + len(self.drm_block))
else:
self.record0[0x54:0x58] = pack('>L', 0x10 + mobi_header_length + len(exth))
if new_title:
self.record0[0x58:0x5c] = pack('>L', len(new_title))
@ -219,20 +245,15 @@ class MetadataUpdater(object):
new_record0 = StringIO()
new_record0.write(self.record0[:0x10 + mobi_header_length])
new_record0.write(exth)
if new_title:
#new_record0.write(new_title.encode(self.codec, 'replace'))
new_title = (new_title or _('Unknown')).encode(self.codec, 'replace')
new_record0.write(new_title)
else:
new_record0.write(title_in_file)
if self.encryption_type != 0:
new_record0.write(self.drm_block)
new_record0.write(new_title if new_title else title_in_file)
# Pad to a 4-byte boundary
trail = len(new_record0.getvalue()) % 4
pad = '\0' * (4 - trail) # Always pad w/ at least 1 byte
new_record0.write(pad)
#self.hexdump(new_record0.getvalue())
# Rebuild the stream, update the pdbrecords pointers
self.patchSection(0,new_record0.getvalue())
@ -342,10 +363,7 @@ class MetadataUpdater(object):
recs.append((202, pack('>I', self.thumbnail_rindex)))
pop_exth_record(202)
if getattr(self, 'encryption_type', -1) != 0:
raise MobiError('Setting metadata in DRMed MOBI files is not supported.')
# Restore any original EXTH fields that weren't modified/updated
# Restore any original EXTH fields that weren't updated
for id in sorted(self.original_exth_records):
recs.append((id, self.original_exth_records[id]))
recs = sorted(recs, key=lambda x:(x[0],x[0]))

View File

@ -1376,7 +1376,7 @@ class MobiWriter(object):
self._text_length,
self._text_nrecords-1, RECORD_SIZE, 0, 0)) # 0 - 15 (0x0 - 0xf)
uid = random.randint(0, 0xffffffff)
title = str(metadata.title[0])
title = unicode(metadata.title[0]).encode('utf-8')
# The MOBI Header
# 0x0 - 0x3
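
The one-line change above (str() replaced by unicode(...).encode('utf-8')) matches the changelog item about encoding titles as UTF-8: under Python 2, which calibre used at the time, str() on a unicode title containing non-ASCII characters raises UnicodeEncodeError, while an explicit UTF-8 encode always succeeds. A small Python 2 style illustration with an arbitrary title:

title = u'Ksi\u0105\u017cka pr\xf3bna'      # a non-ASCII title

try:
    encoded = str(title)                    # Python 2: implicit ASCII encode
except UnicodeEncodeError:
    encoded = None                          # this branch is taken on Python 2
utf8 = title.encode('utf-8')                # always works; bytes for the header

print(repr(encoded))
print(repr(utf8))
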

View File

@ -29,6 +29,9 @@ class RescaleImages(object):
page_width, page_height = self.opts.dest.width, self.opts.dest.height
if not self.opts.is_image_collection:
page_width -= (self.opts.margin_left + self.opts.margin_right) * self.opts.dest.dpi/72.
page_height -= (self.opts.margin_top + self.opts.margin_bottom) * self.opts.dest.dpi/72.
for item in self.oeb.manifest:
if item.media_type.startswith('image'):
raw = item.data
@ -53,7 +56,8 @@ class RescaleImages(object):
scaled, new_width, new_height = fit_image(width, height,
page_width, page_height)
if scaled:
self.log('Rescaling image', item.href)
self.log('Rescaling image from %dx%d to %dx%d'%(
width, height, new_width, new_height), item.href)
if qt:
img = img.scaled(new_width, new_height,
Qt.IgnoreAspectRatio, Qt.SmoothTransformation)
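
This is the fix behind the 0.6.42 changelog entry about comic pages being cut off on the SONY reader: the usable page area is now the device's pixel size minus the page margins, with margins given in points and converted to pixels via dpi/72. A short worked example of the arithmetic using made-up profile numbers, not an actual output profile:

# Hypothetical device: 600x800 px at 168 dpi, 5 pt margins on every side.
dest_width, dest_height, dpi = 600, 800, 168.0
margin_left = margin_right = margin_top = margin_bottom = 5.0   # points

page_width = dest_width - (margin_left + margin_right) * dpi / 72.
page_height = dest_height - (margin_top + margin_bottom) * dpi / 72.
print('usable area: %.0f x %.0f px' % (page_width, page_height))
# usable area: 577 x 777 px -- images are scaled to fit this, not the full 600x800
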

View File

@ -2,9 +2,11 @@ __license__ = 'GPL v3'
__copyright__ = '2008, Kovid Goyal <kovid at kovidgoyal.net>'
""" The GUI """
import os
from threading import RLock
from PyQt4.QtCore import QVariant, QFileInfo, QObject, SIGNAL, QBuffer, Qt, QSize, \
QByteArray, QTranslator, QCoreApplication, QThread, \
QEvent
QEvent, QTimer, pyqtSignal
from PyQt4.QtGui import QFileDialog, QMessageBox, QPixmap, QFileIconProvider, \
QIcon, QTableView, QApplication, QDialog, QPushButton
@ -234,16 +236,17 @@ def human_readable(size):
return size + " " + suffix
class Dispatcher(QObject):
'''Convenience class to ensure that a function call always happens in the GUI thread'''
SIGNAL = SIGNAL('dispatcher(PyQt_PyObject,PyQt_PyObject)')
'''Convenience class to ensure that a function call always happens in the
thread the receiver was created in.'''
dispatch_signal = pyqtSignal(object, object)
def __init__(self, func):
QObject.__init__(self)
self.func = func
self.connect(self, self.SIGNAL, self.dispatch, Qt.QueuedConnection)
self.dispatch_signal.connect(self.dispatch, type=Qt.QueuedConnection)
def __call__(self, *args, **kwargs):
self.emit(self.SIGNAL, args, kwargs)
self.dispatch_signal.emit(args, kwargs)
def dispatch(self, args, kwargs):
self.func(*args, **kwargs)
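
The rewritten Dispatcher keeps the old contract: the object can be called from any thread, the call is queued through a pyqtSignal connected with Qt.QueuedConnection, and the wrapped function runs in the thread that created the Dispatcher (the GUI thread). For readers without Qt at hand, the same pattern can be sketched with a plain queue drained by the owning thread; this is an illustration of the idea, not calibre's implementation:

import threading
try:
    from queue import Queue      # Python 3
except ImportError:
    from Queue import Queue      # Python 2

class QueueDispatcher(object):
    '''Queue calls made from any thread; the owning thread drains them.'''
    def __init__(self, func):
        self.func = func
        self.calls = Queue()

    def __call__(self, *args, **kwargs):     # safe to call from any thread
        self.calls.put((args, kwargs))

    def drain(self):                         # run in the owning thread
        while not self.calls.empty():
            args, kwargs = self.calls.get()
            self.func(*args, **kwargs)

def update_ui(msg):
    print('handled in the owning thread: %s' % msg)

d = QueueDispatcher(update_ui)
worker = threading.Thread(target=d, args=('book added',))
worker.start()
worker.join()
d.drain()    # Qt performs this step automatically via its event loop
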
@ -533,6 +536,8 @@ class Application(QApplication):
self._translator = None
self.load_translations()
qt_app = self
self._file_open_paths = []
self._file_open_lock = RLock()
if islinux:
self.setStyleSheet('''
@ -545,6 +550,12 @@ class Application(QApplication):
}
''')
def _send_file_open_events(self):
with self._file_open_lock:
if self._file_open_paths:
self.file_event_hook(self._file_open_paths)
self._file_open_paths = []
def load_translations(self):
if self._translator is not None:
@ -557,7 +568,9 @@ class Application(QApplication):
if callable(self.file_event_hook) and e.type() == QEvent.FileOpen:
path = unicode(e.file())
if os.access(path, os.R_OK):
self.file_event_hook(path)
with self._file_open_lock:
self._file_open_paths.append(path)
QTimer.singleShot(1000, self._send_file_open_events)
return True
else:
return QApplication.event(self, e)

View File

@ -601,6 +601,8 @@ class Main(MainWindow, Ui_MainWindow, DeviceGUI):
if dynamic.get('tag_view_visible', False):
self.status_bar.tag_view_button.toggle()
self._add_filesystem_book = Dispatcher(self.__add_filesystem_book)
def resizeEvent(self, ev):
MainWindow.resizeEvent(self, ev)
@ -988,15 +990,24 @@ class Main(MainWindow, Ui_MainWindow, DeviceGUI):
self.cover_cache.refresh([cid])
self.library_view.model().current_changed(current_idx, current_idx)
def add_filesystem_book(self, path, allow_device=True):
if os.access(path, os.R_OK):
books = [os.path.abspath(path)]
def __add_filesystem_book(self, paths, allow_device=True):
if isinstance(paths, basestring):
paths = [paths]
books = [path for path in map(os.path.abspath, paths) if os.access(path,
os.R_OK)]
if books:
to_device = allow_device and self.stack.currentIndex() != 0
self._add_books(books, to_device)
if to_device:
self.status_bar.showMessage(\
_('Uploading books to device.'), 2000)
def add_filesystem_book(self, paths, allow_device=True):
self._add_filesystem_book(paths, allow_device=allow_device)
def add_books(self, checked):
'''
Add books from the local filesystem to either the library or the device.
@ -1042,21 +1053,23 @@ class Main(MainWindow, Ui_MainWindow, DeviceGUI):
infos, on_card=on_card)
self.status_bar.showMessage(
_('Uploading books to device.'), 2000)
if self._adder.number_of_books_added > 0:
if getattr(self._adder, 'number_of_books_added', 0) > 0:
self.library_view.model().books_added(self._adder.number_of_books_added)
if hasattr(self, 'db_images'):
self.db_images.reset()
if self._adder.critical:
if getattr(self._adder, 'critical', None):
det_msg = []
for name, log in self._adder.critical.items():
if isinstance(name, str):
name = name.decode(filesystem_encoding, 'replace')
det_msg.append(name+'\n'+log)
warning_dialog(self, _('Failed to read metadata'),
_('Failed to read metadata from the following')+':',
det_msg='\n\n'.join(det_msg), show=True)
self._adder.cleanup()
if hasattr(self._adder, 'cleanup'):
self._adder.cleanup()
self._adder = None

View File

@ -1,4 +1,4 @@
import datetime, htmlentitydefs, os, re, shutil, time
import datetime, htmlentitydefs, os, re, shutil
from collections import namedtuple
from copy import deepcopy
@ -11,7 +11,7 @@ from calibre.customize.conversion import OptionRecommendation, DummyReporter
from calibre.ebooks.BeautifulSoup import BeautifulSoup, BeautifulStoneSoup, Tag, NavigableString
from calibre.ptempfile import PersistentTemporaryDirectory
from calibre.utils.logging import Log
from calibre.utils.date import isoformat
from calibre.utils.date import isoformat, now as nowf
FIELDS = ['all', 'author_sort', 'authors', 'comments',
'cover', 'formats', 'id', 'isbn', 'pubdate', 'publisher', 'rating',
@ -21,7 +21,7 @@ FIELDS = ['all', 'author_sort', 'authors', 'comments',
class CSV_XML(CatalogPlugin):
'CSV/XML catalog generator'
Option = namedtuple('Option', 'option, default, dest, help')
Option = namedtuple('Option', 'option, default, dest, action, help')
name = 'Catalog_CSV_XML'
description = 'CSV/XML catalog generator'
@ -34,6 +34,7 @@ class CSV_XML(CatalogPlugin):
Option('--fields',
default = 'all',
dest = 'fields',
action = None,
help = _('The fields to output when cataloging books in the '
'database. Should be a comma-separated list of fields.\n'
'Available fields: %s.\n'
@ -43,6 +44,7 @@ class CSV_XML(CatalogPlugin):
Option('--sort-by',
default = 'id',
dest = 'sort_by',
action = None,
help = _('Output field to sort on.\n'
'Available fields: author_sort, id, rating, size, timestamp, title.\n'
"Default: '%default'\n"
@ -241,7 +243,7 @@ class CSV_XML(CatalogPlugin):
class EPUB_MOBI(CatalogPlugin):
'ePub catalog generator'
Option = namedtuple('Option', 'option, default, dest, help')
Option = namedtuple('Option', 'option, default, dest, action, help')
name = 'Catalog_EPUB_MOBI'
description = 'EPUB/MOBI catalog generator'
@ -254,12 +256,14 @@ class EPUB_MOBI(CatalogPlugin):
cli_options = [Option('--catalog-title',
default = 'My Books',
dest = 'catalog_title',
action = None,
help = _('Title of generated catalog used as title in metadata.\n'
"Default: '%default'\n"
"Applies to: ePub, MOBI output formats")),
Option('--debug-pipeline',
default=None,
dest='debug_pipeline',
action = None,
help=_("Save the output from different stages of the conversion "
"pipeline to the specified "
"directory. Useful if you are unsure at which stage "
@ -269,48 +273,56 @@ class EPUB_MOBI(CatalogPlugin):
Option('--exclude-genre',
default='\[[\w ]*\]',
dest='exclude_genre',
action = None,
help=_("Regex describing tags to exclude as genres.\n" "Default: '%default' excludes bracketed tags, e.g. '[<tag>]'\n"
"Applies to: ePub, MOBI output formats")),
Option('--exclude-tags',
default=('~,'+_('Catalog')),
dest='exclude_tags',
action = None,
help=_("Comma-separated list of tag words indicating book should be excluded from output. Case-insensitive.\n"
"--exclude-tags=skip will match 'skip this book' and 'Skip will like this'.\n"
"Default: '%default'\n"
"Applies to: ePub, MOBI output formats")),
Option('--generate-titles',
default=True,
default=False,
dest='generate_titles',
action = 'store_true',
help=_("Include 'Titles' section in catalog.\n"
"Default: '%default'\n"
"Applies to: ePub, MOBI output formats")),
Option('--generate-recently-added',
default=True,
default=False,
dest='generate_recently_added',
action = 'store_true',
help=_("Include 'Recently Added' section in catalog.\n"
"Default: '%default'\n"
"Applies to: ePub, MOBI output formats")),
Option('--note-tag',
default='*',
dest='note_tag',
action = None,
help=_("Tag prefix for user notes, e.g. '*Jeff might enjoy reading this'.\n"
"Default: '%default'\n"
"Applies to: ePub, MOBI output formats")),
Option('--numbers-as-text',
default=False,
dest='numbers_as_text',
action = None,
help=_("Sort titles with leading numbers as text, e.g.,\n'2001: A Space Odyssey' sorts as \n'Two Thousand One: A Space Odyssey'.\n"
"Default: '%default'\n"
"Applies to: ePub, MOBI output formats")),
Option('--output-profile',
default=None,
dest='output_profile',
action = None,
help=_("Specifies the output profile. In some cases, an output profile is required to optimize the catalog for the device. For example, 'kindle' or 'kindle_dx' creates a structured Table of Contents with Sections and Articles.\n"
"Default: '%default'\n"
"Applies to: ePub, MOBI output formats")),
Option('--read-tag',
default='+',
dest='read_tag',
action = None,
help=_("Tag indicating book has been read.\n" "Default: '%default'\n"
"Applies to: ePub, MOBI output formats")),
]
@ -1749,9 +1761,8 @@ class EPUB_MOBI(CatalogPlugin):
book['title_sort'] = self.generateSortTitle(book['title'])
self.booksByDateRange = sorted(nspt, key=lambda x:(x['timestamp'], x['timestamp']),reverse=True)
today = datetime.datetime.now()
date_range_list = []
today_time = datetime.datetime(today.year, today.month, today.day)
today_time = nowf().replace(hour=23, minute=59, second=59)
books_added_in_date_range = False
for (i, date) in enumerate(self.DATE_RANGE):
date_range_limit = self.DATE_RANGE[i]
@ -1759,14 +1770,16 @@ class EPUB_MOBI(CatalogPlugin):
date_range = '%d to %d days ago' % (self.DATE_RANGE[i-1], self.DATE_RANGE[i])
else:
date_range = 'Last %d days' % (self.DATE_RANGE[i])
for book in self.booksByDateRange:
book_time = datetime.datetime(book['timestamp'].year, book['timestamp'].month, book['timestamp'].day)
if (today_time-book_time).days <= date_range_limit:
#print "generateHTMLByDateAdded: %s added %d days ago" % (book['title'], (today_time-book_time).days)
book_time = book['timestamp']
delta = today_time-book_time
if delta.days <= date_range_limit:
date_range_list.append(book)
books_added_in_date_range = True
else:
break
dtc = add_books_to_HTML_by_date_range(date_range_list, date_range, dtc)
date_range_list = [book]
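
The rewritten date-range logic leans on the new timezone awareness: nowf() returns an aware datetime and, after this change, book['timestamp'] is presumably aware as well, so the delta can be taken directly instead of rebuilding naive datetimes field by field; mixing aware and naive values would in fact raise TypeError. A standalone sketch of that arithmetic; the UTC class and dates below are illustrative stand-ins, not calibre's utilities:

from datetime import datetime, timedelta, tzinfo

class UTC(tzinfo):
    # Minimal fixed-offset zone standing in for calibre.utils.date's utc tz.
    def utcoffset(self, dt): return timedelta(0)
    def dst(self, dt): return timedelta(0)
    def tzname(self, dt): return 'UTC'

utc = UTC()
now = datetime(2010, 2, 20, 23, 59, 59, tzinfo=utc)   # cf. nowf().replace(hour=23, ...)
added = datetime(2010, 2, 14, 8, 30, tzinfo=utc)      # a book's timestamp

print((now - added).days)    # 6 -> the book falls in the 'Last 7 days' range

try:
    datetime(2010, 2, 20) - added                     # naive minus aware
except TypeError as e:
    print('mixing naive and aware datetimes fails: %s' % e)
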
@ -3412,13 +3425,12 @@ class EPUB_MOBI(CatalogPlugin):
def run(self, path_to_output, opts, db, notification=DummyReporter()):
opts.log = log = Log()
opts.fmt = self.fmt = path_to_output.rpartition('.')[2]
self.opts = opts
# Add local options
opts.creator = "calibre"
# Finalize output_profile
op = self.opts.output_profile
op = opts.output_profile
if op is None:
op = 'default'
if opts.connected_device['name'] and 'kindle' in opts.connected_device['name'].lower():
@ -3428,59 +3440,61 @@ class EPUB_MOBI(CatalogPlugin):
op = "kindle"
opts.descriptionClip = 380 if op.endswith('dx') or 'kindle' not in op else 100
opts.authorClip = 100 if op.endswith('dx') or 'kindle' not in op else 60
self.opts.output_profile = op
opts.output_profile = op
opts.basename = "Catalog"
opts.cli_environment = not hasattr(opts,'sync')
# GwR *** hardwired to sort by author, could be an option if passed in opts
opts.sort_descriptions_by_author = True
if opts.verbose:
opts_dict = vars(opts)
log(u"%s(): Generating %s %sin %s environment" %
(self.name,self.fmt,'for %s ' % opts.output_profile if opts.output_profile else '',
'CLI' if opts.cli_environment else 'GUI'))
if opts_dict['ids']:
log(" Book count: %d" % len(opts_dict['ids']))
build_log = []
sections_list = ['Descriptions','Authors']
if opts.generate_titles:
sections_list.append('Titles')
if opts.generate_recently_added:
sections_list.append('Recently Added')
if not opts.exclude_genre.strip() == '.':
sections_list.append('Genres')
log(u"Creating Sections for %s" % ', '.join(sections_list))
# If exclude_genre is blank, assume user wants all genre tags included
if opts.exclude_genre.strip() == '':
opts.exclude_genre = '\[^.\]'
log(" converting empty exclude_genre to '\[^.\]'")
if opts.connected_device['name']:
if opts.connected_device['serial']:
log(" connected_device: '%s' #%s%s " % \
(opts.connected_device['name'],
opts.connected_device['serial'][0:4],
'x' * (len(opts.connected_device['serial']) - 4)))
else:
log(" connected_device: '%s'" % opts.connected_device['name'])
# If exclude_genre is blank, assume user wants all genre tags included
if opts.exclude_genre.strip() == '':
opts.exclude_genre = '\[^.\]'
build_log.append(" converting empty exclude_genre to '\[^.\]'")
if opts.connected_device['name']:
if opts.connected_device['serial']:
build_log.append(" connected_device: '%s' #%s%s " % \
(opts.connected_device['name'],
opts.connected_device['serial'][0:4],
'x' * (len(opts.connected_device['serial']) - 4)))
else:
build_log.append(" connected_device: '%s'" % opts.connected_device['name'])
for storage in opts.connected_device['storage']:
if storage:
log(" mount point: %s" % storage)
# for book in opts.connected_device['books']:
# log("%s: %s" % (book.title, book.path))
build_log.append(" mount point: %s" % storage)
# Display opts
keys = opts_dict.keys()
keys.sort()
log(" opts:")
for key in keys:
if key in ['catalog_title','authorClip','descriptionClip','exclude_genre','exclude_tags',
'note_tag','numbers_as_text','read_tag',
'search_text','sort_by','sort_descriptions_by_author','sync']:
log(" %s: %s" % (key, opts_dict[key]))
opts_dict = vars(opts)
build_log.append(u"%s(): Generating %s %sin %s environment" %
(self.name,self.fmt,'for %s ' % opts.output_profile if opts.output_profile else '',
'CLI' if opts.cli_environment else 'GUI'))
if opts_dict['ids']:
build_log.append(" Book count: %d" % len(opts_dict['ids']))
sections_list = ['Descriptions','Authors']
if opts.generate_titles:
sections_list.append('Titles')
if opts.generate_recently_added:
sections_list.append('Recently Added')
if not opts.exclude_genre.strip() == '.':
sections_list.append('Genres')
build_log.append(u"Creating Sections for %s" % ', '.join(sections_list))
# Display opts
keys = opts_dict.keys()
keys.sort()
build_log.append(" opts:")
for key in keys:
if key in ['catalog_title','authorClip','descriptionClip','exclude_genre','exclude_tags',
'note_tag','numbers_as_text','read_tag',
'search_text','sort_by','sort_descriptions_by_author','sync']:
build_log.append(" %s: %s" % (key, opts_dict[key]))
if opts.verbose:
log('\n'.join(line for line in build_log))
self.opts = opts
# Launch the Catalog builder
catalog = self.CatalogBuilder(db, opts, self, report_progress=notification)
@ -3498,7 +3512,8 @@ class EPUB_MOBI(CatalogPlugin):
if catalog_source_built:
recommendations = []
# recommendations.append(('cover', I('catalog.svg'), OptionRecommendation.HIGH))
recommendations.append(('comments', '\n'.join(line for line in build_log),
OptionRecommendation.HIGH))
dp = getattr(opts, 'debug_pipeline', None)
if dp is not None:
@ -3519,7 +3534,6 @@ class EPUB_MOBI(CatalogPlugin):
opts.basename + '.opf'), path_to_output, log, report_progress=notification,
abort_after_input_dump=False)
plumber.merge_ui_recommendations(recommendations)
plumber.run()
return 0
else:

View File

@ -587,9 +587,6 @@ def command_export(args, dbpath):
do_export(get_db(dbpath, opts), ids, dir, opts)
return 0
# GR additions
def catalog_option_parser(args):
from calibre.customize.ui import available_catalog_formats, plugin_for_catalog_format
from calibre.utils.logging import Log
@ -599,10 +596,17 @@ def catalog_option_parser(args):
# Fetch the extension-specific CLI options from the plugin
plugin = plugin_for_catalog_format(fmt)
for option in plugin.cli_options:
parser.add_option(option.option,
default=option.default,
dest=option.dest,
help=option.help)
if option.action:
parser.add_option(option.option,
default=option.default,
dest=option.dest,
action=option.action,
help=option.help)
else:
parser.add_option(option.option,
default=option.default,
dest=option.dest,
help=option.help)
return plugin
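
The Option namedtuple for catalog plugins gained an action field so boolean switches such as --generate-titles can be declared as store_true flags, and catalog_option_parser only passes action on to optparse when it is set. A condensed standalone sketch of the same optparse wiring; the two options mirror the plugin's, the parser is plain optparse:

from collections import namedtuple
from optparse import OptionParser

Option = namedtuple('Option', 'option, default, dest, action, help')

cli_options = [
    Option('--catalog-title', 'My Books', 'catalog_title', None,
           'Title of generated catalog'),
    Option('--generate-titles', False, 'generate_titles', 'store_true',
           "Include 'Titles' section in catalog"),
]

parser = OptionParser()
for option in cli_options:
    kwargs = dict(default=option.default, dest=option.dest, help=option.help)
    if option.action:                 # only boolean flags carry an action
        kwargs['action'] = option.action
    parser.add_option(option.option, **kwargs)

opts, args = parser.parse_args(['--generate-titles'])
print('%s %s' % (opts.catalog_title, opts.generate_titles))   # My Books True
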

View File

@ -1458,35 +1458,35 @@ class LibraryDatabase2(LibraryDatabase):
def add_catalog(self, path, title):
format = os.path.splitext(path)[1][1:].lower()
stream = path if hasattr(path, 'read') else open(path, 'rb')
stream.seek(0)
matches = self.data.get_matches('title', title)
if matches:
tag_matches = self.data.get_matches('tags', _('Catalog'))
matches = matches.intersection(tag_matches)
db_id, existing = None, False
if matches:
db_id = list(matches)[0]
existing = True
if db_id is None:
obj = self.conn.execute('INSERT INTO books(title, author_sort) VALUES (?, ?)',
(title, 'calibre'))
db_id = obj.lastrowid
self.data.books_added([db_id], self)
self.set_path(db_id, index_is_id=True)
self.conn.commit()
mi = MetaInformation(title, ['calibre'])
with open(path, 'rb') as stream:
matches = self.data.get_matches('title', '='+title)
if matches:
tag_matches = self.data.get_matches('tags', '='+_('Catalog'))
matches = matches.intersection(tag_matches)
db_id = None
if matches:
db_id = list(matches)[0]
if db_id is None:
obj = self.conn.execute('INSERT INTO books(title, author_sort) VALUES (?, ?)',
(title, 'calibre'))
db_id = obj.lastrowid
self.data.books_added([db_id], self)
self.set_path(db_id, index_is_id=True)
self.conn.commit()
try:
mi = get_metadata(stream, format)
except:
mi = MetaInformation(title, ['calibre'])
stream.seek(0)
mi.title, mi.authors = title, ['calibre']
mi.tags = [_('Catalog')]
mi.pubdate = mi.timestamp = utcnow()
if format == 'mobi':
mi.cover, mi.cover_data = None, (None, None)
self.set_metadata(db_id, mi)
self.add_format(db_id, format, stream, index_is_id=True)
self.add_format(db_id, format, stream, index_is_id=True)
if not hasattr(path, 'read'):
stream.close()
self.conn.commit()
if existing:
t = utcnow()
self.set_timestamp(db_id, t, notify=False)
self.set_pubdate(db_id, t, notify=False)
self.data.refresh_ids(self, [db_id]) # Needed to update format list and size
return db_id
@ -1509,6 +1509,10 @@ class LibraryDatabase2(LibraryDatabase):
self.data.books_added([id], self)
self.set_path(id, index_is_id=True)
self.conn.commit()
if mi.pubdate is None:
mi.pubdate = utcnow()
if mi.timestamp is None:
mi.timestamp = utcnow()
self.set_metadata(id, mi)
self.add_format(id, format, stream, index_is_id=True)
@ -1546,6 +1550,10 @@ class LibraryDatabase2(LibraryDatabase):
self.data.books_added([id], self)
self.set_path(id, True)
self.conn.commit()
if mi.timestamp is None:
mi.timestamp = utcnow()
if mi.pubdate is None:
mi.pubdate = utcnow()
self.set_metadata(id, mi)
if cover is not None:
self.set_cover(id, cover)
@ -1581,7 +1589,9 @@ class LibraryDatabase2(LibraryDatabase):
self.set_path(id, True)
self.conn.commit()
if mi.timestamp is None:
mi.timestamp = nowf()
mi.timestamp = utcnow()
if mi.pubdate is None:
mi.pubdate = utcnow()
self.set_metadata(id, mi)
npath = self.run_import_plugins(path, format)
format = os.path.splitext(npath)[-1].lower().replace('.', '').upper()
@ -1614,7 +1624,9 @@ class LibraryDatabase2(LibraryDatabase):
self.data.books_added([id], self)
self.set_path(id, True)
if mi.timestamp is None:
mi.timestamp = nowf()
mi.timestamp = utcnow()
if mi.pubdate is None:
mi.pubdate = utcnow()
self.set_metadata(id, mi, ignore_errors=True)
for path in formats:
ext = os.path.splitext(path)[1][1:].lower()

View File

@ -23,7 +23,7 @@ def convert_timestamp(val):
return parse_date(val, as_utc=False)
def adapt_datetime(dt):
return isoformat(dt)
return isoformat(dt, sep=' ')
sqlite.register_adapter(datetime, adapt_datetime)
sqlite.register_converter('timestamp', convert_timestamp)
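
adapt_datetime and convert_timestamp are a standard sqlite3 adapter/converter pair: the adapter controls how datetime values are serialized into columns declared as timestamp (now with a space instead of 'T' as the separator), and the converter parses them back, here via calibre's parse_date. A minimal self-contained example of the same registration using only the standard library; the table and values are throwaway:

import sqlite3
from datetime import datetime

sqlite3.register_adapter(datetime, lambda dt: dt.isoformat(' '))
sqlite3.register_converter('timestamp',
    lambda raw: datetime.strptime(
        raw.decode('utf-8') if isinstance(raw, bytes) else raw,
        '%Y-%m-%d %H:%M:%S'))

conn = sqlite3.connect(':memory:', detect_types=sqlite3.PARSE_DECLTYPES)
conn.execute('CREATE TABLE books (added timestamp)')
conn.execute('INSERT INTO books VALUES (?)', (datetime(2010, 2, 20, 10, 37, 59),))
print(repr(conn.execute('SELECT added FROM books').fetchone()[0]))
# datetime.datetime(2010, 2, 20, 10, 37, 59)
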

19 file diffs suppressed because they are too large.

View File

@ -72,7 +72,7 @@ def qt_to_dt(qdate_or_qdatetime, as_utc=True):
return dt.astimezone(_utc_tz if as_utc else _local_tz)
def fromtimestamp(ctime, as_utc=True):
dt = datetime.utcfromtimestamp().replace(tzinfo=_utc_tz)
dt = datetime.utcfromtimestamp(ctime).replace(tzinfo=_utc_tz)
if not as_utc:
dt = dt.astimezone(_local_tz)
return dt
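
The fix above is simply that utcfromtimestamp() was being called without its ctime argument, which raises TypeError on the first use; the corrected version turns an epoch timestamp into a UTC datetime (made timezone-aware via the replace(tzinfo=_utc_tz) call) and optionally shifts it to local time. A quick standalone check of the corrected call using only the standard library, without calibre's _utc_tz/_local_tz objects:

from datetime import datetime

try:
    datetime.utcfromtimestamp()              # the old bug: missing argument
except TypeError as e:
    print('old call fails: %s' % e)

print(datetime.utcfromtimestamp(0))          # 1970-01-01 00:00:00
print(datetime.utcfromtimestamp(1266710400)) # 2010-02-21 00:00:00 (UTC)
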