Merge from trunk

2025-07-09 03:04:10 -04:00 · 2010-12-12 00:13:33 +01:00 · 2010-12-12 00:13:33 +01:00 · 042474b1eb
commit 042474b1eb
parent 1d968f71b7 1761b6fb92
87 changed files with 235318 additions and 123553 deletions
--- a/Changelog.yaml
+++ b/Changelog.yaml
@ -4,6 +4,81 @@
 # for important features/bug fixes.
 # Also, each release can have new and improved recipes.

+- version: 0.7.33
+  date: 2010-12-10
+
+  new features:
+    - title: "Language sensitive sorting"
+      type: major
+      description: >
+        "calibre now sorts using language specific rules. The language used is the language of the calibre interface, which can be changed via Preferences->Look & Feel. There is also
+        a tweak that allows you to use a different language from the one used for the calibre interface. Powered by the ICU library."
+
+    - title: "Add an action to merge only formats and leave metadata alone (Shift+Alt+M)"
+      tickets: [7709]
+
+    - title: "Add a tweak to control which custom columns are displayed in the Book details panel."
+
+    - title: "Implement a more sophisticated 'functional programming' template language. See the User Manual for details."
+
+    - title: "Speed up deleting of large numbers of books and show progress while doing so"
+
+    - title: "Adding books: Dont refresh the Tag Browser while adding multiple books. Should speed up the adding of large numbers of books."
+
+    - title: "Edit metadata dialog: When trying to download metadata, if there are multiple matches indicate which matches have a cover and summary in the list. Also add an option to automatically download the cover of the selected match."
+
+    - title: "Drivers for the HTC Legend and Samsung Epic"
+
+    - title: "FB2 Output: Convert SVG images in the input document to raster images"
+
+    - title: "News download: Localize the navigation bars in the downloaded news to the language the user has selected for their calibre interface"
+
+  bug fixes:
+    - title: "Various fixes to the Title Case function"
+      tickets: [7846]
+
+    - title: "Content server: Fix --url-prefix being ignored for links at the Top level"
+
+    - title: "News download: When generating periodicals for the SONY use the local timezone in the SONY specific metadata"
+
+    - title: "Fix bug in cover cache that could cause it to keep a large number of covers in memory. Showed up when adding large numbers of books to calibre."
+      tickets: [7813]
+
+    - title: "Adding books: Run in the main thread to prevent unfortunate interactions with the metadata backup. Also fix regression that broke the Abort button."
+
+    - title: "Fix a crash on OS X if OK is clicked inthe edit metadata button while downloading a cover"
+      tickets: [7716]
+
+    - title: "E-book viewer: Fix a regression that prevented booksmarks from working with some EPUB files"
+      tickets: [7812]
+
+    - title: "Save to disk: Refactor to not open a database connection in the worker process. Also fix a bug that could lead to save failures not being reported."
+
+    - title: "Fix regression in 0.7.32 that broke opening formats in the ebook viewer from the edit metadata dialog"
+
+    - title: "FB2 Output: Generate output 100% compliant with the FB2 spec"
+
+    - title: "Fix Saved search dropdown box looses selected search"
+      tickets: [7787]
+
+    - title: "TXT Output: Fix an issue where the br to space conversion was not being handled properly."
+
+  improved recipes:
+    - Le Monde
+    - Ming Pao
+    - New Yorker
+
+  new recipes:
+    - title: "ToyoKeizai News and Nikkei Social News"
+      author: "Hiroshi Miura"
+      
+    - title: "St. Louis Post Dispatch"
+      author: "cisaak"
+
+    - title: "Heise Open and Technology Review"
+      author: "Anton Gillert"
+
+
 - version: 0.7.32
  date: 2010-12-03

--- a/resources/default_tweaks.py
+++ b/resources/default_tweaks.py
@ -181,19 +181,25 @@ max_content_server_tags_shown=5
 # content_server_will_display is a list of custom fields to be displayed.
 # content_server_wont_display is a list of custom fields not to be displayed.
 # wont_display has priority over will_display.
-# The special value '*' means all custom fields.
+# The special value '*' means all custom fields. The value [] means no entries.
 # Defaults:
 #    content_server_will_display = ['*']
-#    content_server_wont_display = ['']
+#    content_server_wont_display = []
 # Examples:
 # To display only the custom fields #mytags and #genre:
 #   content_server_will_display = ['#mytags', '#genre']
-#   content_server_wont_display = ['']
+#   content_server_wont_display = []
 # To display all fields except #mycomments:
 #   content_server_will_display = ['*']
 #   content_server_wont_display['#mycomments']
 content_server_will_display = ['*']
-content_server_wont_display = ['']
+content_server_wont_display = []
+
+# Same as above (content server) but for the book details pane. Same syntax.
+# As above, this tweak affects only display of custom fields. The standard
+# fields are not affected
+book_details_will_display = ['*']
+book_details_wont_display = []


 # Set the maximum number of sort 'levels' that calibre will use to resort the
--- a/resources/recipes/heise_open.recipe
+++ b/resources/recipes/heise_open.recipe
@ -0,0 +1,38 @@
+__license__   = 'GPL v3'
+__copyright__ = '2010, Anton Gillert <atx at binaryninja.de>'
+
+'''
+Fetch Heise Open.
+'''
+from calibre.web.feeds.news import BasicNewsRecipe
+
+
+class HeiseOpenDe(BasicNewsRecipe):
+
+    title = 'Heise Open'
+    description = 'Opensource news from Germany'
+    __author__ = 'Anton Gillert'
+    use_embedded_content   = False
+    language = 'de'
+    timefmt = ' [%d %b %Y]'
+    max_articles_per_feed = 40
+    no_stylesheets = True
+
+    feeds =  [ ('Heise Open', 'http://www.heise.de/open/news/news-atom.xml') ]
+
+    def print_version(self, url):
+        return url + '?view=print'
+
+    remove_tags = [dict(id='navi_top'),
+		   dict(id='navi_bottom'),
+		   dict(name='div', attrs={'class':'navi_top_logo'}),
+		   dict(name='img', attrs={'src':'/open/icons/open_logo_2009_weiss.gif'}),
+		   dict(name='h5', attrs={'style':'margin: 0.5em 0;'}),
+		   dict(name='p', attrs={'class':'news_datum'}),
+		   dict(name='p', attrs={'class':'size80'})]
+    remove_tags_after = [dict(name='p', attrs={'class':'size80'})]
+
+    def get_cover_url(self):
+        return 'http://www.heise.de/open/icons/open_logo_2009_weiss.gif'
+
+
--- a/resources/recipes/kompiutierra.recipe
+++ b/resources/recipes/kompiutierra.recipe
@ -0,0 +1,36 @@
+#!/usr/bin/python
+# -*- coding: utf-8 -*-
+
+__license__   = 'GPL v3'
+__copyright__ = '2010, Vadim Dyadkin, dyadkin@gmail.com'
+__author__ = 'Vadim Dyadkin'
+
+from calibre.web.feeds.news import BasicNewsRecipe
+
+class Computerra(BasicNewsRecipe):
+    title = u'\u041a\u043e\u043c\u043f\u044c\u044e\u0442\u0435\u0440\u0440\u0430'
+    recursion = 50
+    oldest_article = 100
+    __author__  = 'Vadim Dyadkin'
+    max_articles_per_feed = 100
+    use_embedded_content  = False
+    simultaneous_downloads = 5
+    language = 'ru'
+    description = u'\u041a\u043e\u043c\u043f\u044c\u044e\u0442\u0435\u0440\u044b, \u043e\u043a\u043e\u043b\u043e\u043d\u0430\u0443\u0447\u043d\u044b\u0435 \u0438 \u043e\u043a\u043e\u043b\u043e\u0444\u0438\u043b\u043e\u0441\u043e\u0444\u0441\u043a\u0438\u0435 \u0441\u0442\u0430\u0442\u044c\u0438, \u0433\u0430\u0434\u0436\u0435\u0442\u044b.'
+
+    keep_only_tags = [dict(name='div', attrs={'id': 'content'}),]
+
+
+    feeds = [(u'\u041a\u043e\u043c\u043f\u044c\u044e\u0442\u0435\u0440\u0440\u0430', 'http://feeds.feedburner.com/ct_news/'),]
+
+    remove_tags = [dict(name='div', attrs={'id': ['fin', 'idc-container', 'idc-noscript',]}),
+                   dict(name='ul', attrs={'class': "related_post"}),
+                   dict(name='p', attrs={'class': 'info'}),
+                   dict(name='a', attrs={'rel': 'tag', 'class': 'twitter-share-button', 'type': 'button_count'}),
+                   dict(name='h2', attrs={}),]
+
+    extra_css = 'body { text-align: justify; }'
+
+    def get_article_url(self, article):
+        return article.get('feedburner:origLink', article.get('guid'))
+
--- a/resources/recipes/le_monde.recipe
+++ b/resources/recipes/le_monde.recipe
@ -1,106 +1,89 @@
-#!/usr/bin/env  python
-
-__license__   = 'GPL v3'
-__copyright__ = '2008, Mathieu Godlewski <mathieu at godlewski.fr>'
-'''
-lemonde.fr
-'''
-
 import re
-from calibre.web.feeds.news import BasicNewsRecipe
-
+from calibre.web.feeds.recipes import BasicNewsRecipe

 class LeMonde(BasicNewsRecipe):
-    title          = 'LeMonde.fr'
-    __author__ = 'Mathieu Godlewski and Sujata Raman'
-    description = 'Global news in french'
-    oldest_article = 3
-    language = 'fr'
+    title                  = 'Le Monde'
+    __author__             = 'veezh'
+    description            = 'Actualités'
+    oldest_article         = 1
+    max_articles_per_feed  = 100
+    no_stylesheets         = True
+    #delay                  = 1
+    use_embedded_content   = False
+    encoding               = 'cp1252'
+    publisher              = 'lemonde.fr'
+    language               = 'fr'
+    conversion_options = {
+                             'comments'        : description
+                            ,'language'        : language
+                            ,'publisher'       : publisher
+                            ,'linearize_tables': True
+                         }

-    max_articles_per_feed = 30
-    no_stylesheets = True
-    remove_javascript = True
+    remove_empty_feeds = True

+    filterDuplicates = True

-   # cover_url='http://abonnes.lemonde.fr/titresdumonde/'+date.today().strftime("%y%m%d")+'/1.jpg'
+    def preprocess_html(self, soup):
+        for alink in soup.findAll('a'):
+            if alink.string is not None:
+               tstr = alink.string
+               alink.replaceWith(tstr)
+        return soup

-
-    extra_css = '''
-                    .dateline{color:#666666;font-family:verdana,sans-serif;font-size:x-small;}
-                    .author{font-family:verdana,sans-serif;font-size:x-small;color:#222222;}
-                    .articleImage{color:#666666;font-family:verdana,sans-serif;font-size:x-small;}
-                    .mainText{font-family:Georgia,serif;color:#222222;}
-                    .LM_articleText{font-family:Arial,Helvetica,sans-serif;}
-                    .LM_titleZone{font-family:Arial,Helvetica,sans-serif;}
-                    .mainContent{font-family:Georgia,serif;}
-                    .LM_content{font-family:Georgia,serif;}
-                    .LM_caption{font-family:Georgia,serif;font-size:-small;}
-                    .LM_imageSource{font-family:Arial,Helvetica,sans-serif;font-size:x-small;color:#666666;}
-                    h1{font-family:Arial,Helvetica,sans-serif;font-size:medium;color:#000000;}
-                    .post{font-family:Arial,Helvetica,sans-serif;}
-                    .mainTitle{font-family:Georgia,serif;}
-                    .content{font-family:Georgia,serif;}
-                    .entry{font-family:Georgia,serif;}
-                    h2{font-family:Arial,Helvetica,sans-serif;font-size:large;}
-                    small{font-family:Arial,Helvetica,sans-serif;  color:#ED1B23;}
-                '''
-
-    feeds =  [
-             ('A la Une', 'http://www.lemonde.fr/rss/une.xml'),
-             ('International', 'http://www.lemonde.fr/rss/sequence/0,2-3210,1-0,0.xml'),
-             ('Europe', 'http://www.lemonde.fr/rss/sequence/0,2-3214,1-0,0.xml'),
-             ('Societe', 'http://www.lemonde.fr/rss/sequence/0,2-3224,1-0,0.xml'),
-             ('Economie', 'http://www.lemonde.fr/rss/sequence/0,2-3234,1-0,0.xml'),
-             ('Medias', 'http://www.lemonde.fr/rss/sequence/0,2-3236,1-0,0.xml'),
-             ('Rendez-vous', 'http://www.lemonde.fr/rss/sequence/0,2-3238,1-0,0.xml'),
-             ('Sports', 'http://www.lemonde.fr/rss/sequence/0,2-3242,1-0,0.xml'),
-             ('Planete', 'http://www.lemonde.fr/rss/sequence/0,2-3244,1-0,0.xml'),
-             ('Culture', 'http://www.lemonde.fr/rss/sequence/0,2-3246,1-0,0.xml'),
-             ('Technologies', 'http://www.lemonde.fr/rss/sequence/0,2-651865,1-0,0.xml'),
-             ('Cinema', 'http://www.lemonde.fr/rss/sequence/0,2-3476,1-0,0.xml'),
-             ('Voyages', 'http://www.lemonde.fr/rss/sequence/0,2-3546,1-0,0.xml'),
-             ('Livres', 'http://www.lemonde.fr/rss/sequence/0,2-3260,1-0,0.xml'),
-             ('Examens', 'http://www.lemonde.fr/rss/sequence/0,2-3404,1-0,0.xml'),
-             ('Opinions', 'http://www.lemonde.fr/rss/sequence/0,2-3232,1-0,0.xml')
-             ]
-    keep_only_tags = [dict(name='div', attrs={'id':["mainTitle","mainContent","LM_content","content"]}),
-                      dict(name='div', attrs={'class':["post"]})
-                      ]
-
-    remove_tags    = [dict(name='img', attrs={'src':'http://medias.lemonde.fr/mmpub/img/lgo/lemondefr_pet.gif'}),
-                                    dict(name='div', attrs={'id':'xiti-logo-noscript'}),
-                                    dict(name='br', attrs={}),
-                                    dict(name='iframe', attrs={}),
-                     dict(name='table', attrs={'id':["toolBox"]}),
-                      dict(name='table', attrs={'class':["bottomToolBox"]}),
-                      dict(name='div', attrs={'class':["pageNavigation","LM_pagination","fenetreBoxesContainer","breakingNews","LM_toolsBottom","LM_comments","LM_tools","pave_meme_sujet_hidden","boxMemeSujet"]}),
-                      dict(name='div', attrs={'id':["miniUne","LM_sideBar"]}),
-    ]
-
-    preprocess_regexps = [ (re.compile(i[0], re.IGNORECASE|re.DOTALL), i[1]) for i in
-        [
-            (r'<html.*(<div class="post".*?>.*?</div>.*?<div class="entry">.*?</div>).*You can start editing here.*</html>', lambda match : '<html><body>'+match.group(1)+'</body></html>'),
-            (r'<p>&nbsp;</p>', lambda match : ''),
-            (r'<img src="http://medias\.lemonde\.fr/mmpub/img/let/(.)\.gif"[^>]*><div class=ar-txt>', lambda match : '<div class=ar-txt>'+match.group(1).upper()),
-            (r'<img src="http://medias\.lemonde\.fr/mmpub/img/let/q(.)\.gif"[^>]*><div class=ar-txt>', lambda match : '<div class=ar-txt>"'+match.group(1).upper()),
-            (r'(<div class=desc><b>.*</b></div>).*</body>', lambda match : match.group(1)),
+    preprocess_regexps = [
+        (re.compile(r' \''), lambda match: ' &lsquo;'),
+        (re.compile(r'\''), lambda match: '&rsquo;'),
+        (re.compile(r'"<'), lambda match: '&nbsp;&raquo;<'),
+        (re.compile(r'>"'), lambda match: '>&laquo;&nbsp;'),
+        (re.compile(r'&rsquo;"'), lambda match: '&rsquo;«&nbsp;'),
+        (re.compile(r' "'), lambda match: ' &laquo;&nbsp;'),
+        (re.compile(r'" '), lambda match: '&nbsp;&raquo; '),
+        (re.compile(r'\("'), lambda match: '(&laquo;&nbsp;'),
+        (re.compile(r'"\)'), lambda match: '&nbsp;&raquo;)'),
+        (re.compile(r'"\.'), lambda match: '&nbsp;&raquo;.'),
+        (re.compile(r'",'), lambda match: '&nbsp;&raquo;,'),
+        (re.compile(r'"\?'), lambda match: '&nbsp;&raquo;?'),
+        (re.compile(r'":'), lambda match: '&nbsp;&raquo;:'),
+        (re.compile(r'";'), lambda match: '&nbsp;&raquo;;'),
+        (re.compile(r'"\!'), lambda match: '&nbsp;&raquo;!'),
+        (re.compile(r' :'), lambda match: '&nbsp;:'),
+        (re.compile(r' ;'), lambda match: '&nbsp;;'),
+        (re.compile(r' \?'), lambda match: '&nbsp;?'),
+        (re.compile(r' \!'), lambda match: '&nbsp;!'),
+        (re.compile(r'\s»'), lambda match: '&nbsp;»'),
+        (re.compile(r'«\s'), lambda match: '«&nbsp;'),
+        (re.compile(r' %'), lambda match: '&nbsp;%'),
+        (re.compile(r'\.jpg&nbsp;&raquo; border='), lambda match: '.jpg'),
+        (re.compile(r'\.png&nbsp;&raquo; border='), lambda match: '.png'),
        ]
-    ]

-    article_match_regexps = [ (re.compile(i)) for i in
-        [
-            (r'http://www\.lemonde\.fr/\S+/article/.*'),
-            (r'http://www\.lemonde\.fr/\S+/portfolio/.*'),
-            (r'http://www\.lemonde\.fr/\S+/article_interactif/.*'),
-            (r'http://\S+\.blog\.lemonde\.fr/.*'),
-        ]
-    ]
+    keep_only_tags    = [
+                       dict(name='div', attrs={'class':['contenu']})
+                        ]

-   # def print_version(self, url):
-   #     return re.sub('http://www\.lemonde\.fr/.*_([0-9]+)_[0-9]+\.html.*','http://www.lemonde.fr/web/imprimer_element/0,40-0,50-\\1,0.html' ,url)
+    remove_tags_after = [dict(id='appel_temoignage')]

-    # Used to filter duplicated articles
-    articles_list = []
+    def get_article_url(self, article):
+        link = article.get('link')
+        if 'blog' not in link:
+             return link
+
+
+
+    feeds          = [
+                      ('A la une', 'http://www.lemonde.fr/rss/une.xml'),
+                      ('International', 'http://www.lemonde.fr/rss/tag/international.xml'),
+                      ('Europe', 'http://www.lemonde.fr/rss/tag/europe.xml'),
+                      (u'Société', 'http://www.lemonde.fr/rss/tag/societe.xml'),
+                      ('Economie', 'http://www.lemonde.fr/rss/tag/economie.xml'),
+                      (u'Médias', 'http://www.lemonde.fr/rss/tag/actualite-medias.xml'),
+                      (u'Planète', 'http://www.lemonde.fr/rss/tag/planete.xml'),
+                      ('Culture', 'http://www.lemonde.fr/rss/tag/culture.xml'),
+                      ('Technologies', 'http://www.lemonde.fr/rss/tag/technologies.xml'),
+                      ('Livres', 'http://www.lemonde.fr/rss/tag/livres.xml'),
+
+                    ]

    def get_cover_url(self):
        cover_url = None
@ -111,42 +94,3 @@ class LeMonde(BasicNewsRecipe):
           cover_url = link_item.img['src']

        return cover_url
-
-    def get_article_url(self, article):
-        url=article.get('link',  None)
-        url=url[0:url.find("#")]
-        if url in self.articles_list:
-            self.log_debug(_('Skipping duplicated article: %s')%url)
-            return False
-        if self.is_article_wanted(url):
-            self.articles_list.append(url)
-            if '/portfolio/' in url or '/video/' in url:
-              url = None
-        return url
-        self.log_debug(_('Skipping filtered article: %s')%url)
-        url = article.get('guid', None)
-
-
-        return False
-
-
-    def is_article_wanted(self, url):
-        if self.article_match_regexps:
-            for m in self.article_match_regexps:
-                if m.search(url):
-                    return True
-            return False
-        return False
-
-    def preprocess_html(self, soup):
-
-          for item in soup.findAll(style=True):
-              del item['style']
-
-          for item in soup.findAll(face=True):
-              del item['face']
-          for tag in soup.findAll(name=['ul','li']):
-                tag.name = 'div'
-
-          return soup
-
--- a/resources/recipes/toyokeizai.recipe
+++ b/resources/recipes/toyokeizai.recipe
@ -64,5 +64,5 @@ class Toyokeizai(BasicNewsRecipe):
            br.select_form(nr=0)
            br['kaiin_id']   = self.username
            br['password'] = self.password
-            res = br.submit()
+            br.submit()
        return br
--- a/resources/recipes/tr.recipe
+++ b/resources/recipes/tr.recipe
@ -0,0 +1,37 @@
+__license__   = 'GPL v3'
+__copyright__ = '2010, Anton Gillert <atx at binaryninja.de>'
+
+'''
+Fetch Technology Review.
+'''
+from time import strftime
+from calibre.web.feeds.news import BasicNewsRecipe
+
+
+class TechnologyReviewDe(BasicNewsRecipe):
+
+    title = 'Technology Review'
+    description = 'Technology news from Germany'
+    __author__ = 'Anton Gillert'
+    use_embedded_content   = False
+    language = 'de'
+    timefmt = ' [%d %b %Y]'
+    max_articles_per_feed = 40
+    no_stylesheets = True
+
+    feeds =  [ ('Technology Review', 'http://www.heise.de/tr/news-atom.xml') ]
+
+    def print_version(self, url):
+        return url + '?view=print'
+
+    remove_tags = [dict(id='navi_top'),
+		   dict(id='navi_bottom'),
+		   dict(name='div', attrs={'class':'navi_top_logo'}),
+		   dict(name='img', attrs={'src':'/tr/icons/tr_logo2006.gif'}),
+		   dict(name='p', attrs={'class':'size80'})]
+    remove_tags_after = [dict(name='p', attrs={'class':'size80'})]
+
+    def get_cover_url(self):
+        return 'http://www.heise-medien.de/presseinfo/bilder/tr/' + strftime("%y/tr%m%Y.jpg")
+
+
--- a/src/calibre/constants.py
+++ b/src/calibre/constants.py
@ -2,7 +2,7 @@ __license__   = 'GPL v3'
 __copyright__ = '2008, Kovid Goyal kovid@kovidgoyal.net'
 __docformat__ = 'restructuredtext en'
 __appname__   = 'calibre'
-__version__   = '0.7.32'
+__version__   = '0.7.33'
 __author__    = "Kovid Goyal <kovid@kovidgoyal.net>"

 import re
--- a/src/calibre/devices/cybook/driver.py
+++ b/src/calibre/devices/cybook/driver.py
@ -65,6 +65,7 @@ class ORIZON(CYBOOK):

    BCD         = [0x319]

+    VENDOR_NAME = ['BOOKEEN', 'LINUX']
    WINDOWS_MAIN_MEM = re.compile(r'(CYBOOK_ORIZON__-FD)|(FILE-STOR_GADGET)')
    WINDOWS_CARD_A_MEM = re.compile('(CYBOOK_ORIZON__-SD)|(FILE-STOR_GADGET)')

--- a/src/calibre/devices/usbms/books.py
+++ b/src/calibre/devices/usbms/books.py
@ -240,7 +240,7 @@ class CollectionsBookList(BookList):
                return 1
            if y is None:
                return -1
-            if isinstance(x, (unicode, str)):
+            if isinstance(x, basestring) and isinstance(y, basestring):
                c = strcmp(force_unicode(x), force_unicode(y))
            else:
                c = cmp(x, y)
--- a/src/calibre/ebooks/epub/periodical.py
+++ b/src/calibre/ebooks/epub/periodical.py
@ -6,9 +6,11 @@ __copyright__ = '2010, Kovid Goyal <kovid@kovidgoyal.net>'
 __docformat__ = 'restructuredtext en'

 from uuid import uuid4
+import time

 from calibre.constants import __appname__, __version__
 from calibre import strftime, prepare_string_for_xml as xml
+from calibre.utils.date import parse_date

 SONY_METADATA = u'''\
 <?xml version="1.0" encoding="utf-8"?>
@ -87,7 +89,8 @@ def sony_metadata(oeb):
        pass

    try:
-        date = unicode(m.date[0]).split('T')[0]
+        date = parse_date(unicode(m.date[0]),
+                as_utc=False).strftime('%Y-%m-%d')
    except:
        date = strftime('%Y-%m-%d')
    try:
@ -101,7 +104,7 @@ def sony_metadata(oeb):
            publisher=xml(publisher), issue_date=xml(date),
            language=xml(language))

-    updated = strftime('%Y-%m-%dT%H:%M:%SZ')
+    updated = strftime('%Y-%m-%dT%H:%M:%SZ', time.gmtime())

    def cal_id(x):
        for k, v in x.attrib.items():
--- a/src/calibre/gui2/actions/edit_metadata.py
+++ b/src/calibre/gui2/actions/edit_metadata.py
@ -54,6 +54,10 @@ class EditMetadataAction(InterfaceAction):
        mb.addAction(_('Merge into first selected book - keep others'),
                partial(self.merge_books, safe_merge=True),
                Qt.AltModifier+Qt.Key_M)
+        mb.addSeparator()
+        mb.addAction(_('Merge only formats into first selected book - delete others'),
+                partial(self.merge_books, merge_only_formats=True),
+                Qt.AltModifier+Qt.ShiftModifier+Qt.Key_M)
        self.merge_menu = mb
        self.action_merge.setMenu(mb)
        md.addSeparator()
@ -206,7 +210,7 @@ class EditMetadataAction(InterfaceAction):
            self.gui.library_view.select_rows(ids)

    # Merge books {{{
-    def merge_books(self, safe_merge=False):
+    def merge_books(self, safe_merge=False, merge_only_formats=False):
        '''
        Merge selected books in library.
        '''
@ -220,6 +224,12 @@ class EditMetadataAction(InterfaceAction):
            return error_dialog(self.gui, _('Cannot merge books'),
                        _('At least two books must be selected for merging'),
                        show=True)
+        if len(rows) > 5:
+            if not confirm('<p>'+_('You are about to merge more than 5 books.  '
+                                    'Are you <b>sure</b> you want to proceed?')
+                                +'</p>', 'merge_too_many_books', self.gui):
+                return
+
        dest_id, src_books, src_ids = self.books_to_merge(rows)
        title = self.gui.library_view.model().db.title(dest_id, index_is_id=True)
        if safe_merge:
@ -234,6 +244,22 @@ class EditMetadataAction(InterfaceAction):
                return
            self.add_formats(dest_id, src_books)
            self.merge_metadata(dest_id, src_ids)
+        elif merge_only_formats:
+            if not confirm('<p>'+_(
+                'Book formats from the selected books will be merged '
+                'into the <b>first selected book</b> (%s). '
+                'Metadata in the first selected book will not be changed.'
+                'Author, Title, ISBN and all other metadata will <i>not</i> be merged.<br><br>'
+                'After merger the second and subsequently '
+                'selected books, with any metadata they have will be <b>deleted</b>. <br><br>'
+                'All book formats of the first selected book will be kept '
+                'and any duplicate formats in the second and subsequently selected books '
+                'will be permanently <b>deleted</b> from your calibre library.<br><br>  '
+                'Are you <b>sure</b> you want to proceed?')%title
+            +'</p>', 'merge_only_formats', self.gui):
+                return
+            self.add_formats(dest_id, src_books)
+            self.delete_books_after_merge(src_ids)
        else:
            if not confirm('<p>'+_(
                'Book formats and metadata from the selected books will be merged '
@ -243,15 +269,10 @@ class EditMetadataAction(InterfaceAction):
                'subsequently selected books will be <b>deleted</b>. <br><br>'
                'All book formats of the first selected book will be kept '
                'and any duplicate formats in the second and subsequently selected books '
-                'will be permanently <b>deleted</b> from your computer.<br><br>  '
+                'will be permanently <b>deleted</b> from your calibre library.<br><br>  '
                'Are you <b>sure</b> you want to proceed?')%title
            +'</p>', 'merge_books', self.gui):
                return
-            if len(rows)>5:
-                if not confirm('<p>'+_('You are about to merge more than 5 books.  '
-                                        'Are you <b>sure</b> you want to proceed?')
-                                    +'</p>', 'merge_too_many_books', self.gui):
-                    return
            self.add_formats(dest_id, src_books)
            self.merge_metadata(dest_id, src_ids)
            self.delete_books_after_merge(src_ids)
--- a/src/calibre/gui2/dialogs/comments_dialog.py
+++ b/src/calibre/gui2/dialogs/comments_dialog.py
@ -3,7 +3,7 @@ __copyright__ = '2008, Kovid Goyal kovid@kovidgoyal.net'
 __docformat__ = 'restructuredtext en'
 __license__   = 'GPL v3'

-from PyQt4.Qt import Qt, QDialog
+from PyQt4.Qt import Qt, QDialog, QDialogButtonBox
 from calibre.gui2.dialogs.comments_dialog_ui import Ui_CommentsDialog

 class CommentsDialog(QDialog, Ui_CommentsDialog):
@ -20,3 +20,6 @@ class CommentsDialog(QDialog, Ui_CommentsDialog):
        if text is not None:
            self.textbox.setPlainText(text)
        self.textbox.setTabChangesFocus(True)
+        self.buttonBox.button(QDialogButtonBox.Ok).setText(_('&OK'))
+        self.buttonBox.button(QDialogButtonBox.Cancel).setText(_('&Cancel'))
+
--- a/src/calibre/gui2/dialogs/comments_dialog.ui
+++ b/src/calibre/gui2/dialogs/comments_dialog.ui
@ -19,15 +19,6 @@
  <property name="windowTitle">
   <string>Edit Comments</string>
  </property>
-  <widget class="QWidget" name="verticalLayoutWidget">
-   <property name="geometry">
-    <rect>
-     <x>10</x>
-     <y>10</y>
-     <width>311</width>
-     <height>211</height>
-    </rect>
-   </property>
   <layout class="QVBoxLayout" name="verticalLayout">
    <item>
     <widget class="QPlainTextEdit" name="textbox"/>
@ -43,7 +34,6 @@
     </widget>
    </item>
   </layout>
-  </widget>
 </widget>
 <resources/>
 <connections>
--- a/src/calibre/gui2/dialogs/confirm_delete.py
+++ b/src/calibre/gui2/dialogs/confirm_delete.py
@ -31,4 +31,5 @@ def confirm(msg, name, parent=None, pixmap='dialog_warning.png'):
    d = Dialog(msg, name, parent)
    d.label.setPixmap(QPixmap(I(pixmap)))
    d.setWindowIcon(QIcon(I(pixmap)))
+    d.resize(d.sizeHint())
    return d.exec_() == d.Accepted
--- a/src/calibre/gui2/dialogs/edit_authors_dialog.py
+++ b/src/calibre/gui2/dialogs/edit_authors_dialog.py
@ -8,13 +8,14 @@ from PyQt4.Qt import Qt, QDialog, QTableWidgetItem, QAbstractItemView
 from calibre.ebooks.metadata import author_to_author_sort
 from calibre.gui2 import error_dialog
 from calibre.gui2.dialogs.edit_authors_dialog_ui import Ui_EditAuthorsDialog
+from calibre.utils.icu import sort_key, strcmp

 class tableItem(QTableWidgetItem):
    def __ge__(self, other):
-        return unicode(self.text()).lower() >= unicode(other.text()).lower()
+        return sort_key(unicode(self.text())) >= sort_key(unicode(other.text()))

    def __lt__(self, other):
-        return unicode(self.text()).lower() < unicode(other.text()).lower()
+        return sort_key(unicode(self.text())) < sort_key(unicode(other.text()))

 class EditAuthorsDialog(QDialog, Ui_EditAuthorsDialog):

@ -36,6 +37,7 @@ class EditAuthorsDialog(QDialog, Ui_EditAuthorsDialog):
        self.authors = {}
        auts = db.get_authors_with_ids()
        self.table.setRowCount(len(auts))
+        setattr(self.table, '__lt__', lambda x, y: True if strcmp(x, y) < 0 else False)
        select_item = None
        for row, (id, author, sort) in enumerate(auts):
            author = author.replace('|', ',')
--- a/src/calibre/gui2/library/delegates.py
+++ b/src/calibre/gui2/library/delegates.py
@ -349,10 +349,19 @@ class CcTemplateDelegate(QStyledItemDelegate): # {{{
        QStyledItemDelegate.__init__(self, parent)

    def createEditor(self, parent, option, index):
-        return EnLineEdit(parent)
+        m = index.model()
+        text = m.custom_columns[m.column_map[index.column()]]['display']['composite_template']
+        editor = CommentsDialog(parent, text)
+        editor.setWindowTitle(_("Edit template"))
+        editor.textbox.setTabChangesFocus(False)
+        editor.textbox.setTabStopWidth(20)
+        d = editor.exec_()
+        if d:
+            m.setData(index, QVariant(editor.textbox.toPlainText()), Qt.EditRole)
+        return None

    def setModelData(self, editor, model, index):
-        val = unicode(editor.text())
+        val = unicode(editor.textbox.toPlainText())
        try:
            validation_formatter.validate(val)
        except Exception, err:
@ -364,7 +373,7 @@ class CcTemplateDelegate(QStyledItemDelegate): # {{{
    def setEditorData(self, editor, index):
        m = index.model()
        val = m.custom_columns[m.column_map[index.column()]]['display']['composite_template']
-        editor.setText(val)
+        editor.textbox.setPlainText(val)


 # }}}
--- a/src/calibre/gui2/library/models.py
+++ b/src/calibre/gui2/library/models.py
@ -303,6 +303,20 @@ class BooksModel(QAbstractTableModel): # {{{
        return self.rowCount(None)

    def get_book_display_info(self, idx):
+        def custom_keys_to_display():
+            ans = getattr(self, '_custom_fields_in_book_info', None)
+            if ans is None:
+                cfkeys = set(self.db.custom_field_keys())
+                yes_fields = set(tweaks['book_details_will_display'])
+                no_fields = set(tweaks['book_details_wont_display'])
+                if '*' in yes_fields:
+                    yes_fields = cfkeys
+                if '*' in no_fields:
+                    no_fields = cfkeys
+                ans = frozenset(yes_fields - no_fields)
+                setattr(self, '_custom_fields_in_book_info', ans)
+            return ans
+
        data = {}
        cdata = self.cover(idx)
        if cdata:
@ -334,7 +348,10 @@ class BooksModel(QAbstractTableModel): # {{{
                _('Book %s of %s.')%\
                    (sidx, prepare_string_for_xml(series))
        mi = self.db.get_metadata(idx)
+        cf_to_display = custom_keys_to_display()
        for key in mi.custom_field_keys():
+            if key not in cf_to_display:
+                continue
            name, val = mi.format_field(key)
            if val:
                data[name] = val
--- a/src/calibre/library/server/base.py
+++ b/src/calibre/library/server/base.py
@ -43,6 +43,9 @@ class DispatchController(object): # {{{
        kwargs['action'] = 'f_%d'%len(self.funcs)
        if route != '/':
            route = self.prefix + route
+        elif self.prefix:
+            self.dispatcher.connect(name+'prefix_extra', self.prefix, self,
+                    **kwargs)
        self.dispatcher.connect(name, route, self, **kwargs)
        self.funcs.append(expose(func))

--- a/src/calibre/library/server/browse.py
+++ b/src/calibre/library/server/browse.py
@ -359,7 +359,7 @@ class BrowseServer(object):
                icon = 'blank.png'
            cats.append((meta['name'], category, icon))

-        cats = [(u'<li><a title="{2} {0}" href="/browse/category/{1}">&nbsp;</a>'
+        cats = [(u'<li><a title="{2} {0}" href="{3}/browse/category/{1}">&nbsp;</a>'
                 u'<img src="{3}{src}" alt="{0}" />'
                 u'<span class="label">{0}</span>'
                 u'</li>')
--- a/src/calibre/manual/template_lang.rst
+++ b/src/calibre/manual/template_lang.rst
@ -101,8 +101,8 @@ Composite columns can use any template option, including formatting.

 You cannot change the data contained in a composite column. If you edit a composite column by double-clicking on any item, you will open the template for editing, not the underlying data. Editing the template on the GUI is a quick way of testing and changing composite columns.

-Using functions in templates
-----------------------------
+Using functions in templates - single-function mode
+---------------------------------------------------

 Suppose you want to display the value of a field in upper case, when that field is normally in title case. You can do this (and many more things) using the functions available for templates. For example, to display the title in upper case, use ``{title:uppercase()}``. To display it in title case, use ``{title:titlecase()}``.

@ -137,6 +137,82 @@ Note that you can use the prefix and suffix as well. If you want the number to a
    {#myint:0>3s:ifempty(0)|[|]}
    

+Using functions in templates - program mode
+-------------------------------------------
+
+The template language program mode differs from single-function mode in that it permits you to write template expressions that refer to other metadata fields, modify values, and do arithmetic. It is a reasonably complete programming language.
+
+Beginning with an example, assume that you want your template to show the series for a book if it has one, otherwise show the value of a custom field #genre. You cannot do this in the basic language because you cannot make reference to another metadata field within a template expression. In program mode, you can. The following expression works::
+
+    {#series:'ifempty($, field('#genre'))'}
+
+The example shows several things:
+
+    * program mode is used if the expression begins with ``:'`` and ends with ``'``. Anything else is assumed to be single-function.
+    * the variable ``$`` stands for the field the expression is operating upon, ``#series`` in this case.
+    * functions must be given all their arguments. There is no default value. This is true for the standard builtin functions, and is a significant difference from single-function mode.
+    * white space is ignored and can be used anywhere within the expression.
+    * constant strings are enclosed in matching quotes, either ``'`` or ``"``.
+    
+The language is similar to ``functional`` languages in that it is built almost entirely from functions. A statement is a function. An expression is a function. Constants and identifiers can be thought of as functions returning the value indicated by the constant or stored in the identifier.
+
+The syntax of the language is shown by the following grammar::
+
+    constant   ::= " string " | ' string ' | number
+    identifier ::= sequence of letters or ``_`` characters
+    function   ::= identifier ( statement [ , statement ]* )
+    expression ::= identifier | constant | function
+    statement  ::= expression [ ; expression ]*
+    program    ::= statement
+
+An ``expression`` always has a value, either the value of the constant, the value contained in the identifier, or the value returned by a function. The value of a ``statement`` is the value of the last expression in the sequence of statements. As such, the value of the program (statement)::
+
+    1; 2; 'foobar'; 3
+    
+is 3.
+
+Another example of a complex but rather silly program might help make things clearer::
+
+    {series_index:'
+        substr(
+            strcat($, '->', 
+                cmp(divide($, 2), 1, 
+                    assign(c, 1); substr('lt123', c, 0), 
+                    'eq', 'gt')),
+            0, 6)
+       '| prefix | suffix}
+    
+This program does the following: 
+
+    * specify that the field being looked at is series_index. This sets the value of the variable ``$``.
+    * calls the ``substr`` function, which takes 3 parameters ``(str, start, end)``. It returns a string formed by extracting the start through end characters from string, zero-based (the first character is character zero). In this case the string will be computed by the ``strcat`` function, the start is 0, and the end is 6. In this case it will return the first 6 characters of the string returned by ``strcat``, which must be evaluated before substr can return.
+    * calls the ``strcat`` (string concatenation) function. Strcat accepts 1 or more arguments, and returns a string formed by concatenating all the values. In this case there are three arguments. The first parameter is the value in ``$``, which here is the value of ``series_index``. The second paremeter is the constant string ``'->'``. The third parameter is the value returned by the ``cmp`` function, which must be fully evaluated before ``strcat`` can return.
+    * The ``cmp`` function takes 5 arguments ``(x, y, lt, eq, gt)``. It compares x and y and returns the third argument ``lt`` if x < y, the fourth argument ``eq`` if x == y, and the fifth argument ``gt`` if x > y. As with all functions, all of the parameters can be statements. In this case the first parameter (the value for ``x``) is the result of dividing the series_index by 2. The second parameter ``y`` is the constant ``1``. The third parameter ``lt`` is a statement (more later). The fourth parameter ``eq`` is the constant string ``'eq'``. The fifth parameter is the constant string ``'gt'``.
+    * The third parameter (the one for ``lt``) is a statement, or a sequence of expressions. Remember that a statement (a sequence of semicolon-separated expressions) is also an expression, returning the value of the last expression in the list. In this case, the program first assigns the value ``1`` to a local variable ``c``, then returns a substring made by extracting the c'th character to the end. Since c always contains the constant ``1``, the substring will return the second through end'th characters, or ``'t123'``.
+    * Once the statement providing the value to the third parameter is executed, ``cmp`` can return a value. At that point, ``strcat` can return a value, then ``substr`` can return a value. The program then terminates.
+
+For various values of series_index, the program returns:
+
+    * series_index == undefined, result = ``prefix ->t123 suffix``
+    * series_index == 0.5, result = ``prefix 0.50-> suffix``
+    * series_index == 1, result = ``prefix 1->t12 suffix``
+    * series_index == 2, result = ``prefix 2->eq suffix``
+    * series_index == 3, result = ``prefix 3->gt suffix``
+
+All the functions listed under single-function mode can be used in program mode, noting that unlike the functions described below you must supply a first parameter providing the value the function is to act upon. 
+
+The following functions are available in addition to those described in single-function mode. With the exception of the ``id`` parameter of assign, all parameters can be statements (sequences of expressions):
+
+    * ``add(x, y)``	-- returns x + y. Throws an exception if either x or y are not numbers.
+    * ``assign(id, val)`` -- assigns val to id, then returns val. id must be an identifier, not an expression
+    * ``cmp(x, y, lt, eq, gt)`` -- compares x and y after converting both to numbers. Returns ``lt`` if x < y. Returns ``eq`` if x == y. Otherwise returns ``gt``.
+    * ``divide(x, y)``	-- returns x / y. Throws an exception if either x or y are not numbers.
+    * ``field(name)`` -- returns the metadata field named by ``name``.
+    * ``multiply``	-- returns x * y. Throws an exception if either x or y are not numbers.
+    * ``strcat(a, b, ...)`` -- can take any number of arguments. Returns a string formed by concatenating all the arguments.
+    * ``strcmp(x, y, lt, eq, gt)`` -- does a case-insensitive comparison x and y as strings. Returns ``lt`` if x < y. Returns ``eq`` if x == y. Otherwise returns ``gt``.
+    * ``substr(str, start, end)`` -- returns the ``start``'th through the ``end``'th characters of ``str``. The first character in ``str`` is the zero'th character. If end is negative, then it indicates that many characters counting from the right. If end is zero, then it indicates the last character. For example, ``substr('12345', 1, 0)`` returns ``'2345'``, and ``substr('12345', 1, -1)`` returns ``'234'``.
+    * ``subtract``	-- returns x - y. Throws an exception if either x or y are not numbers.
    
 Special notes for save/send templates
 -------------------------------------
--- a/src/calibre/translations/af.po
+++ b/src/calibre/translations/af.po
--- a/src/calibre/translations/ar.po
+++ b/src/calibre/translations/ar.po
--- a/src/calibre/translations/ast.po
+++ b/src/calibre/translations/ast.po
--- a/src/calibre/translations/bg.po
+++ b/src/calibre/translations/bg.po
--- a/src/calibre/translations/bn.po
+++ b/src/calibre/translations/bn.po
--- a/src/calibre/translations/ca.po
+++ b/src/calibre/translations/ca.po
--- a/src/calibre/translations/calibre.pot
+++ b/src/calibre/translations/calibre.pot
--- a/src/calibre/translations/cs.po
+++ b/src/calibre/translations/cs.po
--- a/src/calibre/translations/da.po
+++ b/src/calibre/translations/da.po
--- a/src/calibre/translations/de.po
+++ b/src/calibre/translations/de.po
--- a/src/calibre/translations/el.po
+++ b/src/calibre/translations/el.po
--- a/src/calibre/translations/en_AU.po
+++ b/src/calibre/translations/en_AU.po
--- a/src/calibre/translations/en_CA.po
+++ b/src/calibre/translations/en_CA.po
--- a/src/calibre/translations/en_GB.po
+++ b/src/calibre/translations/en_GB.po
--- a/src/calibre/translations/eo.po
+++ b/src/calibre/translations/eo.po
--- a/src/calibre/translations/es.po
+++ b/src/calibre/translations/es.po
--- a/src/calibre/translations/eu.po
+++ b/src/calibre/translations/eu.po
--- a/src/calibre/translations/fa.po
+++ b/src/calibre/translations/fa.po
--- a/src/calibre/translations/fi.po
+++ b/src/calibre/translations/fi.po
--- a/src/calibre/translations/fo.po
+++ b/src/calibre/translations/fo.po
--- a/src/calibre/translations/fr.po
+++ b/src/calibre/translations/fr.po
--- a/src/calibre/translations/gl.po
+++ b/src/calibre/translations/gl.po
--- a/src/calibre/translations/he.po
+++ b/src/calibre/translations/he.po
--- a/src/calibre/translations/hi.po
+++ b/src/calibre/translations/hi.po
--- a/src/calibre/translations/hr.po
+++ b/src/calibre/translations/hr.po
--- a/src/calibre/translations/hu.po
+++ b/src/calibre/translations/hu.po
--- a/src/calibre/translations/id.po
+++ b/src/calibre/translations/id.po
--- a/src/calibre/translations/it.po
+++ b/src/calibre/translations/it.po
--- a/src/calibre/translations/ja.po
+++ b/src/calibre/translations/ja.po
--- a/src/calibre/translations/ko.po
+++ b/src/calibre/translations/ko.po
--- a/src/calibre/translations/lt.po
+++ b/src/calibre/translations/lt.po
--- a/src/calibre/translations/lv.po
+++ b/src/calibre/translations/lv.po
--- a/src/calibre/translations/ml.po
+++ b/src/calibre/translations/ml.po
--- a/src/calibre/translations/mr.po
+++ b/src/calibre/translations/mr.po
--- a/src/calibre/translations/ms.po
+++ b/src/calibre/translations/ms.po
--- a/src/calibre/translations/nb.po
+++ b/src/calibre/translations/nb.po
--- a/src/calibre/translations/nds.po
+++ b/src/calibre/translations/nds.po
--- a/src/calibre/translations/nl.po
+++ b/src/calibre/translations/nl.po
--- a/src/calibre/translations/oc.po
+++ b/src/calibre/translations/oc.po
--- a/src/calibre/translations/pl.po
+++ b/src/calibre/translations/pl.po
--- a/src/calibre/translations/pt.po
+++ b/src/calibre/translations/pt.po
--- a/src/calibre/translations/pt_BR.po
+++ b/src/calibre/translations/pt_BR.po
--- a/src/calibre/translations/ro.po
+++ b/src/calibre/translations/ro.po
--- a/src/calibre/translations/ru.po
+++ b/src/calibre/translations/ru.po
--- a/src/calibre/translations/sc.po
+++ b/src/calibre/translations/sc.po
--- a/src/calibre/translations/sk.po
+++ b/src/calibre/translations/sk.po
--- a/src/calibre/translations/sl.po
+++ b/src/calibre/translations/sl.po
--- a/src/calibre/translations/sq.po
+++ b/src/calibre/translations/sq.po
--- a/src/calibre/translations/sr.po
+++ b/src/calibre/translations/sr.po
--- a/src/calibre/translations/sv.po
+++ b/src/calibre/translations/sv.po
--- a/src/calibre/translations/ta.po
+++ b/src/calibre/translations/ta.po
--- a/src/calibre/translations/te.po
+++ b/src/calibre/translations/te.po
--- a/src/calibre/translations/th.po
+++ b/src/calibre/translations/th.po
--- a/src/calibre/translations/tr.po
+++ b/src/calibre/translations/tr.po
--- a/src/calibre/translations/uk.po
+++ b/src/calibre/translations/uk.po
--- a/src/calibre/translations/ur.po
+++ b/src/calibre/translations/ur.po
--- a/src/calibre/translations/vi.po
+++ b/src/calibre/translations/vi.po
--- a/src/calibre/translations/yi.po
+++ b/src/calibre/translations/yi.po
--- a/src/calibre/translations/zh_CN.po
+++ b/src/calibre/translations/zh_CN.po
--- a/src/calibre/translations/zh_HK.po
+++ b/src/calibre/translations/zh_HK.po
--- a/src/calibre/translations/zh_TW.po
+++ b/src/calibre/translations/zh_TW.po
--- a/src/calibre/utils/formatter.py
+++ b/src/calibre/utils/formatter.py
@ -5,10 +5,183 @@ Created on 23 Sep 2010
 '''

 import re, string, traceback
+from functools import partial

 from calibre.constants import DEBUG
 from calibre.utils.titlecase import titlecase
-from calibre.utils.icu import capitalize
+from calibre.utils.icu import capitalize, strcmp
+
+class _Parser(object):
+    LEX_OP  = 1
+    LEX_ID  = 2
+    LEX_STR = 3
+    LEX_NUM = 4
+    LEX_EOF = 5
+
+    def _strcmp(self, x, y, lt, eq, gt):
+        v = strcmp(x, y)
+        if v < 0:
+            return lt
+        if v == 0:
+            return eq
+        return gt
+
+    def _cmp(self, x, y, lt, eq, gt):
+        x = float(x if x else 0)
+        y = float(y if y else 0)
+        if x < y:
+            return lt
+        if x == y:
+            return eq
+        return gt
+
+    def _assign(self, target, value):
+        setattr(self, target, value)
+        return value
+
+    def _concat(self, *args):
+        i = 0
+        res = ''
+        for i in range(0, len(args)):
+            res += args[i]
+        return res
+
+    def _math(self, x, y, op=None):
+        ops = {
+               '+': lambda x, y: x + y,
+               '-': lambda x, y: x - y,
+               '*': lambda x, y: x * y,
+               '/': lambda x, y: x / y,
+            }
+        x = float(x if x else 0)
+        y = float(y if y else 0)
+        return ops[op](x, y)
+
+    local_functions = {
+            'add'      : (2, partial(_math, op='+')),
+            'assign'   : (2, _assign),
+            'cmp'      : (5, _cmp),
+            'divide'   : (2, partial(_math, op='/')),
+            'field'    : (1, lambda s, x: s.parent.get_value(x, [], s.parent.kwargs)),
+            'multiply' : (2, partial(_math, op='*')),
+            'strcat'   : (-1, _concat),
+            'strcmp'   : (5, _strcmp),
+            'substr'   : (3, lambda s, x, y, z: x[int(y): len(x) if int(z) == 0 else int(z)]),
+            'subtract' : (2, partial(_math, op='-')),
+    }
+
+    def __init__(self, val, prog, parent):
+        self.lex_pos = 0
+        self.prog = prog[0]
+        if prog[1] != '':
+            self.error(_('failed to scan program. Invalid input {0}').format(prog[1]))
+        self.parent = parent
+        setattr(self, '$', val)
+
+    def error(self, message):
+        m = 'Formatter: ' + message + _(' near ')
+        if self.lex_pos > 0:
+            m = '{0} {1}'.format(m, self.prog[self.lex_pos-1][1])
+        m = '{0} {1}'.format(m, self.prog[self.lex_pos][1])
+        if self.lex_pos < len(self.prog):
+            m = '{0} {1}'.format(m, self.prog[self.lex_pos+1][1])
+        raise ValueError(m)
+
+    def token(self):
+        if self.lex_pos >= len(self.prog):
+            return None
+        token = self.prog[self.lex_pos]
+        self.lex_pos += 1
+        return token[1]
+
+    def lookahead(self):
+        if self.lex_pos >= len(self.prog):
+            return (self.LEX_EOF, '')
+        return self.prog[self.lex_pos]
+
+    def consume(self):
+        self.lex_pos += 1
+
+    def token_op_is_a(self, val):
+        token = self.lookahead()
+        return token[0] == self.LEX_OP and token[1] == val
+
+    def token_is_id(self):
+        token = self.lookahead()
+        return token[0] == self.LEX_ID
+
+    def token_is_constant(self):
+        token = self.lookahead()
+        return token[0] == self.LEX_STR or token[0] == self.LEX_NUM
+
+    def token_is_eof(self):
+        token = self.lookahead()
+        return token[0] == self.LEX_EOF
+
+    def program(self):
+        val = self.statement()
+        if not self.token_is_eof():
+            self.error(_('syntax error - program ends before EOF'))
+        return val
+
+    def statement(self):
+        while True:
+            val = self.expr()
+            if self.token_is_eof():
+                return val
+            if not self.token_op_is_a(';'):
+                return val
+            self.consume()
+
+    def expr(self):
+        if self.token_is_id():
+            # We have an identifier. Determine if it is a function
+            id = self.token()
+            if not self.token_op_is_a('('):
+                return getattr(self, id, _('unknown id ') + id)
+            # We have a function.
+            # Check if it is a known one. We do this here so error reporting is
+            # better, as it can identify the tokens near the problem.
+            if id not in self.parent.functions and id not in self.local_functions:
+                self.error(_('unknown function {0}').format(id))
+            # Eat the paren
+            self.consume()
+            args = list()
+            while not self.token_op_is_a(')'):
+                if id == 'assign' and len(args) == 0:
+                    # Must handle the lvalue semantics of the assign function.
+                    # The first argument is the name of the destination, not
+                    # the value.
+                    if not self.token_is_id():
+                        self.error('assign requires the first parameter be an id')
+                    args.append(self.token())
+                else:
+                    # evaluate the argument (recursive call)
+                    args.append(self.statement())
+                if not self.token_op_is_a(','):
+                    break
+                self.consume()
+            if self.token() != ')':
+                self.error(_('missing closing parenthesis'))
+
+            # Evaluate the function
+            if id in self.local_functions:
+                f = self.local_functions[id]
+                if f[0] != -1 and len(args) != f[0]:
+                    self.error('incorrect number of arguments for function {}'.format(id))
+                return f[1](self, *args)
+            else:
+                f = self.parent.functions[id]
+                if f[0] != -1 and len(args) != f[0]+1:
+                    self.error('incorrect number of arguments for function {}'.format(id))
+                return f[1](self.parent, *args)
+            # can't get here
+        elif self.token_is_constant():
+            # String or number
+            return self.token()
+        else:
+            self.error(_('expression is not function or constant'))
+

 class TemplateFormatter(string.Formatter):
    '''
@ -25,6 +198,7 @@ class TemplateFormatter(string.Formatter):
        string.Formatter.__init__(self)
        self.book = None
        self.kwargs = None
+        self.program_cache = {}

    def _lookup(self, val, *args):
        if len(args) == 2: # here for backwards compatibility
@ -135,7 +309,7 @@ class TemplateFormatter(string.Formatter):
                traceback.print_exc()
            return fmt, '', ''

-    format_string_re = re.compile(r'^(.*)\|(.*)\|(.*)$')
+    format_string_re = re.compile(r'^(.*)\|([^\|]*)\|(.*)$', re.DOTALL)
    compress_spaces = re.compile(r'\s+')
    backslash_comma_to_comma = re.compile(r'\\,')

@ -145,6 +319,29 @@ class TemplateFormatter(string.Formatter):
                (r'.*?\)', lambda x,t: t[:-1]),
        ])

+    ################## 'Functional' template language ######################
+
+    lex_scanner = re.Scanner([
+                (r'[(),=;]',            lambda x,t: (1, t)),
+                (r'-?[\d\.]+',          lambda x,t: (3, t)),
+                (r'\$',                 lambda x,t: (2, t)),
+                (r'\w+',                lambda x,t: (2, t)),
+                (r'".*?((?<!\\)")',     lambda x,t: (3, t[1:-1])),
+                (r'\'.*?((?<!\\)\')',   lambda x,t: (3, t[1:-1])),
+                (r'\s',                 None)
+        ])
+
+    def _eval_program(self, val, prog):
+        # keep a cache of the lex'ed program under the theory that re-lexing
+        # is much more expensive than the cache lookup. This is certainly true
+        # for more than a few tokens, but it isn't clear for simple programs.
+        lprog = self.program_cache.get(prog, None)
+        if not lprog:
+            lprog = self.lex_scanner.scan(prog)
+            self.program_cache[prog] = lprog
+        parser = _Parser(val, lprog, self)
+        return parser.program()
+
    ################## Override parent classes methods #####################

    def get_value(self, key, args, kwargs):
@ -155,33 +352,49 @@ class TemplateFormatter(string.Formatter):
        fmt, prefix, suffix = self._explode_format_string(fmt)

        # Handle functions
-        p = fmt.find('(')
-        dispfmt = fmt
-        if p >= 0 and fmt[-1] == ')':
+        # First see if we have a functional-style expression
+        if fmt.startswith('\''):
+            p = 0
+        else:
+            p = fmt.find(':\'')
+            if p >= 0:
+                p += 1
+        if p >= 0 and fmt[-1] == '\'':
+            val = self._eval_program(val, fmt[p+1:-1])
            colon = fmt[0:p].find(':')
            if colon < 0:
                dispfmt = ''
-                colon = 0
            else:
                dispfmt = fmt[0:colon]
-                colon += 1
-            if fmt[colon:p] in self.functions:
-                field = fmt[colon:p]
-                func = self.functions[field]
-                if func[0] == 1:
-                    # only one arg expected. Don't bother to scan. Avoids need
-                    # for escaping characters
-                    args = [fmt[p+1:-1]]
+        else:
+            # check for old-style function references
+            p = fmt.find('(')
+            dispfmt = fmt
+            if p >= 0 and fmt[-1] == ')':
+                colon = fmt[0:p].find(':')
+                if colon < 0:
+                    dispfmt = ''
+                    colon = 0
                else:
-                    args = self.arg_parser.scan(fmt[p+1:])[0]
-                    args = [self.backslash_comma_to_comma.sub(',', a) for a in args]
-                if (func[0] == 0 and (len(args) != 1 or args[0])) or \
-                        (func[0] > 0 and func[0] != len(args)):
-                    raise ValueError('Incorrect number of arguments for function '+ fmt[0:p])
-                if func[0] == 0:
-                    val = func[1](self, val).strip()
-                else:
-                    val = func[1](self, val, *args).strip()
+                    dispfmt = fmt[0:colon]
+                    colon += 1
+                if fmt[colon:p] in self.functions:
+                    field = fmt[colon:p]
+                    func = self.functions[field]
+                    if func[0] == 1:
+                        # only one arg expected. Don't bother to scan. Avoids need
+                        # for escaping characters
+                        args = [fmt[p+1:-1]]
+                    else:
+                        args = self.arg_parser.scan(fmt[p+1:])[0]
+                        args = [self.backslash_comma_to_comma.sub(',', a) for a in args]
+                    if (func[0] == 0 and (len(args) != 1 or args[0])) or \
+                            (func[0] > 0 and func[0] != len(args)):
+                        raise ValueError('Incorrect number of arguments for function '+ fmt[0:p])
+                    if func[0] == 0:
+                        val = func[1](self, val).strip()
+                    else:
+                        val = func[1](self, val, *args).strip()
        if val:
            val = self._do_format(val, dispfmt)
        if not val:
@ -200,10 +413,10 @@ class TemplateFormatter(string.Formatter):
        self.composite_values = {}
        try:
            ans = self.vformat(fmt, [], kwargs).strip()
-        except:
+        except Exception, e:
            if DEBUG:
                traceback.print_exc()
-            ans = error_value
+            ans = error_value + ' ' + e.message
        return ans

 class ValidateFormat(TemplateFormatter):
--- a/src/calibre/utils/icu.c
+++ b/src/calibre/utils/icu.c
@ -329,7 +329,7 @@ icu_lower(PyObject *self, PyObject *args) {
    PyMem_Free(input);

    return ret;
-}
+} // }}}

 // title {{{
 static PyObject *
@ -374,9 +374,22 @@ icu_title(PyObject *self, PyObject *args) {
    PyMem_Free(input);

    return ret;
+} // }}}
+
+
+// set_default_encoding {{{
+static PyObject *
+icu_set_default_encoding(PyObject *self, PyObject *args) {
+    char *encoding;
+    if (!PyArg_ParseTuple(args, "s:setdefaultencoding", &encoding))
+        return NULL;
+    if (PyUnicode_SetDefaultEncoding(encoding))
+        return NULL;
+    Py_INCREF(Py_None);
+    return Py_None;
+
 }
-
-
+// }}}

 static PyMethodDef icu_methods[] = {
    {"upper", icu_upper, METH_VARARGS,
@ -391,6 +404,10 @@ static PyMethodDef icu_methods[] = {
        "title(locale, unicode object) -> Title cased unicode object using locale rules."
    },

+    {"set_default_encoding", icu_set_default_encoding, METH_VARARGS,
+        "set_default_encoding(encoding) -> Set the default encoding for the python unicode implementation."
+    },
+
    {NULL}  /* Sentinel */
 };

--- a/src/calibre/utils/icu.py
+++ b/src/calibre/utils/icu.py
@ -6,6 +6,7 @@ __copyright__ = '2010, Kovid Goyal <kovid@kovidgoyal.net>'
 __docformat__ = 'restructuredtext en'

 # Setup code {{{
+import sys
 from functools import partial

 from calibre.constants import plugins
@ -77,11 +78,20 @@ def py_strcmp(a, b):
 def icu_case_sensitive_strcmp(collator, a, b):
    return collator.strcmp(a, b)

+def icu_capitalize(s):
+    s = lower(s)
+    return s.replace(s[0], upper(s[0]), 1)

 load_icu()
 load_collator()
 _icu_not_ok = _icu is None or _collator is None

+try:
+    if sys.getdefaultencoding().lower() == 'ascii':
+        _icu.set_default_encoding('utf-8')
+except:
+    pass
+
 # }}}

 ################# The string functions ########################################
@ -104,10 +114,6 @@ lower = (lambda s: s.lower()) if _icu_not_ok else \
 title_case = (lambda s: s.title()) if _icu_not_ok else \
    partial(_icu.title, get_locale())

-def icu_capitalize(s):
-    s = lower(s)
-    return s.replace(s[0], upper(s[0]))
-
 capitalize = (lambda s: s.capitalize()) if _icu_not_ok else \
    (lambda s: icu_capitalize(s))

@ -226,12 +232,16 @@ pêché'''
    test_strcmp(german + french)

    print '\nTesting case transforms in current locale'
-    for x in ('a', 'Alice\'s code'):
+    from calibre.utils.titlecase import titlecase
+    for x in ('a', 'Alice\'s code', 'macdonald\'s machine', '02 the wars'):
        print 'Upper:     ', x, '->', 'py:', x.upper().encode('utf-8'), 'icu:', upper(x).encode('utf-8')
        print 'Lower:     ', x, '->', 'py:', x.lower().encode('utf-8'), 'icu:', lower(x).encode('utf-8')
-        print 'Title:     ', x, '->', 'py:', x.title().encode('utf-8'), 'icu:', title_case(x).encode('utf-8')
+        print 'Title:     ', x, '->', 'py:', x.title().encode('utf-8'), 'icu:', title_case(x).encode('utf-8'), 'titlecase:', titlecase(x).encode('utf-8')
        print 'Capitalize:', x, '->', 'py:', x.capitalize().encode('utf-8'), 'icu:', capitalize(x).encode('utf-8')
        print

 # }}}

+if __name__ == '__main__':
+    test()
+
--- a/src/calibre/utils/osx_symlinks.py
+++ b/src/calibre/utils/osx_symlinks.py
@ -75,7 +75,10 @@ def do_it(scripts, links):
            if ph:
                del os.environ['PYTHONHOME']
            pipe = auth.executeWithPrivileges(name)
-            sys.stdout.write(pipe.read())
+            try:
+                sys.stdout.write(pipe.read())
+            except:
+                sys.stdout.write(pipe.read()) # Probably EINTR
            pipe.close()
        except:
            r1, r2 = None, traceback.format_exc()
--- a/src/calibre/utils/titlecase.py
+++ b/src/calibre/utils/titlecase.py
@ -23,11 +23,12 @@ UC_ELSEWHERE = re.compile(r'[%s]*?[a-zA-Z]+[A-Z]+?' % PUNCT)
 CAPFIRST = re.compile(r"^[%s]*?([A-Za-z])" % PUNCT)
 SMALL_FIRST = re.compile(r'^([%s]*)(%s)\b' % (PUNCT, SMALL), re.I)
 SMALL_LAST = re.compile(r'\b(%s)[%s]?$' % (SMALL, PUNCT), re.I)
+SMALL_AFTER_NUM = re.compile(r'(\d+\s+)(a|an|the)\b', re.I)
 SUBPHRASE = re.compile(r'([:.;?!][ ])(%s)' % SMALL)
 APOS_SECOND = re.compile(r"^[dol]{1}['‘]{1}[a-z]+$", re.I)
 ALL_CAPS = re.compile(r'^[A-Z\s%s]+$' % PUNCT)
 UC_INITIALS = re.compile(r"^(?:[A-Z]{1}\.{1}|[A-Z]{1}\.{1}[A-Z]{1})+$")
-MAC_MC = re.compile(r"^([Mm]a?c)(\w+)")
+MAC_MC = re.compile(r"^([Mm]a?c)(.+)")

 def titlecase(text):

@ -44,7 +45,7 @@ def titlecase(text):

    all_caps = ALL_CAPS.match(text)

-    words = re.split('\s', text)
+    words = re.split('\s+', text)
    line = []
    for word in words:
        if all_caps:
@ -55,8 +56,8 @@ def titlecase(text):
                word = icu_lower(word)

        if APOS_SECOND.match(word):
-            word = word.replace(word[0], icu_upper(word[0]))
-            word = word.replace(word[2], icu_upper(word[2]))
+            word = word.replace(word[0], icu_upper(word[0]), 1)
+            word = word[:2] + icu_upper(word[2]) + word[3:]
            line.append(word)
            continue
        if INLINE_PERIOD.search(word) or UC_ELSEWHERE.match(word):
@ -67,7 +68,7 @@ def titlecase(text):
            continue

        match = MAC_MC.match(word)
-        if match:
+        if match and not match.group(2).startswith('hin'):
            line.append("%s%s" % (capitalize(match.group(1)),
                                  capitalize(match.group(2))))
            continue
@ -85,6 +86,10 @@ def titlecase(text):
        capitalize(m.group(2))
    ), result)

+    result = SMALL_AFTER_NUM.sub(lambda m: '%s%s' % (m.group(1),
+        capitalize(m.group(2))
+    ), result)
+
    result = SMALL_LAST.sub(lambda m: capitalize(m.group(0)), result)

    result = SUBPHRASE.sub(lambda m: '%s%s' % (