diff --git a/src/calibre/ebooks/metadata/pdf.py b/src/calibre/ebooks/metadata/pdf.py index e99025057f..3a5ecd1f0c 100644 --- a/src/calibre/ebooks/metadata/pdf.py +++ b/src/calibre/ebooks/metadata/pdf.py @@ -1,5 +1,4 @@ from __future__ import with_statement - __license__ = 'GPL v3' __copyright__ = '2008, Kovid Goyal ' '''Read meta information from PDF files''' diff --git a/src/calibre/gui2/images/news/diepresse.png b/src/calibre/gui2/images/news/diepresse.png new file mode 100644 index 0000000000..41bbdcbf1b Binary files /dev/null and b/src/calibre/gui2/images/news/diepresse.png differ diff --git a/src/calibre/web/feeds/recipes/recipe_diepresse.py b/src/calibre/web/feeds/recipes/recipe_diepresse.py index c806575356..362a08fb3a 100644 --- a/src/calibre/web/feeds/recipes/recipe_diepresse.py +++ b/src/calibre/web/feeds/recipes/recipe_diepresse.py @@ -1,18 +1,42 @@ -import re +# -*- coding: utf-8 -*- + +__license__ = 'GPL v3' +__copyright__ = '2009, Gerhard Aigner ' + +''' http://www.diepresse.at - Austrian Newspaper ''' + +import re from calibre.web.feeds.news import BasicNewsRecipe class DiePresseRecipe(BasicNewsRecipe): - title = u'diePresse' + title = u'diePresse' + __author__ = 'Gerhard Aigner' + description = u'DiePresse.com - Die Online-Ausgabe der Österreichischen Tageszeitung Die Presse.' + publisher ='DiePresse.com' + category = 'news, politics, nachrichten, Austria' + use_embedded_content = False + remove_empty_feeds = True + lang = 'de-AT' + no_stylesheets = True + encoding = 'ISO-8859-1' + language = _('German') + recursions = 0 oldest_article = 1 max_articles_per_feed = 100 - recursions = 0 - language = _('German') - __author__ = 'Gerhard Aigner' + + html2lrf_options = [ + '--comment' , description + , '--category' , category + , '--publisher', publisher + ] + html2epub_options = 'publisher="' + publisher + '"\ncomments="' + description + '"\ntags="' + category + '"' + preprocess_regexps = [ (re.compile(r'Textversion', re.DOTALL), lambda match: ''), ] + remove_tags = [dict(name='hr'), dict(name='br'), dict(name='small'), @@ -21,6 +45,7 @@ class DiePresseRecipe(BasicNewsRecipe): dict(name='h1', attrs={'class':'titel'}), dict(name='a', attrs={'class':'print'}), dict(name='div', attrs={'class':'hline'})] + feeds = [(u'Politik', u'http://diepresse.com/rss/Politik'), (u'Wirtschaft', u'http://diepresse.com/rss/Wirtschaft'), (u'Europa', u'http://diepresse.com/rss/EU'), @@ -29,7 +54,7 @@ class DiePresseRecipe(BasicNewsRecipe): (u'Kultur', u'http://diepresse.com/rss/Kultur'), (u'Leben', u'http://diepresse.com/rss/Leben'), (u'Tech', u'http://diepresse.com/rss/Tech'), - (u'Science', u'http://diepresse.com/rss/Science'), + (u'Wissenschaft', u'http://diepresse.com/rss/Science'), (u'Bildung', u'http://diepresse.com/rss/Bildung'), (u'Gesundheit', u'http://diepresse.com/rss/Gesundheit'), (u'Recht', u'http://diepresse.com/rss/Recht'), @@ -38,3 +63,10 @@ class DiePresseRecipe(BasicNewsRecipe): def print_version(self, url): return url.replace('home','text/home') + + def preprocess_html(self, soup): + soup.html['xml:lang'] = self.lang + soup.html['lang'] = self.lang + mtag = '' + soup.head.insert(0,mtag) + return soup \ No newline at end of file