diff --git a/recipes/neu_osnabrucker_zeitung.recipe b/recipes/neu_osnabrucker_zeitung.recipe new file mode 100644 index 0000000000..dc6a36237e --- /dev/null +++ b/recipes/neu_osnabrucker_zeitung.recipe @@ -0,0 +1,49 @@ +# vim:fileencoding=utf-8 + +from calibre.web.feeds.news import BasicNewsRecipe + +class AdvancedUserRecipe1344926684(BasicNewsRecipe): + title = u'Neue Osnabrücker Zeitung' + __author__ = 'Krittika Goyal' + oldest_article = 7 + max_articles_per_feed = 100 + # auto_cleanup = True + no_stylesheets = True + use_embedded_content = False + language = 'de' + remove_javascript = True + + keep_only_tags = [ + dict(name='div', attrs={'class':'article'}), + dict(name='span', attrs={'id':'articletext'}) + ] + remove_tags = [ + dict(name='div', attrs={'id':'retresco-title'}), + dict(name='div', attrs={'class':'retresco-item s1 relative'}), + dict(name='a', attrs={'class':'medium2 largeSpaceTop icon'}), + dict(name='div', attrs={'class':'articleFunctions inlineTeaserRight'}), + dict(name='div', attrs={'class':'imageContainer '}), + dict(name='div', attrs={'class':'imageContainer centerContainer'}), + dict(name='div', attrs={'class':'grid singleCol articleTeaser'}), + dict(name='h3', attrs={'class':'teaserRow'}), + dict(name='div', attrs={'class':'related-comments'}), + dict(name='a', attrs={'class':' icon'}), + dict(name='a', attrs={'class':'right small'}), + dict(name='span', attrs={'class':'small block spaceBottom rectangleAd'}), + dict(name='div', attrs={'class':'furtherGalleries largeSpaceTop'}) + ] + + feeds = [(u'Lokales', u'http://www.noz.de/rss/Lokales'), +(u'Vermischtes', u'http://www.noz.de/rss/Vermischtes'), +(u'Politik', u'http://www.noz.de/rss/Politik'), +(u'Wirtschaft', u'http://www.noz.de/rss/Wirtschaft'), +(u'Kultur', u'http://www.noz.de/rss/Kultur'), +(u'Medien', u'http://www.noz.de/rss/Medien'), +(u'Wissenschaft', u'http://www.noz.de/rss/wissenschaft'), +(u'Sport', u'http://www.noz.de/rss/Sport'), +(u'Computer', u'http://www.noz.de/rss/Computer'), +(u'Musik', u'http://www.noz.de/rss/Musik'), +(u'Szene', u'http://www.noz.de/rss/Szene'), +(u'Niedersachsen', u'http://www.noz.de/rss/Niedersachsen'), +(u'Kino', u'http://www.noz.de/rss/Kino')] +