# Patch summary (commentary only; text before the first "diff --git" header
# is not part of any hunk).
#
# 1. src/calibre/web/feeds/recipes/__init__.py
#    recipe_modules is built as 'recipe_' + r for each name r in a tuple.
#    This hunk replaces the last entry 'hindu' with
#    "'hindu', 'cincinnati_enquirer'," so that the list also contains
#    'recipe_cincinnati_enquirer' -- the module name of the file added below.
#
# 2. src/calibre/web/feeds/recipes/recipe_cincinnati_enquirer.py (new file)
#    Defines AdvancedUserRecipe1234144423, a BasicNewsRecipe subclass that is
#    almost entirely declarative:
#      - feeds: a single (title, URL) pair pointing at the rss.cincinnati.com
#        feed.
#      - keep_only_tags: one matcher, <div class="padding">.
#      - remove_tags: matchers for object/link/table/embed elements,
#        <div id="pluckcomments"> and <div class="articleflex-container">.
#      - encoding 'cp1252', oldest_article 7, max_articles_per_feed 100,
#        plus the no_stylesheets / remove_javascript / use_embedded_content
#        flags and a small extra_css rule for <p>.
#      - preprocess_html(soup): deletes the 'style' attribute from every
#        element returned by soup.findAll(style=True), then the 'face'
#        attribute from every element returned by soup.findAll(face=True),
#        and returns the same soup object.
#    How BasicNewsRecipe consumes these attributes is not visible in this
#    patch -- see the base class for their exact semantics.
#
# NOTE(review): leading indentation inside the hunks below is reconstructed
# using conventional spacing; confirm it against the target tree (or apply
# with whitespace-tolerant options) before relying on the context lines.
# NOTE(review): the __copyright__ string ends in a trailing space, which
# suggests an address was stripped upstream -- verify against the original
# commit.
diff --git a/src/calibre/web/feeds/recipes/__init__.py b/src/calibre/web/feeds/recipes/__init__.py
index 3723483fb7..76bb8112ec 100644
--- a/src/calibre/web/feeds/recipes/__init__.py
+++ b/src/calibre/web/feeds/recipes/__init__.py
@@ -29,7 +29,7 @@ recipe_modules = ['recipe_' + r for r in (
            'jb_online', 'estadao', 'o_globo', 'vijesti', 'elmundo', 'the_oz',
            'honoluluadvertiser', 'starbulletin', 'exiled', 'indy_star', 'dna',
            'pobjeda', 'chicago_breaking_news', 'glasgow_herald', 'linuxdevices',
-           'hindu'
+           'hindu', 'cincinnati_enquirer',
            )]
 
 import re, imp, inspect, time, os
diff --git a/src/calibre/web/feeds/recipes/recipe_cincinnati_enquirer.py b/src/calibre/web/feeds/recipes/recipe_cincinnati_enquirer.py
new file mode 100644
index 0000000000..8e62c5f1db
--- /dev/null
+++ b/src/calibre/web/feeds/recipes/recipe_cincinnati_enquirer.py
@@ -0,0 +1,34 @@
+#!/usr/bin/env python
+__license__ = 'GPL v3'
+__copyright__ = '2009 Kovid Goyal '
+
+from calibre.web.feeds.news import BasicNewsRecipe
+
+class AdvancedUserRecipe1234144423(BasicNewsRecipe):
+    title = u'Cincinnati Enquirer'
+    oldest_article = 7
+    language = _('English')
+    __author__ = 'Joseph Kitzmiller'
+    max_articles_per_feed = 100
+    no_stylesheets = True
+    use_embedded_content = False
+    remove_javascript = True
+    encoding = 'cp1252'
+    extra_css = ' p {font-size: medium; font-weight: normal;} '
+
+    keep_only_tags = [dict(name='div', attrs={'class':'padding'})]
+
+    remove_tags = [
+        dict(name=['object','link','table','embed'])
+        ,dict(name='div',attrs={'id':'pluckcomments'})
+        ,dict(name='div',attrs={'class':'articleflex-container'})
+    ]
+
+    feeds = [(u'Cincinnati Enquirer', u'http://rss.cincinnati.com/apps/pbcs.dll/section?category=rssenq01&mime=xml')]
+
+    def preprocess_html(self, soup):
+        for item in soup.findAll(style=True):
+            del item['style']
+        for item in soup.findAll(face=True):
+            del item['face']
+        return soup