From d02bc170756e2f1ec9cd3643f960c5e62aec8651 Mon Sep 17 00:00:00 2001 From: Kovid Goyal Date: Sun, 7 Oct 2012 23:12:28 +0530 Subject: [PATCH] Update Countryfile --- recipes/countryfile.recipe | 13 ++++++++++--- 1 file changed, 10 insertions(+), 3 deletions(-) diff --git a/recipes/countryfile.recipe b/recipes/countryfile.recipe index 71977048c7..4f2e8cd95f 100644 --- a/recipes/countryfile.recipe +++ b/recipes/countryfile.recipe @@ -1,11 +1,13 @@ from calibre import browser from calibre.web.feeds.news import BasicNewsRecipe +import re + class AdvancedUserRecipe1325006965(BasicNewsRecipe): title = u'Countryfile.com' #cover_url = 'http://www.countryfile.com/sites/default/files/imagecache/160px_wide/cover/2_1.jpg' __author__ = 'Dave Asbury' description = 'The official website of Countryfile Magazine' - # last updated 9/9//12 + # last updated 7/10/12 language = 'en_GB' oldest_article = 30 max_articles_per_feed = 25 @@ -13,12 +15,14 @@ class AdvancedUserRecipe1325006965(BasicNewsRecipe): no_stylesheets = True auto_cleanup = True #articles_are_obfuscated = True + ignore_duplicate_articles = {'title'} def get_cover_url(self): soup = self.index_to_soup('http://www.countryfile.com/') - cov = soup.find(attrs={'class' : 'imagecache imagecache-160px_wide imagecache-linked imagecache-160px_wide_linked'}) + + cov = soup.find(attrs={'width' : '160', 'class' : re.compile('imagecache imagecache-160px_wide')}) print '******** ',cov,' ***' cov2 = str(cov) - cov2=cov2[140:223] + cov2=cov2[10:101] print '******** ',cov2,' ***' #cov2='http://www.countryfile.com/sites/default/files/imagecache/160px_wide/cover/1b_0.jpg' # try to get cover - if can't get known cover @@ -40,3 +44,6 @@ class AdvancedUserRecipe1325006965(BasicNewsRecipe): (u'Country News', u'http://www.countryfile.com/rss/news'), (u'Countryside', u'http://www.countryfile.com/rss/countryside'), ] + + +