Update Creative Blog

2025-08-30 23:00:21 -04:00 · 2014-04-13 06:53:07 +05:30 · 2014-04-13 06:53:07 +05:30 · d425bcceca
commit d425bcceca
parent 7ac78e7ab1
1 changed files with 37 additions and 43 deletions
--- a/recipes/dot_net.recipe
+++ b/recipes/dot_net.recipe
@ -1,47 +1,41 @@
 __license__   = 'GPL v3'
 __copyright__ = '2014, Bonni Salles - post in forum for help'
 '''
 Creative Blog (formerly .net magazine)
 '''
 from calibre.web.feeds.news import BasicNewsRecipe
-class dotnetMagazine (BasicNewsRecipe):
+class creativeblog(BasicNewsRecipe):
-    __author__ = u'Bonni Salles'
+    title          = u'Creative Blog'
-    __version__ = '1.1'
+    __author__     = 'Bonni Salles'
    __license__   = 'GPL v3'
    __copyright__ = u'2013, Bonni Salles'
    title                 = '.net magazine'
    oldest_article = 7
-    no_stylesheets        = True
+    publication_type = 'blog'
-    encoding              = 'utf8'
+    max_articles_per_feed = 100
-    use_embedded_content  = False
+    description    = 'Web Design and Tutorials from Creative Blog (part of .Net Magazine and others)'
-    auto_cleanup = True
+    publisher      = 'Creative Blog'
-    # recursion = 1
+    category       = 'internet, web design'
    language       = 'en'
    encoding      = 'utf-8'
    ignore_duplicate_articles = {'title', 'url'}
    remove_empty_feeds    = True
-    extra_css             = ' body{font-family: Arial,Helvetica,sans-serif } img{margin-bottom: 0.4em} '
+    auto_cleanup = True
-    cover_url = u'http://media.netmagazine.futurecdn.net/sites/all/themes/netmag/logo.png'
+# presently this is set to download the whole group of blogs for the feed.  If you want
-
+# to limit it to the specific sections of the blog that you want to download.
    #remove_tags_after = dict(name='footer', id=lambda x:not x)
    #remove_tags_before = dict(name='header', id=lambda x:not x)
    #remove_tags = [
         #dict(name='div', attrs={'class': 'item-list'}),
         #dict(name='h4', attrs={'class': 'std-hdr'}),
         #dict(name='div', attrs={'class': 'item-list share-links'}),  # removes share links
         #dict(name=['script', 'noscript']),
         #dict(name='div', attrs={'id': 'comments-form'}),  # comment these out if you want the comments to show
         #dict(name='div', attrs={'id': re.compile('advertorial_block_($|| )')}),
         #dict(name='div', attrs={'id': 'right-col'}),
         #dict(name='div', attrs={'id': 'comments'}),  # comment these out if you want the comments to show
         #dict(name='div', attrs={'class': 'item-list related-content'}),
         #]
    feeds          = [
-               (u'net', u'http://feeds.feedburner.com/creativebloq/')
+                      (u'Creative Blog', u'http://www.creativebloq.com/feed/'),
 #                      (u'3D', u'http://www.creativebloq.com/feed/3d'),
 #                      (u'Adobe', u'http://www.creativebloq.com/feed/adobe'),
 #                      (u'Animation', u'http://www.creativebloq.com/feed/animation'),
 #                      (u'Apple', u'http://www.creativebloq.com/feed/apple'),
 #                      (u'Branding', u'http://www.creativebloq.com/feed/branding'),
 #                      (u'Graphic Design', u'http://www.creativebloq.com/feed/graphic-design'),
 #                      (u'Illustration', u'http://www.creativebloq.com/feed/illustration'),
 #                      (u'News', u'http://www.creativebloq.com/feed/news'),
 #                      (u'Opinion', u'http://www.creativebloq.com/feed/opinion'),
 #                      (u'Tutorials', u'http://www.creativebloq.com/feed/tutorial'),
 #                      (u'Typography', u'http://www.creativebloq.com/feed/typography'),
 #                      (u'Video', u'http://www.creativebloq.com/feed/video'),
 #                      (u'web design', u'http://www.creativebloq.com/feed/web-design'),
                     ]
    def skip_ad_pages(self, soup):
        text = soup.find(text='click here to continue to article')
        if text:
            a = text.parent
            url = a.get('href')
            if url:
                return self.index_to_soup(url, raw=True)