#!/usr/bin/env python
__license__ = 'GPL v3'
__copyright__ = '2008, Kovid Goyal kovid@kovidgoyal.net'
__docformat__ = 'restructuredtext en'

'''
globeandmail.com
'''

from calibre.web.feeds.news import BasicNewsRecipe

# Text types accepted for an HTML ``class`` attribute value.  ``type(u'')`` is
# ``unicode`` on Python 2 and ``str`` on Python 3, so this tuple is valid on
# both without referencing the ``unicode`` name (undefined on Python 3).
_STRING_TYPES = (str, type(u''))


def _has_css_class(class_name):
    '''
    Build a matcher for a tag's ``class`` attribute.

    :param class_name: the single CSS class token to look for.
    :return: a callable taking the attribute value and returning True only
             when the value is text and contains ``class_name`` as one of
             its space-separated tokens.
    '''
    def matcher(value):
        # Non-text values (e.g. a missing attribute) never match.
        return isinstance(value, _STRING_TYPES) and class_name in value.split(' ')
    return matcher


class GlobeAndMail(BasicNewsRecipe):
    '''
    Recipe that fetches Globe and Mail articles from the site's RSS feeds,
    keeping only the ``<article>`` element of each page and skipping video
    items.
    '''

    title = u'Globe and Mail'
    language = 'en_CA'

    __author__ = 'Kovid Goyal'
    oldest_article = 2
    max_articles_per_feed = 10
    no_stylesheets = True
    # Built from adjacent literals so the resulting string is unchanged.
    extra_css = (
        ' h3 {font-size: 22pt; font-weight:bold; margin:0px; padding:0px 0px 8pt 0px;}'
        ' h4 {margin-top: 0px;}'
        ' #byline { font-family: monospace; font-weight:bold; }'
        ' #placeline {font-weight:bold;}'
        ' #credit {margin-top:0px;}'
        ' .tag {font-size: 22pt;}'
    )
    description = 'Canada\'s national newspaper'
    keep_only_tags = [dict(name='article')]
    # Page furniture stripped from inside the kept <article> element.
    remove_tags = [
        dict(name='aside'),
        dict(name='footer'),
        dict(name='div', attrs={'class': _has_css_class('articlecommentcountholder')}),
        dict(name='ul', attrs={'class': _has_css_class('articletoolbar')}),
    ]
    feeds = [
        (u'Latest headlines', u'http://www.theglobeandmail.com/?service=rss'),
        (u'Top stories', u'http://www.theglobeandmail.com/?service=rss&feed=topstories'),
        (u'National', u'http://www.theglobeandmail.com/news/national/?service=rss'),
        (u'Politics', u'http://www.theglobeandmail.com/news/politics/?service=rss'),
        (u'World', u'http://www.theglobeandmail.com/news/world/?service=rss'),
        (u'Business', u'http://www.theglobeandmail.com/report-on-business/?service=rss'),
        (u'Opinions', u'http://www.theglobeandmail.com/news/opinions/?service=rss'),
        (u'Columnists', u'http://www.theglobeandmail.com/news/opinions/columnists/?service=rss'),
        (u'Globe Investor', u'http://www.theglobeandmail.com/globe-investor/?service=rss'),
        (u'Sports', u'http://www.theglobeandmail.com/sports/?service=rss'),
        (u'Technology', u'http://www.theglobeandmail.com/news/technology/?service=rss'),
        (u'Arts', u'http://www.theglobeandmail.com/news/arts/?service=rss'),
        (u'Life', u'http://www.theglobeandmail.com/life/?service=rss'),
        (u'Blogs', u'http://www.theglobeandmail.com/blogs/?service=rss'),
        (u'Real Estate', u'http://www.theglobeandmail.com/real-estate/?service=rss'),
        (u'Auto', u'http://www.theglobeandmail.com/auto/?service=rss'),
    ]

    def get_article_url(self, article):
        '''
        Return the URL for ``article``, or None when it should be skipped.

        The URL comes from ``BasicNewsRecipe.get_article_url``.  None is
        returned when that URL contains ``/video/`` or when the base
        implementation yields no URL at all.
        '''
        url = BasicNewsRecipe.get_article_url(self, article)
        # Guard against an empty result before the substring test, which
        # would raise TypeError on None.
        if url and '/video/' not in url:
            return url
        return None