from calibre.web.feeds.news import BasicNewsRecipe
import re


class f1ultra(BasicNewsRecipe):
    """Calibre news recipe for the Polish motorsport site f1ultra.pl.

    Articles are taken from the site's RSS feed. Each page is reduced to
    its main content container, and layout-related attributes are removed
    both from the raw HTML (``preprocess_regexps``) and from the parsed
    document (``remove_attributes``).
    """

    # --- Recipe metadata -------------------------------------------------
    title = u'Formuła 1 - F1 ultra'
    __license__ = 'GPL v3'
    __author__ = 'MrStefan , Artur Stachecki '
    language = 'pl'
    description = u'Formuła 1, Robert Kubica, F3, GP2 oraz inne serie wyścigowe.'
    masthead_url = 'http://www.f1ultra.pl/templates/f1ultra/images/logo.gif'

    # --- Download limits and general clean-up ----------------------------
    remove_empty_feeds = True
    oldest_article = 1
    max_articles_per_feed = 100
    remove_javascript = True
    no_stylesheets = True

    # --- Tag filtering ---------------------------------------------------
    # Only the <div id="main"> container is kept from each page.
    keep_only_tags = [(dict(name='div', attrs={'id': 'main'}))]

    # Everything after the element carrying this exact inline style is cut.
    remove_tags_after = [
        dict(attrs={'style': 'margin-top:5px;margin-bottom:5px;display: inline;'}),
    ]

    # Page furniture: headings/buttons, the video player, creation date,
    # PDF/print/e-mail links, POST forms and horizontal rules of size 2.
    remove_tags = [
        dict(attrs={'class': ['buttonheading', 'avPlayerContainer', 'createdate']}),
        dict(attrs={'title': ['PDF', 'Drukuj', 'Email']}),
        dict(name='form', attrs={'method': 'post'}),
        dict(name='hr', attrs={'size': '2'}),
    ]

    # --- Raw-HTML preprocessing ------------------------------------------
    # Each entry is (compiled pattern, replacement callable); every match
    # is replaced with the empty string.
    preprocess_regexps = [
        (re.compile(r'align="left"'), lambda match: ''),
        (re.compile(r'align="right"'), lambda match: ''),
        # Remove the complete width="..." attribute. The previous pattern
        # (width=\"*\") only consumed `width="` and left the value plus the
        # closing quote behind as stray text inside the tag.
        (re.compile(r'width="[^"]*"'), lambda match: ''),
        # NOTE(review): the original pattern was truncated to r'\' (an
        # unterminated literal). It is reconstructed here as a stripper of
        # opening <table ...> tags -- confirm against the upstream recipe.
        (re.compile(r'<table .*?>'), lambda match: ''),
    ]

    # --- Presentation ----------------------------------------------------
    extra_css = '''.contentheading { font-size: 1.4em; font-weight: bold; }
    img { display: block; clear: both;}
    '''

    remove_attributes = [
        'width', 'height', 'position', 'float',
        'padding-left', 'padding-right', 'padding', 'text-align',
    ]

    # --- Feeds -----------------------------------------------------------
    feeds = [
        (u'F1 Ultra', u'http://www.f1ultra.pl/index.php?option=com_rd_rss&id=1&Itemid=245'),
    ]