import re from calibre.web.feeds.news import BasicNewsRecipe class AdvancedUserRecipe1289939440(BasicNewsRecipe): __author__ = 'FunThomas' title = u'Root.cz' description = u'Zprávičky a články z Root.cz' publisher = u'Internet Info, s.r.o' oldest_article = 2 # max stari clanku ve dnech max_articles_per_feed = 50 # max pocet clanku na feed feeds = [ (u'Články', u'http://www.root.cz/rss/clanky/'), (u'Zprávičky', u'http://www.root.cz/rss/zpravicky/') ] publication_type = u'magazine' language = u'cs' no_stylesheets = True remove_javascript = True cover_url = u'http://i.iinfo.cz/urs/logo-root-bila-oranzova-cerna-111089527143118.gif' remove_attributes = ['width', 'height', 'href'] # ,'href' keep_only_tags = [ dict(name='h1'), dict(name='a', attrs={'class': 'author'}), dict(name='p', attrs={'class': 'intro'}), dict(name='div', attrs={'class': 'urs'}) ] preprocess_regexps = [ (re.compile(u'
[^<]*]*>',
re.DOTALL), lambda match: '
'), (re.compile(u'