#!/usr/bin/env python __license__ = 'GPL v3' __copyright__ = '23 June 2013, desUBIKado' __author__ = 'desUBIKado' __description__ = 'Contemporary Culture Magazine' __version__ = 'v0.03' __date__ = '28, July 2016' ''' http://www.jotdown.es/ ''' import re from calibre.web.feeds.news import BasicNewsRecipe class jotdown(BasicNewsRecipe): author = 'desUBIKado' description = 'Revista digital con magníficos y extensos artículos' title = u'Jot Down - Contemporary Culture Magazine' publisher = 'Wabi Sabi Investments, S.C.' category = 'Opinion, culture, science, movies, TV shows, music, blogs' language = 'es' timefmt = '[%a, %d %b, %Y]' oldest_article = 7 delay = 1 max_articles_per_feed = 20 masthead_url = 'http://www.jotdown.es/wp-content/uploads/2011/04/logoJotDown.png' use_embedded_content = False remove_javascript = True no_stylesheets = True feeds = [ (u'Portada', u'http://www.jotdown.es/feed/') ] keep_only_tags = [dict(name='div', attrs={'id':['content']}), dict(name='div', attrs={'id':['comments']}), ] remove_tags = [dict(name='a', attrs={'href':['http://alternativaseconomicas.coop/']}), dict(name='div', attrs={'class':['reply','after-meta','tags_list','wp_rp_wrap wp_rp_plain','after-meta','share_box']}), dict(name='div', attrs={'align':['center']}), dict(name='span', attrs={'class':['fbreplace','says']}), dict(name='img', attrs={'class':['avatar avatar-60 photo']}), dict(name='li', attrs={'class':['post pingback']}), dict(name='div', attrs={'id':'respond'}) ] remove_tags_after = dict(name='div' , attrs={'id':'respond'}) preprocess_regexps = [ # To change the small size of the text (re.compile(r'font-size: small', re.DOTALL|re.IGNORECASE), lambda match: 'font-size: medium'), # To present the image of the embedded video (re.compile(r'', re.DOTALL|re.IGNORECASE), lambda match: '
'), (re.compile(r' —', re.DOTALL|re.IGNORECASE), lambda match: ''), # To remove the link of the title (re.compile(r'