diff --git a/recipes/inquirer_net.recipe b/recipes/inquirer_net.recipe index 3a3d5b9e89..30f2519f8b 100644 --- a/recipes/inquirer_net.recipe +++ b/recipes/inquirer_net.recipe @@ -7,56 +7,33 @@ www.inquirer.net ''' from calibre.web.feeds.recipes import BasicNewsRecipe -from calibre.ebooks.BeautifulSoup import Tag class InquirerNet(BasicNewsRecipe): title = 'Inquirer.net' - __author__ = 'Darko Miletic' + __author__ = 'Krittika Goyal' description = 'News from Philipines' oldest_article = 2 max_articles_per_feed = 100 no_stylesheets = True use_embedded_content = False - encoding = 'cp1252' + encoding = 'utf8' publisher = 'inquirer.net' category = 'news, politics, philipines' lang = 'en' language = 'en' - extra_css = ' .fontheadline{font-size: x-large} .fontsubheadline{font-size: large} .fontkick{font-size: medium}' + use_embedded_content = False - html2lrf_options = [ - '--comment', description - , '--category', category - , '--publisher', publisher - , '--ignore-tables' - ] - - html2epub_options = 'publisher="' + publisher + '"\ncomments="' + description + '"\ntags="' + category + '"\nlinearize_tables=True' - - remove_tags = [dict(name=['object','link','script','iframe','form'])] + no_stylesheets = True + auto_cleanup = True feeds = [ - (u'Breaking news', u'http://services.inquirer.net/rss/breakingnews.xml' ) - ,(u'Top stories' , u'http://services.inquirer.net/rss/topstories.xml' ) - ,(u'Sports' , u'http://services.inquirer.net/rss/brk_breakingnews.xml' ) - ,(u'InfoTech' , u'http://services.inquirer.net/rss/infotech_tech.xml' ) - ,(u'InfoTech' , u'http://services.inquirer.net/rss/infotech_tech.xml' ) - ,(u'Business' , u'http://services.inquirer.net/rss/inq7money_breaking_news.xml' ) - ,(u'Editorial' , u'http://services.inquirer.net/rss/opinion_editorial.xml' ) - ,(u'Global Nation', u'http://services.inquirer.net/rss/globalnation_breakingnews.xml') + (u'Inquirer', u'http://www.inquirer.net/fullfeed') ] - def preprocess_html(self, soup): - mlang = Tag(soup,'meta',[("http-equiv","Content-Language"),("content",self.lang)]) - mcharset = Tag(soup,'meta',[("http-equiv","Content-Type"),("content","text/html; charset=utf-8")]) - soup.head.insert(0,mlang) - soup.head.insert(1,mcharset) - for item in soup.findAll(style=True): - del item['style'] - return soup + def get_browser(self): + br = BasicNewsRecipe.get_browser(self) + br.set_handle_gzip(True) + return br + - def print_version(self, url): - rest, sep, art = url.rpartition('/view/') - art_id, sp, rrest = art.partition('/') - return 'http://services.inquirer.net/print/print.php?article_id=' + art_id