diff --git a/recipes/dainik_bhaskar.recipe b/recipes/dainik_bhaskar.recipe new file mode 100644 index 0000000000..d9389c234b --- /dev/null +++ b/recipes/dainik_bhaskar.recipe @@ -0,0 +1,48 @@ +#!/usr/bin/env python + +from calibre.web.feeds.news import BasicNewsRecipe, classes + + +class DainikBhaskar(BasicNewsRecipe): + title = 'दैनिक भास्कर' + description = ( + 'Dainik Bhaskar is an Indian Hindi-language daily newspaper owned by the Dainik Bhaskar Group.' + ' It is ranked 4th in the world by circulation and is the largest newspaper in India by circulation.') + language = 'hi' + __author__ = 'unkn0wn' + oldest_article = 1 # days + max_articles_per_feed = 50 + encoding = 'utf-8' + use_embedded_content = False + masthead_url = 'https://tse4.mm.bing.net/th?id=OIP.t6kK1-rSpzNbSerwzD5qbQHaDY' + no_stylesheets = True + remove_attributes = ['style', 'height', 'width'] + ignore_duplicate_articles = {'url'} + + def get_cover_url(self): + soup = self.index_to_soup('https://epaper.bhaskar.com/') + tag = soup.find(attrs={'class': 'scaleDiv'}) + if tag: + self.cover_url = tag.find('img')['src'].replace("_ss.jpg", "_l.jpg") + return super().get_cover_url() + + keep_only_tags = [ + classes('f5afa1d3'), + ] + + remove_tags = [ + classes('_3c197847 _66d97d7f e0d43c76 bhaskar-widget-container-class _28e65306 _8adadf19 _07c65a39'), + dict(name='svg'), + ] + + feeds = [ + ('देश ', 'https://www.bhaskar.com/rss-v1--category-1061.xml'), + ('ओपिनियन', 'https://www.bhaskar.com/rss-v1--category-1944.xml'), + ('विदेश ', 'https://www.bhaskar.com/rss-v1--category-1125.xml'), + ('ओरिजिनल', 'https://www.bhaskar.com/rss-v1--category-4587.xml'), + ('बिजनेस', 'https://www.bhaskar.com/rss-v1--category-1051.xml'), + ('स्पोर्ट्स ', 'https://www.bhaskar.com/rss-v1--category-1053.xml'), + ('मैगजीन ', 'https://www.bhaskar.com/rss-v1--category-1057.xml'), + ('करिअर ', 'https://www.bhaskar.com/rss-v1--category-11945.xml'), + # https://www.bhaskar.com/rss + ]