Dainik Bhaskar by unkn0wn

This commit is contained in:
Kovid Goyal 2022-04-12 17:23:02 +05:30
parent 3f86674de9
commit 7ae6af4542
No known key found for this signature in database
GPG Key ID: 06BC317B515ACE7C

View File

@@ -0,0 +1,48 @@
#!/usr/bin/env python
from calibre.web.feeds.news import BasicNewsRecipe, classes
class DainikBhaskar(BasicNewsRecipe):
    """Calibre news recipe for the Hindi-language daily Dainik Bhaskar.

    Articles are collected from the per-category RSS feeds listed in
    ``feeds``; the cover image is looked up on the e-paper front page.
    """

    title = 'दैनिक भास्कर'
    description = (
        'Dainik Bhaskar is an Indian Hindi-language daily newspaper owned by the Dainik Bhaskar Group.'
        ' It is ranked 4th in the world by circulation and is the largest newspaper in India by circulation.')
    language = 'hi'
    __author__ = 'unkn0wn'
    oldest_article = 1  # days
    max_articles_per_feed = 50
    encoding = 'utf-8'
    use_embedded_content = False
    masthead_url = 'https://tse4.mm.bing.net/th?id=OIP.t6kK1-rSpzNbSerwzD5qbQHaDY'
    no_stylesheets = True
    # Drop inline presentation attributes from the downloaded HTML.
    remove_attributes = ['style', 'height', 'width']
    ignore_duplicate_articles = {'url'}

    def get_cover_url(self):
        """Return the cover URL, preferring the image on the e-paper front page.

        Loads https://epaper.bhaskar.com/, finds the element with class
        ``scaleDiv`` and takes the ``src`` of the first ``<img>`` inside it,
        with ``_ss.jpg`` replaced by ``_l.jpg``. When the element, the image
        or its ``src`` is missing, ``self.cover_url`` is left untouched and
        the base-class result is returned unchanged.
        """
        soup = self.index_to_soup('https://epaper.bhaskar.com/')
        container = soup.find(attrs={'class': 'scaleDiv'})
        # Guard every step: a layout change on the e-paper page should fall
        # back to the default cover rather than raise TypeError/KeyError.
        image = container.find('img') if container is not None else None
        src = image.get('src') if image is not None else None
        if src:
            # NOTE(review): "_ss" -> "_l" presumably selects a larger
            # rendition of the same page image; confirm against the site.
            self.cover_url = src.replace("_ss.jpg", "_l.jpg")
        return super().get_cover_url()

    # NOTE(review): the hex-like class names below look machine-generated by
    # the site's front end and may change without notice.
    keep_only_tags = [
        classes('f5afa1d3'),
    ]
    remove_tags = [
        classes('_3c197847 _66d97d7f e0d43c76 bhaskar-widget-container-class _28e65306 _8adadf19 _07c65a39'),
        dict(name='svg'),
    ]

    # (section title, RSS URL) pairs.
    feeds = [
        ('देश ', 'https://www.bhaskar.com/rss-v1--category-1061.xml'),
        ('ओपिनियन', 'https://www.bhaskar.com/rss-v1--category-1944.xml'),
        ('विदेश ', 'https://www.bhaskar.com/rss-v1--category-1125.xml'),
        ('ओरिजिनल', 'https://www.bhaskar.com/rss-v1--category-4587.xml'),
        ('बिजनेस', 'https://www.bhaskar.com/rss-v1--category-1051.xml'),
        ('स्पोर्ट्स ', 'https://www.bhaskar.com/rss-v1--category-1053.xml'),
        ('मैगजीन ', 'https://www.bhaskar.com/rss-v1--category-1057.xml'),
        ('करिअर ', 'https://www.bhaskar.com/rss-v1--category-11945.xml'),
        # https://www.bhaskar.com/rss
    ]