More Russian and Ukrainian news sources by bugmen00t

This commit is contained in:
Kovid Goyal 2022-08-02 19:32:00 +05:30
parent b3828dcec7
commit 5f67cc961e
No known key found for this signature in database
GPG Key ID: 06BC317B515ACE7C
21 changed files with 545 additions and 1 deletions

Binary file not shown.

After

Width:  |  Height:  |  Size: 587 B

Binary file not shown.

After

Width:  |  Height:  |  Size: 587 B

BIN
recipes/icons/osvitaua.png Normal file

Binary file not shown.

After

Width:  |  Height:  |  Size: 1.4 KiB

Binary file not shown.

After

Width:  |  Height:  |  Size: 1.4 KiB

Binary file not shown.

Before

Width:  |  Height:  |  Size: 1.4 KiB

After

Width:  |  Height:  |  Size: 1.3 KiB

Binary file not shown.

Before

Width:  |  Height:  |  Size: 1.4 KiB

After

Width:  |  Height:  |  Size: 1.3 KiB

Binary file not shown.

Before

Width:  |  Height:  |  Size: 1.4 KiB

After

Width:  |  Height:  |  Size: 1.3 KiB

Binary file not shown.

Before

Width:  |  Height:  |  Size: 1.4 KiB

After

Width:  |  Height:  |  Size: 1.3 KiB

Binary file not shown.

Before

Width:  |  Height:  |  Size: 1.4 KiB

After

Width:  |  Height:  |  Size: 1.3 KiB

Binary file not shown.

Before

Width:  |  Height:  |  Size: 1.4 KiB

After

Width:  |  Height:  |  Size: 1.3 KiB

Binary file not shown.

Before

Width:  |  Height:  |  Size: 1.4 KiB

After

Width:  |  Height:  |  Size: 1.3 KiB

Binary file not shown.

Before

Width:  |  Height:  |  Size: 1.4 KiB

After

Width:  |  Height:  |  Size: 1.3 KiB

BIN
recipes/icons/unn_ru.png Normal file

Binary file not shown.

After

Width:  |  Height:  |  Size: 1.2 KiB

BIN
recipes/icons/unn_ua.png Normal file

Binary file not shown.

After

Width:  |  Height:  |  Size: 1.2 KiB

View File

@ -11,7 +11,7 @@ class InterfaxUARU(BasicNewsRecipe):
publisher = '\u0418\u043D\u0444\u043E\u0440\u043C\u0430\u0446\u0438\u043E\u043D\u043D\u043E\u0435 \u0430\u0433\u0435\u043D\u0442\u0441\u0442\u0432\u043E \u00AB\u0418\u043D\u0442\u0435\u0440\u0444\u0430\u043A\u0441-\u0423\u043A\u0440\u0430\u0438\u043D\u0430\u00BB' # noqa publisher = '\u0418\u043D\u0444\u043E\u0440\u043C\u0430\u0446\u0438\u043E\u043D\u043D\u043E\u0435 \u0430\u0433\u0435\u043D\u0442\u0441\u0442\u0432\u043E \u00AB\u0418\u043D\u0442\u0435\u0440\u0444\u0430\u043A\u0441-\u0423\u043A\u0440\u0430\u0438\u043D\u0430\u00BB' # noqa
category = 'newspaper' category = 'newspaper'
cover_url = u'https://interfax.com.ua/static/articles/images/interfax_ukraine_logo_rus.svg' cover_url = u'https://interfax.com.ua/static/articles/images/interfax_ukraine_logo_rus.svg'
language = 'ru_UK' language = 'ru'
no_stylesheets = True no_stylesheets = True
remove_javascript = False remove_javascript = False
auto_cleanup = False auto_cleanup = False

198
recipes/liganet_ru.recipe Normal file
View File

@ -0,0 +1,198 @@
#!/usr/bin/env python
# vim:fileencoding=utf-8
from calibre.web.feeds.news import BasicNewsRecipe
class LigaNet(BasicNewsRecipe):
    # Recipe for the Russian-language RSS feeds published under
    # https://www.liga.net/ (language is set to 'ru' below).

    # --- Recipe metadata -------------------------------------------------
    title = '\u041B\u0406\u0413\u0410.net'
    __author__ = 'bugmen00t'
    description = '\u0414\u0456\u043B\u043E\u0432\u0438\u0439 \u043D\u043E\u0432\u0438\u043D\u043D\u0438\u0439 \u043F\u043E\u0440\u0442\u0430\u043B'
    publisher = 'Ligamedia'
    category = 'blog'
    cover_url = u'https://www.liga.net/design/images/logo_liga.png'
    language = 'ru'

    # --- Fetch / clean-up switches ---------------------------------------
    no_stylesheets = False
    remove_javascript = False
    auto_cleanup = False
    # Age limit and per-feed cap (units are defined by BasicNewsRecipe;
    # see the calibre recipe API documentation).
    oldest_article = 7
    max_articles_per_feed = 30

    # --- Page trimming ---------------------------------------------------
    # Boundary selectors: the first <h1> and the <div id="news-text">.
    remove_tags_before = dict(name='h1')
    remove_tags_after = dict(name='div', attrs={'id': 'news-text'})

    # Tag/attribute selectors assigned to remove_tags. Each selector is
    # listed once; the original list repeated the 'marketing-block' div.
    remove_tags = [
        dict(name='footer'),
        dict(name='div', attrs={'class': 'more-link red'}),
        dict(name='div', attrs={'class': 'read-too'}),
        dict(name='div', attrs={'class': 'to-send-row'}),
        dict(name='div', attrs={'class': 'hint-row'}),
        dict(name='div', attrs={'class': 'chronicle-top-eye'}),
        dict(name='div', attrs={'class': 'chronicle-top-comm comm-btns'}),
        dict(name='div', attrs={'class': 'chronicle-news m-t-30'}),
        dict(name='div', attrs={'class': 'right-inner-content'}),
        dict(name='div', attrs={'class': 'right-part'}),
        dict(name='div', attrs={'class': 'hreflang-link'}),
        dict(name='div', attrs={'class': 'vakansii-block-article'}),
        dict(
            name='div',
            attrs={'class': 'col-12 col-md p-side-10 sp-card-paddings'}
        ),
        dict(
            name='div',
            attrs={'class': 'social-shares d-flex justify-content-center'}
        ),
        dict(name='div', attrs={'class': 'social-shares d-block'}),
        # NOTE(review): this class value ends with a space; confirm that the
        # trailing space is intentional and that the selector still matches.
        dict(name='div', attrs={'class': 'social-likes clearfix hidden-1280 '}),
        dict(name='div', attrs={'class': 'soc-item comm-btns'}),
        dict(name='div', attrs={'class': 'soc-buttons'}),
        dict(
            name='div',
            attrs={'class': 'warning m-t-20 d-none d-md-none d-lg-block'}
        ),
        dict(name='div', attrs={'id': 'news-list-right'}),
        dict(name='div', attrs={'id': 'premium_mobile'}),
        dict(name='div', attrs={'id': 'premium2_mobile'}),
        dict(name='div', attrs={'class': 'marketing-block'}),
        dict(name='span', attrs={'class': 'social-likes__button'}),
    ]

    # --- Feeds -----------------------------------------------------------
    # (section title, RSS URL) pairs. Titles are Russian text written as
    # \u escapes; they are grouped by site section (news, opinion,
    # business, finance, tech, blogs).
    feeds = [
        # News
        (
            '\u041D\u043E\u0432\u043E\u0441\u0442\u0438: \u0433\u043B\u0430\u0432\u043D\u044B\u0435 \u043C\u0430\u0442\u0435\u0440\u0438\u0430\u043B\u044B',
            'https://www.liga.net/news/top/rss.xml'
        ),
        (
            '\u041D\u043E\u0432\u043E\u0441\u0442\u0438: \u043D\u043E\u0432\u043E\u0441\u0442\u0438',
            'https://www.liga.net/news/rss.xml'
        ),
        (
            '\u041D\u043E\u0432\u043E\u0441\u0442\u0438: \u0441\u0442\u0430\u0442\u044C\u0438',
            'https://www.liga.net/news/articles/rss.xml'
        ),
        (
            '\u041D\u043E\u0432\u043E\u0441\u0442\u0438: \u0438\u043D\u0442\u0435\u0440\u0432\u044C\u044E',
            'https://www.liga.net/news/interview/rss.xml'
        ),
        (
            '\u041D\u043E\u0432\u043E\u0441\u0442\u0438: \u043C\u043D\u0435\u043D\u0438\u044F',
            'https://www.liga.net/news/opinion/rss.xml'
        ),
        (
            '\u041D\u043E\u0432\u043E\u0441\u0442\u0438: \u0444\u043E\u0442\u043E\u043C\u0430\u0442\u0435\u0440\u0438\u0430\u043B\u044B',
            'https://www.liga.net/news/photo/rss.xml'
        ),
        (
            '\u041D\u043E\u0432\u043E\u0441\u0442\u0438: \u043F\u043E\u043B\u0438\u0442\u0438\u043A\u0430',
            'https://www.liga.net/news/politics/rss.xml'
        ),
        (
            '\u041D\u043E\u0432\u043E\u0441\u0442\u0438: \u044D\u043A\u043E\u043D\u043E\u043C\u0438\u043A\u0430',
            'https://www.liga.net/news/economics/rss.xml'
        ),
        (
            '\u041D\u043E\u0432\u043E\u0441\u0442\u0438: \u043E\u0431\u0449\u0435\u0441\u0442\u0432\u043E',
            'https://www.liga.net/news/society/rss.xml'
        ),
        (
            '\u041D\u043E\u0432\u043E\u0441\u0442\u0438: \u043C\u0438\u0440',
            'https://www.liga.net/news/world/rss.xml'
        ),
        (
            '\u041D\u043E\u0432\u043E\u0441\u0442\u0438: \u0441\u0442\u043E\u043B\u0438\u0446\u0430',
            'https://www.liga.net/news/capital/rss.xml'
        ),
        (
            '\u041D\u043E\u0432\u043E\u0441\u0442\u0438: \u0441\u043F\u043E\u0440\u0442',
            'https://www.liga.net/news/sport/rss.xml'
        ),
        (
            '\u041D\u043E\u0432\u043E\u0441\u0442\u0438: \u0437\u0434\u043E\u0440\u043E\u0432\u044C\u0435',
            'https://www.liga.net/news/health/rss.xml'
        ),
        (
            '\u041D\u043E\u0432\u043E\u0441\u0442\u0438: \u043A\u0443\u043B\u044C\u0442\u0443\u0440\u0430',
            'https://www.liga.net/news/culture/rss.xml'
        ),
        # Opinion
        (
            '\u0412\u0441\u0435 \u043C\u043D\u0435\u043D\u0438\u044F',
            'https://www.liga.net/opinion/rss.xml'
        ),
        # Business
        (
            '\u0411\u0438\u0437\u043D\u0435\u0441: \u0433\u043B\u0430\u0432\u043D\u044B\u0435 \u043C\u0430\u0442\u0435\u0440\u0438\u0430\u043B\u044B',
            'https://www.liga.net/biz/top/rss.xml'
        ),
        (
            '\u0411\u0438\u0437\u043D\u0435\u0441: \u043D\u043E\u0432\u043E\u0441\u0442\u0438',
            'https://www.liga.net/biz/news/rss.xml'
        ),
        (
            '\u0411\u0438\u0437\u043D\u0435\u0441: \u0441\u0442\u0430\u0442\u044C\u0438',
            'https://www.liga.net/biz/articles/rss.xml'
        ),
        (
            '\u0411\u0438\u0437\u043D\u0435\u0441: \u0438\u043D\u0442\u0435\u0440\u0432\u044C\u044E',
            'https://www.liga.net/biz/interview/rss.xml'
        ),
        (
            '\u0411\u0438\u0437\u043D\u0435\u0441: \u043C\u043D\u0435\u043D\u0438\u044F',
            'https://www.liga.net/biz/opinion/rss.xml'
        ),
        (
            '\u0411\u0438\u0437\u043D\u0435\u0441: \u0444\u043E\u0442\u043E\u043C\u0430\u0442\u0435\u0440\u0438\u0430\u043B\u044B',
            'https://www.liga.net/biz/photo/rss.xml'
        ),
        # Finance
        (
            '\u0424\u0438\u043D\u0430\u043D\u0441\u044B: \u0433\u043B\u0430\u0432\u043D\u044B\u0435 \u043C\u0430\u0442\u0435\u0440\u0438\u0430\u043B\u044B',
            'https://www.liga.net/fin/export/top.xml'
        ),
        (
            '\u0424\u0438\u043D\u0430\u043D\u0441\u044B: \u043C\u043D\u0435\u043D\u0438\u044F',
            'https://www.liga.net/fin/opinion/rss.xml'
        ),
        (
            '\u0424\u0438\u043D\u0430\u043D\u0441\u044B: \u0431\u0430\u043D\u043A\u0438',
            'https://www.liga.net/fin/export/bank.xml'
        ),
        (
            '\u0424\u0438\u043D\u0430\u043D\u0441\u044B: \u0441\u0442\u0440\u0430\u0445\u043E\u0432\u0430\u043D\u0438\u0435',
            'https://www.liga.net/fin/export/insurance.xml'
        ),
        (
            '\u0424\u0438\u043D\u0430\u043D\u0441\u044B: \u043A\u0440\u0438\u043F\u0442\u043E\u044D\u043A\u043E\u043D\u043E\u043C\u0438\u043A\u0430',
            'https://www.liga.net/fin/crypto/rss.xml'
        ),
        (
            '\u0424\u0438\u043D\u0430\u043D\u0441\u044B: \u0444\u043E\u043D\u0434\u044B',
            'https://www.liga.net/fin/export/funds.xml'
        ),
        # Tech
        (
            'Tech: \u0433\u043B\u0430\u0432\u043D\u044B\u0435 \u043C\u0430\u0442\u0435\u0440\u0438\u0430\u043B\u044B',
            'https://www.liga.net/tech/top/rss.xml'
        ),
        (
            'Tech: \u0442\u0435\u0445\u043D\u043E\u043B\u043E\u0433\u0438\u0438',
            'https://www.liga.net/tech/technology/rss.xml'
        ),
        (
            'Tech: \u0442\u0435\u043B\u0435\u043A\u043E\u043C',
            'https://www.liga.net/tech/telecom/rss.xml'
        ),
        (
            'Tech: \u0433\u0430\u0434\u0436\u0435\u0442\u044B',
            'https://www.liga.net/tech/gadgets/rss.xml'
        ),
        (
            'Tech: \u0441\u0432\u043E\u0439 \u0431\u0438\u0437\u043D\u0435\u0441',
            'https://www.liga.net/tech/own-business/rss.xml'
        ),
        (
            'Tech: \u0431\u0430\u0442\u0442\u043B\u044B',
            'https://www.liga.net/tech/battles/rss.xml'
        ),
        # Blogs
        (
            '\u0411\u043B\u043E\u0433\u0438: \u0432\u0441\u0435 \u043C\u0430\u0442\u0435\u0440\u0438\u0430\u043B\u044B',
            'https://www.liga.net/rss/blog.xml'
        ),
    ]

70
recipes/liganet_ua.recipe Normal file
View File

@ -0,0 +1,70 @@
#!/usr/bin/env python
# vim:fileencoding=utf-8
from calibre.web.feeds.news import BasicNewsRecipe
class LigaNet(BasicNewsRecipe):
    # Recipe for the Ukrainian-language RSS feeds published under
    # https://www.liga.net/newsua/ (language is set to 'uk' below).

    # --- Recipe metadata -------------------------------------------------
    title = '\u041B\u0406\u0413\u0410.net (UA)'
    __author__ = 'bugmen00t'
    description = '\u0414\u0456\u043B\u043E\u0432\u0438\u0439 \u043D\u043E\u0432\u0438\u043D\u043D\u0438\u0439 \u043F\u043E\u0440\u0442\u0430\u043B'
    publisher = 'Ligamedia'
    category = 'blog'
    cover_url = u'https://www.liga.net/design/images/logo_liga.png'
    language = 'uk'

    # --- Fetch / clean-up switches ---------------------------------------
    no_stylesheets = False
    remove_javascript = False
    auto_cleanup = False
    # Age limit and per-feed cap (units are defined by BasicNewsRecipe;
    # see the calibre recipe API documentation).
    oldest_article = 7
    max_articles_per_feed = 30

    # --- Page trimming ---------------------------------------------------
    # Boundary selectors: the first <h1> and the <div id="news-text">.
    remove_tags_before = dict(name='h1')
    remove_tags_after = dict(name='div', attrs={'id': 'news-text'})

    # Tag/attribute selectors assigned to remove_tags. Each selector is
    # listed once; the original list repeated the 'marketing-block' div.
    remove_tags = [
        dict(name='footer'),
        dict(name='div', attrs={'class': 'more-link red'}),
        dict(name='div', attrs={'class': 'read-too'}),
        dict(name='div', attrs={'class': 'to-send-row'}),
        dict(name='div', attrs={'class': 'hint-row'}),
        dict(name='div', attrs={'class': 'chronicle-top-eye'}),
        dict(name='div', attrs={'class': 'chronicle-top-comm comm-btns'}),
        dict(name='div', attrs={'class': 'chronicle-news m-t-30'}),
        dict(name='div', attrs={'class': 'right-inner-content'}),
        dict(name='div', attrs={'class': 'right-part'}),
        dict(name='div', attrs={'class': 'hreflang-link'}),
        dict(name='div', attrs={'class': 'vakansii-block-article'}),
        dict(
            name='div',
            attrs={'class': 'col-12 col-md p-side-10 sp-card-paddings'}
        ),
        dict(
            name='div',
            attrs={'class': 'social-shares d-flex justify-content-center'}
        ),
        dict(name='div', attrs={'class': 'social-shares d-block'}),
        # NOTE(review): this class value ends with a space; confirm that the
        # trailing space is intentional and that the selector still matches.
        dict(name='div', attrs={'class': 'social-likes clearfix hidden-1280 '}),
        dict(name='div', attrs={'class': 'soc-item comm-btns'}),
        dict(name='div', attrs={'class': 'soc-buttons'}),
        dict(
            name='div',
            attrs={'class': 'warning m-t-20 d-none d-md-none d-lg-block'}
        ),
        dict(name='div', attrs={'id': 'news-list-right'}),
        dict(name='div', attrs={'id': 'premium_mobile'}),
        dict(name='div', attrs={'id': 'premium2_mobile'}),
        dict(name='div', attrs={'class': 'marketing-block'}),
        dict(name='span', attrs={'class': 'social-likes__button'}),
    ]

    # --- Feeds -----------------------------------------------------------
    # (section title, RSS URL) pairs. Titles are Ukrainian text written as
    # \u escapes.
    feeds = [
        (
            '\u041D\u043E\u0432\u0438\u043D\u0438: \u0433\u043E\u043B\u043E\u0432\u043D\u0456 \u043C\u0430\u0442\u0435\u0440\u0456\u0430\u043B\u0438',
            'https://www.liga.net/newsua/top/rss.xml'
        ),
        (
            '\u041D\u043E\u0432\u0438\u043D\u0438: \u0432\u0441\u0456 \u043C\u0430\u0442\u0435\u0440\u0456\u0430\u043B\u0438',
            'https://www.liga.net/newsua/all/rss.xml'
        ),
    ]

34
recipes/osvitaua.recipe Normal file
View File

@ -0,0 +1,34 @@
#!/usr/bin/env python
# vim:fileencoding=utf-8
from calibre.web.feeds.news import BasicNewsRecipe
class Osvita(BasicNewsRecipe):
    # Recipe for the Ukrainian-language RSS feed at https://osvita.ua/rss/
    # (language is set to 'uk' below).

    # --- Recipe metadata -------------------------------------------------
    title = '\u041E\u0441\u0432\u0456\u0442\u0430.ua'
    __author__ = 'bugmen00t'
    description = '\u0423\u0441\u0435 \u043F\u0440\u043E \u043E\u0441\u0432\u0456\u0442\u0443 \u0432 \u0423\u043A\u0440\u0430\u0457\u043D\u0456 \u0442\u0430 \u0437\u0430 \u043A\u043E\u0440\u0434\u043E\u043D\u043E\u043C: \u0442\u0435\u043C\u0430\u0442\u0438\u0447\u043D\u0438\u0439 \u0440\u0435\u0441\u0443\u0440\u0441, \u043F\u0440\u0438\u0441\u0432\u044F\u0447\u0435\u043D\u0438\u0439 \u043E\u0441\u0432\u0456\u0442\u0456 \u0432 \u0423\u043A\u0440\u0430\u0457\u043D\u0456 \u0442\u0430 \u0437\u0430 \u0457\u0457 \u043C\u0435\u0436\u0430\u043C\u0438, \u0454 \u0430\u043A\u0442\u0443\u0430\u043B\u044C\u043D\u0438\u043C \u0434\u0436\u0435\u0440\u0435\u043B\u043E\u043C \u0456\u043D\u0444\u043E\u0440\u043C\u0430\u0446\u0456\u0457 \u0443 \u0446\u0456\u0439 \u0441\u0444\u0435\u0440\u0456.'  # noqa
    publisher = '\u041E\u0441\u0432\u0456\u0442\u0430.ua'
    category = 'blog'
    # NOTE(review): the cover is requested over http:// while the feed uses
    # https:// -- confirm whether the cover can be served over https too.
    cover_url = u'http://osvita.ua/doc/i/Contacts-logo.jpg'
    language = 'uk'

    # --- Fetch / clean-up switches ---------------------------------------
    no_stylesheets = False
    remove_javascript = False
    auto_cleanup = False
    # Age limit and per-feed cap (units are defined by BasicNewsRecipe;
    # see the calibre recipe API documentation).
    oldest_article = 7
    max_articles_per_feed = 30

    # --- Page trimming ---------------------------------------------------
    # Both boundary selectors point at the same <div id="body"> element.
    remove_tags_before = dict(name='div', attrs={'id': 'body'})
    remove_tags_after = dict(name='div', attrs={'id': 'body'})
    remove_tags = [
        # Unable to fetch images, removing them completely
        dict(name='img'),
        dict(name='p', attrs={'class': 'info'}),
    ]

    # --- Feeds -----------------------------------------------------------
    feeds = [('\u041D\u043E\u0432\u0438\u043D\u0438', 'https://osvita.ua/rss/')]

    def print_version(self, url):
        # Build the print-view URL by appending a 'print' path segment.
        # A '/' is inserted first when the article URL does not already end
        # with one, so '.../123' becomes '.../123/print' rather than the
        # malformed '.../123print'. URLs ending in '/' are handled exactly
        # as before.
        if not url.endswith('/'):
            url += '/'
        return url + 'print'

View File

@ -0,0 +1,34 @@
#!/usr/bin/env python
# vim:fileencoding=utf-8
from calibre.web.feeds.news import BasicNewsRecipe
class Osvita(BasicNewsRecipe):
    # Recipe for the Russian-language RSS feed at https://ru.osvita.ua/rss/
    # (language is set to 'ru' below).

    # --- Recipe metadata -------------------------------------------------
    title = '\u041E\u0441\u0432\u0456\u0442\u0430.ua'
    __author__ = 'bugmen00t'
    description = '\u0422\u0435\u043C\u0430\u0442\u0438\u0447\u0435\u0441\u043A\u0438\u0439 \u0440\u0435\u0441\u0443\u0440\u0441, \u043F\u043E\u0441\u0432\u044F\u0449\u0451\u043D\u043D\u044B\u0439 \u043E\u0431\u0440\u0430\u0437\u043E\u0432\u0430\u043D\u0438\u044E \u0432 \u0423\u043A\u0440\u0430\u0438\u043D\u0435 \u0438 \u0437\u0430 \u0440\u0443\u0431\u0435\u0436\u043E\u043C.'  # noqa
    publisher = '\u041E\u0441\u0432\u0456\u0442\u0430.ua'
    category = 'blog'
    # NOTE(review): the cover is requested over http:// while the feed uses
    # https:// -- confirm whether the cover can be served over https too.
    cover_url = u'http://osvita.ua/doc/i/Contacts-logo.jpg'
    language = 'ru'

    # --- Fetch / clean-up switches ---------------------------------------
    no_stylesheets = False
    remove_javascript = False
    auto_cleanup = False
    # Age limit and per-feed cap (units are defined by BasicNewsRecipe;
    # see the calibre recipe API documentation).
    oldest_article = 7
    max_articles_per_feed = 30

    # --- Page trimming ---------------------------------------------------
    # Both boundary selectors point at the same <div id="body"> element.
    remove_tags_before = dict(name='div', attrs={'id': 'body'})
    remove_tags_after = dict(name='div', attrs={'id': 'body'})
    remove_tags = [
        # Unable to fetch images, removing them completely
        dict(name='img'),
        dict(name='p', attrs={'class': 'info'}),
    ]

    # --- Feeds -----------------------------------------------------------
    feeds = [('\u041D\u043E\u0432\u0438\u043D\u0438', 'https://ru.osvita.ua/rss/')]

    def print_version(self, url):
        # Build the print-view URL by appending a 'print' path segment.
        # A '/' is inserted first when the article URL does not already end
        # with one, so '.../123' becomes '.../123/print' rather than the
        # malformed '.../123print'. URLs ending in '/' are handled exactly
        # as before.
        if not url.endswith('/'):
            url += '/'
        return url + 'print'

104
recipes/unn_ru.recipe Normal file
View File

@ -0,0 +1,104 @@
#!/usr/bin/env python
# vim:fileencoding=utf-8
from calibre.web.feeds.news import BasicNewsRecipe
class UNN(BasicNewsRecipe):
    # Recipe for the Russian-language RSS feeds (*_ru.xml) published under
    # https://www.unn.com.ua/rss/ (language is set to 'ru' below).

    # --- Recipe metadata -------------------------------------------------
    title = '\u0423\u043A\u0440\u0430\u0438\u043D\u0441\u043A\u0438\u0435 \u041D\u0430\u0446\u0438\u043E\u043D\u0430\u043B\u044C\u043D\u044B\u0435 \u041D\u043E\u0432\u043E\u0441\u0442\u0438'  # noqa
    __author__ = 'bugmen00t'
    description = '\u0423\u041D\u041D: \u0423\u043A\u0440\u0430\u0438\u043D\u0441\u043A\u0438\u0435 \u041D\u0430\u0446\u0438\u043E\u043D\u0430\u043B\u044C\u043D\u044B\u0435 \u041D\u043E\u0432\u043E\u0441\u0442\u0438'  # noqa
    publisher = '\u0406\u043D\u0444\u043E\u0440\u043C\u0430\u0446\u0456\u0439\u043D\u0435 \u0430\u0433\u0435\u043D\u0442\u0441\u0442\u0432\u043E \u00AB\u0423\u043A\u0440\u0430\u0457\u043D\u0441\u044C\u043A\u0456 \u041D\u0430\u0446\u0456\u043E\u043D\u0430\u043B\u044C\u043D\u0456 \u041D\u043E\u0432\u0438\u043D\u0438\u00BB'  # noqa
    category = 'newspaper'
    # NOTE(review): the cover image is hosted on argentum.ua, not on the
    # feed's own domain -- confirm it is a stable source.
    cover_url = u'https://argentum.ua/uploads/portfolio/2012/c043e0e18fd9f89df5fb421ab28cf609197011c2.png'
    language = 'ru'

    # --- Fetch / clean-up switches ---------------------------------------
    no_stylesheets = False
    remove_javascript = False
    auto_cleanup = False
    # Age limit and per-feed cap (units are defined by BasicNewsRecipe;
    # see the calibre recipe API documentation).
    oldest_article = 7
    max_articles_per_feed = 50

    # --- Page trimming ---------------------------------------------------
    # Boundary selectors: the datePublished <span> and the b-news-full <div>.
    remove_tags_before = dict(name='span', attrs={'itemprop': 'datePublished'})
    remove_tags_after = dict(name='div', attrs={'class': 'b-news-full'})
    remove_tags = [
        dict(name='span', attrs={'class': 'view'}),
        dict(name='div', attrs={'class': 'b-news-tags'}),
        dict(name='div', attrs={'class': 'b-news-source'}),
        dict(name='div', attrs={'class': 'b-news-footer'}),
        dict(name='div', attrs={'class': 'b-notice-msg'}),
    ]

    # --- Feeds -----------------------------------------------------------
    # (section title, RSS URL) pairs. Titles are Russian text written as
    # \u escapes.
    feeds = [
        (
            '\u041E\u043F\u0435\u0440\u0430\u0442\u0438\u0432\u043D\u044B\u0435 \u043D\u043E\u0432\u043E\u0441\u0442\u0438',
            'https://www.unn.com.ua/rss/news_ru.xml'
        ),
        (
            '\u041F\u0443\u0431\u043B\u0438\u043A\u0430\u0446\u0438\u0438',
            'https://www.unn.com.ua/rss/publication_ru.xml'
        ),
        (
            '\u042D\u043A\u0441\u043A\u043B\u044E\u0437\u0438\u0432\u043D\u044B\u0435 \u043D\u043E\u0432\u043E\u0441\u0442\u0438',
            'https://www.unn.com.ua/rss/exclusive_ru.xml'
        ),
        (
            '\u041F\u043E\u043B\u0438\u0442\u0438\u043A\u0430',
            'https://www.unn.com.ua/rss/news_politics_ru.xml'
        ),
        (
            '\u042D\u043A\u043E\u043D\u043E\u043C\u0438\u043A\u0430',
            'https://www.unn.com.ua/rss/news_economics_ru.xml'
        ),
        (
            '\u0410\u0433\u0440\u043E\u043D\u043E\u0432\u043E\u0441\u0442\u0438',
            'https://www.unn.com.ua/rss/news_agronews_ru.xml'
        ),
        (
            '\u041E\u0434\u0435\u0441\u0441\u0430',
            'https://www.unn.com.ua/rss/news_odesa_ru.xml'
        ),
        ('\u041A\u0438\u0435\u0432', 'https://www.unn.com.ua/rss/news_kiev_ru.xml'),
        ('COVID-19', 'https://www.unn.com.ua/rss/news_covid19_ru.xml'),
        (
            '\u041E\u0431\u0449\u0435\u0441\u0442\u0432\u043E',
            'https://www.unn.com.ua/rss/news_society_ru.xml'
        ),
        (
            '\u0417\u0434\u043E\u0440\u043E\u0432\u044C\u0435',
            'https://www.unn.com.ua/rss/news_health_ru.xml'
        ),
        (
            '\u0412\u043E\u0439\u043D\u0430',
            'https://www.unn.com.ua/rss/news_war_ru.xml'
        ),
        (
            '\u041A\u0440\u0438\u043C\u0438\u043D\u0430\u043B \u0438 \u0427\u041F',
            'https://www.unn.com.ua/rss/news_criminal_ru.xml'
        ),
        ('\u0423\u041D\u041D Lite', 'https://www.unn.com.ua/rss/news_lite_ru.xml'),
        (
            '\u041D\u043E\u0432\u043E\u0441\u0442\u0438 \u041C\u0438\u0440\u0430',
            'https://www.unn.com.ua/rss/news_world_ru.xml'
        ),
        (
            '\u0422\u0435\u0445\u043D\u043E\u043B\u043E\u0433\u0438\u0438',
            'https://www.unn.com.ua/rss/news_tech_ru.xml'
        ),
        (
            '\u0421\u043F\u043E\u0440\u0442',
            'https://www.unn.com.ua/rss/news_sport_ru.xml'
        ),
        (
            '\u041A\u0443\u043B\u044C\u0442\u0443\u0440\u0430',
            'https://www.unn.com.ua/rss/news_culture_ru.xml'
        ),
        (
            '\u041C\u0443\u043B\u044C\u0442\u0438\u043C\u0435\u0434\u0438\u0430',
            'https://www.unn.com.ua/rss/news_media_ru.xml'
        ),
    ]

    def print_version(self, url):
        # Build the print-view URL by adding the '_part=main&_print=1'
        # parameters. When the article URL already has a query string the
        # parameters are joined with '&' instead of starting a second '?';
        # URLs without a query string are handled exactly as before.
        separator = '&' if '?' in url else '?'
        return url + separator + '_part=main&_print=1'

104
recipes/unn_ua.recipe Normal file
View File

@ -0,0 +1,104 @@
#!/usr/bin/env python
# vim:fileencoding=utf-8
from calibre.web.feeds.news import BasicNewsRecipe
class UNN(BasicNewsRecipe):
    # Recipe for the Ukrainian-language RSS feeds (*_uk.xml) published under
    # https://www.unn.com.ua/rss/ (language is set to 'uk' below).

    # --- Recipe metadata -------------------------------------------------
    title = '\u0423\u043A\u0440\u0430\u0457\u043D\u0441\u044C\u043A\u0456 \u041D\u0430\u0446\u0456\u043E\u043D\u0430\u043B\u044C\u043D\u0456 \u041D\u043E\u0432\u0438\u043D\u0438'  # noqa
    __author__ = 'bugmen00t'
    description = '\u0423\u041D\u041D: \u0423\u043A\u0440\u0430\u0457\u043D\u0441\u044C\u043A\u0456 \u041D\u0430\u0446\u0456\u043E\u043D\u0430\u043B\u044C\u043D\u0456 \u041D\u043E\u0432\u0438\u043D\u0438'  # noqa
    publisher = '\u0406\u043D\u0444\u043E\u0440\u043C\u0430\u0446\u0456\u0439\u043D\u0435 \u0430\u0433\u0435\u043D\u0442\u0441\u0442\u0432\u043E \u00AB\u0423\u043A\u0440\u0430\u0457\u043D\u0441\u044C\u043A\u0456 \u041D\u0430\u0446\u0456\u043E\u043D\u0430\u043B\u044C\u043D\u0456 \u041D\u043E\u0432\u0438\u043D\u0438\u00BB'  # noqa
    category = 'newspaper'
    # NOTE(review): the cover image is hosted on pechersk.kyivcity.gov.ua,
    # not on the feed's own domain -- confirm it is a stable source.
    cover_url = u'https://pechersk.kyivcity.gov.ua/done_img/b/11289.jpg'
    language = 'uk'

    # --- Fetch / clean-up switches ---------------------------------------
    no_stylesheets = False
    remove_javascript = False
    auto_cleanup = False
    # Age limit and per-feed cap (units are defined by BasicNewsRecipe;
    # see the calibre recipe API documentation).
    oldest_article = 7
    max_articles_per_feed = 50

    # --- Page trimming ---------------------------------------------------
    # Boundary selectors: the datePublished <span> and the b-news-full <div>.
    remove_tags_before = dict(name='span', attrs={'itemprop': 'datePublished'})
    remove_tags_after = dict(name='div', attrs={'class': 'b-news-full'})
    remove_tags = [
        dict(name='span', attrs={'class': 'view'}),
        dict(name='div', attrs={'class': 'b-news-tags'}),
        dict(name='div', attrs={'class': 'b-news-source'}),
        dict(name='div', attrs={'class': 'b-news-footer'}),
        dict(name='div', attrs={'class': 'b-notice-msg'}),
    ]

    # --- Feeds -----------------------------------------------------------
    # (section title, RSS URL) pairs. Titles are Ukrainian text written as
    # \u escapes.
    feeds = [
        (
            '\u041E\u043F\u0435\u0440\u0430\u0442\u0438\u0432\u043D\u0456 \u043D\u043E\u0432\u0438\u043D\u0438',
            'https://www.unn.com.ua/rss/news_uk.xml'
        ),
        (
            '\u041F\u0443\u0431\u043B\u0456\u043A\u0430\u0446\u0456\u0457',
            'https://www.unn.com.ua/rss/publication_uk.xml'
        ),
        (
            '\u0415\u043A\u0441\u043A\u043B\u044E\u0437\u0438\u0432\u043D\u0456 \u043D\u043E\u0432\u0438\u043D\u0438',
            'https://www.unn.com.ua/rss/exclusive_uk.xml'
        ),
        (
            '\u041F\u043E\u043B\u0456\u0442\u0438\u043A\u0430',
            'https://www.unn.com.ua/rss/news_politics_uk.xml'
        ),
        (
            '\u0415\u043A\u043E\u043D\u043E\u043C\u0456\u043A\u0430',
            'https://www.unn.com.ua/rss/news_economics_uk.xml'
        ),
        (
            '\u0410\u0433\u0440\u043E\u043D\u043E\u0432\u0438\u043D\u0438',
            'https://www.unn.com.ua/rss/news_agronews_uk.xml'
        ),
        (
            '\u041E\u0434\u0435\u0441\u0430',
            'https://www.unn.com.ua/rss/news_odesa_uk.xml'
        ),
        ('\u041A\u0438\u0457\u0432', 'https://www.unn.com.ua/rss/news_kiev_uk.xml'),
        ('COVID-19', 'https://www.unn.com.ua/rss/news_covid19_uk.xml'),
        (
            '\u0421\u0443\u0441\u043F\u0456\u043B\u044C\u0441\u0442\u0432\u043E',
            'https://www.unn.com.ua/rss/news_society_uk.xml'
        ),
        (
            '\u0417\u0434\u043E\u0440\u043E\u0432\u0027\u044F',
            'https://www.unn.com.ua/rss/news_health_uk.xml'
        ),
        (
            '\u0412\u0456\u0439\u043D\u0430',
            'https://www.unn.com.ua/rss/news_war_uk.xml'
        ),
        (
            '\u041A\u0440\u0438\u043C\u0456\u043D\u0430\u043B \u0442\u0430 \u041D\u041F',
            'https://www.unn.com.ua/rss/news_criminal_uk.xml'
        ),
        ('\u0423\u041D\u041D Lite', 'https://www.unn.com.ua/rss/news_lite_uk.xml'),
        (
            '\u041D\u043E\u0432\u0438\u043D\u0438 \u0421\u0432\u0456\u0442\u0443',
            'https://www.unn.com.ua/rss/news_world_uk.xml'
        ),
        (
            '\u0422\u0435\u0445\u043D\u043E\u043B\u043E\u0433\u0456\u0457',
            'https://www.unn.com.ua/rss/news_tech_uk.xml'
        ),
        (
            '\u0421\u043F\u043E\u0440\u0442',
            'https://www.unn.com.ua/rss/news_sport_uk.xml'
        ),
        (
            '\u041A\u0443\u043B\u044C\u0442\u0443\u0440\u0430',
            'https://www.unn.com.ua/rss/news_culture_uk.xml'
        ),
        (
            '\u041C\u0443\u043B\u044C\u0442\u0438\u043C\u0435\u0434\u0456\u0430',
            'https://www.unn.com.ua/rss/news_media_uk.xml'
        ),
    ]

    def print_version(self, url):
        # Build the print-view URL by adding the '_part=main&_print=1'
        # parameters. When the article URL already has a query string the
        # parameters are joined with '&' instead of starting a second '?';
        # URLs without a query string are handled exactly as before.
        separator = '&' if '?' in url else '?'
        return url + separator + '_part=main&_print=1'