__license__ = 'GPLv3'

from calibre.web.feeds.news import BasicNewsRecipe


class IDGse(BasicNewsRecipe):
    '''
    Recipe for IDG.se.

    Downloads the 'Senaste nytt' feed and fetches every article through
    its print rendering (see print_version).
    '''

    title = 'IDG'
    description = 'IDG.se'
    # ISO 639-1 code for Swedish is 'sv'; 'se' is the code for Northern Sami.
    language = 'sv'
    __author__ = 'zapt0'
    oldest_article = 1
    max_articles_per_feed = 40
    no_stylesheets = True
    encoding = 'ISO-8859-1'
    remove_javascript = True

    feeds = [(u'Senaste nytt', u'http://feeds.idg.se/idg/vzzs')]

    def print_version(self, url):
        '''
        Return the URL of the print rendering of an article.

        url: the article URL taken from the feed; the print-mode query
        string is appended to it unchanged.
        '''
        return url + '?articleRenderMode=print&m=print'

    def get_cover_url(self):
        '''Return the fixed URL of the logo image used as the cover.'''
        return 'http://idgmedia.idg.se/polopoly_fs/2.3275!images/idgmedia_logo_75.jpg'

    # Keep only <h1> elements and the div with class 'divColumn1Article'.
    keep_only_tags = [
        dict(name='h1'),
        dict(name='div', attrs={'class': ['divColumn1Article']}),
    ]
    # Remove ads (div#preamble_ad) and the <ul class="share"> list.
    remove_tags = [
        dict(name='div', attrs={'id': ['preamble_ad']}),
        dict(name='ul', attrs={'class': ['share']}),
    ]
'http://www.utrinski.com.mk/images/LogoTop.jpg' + language = 'mk' + remove_javascript = True + publication_type = 'newspaper' + category = 'news, Macedonia' + oldest_article = 2 + max_articles_per_feed = 100 + no_stylesheets = True + use_embedded_content = False + preprocess_regexps = [(re.compile(i[0], re.IGNORECASE | re.DOTALL), i[1]) for i in + [ + ## Remove anything before the start of the article. + (r'', lambda match: ''), + + ## Remove anything after the end of the article. + (r'