__license__ = 'GPL v3'
__copyright__ = '2011, Darko Miletic '
'''
daily.tportal.hr
'''

from calibre.web.feeds.news import BasicNewsRecipe


# NOTE(review): the class name looks inherited from a different recipe; it is
# kept unchanged because it is this block's public name.
class Pagina12(BasicNewsRecipe):
    """Recipe for the English-language news feed of daily.tportal.hr.

    Articles come from a single RSS feed.  Only the element with class
    ``articleDetails`` is kept from each page, and ``preprocess_html``
    strips inline styles, unwraps hyperlinks and gives every image an
    ``alt`` attribute.
    """

    # NOTE(review): the title probably meant 'Daily tportal.hr' (compare
    # ``publisher`` and the feed host).  Left as-is because it is a
    # user-visible string; confirm before changing.
    title = 'Daily tportal.h'
    __author__ = 'Darko Miletic'
    description = 'News from Croatia'
    publisher = 'tportal.hr'
    category = 'news, politics, Croatia'
    oldest_article = 2
    max_articles_per_feed = 200
    no_stylesheets = True
    encoding = 'utf-8'
    use_embedded_content = False
    # 'en_HR' needs a matching entry ('English (Croatia)') in
    # calibre.utils.localization._extra_lang_codes.
    language = 'en_HR'
    remove_empty_feeds = True
    publication_type = 'newsportal'
    extra_css = """
        body{font-family: Verdana,sans-serif }
        img{margin-bottom: 0.4em; display:block}
        h1,h2{color: #2D648A; font-family: Georgia,serif}
        .artAbstract{font-size: 1.2em; font-family: Georgia,serif}
    """

    # Metadata handed to the conversion step; mirrors the attributes above.
    conversion_options = {
        'comment': description,
        'tags': category,
        'publisher': publisher,
        'language': language,
    }

    remove_tags = [
        dict(name=['meta', 'link', 'embed', 'object', 'iframe', 'base']),
        dict(name='div', attrs={'class': 'artInfo'}),
    ]
    remove_attributes = ['lang']

    # A list of tag specs, as BasicNewsRecipe documents for this option
    # (the original assigned a bare dict).
    keep_only_tags = [dict(attrs={'class': 'articleDetails'})]

    feeds = [(u'News', u'http://daily.tportal.hr/rss/dailynaslovnicarss.xml')]

    def preprocess_html(self, soup):
        """Clean up a downloaded article before conversion.

        * removes every inline ``style`` attribute;
        * replaces each ``<a>`` with its text, except links that wrap an
          image, which become attribute-less ``<div>`` elements so the
          image is kept;
        * adds ``alt="image"`` to every ``<img>`` that has no ``alt``.

        :param soup: parsed article document (BeautifulSoup tree).
        :return: the same ``soup`` object, modified in place.
        """
        for styled in soup.findAll(style=True):
            del styled['style']

        for link in soup.findAll('a'):
            if link.string is not None:
                # Link with a single text child: keep just that text.
                link.replaceWith(link.string)
            elif link.find('img'):
                # Link wrapping an image: keep the children, drop the link
                # itself by turning it into a plain container.
                link.name = 'div'
                # NOTE(review): a list is the BeautifulSoup 3 attrs
                # representation -- confirm if the parser is ever upgraded.
                link.attrs = []
            else:
                # Mixed or nested content without an image: flatten to text
                # using the inherited tag_to_string helper.
                link.replaceWith(self.tag_to_string(link))

        for image in soup.findAll('img'):
            # get() is used instead of the deprecated has_key().
            if image.get('alt') is None:
                image['alt'] = 'image'

        return soup