New Honduran recipes by Darko Miletic

2025-11-18 20:43:04 -05:00 · 2009-07-06 17:16:10 -06:00 · 2009-07-06 17:16:10 -06:00 · 3bb5d82da6
commit 3bb5d82da6
parent 4f1c599581
7 changed files with 174 additions and 1 deletions
--- a/src/calibre/gui2/images/news/eltiempo_hn.png
+++ b/src/calibre/gui2/images/news/eltiempo_hn.png
--- a/src/calibre/gui2/images/news/laprensa_hn.png
+++ b/src/calibre/gui2/images/news/laprensa_hn.png
--- a/src/calibre/gui2/images/news/latribuna.png
+++ b/src/calibre/gui2/images/news/latribuna.png
--- a/src/calibre/web/feeds/recipes/init.py
+++ b/src/calibre/web/feeds/recipes/init.py
@ -51,9 +51,11 @@ recipe_modules = ['recipe_' + r for r in (
           'theeconomictimes_india', '7dias', 'buenosaireseconomico',
           'diagonales', 'miradasalsur', 'newsweek_argentina', 'veintitres',
           'gva_be', 'hln', 'tijd', 'degentenaar', 'inquirer_net', 'uncrate',
-           'fastcompany', 'accountancyage',
+           'fastcompany', 'accountancyage', 'laprensa_hn', 'latribuna',
           'eltiempo_hn',
          )]
 import re, imp, inspect, time, os
 from calibre.web.feeds.news import BasicNewsRecipe, CustomIndexRecipe, AutomaticNewsRecipe
 from calibre.ebooks.BeautifulSoup import BeautifulSoup
--- a/src/calibre/web/feeds/recipes/recipe_eltiempo_hn.py
+++ b/src/calibre/web/feeds/recipes/recipe_eltiempo_hn.py
@ -0,0 +1,52 @@
 #!/usr/bin/env  python
 __license__   = 'GPL v3'
 __copyright__ = '2009, Darko Miletic <darko.miletic at gmail.com>'
 '''
 www.tiempo.hn
 '''
 from calibre.web.feeds.news import BasicNewsRecipe
 from calibre.ebooks.BeautifulSoup import BeautifulSoup, Tag
 class ElTiempoHn(BasicNewsRecipe):
    title                 = 'El Tiempo - Honduras'
    __author__            = 'Darko Miletic'
    description           = 'Noticias de Honduras y mundo'
    publisher             = 'El Tiempo'
    category              = 'news, politics, Honduras'
    oldest_article        = 2
    max_articles_per_feed = 100
    use_embedded_content  = False
    no_stylesheets        = True
    remove_javascript     = True
    encoding              = 'utf-8'
    language              = _('Spanish')
    lang                  = 'es-HN'
    direction             = 'ltr'
    html2lrf_options = [
                          '--comment', description
                        , '--category', category
                        , '--publisher', publisher
                        , '--ignore-tables'
                        ]
    html2epub_options = 'publisher="' + publisher + '"\ncomments="' + description + '"\ntags="' + category + '"\nlinearize_tables=True\npretty_print=True\noverride_css=" p {text-indent: 0cm; margin-top: 0em; margin-bottom: 0.5em} img {text-indent: 0cm; margin-top: 0em; margin-bottom: 0.5em}"' 
    remove_tags = [dict(name=['form','object','embed','base'])]
    keep_only_tags = [dict(name='td' , attrs={'id':'mainbodycont'})]
    feeds = [(u'Noticias', u'http://www.tiempo.hn/index.php?format=feed&type=rss')]
    def preprocess_html(self, soup):
        soup.html['lang'] = self.lang
        soup.html['dir' ] = self.direction
        mlang = Tag(soup,'meta',[("http-equiv","Content-Language"),("content",self.lang)])
        mcharset = Tag(soup,'meta',[("http-equiv","Content-Type"),("content","text/html; charset=utf-8")])
        soup.head.insert(0,mlang)
        soup.head.insert(1,mcharset)
        for item in soup.findAll(style=True):
            del item['style']
        return self.adeify_images(soup)
--- a/src/calibre/web/feeds/recipes/recipe_laprensa_hn.py
+++ b/src/calibre/web/feeds/recipes/recipe_laprensa_hn.py
@ -0,0 +1,54 @@
 #!/usr/bin/env  python
 __license__   = 'GPL v3'
 __copyright__ = '2009, Darko Miletic <darko.miletic at gmail.com>'
 '''
 www.laprensahn.com
 '''
 from calibre.web.feeds.news import BasicNewsRecipe
 from calibre.ebooks.BeautifulSoup import BeautifulSoup, Tag
 class LaPrensaHn(BasicNewsRecipe):
    title                 = 'La Prensa - Honduras'
    __author__            = 'Darko Miletic'
    description           = 'Noticias de Honduras y mundo'
    publisher             = 'La Prensa'
    category              = 'news, politics, Honduras'
    oldest_article        = 2
    max_articles_per_feed = 100
    use_embedded_content  = False
    no_stylesheets        = True
    remove_javascript     = True
    encoding              = 'utf-8'
    language              = _('Spanish')
    lang                  = 'es-HN'
    direction             = 'ltr'
    html2lrf_options = [
                          '--comment', description
                        , '--category', category
                        , '--publisher', publisher
                        ]
    html2epub_options = 'publisher="' + publisher + '"\ncomments="' + description + '"\ntags="' + category + '"\npretty_print=True\noverride_css=" p {text-indent: 0cm; margin-top: 0em; margin-bottom: 0.5em} "' 
    remove_tags = [dict(name=['form','object','embed'])]
    keep_only_tags = [
                         dict(name='h1' , attrs={'class':'titulo1'})
                        ,dict(name='div', attrs={'class':['sumario11','hora','texto']})
                     ]
    feeds = [(u'Noticias', u'http://feeds.feedburner.com/laprensa_titulares')]
    def preprocess_html(self, soup):
        soup.html['lang'] = self.lang
        soup.html['dir' ] = self.direction
        mlang = Tag(soup,'meta',[("http-equiv","Content-Language"),("content",self.lang)])
        mcharset = Tag(soup,'meta',[("http-equiv","Content-Type"),("content","text/html; charset=utf-8")])
        soup.head.insert(0,mlang)
        soup.head.insert(1,mcharset)
        for item in soup.findAll(style=True):
            del item['style']
        return soup
--- a/src/calibre/web/feeds/recipes/recipe_latribuna.py
+++ b/src/calibre/web/feeds/recipes/recipe_latribuna.py
@ -0,0 +1,65 @@
 #!/usr/bin/env  python
 __license__   = 'GPL v3'
 __copyright__ = '2009, Darko Miletic <darko.miletic at gmail.com>'
 '''
 www.latribuna.hn
 '''
 from calibre.web.feeds.news import BasicNewsRecipe
 from calibre.ebooks.BeautifulSoup import BeautifulSoup, Tag
 class LaTribuna(BasicNewsRecipe):
    title                 = 'La Tribuna - Honduras'
    __author__            = 'Darko Miletic'
    description           = 'Noticias de Honduras y mundo'
    publisher             = 'La Tribuna'
    category              = 'news, politics, Honduras'
    oldest_article        = 2
    max_articles_per_feed = 100
    use_embedded_content  = False
    no_stylesheets        = True
    remove_javascript     = True
    encoding              = 'utf-8'
    language              = _('Spanish')
    lang                  = 'es-HN'
    direction             = 'ltr'
    html2lrf_options = [
                          '--comment', description
                        , '--category', category
                        , '--publisher', publisher
                        ]
    html2epub_options = 'publisher="' + publisher + '"\ncomments="' + description + '"\ntags="' + category + '"\npretty_print=True\noverride_css=" p {text-indent: 0cm; margin-top: 0em; margin-bottom: 0.5em} "' 
    remove_tags = [dict(name=['form','object','embed'])]
    keep_only_tags = [
                        dict(name='p', attrs={'id':['BlogTitle','BlogDate']})
                       ,dict(name='div', attrs={'id':'BlogContent'})
                     ]
    feeds = [(u'Noticias', u'http://www.latribuna.hn/web2.0/?feed=rss')]
    def print_version(self, url):
        return url + '&print=1'
    def preprocess_html(self, soup):
        soup.html['lang'] = self.lang
        soup.html['dir' ] = self.direction
        mlang = Tag(soup,'meta',[("http-equiv","Content-Language"),("content",self.lang)])
        mcharset = Tag(soup,'meta',[("http-equiv","Content-Type"),("content","text/html; charset=utf-8")])
        soup.head.insert(0,mlang)
        soup.head.insert(1,mcharset)
        for item in soup.findAll(style=True):
            del item['style']
        return soup
    def get_cover_url(self):
        cover_url = None
        soup = self.index_to_soup('http://www.latribuna.hn/web2.0/')
        cover_item = soup.find('div',attrs={'class':'portada_impresa'})
        if cover_item:
           cover_url = cover_item.a.img['src']
        return cover_url