From da38b6653dc9f6ed8c46fa364ab2fea3412a2ac3 Mon Sep 17 00:00:00 2001
From: Kovid Goyal
Date: Wed, 2 Jun 2021 07:56:05 +0530
Subject: [PATCH] Fix #1930480 [Updated recipe for Ambito.com](https://bugs.launchpad.net/calibre/+bug/1930480)

---
 recipes/ambito.recipe | 40 +++++++++++++++++++++-------------------
 1 file changed, 21 insertions(+), 19 deletions(-)

diff --git a/recipes/ambito.recipe b/recipes/ambito.recipe
index f9a5b1dad1..b1a815b130 100644
--- a/recipes/ambito.recipe
+++ b/recipes/ambito.recipe
@@ -1,8 +1,9 @@
+#!/usr/bin/env python
 # -*- mode: python -*-
 # -*- coding: utf-8 -*-
 
 __license__ = 'GPL v3'
-__copyright__ = '2008-2018, Darko Miletic '
+__copyright__ = '2008-2021, Darko Miletic '
 '''
 ambito.com
 '''
@@ -21,9 +22,13 @@ class Ambito(BasicNewsRecipe):
     encoding = 'utf8'
     use_embedded_content = False
     remove_empty_feeds = True
+    handle_gzip = True
+    compress_news_images = True
+    scale_news_images_to_device = True
     ignore_duplicate_articles = {'url'}
     language = 'es_AR'
     publication_type = 'newsportal'
+    masthead_url = 'https://www.ambito.com/css-custom/239/images/logo-239-2020v2.svg'
     extra_css = """
         body{font-family: Roboto, sans-serif}
     """
@@ -35,24 +40,21 @@ class Ambito(BasicNewsRecipe):
         , 'language' : language
     }
 
-    keep_only_tags = [
-        dict(name='h6', attrs={'class': lambda x: x and 'bajada' in x.split()})
-        ,dict(name='span', attrs={'class': lambda x: x and 'dia' in x.split()})
-        ,dict(attrs={'class': lambda x: x and 'titulo-noticia' in x.split()})
-        ,dict(attrs={'class': lambda x: x and 'foto-perfil-columnista' in x.split()})
-        ,dict(attrs={'class': lambda x: x and 'despliegue-noticia' in x.split()})
-    ]
-    remove_tags = [dict(name=['object','link','embed','iframe','meta','link'])]
+    keep_only_tags = [
+        dict(name='div', attrs={'class': 'detail-header-wrapper'}),
+        dict(attrs={'class': lambda x: x and 'detail-body' in x.split()}),
+    ]
+    remove_tags = [dict(name=['object', 'link', 'embed', 'iframe', 'meta', 'link', 'img'])]
 
     feeds = [
-        (u'Principales Noticias', u'http://www.ambito.com/rss/noticiasp.asp')
-        ,(u'Economia' , u'http://www.ambito.com/rss/noticias.asp?S=Econom%EDa')
-        ,(u'Politica' , u'http://www.ambito.com/rss/noticias.asp?S=Pol%EDtica')
-        ,(u'Informacion General' , u'http://www.ambito.com/rss/noticias.asp?S=Informaci%F3n%20General')
-        ,(u'Campo' , u'http://www.ambito.com/rss/noticias.asp?S=Agro')
-        ,(u'Internacionales' , u'http://www.ambito.com/rss/noticias.asp?S=Internacionales')
-        ,(u'Deportes' , u'http://www.ambito.com/rss/noticias.asp?S=Deportes')
-        ,(u'Espectaculos' , u'http://www.ambito.com/rss/noticias.asp?S=Espect%E1culos')
-        ,(u'Tecnologia' , u'http://www.ambito.com/rss/noticias.asp?S=Tecnolog%EDa')
-        ,(u'Ambito Nacional' , u'http://www.ambito.com/rss/noticias.asp?S=Ambito%20Nacional')
+        (u'Portada' , u'https://www.ambito.com/rss/home.xml')
+        ,(u'Economia' , u'https://www.ambito.com/rss/economia.xml')
+        ,(u'Finanzas' , u'https://www.ambito.com/rss/finanzas.xml')
+        ,(u'Politica' , u'https://www.ambito.com/rss/politica.xml')
+        ,(u'Opinion' , u'https://www.ambito.com/rss/opinion.xml')
+        ,(u'Informacion General', u'https://www.ambito.com/rss/informacion-general.xml')
+        ,(u'Mundo' , u'https://www.ambito.com/rss/mundo.xml')
+        ,(u'Deportes' , u'https://www.ambito.com/rss/deportes.xml')
+        ,(u'Espectaculos' , u'https://www.ambito.com/rss/espectaculos.xml')
+        ,(u'Nacional' , u'https://www.ambito.com/rss/nacional.xml')
     ]