From 7fdf70f733dfffa59b2dea634f08521b45b71cb2 Mon Sep 17 00:00:00 2001 From: Kovid Goyal Date: Thu, 18 Aug 2022 17:47:51 +0530 Subject: [PATCH] Update Indian Express --- recipes/indian_express.recipe | 13 +++++++++---- 1 file changed, 9 insertions(+), 4 deletions(-) diff --git a/recipes/indian_express.recipe b/recipes/indian_express.recipe index bb4e45f7d4..47fa2bbaae 100644 --- a/recipes/indian_express.recipe +++ b/recipes/indian_express.recipe @@ -25,6 +25,8 @@ class IndianExpress(BasicNewsRecipe): #storycenterbyline {font-size:small;} #img-cap {font-size:small;} blockquote{text-align:center; color:#404040;} + em{font-style:italic; color:#808080;} + #sub-d{color:#202020; font-style:italic;} ''' resolve_internal_links = True remove_empty_feeds = True @@ -64,7 +66,7 @@ class IndianExpress(BasicNewsRecipe): classes( 'share-social appstext ie-int-campign-ad ie-breadcrumb custom_read_button unitimg copyright' ' storytags pdsc-related-modify news-guard premium-story append_social_share' - ' digital-subscriber-only h-text-widget ie-premium ie-first-publish adboxtop adsizes' + ' digital-subscriber-only h-text-widget ie-premium ie-first-publish adboxtop adsizes related-widget immigrationimg' ) ] @@ -107,9 +109,12 @@ class IndianExpress(BasicNewsRecipe): return citem['content'] def preprocess_html(self, soup): - h2 = soup.findAll('h2') - for sub in h2: - sub.name = 'h5' + h1 = soup.find('h1') + if h1: + h2 = h1.findNext('h2') + if h2: + h2.name = 'p' + h2['id'] = 'sub-d' for span in soup.findAll( 'span', attrs={'class': ['ie-custom-caption', 'custom-caption']} ):